update recently changed modules with Authors in docstring
MinRK

The requested changes are too big and content was truncated.

@@ -1,361 +1,362 b''
1 1 # encoding: utf-8
2 2 """
3 3 A base class for a configurable application.
4 4
5 5 Authors:
6 6
7 7 * Brian Granger
8 * Min RK
8 9 """
9 10
10 11 #-----------------------------------------------------------------------------
11 12 # Copyright (C) 2008-2011 The IPython Development Team
12 13 #
13 14 # Distributed under the terms of the BSD License. The full license is in
14 15 # the file COPYING, distributed as part of this software.
15 16 #-----------------------------------------------------------------------------
16 17
17 18 #-----------------------------------------------------------------------------
18 19 # Imports
19 20 #-----------------------------------------------------------------------------
20 21
21 22 from copy import deepcopy
22 23 import logging
23 24 import re
24 25 import sys
25 26
26 27 from IPython.config.configurable import SingletonConfigurable
27 28 from IPython.config.loader import (
28 29 KeyValueConfigLoader, PyFileConfigLoader, Config, ArgumentError
29 30 )
30 31
31 32 from IPython.utils.traitlets import (
32 33 Unicode, List, Int, Enum, Dict, Instance
33 34 )
34 35 from IPython.utils.importstring import import_item
35 36 from IPython.utils.text import indent
36 37
37 38 #-----------------------------------------------------------------------------
38 39 # Descriptions for the various sections
39 40 #-----------------------------------------------------------------------------
40 41
41 42 flag_description = """
42 43 Flags are command-line arguments passed as '--<flag>'.
43 44 These take no parameters, unlike regular key-value arguments.
44 45 They are typically used for setting boolean flags, or enabling
45 46 modes that involve setting multiple options together.
46 47 """.strip() # trim newlines off front and back
47 48
48 49 alias_description = """
49 50 These are commonly set parameters, given abbreviated aliases for convenience.
50 51 They are set in the same `name=value` way as class parameters, where
51 52 <name> is replaced by the real parameter for which it is an alias.
52 53 """.strip() # trim newlines off front and back
53 54
54 55 keyvalue_description = """
55 56 Parameters are set from command-line arguments of the form:
56 57 `Class.trait=value`. Parameters will *never* be prefixed with '-'.
57 58 This line is evaluated in Python, so simple expressions are allowed, e.g.
58 59 `C.a='range(3)'` for setting C.a=[0,1,2].
59 60 """.strip() # trim newlines off front and back
60 61
61 62 #-----------------------------------------------------------------------------
62 63 # Application class
63 64 #-----------------------------------------------------------------------------
64 65
65 66
66 67 class ApplicationError(Exception):
67 68 pass
68 69
69 70
70 71 class Application(SingletonConfigurable):
71 72 """A singleton application with full configuration support."""
72 73
73 74 # The name of the application, will usually match the name of the command
74 75 # line application
75 76 name = Unicode(u'application')
76 77
77 78 # The description of the application that is printed at the beginning
78 79 # of the help.
79 80 description = Unicode(u'This is an application.')
80 81 # default section descriptions
81 82 flag_description = Unicode(flag_description)
82 83 alias_description = Unicode(alias_description)
83 84 keyvalue_description = Unicode(keyvalue_description)
84 85
85 86
86 87 # A sequence of Configurable subclasses whose config=True attributes will
87 88 # be exposed at the command line.
88 89 classes = List([])
89 90
90 91 # The version string of this application.
91 92 version = Unicode(u'0.0')
92 93
93 94 # The log level for the application
94 95 log_level = Enum((0,10,20,30,40,50), default_value=logging.WARN,
95 96 config=True,
96 97 help="Set the log level.")
97 98
98 99 # the alias map for configurables
99 100 aliases = Dict(dict(log_level='Application.log_level'))
100 101
101 102 # flags for loading Configurables or store_const style flags
102 103 # flags are loaded from this dict by '--key' flags
103 104 # this must be a dict of two-tuples, the first element being the Config/dict
104 105 # and the second being the help string for the flag
105 106 flags = Dict()
106 107
107 108 # subcommands for launching other applications
108 109 # if this is not empty, this will be a parent Application
109 110 # this must be a dict of two-tuples, the first element being the application class/import string
110 111 # and the second being the help string for the subcommand
111 112 subcommands = Dict()
112 113 # parse_command_line will initialize a subapp, if requested
113 114 subapp = Instance('IPython.config.application.Application', allow_none=True)
114 115
115 116 # extra command-line arguments that don't set config values
116 117 extra_args = List(Unicode)
117 118
118 119
119 120 def __init__(self, **kwargs):
120 121 SingletonConfigurable.__init__(self, **kwargs)
121 122 # Add my class to self.classes so my attributes appear in command line
122 123 # options.
123 124 self.classes.insert(0, self.__class__)
124 125
125 126 # ensure self.flags dict is valid
126 127 for key,value in self.flags.iteritems():
127 128 assert len(value) == 2, "Bad flag: %r:%s"%(key,value)
128 129 assert isinstance(value[0], (dict, Config)), "Bad flag: %r:%s"%(key,value)
129 130 assert isinstance(value[1], basestring), "Bad flag: %r:%s"%(key,value)
130 131 self.init_logging()
131 132
132 133 def _config_changed(self, name, old, new):
133 134 SingletonConfigurable._config_changed(self, name, old, new)
134 135 self.log.debug('Config changed:')
135 136 self.log.debug(repr(new))
136 137
137 138 def init_logging(self):
138 139 """Start logging for this application.
139 140
140 141 The default is to log to stdout using a StreamHandler. The log level
141 142 starts at logging.WARN, but this can be adjusted by setting the
142 143 ``log_level`` attribute.
143 144 """
144 145 self.log = logging.getLogger(self.__class__.__name__)
145 146 self.log.setLevel(self.log_level)
146 147 self._log_handler = logging.StreamHandler()
147 148 self._log_formatter = logging.Formatter("[%(name)s] %(message)s")
148 149 self._log_handler.setFormatter(self._log_formatter)
149 150 self.log.addHandler(self._log_handler)
150 151
151 152 def initialize(self, argv=None):
152 153 """Do the basic steps to configure me.
153 154
154 155 Override in subclasses.
155 156 """
156 157 self.parse_command_line(argv)
157 158
158 159
159 160 def start(self):
160 161 """Start the app mainloop.
161 162
162 163 Override in subclasses.
163 164 """
164 165 if self.subapp is not None:
165 166 return self.subapp.start()
166 167
167 168 def _log_level_changed(self, name, old, new):
168 169 """Adjust the log level when log_level is set."""
169 170 self.log.setLevel(new)
170 171
171 172 def print_alias_help(self):
172 173 """print the alias part of the help"""
173 174 if not self.aliases:
174 175 return
175 176
176 177 lines = ['Aliases']
177 178 lines.append('-'*len(lines[0]))
178 179 lines.append(self.alias_description)
179 180 lines.append('')
180 181
181 182 classdict = {}
182 183 for cls in self.classes:
183 184 # include all parents (up to, but excluding Configurable) in available names
184 185 for c in cls.mro()[:-3]:
185 186 classdict[c.__name__] = c
186 187
187 188 for alias, longname in self.aliases.iteritems():
188 189 classname, traitname = longname.split('.',1)
189 190 cls = classdict[classname]
190 191
191 192 trait = cls.class_traits(config=True)[traitname]
192 193 help = cls.class_get_trait_help(trait)
193 194 help = help.replace(longname, "%s (%s)"%(alias, longname), 1)
194 195 lines.append(help)
195 196 lines.append('')
196 197 print '\n'.join(lines)
197 198
198 199 def print_flag_help(self):
199 200 """print the flag part of the help"""
200 201 if not self.flags:
201 202 return
202 203
203 204 lines = ['Flags']
204 205 lines.append('-'*len(lines[0]))
205 206 lines.append(self.flag_description)
206 207 lines.append('')
207 208
208 209 for m, (cfg,help) in self.flags.iteritems():
209 210 lines.append('--'+m)
210 211 lines.append(indent(help.strip(), flatten=True))
211 212 lines.append('')
212 213 print '\n'.join(lines)
213 214
214 215 def print_subcommands(self):
215 216 """print the subcommand part of the help"""
216 217 if not self.subcommands:
217 218 return
218 219
219 220 lines = ["Subcommands"]
220 221 lines.append('-'*len(lines[0]))
221 222 for subc, (cls,help) in self.subcommands.iteritems():
222 223 lines.append("%s : %s"%(subc, cls))
223 224 if help:
224 225 lines.append(indent(help.strip(), flatten=True))
225 226 lines.append('')
226 227 print '\n'.join(lines)
227 228
228 229 def print_help(self, classes=False):
229 230 """Print the help for each Configurable class in self.classes.
230 231
231 232 If classes=False (the default), only flags and aliases are printed
232 233 """
233 234 self.print_subcommands()
234 235 self.print_flag_help()
235 236 self.print_alias_help()
236 237
237 238 if classes:
238 239 if self.classes:
239 240 print "Class parameters"
240 241 print "----------------"
241 242 print self.keyvalue_description
242 243 print
243 244
244 245 for cls in self.classes:
245 246 cls.class_print_help()
246 247 print
247 248 else:
248 249 print "To see all available configurables, use `--help-all`"
249 250 print
250 251
251 252 def print_description(self):
252 253 """Print the application description."""
253 254 print self.description
254 255 print
255 256
256 257 def print_version(self):
257 258 """Print the version string."""
258 259 print self.version
259 260
260 261 def update_config(self, config):
261 262 """Fire the traits events when the config is updated."""
262 263 # Save a copy of the current config.
263 264 newconfig = deepcopy(self.config)
264 265 # Merge the new config into the current one.
265 266 newconfig._merge(config)
266 267 # Save the combined config as self.config, which triggers the traits
267 268 # events.
268 269 self.config = newconfig
269 270
270 271 def initialize_subcommand(self, subc, argv=None):
271 272 """Initialize a subcommand with argv"""
272 273 subapp,help = self.subcommands.get(subc)
273 274
274 275 if isinstance(subapp, basestring):
275 276 subapp = import_item(subapp)
276 277
277 278 # clear existing instances
278 279 self.__class__.clear_instance()
279 280 # instantiate
280 281 self.subapp = subapp.instance()
281 282 # and initialize subapp
282 283 self.subapp.initialize(argv)
283 284
284 285 def parse_command_line(self, argv=None):
285 286 """Parse the command line arguments."""
286 287 argv = sys.argv[1:] if argv is None else argv
287 288
288 289 if self.subcommands and len(argv) > 0:
289 290 # we have subcommands, and one may have been specified
290 291 subc, subargv = argv[0], argv[1:]
291 292 if re.match(r'^\w(\-?\w)*$', subc) and subc in self.subcommands:
292 293 # it's a subcommand, and *not* a flag or class parameter
293 294 return self.initialize_subcommand(subc, subargv)
294 295
295 296 if '-h' in argv or '--help' in argv or '--help-all' in argv:
296 297 self.print_description()
297 298 self.print_help('--help-all' in argv)
298 299 self.exit(0)
299 300
300 301 if '--version' in argv:
301 302 self.print_version()
302 303 self.exit(0)
303 304
304 305 loader = KeyValueConfigLoader(argv=argv, aliases=self.aliases,
305 306 flags=self.flags)
306 307 try:
307 308 config = loader.load_config()
308 309 except ArgumentError as e:
309 310 self.log.fatal(str(e))
310 311 self.print_description()
311 312 self.print_help()
312 313 self.exit(1)
313 314 self.update_config(config)
314 315 # store unparsed args in extra_args
315 316 self.extra_args = loader.extra_args
316 317
317 318 def load_config_file(self, filename, path=None):
318 319 """Load a .py based config file by filename and path."""
319 320 loader = PyFileConfigLoader(filename, path=path)
320 321 config = loader.load_config()
321 322 self.update_config(config)
322 323
323 324 def exit(self, exit_status=0):
324 325 self.log.debug("Exiting application: %s" % self.name)
325 326 sys.exit(exit_status)
326 327
327 328 #-----------------------------------------------------------------------------
328 329 # utility functions, for convenience
329 330 #-----------------------------------------------------------------------------
330 331
331 332 def boolean_flag(name, configurable, set_help='', unset_help=''):
332 333 """helper for building basic --trait, --no-trait flags
333 334
334 335 Parameters
335 336 ----------
336 337
337 338 name : str
338 339 The name of the flag.
339 340 configurable : str
340 341 The 'Class.trait' string of the trait to be set/unset with the flag
341 342 set_help : unicode
342 343 help string for --name flag
343 344 unset_help : unicode
344 345 help string for --no-name flag
345 346
346 347 Returns
347 348 -------
348 349
349 350 cfg : dict
350 351 A dict with two keys: 'name', and 'no-name', for setting and unsetting
351 352 the trait, respectively.
352 353 """
353 354 # default helpstrings
354 355 set_help = set_help or "set %s=True"%configurable
355 356 unset_help = unset_help or "set %s=False"%configurable
356 357
357 358 cls,trait = configurable.split('.')
358 359
359 360 setter = {cls : {trait : True}}
360 361 unsetter = {cls : {trait : False}}
361 362 return {name : (setter, set_help), 'no-'+name : (unsetter, unset_help)}
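
A minimal sketch of how `boolean_flag` feeds an Application's `flags` dict, matching the two-tuple (config, help) format validated in Application.__init__ above. `MyApp` and its `debug` trait are hypothetical names for this sketch::

    from IPython.utils.traitlets import Bool, Dict, Unicode
    from IPython.config.application import Application, boolean_flag

    # boolean_flag returns {'debug': (setter, help), 'no-debug': (unsetter, help)}
    flags = {}
    flags.update(boolean_flag('debug', 'MyApp.debug',
                              "set MyApp.debug=True",
                              "set MyApp.debug=False"))

    class MyApp(Application):
        name = Unicode(u'myapp')
        debug = Bool(False, config=True)  # hypothetical trait for this sketch
        flags = Dict(flags)

    app = MyApp()
    app.parse_command_line(['--debug'])  # merges {'MyApp': {'debug': True}}
    assert app.debug  # the config change propagated to the trait
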
@@ -1,278 +1,279 b''
1 1 #!/usr/bin/env python
2 2 # encoding: utf-8
3 3 """
4 4 A base class for objects that are configurable.
5 5
6 6 Authors:
7 7
8 8 * Brian Granger
9 9 * Fernando Perez
10 * Min RK
10 11 """
11 12
12 13 #-----------------------------------------------------------------------------
13 # Copyright (C) 2008-2010 The IPython Development Team
14 # Copyright (C) 2008-2011 The IPython Development Team
14 15 #
15 16 # Distributed under the terms of the BSD License. The full license is in
16 17 # the file COPYING, distributed as part of this software.
17 18 #-----------------------------------------------------------------------------
18 19
19 20 #-----------------------------------------------------------------------------
20 21 # Imports
21 22 #-----------------------------------------------------------------------------
22 23
23 24 from copy import deepcopy
24 25 import datetime
25 26
26 27 from loader import Config
27 28 from IPython.utils.traitlets import HasTraits, Instance
28 29 from IPython.utils.text import indent
29 30
30 31
31 32 #-----------------------------------------------------------------------------
32 33 # Helper classes for Configurables
33 34 #-----------------------------------------------------------------------------
34 35
35 36
36 37 class ConfigurableError(Exception):
37 38 pass
38 39
39 40
40 41 class MultipleInstanceError(ConfigurableError):
41 42 pass
42 43
43 44 #-----------------------------------------------------------------------------
44 45 # Configurable implementation
45 46 #-----------------------------------------------------------------------------
46 47
47 48 class Configurable(HasTraits):
48 49
49 50 config = Instance(Config,(),{})
50 51 created = None
51 52
52 53 def __init__(self, **kwargs):
53 54 """Create a conigurable given a config config.
54 55
55 56 Parameters
56 57 ----------
57 58 config : Config
58 59 If this is empty, default values are used. If config is a
59 60 :class:`Config` instance, it will be used to configure the
60 61 instance.
61 62
62 63 Notes
63 64 -----
64 65 Subclasses of Configurable must call the :meth:`__init__` method of
65 66 :class:`Configurable` *before* doing anything else and using
66 67 :func:`super`::
67 68
68 69 class MyConfigurable(Configurable):
69 70 def __init__(self, config=None):
70 71 super(MyConfigurable, self).__init__(config)
71 72 # Then any other code you need to finish initialization.
72 73
73 74 This ensures that instances will be configured properly.
74 75 """
75 76 config = kwargs.pop('config', None)
76 77 if config is not None:
77 78 # We used to deepcopy, but for now we are trying to just save
78 79 # by reference. This *could* have side effects as all components
79 80 # will share config. In fact, I did find such a side effect in
80 81 # _config_changed below. If a config attribute value was a mutable type
81 82 # all instances of a component were getting the same copy, effectively
82 83 # making that a class attribute.
83 84 # self.config = deepcopy(config)
84 85 self.config = config
85 86 # This should go second so individual keyword arguments override
86 87 # the values in config.
87 88 super(Configurable, self).__init__(**kwargs)
88 89 self.created = datetime.datetime.now()
89 90
90 91 #-------------------------------------------------------------------------
91 92 # Static trait notifications
92 93 #-------------------------------------------------------------------------
93 94
94 95 def _config_changed(self, name, old, new):
95 96 """Update all the class traits having ``config=True`` as metadata.
96 97
97 98 For any class trait with a ``config`` metadata attribute that is
98 99 ``True``, we update the trait with the value of the corresponding
99 100 config entry.
100 101 """
101 102 # Get all traits with a config metadata entry that is True
102 103 traits = self.traits(config=True)
103 104
104 105 # We auto-load config section for this class as well as any parent
105 106 # classes that are Configurable subclasses. This starts with Configurable
106 107 # and works down the mro loading the config for each section.
107 108 section_names = [cls.__name__ for cls in \
108 109 reversed(self.__class__.__mro__) if
109 110 issubclass(cls, Configurable) and issubclass(self.__class__, cls)]
110 111
111 112 for sname in section_names:
112 113 # Don't do a blind getattr as that would cause the config to
113 114 # dynamically create the section with name self.__class__.__name__.
114 115 if new._has_section(sname):
115 116 my_config = new[sname]
116 117 for k, v in traits.iteritems():
117 118 # Don't allow traitlets with config=True to start with
118 119 # uppercase. Otherwise, they are confused with Config
119 120 # subsections. But, developers shouldn't have uppercase
120 121 # attributes anyway! (PEP 8)
121 122 if k[0].upper()==k[0] and not k.startswith('_'):
122 123 raise ConfigurableError('Configurable traitlets with '
123 124 'config=True must start with a lowercase so they are '
124 125 'not confused with Config subsections: %s.%s' % \
125 126 (self.__class__.__name__, k))
126 127 try:
127 128 # Here we grab the value from the config
128 129 # If k has the naming convention of a config
129 130 # section, it will be auto created.
130 131 config_value = my_config[k]
131 132 except KeyError:
132 133 pass
133 134 else:
134 135 # print "Setting %s.%s from %s.%s=%r" % \
135 136 # (self.__class__.__name__,k,sname,k,config_value)
136 137 # We have to do a deepcopy here if we don't deepcopy the entire
137 138 # config object. If we don't, a mutable config_value will be
138 139 # shared by all instances, effectively making it a class attribute.
139 140 setattr(self, k, deepcopy(config_value))
140 141
141 142 @classmethod
142 143 def class_get_help(cls):
143 144 """Get the help string for this class in ReST format."""
144 145 cls_traits = cls.class_traits(config=True)
145 146 final_help = []
146 147 final_help.append(u'%s options' % cls.__name__)
147 148 final_help.append(len(final_help[0])*u'-')
148 149 for k,v in cls.class_traits(config=True).iteritems():
149 150 help = cls.class_get_trait_help(v)
150 151 final_help.append(help)
151 152 return '\n'.join(final_help)
152 153
153 154 @classmethod
154 155 def class_get_trait_help(cls, trait):
155 156 """Get the help string for a single """
156 157 lines = []
157 158 header = "%s.%s : %s" % (cls.__name__, trait.name, trait.__class__.__name__)
158 159 try:
159 160 dvr = repr(trait.get_default_value())
160 161 except Exception:
161 162 dvr = None # ignore defaults we can't construct
162 163 if dvr is not None:
163 164 header += ' [default: %s]'%dvr
164 165 lines.append(header)
165 166
166 167 help = trait.get_metadata('help')
167 168 if help is not None:
168 169 lines.append(indent(help.strip(), flatten=True))
169 170 if 'Enum' in trait.__class__.__name__:
170 171 # include Enum choices
171 172 lines.append(indent('Choices: %r'%(trait.values,), flatten=True))
172 173 return '\n'.join(lines)
173 174
174 175 @classmethod
175 176 def class_print_help(cls):
176 177 print cls.class_get_help()
177 178
178 179
179 180 class SingletonConfigurable(Configurable):
180 181 """A configurable that only allows one instance.
181 182
182 183 This class is for classes that should have only one instance of
183 184 themselves or of *any* subclass. To create and retrieve such an instance, use the
184 185 :meth:`SingletonConfigurable.instance` method.
185 186 """
186 187
187 188 _instance = None
188 189
189 190 @classmethod
190 191 def _walk_mro(cls):
191 192 """Walk the cls.mro() for parent classes that are also singletons
192 193
193 194 For use in instance()
194 195 """
195 196
196 197 for subclass in cls.mro():
197 198 if issubclass(cls, subclass) and \
198 199 issubclass(subclass, SingletonConfigurable) and \
199 200 subclass != SingletonConfigurable:
200 201 yield subclass
201 202
202 203 @classmethod
203 204 def clear_instance(cls):
204 205 """unset _instance for this class and singleton parents.
205 206 """
206 207 if not cls.initialized():
207 208 return
208 209 for subclass in cls._walk_mro():
209 210 if isinstance(subclass._instance, cls):
210 211 # only clear instances that are instances
211 212 # of the calling class
212 213 subclass._instance = None
213 214
214 215 @classmethod
215 216 def instance(cls, *args, **kwargs):
216 217 """Returns a global instance of this class.
217 218
218 219 This method creates a new instance if none has previously been created
219 220 and returns the previously created instance if one already exists.
220 221
221 222 The arguments and keyword arguments passed to this method are passed
222 223 on to the :meth:`__init__` method of the class upon instantiation.
223 224
224 225 Examples
225 226 --------
226 227
227 228 Create a singleton class using instance, and retrieve it::
228 229
229 230 >>> from IPython.config.configurable import SingletonConfigurable
230 231 >>> class Foo(SingletonConfigurable): pass
231 232 >>> foo = Foo.instance()
232 233 >>> foo == Foo.instance()
233 234 True
234 235
235 236 Create a subclass that is retrieved using the base class instance::
236 237
237 238 >>> class Bar(SingletonConfigurable): pass
238 239 >>> class Bam(Bar): pass
239 240 >>> bam = Bam.instance()
240 241 >>> bam == Bar.instance()
241 242 True
242 243 """
243 244 # Create and save the instance
244 245 if cls._instance is None:
245 246 inst = cls(*args, **kwargs)
246 247 # Now make sure that the instance will also be returned by
247 248 # parent classes' _instance attribute.
248 249 for subclass in cls._walk_mro():
249 250 subclass._instance = inst
250 251
251 252 if isinstance(cls._instance, cls):
252 253 return cls._instance
253 254 else:
254 255 raise MultipleInstanceError(
255 256 'Multiple incompatible subclass instances of '
256 257 '%s are being created.' % cls.__name__
257 258 )
258 259
259 260 @classmethod
260 261 def initialized(cls):
261 262 """Has an instance been created?"""
262 263 return hasattr(cls, "_instance") and cls._instance is not None
263 264
264 265
265 266 class LoggingConfigurable(Configurable):
266 267 """A parent class for Configurables that log.
267 268
268 269 Subclasses have a log trait, and the default behavior
269 270 is to get the logger from the currently running Application
270 271 via Application.instance().log.
271 272 """
272 273
273 274 log = Instance('logging.Logger')
274 275 def _log_default(self):
275 276 from IPython.config.application import Application
276 277 return Application.instance().log
277 278
278 279 No newline at end of file
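
A short sketch of the config-to-trait propagation implemented in _config_changed above: only traits tagged config=True are filled from the Config section that shares the class name. `Foo` here is a hypothetical class::

    from IPython.config.configurable import Configurable
    from IPython.config.loader import Config
    from IPython.utils.traitlets import Int

    class Foo(Configurable):
        a = Int(0, config=True)   # picked up from the 'Foo' config section
        b = Int(0)                # no config=True metadata: never configured

    c = Config()
    c.Foo.a = 10                  # attribute access auto-creates the section

    foo = Foo(config=c)
    assert foo.a == 10            # loaded (and deepcopied) from the section
    assert foo.b == 0             # untouched
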
@@ -1,513 +1,514 b''
1 1 """A simple configuration system.
2 2
3 3 Authors
4 4 -------
5 5 * Brian Granger
6 6 * Fernando Perez
7 * Min RK
7 8 """
8 9
9 10 #-----------------------------------------------------------------------------
10 # Copyright (C) 2008-2009 The IPython Development Team
11 # Copyright (C) 2008-2011 The IPython Development Team
11 12 #
12 13 # Distributed under the terms of the BSD License. The full license is in
13 14 # the file COPYING, distributed as part of this software.
14 15 #-----------------------------------------------------------------------------
15 16
16 17 #-----------------------------------------------------------------------------
17 18 # Imports
18 19 #-----------------------------------------------------------------------------
19 20
20 21 import __builtin__
21 22 import re
22 23 import sys
23 24
24 25 from IPython.external import argparse
25 26 from IPython.utils.path import filefind
26 27
27 28 #-----------------------------------------------------------------------------
28 29 # Exceptions
29 30 #-----------------------------------------------------------------------------
30 31
31 32
32 33 class ConfigError(Exception):
33 34 pass
34 35
35 36
36 37 class ConfigLoaderError(ConfigError):
37 38 pass
38 39
39 40 class ArgumentError(ConfigLoaderError):
40 41 pass
41 42
42 43 #-----------------------------------------------------------------------------
43 44 # Argparse fix
44 45 #-----------------------------------------------------------------------------
45 46
46 47 # Unfortunately argparse by default prints help messages to stderr instead of
47 48 # stdout. This makes it annoying to capture long help screens at the command
48 49 # line, since one must know how to pipe stderr, which many users don't know how
49 50 # to do. So we override the print_help method with one that defaults to
50 51 # stdout and use our class instead.
51 52
52 53 class ArgumentParser(argparse.ArgumentParser):
53 54 """Simple argparse subclass that prints help to stdout by default."""
54 55
55 56 def print_help(self, file=None):
56 57 if file is None:
57 58 file = sys.stdout
58 59 return super(ArgumentParser, self).print_help(file)
59 60
60 61 print_help.__doc__ = argparse.ArgumentParser.print_help.__doc__
61 62
62 63 #-----------------------------------------------------------------------------
63 64 # Config class for holding config information
64 65 #-----------------------------------------------------------------------------
65 66
66 67
67 68 class Config(dict):
68 69 """An attribute based dict that can do smart merges."""
69 70
70 71 def __init__(self, *args, **kwds):
71 72 dict.__init__(self, *args, **kwds)
72 73 # This sets self.__dict__ = self, but it has to be done this way
73 74 # because we are also overriding __setattr__.
74 75 dict.__setattr__(self, '__dict__', self)
75 76
76 77 def _merge(self, other):
77 78 to_update = {}
78 79 for k, v in other.iteritems():
79 80 if not self.has_key(k):
80 81 to_update[k] = v
81 82 else: # I have this key
82 83 if isinstance(v, Config):
83 84 # Recursively merge common sub Configs
84 85 self[k]._merge(v)
85 86 else:
86 87 # Plain updates for non-Configs
87 88 to_update[k] = v
88 89
89 90 self.update(to_update)
90 91
91 92 def _is_section_key(self, key):
92 93 if key[0].upper()==key[0] and not key.startswith('_'):
93 94 return True
94 95 else:
95 96 return False
96 97
97 98 def __contains__(self, key):
98 99 if self._is_section_key(key):
99 100 return True
100 101 else:
101 102 return super(Config, self).__contains__(key)
102 103 # .has_key is deprecated for dictionaries.
103 104 has_key = __contains__
104 105
105 106 def _has_section(self, key):
106 107 if self._is_section_key(key):
107 108 if super(Config, self).__contains__(key):
108 109 return True
109 110 return False
110 111
111 112 def copy(self):
112 113 return type(self)(dict.copy(self))
113 114
114 115 def __copy__(self):
115 116 return self.copy()
116 117
117 118 def __deepcopy__(self, memo):
118 119 import copy
119 120 return type(self)(copy.deepcopy(self.items()))
120 121
121 122 def __getitem__(self, key):
122 123 # We cannot use directly self._is_section_key, because it triggers
123 124 # infinite recursion on top of PyPy. Instead, we manually fish the
124 125 # bound method.
125 126 is_section_key = self.__class__._is_section_key.__get__(self)
126 127
127 128 # Because we use this for an exec namespace, we need to delegate
128 129 # the lookup of names in __builtin__ to itself. This means
129 130 # that you can't have section or attribute names that are
130 131 # builtins.
131 132 try:
132 133 return getattr(__builtin__, key)
133 134 except AttributeError:
134 135 pass
135 136 if is_section_key(key):
136 137 try:
137 138 return dict.__getitem__(self, key)
138 139 except KeyError:
139 140 c = Config()
140 141 dict.__setitem__(self, key, c)
141 142 return c
142 143 else:
143 144 return dict.__getitem__(self, key)
144 145
145 146 def __setitem__(self, key, value):
146 147 # Don't allow names in __builtin__ to be modified.
147 148 if hasattr(__builtin__, key):
148 149 raise ConfigError('Config variable names cannot have the same name '
149 150 'as a Python builtin: %s' % key)
150 151 if self._is_section_key(key):
151 152 if not isinstance(value, Config):
152 153 raise ValueError('values whose keys begin with an uppercase '
153 154 'char must be Config instances: %r, %r' % (key, value))
154 155 else:
155 156 dict.__setitem__(self, key, value)
156 157
157 158 def __getattr__(self, key):
158 159 try:
159 160 return self.__getitem__(key)
160 161 except KeyError, e:
161 162 raise AttributeError(e)
162 163
163 164 def __setattr__(self, key, value):
164 165 try:
165 166 self.__setitem__(key, value)
166 167 except KeyError, e:
167 168 raise AttributeError(e)
168 169
169 170 def __delattr__(self, key):
170 171 try:
171 172 dict.__delitem__(self, key)
172 173 except KeyError, e:
173 174 raise AttributeError(e)
174 175
175 176
176 177 #-----------------------------------------------------------------------------
177 178 # Config loading classes
178 179 #-----------------------------------------------------------------------------
179 180
180 181
181 182 class ConfigLoader(object):
182 183 """A object for loading configurations from just about anywhere.
183 184
184 185 The resulting configuration is packaged as a :class:`Struct`.
185 186
186 187 Notes
187 188 -----
188 189 A :class:`ConfigLoader` does one thing: load a config from a source
189 190 (file, command line arguments) and return the data as a :class:`Config`.
190 191 There are lots of things that :class:`ConfigLoader` does not do. It does
191 192 not implement complex logic for finding config files. It does not handle
192 193 default values or merge multiple configs. These things need to be
193 194 handled elsewhere.
194 195 """
195 196
196 197 def __init__(self):
197 198 """A base class for config loaders.
198 199
199 200 Examples
200 201 --------
201 202
202 203 >>> cl = ConfigLoader()
203 204 >>> config = cl.load_config()
204 205 >>> config
205 206 {}
206 207 """
207 208 self.clear()
208 209
209 210 def clear(self):
210 211 self.config = Config()
211 212
212 213 def load_config(self):
213 214 """Load a config from somewhere, return a :class:`Config` instance.
214 215
215 216 Usually, this will cause self.config to be set and then returned.
216 217 However, in most cases, :meth:`ConfigLoader.clear` should be called
217 218 to erase any previous state.
218 219 """
219 220 self.clear()
220 221 return self.config
221 222
222 223
223 224 class FileConfigLoader(ConfigLoader):
224 225 """A base class for file based configurations.
225 226
226 227 As we add more file based config loaders, the common logic should go
227 228 here.
228 229 """
229 230 pass
230 231
231 232
232 233 class PyFileConfigLoader(FileConfigLoader):
233 234 """A config loader for pure python files.
234 235
235 236 This calls execfile on a plain python file and looks for attributes
236 237 that are all caps. These attributes are added to the config object.
237 238 """
238 239
239 240 def __init__(self, filename, path=None):
240 241 """Build a config loader for a filename and path.
241 242
242 243 Parameters
243 244 ----------
244 245 filename : str
245 246 The file name of the config file.
246 247 path : str, list, tuple
247 248 The path to search for the config file on, or a sequence of
248 249 paths to try in order.
249 250 """
250 251 super(PyFileConfigLoader, self).__init__()
251 252 self.filename = filename
252 253 self.path = path
253 254 self.full_filename = ''
254 255 self.data = None
255 256
256 257 def load_config(self):
257 258 """Load the config from a file and return it as a Struct."""
258 259 self.clear()
259 260 self._find_file()
260 261 self._read_file_as_dict()
261 262 self._convert_to_config()
262 263 return self.config
263 264
264 265 def _find_file(self):
265 266 """Try to find the file by searching the paths."""
266 267 self.full_filename = filefind(self.filename, self.path)
267 268
268 269 def _read_file_as_dict(self):
269 270 """Load the config file into self.config, with recursive loading."""
270 271 # This closure is made available in the namespace that is used
271 272 # to exec the config file. This allows users to call
272 273 # load_subconfig('myconfig.py') to load config files recursively.
273 274 # It needs to be a closure because it has references to self.path
274 275 # and self.config. The sub-config is loaded with the same path
275 276 # as the parent, but it uses an empty config which is then merged
276 277 # with the parents.
277 278 def load_subconfig(fname):
278 279 loader = PyFileConfigLoader(fname, self.path)
279 280 try:
280 281 sub_config = loader.load_config()
281 282 except IOError:
282 283 # Pass silently if the sub config is not there. This happens
283 284 # when a user is using a profile, but not the default config.
284 285 pass
285 286 else:
286 287 self.config._merge(sub_config)
287 288
288 289 # Again, this needs to be a closure and should be used in config
289 290 # files to get the config being loaded.
290 291 def get_config():
291 292 return self.config
292 293
293 294 namespace = dict(load_subconfig=load_subconfig, get_config=get_config)
294 295 fs_encoding = sys.getfilesystemencoding() or 'ascii'
295 296 conf_filename = self.full_filename.encode(fs_encoding)
296 297 execfile(conf_filename, namespace)
297 298
298 299 def _convert_to_config(self):
299 300 if self.data is None:
300 301 raise ConfigLoaderError('self.data does not exist')
301 302
302 303
303 304 class CommandLineConfigLoader(ConfigLoader):
304 305 """A config loader for command line arguments.
305 306
306 307 As we add more command line based loaders, the common logic should go
307 308 here.
308 309 """
309 310
310 311 kv_pattern = re.compile(r'[A-Za-z]\w*(\.\w+)*\=.*')
311 312 flag_pattern = re.compile(r'\-\-\w+(\-\w)*')
312 313
313 314 class KeyValueConfigLoader(CommandLineConfigLoader):
314 315 """A config loader that loads key value pairs from the command line.
315 316
316 317 This allows command line options to be given in the following form::
317 318
318 319 ipython Global.profile="foo" InteractiveShell.autocall=False
319 320 """
320 321
321 322 def __init__(self, argv=None, aliases=None, flags=None):
322 323 """Create a key value pair config loader.
323 324
324 325 Parameters
325 326 ----------
326 327 argv : list
327 328 A list that has the form of sys.argv[1:] which has unicode
328 329 elements of the form u"key=value". If this is None (default),
329 330 then sys.argv[1:] will be used.
330 331 aliases : dict
331 332 A dict of aliases for configurable traits.
332 333 Keys are the short aliases, Values are the resolved trait.
333 334 Of the form: `{'alias' : 'Configurable.trait'}`
334 335 flags : dict
335 336 A dict of flags, keyed by str name. Values can be Config objects,
336 337 dicts, or "key=value" strings. If Config or dict, when the flag
337 338 is triggered, the config is loaded as `self.config.update(cfg)`.
338 339
339 340 Returns
340 341 -------
341 342 config : Config
342 343 The resulting Config object.
343 344
344 345 Examples
345 346 --------
346 347
347 348 >>> from IPython.config.loader import KeyValueConfigLoader
348 349 >>> cl = KeyValueConfigLoader()
349 350 >>> cl.load_config(["foo='bar'","A.name='brian'","B.number=0"])
350 351 {'A': {'name': 'brian'}, 'B': {'number': 0}, 'foo': 'bar'}
351 352 """
352 353 if argv is None:
353 354 argv = sys.argv[1:]
354 355 self.argv = argv
355 356 self.aliases = aliases or {}
356 357 self.flags = flags or {}
357 358
358 359 def load_config(self, argv=None, aliases=None, flags=None):
359 360 """Parse the configuration and generate the Config object.
360 361
361 362 Parameters
362 363 ----------
363 364 argv : list, optional
364 365 A list that has the form of sys.argv[1:] which has unicode
365 366 elements of the form u"key=value". If this is None (default),
366 367 then self.argv will be used.
367 368 aliases : dict
368 369 A dict of aliases for configurable traits.
369 370 Keys are the short aliases, Values are the resolved trait.
370 371 Of the form: `{'alias' : 'Configurable.trait'}`
371 372 flags : dict
372 373 A dict of flags, keyed by str name. Values can be Config objects
373 374 or dicts. When the flag is triggered, the config is loaded as
374 375 `self.config.update(cfg)`.
375 376 """
376 377 from IPython.config.configurable import Configurable
377 378
378 379 self.clear()
379 380 if argv is None:
380 381 argv = self.argv
381 382 if aliases is None:
382 383 aliases = self.aliases
383 384 if flags is None:
384 385 flags = self.flags
385 386
386 387 self.extra_args = []
387 388
388 389 for item in argv:
389 390 if kv_pattern.match(item):
390 391 lhs,rhs = item.split('=',1)
391 392 # Substitute longnames for aliases.
392 393 if lhs in aliases:
393 394 lhs = aliases[lhs]
394 395 exec_str = 'self.config.' + lhs + '=' + rhs
395 396 try:
396 397 # Try to see if regular Python syntax will work. This
397 398 # won't handle strings as the quote marks are removed
398 399 # by the system shell.
399 400 exec exec_str in locals(), globals()
400 401 except (NameError, SyntaxError):
401 402 # This case happens if the rhs is a string but without
402 403 # the quote marks. We add the quote marks and see if
403 404 # it succeeds. If it still fails, we let it raise.
404 405 exec_str = 'self.config.' + lhs + '="' + rhs + '"'
405 406 exec exec_str in locals(), globals()
406 407 elif flag_pattern.match(item):
407 408 # trim leading '--'
408 409 m = item[2:]
409 410 cfg,_ = flags.get(m, (None,None))
410 411 if cfg is None:
411 412 raise ArgumentError("Unrecognized flag: %r"%item)
412 413 elif isinstance(cfg, (dict, Config)):
413 414 # don't clobber whole config sections, update
414 415 # each section from config:
415 416 for sec,c in cfg.iteritems():
416 417 self.config[sec].update(c)
417 418 else:
418 419 raise ValueError("Invalid flag: %r"%item)
419 420 elif item.startswith('-'):
420 421 # this shouldn't ever be valid
421 422 raise ArgumentError("Invalid argument: %r"%item)
422 423 else:
423 424 # keep all args that aren't valid in a list,
424 425 # in case our parent knows what to do with them.
425 426 self.extra_args.append(item)
426 427 return self.config
427 428
428 429 class ArgParseConfigLoader(CommandLineConfigLoader):
429 430 """A loader that uses the argparse module to load from the command line."""
430 431
431 432 def __init__(self, argv=None, *parser_args, **parser_kw):
432 433 """Create a config loader for use with argparse.
433 434
434 435 Parameters
435 436 ----------
436 437
437 438 argv : optional, list
438 439 If given, used to read command-line arguments from, otherwise
439 440 sys.argv[1:] is used.
440 441
441 442 parser_args : tuple
442 443 A tuple of positional arguments that will be passed to the
443 444 constructor of :class:`argparse.ArgumentParser`.
444 445
445 446 parser_kw : dict
446 447 A dict of keyword arguments that will be passed to the
447 448 constructor of :class:`argparse.ArgumentParser`.
448 449
449 450 Returns
450 451 -------
451 452 config : Config
452 453 The resulting Config object.
453 454 """
454 455 super(CommandLineConfigLoader, self).__init__()
455 456 if argv is None:
456 457 argv = sys.argv[1:]
457 458 self.argv = argv
458 459 self.parser_args = parser_args
459 460 self.version = parser_kw.pop("version", None)
460 461 kwargs = dict(argument_default=argparse.SUPPRESS)
461 462 kwargs.update(parser_kw)
462 463 self.parser_kw = kwargs
463 464
464 465 def load_config(self, argv=None):
465 466 """Parse command line arguments and return as a Config object.
466 467
467 468 Parameters
468 469 ----------
469 470
470 471 argv : optional, list
471 472 If given, a list with the structure of sys.argv[1:] to parse
472 473 arguments from. If not given, the instance's self.argv attribute
473 474 (given at construction time) is used."""
474 475 self.clear()
475 476 if argv is None:
476 477 argv = self.argv
477 478 self._create_parser()
478 479 self._parse_args(argv)
479 480 self._convert_to_config()
480 481 return self.config
481 482
482 483 def get_extra_args(self):
483 484 if hasattr(self, 'extra_args'):
484 485 return self.extra_args
485 486 else:
486 487 return []
487 488
488 489 def _create_parser(self):
489 490 self.parser = ArgumentParser(*self.parser_args, **self.parser_kw)
490 491 self._add_arguments()
491 492
492 493 def _add_arguments(self):
493 494 raise NotImplementedError("subclasses must implement _add_arguments")
494 495
495 496 def _parse_args(self, args):
496 497 """self.parser->self.parsed_data"""
497 498 # decode sys.argv to support unicode command-line options
498 499 uargs = []
499 500 for a in args:
500 501 if isinstance(a, str):
501 502 # don't decode if we already got unicode
502 503 a = a.decode(sys.stdin.encoding or
503 504 sys.getdefaultencoding())
504 505 uargs.append(a)
505 506 self.parsed_data, self.extra_args = self.parser.parse_known_args(uargs)
506 507
507 508 def _convert_to_config(self):
508 509 """self.parsed_data->self.config"""
509 510 for k, v in vars(self.parsed_data).iteritems():
510 511 exec_str = 'self.config.' + k + '= v'
511 512 exec exec_str in locals(), globals()
512 513
513 514
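
A sketch of KeyValueConfigLoader with aliases and flags, mirroring the parsing loop above; the argv values are illustrative::

    from IPython.config.loader import KeyValueConfigLoader

    aliases = dict(log_level='Application.log_level')
    flags = dict(debug=({'Application': {'log_level': 10}},
                        "set log level to DEBUG"))

    loader = KeyValueConfigLoader(aliases=aliases, flags=flags)
    config = loader.load_config(['log_level=20', '--debug', 'script.py'])

    print config.Application.log_level   # 10: the flag updated the section last
    print loader.extra_args              # ['script.py'] passed through untouched
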
@@ -1,435 +1,436 b''
1 1 # encoding: utf-8
2 2 """
3 3 An application for IPython.
4 4
5 5 All top-level applications should use the classes in this module for
6 6 handling configuration and creating components.
7 7
8 8 The job of an :class:`Application` is to create the master configuration
9 9 object and then create the configurable objects, passing the config to them.
10 10
11 11 Authors:
12 12
13 13 * Brian Granger
14 14 * Fernando Perez
15 * Min RK
15 16
16 17 Notes
17 18 -----
18 19 """
19 20
20 21 #-----------------------------------------------------------------------------
21 22 # Copyright (C) 2008-2009 The IPython Development Team
22 23 #
23 24 # Distributed under the terms of the BSD License. The full license is in
24 25 # the file COPYING, distributed as part of this software.
25 26 #-----------------------------------------------------------------------------
26 27
27 28 #-----------------------------------------------------------------------------
28 29 # Imports
29 30 #-----------------------------------------------------------------------------
30 31
31 32 import logging
32 33 import os
33 34 import shutil
34 35 import sys
35 36
36 37 from IPython.config.application import Application
37 38 from IPython.config.configurable import Configurable
38 39 from IPython.config.loader import Config
39 40 from IPython.core import release, crashhandler
40 41 from IPython.utils.path import get_ipython_dir, get_ipython_package_dir, expand_path
41 42 from IPython.utils.traitlets import List, Unicode, Type, Bool, Dict
42 43
43 44 #-----------------------------------------------------------------------------
44 45 # Classes and functions
45 46 #-----------------------------------------------------------------------------
46 47
47 48
48 49 #-----------------------------------------------------------------------------
49 50 # Module errors
50 51 #-----------------------------------------------------------------------------
51 52
52 53 class ProfileDirError(Exception):
53 54 pass
54 55
55 56
56 57 #-----------------------------------------------------------------------------
57 58 # Class for managing profile directories
58 59 #-----------------------------------------------------------------------------
59 60
60 61 class ProfileDir(Configurable):
61 62 """An object to manage the profile directory and its resources.
62 63
63 64 The profile directory is used by all IPython applications, to manage
64 65 configuration, logging and security.
65 66
66 67 This object knows how to find, create and manage these directories. This
67 68 should be used by any code that wants to handle profiles.
68 69 """
69 70
70 71 security_dir_name = Unicode('security')
71 72 log_dir_name = Unicode('log')
72 73 pid_dir_name = Unicode('pid')
73 74 security_dir = Unicode(u'')
74 75 log_dir = Unicode(u'')
75 76 pid_dir = Unicode(u'')
76 77
77 78 location = Unicode(u'', config=True,
78 79 help="""Set the profile location directly. This overrides the logic used by the
79 80 `profile` option.""",
80 81 )
81 82
82 83 _location_isset = Bool(False) # flag for detecting multiply set location
83 84
84 85 def _location_changed(self, name, old, new):
85 86 if self._location_isset:
86 87 raise RuntimeError("Cannot set profile location more than once.")
87 88 self._location_isset = True
88 89 if not os.path.isdir(new):
89 90 os.makedirs(new)
90 91
91 92 # ensure config files exist:
92 93 self.security_dir = os.path.join(new, self.security_dir_name)
93 94 self.log_dir = os.path.join(new, self.log_dir_name)
94 95 self.pid_dir = os.path.join(new, self.pid_dir_name)
95 96 self.check_dirs()
96 97
97 98 def _log_dir_changed(self, name, old, new):
98 99 self.check_log_dir()
99 100
100 101 def check_log_dir(self):
101 102 if not os.path.isdir(self.log_dir):
102 103 os.mkdir(self.log_dir)
103 104
104 105 def _security_dir_changed(self, name, old, new):
105 106 self.check_security_dir()
106 107
107 108 def check_security_dir(self):
108 109 if not os.path.isdir(self.security_dir):
109 110 os.mkdir(self.security_dir, 0700)
110 111 else:
111 112 os.chmod(self.security_dir, 0700)
112 113
113 114 def _pid_dir_changed(self, name, old, new):
114 115 self.check_pid_dir()
115 116
116 117 def check_pid_dir(self):
117 118 if not os.path.isdir(self.pid_dir):
118 119 os.mkdir(self.pid_dir, 0700)
119 120 else:
120 121 os.chmod(self.pid_dir, 0700)
121 122
122 123 def check_dirs(self):
123 124 self.check_security_dir()
124 125 self.check_log_dir()
125 126 self.check_pid_dir()
126 127
127 128 def copy_config_file(self, config_file, path=None, overwrite=False):
128 129 """Copy a default config file into the active profile directory.
129 130
130 131 Default configuration files are kept in :mod:`IPython.config.default`.
131 132 This function moves these from that location to the working profile
132 133 directory.
133 134 """
134 135 dst = os.path.join(self.location, config_file)
135 136 if os.path.isfile(dst) and not overwrite:
136 137 return
137 138 if path is None:
138 139 path = os.path.join(get_ipython_package_dir(), u'config', u'profile', u'default')
139 140 src = os.path.join(path, config_file)
140 141 shutil.copy(src, dst)
141 142
142 143 @classmethod
143 144 def create_profile_dir(cls, profile_dir, config=None):
144 145 """Create a new profile directory given a full path.
145 146
146 147 Parameters
147 148 ----------
148 149 profile_dir : str
149 150 The full path to the profile directory. If it does exist, it will
150 151 be used. If not, it will be created.
151 152 """
152 153 return cls(location=profile_dir, config=config)
153 154
154 155 @classmethod
155 156 def create_profile_dir_by_name(cls, path, name=u'default', config=None):
156 157 """Create a profile dir by profile name and path.
157 158
158 159 Parameters
159 160 ----------
160 161 path : unicode
161 162 The path (directory) to put the profile directory in.
162 163 name : unicode
163 164 The name of the profile. The name of the profile directory will
164 165 be "profile_<profile>".
165 166 """
166 167 if not os.path.isdir(path):
167 168 raise ProfileDirError('Directory not found: %s' % path)
168 169 profile_dir = os.path.join(path, u'profile_' + name)
169 170 return cls(location=profile_dir, config=config)
170 171
171 172 @classmethod
172 173 def find_profile_dir_by_name(cls, ipython_dir, name=u'default', config=None):
173 174 """Find an existing profile dir by profile name, return its ProfileDir.
174 175
175 176 This searches through a sequence of paths for a profile dir. If it
176 177 is not found, a :class:`ProfileDirError` exception will be raised.
177 178
178 179 The search path algorithm is:
179 180 1. ``os.getcwd()``
180 181 2. ``ipython_dir``
181 182 3. The directories found in the ":" separated
182 183 :env:`IPYTHON_PROFILE_PATH` environment variable.
183 184
184 185 Parameters
185 186 ----------
186 187 ipython_dir : unicode or str
187 188 The IPython directory to use.
188 189 name : unicode or str
189 190 The name of the profile. The name of the profile directory
190 191 will be "profile_<profile>".
191 192 """
192 193 dirname = u'profile_' + name
193 194 profile_dir_paths = os.environ.get('IPYTHON_PROFILE_PATH','')
194 195 if profile_dir_paths:
195 196 profile_dir_paths = profile_dir_paths.split(os.pathsep)
196 197 else:
197 198 profile_dir_paths = []
198 199 paths = [os.getcwd(), ipython_dir] + profile_dir_paths
199 200 for p in paths:
200 201 profile_dir = os.path.join(p, dirname)
201 202 if os.path.isdir(profile_dir):
202 203 return cls(location=profile_dir, config=config)
203 204 else:
204 205 raise ProfileDirError('Profile directory not found in paths: %s' % dirname)
205 206
206 207 @classmethod
207 208 def find_profile_dir(cls, profile_dir, config=None):
208 209 """Find/create a profile dir and return its ProfileDir.
209 210
210 211 This will create the profile directory if it doesn't exist.
211 212
212 213 Parameters
213 214 ----------
214 215 profile_dir : unicode or str
215 216 The path of the profile directory. This is expanded using
216 217 :func:`IPython.utils.genutils.expand_path`.
217 218 """
218 219 profile_dir = expand_path(profile_dir)
219 220 if not os.path.isdir(profile_dir):
220 221 raise ProfileDirError('Profile directory not found: %s' % profile_dir)
221 222 return cls(location=profile_dir, config=config)
222 223
223 224
224 225 #-----------------------------------------------------------------------------
225 226 # Base Application Class
226 227 #-----------------------------------------------------------------------------
227 228
228 229 # aliases and flags
229 230
230 231 base_aliases = dict(
231 232 profile='BaseIPythonApplication.profile',
232 233 ipython_dir='BaseIPythonApplication.ipython_dir',
233 234 )
234 235
235 236 base_flags = dict(
236 237 debug = ({'Application' : {'log_level' : logging.DEBUG}},
237 238 "set log level to logging.DEBUG (maximize logging output)"),
238 239 quiet = ({'Application' : {'log_level' : logging.CRITICAL}},
239 240 "set log level to logging.CRITICAL (minimize logging output)"),
240 241 init = ({'BaseIPythonApplication' : {
241 242 'copy_config_files' : True,
242 243 'auto_create' : True}
243 244 }, "Initialize profile with default config files")
244 245 )
245 246
246 247
247 248 class BaseIPythonApplication(Application):
248 249
249 250 name = Unicode(u'ipython')
250 251 description = Unicode(u'IPython: an enhanced interactive Python shell.')
251 252 version = Unicode(release.version)
252 253
253 254 aliases = Dict(base_aliases)
254 255 flags = Dict(base_flags)
255 256
256 257 # Track whether the config_file has changed,
257 258 # because some logic happens only if we aren't using the default.
258 259 config_file_specified = Bool(False)
259 260
260 261 config_file_name = Unicode(u'ipython_config.py')
261 262 def _config_file_name_changed(self, name, old, new):
262 263 if new != old:
263 264 self.config_file_specified = True
264 265
265 266 # The directory that contains IPython's builtin profiles.
266 267 builtin_profile_dir = Unicode(
267 268 os.path.join(get_ipython_package_dir(), u'config', u'profile', u'default')
268 269 )
269 270
270 271 config_file_paths = List(Unicode)
271 272 def _config_file_paths_default(self):
272 273 return [os.getcwdu()]
273 274
274 275 profile = Unicode(u'default', config=True,
275 276 help="""The IPython profile to use."""
276 277 )
277 278 def _profile_changed(self, name, old, new):
278 279 self.builtin_profile_dir = os.path.join(
279 280 get_ipython_package_dir(), u'config', u'profile', new
280 281 )
281 282
282 283
283 284 ipython_dir = Unicode(get_ipython_dir(), config=True,
284 285 help="""
285 286 The name of the IPython directory. This directory is used for logging
286 287 configuration (through profiles), history storage, etc. The default
287 288 is usually $HOME/.ipython. This option can also be specified through
288 289 the environment variable IPYTHON_DIR.
289 290 """
290 291 )
291 292
292 293 overwrite = Bool(False, config=True,
293 294 help="""Whether to overwrite existing config files when copying""")
294 295 auto_create = Bool(False, config=True,
295 296 help="""Whether to create profile dir if it doesn't exist""")
296 297
297 298 config_files = List(Unicode)
298 299 def _config_files_default(self):
299 300 return [u'ipython_config.py']
300 301
301 302 copy_config_files = Bool(False, config=True,
302 303 help="""Whether to copy the default config files into the profile dir.""")
303 304
304 305 # The class to use as the crash handler.
305 306 crash_handler_class = Type(crashhandler.CrashHandler)
306 307
307 308 def __init__(self, **kwargs):
308 309 super(BaseIPythonApplication, self).__init__(**kwargs)
309 310 # ensure even default IPYTHON_DIR exists
310 311 if not os.path.exists(self.ipython_dir):
311 312 self._ipython_dir_changed('ipython_dir', self.ipython_dir, self.ipython_dir)
312 313
313 314 #-------------------------------------------------------------------------
314 315 # Various stages of Application creation
315 316 #-------------------------------------------------------------------------
316 317
317 318 def init_crash_handler(self):
318 319 """Create a crash handler, typically setting sys.excepthook to it."""
319 320 self.crash_handler = self.crash_handler_class(self)
320 321 sys.excepthook = self.crash_handler
321 322
322 323 def _ipython_dir_changed(self, name, old, new):
323 324 if old in sys.path:
324 325 sys.path.remove(old)
325 326 sys.path.append(os.path.abspath(new))
326 327 if not os.path.isdir(new):
327 328 os.makedirs(new, mode=0777)
328 329 readme = os.path.join(new, 'README')
329 330 if not os.path.exists(readme):
330 331 path = os.path.join(get_ipython_package_dir(), u'config', u'profile')
331 332 shutil.copy(os.path.join(path, 'README'), readme)
332 333 self.log.debug("IPYTHON_DIR set to: %s" % new)
333 334
334 335 def load_config_file(self, suppress_errors=True):
335 336 """Load the config file.
336 337
337 338 By default, errors in loading config are handled, and a warning
338 339 printed on screen. For testing, the suppress_errors option is set
339 340 to False, so errors will make tests fail.
340 341 """
341 342 self.log.debug("Attempting to load config file: %s" %
342 343 self.config_file_name)
343 344 try:
344 345 Application.load_config_file(
345 346 self,
346 347 self.config_file_name,
347 348 path=self.config_file_paths
348 349 )
349 350 except IOError:
350 351 # Only warn if the default config file was NOT being used.
351 352 if self.config_file_specified:
352 353 self.log.warn("Config file not found, skipping: %s" %
353 354 self.config_file_name)
354 355 except:
355 356 # For testing purposes.
356 357 if not suppress_errors:
357 358 raise
358 359 self.log.warn("Error loading config file: %s" %
359 360 self.config_file_name, exc_info=True)
360 361
361 362 def init_profile_dir(self):
362 363 """initialize the profile dir"""
363 364 try:
364 365 # location explicitly specified:
365 366 location = self.config.ProfileDir.location
366 367 except AttributeError:
367 368 # location not specified, find by profile name
368 369 try:
369 370 p = ProfileDir.find_profile_dir_by_name(self.ipython_dir, self.profile, self.config)
370 371 except ProfileDirError:
371 372 # not found, maybe create it (always create default profile)
372 373 if self.auto_create or self.profile=='default':
373 374 try:
374 375 p = ProfileDir.create_profile_dir_by_name(self.ipython_dir, self.profile, self.config)
375 376 except ProfileDirError:
376 377 self.log.fatal("Could not create profile: %r"%self.profile)
377 378 self.exit(1)
378 379 else:
379 380 self.log.info("Created profile dir: %r"%p.location)
380 381 else:
381 382 self.log.fatal("Profile %r not found."%self.profile)
382 383 self.exit(1)
383 384 else:
384 385 self.log.info("Using existing profile dir: %r"%p.location)
385 386 else:
386 387 # location is fully specified
387 388 try:
388 389 p = ProfileDir.find_profile_dir(location, self.config)
389 390 except ProfileDirError:
390 391 # not found, maybe create it
391 392 if self.auto_create:
392 393 try:
393 394 p = ProfileDir.create_profile_dir(location, self.config)
394 395 except ProfileDirError:
395 396 self.log.fatal("Could not create profile directory: %r"%location)
396 397 self.exit(1)
397 398 else:
398 399 self.log.info("Creating new profile dir: %r"%location)
399 400 else:
400 401 self.log.fatal("Profile directory %r not found."%location)
401 402 self.exit(1)
402 403 else:
403 404 self.log.info("Using existing profile dir: %r"%location)
404 405
405 406 self.profile_dir = p
406 407 self.config_file_paths.append(p.location)
407 408
408 409 def init_config_files(self):
409 410 """[optionally] copy default config files into profile dir."""
410 411 # copy config files
411 412 if self.copy_config_files:
412 413 path = self.builtin_profile_dir
413 414 src = self.profile
414 415 if not os.path.exists(path):
415 416 # use default if new profile doesn't have a preset
416 417 path = None
417 418 src = 'default'
418 419
419 420 self.log.debug("Staging %s config files into %r [overwrite=%s]"%(
420 421 src, self.profile_dir.location, self.overwrite)
421 422 )
422 423
423 424 for cfg in self.config_files:
424 425 self.profile_dir.copy_config_file(cfg, path=path, overwrite=self.overwrite)
425 426
426 427 def initialize(self, argv=None):
427 428 self.init_crash_handler()
428 429 self.parse_command_line(argv)
429 430 cl_config = self.config
430 431 self.init_profile_dir()
431 432 self.init_config_files()
432 433 self.load_config_file()
433 434 # ensure command-line opts override config-file opts:
434 435 self.update_config(cl_config)
435 436
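A note on the precedence enforced by initialize() above: the command-line config is parsed and saved first, the config file is loaded second, and the saved command-line config is then re-applied. A minimal sketch of that ordering, using plain dicts rather than the real Config API (values are hypothetical):

# file values load first, then the saved command-line opts are
# re-applied, so command-line options always win over the config file.
file_opts = {'profile': u'default'}    # hypothetical value from ipython_config.py
cl_opts = {'profile': u'mycluster'}    # hypothetical value parsed from argv
opts = {}
opts.update(file_opts)                 # load_config_file()
opts.update(cl_opts)                   # update_config(cl_config)
assert opts['profile'] == u'mycluster'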
@@ -1,32 +1,37 b''
1 """The IPython ZMQ-based parallel computing interface."""
1 """The IPython ZMQ-based parallel computing interface.
2
3 Authors:
4
5 * MinRK
6 """
2 7 #-----------------------------------------------------------------------------
3 8 # Copyright (C) 2011 The IPython Development Team
4 9 #
5 10 # Distributed under the terms of the BSD License. The full license is in
6 11 # the file COPYING, distributed as part of this software.
7 12 #-----------------------------------------------------------------------------
8 13
9 14 #-----------------------------------------------------------------------------
10 15 # Imports
11 16 #-----------------------------------------------------------------------------
12 17
13 18 import os
14 19 import zmq
15 20
16 21
17 22 if os.name == 'nt':
18 23 if zmq.__version__ < '2.1.7':
19 24 raise ImportError("IPython.parallel requires pyzmq/0MQ >= 2.1.7 on Windows, "
20 25 "and you appear to have %s"%zmq.__version__)
21 26 elif zmq.__version__ < '2.1.4':
22 27 raise ImportError("IPython.parallel requires pyzmq/0MQ >= 2.1.4, you appear to have %s"%zmq.__version__)
23 28
24 29 from IPython.utils.pickleutil import Reference
25 30
26 31 from .client.asyncresult import *
27 32 from .client.client import Client
28 33 from .client.remotefunction import *
29 34 from .client.view import *
30 35 from .controller.dependency import *
31 36
32 37
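For context, a minimal usage sketch for the package whose __init__ is shown above, assuming an ipcluster is already running with the default profile (the Client import is per the package __init__ above):

from IPython.parallel import Client

rc = Client()                            # reads ipcontroller-client.json
view = rc[:]                             # DirectView on all engines
print view.apply_sync(lambda x: 2 * x, 21)   # one result per engine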
@@ -1,257 +1,263 b''
1 1 #!/usr/bin/env python
2 2 # encoding: utf-8
3 3 """
4 The IPython cluster directory
4 The Base Application class for IPython.parallel apps
5
6 Authors:
7
8 * Brian Granger
9 * Min RK
10
5 11 """
6 12
7 13 #-----------------------------------------------------------------------------
8 # Copyright (C) 2008-2009 The IPython Development Team
14 # Copyright (C) 2008-2011 The IPython Development Team
9 15 #
10 16 # Distributed under the terms of the BSD License. The full license is in
11 17 # the file COPYING, distributed as part of this software.
12 18 #-----------------------------------------------------------------------------
13 19
14 20 #-----------------------------------------------------------------------------
15 21 # Imports
16 22 #-----------------------------------------------------------------------------
17 23
18 24 from __future__ import with_statement
19 25
20 26 import os
21 27 import logging
22 28 import re
23 29 import sys
24 30
25 31 from subprocess import Popen, PIPE
26 32
27 33 from IPython.core import release
28 34 from IPython.core.crashhandler import CrashHandler
29 35 from IPython.core.newapplication import (
30 36 BaseIPythonApplication,
31 37 base_aliases as base_ip_aliases,
32 38 base_flags as base_ip_flags
33 39 )
34 40 from IPython.utils.path import expand_path
35 41
36 42 from IPython.utils.traitlets import Unicode, Bool, Instance, Dict, List
37 43
38 44 #-----------------------------------------------------------------------------
39 45 # Module errors
40 46 #-----------------------------------------------------------------------------
41 47
42 48 class PIDFileError(Exception):
43 49 pass
44 50
45 51
46 52 #-----------------------------------------------------------------------------
47 53 # Crash handler for this application
48 54 #-----------------------------------------------------------------------------
49 55
50 56
51 57 _message_template = """\
52 58 Oops, $self.app_name crashed. We do our best to make it stable, but...
53 59
54 60 A crash report was automatically generated with the following information:
55 61 - A verbatim copy of the crash traceback.
56 62 - Data on your current $self.app_name configuration.
57 63
58 64 It was left in the file named:
59 65 \t'$self.crash_report_fname'
60 66 If you can email this file to the developers, the information in it will help
61 67 them in understanding and correcting the problem.
62 68
63 69 You can mail it to: $self.contact_name at $self.contact_email
64 70 with the subject '$self.app_name Crash Report'.
65 71
66 72 If you want to do it now, the following command will work (under Unix):
67 73 mail -s '$self.app_name Crash Report' $self.contact_email < $self.crash_report_fname
68 74
69 75 To ensure accurate tracking of this issue, please file a report about it at:
70 76 $self.bug_tracker
71 77 """
72 78
73 79 class ParallelCrashHandler(CrashHandler):
74 80 """sys.excepthook for IPython itself, leaves a detailed report on disk."""
75 81
76 82 message_template = _message_template
77 83
78 84 def __init__(self, app):
79 85 contact_name = release.authors['Min'][0]
80 86 contact_email = release.authors['Min'][1]
81 87 bug_tracker = 'http://github.com/ipython/ipython/issues'
82 88 super(ParallelCrashHandler,self).__init__(
83 89 app, contact_name, contact_email, bug_tracker
84 90 )
85 91
86 92
87 93 #-----------------------------------------------------------------------------
88 94 # Main application
89 95 #-----------------------------------------------------------------------------
90 96 base_aliases = {}
91 97 base_aliases.update(base_ip_aliases)
92 98 base_aliases.update({
93 99 'profile_dir' : 'ProfileDir.location',
94 100 'log_level' : 'BaseParallelApplication.log_level',
95 101 'work_dir' : 'BaseParallelApplication.work_dir',
96 102 'log_to_file' : 'BaseParallelApplication.log_to_file',
97 103 'clean_logs' : 'BaseParallelApplication.clean_logs',
98 104 'log_url' : 'BaseParallelApplication.log_url',
99 105 })
100 106
101 107 base_flags = {
102 108 'log-to-file' : (
103 109 {'BaseParallelApplication' : {'log_to_file' : True}},
104 110 "send log output to a file"
105 111 )
106 112 }
107 113 base_flags.update(base_ip_flags)
108 114
109 115 class BaseParallelApplication(BaseIPythonApplication):
110 116 """The base Application for IPython.parallel apps
111 117
112 118 Principal extensions to BaseIPythonApplication:
113 119
114 120 * work_dir
115 121 * remote logging via pyzmq
116 122 * IOLoop instance
117 123 """
118 124
119 125 crash_handler_class = ParallelCrashHandler
120 126
121 127 def _log_level_default(self):
122 128 # temporarily override default_log_level to INFO
123 129 return logging.INFO
124 130
125 131 work_dir = Unicode(os.getcwdu(), config=True,
126 132 help='Set the working dir for the process.'
127 133 )
128 134 def _work_dir_changed(self, name, old, new):
129 135 self.work_dir = unicode(expand_path(new))
130 136
131 137 log_to_file = Bool(config=True,
132 138 help="whether to log to a file")
133 139
134 140 clean_logs = Bool(False, config=True,
135 141 help="whether to cleanup old logfiles before starting")
136 142
137 143 log_url = Unicode('', config=True,
138 144 help="The ZMQ URL of the iplogger to aggregate logging.")
139 145
140 146 def _config_files_default(self):
141 147 return ['ipcontroller_config.py', 'ipengine_config.py', 'ipcluster_config.py']
142 148
143 149 loop = Instance('zmq.eventloop.ioloop.IOLoop')
144 150 def _loop_default(self):
145 151 from zmq.eventloop.ioloop import IOLoop
146 152 return IOLoop.instance()
147 153
148 154 aliases = Dict(base_aliases)
149 155 flags = Dict(base_flags)
150 156
151 157 def initialize(self, argv=None):
152 158 """initialize the app"""
153 159 super(BaseParallelApplication, self).initialize(argv)
154 160 self.to_work_dir()
155 161 self.reinit_logging()
156 162
157 163 def to_work_dir(self):
158 164 wd = self.work_dir
159 165 if unicode(wd) != os.getcwdu():
160 166 os.chdir(wd)
161 167 self.log.info("Changing to working dir: %s" % wd)
162 168 # This is the working dir by now.
163 169 sys.path.insert(0, '')
164 170
165 171 def reinit_logging(self):
166 172 # Remove old log files
167 173 log_dir = self.profile_dir.log_dir
168 174 if self.clean_logs:
169 175 for f in os.listdir(log_dir):
170 176 if re.match(r'%s-\d+\.(log|err|out)'%self.name,f):
171 177 os.remove(os.path.join(log_dir, f))
172 178 if self.log_to_file:
173 179 # Start logging to the new log file
174 180 log_filename = self.name + u'-' + str(os.getpid()) + u'.log'
175 181 logfile = os.path.join(log_dir, log_filename)
176 182 open_log_file = open(logfile, 'w')
177 183 else:
178 184 open_log_file = None
179 185 if open_log_file is not None:
180 186 self.log.removeHandler(self._log_handler)
181 187 self._log_handler = logging.StreamHandler(open_log_file)
182 188 self._log_formatter = logging.Formatter("[%(name)s] %(message)s")
183 189 self._log_handler.setFormatter(self._log_formatter)
184 190 self.log.addHandler(self._log_handler)
185 191
186 192 def write_pid_file(self, overwrite=False):
187 193 """Create a .pid file in the pid_dir with my pid.
188 194
189 195 This must be called after init_profile_dir, which sets `self.profile_dir`.
190 196 This raises :exc:`PIDFileError` if the pid file exists already.
191 197 """
192 198 pid_file = os.path.join(self.profile_dir.pid_dir, self.name + u'.pid')
193 199 if os.path.isfile(pid_file):
194 200 pid = self.get_pid_from_file()
195 201 if not overwrite:
196 202 raise PIDFileError(
197 203 'The pid file [%s] already exists. \nThis could mean that this '
198 204 'server is already running with [pid=%s].' % (pid_file, pid)
199 205 )
200 206 with open(pid_file, 'w') as f:
201 207 self.log.info("Creating pid file: %s" % pid_file)
202 208 f.write(repr(os.getpid())+'\n')
203 209
204 210 def remove_pid_file(self):
205 211 """Remove the pid file.
206 212
207 213 This should be called at shutdown, e.g. by registering a callback
208 214 with the event loop or :mod:`atexit`. This needs to return
209 215 ``None``.
210 216 """
211 217 pid_file = os.path.join(self.profile_dir.pid_dir, self.name + u'.pid')
212 218 if os.path.isfile(pid_file):
213 219 try:
214 220 self.log.info("Removing pid file: %s" % pid_file)
215 221 os.remove(pid_file)
216 222 except:
217 223 self.log.warn("Error removing the pid file: %s" % pid_file)
218 224
219 225 def get_pid_from_file(self):
220 226 """Get the pid from the pid file.
221 227
222 228 If the pid file doesn't exist a :exc:`PIDFileError` is raised.
223 229 """
224 230 pid_file = os.path.join(self.profile_dir.pid_dir, self.name + u'.pid')
225 231 if os.path.isfile(pid_file):
226 232 with open(pid_file, 'r') as f:
227 233 pid = int(f.read().strip())
228 234 return pid
229 235 else:
230 236 raise PIDFileError('pid file not found: %s' % pid_file)
231 237
232 238 def check_pid(self, pid):
233 239 if os.name == 'nt':
234 240 try:
235 241 import ctypes
236 242 # returns 0 if no such process (of ours) exists
237 243 # positive int otherwise
238 244 p = ctypes.windll.kernel32.OpenProcess(1,0,pid)
239 245 except Exception:
240 246 self.log.warn(
241 247 "Could not determine whether pid %i is running via `OpenProcess`. "
242 248 " Making the likely assumption that it is."%pid
243 249 )
244 250 return True
245 251 return bool(p)
246 252 else:
247 253 try:
248 254 p = Popen(['ps','x'], stdout=PIPE, stderr=PIPE)
249 255 output,_ = p.communicate()
250 256 except OSError:
251 257 self.log.warn(
252 258 "Could not determine whether pid %i is running via `ps x`. "
253 259 " Making the likely assumption that it is."%pid
254 260 )
255 261 return True
256 262 pids = map(int, re.findall(r'^\W*\d+', output, re.MULTILINE))
257 263 return pid in pids
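A short sketch of the pid-file protocol implemented by the methods above; `app` stands for a hypothetical, already-configured BaseParallelApplication subclass instance:

app.write_pid_file(overwrite=True)   # writes <pid_dir>/<name>.pid
pid = app.get_pid_from_file()        # int; raises PIDFileError if the file is absent
if not app.check_pid(pid):           # pid file is stale: process no longer running
    app.remove_pid_file()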
@@ -1,521 +1,527 b''
1 1 #!/usr/bin/env python
2 2 # encoding: utf-8
3 3 """
4 4 The ipcluster application.
5
6 Authors:
7
8 * Brian Granger
9 * MinRK
10
5 11 """
6 12
7 13 #-----------------------------------------------------------------------------
8 # Copyright (C) 2008-2009 The IPython Development Team
14 # Copyright (C) 2008-2011 The IPython Development Team
9 15 #
10 16 # Distributed under the terms of the BSD License. The full license is in
11 17 # the file COPYING, distributed as part of this software.
12 18 #-----------------------------------------------------------------------------
13 19
14 20 #-----------------------------------------------------------------------------
15 21 # Imports
16 22 #-----------------------------------------------------------------------------
17 23
18 24 import errno
19 25 import logging
20 26 import os
21 27 import re
22 28 import signal
23 29
24 30 from subprocess import check_call, CalledProcessError, PIPE
25 31 import zmq
26 32 from zmq.eventloop import ioloop
27 33
28 34 from IPython.config.application import Application, boolean_flag
29 35 from IPython.config.loader import Config
30 36 from IPython.core.newapplication import BaseIPythonApplication, ProfileDir
31 37 from IPython.utils.importstring import import_item
32 38 from IPython.utils.traitlets import Int, Unicode, Bool, CFloat, Dict, List
33 39
34 40 from IPython.parallel.apps.baseapp import (
35 41 BaseParallelApplication,
36 42 PIDFileError,
37 43 base_flags, base_aliases
38 44 )
39 45
40 46
41 47 #-----------------------------------------------------------------------------
42 48 # Module level variables
43 49 #-----------------------------------------------------------------------------
44 50
45 51
46 52 default_config_file_name = u'ipcluster_config.py'
47 53
48 54
49 55 _description = """Start an IPython cluster for parallel computing.
50 56
51 57 An IPython cluster consists of 1 controller and 1 or more engines.
52 58 This command automates the startup of these processes using a wide
53 59 range of startup methods (SSH, local processes, PBS, mpiexec,
54 60 Windows HPC Server 2008). To start a cluster with 4 engines on your
55 61 local host simply do 'ipcluster start n=4'. For more complex usage
56 62 you will typically do 'ipcluster create profile=mycluster', then edit
57 63 configuration files, followed by 'ipcluster start profile=mycluster n=4'.
58 64 """
59 65
60 66
61 67 # Exit codes for ipcluster
62 68
63 69 # This will be the exit code if the ipcluster appears to be running because
64 70 # a .pid file exists
65 71 ALREADY_STARTED = 10
66 72
67 73
68 74 # This will be the exit code if ipcluster stop is run, but there is no .pid
69 75 # file to be found.
70 76 ALREADY_STOPPED = 11
71 77
72 78 # This will be the exit code if ipcluster engines is run, but there is no .pid
73 79 # file to be found.
74 80 NO_CLUSTER = 12
75 81
76 82
77 83 #-----------------------------------------------------------------------------
78 84 # Main application
79 85 #-----------------------------------------------------------------------------
80 86 start_help = """Start an IPython cluster for parallel computing
81 87
82 88 Start an ipython cluster by its profile name or cluster
83 89 directory. Cluster directories contain configuration, log and
84 90 security related files and are named using the convention
85 91 'cluster_<profile>' and should be created using the 'start'
86 92 subcommand of 'ipcluster'. If your cluster directory is in
87 93 the cwd or the ipython directory, you can simply refer to it
88 94 using its profile name, 'ipcluster start n=4 profile=<profile>',
89 95 otherwise use the 'profile_dir' option.
90 96 """
91 97 stop_help = """Stop a running IPython cluster
92 98
93 99 Stop a running ipython cluster by its profile name or cluster
94 100 directory. Cluster directories are named using the convention
95 101 'cluster_<profile>'. If your cluster directory is in
96 102 the cwd or the ipython directory, you can simply refer to it
97 103 using its profile name, 'ipcluster stop profile=<profile>', otherwise
98 104 use the 'profile_dir' option.
99 105 """
100 106 engines_help = """Start engines connected to an existing IPython cluster
101 107
102 108 Start one or more engines to connect to an existing Cluster
103 109 by profile name or cluster directory.
104 110 Cluster directories contain configuration, log and
105 111 security related files and are named using the convention
106 112 'cluster_<profile>' and should be created using the 'start'
107 113 subcommand of 'ipcluster'. If your cluster directory is in
108 114 the cwd or the ipython directory, you can simply refer to it
109 115 using its profile name, 'ipcluster engines n=4 profile=<profile>',
110 116 otherwise use the 'profile_dir' option.
111 117 """
112 118 create_help = """Create an ipcluster profile by name
113 119
114 120 Create an ipython cluster directory by its profile name or
115 121 cluster directory path. Cluster directories contain
116 122 configuration, log and security related files and are named
117 123 using the convention 'cluster_<profile>'. By default they are
118 124 located in your ipython directory. Once created, you will
119 125 probably need to edit the configuration files in the cluster
120 126 directory to configure your cluster. Most users will create a
121 127 cluster directory by profile name,
122 128 `ipcluster create profile=mycluster`, which will put the directory
123 129 in `<ipython_dir>/cluster_mycluster`.
124 130 """
125 131 list_help = """List available cluster profiles
126 132
127 133 List all available clusters, by cluster directory, that can
128 134 be found in the current working directory or in the ipython
129 135 directory. Cluster directories are named using the convention
130 136 'cluster_<profile>'.
131 137 """
132 138
133 139
134 140 class IPClusterList(BaseIPythonApplication):
135 141 name = u'ipcluster-list'
136 142 description = list_help
137 143
138 144 # empty aliases
139 145 aliases=Dict()
140 146 flags = Dict(base_flags)
141 147
142 148 def _log_level_default(self):
143 149 return 20
144 150
145 151 def list_profile_dirs(self):
146 152 # Find the search paths
147 153 profile_dir_paths = os.environ.get('IPYTHON_PROFILE_PATH','')
148 154 if profile_dir_paths:
149 155 profile_dir_paths = profile_dir_paths.split(':')
150 156 else:
151 157 profile_dir_paths = []
152 158
153 159 ipython_dir = self.ipython_dir
154 160
155 161 paths = [os.getcwd(), ipython_dir] + profile_dir_paths
156 162 paths = list(set(paths))
157 163
158 164 self.log.info('Searching for cluster profiles in paths: %r' % paths)
159 165 for path in paths:
160 166 files = os.listdir(path)
161 167 for f in files:
162 168 full_path = os.path.join(path, f)
163 169 if os.path.isdir(full_path) and f.startswith('profile_') and \
164 170 os.path.isfile(os.path.join(full_path, 'ipcontroller_config.py')):
165 171 profile = f.split('_')[-1]
166 172 start_cmd = 'ipcluster start profile=%s n=4' % profile
167 173 print start_cmd + " ==> " + full_path
168 174
169 175 def start(self):
170 176 self.list_profile_dirs()
171 177
172 178
173 179 # `ipcluster create` will be deprecated when `ipython profile create` or equivalent exists
174 180
175 181 create_flags = {}
176 182 create_flags.update(base_flags)
177 183 create_flags.update(boolean_flag('reset', 'IPClusterCreate.overwrite',
178 184 "reset config files to defaults", "leave existing config files"))
179 185
180 186 class IPClusterCreate(BaseParallelApplication):
181 187 name = u'ipcluster-create'
182 188 description = create_help
183 189 auto_create = Bool(True)
184 190 config_file_name = Unicode(default_config_file_name)
185 191
186 192 flags = Dict(create_flags)
187 193
188 194 aliases = Dict(dict(profile='BaseIPythonApplication.profile'))
189 195
190 196 classes = [ProfileDir]
191 197
192 198
193 199 stop_aliases = dict(
194 200 signal='IPClusterStop.signal',
195 201 profile='BaseIPythonApplication.profile',
196 202 profile_dir='ProfileDir.location',
197 203 )
198 204
199 205 class IPClusterStop(BaseParallelApplication):
200 206 name = u'ipcluster'
201 207 description = stop_help
202 208 config_file_name = Unicode(default_config_file_name)
203 209
204 210 signal = Int(signal.SIGINT, config=True,
205 211 help="signal to use for stopping processes.")
206 212
207 213 aliases = Dict(stop_aliases)
208 214
209 215 def start(self):
210 216 """Start the app for the stop subcommand."""
211 217 try:
212 218 pid = self.get_pid_from_file()
213 219 except PIDFileError:
214 220 self.log.critical(
215 221 'Could not read pid file, cluster is probably not running.'
216 222 )
217 223 # Here I exit with an unusual exit status that other processes
218 224 # can watch for to learn how I exited.
219 225 self.remove_pid_file()
220 226 self.exit(ALREADY_STOPPED)
221 227
222 228 if not self.check_pid(pid):
223 229 self.log.critical(
224 230 'Cluster [pid=%r] is not running.' % pid
225 231 )
226 232 self.remove_pid_file()
227 233 # Here I exit with an unusual exit status that other processes
228 234 # can watch for to learn how I exited.
229 235 self.exit(ALREADY_STOPPED)
230 236
231 237 elif os.name=='posix':
232 238 sig = self.signal
233 239 self.log.info(
234 240 "Stopping cluster [pid=%r] with [signal=%r]" % (pid, sig)
235 241 )
236 242 try:
237 243 os.kill(pid, sig)
238 244 except OSError:
239 245 self.log.error("Stopping cluster failed, assuming already dead.",
240 246 exc_info=True)
241 247 self.remove_pid_file()
242 248 elif os.name=='nt':
243 249 try:
244 250 # kill the whole tree
245 251 p = check_call(['taskkill', '-pid', str(pid), '-t', '-f'], stdout=PIPE,stderr=PIPE)
246 252 except (CalledProcessError, OSError):
247 253 self.log.error("Stopping cluster failed, assuming already dead.",
248 254 exc_info=True)
249 255 self.remove_pid_file()
250 256
251 257 engine_aliases = {}
252 258 engine_aliases.update(base_aliases)
253 259 engine_aliases.update(dict(
254 260 n='IPClusterEngines.n',
255 261 elauncher = 'IPClusterEngines.engine_launcher_class',
256 262 ))
257 263 class IPClusterEngines(BaseParallelApplication):
258 264
259 265 name = u'ipcluster'
260 266 description = engines_help
261 267 usage = None
262 268 config_file_name = Unicode(default_config_file_name)
263 269 default_log_level = logging.INFO
264 270 classes = List()
265 271 def _classes_default(self):
266 272 from IPython.parallel.apps import launcher
267 273 launchers = launcher.all_launchers
268 274 eslaunchers = [ l for l in launchers if 'EngineSet' in l.__name__]
269 275 return [ProfileDir]+eslaunchers
270 276
271 277 n = Int(2, config=True,
272 278 help="The number of engines to start.")
273 279
274 280 engine_launcher_class = Unicode('LocalEngineSetLauncher',
275 281 config=True,
276 282 help="The class for launching a set of Engines."
277 283 )
278 284 daemonize = Bool(False, config=True,
279 285 help='Daemonize the ipcluster program. This implies --log-to-file')
280 286
281 287 def _daemonize_changed(self, name, old, new):
282 288 if new:
283 289 self.log_to_file = True
284 290
285 291 aliases = Dict(engine_aliases)
286 292 # flags = Dict(flags)
287 293 _stopping = False
288 294
289 295 def initialize(self, argv=None):
290 296 super(IPClusterEngines, self).initialize(argv)
291 297 self.init_signal()
292 298 self.init_launchers()
293 299
294 300 def init_launchers(self):
295 301 self.engine_launcher = self.build_launcher(self.engine_launcher_class)
296 302 self.engine_launcher.on_stop(lambda r: self.loop.stop())
297 303
298 304 def init_signal(self):
299 305 # Setup signals
300 306 signal.signal(signal.SIGINT, self.sigint_handler)
301 307
302 308 def build_launcher(self, clsname):
303 309 """import and instantiate a Launcher based on importstring"""
304 310 if '.' not in clsname:
305 311 # not a module, presume it's the raw name in apps.launcher
306 312 clsname = 'IPython.parallel.apps.launcher.'+clsname
307 313 # print repr(clsname)
308 314 klass = import_item(clsname)
309 315
310 316 launcher = klass(
311 317 work_dir=self.profile_dir.location, config=self.config, log=self.log
312 318 )
313 319 return launcher
314 320
315 321 def start_engines(self):
316 322 self.log.info("Starting %i engines"%self.n)
317 323 self.engine_launcher.start(
318 324 self.n,
319 325 self.profile_dir.location
320 326 )
321 327
322 328 def stop_engines(self):
323 329 self.log.info("Stopping Engines...")
324 330 if self.engine_launcher.running:
325 331 d = self.engine_launcher.stop()
326 332 return d
327 333 else:
328 334 return None
329 335
330 336 def stop_launchers(self, r=None):
331 337 if not self._stopping:
332 338 self._stopping = True
333 339 self.log.error("IPython cluster: stopping")
334 340 self.stop_engines()
335 341 # Wait a few seconds to let things shut down.
336 342 dc = ioloop.DelayedCallback(self.loop.stop, 4000, self.loop)
337 343 dc.start()
338 344
339 345 def sigint_handler(self, signum, frame):
340 346 self.log.debug("SIGINT received, stopping launchers...")
341 347 self.stop_launchers()
342 348
343 349 def start_logging(self):
344 350 # Remove old log files of the controller and engine
345 351 if self.clean_logs:
346 352 log_dir = self.profile_dir.log_dir
347 353 for f in os.listdir(log_dir):
348 354 if re.match(r'ip(engine|controller)z-\d+\.(log|err|out)',f):
349 355 os.remove(os.path.join(log_dir, f))
350 356 # This will remove old log files for ipcluster itself
351 357 # super(IPBaseParallelApplication, self).start_logging()
352 358
353 359 def start(self):
354 360 """Start the app for the engines subcommand."""
355 361 self.log.info("IPython cluster: started")
356 362 # First see if the cluster is already running
357 363
358 364 # Now log and daemonize
359 365 self.log.info(
360 366 'Starting engines with [daemon=%r]' % self.daemonize
361 367 )
362 368 # TODO: Get daemonize working on Windows or as a Windows Server.
363 369 if self.daemonize:
364 370 if os.name=='posix':
365 371 from twisted.scripts._twistd_unix import daemonize
366 372 daemonize()
367 373
368 374 dc = ioloop.DelayedCallback(self.start_engines, 0, self.loop)
369 375 dc.start()
370 376 # Now write the new pid file AFTER our new forked pid is active.
371 377 # self.write_pid_file()
372 378 try:
373 379 self.loop.start()
374 380 except KeyboardInterrupt:
375 381 pass
376 382 except zmq.ZMQError as e:
377 383 if e.errno == errno.EINTR:
378 384 pass
379 385 else:
380 386 raise
381 387
382 388 start_aliases = {}
383 389 start_aliases.update(engine_aliases)
384 390 start_aliases.update(dict(
385 391 delay='IPClusterStart.delay',
386 392 clean_logs='IPClusterStart.clean_logs',
387 393 ))
388 394
389 395 class IPClusterStart(IPClusterEngines):
390 396
391 397 name = u'ipcluster'
392 398 description = start_help
393 399 default_log_level = logging.INFO
394 400 auto_create = Bool(True, config=True,
395 401 help="whether to create the profile_dir if it doesn't exist")
396 402 classes = List()
397 403 def _classes_default(self):
398 404 from IPython.parallel.apps import launcher
399 405 return [ProfileDir]+launcher.all_launchers
400 406
401 407 clean_logs = Bool(True, config=True,
402 408 help="whether to cleanup old logs before starting")
403 409
404 410 delay = CFloat(1., config=True,
405 411 help="delay (in s) between starting the controller and the engines")
406 412
407 413 controller_launcher_class = Unicode('LocalControllerLauncher',
408 414 config=True,
409 415 help="The class for launching a Controller."
410 416 )
411 417 reset = Bool(False, config=True,
412 418 help="Whether to reset config files as part of '--create'."
413 419 )
414 420
415 421 # flags = Dict(flags)
416 422 aliases = Dict(start_aliases)
417 423
418 424 def init_launchers(self):
419 425 self.controller_launcher = self.build_launcher(self.controller_launcher_class)
420 426 self.engine_launcher = self.build_launcher(self.engine_launcher_class)
421 427 self.controller_launcher.on_stop(self.stop_launchers)
422 428
423 429 def start_controller(self):
424 430 self.controller_launcher.start(
425 431 self.profile_dir.location
426 432 )
427 433
428 434 def stop_controller(self):
429 435 # self.log.info("In stop_controller")
430 436 if self.controller_launcher and self.controller_launcher.running:
431 437 return self.controller_launcher.stop()
432 438
433 439 def stop_launchers(self, r=None):
434 440 if not self._stopping:
435 441 self.stop_controller()
436 442 super(IPClusterStart, self).stop_launchers()
437 443
438 444 def start(self):
439 445 """Start the app for the start subcommand."""
440 446 # First see if the cluster is already running
441 447 try:
442 448 pid = self.get_pid_from_file()
443 449 except PIDFileError:
444 450 pass
445 451 else:
446 452 if self.check_pid(pid):
447 453 self.log.critical(
448 454 'Cluster is already running with [pid=%s]. '
449 455 'Use "ipcluster stop" to stop the cluster.' % pid
450 456 )
451 457 # Here I exit with an unusual exit status that other processes
452 458 # can watch for to learn how I exited.
453 459 self.exit(ALREADY_STARTED)
454 460 else:
455 461 self.remove_pid_file()
456 462
457 463
458 464 # Now log and daemonize
459 465 self.log.info(
460 466 'Starting ipcluster with [daemon=%r]' % self.daemonize
461 467 )
462 468 # TODO: Get daemonize working on Windows or as a Windows Server.
463 469 if self.daemonize:
464 470 if os.name=='posix':
465 471 from twisted.scripts._twistd_unix import daemonize
466 472 daemonize()
467 473
468 474 dc = ioloop.DelayedCallback(self.start_controller, 0, self.loop)
469 475 dc.start()
470 476 dc = ioloop.DelayedCallback(self.start_engines, 1000*self.delay, self.loop)
471 477 dc.start()
472 478 # Now write the new pid file AFTER our new forked pid is active.
473 479 self.write_pid_file()
474 480 try:
475 481 self.loop.start()
476 482 except KeyboardInterrupt:
477 483 pass
478 484 except zmq.ZMQError as e:
479 485 if e.errno == errno.EINTR:
480 486 pass
481 487 else:
482 488 raise
483 489 finally:
484 490 self.remove_pid_file()
485 491
486 492 base='IPython.parallel.apps.ipclusterapp.IPCluster'
487 493
488 494 class IPBaseParallelApplication(Application):
489 495 name = u'ipcluster'
490 496 description = _description
491 497
492 498 subcommands = {'create' : (base+'Create', create_help),
493 499 'list' : (base+'List', list_help),
494 500 'start' : (base+'Start', start_help),
495 501 'stop' : (base+'Stop', stop_help),
496 502 'engines' : (base+'Engines', engines_help),
497 503 }
498 504
499 505 # no aliases or flags for parent App
500 506 aliases = Dict()
501 507 flags = Dict()
502 508
503 509 def start(self):
504 510 if self.subapp is None:
505 511 print "No subcommand specified! Must specify one of: %s"%(self.subcommands.keys())
506 512 print
507 513 self.print_subcommands()
508 514 self.exit(1)
509 515 else:
510 516 return self.subapp.start()
511 517
512 518 def launch_new_instance():
513 519 """Create and run the IPython cluster."""
514 520 app = IPBaseParallelApplication.instance()
515 521 app.initialize()
516 522 app.start()
517 523
518 524
519 525 if __name__ == '__main__':
520 526 launch_new_instance()
521 527
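A simplified sketch of how the subcommand table above resolves to a concrete app; the actual dispatch is assumed to live in the Application base class, and the argv values are illustrative:

from IPython.utils.importstring import import_item

base = 'IPython.parallel.apps.ipclusterapp.IPCluster'
subcommands = {'start': (base + 'Start', start_help)}

cls = import_item(subcommands['start'][0])    # -> IPClusterStart
app = cls.instance()
app.initialize(['n=4', 'profile=mycluster'])  # remaining argv after the subcommand
app.start()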
@@ -1,402 +1,408 b''
1 1 #!/usr/bin/env python
2 2 # encoding: utf-8
3 3 """
4 4 The IPython controller application.
5
6 Authors:
7
8 * Brian Granger
9 * MinRK
10
5 11 """
6 12
7 13 #-----------------------------------------------------------------------------
8 # Copyright (C) 2008-2009 The IPython Development Team
14 # Copyright (C) 2008-2011 The IPython Development Team
9 15 #
10 16 # Distributed under the terms of the BSD License. The full license is in
11 17 # the file COPYING, distributed as part of this software.
12 18 #-----------------------------------------------------------------------------
13 19
14 20 #-----------------------------------------------------------------------------
15 21 # Imports
16 22 #-----------------------------------------------------------------------------
17 23
18 24 from __future__ import with_statement
19 25
20 26 import os
21 27 import socket
22 28 import stat
23 29 import sys
24 30 import uuid
25 31
26 32 from multiprocessing import Process
27 33
28 34 import zmq
29 35 from zmq.devices import ProcessMonitoredQueue
30 36 from zmq.log.handlers import PUBHandler
31 37 from zmq.utils import jsonapi as json
32 38
33 39 from IPython.config.application import boolean_flag
34 40 from IPython.core.newapplication import ProfileDir
35 41
36 42 from IPython.parallel.apps.baseapp import (
37 43 BaseParallelApplication,
38 44 base_flags
39 45 )
40 46 from IPython.utils.importstring import import_item
41 47 from IPython.utils.traitlets import Instance, Unicode, Bool, List, Dict
42 48
43 49 # from IPython.parallel.controller.controller import ControllerFactory
44 50 from IPython.zmq.session import Session
45 51 from IPython.parallel.controller.heartmonitor import HeartMonitor
46 52 from IPython.parallel.controller.hub import HubFactory
47 53 from IPython.parallel.controller.scheduler import TaskScheduler,launch_scheduler
48 54 from IPython.parallel.controller.sqlitedb import SQLiteDB
49 55
50 56 from IPython.parallel.util import signal_children, split_url
51 57
52 58 # conditional import of MongoDB backend class
53 59
54 60 try:
55 61 from IPython.parallel.controller.mongodb import MongoDB
56 62 except ImportError:
57 63 maybe_mongo = []
58 64 else:
59 65 maybe_mongo = [MongoDB]
60 66
61 67
62 68 #-----------------------------------------------------------------------------
63 69 # Module level variables
64 70 #-----------------------------------------------------------------------------
65 71
66 72
67 73 #: The default config file name for this application
68 74 default_config_file_name = u'ipcontroller_config.py'
69 75
70 76
71 77 _description = """Start the IPython controller for parallel computing.
72 78
73 79 The IPython controller provides a gateway between the IPython engines and
74 80 clients. The controller needs to be started before the engines and can be
75 81 configured using command line options or using a cluster directory. Cluster
76 82 directories contain config, log and security files and are usually located in
77 83 your ipython directory and named as "cluster_<profile>". See the `profile`
78 84 and `profile_dir` options for details.
79 85 """
80 86
81 87
82 88
83 89
84 90 #-----------------------------------------------------------------------------
85 91 # The main application
86 92 #-----------------------------------------------------------------------------
87 93 flags = {}
88 94 flags.update(base_flags)
89 95 flags.update({
90 96 'usethreads' : ( {'IPControllerApp' : {'use_threads' : True}},
91 97 'Use threads instead of processes for the schedulers'),
92 98 'sqlitedb' : ({'HubFactory' : {'db_class' : 'IPython.parallel.controller.sqlitedb.SQLiteDB'}},
93 99 'use the SQLiteDB backend'),
94 100 'mongodb' : ({'HubFactory' : {'db_class' : 'IPython.parallel.controller.mongodb.MongoDB'}},
95 101 'use the MongoDB backend'),
96 102 'dictdb' : ({'HubFactory' : {'db_class' : 'IPython.parallel.controller.dictdb.DictDB'}},
97 103 'use the in-memory DictDB backend'),
98 104 'reuse' : ({'IPControllerApp' : {'reuse_files' : True}},
99 105 'reuse existing json connection files')
100 106 })
101 107
102 108 flags.update(boolean_flag('secure', 'IPControllerApp.secure',
103 109 "Use HMAC digests for authentication of messages.",
104 110 "Don't authenticate messages."
105 111 ))
106 112
107 113 class IPControllerApp(BaseParallelApplication):
108 114
109 115 name = u'ipcontroller'
110 116 description = _description
111 117 config_file_name = Unicode(default_config_file_name)
112 118 classes = [ProfileDir, Session, HubFactory, TaskScheduler, HeartMonitor, SQLiteDB] + maybe_mongo
113 119
114 120 # change default to True
115 121 auto_create = Bool(True, config=True,
116 122 help="""Whether to create profile dir if it doesn't exist.""")
117 123
118 124 reuse_files = Bool(False, config=True,
119 125 help='Whether to reuse existing json connection files.'
120 126 )
121 127 secure = Bool(True, config=True,
122 128 help='Whether to use HMAC digests for extra message authentication.'
123 129 )
124 130 ssh_server = Unicode(u'', config=True,
125 131 help="""ssh url for clients to use when connecting to the Controller
126 132 processes. It should be of the form: [user@]server[:port]. The
127 133 Controller's listening addresses must be accessible from the ssh server""",
128 134 )
129 135 location = Unicode(u'', config=True,
130 136 help="""The external IP or domain name of the Controller, used for disambiguating
131 137 engine and client connections.""",
132 138 )
133 139 import_statements = List([], config=True,
134 140 help="import statements to be run at startup. Necessary in some environments"
135 141 )
136 142
137 143 use_threads = Bool(False, config=True,
138 144 help='Use threads instead of processes for the schedulers',
139 145 )
140 146
141 147 # internal
142 148 children = List()
143 149 mq_class = Unicode('zmq.devices.ProcessMonitoredQueue')
144 150
145 151 def _use_threads_changed(self, name, old, new):
146 152 self.mq_class = 'zmq.devices.%sMonitoredQueue'%('Thread' if new else 'Process')
147 153
148 154 aliases = Dict(dict(
149 155 log_level = 'IPControllerApp.log_level',
150 156 log_url = 'IPControllerApp.log_url',
151 157 reuse_files = 'IPControllerApp.reuse_files',
152 158 secure = 'IPControllerApp.secure',
153 159 ssh = 'IPControllerApp.ssh_server',
154 160 use_threads = 'IPControllerApp.use_threads',
155 161 import_statements = 'IPControllerApp.import_statements',
156 162 location = 'IPControllerApp.location',
157 163
158 164 ident = 'Session.session',
159 165 user = 'Session.username',
160 166 exec_key = 'Session.keyfile',
161 167
162 168 url = 'HubFactory.url',
163 169 ip = 'HubFactory.ip',
164 170 transport = 'HubFactory.transport',
165 171 port = 'HubFactory.regport',
166 172
167 173 ping = 'HeartMonitor.period',
168 174
169 175 scheme = 'TaskScheduler.scheme_name',
170 176 hwm = 'TaskScheduler.hwm',
171 177
172 178
173 179 profile = "BaseIPythonApplication.profile",
174 180 profile_dir = 'ProfileDir.location',
175 181
176 182 ))
177 183 flags = Dict(flags)
178 184
179 185
180 186 def save_connection_dict(self, fname, cdict):
181 187 """save a connection dict to json file."""
182 188 c = self.config
183 189 url = cdict['url']
184 190 location = cdict['location']
185 191 if not location:
186 192 try:
187 193 proto,ip,port = split_url(url)
188 194 except AssertionError:
189 195 pass
190 196 else:
191 197 location = socket.gethostbyname_ex(socket.gethostname())[2][-1]
192 198 cdict['location'] = location
193 199 fname = os.path.join(self.profile_dir.security_dir, fname)
194 200 with open(fname, 'w') as f:
195 201 f.write(json.dumps(cdict, indent=2))
196 202 os.chmod(fname, stat.S_IRUSR|stat.S_IWUSR)
197 203
198 204 def load_config_from_json(self):
199 205 """load config from existing json connector files."""
200 206 c = self.config
201 207 # load from engine config
202 208 with open(os.path.join(self.profile_dir.security_dir, 'ipcontroller-engine.json')) as f:
203 209 cfg = json.loads(f.read())
204 210 key = c.Session.key = cfg['exec_key']
205 211 xport,addr = cfg['url'].split('://')
206 212 c.HubFactory.engine_transport = xport
207 213 ip,ports = addr.split(':')
208 214 c.HubFactory.engine_ip = ip
209 215 c.HubFactory.regport = int(ports)
210 216 self.location = cfg['location']
211 217
212 218 # load client config
213 219 with open(os.path.join(self.profile_dir.security_dir, 'ipcontroller-client.json')) as f:
214 220 cfg = json.loads(f.read())
215 221 assert key == cfg['exec_key'], "exec_key mismatch between engine and client keys"
216 222 xport,addr = cfg['url'].split('://')
217 223 c.HubFactory.client_transport = xport
218 224 ip,ports = addr.split(':')
219 225 c.HubFactory.client_ip = ip
220 226 self.ssh_server = cfg['ssh']
221 227 assert int(ports) == c.HubFactory.regport, "regport mismatch"
222 228
223 229 def init_hub(self):
224 230 c = self.config
225 231
226 232 self.do_import_statements()
227 233 reusing = self.reuse_files
228 234 if reusing:
229 235 try:
230 236 self.load_config_from_json()
231 237 except (AssertionError,IOError):
232 238 reusing=False
233 239 # check again, because reusing may have failed:
234 240 if reusing:
235 241 pass
236 242 elif self.secure:
237 243 key = str(uuid.uuid4())
238 244 # keyfile = os.path.join(self.profile_dir.security_dir, self.exec_key)
239 245 # with open(keyfile, 'w') as f:
240 246 # f.write(key)
241 247 # os.chmod(keyfile, stat.S_IRUSR|stat.S_IWUSR)
242 248 c.Session.key = key
243 249 else:
244 250 key = c.Session.key = ''
245 251
246 252 try:
247 253 self.factory = HubFactory(config=c, log=self.log)
248 254 # self.start_logging()
249 255 self.factory.init_hub()
250 256 except:
251 257 self.log.error("Couldn't construct the Controller", exc_info=True)
252 258 self.exit(1)
253 259
254 260 if not reusing:
255 261 # save to new json config files
256 262 f = self.factory
257 263 cdict = {'exec_key' : key,
258 264 'ssh' : self.ssh_server,
259 265 'url' : "%s://%s:%s"%(f.client_transport, f.client_ip, f.regport),
260 266 'location' : self.location
261 267 }
262 268 self.save_connection_dict('ipcontroller-client.json', cdict)
263 269 edict = dict(cdict)  # copy, so the client dict saved above is not mutated
264 270 edict['url'] = "%s://%s:%s" % (f.engine_transport, f.engine_ip, f.regport)
265 271 self.save_connection_dict('ipcontroller-engine.json', edict)
266 272
267 273 #
268 274 def init_schedulers(self):
269 275 children = self.children
270 276 mq = import_item(str(self.mq_class))
271 277
272 278 hub = self.factory
273 279 # maybe_inproc = 'inproc://monitor' if self.use_threads else self.monitor_url
274 280 # IOPub relay (in a Process)
275 281 q = mq(zmq.PUB, zmq.SUB, zmq.PUB, 'N/A','iopub')
276 282 q.bind_in(hub.client_info['iopub'])
277 283 q.bind_out(hub.engine_info['iopub'])
278 284 q.setsockopt_out(zmq.SUBSCRIBE, '')
279 285 q.connect_mon(hub.monitor_url)
280 286 q.daemon=True
281 287 children.append(q)
282 288
283 289 # Multiplexer Queue (in a Process)
284 290 q = mq(zmq.XREP, zmq.XREP, zmq.PUB, 'in', 'out')
285 291 q.bind_in(hub.client_info['mux'])
286 292 q.setsockopt_in(zmq.IDENTITY, 'mux')
287 293 q.bind_out(hub.engine_info['mux'])
288 294 q.connect_mon(hub.monitor_url)
289 295 q.daemon=True
290 296 children.append(q)
291 297
292 298 # Control Queue (in a Process)
293 299 q = mq(zmq.XREP, zmq.XREP, zmq.PUB, 'incontrol', 'outcontrol')
294 300 q.bind_in(hub.client_info['control'])
295 301 q.setsockopt_in(zmq.IDENTITY, 'control')
296 302 q.bind_out(hub.engine_info['control'])
297 303 q.connect_mon(hub.monitor_url)
298 304 q.daemon=True
299 305 children.append(q)
300 306 try:
301 307 scheme = self.config.TaskScheduler.scheme_name
302 308 except AttributeError:
303 309 scheme = TaskScheduler.scheme_name.get_default_value()
304 310 # Task Queue (in a Process)
305 311 if scheme == 'pure':
306 312 self.log.warn("task::using pure XREQ Task scheduler")
307 313 q = mq(zmq.XREP, zmq.XREQ, zmq.PUB, 'intask', 'outtask')
308 314 # q.setsockopt_out(zmq.HWM, hub.hwm)
309 315 q.bind_in(hub.client_info['task'][1])
310 316 q.setsockopt_in(zmq.IDENTITY, 'task')
311 317 q.bind_out(hub.engine_info['task'])
312 318 q.connect_mon(hub.monitor_url)
313 319 q.daemon=True
314 320 children.append(q)
315 321 elif scheme == 'none':
316 322 self.log.warn("task::using no Task scheduler")
317 323
318 324 else:
319 325 self.log.info("task::using Python %s Task scheduler"%scheme)
320 326 sargs = (hub.client_info['task'][1], hub.engine_info['task'],
321 327 hub.monitor_url, hub.client_info['notification'])
322 328 kwargs = dict(logname='scheduler', loglevel=self.log_level,
323 329 log_url = self.log_url, config=dict(self.config))
324 330 q = Process(target=launch_scheduler, args=sargs, kwargs=kwargs)
325 331 q.daemon=True
326 332 children.append(q)
327 333
328 334
329 335 def save_urls(self):
330 336 """save the registration urls to files."""
331 337 c = self.config
332 338
333 339 sec_dir = self.profile_dir.security_dir
334 340 cf = self.factory
335 341
336 342 with open(os.path.join(sec_dir, 'ipcontroller-engine.url'), 'w') as f:
337 343 f.write("%s://%s:%s"%(cf.engine_transport, cf.engine_ip, cf.regport))
338 344
339 345 with open(os.path.join(sec_dir, 'ipcontroller-client.url'), 'w') as f:
340 346 f.write("%s://%s:%s"%(cf.client_transport, cf.client_ip, cf.regport))
341 347
342 348
343 349 def do_import_statements(self):
344 350 statements = self.import_statements
345 351 for s in statements:
346 352 try:
347 353 self.log.info("Executing statement: '%s'" % s)
348 354 exec s in globals(), locals()
349 355 except:
350 356 self.log.error("Error running statement: %s" % s, exc_info=True)
351 357
352 358 def forward_logging(self):
353 359 if self.log_url:
354 360 self.log.info("Forwarding logging to %s"%self.log_url)
355 361 context = zmq.Context.instance()
356 362 lsock = context.socket(zmq.PUB)
357 363 lsock.connect(self.log_url)
358 364 handler = PUBHandler(lsock)
359 365 self.log.removeHandler(self._log_handler)
360 366 handler.root_topic = 'controller'
361 367 handler.setLevel(self.log_level)
362 368 self.log.addHandler(handler)
363 369 self._log_handler = handler
364 370 # #
365 371
366 372 def initialize(self, argv=None):
367 373 super(IPControllerApp, self).initialize(argv)
368 374 self.forward_logging()
369 375 self.init_hub()
370 376 self.init_schedulers()
371 377
372 378 def start(self):
373 379 # Start the subprocesses:
374 380 self.factory.start()
375 381 child_procs = []
376 382 for child in self.children:
377 383 child.start()
378 384 if isinstance(child, ProcessMonitoredQueue):
379 385 child_procs.append(child.launcher)
380 386 elif isinstance(child, Process):
381 387 child_procs.append(child)
382 388 if child_procs:
383 389 signal_children(child_procs)
384 390
385 391 self.write_pid_file(overwrite=True)
386 392
387 393 try:
388 394 self.factory.loop.start()
389 395 except KeyboardInterrupt:
390 396 self.log.critical("Interrupted, Exiting...\n")
391 397
392 398
393 399
394 400 def launch_new_instance():
395 401 """Create and run the IPython controller"""
396 402 app = IPControllerApp.instance()
397 403 app.initialize()
398 404 app.start()
399 405
400 406
401 407 if __name__ == '__main__':
402 408 launch_new_instance()
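For reference, the shape of the connection dict that save_connection_dict() above writes to ipcontroller-client.json; all field values here are illustrative, not real endpoints:

import json

cdict = {
    'exec_key' : 'a1b2c3d4-...',           # HMAC key, only set when secure=True
    'ssh'      : '',                       # optional [user@]server[:port]
    'url'      : 'tcp://127.0.0.1:55321',  # registration endpoint
    'location' : '10.0.0.5',               # external IP or hostname
}
print json.dumps(cdict, indent=2)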
@@ -1,270 +1,276 b''
1 1 #!/usr/bin/env python
2 2 # encoding: utf-8
3 3 """
4 4 The IPython engine application
5
6 Authors:
7
8 * Brian Granger
9 * MinRK
10
5 11 """
6 12
7 13 #-----------------------------------------------------------------------------
8 # Copyright (C) 2008-2009 The IPython Development Team
14 # Copyright (C) 2008-2011 The IPython Development Team
9 15 #
10 16 # Distributed under the terms of the BSD License. The full license is in
11 17 # the file COPYING, distributed as part of this software.
12 18 #-----------------------------------------------------------------------------
13 19
14 20 #-----------------------------------------------------------------------------
15 21 # Imports
16 22 #-----------------------------------------------------------------------------
17 23
18 24 import json
19 25 import os
20 26 import sys
21 27
22 28 import zmq
23 29 from zmq.eventloop import ioloop
24 30
25 31 from IPython.core.newapplication import ProfileDir
26 32 from IPython.parallel.apps.baseapp import BaseParallelApplication
27 33 from IPython.zmq.log import EnginePUBHandler
28 34
29 35 from IPython.config.configurable import Configurable
30 36 from IPython.zmq.session import Session
31 37 from IPython.parallel.engine.engine import EngineFactory
32 38 from IPython.parallel.engine.streamkernel import Kernel
33 39 from IPython.parallel.util import disambiguate_url
34 40
35 41 from IPython.utils.importstring import import_item
36 42 from IPython.utils.traitlets import Bool, Unicode, Dict, List
37 43
38 44
39 45 #-----------------------------------------------------------------------------
40 46 # Module level variables
41 47 #-----------------------------------------------------------------------------
42 48
43 49 #: The default config file name for this application
44 50 default_config_file_name = u'ipengine_config.py'
45 51
46 52 _description = """Start an IPython engine for parallel computing.
47 53
48 54 IPython engines run in parallel and perform computations on behalf of a client
49 55 and controller. A controller needs to be started before the engines. The
50 56 engine can be configured using command line options or using a cluster
51 57 directory. Cluster directories contain config, log and security files and are
52 58 usually located in your ipython directory and named as "cluster_<profile>".
53 59 See the `profile` and `profile_dir` options for details.
54 60 """
55 61
56 62
57 63 #-----------------------------------------------------------------------------
58 64 # MPI configuration
59 65 #-----------------------------------------------------------------------------
60 66
61 67 mpi4py_init = """from mpi4py import MPI as mpi
62 68 mpi.size = mpi.COMM_WORLD.Get_size()
63 69 mpi.rank = mpi.COMM_WORLD.Get_rank()
64 70 """
65 71
66 72
67 73 pytrilinos_init = """from PyTrilinos import Epetra
68 74 class SimpleStruct:
69 75 pass
70 76 mpi = SimpleStruct()
71 77 mpi.rank = 0
72 78 mpi.size = 0
73 79 """
74 80
75 81 class MPI(Configurable):
76 82 """Configurable for MPI initialization"""
77 83 use = Unicode('', config=True,
78 84 help='How to enable MPI (mpi4py, pytrilinos, or empty string to disable).'
79 85 )
80 86
81 87 def _use_changed(self, name, old, new):
82 88 # load default init script if it's not set
83 89 if not self.init_script:
84 90 self.init_script = self.default_inits.get(new, '')
85 91
86 92 init_script = Unicode('', config=True,
87 93 help="Initialization code for MPI")
88 94
89 95 default_inits = Dict({'mpi4py' : mpi4py_init, 'pytrilinos':pytrilinos_init},
90 96 config=True)
91 97
92 98
93 99 #-----------------------------------------------------------------------------
94 100 # Main application
95 101 #-----------------------------------------------------------------------------
96 102
97 103
98 104 class IPEngineApp(BaseParallelApplication):
99 105
100 106 name = Unicode(u'ipengine')
101 107 description = Unicode(_description)
102 108 config_file_name = Unicode(default_config_file_name)
103 109 classes = List([ProfileDir, Session, EngineFactory, Kernel, MPI])
104 110
105 111 startup_script = Unicode(u'', config=True,
106 112 help='specify a script to be run at startup')
107 113 startup_command = Unicode('', config=True,
108 114 help='specify a command to be run at startup')
109 115
110 116 url_file = Unicode(u'', config=True,
111 117 help="""The full location of the file containing the connection information for
112 118 the controller. If this is not given, the file must be in the
113 119 security directory of the cluster directory. This location is
114 120 resolved using the `profile` or `profile_dir` options.""",
115 121 )
116 122
117 123 url_file_name = Unicode(u'ipcontroller-engine.json')
118 124 log_url = Unicode('', config=True,
119 125 help="""The URL for the iploggerapp instance, for forwarding
120 126 logging to a central location.""")
121 127
122 128 aliases = Dict(dict(
123 129 file = 'IPEngineApp.url_file',
124 130 c = 'IPEngineApp.startup_command',
125 131 s = 'IPEngineApp.startup_script',
126 132
127 133 ident = 'Session.session',
128 134 user = 'Session.username',
129 135 exec_key = 'Session.keyfile',
130 136
131 137 url = 'EngineFactory.url',
132 138 ip = 'EngineFactory.ip',
133 139 transport = 'EngineFactory.transport',
134 140 port = 'EngineFactory.regport',
135 141 location = 'EngineFactory.location',
136 142
137 143 timeout = 'EngineFactory.timeout',
138 144
139 145 profile = "IPEngineApp.profile",
140 146 profile_dir = 'ProfileDir.location',
141 147
142 148 mpi = 'MPI.use',
143 149
144 150 log_level = 'IPEngineApp.log_level',
145 151 log_url = 'IPEngineApp.log_url'
146 152 ))
147 153
148 154 # def find_key_file(self):
149 155 # """Set the key file.
150 156 #
151 157 # Here we don't try to actually see if it exists or is valid as that
152 158 # is handled by the connection logic.
153 159 # """
154 160 # config = self.master_config
155 161 # # Find the actual controller key file
156 162 # if not config.Global.key_file:
157 163 # try_this = os.path.join(
158 164 # config.Global.profile_dir,
159 165 # config.Global.security_dir,
160 166 # config.Global.key_file_name
161 167 # )
162 168 # config.Global.key_file = try_this
163 169
164 170 def find_url_file(self):
165 171 """Set the key file.
166 172
167 173 Here we don't try to actually see if it exists for is valid as that
168 174 is hadled by the connection logic.
169 175 """
170 176 config = self.config
171 177 # Find the actual controller key file
172 178 if not self.url_file:
173 179 self.url_file = os.path.join(
174 180 self.profile_dir.security_dir,
175 181 self.url_file_name
176 182 )
177 183 def init_engine(self):
178 184 # This is the working dir by now.
179 185 sys.path.insert(0, '')
180 186 config = self.config
181 187 # print config
182 188 self.find_url_file()
183 189
184 190 # if os.path.exists(config.Global.key_file) and config.Global.secure:
185 191 # config.SessionFactory.exec_key = config.Global.key_file
186 192 if os.path.exists(self.url_file):
187 193 with open(self.url_file) as f:
188 194 d = json.loads(f.read())
189 195 for k,v in d.iteritems():
190 196 if isinstance(v, unicode):
191 197 d[k] = v.encode()
192 198 if d['exec_key']:
193 199 config.Session.key = d['exec_key']
194 200 d['url'] = disambiguate_url(d['url'], d['location'])
195 201 config.EngineFactory.url = d['url']
196 202 config.EngineFactory.location = d['location']
197 203
198 204 try:
199 205 exec_lines = config.Kernel.exec_lines
200 206 except AttributeError:
201 207 config.Kernel.exec_lines = []
202 208 exec_lines = config.Kernel.exec_lines
203 209
204 210 if self.startup_script:
205 211 enc = sys.getfilesystemencoding() or 'utf8'
206 212 cmd="execfile(%r)"%self.startup_script.encode(enc)
207 213 exec_lines.append(cmd)
208 214 if self.startup_command:
209 215 exec_lines.append(self.startup_command)
210 216
211 217 # Create the underlying shell class and Engine
212 218 # shell_class = import_item(self.master_config.Global.shell_class)
213 219 # print self.config
214 220 try:
215 221 self.engine = EngineFactory(config=config, log=self.log)
216 222 except:
217 223 self.log.error("Couldn't start the Engine", exc_info=True)
218 224 self.exit(1)
219 225
220 226 def forward_logging(self):
221 227 if self.log_url:
222 228 self.log.info("Forwarding logging to %s"%self.log_url)
223 229 context = self.engine.context
224 230 lsock = context.socket(zmq.PUB)
225 231 lsock.connect(self.log_url)
226 232 self.log.removeHandler(self._log_handler)
227 233 handler = EnginePUBHandler(self.engine, lsock)
228 234 handler.setLevel(self.log_level)
229 235 self.log.addHandler(handler)
230 236 self._log_handler = handler
231 237 #
232 238 def init_mpi(self):
233 239 global mpi
234 240 self.mpi = MPI(config=self.config)
235 241
236 242 mpi_import_statement = self.mpi.init_script
237 243 if mpi_import_statement:
238 244 try:
239 245 self.log.info("Initializing MPI:")
240 246 self.log.info(mpi_import_statement)
241 247 exec mpi_import_statement in globals()
242 248 except:
243 249 mpi = None
244 250 else:
245 251 mpi = None
246 252
247 253 def initialize(self, argv=None):
248 254 super(IPEngineApp, self).initialize(argv)
249 255 self.init_mpi()
250 256 self.init_engine()
251 257 self.forward_logging()
252 258
253 259 def start(self):
254 260 self.engine.start()
255 261 try:
256 262 self.engine.loop.start()
257 263 except KeyboardInterrupt:
258 264 self.log.critical("Engine Interrupted, shutting down...\n")
259 265
260 266
261 267 def launch_new_instance():
262 268 """Create and run the IPython engine"""
263 269 app = IPEngineApp.instance()
264 270 app.initialize()
265 271 app.start()
266 272
267 273
268 274 if __name__ == '__main__':
269 275 launch_new_instance()
270 276
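A sketch of enabling MPI for the engine via the MPI configurable above, as it might appear in an ipengine_config.py:

c = get_config()
c.MPI.use = 'mpi4py'   # runs the mpi4py_init snippet at engine startup
# or supply custom initialization code instead:
# c.MPI.init_script = "from mpi4py import MPI as mpi"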
@@ -1,96 +1,101 b''
1 1 #!/usr/bin/env python
2 2 # encoding: utf-8
3 3 """
4 4 A simple IPython logger application
5
6 Authors:
7
8 * MinRK
9
5 10 """
6 11
7 12 #-----------------------------------------------------------------------------
8 13 # Copyright (C) 2011 The IPython Development Team
9 14 #
10 15 # Distributed under the terms of the BSD License. The full license is in
11 16 # the file COPYING, distributed as part of this software.
12 17 #-----------------------------------------------------------------------------
13 18
14 19 #-----------------------------------------------------------------------------
15 20 # Imports
16 21 #-----------------------------------------------------------------------------
17 22
18 23 import os
19 24 import sys
20 25
21 26 import zmq
22 27
23 28 from IPython.core.newapplication import ProfileDir
24 29 from IPython.utils.traitlets import Bool, Dict, Unicode
25 30
26 31 from IPython.parallel.apps.baseapp import (
27 32 BaseParallelApplication,
28 33 base_aliases
29 34 )
30 35 from IPython.parallel.apps.logwatcher import LogWatcher
31 36
32 37 #-----------------------------------------------------------------------------
33 38 # Module level variables
34 39 #-----------------------------------------------------------------------------
35 40
36 41 #: The default config file name for this application
37 42 default_config_file_name = u'iplogger_config.py'
38 43
39 44 _description = """Start an IPython logger for parallel computing.
40 45
41 46 IPython controllers and engines (and your own processes) can broadcast log messages
42 47 by registering a `zmq.log.handlers.PUBHandler` with the `logging` module. The
43 48 logger can be configured using command line options or using a cluster
44 49 directory. Cluster directories contain config, log and security files and are
45 50 usually located in your ipython directory and named as "cluster_<profile>".
46 51 See the `profile` and `profile_dir` options for details.
47 52 """
48 53
49 54
50 55 #-----------------------------------------------------------------------------
51 56 # Main application
52 57 #-----------------------------------------------------------------------------
53 58 aliases = {}
54 59 aliases.update(base_aliases)
55 60 aliases.update(dict(url='LogWatcher.url', topics='LogWatcher.topics'))
56 61
57 62 class IPLoggerApp(BaseParallelApplication):
58 63
59 64 name = u'iplogger'
60 65 description = _description
61 66 config_file_name = Unicode(default_config_file_name)
62 67
63 68 classes = [LogWatcher, ProfileDir]
64 69 aliases = Dict(aliases)
65 70
66 71 def initialize(self, argv=None):
67 72 super(IPLoggerApp, self).initialize(argv)
68 73 self.init_watcher()
69 74
70 75 def init_watcher(self):
71 76 try:
72 77 self.watcher = LogWatcher(config=self.config, log=self.log)
73 78 except:
74 79 self.log.error("Couldn't start the LogWatcher", exc_info=True)
75 80 self.exit(1)
76 81 self.log.info("Listening for log messages on %r"%self.watcher.url)
77 82
78 83
79 84 def start(self):
80 85 self.watcher.start()
81 86 try:
82 87 self.watcher.loop.start()
83 88 except KeyboardInterrupt:
84 89 self.log.critical("Logging Interrupted, shutting down...\n")
85 90
86 91
87 92 def launch_new_instance():
88 93 """Create and run the IPython LogWatcher"""
89 94 app = IPLoggerApp.instance()
90 95 app.initialize()
91 96 app.start()
92 97
93 98
94 99 if __name__ == '__main__':
95 100 launch_new_instance()
96 101
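# ---------------------------------------------------------------------------
# Editor's sketch (not part of the diff above): broadcasting log records that
# this IPLoggerApp will pick up, via the `zmq.log.handlers.PUBHandler`
# registration the module description mentions. The url must match
# LogWatcher.url (default shown).
# ---------------------------------------------------------------------------
import logging

import zmq
from zmq.log.handlers import PUBHandler

ctx = zmq.Context.instance()
pub = ctx.socket(zmq.PUB)
pub.connect('tcp://127.0.0.1:20202')   # default LogWatcher.url

root = logging.getLogger()
root.setLevel(logging.INFO)
root.addHandler(PUBHandler(pub))

root.info("this record is published and logged by iplogger")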
@@ -1,1069 +1,1074 b''
1 1 #!/usr/bin/env python
2 2 # encoding: utf-8
3 3 """
4 4 Facilities for launching IPython processes asynchronously.
5
6 Authors:
7
8 * Brian Granger
9 * MinRK
5 10 """
6 11
7 12 #-----------------------------------------------------------------------------
8 # Copyright (C) 2008-2009 The IPython Development Team
13 # Copyright (C) 2008-2011 The IPython Development Team
9 14 #
10 15 # Distributed under the terms of the BSD License. The full license is in
11 16 # the file COPYING, distributed as part of this software.
12 17 #-----------------------------------------------------------------------------
13 18
14 19 #-----------------------------------------------------------------------------
15 20 # Imports
16 21 #-----------------------------------------------------------------------------
17 22
18 23 import copy
19 24 import logging
20 25 import os
21 26 import re
22 27 import stat
23 28
24 29 # signal imports, handling various platforms, versions
25 30
26 31 from signal import SIGINT, SIGTERM
27 32 try:
28 33 from signal import SIGKILL
29 34 except ImportError:
30 35 # Windows
31 36 SIGKILL=SIGTERM
32 37
33 38 try:
34 39 # Windows >= 2.7, 3.2
35 40 from signal import CTRL_C_EVENT as SIGINT
36 41 except ImportError:
37 42 pass
38 43
39 44 from subprocess import Popen, PIPE, STDOUT
40 45 try:
41 46 from subprocess import check_output
42 47 except ImportError:
43 48 # pre-2.7, define check_output with Popen
44 49 def check_output(*args, **kwargs):
45 50 kwargs.update(dict(stdout=PIPE))
46 51 p = Popen(*args, **kwargs)
47 52 out,err = p.communicate()
48 53 return out
49 54
50 55 from zmq.eventloop import ioloop
51 56
52 57 from IPython.config.application import Application
53 58 from IPython.config.configurable import LoggingConfigurable
54 59 from IPython.utils.text import EvalFormatter
55 60 from IPython.utils.traitlets import Any, Int, List, Unicode, Dict, Instance
56 61 from IPython.utils.path import get_ipython_module_path
57 62 from IPython.utils.process import find_cmd, pycmd2argv, FindCmdError
58 63
59 64 from .win32support import forward_read_events
60 65
61 66 from .winhpcjob import IPControllerTask, IPEngineTask, IPControllerJob, IPEngineSetJob
62 67
63 68 WINDOWS = os.name == 'nt'
64 69
65 70 #-----------------------------------------------------------------------------
66 71 # Paths to the kernel apps
67 72 #-----------------------------------------------------------------------------
68 73
69 74
70 75 ipcluster_cmd_argv = pycmd2argv(get_ipython_module_path(
71 76 'IPython.parallel.apps.ipclusterapp'
72 77 ))
73 78
74 79 ipengine_cmd_argv = pycmd2argv(get_ipython_module_path(
75 80 'IPython.parallel.apps.ipengineapp'
76 81 ))
77 82
78 83 ipcontroller_cmd_argv = pycmd2argv(get_ipython_module_path(
79 84 'IPython.parallel.apps.ipcontrollerapp'
80 85 ))
81 86
82 87 #-----------------------------------------------------------------------------
83 88 # Base launchers and errors
84 89 #-----------------------------------------------------------------------------
85 90
86 91
87 92 class LauncherError(Exception):
88 93 pass
89 94
90 95
91 96 class ProcessStateError(LauncherError):
92 97 pass
93 98
94 99
95 100 class UnknownStatus(LauncherError):
96 101 pass
97 102
98 103
99 104 class BaseLauncher(LoggingConfigurable):
100 105 """An abstraction for starting, stopping and signaling a process."""
101 106
102 107 # In all of the launchers, the work_dir is where child processes will be
103 108 # run. This will usually be the profile_dir, but may not be. any work_dir
104 109 # passed into the __init__ method will override the config value.
105 110 # This should not be used to set the work_dir for the actual engine
106 111 # and controller. Instead, use their own config files or the
107 112 # controller_args, engine_args attributes of the launchers to add
108 113 # the work_dir option.
109 114 work_dir = Unicode(u'.')
110 115 loop = Instance('zmq.eventloop.ioloop.IOLoop')
111 116
112 117 start_data = Any()
113 118 stop_data = Any()
114 119
115 120 def _loop_default(self):
116 121 return ioloop.IOLoop.instance()
117 122
118 123 def __init__(self, work_dir=u'.', config=None, **kwargs):
119 124 super(BaseLauncher, self).__init__(work_dir=work_dir, config=config, **kwargs)
120 125 self.state = 'before' # can be before, running, after
121 126 self.stop_callbacks = []
122 127 self.start_data = None
123 128 self.stop_data = None
124 129
125 130 @property
126 131 def args(self):
127 132 """A list of cmd and args that will be used to start the process.
128 133
129 134 This is what is passed to :func:`spawnProcess` and the first element
130 135 will be the process name.
131 136 """
132 137 return self.find_args()
133 138
134 139 def find_args(self):
135 140 """The ``.args`` property calls this to find the args list.
136 141
137 142 Subclasses should implement this to construct the cmd and args.
138 143 """
139 144 raise NotImplementedError('find_args must be implemented in a subclass')
140 145
141 146 @property
142 147 def arg_str(self):
143 148 """The string form of the program arguments."""
144 149 return ' '.join(self.args)
145 150
146 151 @property
147 152 def running(self):
148 153 """Am I running."""
149 154 if self.state == 'running':
150 155 return True
151 156 else:
152 157 return False
153 158
154 159 def start(self):
155 160 """Start the process.
156 161
157 162 This must return a deferred that fires with information about the
158 163 process starting (like a pid, job id, etc.).
159 164 """
160 165 raise NotImplementedError('start must be implemented in a subclass')
161 166
162 167 def stop(self):
163 168 """Stop the process and notify observers of stopping.
164 169
165 170 This must return a deferred that fires with information about the
166 171 process stopping, like errors that occur while the process is
167 172 attempting to be shut down. This deferred won't fire when the process
168 173 actually stops. To observe the actual process stopping, see
169 174 :func:`on_stop`.
170 175 """
171 176 raise NotImplementedError('stop must be implemented in a subclass')
172 177
173 178 def on_stop(self, f):
174 179 """Get a deferred that will fire when the process stops.
175 180
176 181 The deferred will fire with data that contains information about
177 182 the exit status of the process.
178 183 """
179 184 if self.state=='after':
180 185 return f(self.stop_data)
181 186 else:
182 187 self.stop_callbacks.append(f)
183 188
184 189 def notify_start(self, data):
185 190 """Call this to trigger startup actions.
186 191
187 192 This logs the process startup and sets the state to 'running'. It is
188 193 a pass-through so it can be used as a callback.
189 194 """
190 195
191 196 self.log.info('Process %r started: %r' % (self.args[0], data))
192 197 self.start_data = data
193 198 self.state = 'running'
194 199 return data
195 200
196 201 def notify_stop(self, data):
197 202 """Call this to trigger process stop actions.
198 203
199 204 This logs the process stopping and sets the state to 'after'. Call
200 205 this to trigger all the deferreds from :func:`on_stop`."""
201 206
202 207 self.log.info('Process %r stopped: %r' % (self.args[0], data))
203 208 self.stop_data = data
204 209 self.state = 'after'
205 210 for i in range(len(self.stop_callbacks)):
206 211 d = self.stop_callbacks.pop()
207 212 d(data)
208 213 return data
209 214
210 215 def signal(self, sig):
211 216 """Signal the process.
212 217
213 218 Return a semi-meaningless deferred after signaling the process.
214 219
215 220 Parameters
216 221 ----------
217 222 sig : str or int
218 223 'KILL', 'INT', etc., or any signal number
219 224 """
220 225 raise NotImplementedError('signal must be implemented in a subclass')
221 226
222 227
223 228 #-----------------------------------------------------------------------------
224 229 # Local process launchers
225 230 #-----------------------------------------------------------------------------
226 231
227 232
228 233 class LocalProcessLauncher(BaseLauncher):
229 234 """Start and stop an external process in an asynchronous manner.
230 235
231 236 This will launch the external process with a working directory of
232 237 ``self.work_dir``.
233 238 """
234 239
235 240 # This is used to construct self.args, which is passed to
236 241 # spawnProcess.
237 242 cmd_and_args = List([])
238 243 poll_frequency = Int(100) # in ms
239 244
240 245 def __init__(self, work_dir=u'.', config=None, **kwargs):
241 246 super(LocalProcessLauncher, self).__init__(
242 247 work_dir=work_dir, config=config, **kwargs
243 248 )
244 249 self.process = None
245 250 self.start_deferred = None
246 251 self.poller = None
247 252
248 253 def find_args(self):
249 254 return self.cmd_and_args
250 255
251 256 def start(self):
252 257 if self.state == 'before':
253 258 self.process = Popen(self.args,
254 259 stdout=PIPE,stderr=PIPE,stdin=PIPE,
255 260 env=os.environ,
256 261 cwd=self.work_dir
257 262 )
258 263 if WINDOWS:
259 264 self.stdout = forward_read_events(self.process.stdout)
260 265 self.stderr = forward_read_events(self.process.stderr)
261 266 else:
262 267 self.stdout = self.process.stdout.fileno()
263 268 self.stderr = self.process.stderr.fileno()
264 269 self.loop.add_handler(self.stdout, self.handle_stdout, self.loop.READ)
265 270 self.loop.add_handler(self.stderr, self.handle_stderr, self.loop.READ)
266 271 self.poller = ioloop.PeriodicCallback(self.poll, self.poll_frequency, self.loop)
267 272 self.poller.start()
268 273 self.notify_start(self.process.pid)
269 274 else:
270 275 s = 'The process was already started and has state: %r' % self.state
271 276 raise ProcessStateError(s)
272 277
273 278 def stop(self):
274 279 return self.interrupt_then_kill()
275 280
276 281 def signal(self, sig):
277 282 if self.state == 'running':
278 283 if WINDOWS and sig != SIGINT:
279 284 # use Windows tree-kill for better child cleanup
280 285 check_output(['taskkill', '-pid', str(self.process.pid), '-t', '-f'])
281 286 else:
282 287 self.process.send_signal(sig)
283 288
284 289 def interrupt_then_kill(self, delay=2.0):
285 290 """Send INT, wait a delay and then send KILL."""
286 291 try:
287 292 self.signal(SIGINT)
288 293 except Exception:
289 294 self.log.debug("interrupt failed")
290 295 pass
291 296 self.killer = ioloop.DelayedCallback(lambda : self.signal(SIGKILL), delay*1000, self.loop)
292 297 self.killer.start()
293 298
294 299 # callbacks, etc:
295 300
296 301 def handle_stdout(self, fd, events):
297 302 if WINDOWS:
298 303 line = self.stdout.recv()
299 304 else:
300 305 line = self.process.stdout.readline()
301 306 # a stopped process will be readable but return empty strings
302 307 if line:
303 308 self.log.info(line[:-1])
304 309 else:
305 310 self.poll()
306 311
307 312 def handle_stderr(self, fd, events):
308 313 if WINDOWS:
309 314 line = self.stderr.recv()
310 315 else:
311 316 line = self.process.stderr.readline()
312 317 # a stopped process will be readable but return empty strings
313 318 if line:
314 319 self.log.error(line[:-1])
315 320 else:
316 321 self.poll()
317 322
318 323 def poll(self):
319 324 status = self.process.poll()
320 325 if status is not None:
321 326 self.poller.stop()
322 327 self.loop.remove_handler(self.stdout)
323 328 self.loop.remove_handler(self.stderr)
324 329 self.notify_stop(dict(exit_code=status, pid=self.process.pid))
325 330 return status
326 331
327 332 class LocalControllerLauncher(LocalProcessLauncher):
328 333 """Launch a controller as a regular external process."""
329 334
330 335 controller_cmd = List(ipcontroller_cmd_argv, config=True,
331 336 help="""Popen command to launch ipcontroller.""")
332 337 # Command line arguments to ipcontroller.
333 338 controller_args = List(['--log-to-file','log_level=%i'%logging.INFO], config=True,
334 339 help="""command-line args to pass to ipcontroller""")
335 340
336 341 def find_args(self):
337 342 return self.controller_cmd + self.controller_args
338 343
339 344 def start(self, profile_dir):
340 345 """Start the controller by profile_dir."""
341 346 self.controller_args.extend(['profile_dir=%s'%profile_dir])
342 347 self.profile_dir = unicode(profile_dir)
343 348 self.log.info("Starting LocalControllerLauncher: %r" % self.args)
344 349 return super(LocalControllerLauncher, self).start()
345 350
346 351
347 352 class LocalEngineLauncher(LocalProcessLauncher):
348 353 """Launch a single engine as a regular external process."""
349 354
350 355 engine_cmd = List(ipengine_cmd_argv, config=True,
351 356 help="""command to launch the Engine.""")
352 357 # Command line arguments for ipengine.
353 358 engine_args = List(['--log-to-file','log_level=%i'%logging.INFO], config=True,
354 359 help="command-line arguments to pass to ipengine"
355 360 )
356 361
357 362 def find_args(self):
358 363 return self.engine_cmd + self.engine_args
359 364
360 365 def start(self, profile_dir):
361 366 """Start the engine by profile_dir."""
362 367 self.engine_args.extend(['profile_dir=%s'%profile_dir])
363 368 self.profile_dir = unicode(profile_dir)
364 369 return super(LocalEngineLauncher, self).start()
365 370
366 371
367 372 class LocalEngineSetLauncher(BaseLauncher):
368 373 """Launch a set of engines as regular external processes."""
369 374
370 375 # Command line arguments for ipengine.
371 376 engine_args = List(
372 377 ['--log-to-file','log_level=%i'%logging.INFO], config=True,
373 378 help="command-line arguments to pass to ipengine"
374 379 )
375 380 # launcher class
376 381 launcher_class = LocalEngineLauncher
377 382
378 383 launchers = Dict()
379 384 stop_data = Dict()
380 385
381 386 def __init__(self, work_dir=u'.', config=None, **kwargs):
382 387 super(LocalEngineSetLauncher, self).__init__(
383 388 work_dir=work_dir, config=config, **kwargs
384 389 )
385 390 self.stop_data = {}
386 391
387 392 def start(self, n, profile_dir):
388 393 """Start n engines by profile or profile_dir."""
389 394 self.profile_dir = unicode(profile_dir)
390 395 dlist = []
391 396 for i in range(n):
392 397 el = self.launcher_class(work_dir=self.work_dir, config=self.config, log=self.log)
393 398 # Copy the engine args over to each engine launcher.
394 399 el.engine_args = copy.deepcopy(self.engine_args)
395 400 el.on_stop(self._notice_engine_stopped)
396 401 d = el.start(profile_dir)
397 402 if i==0:
398 403 self.log.info("Starting LocalEngineSetLauncher: %r" % el.args)
399 404 self.launchers[i] = el
400 405 dlist.append(d)
401 406 self.notify_start(dlist)
402 407 # The consumeErrors here could be dangerous
403 408 # dfinal = gatherBoth(dlist, consumeErrors=True)
404 409 # dfinal.addCallback(self.notify_start)
405 410 return dlist
406 411
407 412 def find_args(self):
408 413 return ['engine set']
409 414
410 415 def signal(self, sig):
411 416 dlist = []
412 417 for el in self.launchers.itervalues():
413 418 d = el.signal(sig)
414 419 dlist.append(d)
415 420 # dfinal = gatherBoth(dlist, consumeErrors=True)
416 421 return dlist
417 422
418 423 def interrupt_then_kill(self, delay=1.0):
419 424 dlist = []
420 425 for el in self.launchers.itervalues():
421 426 d = el.interrupt_then_kill(delay)
422 427 dlist.append(d)
423 428 # dfinal = gatherBoth(dlist, consumeErrors=True)
424 429 return dlist
425 430
426 431 def stop(self):
427 432 return self.interrupt_then_kill()
428 433
429 434 def _notice_engine_stopped(self, data):
430 435 pid = data['pid']
431 436 for idx,el in self.launchers.iteritems():
432 437 if el.process.pid == pid:
433 438 break
434 439 self.launchers.pop(idx)
435 440 self.stop_data[idx] = data
436 441 if not self.launchers:
437 442 self.notify_stop(self.stop_data)
438 443
439 444
440 445 #-----------------------------------------------------------------------------
441 446 # MPIExec launchers
442 447 #-----------------------------------------------------------------------------
443 448
444 449
445 450 class MPIExecLauncher(LocalProcessLauncher):
446 451 """Launch an external process using mpiexec."""
447 452
448 453 mpi_cmd = List(['mpiexec'], config=True,
449 454 help="The mpiexec command to use in starting the process."
450 455 )
451 456 mpi_args = List([], config=True,
452 457 help="The command line arguments to pass to mpiexec."
453 458 )
454 459 program = List(['date'], config=True,
455 460 help="The program to start via mpiexec.")
456 461 program_args = List([], config=True,
457 462 help="The command line argument to the program."
458 463 )
459 464 n = Int(1)
460 465
461 466 def find_args(self):
462 467 """Build self.args using all the fields."""
463 468 return self.mpi_cmd + ['-n', str(self.n)] + self.mpi_args + \
464 469 self.program + self.program_args
465 470
466 471 def start(self, n):
467 472 """Start n instances of the program using mpiexec."""
468 473 self.n = n
469 474 return super(MPIExecLauncher, self).start()
470 475
471 476
472 477 class MPIExecControllerLauncher(MPIExecLauncher):
473 478 """Launch a controller using mpiexec."""
474 479
475 480 controller_cmd = List(ipcontroller_cmd_argv, config=True,
476 481 help="Popen command to launch the Controller"
477 482 )
478 483 controller_args = List(['--log-to-file','log_level=%i'%logging.INFO], config=True,
479 484 help="Command line arguments to pass to ipcontroller."
480 485 )
481 486 n = Int(1)
482 487
483 488 def start(self, profile_dir):
484 489 """Start the controller by profile_dir."""
485 490 self.controller_args.extend(['profile_dir=%s'%profile_dir])
486 491 self.profile_dir = unicode(profile_dir)
487 492 self.log.info("Starting MPIExecControllerLauncher: %r" % self.args)
488 493 return super(MPIExecControllerLauncher, self).start(1)
489 494
490 495 def find_args(self):
491 496 return self.mpi_cmd + ['-n', self.n] + self.mpi_args + \
492 497 self.controller_cmd + self.controller_args
493 498
494 499
495 500 class MPIExecEngineSetLauncher(MPIExecLauncher):
496 501
497 502 program = List(ipengine_cmd_argv, config=True,
498 503 help="Popen command for ipengine"
499 504 )
500 505 program_args = List(
501 506 ['--log-to-file','log_level=%i'%logging.INFO], config=True,
502 507 help="Command line arguments for ipengine."
503 508 )
504 509 n = Int(1)
505 510
506 511 def start(self, n, profile_dir):
507 512 """Start n engines by profile or profile_dir."""
508 513 self.program_args.extend(['profile_dir=%s'%profile_dir])
509 514 self.profile_dir = unicode(profile_dir)
510 515 self.n = n
511 516 self.log.info('Starting MPIExecEngineSetLauncher: %r' % self.args)
512 517 return super(MPIExecEngineSetLauncher, self).start(n)
513 518
514 519 #-----------------------------------------------------------------------------
515 520 # SSH launchers
516 521 #-----------------------------------------------------------------------------
517 522
518 523 # TODO: Get SSH Launcher working again.
519 524
520 525 class SSHLauncher(LocalProcessLauncher):
521 526 """A minimal launcher for ssh.
522 527
523 528 To be useful this will probably have to be extended to use the ``sshx``
524 529 idea for environment variables. There could be other things this needs
525 530 as well.
526 531 """
527 532
528 533 ssh_cmd = List(['ssh'], config=True,
529 534 help="command for starting ssh")
530 535 ssh_args = List(['-tt'], config=True,
531 536 help="args to pass to ssh")
532 537 program = List(['date'], config=True,
533 538 help="Program to launch via ssh")
534 539 program_args = List([], config=True,
535 540 help="args to pass to remote program")
536 541 hostname = Unicode('', config=True,
537 542 help="hostname on which to launch the program")
538 543 user = Unicode('', config=True,
539 544 help="username for ssh")
540 545 location = Unicode('', config=True,
541 546 help="user@hostname location for ssh in one setting")
542 547
543 548 def _hostname_changed(self, name, old, new):
544 549 if self.user:
545 550 self.location = u'%s@%s' % (self.user, new)
546 551 else:
547 552 self.location = new
548 553
549 554 def _user_changed(self, name, old, new):
550 555 self.location = u'%s@%s' % (new, self.hostname)
551 556
552 557 def find_args(self):
553 558 return self.ssh_cmd + self.ssh_args + [self.location] + \
554 559 self.program + self.program_args
555 560
556 561 def start(self, profile_dir, hostname=None, user=None):
557 562 self.profile_dir = unicode(profile_dir)
558 563 if hostname is not None:
559 564 self.hostname = hostname
560 565 if user is not None:
561 566 self.user = user
562 567
563 568 return super(SSHLauncher, self).start()
564 569
565 570 def signal(self, sig):
566 571 if self.state == 'running':
567 572 # send escaped ssh connection-closer
568 573 self.process.stdin.write('~.')
569 574 self.process.stdin.flush()
570 575
571 576
572 577
573 578 class SSHControllerLauncher(SSHLauncher):
574 579
575 580 program = List(ipcontroller_cmd_argv, config=True,
576 581 help="remote ipcontroller command.")
577 582 program_args = List(['--reuse-files', '--log-to-file','log_level=%i'%logging.INFO], config=True,
578 583 help="Command line arguments to ipcontroller.")
579 584
580 585
581 586 class SSHEngineLauncher(SSHLauncher):
582 587 program = List(ipengine_cmd_argv, config=True,
583 588 help="remote ipengine command.")
584 589 # Command line arguments for ipengine.
585 590 program_args = List(
586 591 ['--log-to-file','log_level=%i'%logging.INFO], config=True,
587 592 help="Command line arguments to ipengine."
588 593 )
589 594
590 595 class SSHEngineSetLauncher(LocalEngineSetLauncher):
591 596 launcher_class = SSHEngineLauncher
592 597 engines = Dict(config=True,
593 598 help="""dict of engines to launch. This is a dict by hostname of ints,
594 599 corresponding to the number of engines to start on that host.""")
595 600
596 601 def start(self, n, profile_dir):
597 602 """Start engines by profile or profile_dir.
598 603 `n` is ignored, and the `engines` config property is used instead.
599 604 """
600 605
601 606 self.profile_dir = unicode(profile_dir)
602 607 dlist = []
603 608 for host, n in self.engines.iteritems():
604 609 if isinstance(n, (tuple, list)):
605 610 n, args = n
606 611 else:
607 612 args = copy.deepcopy(self.engine_args)
608 613
609 614 if '@' in host:
610 615 user,host = host.split('@',1)
611 616 else:
612 617 user=None
613 618 for i in range(n):
614 619 el = self.launcher_class(work_dir=self.work_dir, config=self.config, log=self.log)
615 620
616 621 # Copy the engine args over to each engine launcher.
618 623 el.program_args = args
619 624 el.on_stop(self._notice_engine_stopped)
620 625 d = el.start(profile_dir, user=user, hostname=host)
621 626 if i==0:
622 627 self.log.info("Starting SSHEngineSetLauncher: %r" % el.args)
623 628 self.launchers[host+str(i)] = el
624 629 dlist.append(d)
625 630 self.notify_start(dlist)
626 631 return dlist
627 632
628 633
629 634
630 635 #-----------------------------------------------------------------------------
631 636 # Windows HPC Server 2008 scheduler launchers
632 637 #-----------------------------------------------------------------------------
633 638
634 639
635 640 # This is only used on Windows.
636 641 def find_job_cmd():
637 642 if WINDOWS:
638 643 try:
639 644 return find_cmd('job')
640 645 except (FindCmdError, ImportError):
641 646 # ImportError will be raised if win32api is not installed
642 647 return 'job'
643 648 else:
644 649 return 'job'
645 650
646 651
647 652 class WindowsHPCLauncher(BaseLauncher):
648 653
649 654 job_id_regexp = Unicode(r'\d+', config=True,
650 655 help="""A regular expression used to get the job id from the output of the
651 656 submit_command. """
652 657 )
653 658 job_file_name = Unicode(u'ipython_job.xml', config=True,
654 659 help="The filename of the instantiated job script.")
655 660 # The full path to the instantiated job script. This gets made dynamically
656 661 # by combining the work_dir with the job_file_name.
657 662 job_file = Unicode(u'')
658 663 scheduler = Unicode('', config=True,
659 664 help="The hostname of the scheduler to submit the job to.")
660 665 job_cmd = Unicode(find_job_cmd(), config=True,
661 666 help="The command for submitting jobs.")
662 667
663 668 def __init__(self, work_dir=u'.', config=None, **kwargs):
664 669 super(WindowsHPCLauncher, self).__init__(
665 670 work_dir=work_dir, config=config, **kwargs
666 671 )
667 672
668 673 @property
669 674 def job_file(self):
670 675 return os.path.join(self.work_dir, self.job_file_name)
671 676
672 677 def write_job_file(self, n):
673 678 raise NotImplementedError("Implement write_job_file in a subclass.")
674 679
675 680 def find_args(self):
676 681 return [u'job.exe']
677 682
678 683 def parse_job_id(self, output):
679 684 """Take the output of the submit command and return the job id."""
680 685 m = re.search(self.job_id_regexp, output)
681 686 if m is not None:
682 687 job_id = m.group()
683 688 else:
684 689 raise LauncherError("Job id couldn't be determined: %s" % output)
685 690 self.job_id = job_id
686 691 self.log.info('Job started with job id: %r' % job_id)
687 692 return job_id
688 693
689 694 def start(self, n):
690 695 """Start n copies of the process using the Win HPC job scheduler."""
691 696 self.write_job_file(n)
692 697 args = [
693 698 'submit',
694 699 '/jobfile:%s' % self.job_file,
695 700 '/scheduler:%s' % self.scheduler
696 701 ]
697 702 self.log.info("Starting Win HPC Job: %s" % (self.job_cmd + ' ' + ' '.join(args),))
698 703 # Twisted will raise DeprecationWarnings if we try to pass unicode to this
699 704 output = check_output([self.job_cmd]+args,
700 705 env=os.environ,
701 706 cwd=self.work_dir,
702 707 stderr=STDOUT
703 708 )
704 709 job_id = self.parse_job_id(output)
705 710 self.notify_start(job_id)
706 711 return job_id
707 712
708 713 def stop(self):
709 714 args = [
710 715 'cancel',
711 716 self.job_id,
712 717 '/scheduler:%s' % self.scheduler
713 718 ]
714 719 self.log.info("Stopping Win HPC Job: %s" % (self.job_cmd + ' ' + ' '.join(args),))
715 720 try:
716 721 output = check_output([self.job_cmd]+args,
717 722 env=os.environ,
718 723 cwd=self.work_dir,
719 724 stderr=STDOUT
720 725 )
721 726 except:
722 727 output = 'The job already appears to be stopped: %r' % self.job_id
723 728 self.notify_stop(dict(job_id=self.job_id, output=output)) # Pass the output of the kill cmd
724 729 return output
725 730
726 731
727 732 class WindowsHPCControllerLauncher(WindowsHPCLauncher):
728 733
729 734 job_file_name = Unicode(u'ipcontroller_job.xml', config=True,
730 735 help="WinHPC xml job file.")
731 736 extra_args = List([], config=False,
732 737 help="extra args to pass to ipcontroller")
733 738
734 739 def write_job_file(self, n):
735 740 job = IPControllerJob(config=self.config)
736 741
737 742 t = IPControllerTask(config=self.config)
738 743 # The tasks work directory is *not* the actual work directory of
739 744 # the controller. It is used as the base path for the stdout/stderr
740 745 # files that the scheduler redirects to.
741 746 t.work_directory = self.profile_dir
742 747 # Add the profile_dir argument passed in from self.start().
743 748 t.controller_args.extend(self.extra_args)
744 749 job.add_task(t)
745 750
746 751 self.log.info("Writing job description file: %s" % self.job_file)
747 752 job.write(self.job_file)
748 753
749 754 @property
750 755 def job_file(self):
751 756 return os.path.join(self.profile_dir, self.job_file_name)
752 757
753 758 def start(self, profile_dir):
754 759 """Start the controller by profile_dir."""
755 760 self.extra_args = ['profile_dir=%s'%profile_dir]
756 761 self.profile_dir = unicode(profile_dir)
757 762 return super(WindowsHPCControllerLauncher, self).start(1)
758 763
759 764
760 765 class WindowsHPCEngineSetLauncher(WindowsHPCLauncher):
761 766
762 767 job_file_name = Unicode(u'ipengineset_job.xml', config=True,
763 768 help="jobfile for ipengines job")
764 769 extra_args = List([], config=False,
765 770 help="extra args to pass to ipengine")
766 771
767 772 def write_job_file(self, n):
768 773 job = IPEngineSetJob(config=self.config)
769 774
770 775 for i in range(n):
771 776 t = IPEngineTask(config=self.config)
772 777 # The tasks work directory is *not* the actual work directory of
773 778 # the engine. It is used as the base path for the stdout/stderr
774 779 # files that the scheduler redirects to.
775 780 t.work_directory = self.profile_dir
776 781 # Add the profile_dir and from self.start().
777 782 t.engine_args.extend(self.extra_args)
778 783 job.add_task(t)
779 784
780 785 self.log.info("Writing job description file: %s" % self.job_file)
781 786 job.write(self.job_file)
782 787
783 788 @property
784 789 def job_file(self):
785 790 return os.path.join(self.profile_dir, self.job_file_name)
786 791
787 792 def start(self, n, profile_dir):
788 793 """Start the controller by profile_dir."""
789 794 self.extra_args = ['profile_dir=%s'%profile_dir]
790 795 self.profile_dir = unicode(profile_dir)
791 796 return super(WindowsHPCEngineSetLauncher, self).start(n)
792 797
793 798
794 799 #-----------------------------------------------------------------------------
795 800 # Batch (PBS) system launchers
796 801 #-----------------------------------------------------------------------------
797 802
798 803 class BatchSystemLauncher(BaseLauncher):
799 804 """Launch an external process using a batch system.
800 805
801 806 This class is designed to work with UNIX batch systems like PBS, LSF,
802 807 GridEngine, etc. The overall model is that there are different commands
803 808 like qsub, qdel, etc. that handle the starting and stopping of the process.
804 809
805 810 This class also has the notion of a batch script. The ``batch_template``
806 811 attribute can be set to a string that is a template for the batch script.
807 812 This template is instantiated using string formatting. Thus the template can
808 813 use {n} for the number of instances. Subclasses can add additional variables
809 814 to the template dict.
810 815 """
811 816
812 817 # Subclasses must fill these in. See PBSEngineSet
813 818 submit_command = List([''], config=True,
814 819 help="The name of the command line program used to submit jobs.")
815 820 delete_command = List([''], config=True,
816 821 help="The name of the command line program used to delete jobs.")
817 822 job_id_regexp = Unicode('', config=True,
818 823 help="""A regular expression used to get the job id from the output of the
819 824 submit_command.""")
820 825 batch_template = Unicode('', config=True,
821 826 help="The string that is the batch script template itself.")
822 827 batch_template_file = Unicode(u'', config=True,
823 828 help="The file that contains the batch template.")
824 829 batch_file_name = Unicode(u'batch_script', config=True,
825 830 help="The filename of the instantiated batch script.")
826 831 queue = Unicode(u'', config=True,
827 832 help="The batch queue.")
828 833
829 834 # not configurable, override in subclasses
830 835 # PBS Job Array regex
831 836 job_array_regexp = Unicode('')
832 837 job_array_template = Unicode('')
833 838 # PBS Queue regex
834 839 queue_regexp = Unicode('')
835 840 queue_template = Unicode('')
836 841 # The default batch template, override in subclasses
837 842 default_template = Unicode('')
838 843 # The full path to the instantiated batch script.
839 844 batch_file = Unicode(u'')
840 845 # the format dict used with batch_template:
841 846 context = Dict()
842 847 # the Formatter instance for rendering the templates:
843 848 formatter = Instance(EvalFormatter, (), {})
844 849
845 850
846 851 def find_args(self):
847 852 return self.submit_command + [self.batch_file]
848 853
849 854 def __init__(self, work_dir=u'.', config=None, **kwargs):
850 855 super(BatchSystemLauncher, self).__init__(
851 856 work_dir=work_dir, config=config, **kwargs
852 857 )
853 858 self.batch_file = os.path.join(self.work_dir, self.batch_file_name)
854 859
855 860 def parse_job_id(self, output):
856 861 """Take the output of the submit command and return the job id."""
857 862 m = re.search(self.job_id_regexp, output)
858 863 if m is not None:
859 864 job_id = m.group()
860 865 else:
861 866 raise LauncherError("Job id couldn't be determined: %s" % output)
862 867 self.job_id = job_id
863 868 self.log.info('Job submitted with job id: %r' % job_id)
864 869 return job_id
865 870
866 871 def write_batch_script(self, n):
867 872 """Instantiate and write the batch script to the work_dir."""
868 873 self.context['n'] = n
869 874 self.context['queue'] = self.queue
870 875 # first priority is batch_template if set
871 876 if self.batch_template_file and not self.batch_template:
872 877 # second priority is batch_template_file
873 878 with open(self.batch_template_file) as f:
874 879 self.batch_template = f.read()
875 880 if not self.batch_template:
876 881 # third (last) priority is default_template
877 882 self.batch_template = self.default_template
878 883
879 884 regex = re.compile(self.job_array_regexp)
880 885 # print regex.search(self.batch_template)
881 886 if not regex.search(self.batch_template):
882 887 self.log.info("adding job array settings to batch script")
883 888 firstline, rest = self.batch_template.split('\n',1)
884 889 self.batch_template = u'\n'.join([firstline, self.job_array_template, rest])
885 890
886 891 regex = re.compile(self.queue_regexp)
887 892 # print regex.search(self.batch_template)
888 893 if self.queue and not regex.search(self.batch_template):
889 894 self.log.info("adding PBS queue settings to batch script")
890 895 firstline, rest = self.batch_template.split('\n',1)
891 896 self.batch_template = u'\n'.join([firstline, self.queue_template, rest])
892 897
893 898 script_as_string = self.formatter.format(self.batch_template, **self.context)
894 899 self.log.info('Writing instantiated batch script: %s' % self.batch_file)
895 900
896 901 with open(self.batch_file, 'w') as f:
897 902 f.write(script_as_string)
898 903 os.chmod(self.batch_file, stat.S_IRUSR | stat.S_IWUSR | stat.S_IXUSR)
899 904
900 905 def start(self, n, profile_dir):
901 906 """Start n copies of the process using a batch system."""
902 907 # Here we save profile_dir in the context so it
903 908 # can be used in the batch script template as {profile_dir}
904 909 self.context['profile_dir'] = profile_dir
905 910 self.profile_dir = unicode(profile_dir)
906 911 self.write_batch_script(n)
907 912 output = check_output(self.args, env=os.environ)
908 913
909 914 job_id = self.parse_job_id(output)
910 915 self.notify_start(job_id)
911 916 return job_id
912 917
913 918 def stop(self):
914 919 output = check_output(self.delete_command+[self.job_id], env=os.environ)
915 920 self.notify_stop(dict(job_id=self.job_id, output=output)) # Pass the output of the kill cmd
916 921 return output
917 922
918 923
919 924 class PBSLauncher(BatchSystemLauncher):
920 925 """A BatchSystemLauncher subclass for PBS."""
921 926
922 927 submit_command = List(['qsub'], config=True,
923 928 help="The PBS submit command ['qsub']")
924 929 delete_command = List(['qdel'], config=True,
925 930 help="The PBS delete command ['qdel']")
926 931 job_id_regexp = Unicode(r'\d+', config=True,
927 932 help="Regular expression for identifying the job ID [r'\d+']")
928 933
929 934 batch_file = Unicode(u'')
930 935 job_array_regexp = Unicode('#PBS\W+-t\W+[\w\d\-\$]+')
931 936 job_array_template = Unicode('#PBS -t 1-{n}')
932 937 queue_regexp = Unicode('#PBS\W+-q\W+\$?\w+')
933 938 queue_template = Unicode('#PBS -q {queue}')
934 939
935 940
936 941 class PBSControllerLauncher(PBSLauncher):
937 942 """Launch a controller using PBS."""
938 943
939 944 batch_file_name = Unicode(u'pbs_controller', config=True,
940 945 help="batch file name for the controller job.")
941 946 default_template= Unicode("""#!/bin/sh
942 947 #PBS -V
943 948 #PBS -N ipcontroller
944 949 %s --log-to-file profile_dir={profile_dir}
945 950 """%(' '.join(ipcontroller_cmd_argv)))
946 951
947 952 def start(self, profile_dir):
948 953 """Start the controller by profile or profile_dir."""
949 954 self.log.info("Starting PBSControllerLauncher: %r" % self.args)
950 955 return super(PBSControllerLauncher, self).start(1, profile_dir)
951 956
952 957
953 958 class PBSEngineSetLauncher(PBSLauncher):
954 959 """Launch Engines using PBS"""
955 960 batch_file_name = Unicode(u'pbs_engines', config=True,
956 961 help="batch file name for the engine(s) job.")
957 962 default_template= Unicode(u"""#!/bin/sh
958 963 #PBS -V
959 964 #PBS -N ipengine
960 965 %s profile_dir={profile_dir}
961 966 """%(' '.join(ipengine_cmd_argv)))
962 967
963 968 def start(self, n, profile_dir):
964 969 """Start n engines by profile or profile_dir."""
965 970 self.log.info('Starting %i engines with PBSEngineSetLauncher: %r' % (n, self.args))
966 971 return super(PBSEngineSetLauncher, self).start(n, profile_dir)
967 972
968 973 #SGE is very similar to PBS
969 974
970 975 class SGELauncher(PBSLauncher):
971 976 """Sun GridEngine is a PBS clone with slightly different syntax"""
972 977 job_array_regexp = Unicode('#\$\W+\-t')
973 978 job_array_template = Unicode('#$ -t 1-{n}')
974 979 queue_regexp = Unicode('#\$\W+-q\W+\$?\w+')
975 980 queue_template = Unicode('#$ -q {queue}')
976 981
977 982 class SGEControllerLauncher(SGELauncher):
978 983 """Launch a controller using SGE."""
979 984
980 985 batch_file_name = Unicode(u'sge_controller', config=True,
981 986 help="batch file name for the ipcontroller job.")
982 987 default_template= Unicode(u"""#$ -V
983 988 #$ -S /bin/sh
984 989 #$ -N ipcontroller
985 990 %s --log-to-file profile_dir={profile_dir}
986 991 """%(' '.join(ipcontroller_cmd_argv)))
987 992
988 993 def start(self, profile_dir):
989 994 """Start the controller by profile or profile_dir."""
990 995 self.log.info("Starting SGEControllerLauncher: %r" % self.args)
991 996 return super(SGEControllerLauncher, self).start(1, profile_dir)
992 997
993 998 class SGEEngineSetLauncher(SGELauncher):
994 999 """Launch Engines with SGE"""
995 1000 batch_file_name = Unicode(u'sge_engines', config=True,
996 1001 help="batch file name for the engine(s) job.")
997 1002 default_template = Unicode("""#$ -V
998 1003 #$ -S /bin/sh
999 1004 #$ -N ipengine
1000 1005 %s profile_dir={profile_dir}
1001 1006 """%(' '.join(ipengine_cmd_argv)))
1002 1007
1003 1008 def start(self, n, profile_dir):
1004 1009 """Start n engines by profile or profile_dir."""
1005 1010 self.log.info('Starting %i engines with SGEEngineSetLauncher: %r' % (n, self.args))
1006 1011 return super(SGEEngineSetLauncher, self).start(n, profile_dir)
1007 1012
1008 1013
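# ---------------------------------------------------------------------------
# Editor's sketch (not part of the diff above): supplying a custom PBS batch
# template, as the BatchSystemLauncher docstring describes. {n}, {queue} and
# {profile_dir} are the context keys filled in by write_batch_script(); the
# rest of the script is a made-up example, assumed to live in a hypothetical
# ipcluster_config.py (where get_config() is available).
# ---------------------------------------------------------------------------
c = get_config()

c.PBSEngineSetLauncher.batch_template = """#!/bin/sh
#PBS -V
#PBS -q {queue}
#PBS -t 1-{n}
#PBS -N ipengine
ipengine profile_dir={profile_dir}
"""
c.PBSEngineSetLauncher.queue = u'batch'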
1009 1014 #-----------------------------------------------------------------------------
1010 1015 # A launcher for ipcluster itself!
1011 1016 #-----------------------------------------------------------------------------
1012 1017
1013 1018
1014 1019 class IPClusterLauncher(LocalProcessLauncher):
1015 1020 """Launch the ipcluster program in an external process."""
1016 1021
1017 1022 ipcluster_cmd = List(ipcluster_cmd_argv, config=True,
1018 1023 help="Popen command for ipcluster")
1019 1024 ipcluster_args = List(
1020 1025 ['--clean-logs', '--log-to-file', 'log_level=%i'%logging.INFO], config=True,
1021 1026 help="Command line arguments to pass to ipcluster.")
1022 1027 ipcluster_subcommand = Unicode('start')
1023 1028 ipcluster_n = Int(2)
1024 1029
1025 1030 def find_args(self):
1026 1031 return self.ipcluster_cmd + ['--'+self.ipcluster_subcommand] + \
1027 1032 ['n=%i'%self.ipcluster_n] + self.ipcluster_args
1028 1033
1029 1034 def start(self):
1030 1035 self.log.info("Starting ipcluster: %r" % self.args)
1031 1036 return super(IPClusterLauncher, self).start()
1032 1037
1033 1038 #-----------------------------------------------------------------------------
1034 1039 # Collections of launchers
1035 1040 #-----------------------------------------------------------------------------
1036 1041
1037 1042 local_launchers = [
1038 1043 LocalControllerLauncher,
1039 1044 LocalEngineLauncher,
1040 1045 LocalEngineSetLauncher,
1041 1046 ]
1042 1047 mpi_launchers = [
1043 1048 MPIExecLauncher,
1044 1049 MPIExecControllerLauncher,
1045 1050 MPIExecEngineSetLauncher,
1046 1051 ]
1047 1052 ssh_launchers = [
1048 1053 SSHLauncher,
1049 1054 SSHControllerLauncher,
1050 1055 SSHEngineLauncher,
1051 1056 SSHEngineSetLauncher,
1052 1057 ]
1053 1058 winhpc_launchers = [
1054 1059 WindowsHPCLauncher,
1055 1060 WindowsHPCControllerLauncher,
1056 1061 WindowsHPCEngineSetLauncher,
1057 1062 ]
1058 1063 pbs_launchers = [
1059 1064 PBSLauncher,
1060 1065 PBSControllerLauncher,
1061 1066 PBSEngineSetLauncher,
1062 1067 ]
1063 1068 sge_launchers = [
1064 1069 SGELauncher,
1065 1070 SGEControllerLauncher,
1066 1071 SGEEngineSetLauncher,
1067 1072 ]
1068 1073 all_launchers = local_launchers + mpi_launchers + ssh_launchers + winhpc_launchers\
1069 1074 + pbs_launchers + sge_launchers
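# ---------------------------------------------------------------------------
# Editor's sketch (not part of the diff above): driving one of the launchers
# from the ioloop, using only the BaseLauncher API shown above (start,
# on_stop, loop). The profile_dir path is a made-up example.
# ---------------------------------------------------------------------------
from zmq.eventloop import ioloop

def run_local_controller(profile_dir=u'/home/user/.ipython/profile_default'):
    loop = ioloop.IOLoop.instance()
    launcher = LocalControllerLauncher()
    # on_stop callbacks fire with dict(exit_code=..., pid=...)
    launcher.on_stop(lambda data: loop.stop())
    launcher.start(profile_dir)
    loop.start()
    return launcher.stop_data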
@@ -1,108 +1,115 b''
1 1 #!/usr/bin/env python
2 """A simple logger object that consolidates messages incoming from ipcluster processes."""
2 """
3 A simple logger object that consolidates messages incoming from ipcluster processes.
4
5 Authors:
6
7 * MinRK
8
9 """
3 10
4 11 #-----------------------------------------------------------------------------
5 12 # Copyright (C) 2011 The IPython Development Team
6 13 #
7 14 # Distributed under the terms of the BSD License. The full license is in
8 15 # the file COPYING, distributed as part of this software.
9 16 #-----------------------------------------------------------------------------
10 17
11 18 #-----------------------------------------------------------------------------
12 19 # Imports
13 20 #-----------------------------------------------------------------------------
14 21
15 22
16 23 import logging
17 24 import sys
18 25
19 26 import zmq
20 27 from zmq.eventloop import ioloop, zmqstream
21 28
22 29 from IPython.config.configurable import LoggingConfigurable
23 30 from IPython.utils.traitlets import Int, Unicode, Instance, List
24 31
25 32 #-----------------------------------------------------------------------------
26 33 # Classes
27 34 #-----------------------------------------------------------------------------
28 35
29 36
30 37 class LogWatcher(LoggingConfigurable):
31 38 """A simple class that receives messages on a SUB socket, as published
32 39 by subclasses of `zmq.log.handlers.PUBHandler`, and logs them itself.
33 40
34 41 This can subscribe to multiple topics, but defaults to all topics.
35 42 """
36 43
37 44 # configurables
38 45 topics = List([''], config=True,
39 46 help="The ZMQ topics to subscribe to. Default is to subscribe to all messages")
40 47 url = Unicode('tcp://127.0.0.1:20202', config=True,
41 48 help="ZMQ url on which to listen for log messages")
42 49
43 50 # internals
44 51 stream = Instance('zmq.eventloop.zmqstream.ZMQStream')
45 52
46 53 context = Instance(zmq.Context)
47 54 def _context_default(self):
48 55 return zmq.Context.instance()
49 56
50 57 loop = Instance(zmq.eventloop.ioloop.IOLoop)
51 58 def _loop_default(self):
52 59 return ioloop.IOLoop.instance()
53 60
54 61 def __init__(self, **kwargs):
55 62 super(LogWatcher, self).__init__(**kwargs)
56 63 s = self.context.socket(zmq.SUB)
57 64 s.bind(self.url)
58 65 self.stream = zmqstream.ZMQStream(s, self.loop)
59 66 self.subscribe()
60 67 self.on_trait_change(self.subscribe, 'topics')
61 68
62 69 def start(self):
63 70 self.stream.on_recv(self.log_message)
64 71
65 72 def stop(self):
66 73 self.stream.stop_on_recv()
67 74
68 75 def subscribe(self):
69 76 """Update our SUB socket's subscriptions."""
70 77 self.stream.setsockopt(zmq.UNSUBSCRIBE, '')
71 78 if '' in self.topics:
72 79 self.log.debug("Subscribing to: everything")
73 80 self.stream.setsockopt(zmq.SUBSCRIBE, '')
74 81 else:
75 82 for topic in self.topics:
76 83 self.log.debug("Subscribing to: %r"%(topic))
77 84 self.stream.setsockopt(zmq.SUBSCRIBE, topic)
78 85
79 86 def _extract_level(self, topic_str):
80 87 """Turn 'engine.0.INFO.extra' into (logging.INFO, 'engine.0.extra')"""
81 88 topics = topic_str.split('.')
82 89 for idx,t in enumerate(topics):
83 90 level = getattr(logging, t, None)
84 91 if level is not None:
85 92 break
86 93
87 94 if level is None:
88 95 level = logging.INFO
89 96 else:
90 97 topics.pop(idx)
91 98
92 99 return level, '.'.join(topics)
93 100
94 101
95 102 def log_message(self, raw):
96 103 """receive and parse a message, then log it."""
97 104 if len(raw) != 2 or '.' not in raw[0]:
98 105 self.log.error("Invalid log message: %s"%raw)
99 106 return
100 107 else:
101 108 topic, msg = raw
102 109 # don't newline, since log messages always newline:
103 110 topic,level_name = topic.rsplit('.',1)
104 111 level,topic = self._extract_level(topic)
105 112 if msg[-1] == '\n':
106 113 msg = msg[:-1]
107 114 self.log.log(level, "[%s] %s" % (topic, msg))
108 115
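# ---------------------------------------------------------------------------
# Editor's sketch (not part of the diff above): the two-part message format
# log_message() expects: [topic, body], where the level name is a dotted
# component of the topic, e.g. 'engine.0.INFO' -> (logging.INFO, 'engine.0').
# ---------------------------------------------------------------------------
import zmq

ctx = zmq.Context.instance()
pub = ctx.socket(zmq.PUB)
pub.connect('tcp://127.0.0.1:20202')   # default LogWatcher.url

# _extract_level() strips the INFO token, so this logs "[engine.0] engine 0 up"
pub.send_multipart(['engine.0.INFO', 'engine 0 up\n'])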
@@ -1,67 +1,73 b''
1 1 #!/usr/bin/env python
2 2 """Utility for forwarding file read events over a zmq socket.
3 3
4 This is necessary because select on Windows only supports"""
4 This is necessary because select on Windows only supports sockets, not FDs.
5
6 Authors:
7
8 * MinRK
9
10 """
5 11
6 12 #-----------------------------------------------------------------------------
7 13 # Copyright (C) 2011 The IPython Development Team
8 14 #
9 15 # Distributed under the terms of the BSD License. The full license is in
10 16 # the file COPYING, distributed as part of this software.
11 17 #-----------------------------------------------------------------------------
12 18
13 19 #-----------------------------------------------------------------------------
14 20 # Imports
15 21 #-----------------------------------------------------------------------------
16 22
17 23 import uuid
18 24 import zmq
19 25
20 26 from threading import Thread
21 27
22 28 #-----------------------------------------------------------------------------
23 29 # Code
24 30 #-----------------------------------------------------------------------------
25 31
26 32 class ForwarderThread(Thread):
27 33 def __init__(self, sock, fd):
28 34 Thread.__init__(self)
29 35 self.daemon=True
30 36 self.sock = sock
31 37 self.fd = fd
32 38
33 39 def run(self):
34 40 """loop through lines in self.fd, and send them over self.sock"""
35 41 line = self.fd.readline()
36 42 # allow for files opened in unicode mode
37 43 if isinstance(line, unicode):
38 44 send = self.sock.send_unicode
39 45 else:
40 46 send = self.sock.send
41 47 while line:
42 48 send(line)
43 49 line = self.fd.readline()
44 50 # line == '' means EOF
45 51 self.fd.close()
46 52 self.sock.close()
47 53
48 54 def forward_read_events(fd, context=None):
49 55 """forward read events from an FD over a socket.
50 56
51 57 This method wraps a file in a socket pair, so it can
52 58 be polled for read events by select (specifically zmq.eventloop.ioloop)
53 59 """
54 60 if context is None:
55 61 context = zmq.Context.instance()
56 62 push = context.socket(zmq.PUSH)
57 63 push.setsockopt(zmq.LINGER, -1)
58 64 pull = context.socket(zmq.PULL)
59 65 addr='inproc://%s'%uuid.uuid4()
60 66 push.bind(addr)
61 67 pull.connect(addr)
62 68 forwarder = ForwarderThread(push, fd)
63 69 forwarder.start()
64 70 return pull
65 71
66 72
67 73 __all__ = ['forward_read_events'] No newline at end of file
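# ---------------------------------------------------------------------------
# Editor's sketch (not part of the diff above): how launcher.py uses this on
# Windows -- wrap a pipe in forward_read_events() so the zmq ioloop can poll
# it like a socket. The child command is a made-up example.
# ---------------------------------------------------------------------------
from subprocess import Popen, PIPE
from zmq.eventloop import ioloop

proc = Popen(['python', '-c', 'print "hello"'], stdout=PIPE)
stdout = forward_read_events(proc.stdout)   # a PULL socket

loop = ioloop.IOLoop.instance()

def handle_stdout(fd, events):
    line = stdout.recv()       # one line forwarded from the child's stdout
    print line.rstrip()
    loop.stop()

loop.add_handler(stdout, handle_stdout, loop.READ)
loop.start()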
@@ -1,314 +1,320 b''
1 1 #!/usr/bin/env python
2 2 # encoding: utf-8
3 3 """
4 4 Job and task components for writing .xml files that the Windows HPC Server
5 5 2008 can use to start jobs.
6
7 Authors:
8
9 * Brian Granger
10 * MinRK
11
6 12 """
7 13
8 14 #-----------------------------------------------------------------------------
9 # Copyright (C) 2008-2009 The IPython Development Team
15 # Copyright (C) 2008-2011 The IPython Development Team
10 16 #
11 17 # Distributed under the terms of the BSD License. The full license is in
12 18 # the file COPYING, distributed as part of this software.
13 19 #-----------------------------------------------------------------------------
14 20
15 21 #-----------------------------------------------------------------------------
16 22 # Imports
17 23 #-----------------------------------------------------------------------------
18 24
19 25 import os
20 26 import re
21 27 import uuid
22 28
23 29 from xml.etree import ElementTree as ET
24 30
25 31 from IPython.config.configurable import Configurable
26 32 from IPython.utils.traitlets import (
27 33 Unicode, Int, List, Instance,
28 34 Enum, Bool
29 35 )
30 36
31 37 #-----------------------------------------------------------------------------
32 38 # Job and Task classes
33 39 #-----------------------------------------------------------------------------
34 40
35 41
36 42 def as_str(value):
37 43 if isinstance(value, str):
38 44 return value
39 45 elif isinstance(value, bool):
40 46 if value:
41 47 return 'true'
42 48 else:
43 49 return 'false'
44 50 elif isinstance(value, (int, float)):
45 51 return repr(value)
46 52 else:
47 53 return value
48 54
49 55
50 56 def indent(elem, level=0):
51 57 i = "\n" + level*" "
52 58 if len(elem):
53 59 if not elem.text or not elem.text.strip():
54 60 elem.text = i + " "
55 61 if not elem.tail or not elem.tail.strip():
56 62 elem.tail = i
57 63 for elem in elem:
58 64 indent(elem, level+1)
59 65 if not elem.tail or not elem.tail.strip():
60 66 elem.tail = i
61 67 else:
62 68 if level and (not elem.tail or not elem.tail.strip()):
63 69 elem.tail = i
64 70
65 71
66 72 def find_username():
67 73 domain = os.environ.get('USERDOMAIN')
68 74 username = os.environ.get('USERNAME','')
69 75 if domain is None:
70 76 return username
71 77 else:
72 78 return '%s\\%s' % (domain, username)
73 79
74 80
75 81 class WinHPCJob(Configurable):
76 82
77 83 job_id = Unicode('')
78 84 job_name = Unicode('MyJob', config=True)
79 85 min_cores = Int(1, config=True)
80 86 max_cores = Int(1, config=True)
81 87 min_sockets = Int(1, config=True)
82 88 max_sockets = Int(1, config=True)
83 89 min_nodes = Int(1, config=True)
84 90 max_nodes = Int(1, config=True)
85 91 unit_type = Unicode("Core", config=True)
86 92 auto_calculate_min = Bool(True, config=True)
87 93 auto_calculate_max = Bool(True, config=True)
88 94 run_until_canceled = Bool(False, config=True)
89 95 is_exclusive = Bool(False, config=True)
90 96 username = Unicode(find_username(), config=True)
91 97 job_type = Unicode('Batch', config=True)
92 98 priority = Enum(('Lowest','BelowNormal','Normal','AboveNormal','Highest'),
93 99 default_value='Highest', config=True)
94 100 requested_nodes = Unicode('', config=True)
95 101 project = Unicode('IPython', config=True)
96 102 xmlns = Unicode('http://schemas.microsoft.com/HPCS2008/scheduler/')
97 103 version = Unicode("2.000")
98 104 tasks = List([])
99 105
100 106 @property
101 107 def owner(self):
102 108 return self.username
103 109
104 110 def _write_attr(self, root, attr, key):
105 111 s = as_str(getattr(self, attr, ''))
106 112 if s:
107 113 root.set(key, s)
108 114
109 115 def as_element(self):
110 116 # We have to add _A_-style prefixes to get the attribute order that
111 117 # the MSFT XML parser expects.
112 118 root = ET.Element('Job')
113 119 self._write_attr(root, 'version', '_A_Version')
114 120 self._write_attr(root, 'job_name', '_B_Name')
115 121 self._write_attr(root, 'unit_type', '_C_UnitType')
116 122 self._write_attr(root, 'min_cores', '_D_MinCores')
117 123 self._write_attr(root, 'max_cores', '_E_MaxCores')
118 124 self._write_attr(root, 'min_sockets', '_F_MinSockets')
119 125 self._write_attr(root, 'max_sockets', '_G_MaxSockets')
120 126 self._write_attr(root, 'min_nodes', '_H_MinNodes')
121 127 self._write_attr(root, 'max_nodes', '_I_MaxNodes')
122 128 self._write_attr(root, 'run_until_canceled', '_J_RunUntilCanceled')
123 129 self._write_attr(root, 'is_exclusive', '_K_IsExclusive')
124 130 self._write_attr(root, 'username', '_L_UserName')
125 131 self._write_attr(root, 'job_type', '_M_JobType')
126 132 self._write_attr(root, 'priority', '_N_Priority')
127 133 self._write_attr(root, 'requested_nodes', '_O_RequestedNodes')
128 134 self._write_attr(root, 'auto_calculate_max', '_P_AutoCalculateMax')
129 135 self._write_attr(root, 'auto_calculate_min', '_Q_AutoCalculateMin')
130 136 self._write_attr(root, 'project', '_R_Project')
131 137 self._write_attr(root, 'owner', '_S_Owner')
132 138 self._write_attr(root, 'xmlns', '_T_xmlns')
133 139 dependencies = ET.SubElement(root, "Dependencies")
134 140 etasks = ET.SubElement(root, "Tasks")
135 141 for t in self.tasks:
136 142 etasks.append(t.as_element())
137 143 return root
138 144
139 145 def tostring(self):
140 146 """Return the string representation of the job description XML."""
141 147 root = self.as_element()
142 148 indent(root)
143 149 txt = ET.tostring(root, encoding="utf-8")
144 150 # Now remove the tokens used to order the attributes.
145 151 txt = re.sub(r'_[A-Z]_','',txt)
146 152 txt = '<?xml version="1.0" encoding="utf-8"?>\n' + txt
147 153 return txt
148 154
149 155 def write(self, filename):
150 156 """Write the XML job description to a file."""
151 157 txt = self.tostring()
152 158 with open(filename, 'w') as f:
153 159 f.write(txt)
154 160
155 161 def add_task(self, task):
156 162 """Add a task to the job.
157 163
158 164 Parameters
159 165 ----------
160 166 task : :class:`WinHPCTask`
161 167 The task object to add.
162 168 """
163 169 self.tasks.append(task)
164 170
165 171
166 172 class WinHPCTask(Configurable):
167 173
168 174 task_id = Unicode('')
169 175 task_name = Unicode('')
170 176 version = Unicode("2.000")
171 177 min_cores = Int(1, config=True)
172 178 max_cores = Int(1, config=True)
173 179 min_sockets = Int(1, config=True)
174 180 max_sockets = Int(1, config=True)
175 181 min_nodes = Int(1, config=True)
176 182 max_nodes = Int(1, config=True)
177 183 unit_type = Unicode("Core", config=True)
178 184 command_line = Unicode('', config=True)
179 185 work_directory = Unicode('', config=True)
180 186     is_rerunnable = Bool(True, config=True)
181 187 std_out_file_path = Unicode('', config=True)
182 188 std_err_file_path = Unicode('', config=True)
183 189 is_parametric = Bool(False, config=True)
184 190 environment_variables = Instance(dict, args=(), config=True)
185 191
186 192 def _write_attr(self, root, attr, key):
187 193 s = as_str(getattr(self, attr, ''))
188 194 if s:
189 195 root.set(key, s)
190 196
191 197 def as_element(self):
192 198 root = ET.Element('Task')
193 199 self._write_attr(root, 'version', '_A_Version')
194 200 self._write_attr(root, 'task_name', '_B_Name')
195 201 self._write_attr(root, 'min_cores', '_C_MinCores')
196 202 self._write_attr(root, 'max_cores', '_D_MaxCores')
197 203 self._write_attr(root, 'min_sockets', '_E_MinSockets')
198 204 self._write_attr(root, 'max_sockets', '_F_MaxSockets')
199 205 self._write_attr(root, 'min_nodes', '_G_MinNodes')
200 206 self._write_attr(root, 'max_nodes', '_H_MaxNodes')
201 207 self._write_attr(root, 'command_line', '_I_CommandLine')
202 208 self._write_attr(root, 'work_directory', '_J_WorkDirectory')
203 209         self._write_attr(root, 'is_rerunnable', '_K_IsRerunnable')
204 210 self._write_attr(root, 'std_out_file_path', '_L_StdOutFilePath')
205 211 self._write_attr(root, 'std_err_file_path', '_M_StdErrFilePath')
206 212 self._write_attr(root, 'is_parametric', '_N_IsParametric')
207 213 self._write_attr(root, 'unit_type', '_O_UnitType')
208 214 root.append(self.get_env_vars())
209 215 return root
210 216
211 217 def get_env_vars(self):
212 218 env_vars = ET.Element('EnvironmentVariables')
213 219 for k, v in self.environment_variables.iteritems():
214 220 variable = ET.SubElement(env_vars, "Variable")
215 221 name = ET.SubElement(variable, "Name")
216 222 name.text = k
217 223 value = ET.SubElement(variable, "Value")
218 224 value.text = v
219 225 return env_vars
220 226
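# A hedged usage sketch (hypothetical values): environment variables set on a
# task are serialized as <Variable> elements by get_env_vars().
#
# t = WinHPCTask(None)
# t.environment_variables['PYTHONPATH'] = r'C:\Python25\Lib\site-packages'
# print ET.tostring(t.get_env_vars())
# # -> <EnvironmentVariables><Variable><Name>PYTHONPATH</Name>
# #    <Value>C:\Python25\Lib\site-packages</Value></Variable></EnvironmentVariables>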
221 227
222 228
223 229 # By declaring these, we can configure the controller and engine separately!
224 230
225 231 class IPControllerJob(WinHPCJob):
226 232 job_name = Unicode('IPController', config=False)
227 233 is_exclusive = Bool(False, config=True)
228 234 username = Unicode(find_username(), config=True)
229 235 priority = Enum(('Lowest','BelowNormal','Normal','AboveNormal','Highest'),
230 236 default_value='Highest', config=True)
231 237 requested_nodes = Unicode('', config=True)
232 238 project = Unicode('IPython', config=True)
233 239
234 240
235 241 class IPEngineSetJob(WinHPCJob):
236 242 job_name = Unicode('IPEngineSet', config=False)
237 243 is_exclusive = Bool(False, config=True)
238 244 username = Unicode(find_username(), config=True)
239 245 priority = Enum(('Lowest','BelowNormal','Normal','AboveNormal','Highest'),
240 246 default_value='Highest', config=True)
241 247 requested_nodes = Unicode('', config=True)
242 248 project = Unicode('IPython', config=True)
243 249
244 250
245 251 class IPControllerTask(WinHPCTask):
246 252
247 253 task_name = Unicode('IPController', config=True)
248 254 controller_cmd = List(['ipcontroller.exe'], config=True)
249 255 controller_args = List(['--log-to-file', '--log-level', '40'], config=True)
250 256 # I don't want these to be configurable
251 257 std_out_file_path = Unicode('', config=False)
252 258 std_err_file_path = Unicode('', config=False)
253 259 min_cores = Int(1, config=False)
254 260 max_cores = Int(1, config=False)
255 261 min_sockets = Int(1, config=False)
256 262 max_sockets = Int(1, config=False)
257 263 min_nodes = Int(1, config=False)
258 264 max_nodes = Int(1, config=False)
259 265 unit_type = Unicode("Core", config=False)
260 266 work_directory = Unicode('', config=False)
261 267
262 268 def __init__(self, config=None):
263 269 super(IPControllerTask, self).__init__(config=config)
264 270 the_uuid = uuid.uuid1()
265 271 self.std_out_file_path = os.path.join('log','ipcontroller-%s.out' % the_uuid)
266 272 self.std_err_file_path = os.path.join('log','ipcontroller-%s.err' % the_uuid)
267 273
268 274 @property
269 275 def command_line(self):
270 276 return ' '.join(self.controller_cmd + self.controller_args)
271 277
272 278
273 279 class IPEngineTask(WinHPCTask):
274 280
275 281 task_name = Unicode('IPEngine', config=True)
276 282 engine_cmd = List(['ipengine.exe'], config=True)
277 283 engine_args = List(['--log-to-file', '--log-level', '40'], config=True)
278 284 # I don't want these to be configurable
279 285 std_out_file_path = Unicode('', config=False)
280 286 std_err_file_path = Unicode('', config=False)
281 287 min_cores = Int(1, config=False)
282 288 max_cores = Int(1, config=False)
283 289 min_sockets = Int(1, config=False)
284 290 max_sockets = Int(1, config=False)
285 291 min_nodes = Int(1, config=False)
286 292 max_nodes = Int(1, config=False)
287 293 unit_type = Unicode("Core", config=False)
288 294 work_directory = Unicode('', config=False)
289 295
290 296 def __init__(self, config=None):
291 297 super(IPEngineTask,self).__init__(config=config)
292 298 the_uuid = uuid.uuid1()
293 299 self.std_out_file_path = os.path.join('log','ipengine-%s.out' % the_uuid)
294 300 self.std_err_file_path = os.path.join('log','ipengine-%s.err' % the_uuid)
295 301
296 302 @property
297 303 def command_line(self):
298 304 return ' '.join(self.engine_cmd + self.engine_args)
299 305
300 306
301 307 # j = WinHPCJob(None)
302 308 # j.job_name = 'IPCluster'
303 309 # j.username = 'GNET\\bgranger'
304 310 # j.requested_nodes = 'GREEN'
305 311 #
306 312 # t = WinHPCTask(None)
307 313 # t.task_name = 'Controller'
308 314 # t.command_line = r"\\blue\domainusers$\bgranger\Python\Python25\Scripts\ipcontroller.exe --log-to-file -p default --log-level 10"
309 315 # t.work_directory = r"\\blue\domainusers$\bgranger\.ipython\cluster_default"
310 316 # t.std_out_file_path = 'controller-out.txt'
311 317 # t.std_err_file_path = 'controller-err.txt'
312 318 # t.environment_variables['PYTHONPATH'] = r"\\blue\domainusers$\bgranger\Python\Python25\Lib\site-packages"
313 319 # j.add_task(t)
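#
# A hedged sketch of the same flow using the job/task subclasses above
# (usernames and filenames are placeholders):
#
# cj = IPControllerJob(None)
# cj.username = 'DOMAIN\\user'
# cj.add_task(IPControllerTask(None))
# cj.write('ipcontroller_job.xml')
#
# ej = IPEngineSetJob(None)
# ej.username = 'DOMAIN\\user'
# for i in range(4):
#     ej.add_task(IPEngineTask(None))
# ej.write('ipengineset_job.xml')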
314 320
@@ -1,340 +1,345 b''
1 """AsyncResult objects for the client"""
1 """AsyncResult objects for the client
2
3 Authors:
4
5 * MinRK
6 """
2 7 #-----------------------------------------------------------------------------
3 8 # Copyright (C) 2010-2011 The IPython Development Team
4 9 #
5 10 # Distributed under the terms of the BSD License. The full license is in
6 11 # the file COPYING, distributed as part of this software.
7 12 #-----------------------------------------------------------------------------
8 13
9 14 #-----------------------------------------------------------------------------
10 15 # Imports
11 16 #-----------------------------------------------------------------------------
12 17
13 18 import time
14 19
15 20 from zmq import MessageTracker
16 21
17 22 from IPython.external.decorator import decorator
18 23 from IPython.parallel import error
19 24
20 25 #-----------------------------------------------------------------------------
21 26 # Classes
22 27 #-----------------------------------------------------------------------------
23 28
24 29 # global empty tracker that's always done:
25 30 finished_tracker = MessageTracker()
26 31
27 32 @decorator
28 33 def check_ready(f, self, *args, **kwargs):
29 34 """Call spin() to sync state prior to calling the method."""
30 35 self.wait(0)
31 36 if not self._ready:
32 37 raise error.TimeoutError("result not ready")
33 38 return f(self, *args, **kwargs)
34 39
35 40 class AsyncResult(object):
36 41 """Class for representing results of non-blocking calls.
37 42
38 43 Provides the same interface as :py:class:`multiprocessing.pool.AsyncResult`.
39 44 """
40 45
41 46 msg_ids = None
42 47 _targets = None
43 48 _tracker = None
44 49 _single_result = False
45 50
46 51 def __init__(self, client, msg_ids, fname='unknown', targets=None, tracker=None):
47 52 if isinstance(msg_ids, basestring):
48 53 # always a list
49 54 msg_ids = [msg_ids]
50 55 if tracker is None:
51 56 # default to always done
52 57 tracker = finished_tracker
53 58 self._client = client
54 59 self.msg_ids = msg_ids
55 60 self._fname=fname
56 61 self._targets = targets
57 62 self._tracker = tracker
58 63 self._ready = False
59 64 self._success = None
60 65 if len(msg_ids) == 1:
61 66 self._single_result = not isinstance(targets, (list, tuple))
62 67 else:
63 68 self._single_result = False
64 69
65 70 def __repr__(self):
66 71 if self._ready:
67 72 return "<%s: finished>"%(self.__class__.__name__)
68 73 else:
69 74 return "<%s: %s>"%(self.__class__.__name__,self._fname)
70 75
71 76
72 77 def _reconstruct_result(self, res):
73 78 """Reconstruct our result from actual result list (always a list)
74 79
75 80 Override me in subclasses for turning a list of results
76 81 into the expected form.
77 82 """
78 83 if self._single_result:
79 84 return res[0]
80 85 else:
81 86 return res
82 87
83 88 def get(self, timeout=-1):
84 89 """Return the result when it arrives.
85 90
86 91 If `timeout` is not ``None`` and the result does not arrive within
87 92 `timeout` seconds then ``TimeoutError`` is raised. If the
88 93 remote call raised an exception then that exception will be reraised
89 94 by get() inside a `RemoteError`.
90 95 """
91 96 if not self.ready():
92 97 self.wait(timeout)
93 98
94 99 if self._ready:
95 100 if self._success:
96 101 return self._result
97 102 else:
98 103 raise self._exception
99 104 else:
100 105 raise error.TimeoutError("Result not ready.")
101 106
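# A hedged usage sketch (`view` is a hypothetical View instance):
#
# ar = view.apply_async(lambda x: 2*x, 21)
# try:
#     result = ar.get(timeout=5)  # TimeoutError if not done within 5s
# except error.TimeoutError:
#     print "still pending:", ar.msg_ids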
102 107 def ready(self):
103 108 """Return whether the call has completed."""
104 109 if not self._ready:
105 110 self.wait(0)
106 111 return self._ready
107 112
108 113 def wait(self, timeout=-1):
109 114 """Wait until the result is available or until `timeout` seconds pass.
110 115
111 116 This method always returns None.
112 117 """
113 118 if self._ready:
114 119 return
115 120 self._ready = self._client.wait(self.msg_ids, timeout)
116 121 if self._ready:
117 122 try:
118 123 results = map(self._client.results.get, self.msg_ids)
119 124 self._result = results
120 125 if self._single_result:
121 126 r = results[0]
122 127 if isinstance(r, Exception):
123 128 raise r
124 129 else:
125 130 results = error.collect_exceptions(results, self._fname)
126 131 self._result = self._reconstruct_result(results)
127 132 except Exception, e:
128 133 self._exception = e
129 134 self._success = False
130 135 else:
131 136 self._success = True
132 137 finally:
133 138 self._metadata = map(self._client.metadata.get, self.msg_ids)
134 139
135 140
136 141 def successful(self):
137 142 """Return whether the call completed without raising an exception.
138 143
139 144 Will raise ``AssertionError`` if the result is not ready.
140 145 """
141 146 assert self.ready()
142 147 return self._success
143 148
144 149 #----------------------------------------------------------------
145 150 # Extra methods not in mp.pool.AsyncResult
146 151 #----------------------------------------------------------------
147 152
148 153 def get_dict(self, timeout=-1):
149 154 """Get the results as a dict, keyed by engine_id.
150 155
151 156 timeout behavior is described in `get()`.
152 157 """
153 158
154 159 results = self.get(timeout)
155 160 engine_ids = [ md['engine_id'] for md in self._metadata ]
156 161 bycount = sorted(engine_ids, key=lambda k: engine_ids.count(k))
157 162 maxcount = bycount.count(bycount[-1])
158 163 if maxcount > 1:
159 164 raise ValueError("Cannot build dict, %i jobs ran on engine #%i"%(
160 165 maxcount, bycount[-1]))
161 166
162 167 return dict(zip(engine_ids,results))
163 168
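# A hedged usage sketch (`dview` is a hypothetical DirectView): one result
# per engine, keyed by engine_id.
#
# import os  # needed on the engines as well
# ar = dview.apply_async(os.getpid)
# pids = ar.get_dict()  # e.g. {0: 1234, 1: 1235}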
164 169 @property
165 170 def result(self):
166 171 """result property wrapper for `get(timeout=0)`."""
167 172 return self.get()
168 173
169 174 # abbreviated alias:
170 175 r = result
171 176
172 177 @property
173 178 @check_ready
174 179 def metadata(self):
175 180 """property for accessing execution metadata."""
176 181 if self._single_result:
177 182 return self._metadata[0]
178 183 else:
179 184 return self._metadata
180 185
181 186 @property
182 187 def result_dict(self):
183 188 """result property as a dict."""
184 189 return self.get_dict()
185 190
186 191 def __dict__(self):
187 192 return self.get_dict(0)
188 193
189 194 def abort(self):
190 195 """abort my tasks."""
191 196 assert not self.ready(), "Can't abort, I am already done!"
192 197         return self._client.abort(self.msg_ids, targets=self._targets, block=True)
193 198
194 199 @property
195 200 def sent(self):
196 201 """check whether my messages have been sent."""
197 202 return self._tracker.done
198 203
199 204 def wait_for_send(self, timeout=-1):
200 205 """wait for pyzmq send to complete.
201 206
202 207 This is necessary when sending arrays that you intend to edit in-place.
203 208 `timeout` is in seconds, and will raise TimeoutError if it is reached
204 209 before the send completes.
205 210 """
206 211 return self._tracker.wait(timeout)
207 212
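# A hedged usage sketch (hypothetical names): guard in-place edits on a
# tracked send.
#
# ar = view.apply_async(f, big_array, track=True)
# ar.wait_for_send(timeout=10)  # safe to mutate big_array after this returns
# big_array[:] = 0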
208 213 #-------------------------------------
209 214 # dict-access
210 215 #-------------------------------------
211 216
212 217 @check_ready
213 218 def __getitem__(self, key):
214 219 """getitem returns result value(s) if keyed by int/slice, or metadata if key is str.
215 220 """
216 221 if isinstance(key, int):
217 222 return error.collect_exceptions([self._result[key]], self._fname)[0]
218 223 elif isinstance(key, slice):
219 224 return error.collect_exceptions(self._result[key], self._fname)
220 225 elif isinstance(key, basestring):
221 226 values = [ md[key] for md in self._metadata ]
222 227 if self._single_result:
223 228 return values[0]
224 229 else:
225 230 return values
226 231 else:
227 232 raise TypeError("Invalid key type %r, must be 'int','slice', or 'str'"%type(key))
228 233
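# A hedged usage sketch (`ar` is a hypothetical finished AsyncResult):
# int/slice keys index into results, str keys index into metadata.
#
# ar[0]         # first result
# ar[:2]        # first two results
# ar['stdout']  # captured stdout, one entry per task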
229 234 @check_ready
230 235 def __getattr__(self, key):
231 236 """getattr maps to getitem for convenient attr access to metadata."""
232 237 if key not in self._metadata[0].keys():
233 238 raise AttributeError("%r object has no attribute %r"%(
234 239 self.__class__.__name__, key))
235 240 return self.__getitem__(key)
236 241
237 242 # asynchronous iterator:
238 243 def __iter__(self):
239 244 if self._single_result:
240 245 raise TypeError("AsyncResults with a single result are not iterable.")
241 246 try:
242 247 rlist = self.get(0)
243 248 except error.TimeoutError:
244 249 # wait for each result individually
245 250 for msg_id in self.msg_ids:
246 251 ar = AsyncResult(self._client, msg_id, self._fname)
247 252 yield ar.get()
248 253 else:
249 254 # already done
250 255 for r in rlist:
251 256 yield r
252 257
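# A hedged usage sketch (`dview` is a hypothetical multi-engine DirectView):
# iterating yields one result per msg_id, waiting for each in turn.
#
# import socket  # needed on the engines as well
# ar = dview.apply_async(socket.gethostname)
# for hostname in ar:
#     print hostname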
253 258
254 259
255 260 class AsyncMapResult(AsyncResult):
256 261 """Class for representing results of non-blocking gathers.
257 262
258 263 This will properly reconstruct the gather.
259 264 """
260 265
261 266 def __init__(self, client, msg_ids, mapObject, fname=''):
262 267 AsyncResult.__init__(self, client, msg_ids, fname=fname)
263 268 self._mapObject = mapObject
264 269 self._single_result = False
265 270
266 271 def _reconstruct_result(self, res):
267 272 """Perform the gather on the actual results."""
268 273 return self._mapObject.joinPartitions(res)
269 274
270 275 # asynchronous iterator:
271 276 def __iter__(self):
272 277 try:
273 278 rlist = self.get(0)
274 279 except error.TimeoutError:
275 280 # wait for each result individually
276 281 for msg_id in self.msg_ids:
277 282 ar = AsyncResult(self._client, msg_id, self._fname)
278 283 rlist = ar.get()
279 284 try:
280 285 for r in rlist:
281 286 yield r
282 287 except TypeError:
283 288 # flattened, not a list
284 289 # this could get broken by flattened data that returns iterables
285 290 # but most calls to map do not expose the `flatten` argument
286 291 yield rlist
287 292 else:
288 293 # already done
289 294 for r in rlist:
290 295 yield r
291 296
292 297
293 298 class AsyncHubResult(AsyncResult):
294 299 """Class to wrap pending results that must be requested from the Hub.
295 300
296 301     Note that waiting/polling on these objects requires polling the Hub over the network,
297 302 so use `AsyncHubResult.wait()` sparingly.
298 303 """
299 304
300 305 def wait(self, timeout=-1):
301 306 """wait for result to complete."""
302 307 start = time.time()
303 308 if self._ready:
304 309 return
305 310 local_ids = filter(lambda msg_id: msg_id in self._client.outstanding, self.msg_ids)
306 311 local_ready = self._client.wait(local_ids, timeout)
307 312 if local_ready:
308 313 remote_ids = filter(lambda msg_id: msg_id not in self._client.results, self.msg_ids)
309 314 if not remote_ids:
310 315 self._ready = True
311 316 else:
312 317 rdict = self._client.result_status(remote_ids, status_only=False)
313 318 pending = rdict['pending']
314 319 while pending and (timeout < 0 or time.time() < start+timeout):
315 320 rdict = self._client.result_status(remote_ids, status_only=False)
316 321 pending = rdict['pending']
317 322 if pending:
318 323 time.sleep(0.1)
319 324 if not pending:
320 325 self._ready = True
321 326 if self._ready:
322 327 try:
323 328 results = map(self._client.results.get, self.msg_ids)
324 329 self._result = results
325 330 if self._single_result:
326 331 r = results[0]
327 332 if isinstance(r, Exception):
328 333 raise r
329 334 else:
330 335 results = error.collect_exceptions(results, self._fname)
331 336 self._result = self._reconstruct_result(results)
332 337 except Exception, e:
333 338 self._exception = e
334 339 self._success = False
335 340 else:
336 341 self._success = True
337 342 finally:
338 343 self._metadata = map(self._client.metadata.get, self.msg_ids)
339 344
340 345 __all__ = ['AsyncResult', 'AsyncMapResult', 'AsyncHubResult']
\ No newline at end of file
@@ -1,1368 +1,1373 b''
1 """A semi-synchronous Client for the ZMQ cluster"""
1 """A semi-synchronous Client for the ZMQ cluster
2
3 Authors:
4
5 * MinRK
6 """
2 7 #-----------------------------------------------------------------------------
3 # Copyright (C) 2010 The IPython Development Team
8 # Copyright (C) 2010-2011 The IPython Development Team
4 9 #
5 10 # Distributed under the terms of the BSD License. The full license is in
6 11 # the file COPYING, distributed as part of this software.
7 12 #-----------------------------------------------------------------------------
8 13
9 14 #-----------------------------------------------------------------------------
10 15 # Imports
11 16 #-----------------------------------------------------------------------------
12 17
13 18 import os
14 19 import json
15 20 import time
16 21 import warnings
17 22 from datetime import datetime
18 23 from getpass import getpass
19 24 from pprint import pprint
20 25
21 26 pjoin = os.path.join
22 27
23 28 import zmq
24 29 # from zmq.eventloop import ioloop, zmqstream
25 30
26 31 from IPython.utils.path import get_ipython_dir
27 32 from IPython.utils.traitlets import (HasTraits, Int, Instance, Unicode,
28 33 Dict, List, Bool, Set)
29 34 from IPython.external.decorator import decorator
30 35 from IPython.external.ssh import tunnel
31 36
32 37 from IPython.parallel import error
33 38 from IPython.parallel import util
34 39
35 40 from IPython.zmq.session import Session, Message
36 41
37 42 from .asyncresult import AsyncResult, AsyncHubResult
38 43 from IPython.core.newapplication import ProfileDir, ProfileDirError
39 44 from .view import DirectView, LoadBalancedView
40 45
41 46 #--------------------------------------------------------------------------
42 47 # Decorators for Client methods
43 48 #--------------------------------------------------------------------------
44 49
45 50 @decorator
46 51 def spin_first(f, self, *args, **kwargs):
47 52 """Call spin() to sync state prior to calling the method."""
48 53 self.spin()
49 54 return f(self, *args, **kwargs)
50 55
51 56
52 57 #--------------------------------------------------------------------------
53 58 # Classes
54 59 #--------------------------------------------------------------------------
55 60
56 61 class Metadata(dict):
57 62 """Subclass of dict for initializing metadata values.
58 63
59 64 Attribute access works on keys.
60 65
61 66 These objects have a strict set of keys - errors will raise if you try
62 67 to add new keys.
63 68 """
64 69 def __init__(self, *args, **kwargs):
65 70 dict.__init__(self)
66 71 md = {'msg_id' : None,
67 72 'submitted' : None,
68 73 'started' : None,
69 74 'completed' : None,
70 75 'received' : None,
71 76 'engine_uuid' : None,
72 77 'engine_id' : None,
73 78 'follow' : None,
74 79 'after' : None,
75 80 'status' : None,
76 81
77 82 'pyin' : None,
78 83 'pyout' : None,
79 84 'pyerr' : None,
80 85 'stdout' : '',
81 86 'stderr' : '',
82 87 }
83 88 self.update(md)
84 89 self.update(dict(*args, **kwargs))
85 90
86 91 def __getattr__(self, key):
87 92 """getattr aliased to getitem"""
88 93 if key in self.iterkeys():
89 94 return self[key]
90 95 else:
91 96 raise AttributeError(key)
92 97
93 98 def __setattr__(self, key, value):
94 99 """setattr aliased to setitem, with strict"""
95 100 if key in self.iterkeys():
96 101 self[key] = value
97 102 else:
98 103 raise AttributeError(key)
99 104
100 105 def __setitem__(self, key, value):
101 106 """strict static key enforcement"""
102 107 if key in self.iterkeys():
103 108 dict.__setitem__(self, key, value)
104 109 else:
105 110 raise KeyError(key)
106 111
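# A hedged usage sketch (hypothetical values): attribute access works on the
# fixed key set only.
#
# md = Metadata(msg_id='abc123')
# md.status = 'ok'  # known key: same as md['status'] = 'ok'
# md.engine_id      # -> None until filled in
# md.foo = 1        # raises AttributeError: the key set is fixed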
107 112
108 113 class Client(HasTraits):
109 114 """A semi-synchronous client to the IPython ZMQ cluster
110 115
111 116 Parameters
112 117 ----------
113 118
114 119 url_or_file : bytes; zmq url or path to ipcontroller-client.json
115 120 Connection information for the Hub's registration. If a json connector
116 121 file is given, then likely no further configuration is necessary.
117 122 [Default: use profile]
118 123 profile : bytes
119 124 The name of the Cluster profile to be used to find connector information.
120 125 [Default: 'default']
121 126 context : zmq.Context
122 127 Pass an existing zmq.Context instance, otherwise the client will create its own.
123 128 debug : bool
124 129 flag for lots of message printing for debug purposes
125 130 timeout : int/float
126 131 time (in seconds) to wait for connection replies from the Hub
127 132 [Default: 10]
128 133
129 134 #-------------- session related args ----------------
130 135
131 136 config : Config object
132 137 If specified, this will be relayed to the Session for configuration
133 138 username : str
134 139 set username for the session object
135 140 packer : str (import_string) or callable
136 141 Can be either the simple keyword 'json' or 'pickle', or an import_string to a
137 142 function to serialize messages. Must support same input as
138 143 JSON, and output must be bytes.
139 144 You can pass a callable directly as `pack`
140 145 unpacker : str (import_string) or callable
141 146 The inverse of packer. Only necessary if packer is specified as *not* one
142 147 of 'json' or 'pickle'.
143 148
144 149 #-------------- ssh related args ----------------
145 150 # These are args for configuring the ssh tunnel to be used
146 151 # credentials are used to forward connections over ssh to the Controller
147 152 # Note that the ip given in `addr` needs to be relative to sshserver
148 153 # The most basic case is to leave addr as pointing to localhost (127.0.0.1),
149 154 # and set sshserver as the same machine the Controller is on. However,
150 155 # the only requirement is that sshserver is able to see the Controller
151 156 # (i.e. is within the same trusted network).
152 157
153 158 sshserver : str
154 159 A string of the form passed to ssh, i.e. 'server.tld' or 'user@server.tld:port'
155 160 If keyfile or password is specified, and this is not, it will default to
156 161 the ip given in addr.
157 162 sshkey : str; path to public ssh key file
158 163 This specifies a key to be used in ssh login, default None.
159 164 Regular default ssh keys will be used without specifying this argument.
160 165 password : str
161 166 Your ssh password to sshserver. Note that if this is left None,
162 167 you will be prompted for it if passwordless key based login is unavailable.
163 168 paramiko : bool
164 169 flag for whether to use paramiko instead of shell ssh for tunneling.
165 170 [default: True on win32, False else]
166 171
167 172 ------- exec authentication args -------
168 173 If even localhost is untrusted, you can have some protection against
169 174 unauthorized execution by signing messages with HMAC digests.
170 175 Messages are still sent as cleartext, so if someone can snoop your
171 176 loopback traffic this will not protect your privacy, but will prevent
172 177 unauthorized execution.
173 178
174 179 exec_key : str
175 180 an authentication key or file containing a key
176 181 default: None
177 182
178 183
179 184 Attributes
180 185 ----------
181 186
182 187 ids : list of int engine IDs
183 188 requesting the ids attribute always synchronizes
184 189 the registration state. To request ids without synchronization,
185 190         use the semi-private _ids attribute.
186 191
187 192 history : list of msg_ids
188 193 a list of msg_ids, keeping track of all the execution
189 194 messages you have submitted in order.
190 195
191 196 outstanding : set of msg_ids
192 197 a set of msg_ids that have been submitted, but whose
193 198 results have not yet been received.
194 199
195 200 results : dict
196 201 a dict of all our results, keyed by msg_id
197 202
198 203 block : bool
199 204 determines default behavior when block not specified
200 205 in execution methods
201 206
202 207 Methods
203 208 -------
204 209
205 210 spin
206 211 flushes incoming results and registration state changes
207 212 control methods spin, and requesting `ids` also ensures up to date
208 213
209 214 wait
210 215 wait on one or more msg_ids
211 216
212 217 execution methods
213 218 apply
214 219 legacy: execute, run
215 220
216 221 data movement
217 222 push, pull, scatter, gather
218 223
219 224 query methods
220 225 queue_status, get_result, purge, result_status
221 226
222 227 control methods
223 228 abort, shutdown
224 229
225 230 """
226 231
227 232
228 233 block = Bool(False)
229 234 outstanding = Set()
230 235 results = Instance('collections.defaultdict', (dict,))
231 236 metadata = Instance('collections.defaultdict', (Metadata,))
232 237 history = List()
233 238 debug = Bool(False)
234 239 profile=Unicode('default')
235 240
236 241 _outstanding_dict = Instance('collections.defaultdict', (set,))
237 242 _ids = List()
238 243 _connected=Bool(False)
239 244 _ssh=Bool(False)
240 245 _context = Instance('zmq.Context')
241 246 _config = Dict()
242 247 _engines=Instance(util.ReverseDict, (), {})
243 248 # _hub_socket=Instance('zmq.Socket')
244 249 _query_socket=Instance('zmq.Socket')
245 250 _control_socket=Instance('zmq.Socket')
246 251 _iopub_socket=Instance('zmq.Socket')
247 252 _notification_socket=Instance('zmq.Socket')
248 253 _mux_socket=Instance('zmq.Socket')
249 254 _task_socket=Instance('zmq.Socket')
250 255 _task_scheme=Unicode()
251 256 _closed = False
252 257 _ignored_control_replies=Int(0)
253 258 _ignored_hub_replies=Int(0)
254 259
255 260 def __init__(self, url_or_file=None, profile='default', profile_dir=None, ipython_dir=None,
256 261 context=None, debug=False, exec_key=None,
257 262 sshserver=None, sshkey=None, password=None, paramiko=None,
258 263 timeout=10, **extra_args
259 264 ):
260 265 super(Client, self).__init__(debug=debug, profile=profile)
261 266 if context is None:
262 267 context = zmq.Context.instance()
263 268 self._context = context
264 269
265 270
266 271 self._setup_profile_dir(profile, profile_dir, ipython_dir)
267 272 if self._cd is not None:
268 273 if url_or_file is None:
269 274 url_or_file = pjoin(self._cd.security_dir, 'ipcontroller-client.json')
270 275 assert url_or_file is not None, "I can't find enough information to connect to a hub!"\
271 276 " Please specify at least one of url_or_file or profile."
272 277
273 278 try:
274 279 util.validate_url(url_or_file)
275 280 except AssertionError:
276 281 if not os.path.exists(url_or_file):
277 282 if self._cd:
278 283 url_or_file = os.path.join(self._cd.security_dir, url_or_file)
279 284 assert os.path.exists(url_or_file), "Not a valid connection file or url: %r"%url_or_file
280 285 with open(url_or_file) as f:
281 286 cfg = json.loads(f.read())
282 287 else:
283 288 cfg = {'url':url_or_file}
284 289
285 290 # sync defaults from args, json:
286 291 if sshserver:
287 292 cfg['ssh'] = sshserver
288 293 if exec_key:
289 294 cfg['exec_key'] = exec_key
290 295 exec_key = cfg['exec_key']
291 296 sshserver=cfg['ssh']
292 297 url = cfg['url']
293 298 location = cfg.setdefault('location', None)
294 299 cfg['url'] = util.disambiguate_url(cfg['url'], location)
295 300 url = cfg['url']
296 301
297 302 self._config = cfg
298 303
299 304 self._ssh = bool(sshserver or sshkey or password)
300 305 if self._ssh and sshserver is None:
301 306 # default to ssh via localhost
302 307 sshserver = url.split('://')[1].split(':')[0]
303 308 if self._ssh and password is None:
304 309 if tunnel.try_passwordless_ssh(sshserver, sshkey, paramiko):
305 310 password=False
306 311 else:
307 312 password = getpass("SSH Password for %s: "%sshserver)
308 313 ssh_kwargs = dict(keyfile=sshkey, password=password, paramiko=paramiko)
309 314
310 315 # configure and construct the session
311 316 if exec_key is not None:
312 317 if os.path.isfile(exec_key):
313 318 extra_args['keyfile'] = exec_key
314 319 else:
315 320 extra_args['key'] = exec_key
316 321 self.session = Session(**extra_args)
317 322
318 323 self._query_socket = self._context.socket(zmq.XREQ)
319 324 self._query_socket.setsockopt(zmq.IDENTITY, self.session.session)
320 325 if self._ssh:
321 326 tunnel.tunnel_connection(self._query_socket, url, sshserver, **ssh_kwargs)
322 327 else:
323 328 self._query_socket.connect(url)
324 329
325 330 self.session.debug = self.debug
326 331
327 332 self._notification_handlers = {'registration_notification' : self._register_engine,
328 333 'unregistration_notification' : self._unregister_engine,
329 334 'shutdown_notification' : lambda msg: self.close(),
330 335 }
331 336 self._queue_handlers = {'execute_reply' : self._handle_execute_reply,
332 337 'apply_reply' : self._handle_apply_reply}
333 338 self._connect(sshserver, ssh_kwargs, timeout)
334 339
335 340 def __del__(self):
336 341 """cleanup sockets, but _not_ context."""
337 342 self.close()
338 343
339 344 def _setup_profile_dir(self, profile, profile_dir, ipython_dir):
340 345 if ipython_dir is None:
341 346 ipython_dir = get_ipython_dir()
342 347 if profile_dir is not None:
343 348 try:
344 349 self._cd = ProfileDir.find_profile_dir(profile_dir)
345 350 return
346 351 except ProfileDirError:
347 352 pass
348 353 elif profile is not None:
349 354 try:
350 355 self._cd = ProfileDir.find_profile_dir_by_name(
351 356 ipython_dir, profile)
352 357 return
353 358 except ProfileDirError:
354 359 pass
355 360 self._cd = None
356 361
357 362 def _update_engines(self, engines):
358 363 """Update our engines dict and _ids from a dict of the form: {id:uuid}."""
359 364 for k,v in engines.iteritems():
360 365 eid = int(k)
361 366 self._engines[eid] = bytes(v) # force not unicode
362 367 self._ids.append(eid)
363 368 self._ids = sorted(self._ids)
364 369 if sorted(self._engines.keys()) != range(len(self._engines)) and \
365 370 self._task_scheme == 'pure' and self._task_socket:
366 371 self._stop_scheduling_tasks()
367 372
368 373 def _stop_scheduling_tasks(self):
369 374 """Stop scheduling tasks because an engine has been unregistered
370 375 from a pure ZMQ scheduler.
371 376 """
372 377 self._task_socket.close()
373 378 self._task_socket = None
374 379 msg = "An engine has been unregistered, and we are using pure " +\
375 380 "ZMQ task scheduling. Task farming will be disabled."
376 381 if self.outstanding:
377 382 msg += " If you were running tasks when this happened, " +\
378 383 "some `outstanding` msg_ids may never resolve."
379 384 warnings.warn(msg, RuntimeWarning)
380 385
381 386 def _build_targets(self, targets):
382 387 """Turn valid target IDs or 'all' into two lists:
383 388 (int_ids, uuids).
384 389 """
385 390 if not self._ids:
386 391 # flush notification socket if no engines yet, just in case
387 392 if not self.ids:
388 393 raise error.NoEnginesRegistered("Can't build targets without any engines")
389 394
390 395 if targets is None:
391 396 targets = self._ids
392 397 elif isinstance(targets, str):
393 398 if targets.lower() == 'all':
394 399 targets = self._ids
395 400 else:
396 401 raise TypeError("%r not valid str target, must be 'all'"%(targets))
397 402 elif isinstance(targets, int):
398 403 if targets < 0:
399 404 targets = self.ids[targets]
400 405 if targets not in self._ids:
401 406 raise IndexError("No such engine: %i"%targets)
402 407 targets = [targets]
403 408
404 409 if isinstance(targets, slice):
405 410 indices = range(len(self._ids))[targets]
406 411 ids = self.ids
407 412 targets = [ ids[i] for i in indices ]
408 413
409 414 if not isinstance(targets, (tuple, list, xrange)):
410 415 raise TypeError("targets by int/slice/collection of ints only, not %s"%(type(targets)))
411 416
412 417 return [self._engines[t] for t in targets], list(targets)
413 418
414 419 def _connect(self, sshserver, ssh_kwargs, timeout):
415 420 """setup all our socket connections to the cluster. This is called from
416 421 __init__."""
417 422
418 423 # Maybe allow reconnecting?
419 424 if self._connected:
420 425 return
421 426 self._connected=True
422 427
423 428 def connect_socket(s, url):
424 429 url = util.disambiguate_url(url, self._config['location'])
425 430 if self._ssh:
426 431 return tunnel.tunnel_connection(s, url, sshserver, **ssh_kwargs)
427 432 else:
428 433 return s.connect(url)
429 434
430 435 self.session.send(self._query_socket, 'connection_request')
431 436 r,w,x = zmq.select([self._query_socket],[],[], timeout)
432 437 if not r:
433 438 raise error.TimeoutError("Hub connection request timed out")
434 439 idents,msg = self.session.recv(self._query_socket,mode=0)
435 440 if self.debug:
436 441 pprint(msg)
437 442 msg = Message(msg)
438 443 content = msg.content
439 444 self._config['registration'] = dict(content)
440 445 if content.status == 'ok':
441 446 if content.mux:
442 447 self._mux_socket = self._context.socket(zmq.XREQ)
443 448 self._mux_socket.setsockopt(zmq.IDENTITY, self.session.session)
444 449 connect_socket(self._mux_socket, content.mux)
445 450 if content.task:
446 451 self._task_scheme, task_addr = content.task
447 452 self._task_socket = self._context.socket(zmq.XREQ)
448 453 self._task_socket.setsockopt(zmq.IDENTITY, self.session.session)
449 454 connect_socket(self._task_socket, task_addr)
450 455 if content.notification:
451 456 self._notification_socket = self._context.socket(zmq.SUB)
452 457 connect_socket(self._notification_socket, content.notification)
453 458 self._notification_socket.setsockopt(zmq.SUBSCRIBE, b'')
454 459 # if content.query:
455 460 # self._query_socket = self._context.socket(zmq.XREQ)
456 461 # self._query_socket.setsockopt(zmq.IDENTITY, self.session.session)
457 462 # connect_socket(self._query_socket, content.query)
458 463 if content.control:
459 464 self._control_socket = self._context.socket(zmq.XREQ)
460 465 self._control_socket.setsockopt(zmq.IDENTITY, self.session.session)
461 466 connect_socket(self._control_socket, content.control)
462 467 if content.iopub:
463 468 self._iopub_socket = self._context.socket(zmq.SUB)
464 469 self._iopub_socket.setsockopt(zmq.SUBSCRIBE, b'')
465 470 self._iopub_socket.setsockopt(zmq.IDENTITY, self.session.session)
466 471 connect_socket(self._iopub_socket, content.iopub)
467 472 self._update_engines(dict(content.engines))
468 473 else:
469 474 self._connected = False
470 475 raise Exception("Failed to connect!")
471 476
472 477 #--------------------------------------------------------------------------
473 478 # handlers and callbacks for incoming messages
474 479 #--------------------------------------------------------------------------
475 480
476 481 def _unwrap_exception(self, content):
477 482 """unwrap exception, and remap engine_id to int."""
478 483 e = error.unwrap_exception(content)
479 484 # print e.traceback
480 485 if e.engine_info:
481 486 e_uuid = e.engine_info['engine_uuid']
482 487 eid = self._engines[e_uuid]
483 488 e.engine_info['engine_id'] = eid
484 489 return e
485 490
486 491 def _extract_metadata(self, header, parent, content):
487 492 md = {'msg_id' : parent['msg_id'],
488 493 'received' : datetime.now(),
489 494 'engine_uuid' : header.get('engine', None),
490 495 'follow' : parent.get('follow', []),
491 496 'after' : parent.get('after', []),
492 497 'status' : content['status'],
493 498 }
494 499
495 500 if md['engine_uuid'] is not None:
496 501 md['engine_id'] = self._engines.get(md['engine_uuid'], None)
497 502
498 503 if 'date' in parent:
499 504 md['submitted'] = parent['date']
500 505 if 'started' in header:
501 506 md['started'] = header['started']
502 507 if 'date' in header:
503 508 md['completed'] = header['date']
504 509 return md
505 510
506 511 def _register_engine(self, msg):
507 512 """Register a new engine, and update our connection info."""
508 513 content = msg['content']
509 514 eid = content['id']
510 515 d = {eid : content['queue']}
511 516 self._update_engines(d)
512 517
513 518 def _unregister_engine(self, msg):
514 519 """Unregister an engine that has died."""
515 520 content = msg['content']
516 521 eid = int(content['id'])
517 522 if eid in self._ids:
518 523 self._ids.remove(eid)
519 524 uuid = self._engines.pop(eid)
520 525
521 526 self._handle_stranded_msgs(eid, uuid)
522 527
523 528 if self._task_socket and self._task_scheme == 'pure':
524 529 self._stop_scheduling_tasks()
525 530
526 531 def _handle_stranded_msgs(self, eid, uuid):
527 532 """Handle messages known to be on an engine when the engine unregisters.
528 533
529 534 It is possible that this will fire prematurely - that is, an engine will
530 535 go down after completing a result, and the client will be notified
531 536 of the unregistration and later receive the successful result.
532 537 """
533 538
534 539 outstanding = self._outstanding_dict[uuid]
535 540
536 541 for msg_id in list(outstanding):
537 542 if msg_id in self.results:
538 543                 # we already have the result
539 544 continue
540 545 try:
541 546 raise error.EngineError("Engine %r died while running task %r"%(eid, msg_id))
542 547 except:
543 548 content = error.wrap_exception()
544 549 # build a fake message:
545 550 parent = {}
546 551 header = {}
547 552 parent['msg_id'] = msg_id
548 553 header['engine'] = uuid
549 554 header['date'] = datetime.now()
550 555 msg = dict(parent_header=parent, header=header, content=content)
551 556 self._handle_apply_reply(msg)
552 557
553 558 def _handle_execute_reply(self, msg):
554 559 """Save the reply to an execute_request into our results.
555 560
556 561 execute messages are never actually used. apply is used instead.
557 562 """
558 563
559 564 parent = msg['parent_header']
560 565 msg_id = parent['msg_id']
561 566 if msg_id not in self.outstanding:
562 567 if msg_id in self.history:
563 568 print ("got stale result: %s"%msg_id)
564 569 else:
565 570 print ("got unknown result: %s"%msg_id)
566 571 else:
567 572 self.outstanding.remove(msg_id)
568 573 self.results[msg_id] = self._unwrap_exception(msg['content'])
569 574
570 575 def _handle_apply_reply(self, msg):
571 576 """Save the reply to an apply_request into our results."""
572 577 parent = msg['parent_header']
573 578 msg_id = parent['msg_id']
574 579 if msg_id not in self.outstanding:
575 580 if msg_id in self.history:
576 581 print ("got stale result: %s"%msg_id)
577 582 print self.results[msg_id]
578 583 print msg
579 584 else:
580 585 print ("got unknown result: %s"%msg_id)
581 586 else:
582 587 self.outstanding.remove(msg_id)
583 588 content = msg['content']
584 589 header = msg['header']
585 590
586 591 # construct metadata:
587 592 md = self.metadata[msg_id]
588 593 md.update(self._extract_metadata(header, parent, content))
589 594 # is this redundant?
590 595 self.metadata[msg_id] = md
591 596
592 597 e_outstanding = self._outstanding_dict[md['engine_uuid']]
593 598 if msg_id in e_outstanding:
594 599 e_outstanding.remove(msg_id)
595 600
596 601 # construct result:
597 602 if content['status'] == 'ok':
598 603 self.results[msg_id] = util.unserialize_object(msg['buffers'])[0]
599 604 elif content['status'] == 'aborted':
600 605 self.results[msg_id] = error.TaskAborted(msg_id)
601 606 elif content['status'] == 'resubmitted':
602 607 # TODO: handle resubmission
603 608 pass
604 609 else:
605 610 self.results[msg_id] = self._unwrap_exception(content)
606 611
607 612 def _flush_notifications(self):
608 613 """Flush notifications of engine registrations waiting
609 614 in ZMQ queue."""
610 615 idents,msg = self.session.recv(self._notification_socket, mode=zmq.NOBLOCK)
611 616 while msg is not None:
612 617 if self.debug:
613 618 pprint(msg)
614 619 msg_type = msg['msg_type']
615 620 handler = self._notification_handlers.get(msg_type, None)
616 621 if handler is None:
617 622                 raise Exception("Unhandled message type: %s"%msg_type)
618 623 else:
619 624 handler(msg)
620 625 idents,msg = self.session.recv(self._notification_socket, mode=zmq.NOBLOCK)
621 626
622 627 def _flush_results(self, sock):
623 628 """Flush task or queue results waiting in ZMQ queue."""
624 629 idents,msg = self.session.recv(sock, mode=zmq.NOBLOCK)
625 630 while msg is not None:
626 631 if self.debug:
627 632 pprint(msg)
628 633 msg_type = msg['msg_type']
629 634 handler = self._queue_handlers.get(msg_type, None)
630 635 if handler is None:
631 636                 raise Exception("Unhandled message type: %s"%msg_type)
632 637 else:
633 638 handler(msg)
634 639 idents,msg = self.session.recv(sock, mode=zmq.NOBLOCK)
635 640
636 641 def _flush_control(self, sock):
637 642 """Flush replies from the control channel waiting
638 643 in the ZMQ queue.
639 644
640 645 Currently: ignore them."""
641 646 if self._ignored_control_replies <= 0:
642 647 return
643 648 idents,msg = self.session.recv(sock, mode=zmq.NOBLOCK)
644 649 while msg is not None:
645 650 self._ignored_control_replies -= 1
646 651 if self.debug:
647 652 pprint(msg)
648 653 idents,msg = self.session.recv(sock, mode=zmq.NOBLOCK)
649 654
650 655 def _flush_ignored_control(self):
651 656 """flush ignored control replies"""
652 657 while self._ignored_control_replies > 0:
653 658 self.session.recv(self._control_socket)
654 659 self._ignored_control_replies -= 1
655 660
656 661 def _flush_ignored_hub_replies(self):
657 662 ident,msg = self.session.recv(self._query_socket, mode=zmq.NOBLOCK)
658 663 while msg is not None:
659 664 ident,msg = self.session.recv(self._query_socket, mode=zmq.NOBLOCK)
660 665
661 666 def _flush_iopub(self, sock):
662 667 """Flush replies from the iopub channel waiting
663 668 in the ZMQ queue.
664 669 """
665 670 idents,msg = self.session.recv(sock, mode=zmq.NOBLOCK)
666 671 while msg is not None:
667 672 if self.debug:
668 673 pprint(msg)
669 674 parent = msg['parent_header']
670 675 msg_id = parent['msg_id']
671 676 content = msg['content']
672 677 header = msg['header']
673 678 msg_type = msg['msg_type']
674 679
675 680 # init metadata:
676 681 md = self.metadata[msg_id]
677 682
678 683 if msg_type == 'stream':
679 684 name = content['name']
680 685 s = md[name] or ''
681 686 md[name] = s + content['data']
682 687 elif msg_type == 'pyerr':
683 688 md.update({'pyerr' : self._unwrap_exception(content)})
684 689 elif msg_type == 'pyin':
685 690 md.update({'pyin' : content['code']})
686 691 else:
687 692 md.update({msg_type : content.get('data', '')})
688 693
689 694             # redundant?
690 695 self.metadata[msg_id] = md
691 696
692 697 idents,msg = self.session.recv(sock, mode=zmq.NOBLOCK)
693 698
694 699 #--------------------------------------------------------------------------
695 700 # len, getitem
696 701 #--------------------------------------------------------------------------
697 702
698 703 def __len__(self):
699 704 """len(client) returns # of engines."""
700 705 return len(self.ids)
701 706
702 707 def __getitem__(self, key):
703 708 """index access returns DirectView multiplexer objects
704 709
705 710 Must be int, slice, or list/tuple/xrange of ints"""
706 711 if not isinstance(key, (int, slice, tuple, list, xrange)):
707 712 raise TypeError("key by int/slice/iterable of ints only, not %s"%(type(key)))
708 713 else:
709 714 return self.direct_view(key)
710 715
711 716 #--------------------------------------------------------------------------
712 717 # Begin public methods
713 718 #--------------------------------------------------------------------------
714 719
715 720 @property
716 721 def ids(self):
717 722 """Always up-to-date ids property."""
718 723 self._flush_notifications()
719 724 # always copy:
720 725 return list(self._ids)
721 726
722 727 def close(self):
723 728 if self._closed:
724 729 return
725 730 snames = filter(lambda n: n.endswith('socket'), dir(self))
726 731 for socket in map(lambda name: getattr(self, name), snames):
727 732 if isinstance(socket, zmq.Socket) and not socket.closed:
728 733 socket.close()
729 734 self._closed = True
730 735
731 736 def spin(self):
732 737 """Flush any registration notifications and execution results
733 738 waiting in the ZMQ queue.
734 739 """
735 740 if self._notification_socket:
736 741 self._flush_notifications()
737 742 if self._mux_socket:
738 743 self._flush_results(self._mux_socket)
739 744 if self._task_socket:
740 745 self._flush_results(self._task_socket)
741 746 if self._control_socket:
742 747 self._flush_control(self._control_socket)
743 748 if self._iopub_socket:
744 749 self._flush_iopub(self._iopub_socket)
745 750 if self._query_socket:
746 751 self._flush_ignored_hub_replies()
747 752
748 753 def wait(self, jobs=None, timeout=-1):
749 754 """waits on one or more `jobs`, for up to `timeout` seconds.
750 755
751 756 Parameters
752 757 ----------
753 758
754 759 jobs : int, str, or list of ints and/or strs, or one or more AsyncResult objects
755 760 ints are indices to self.history
756 761 strs are msg_ids
757 762 default: wait on all outstanding messages
758 763 timeout : float
759 764 a time in seconds, after which to give up.
760 765 default is -1, which means no timeout
761 766
762 767 Returns
763 768 -------
764 769
765 770 True : when all msg_ids are done
766 771 False : timeout reached, some msg_ids still outstanding
767 772 """
768 773 tic = time.time()
769 774 if jobs is None:
770 775 theids = self.outstanding
771 776 else:
772 777 if isinstance(jobs, (int, str, AsyncResult)):
773 778 jobs = [jobs]
774 779 theids = set()
775 780 for job in jobs:
776 781 if isinstance(job, int):
777 782 # index access
778 783 job = self.history[job]
779 784 elif isinstance(job, AsyncResult):
780 785 map(theids.add, job.msg_ids)
781 786 continue
782 787 theids.add(job)
783 788 if not theids.intersection(self.outstanding):
784 789 return True
785 790 self.spin()
786 791 while theids.intersection(self.outstanding):
787 792 if timeout >= 0 and ( time.time()-tic ) > timeout:
788 793 break
789 794 time.sleep(1e-3)
790 795 self.spin()
791 796 return len(theids.intersection(self.outstanding)) == 0
792 797
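# A hedged usage sketch (`rc` is a hypothetical connected Client, `view`/`f`
# are placeholders): block on a batch of submissions with a cap.
#
# ars = [ view.apply_async(f, i) for i in range(10) ]
# if not rc.wait(ars, timeout=30):
#     print "%i tasks still outstanding" % len(rc.outstanding)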
793 798 #--------------------------------------------------------------------------
794 799 # Control methods
795 800 #--------------------------------------------------------------------------
796 801
797 802 @spin_first
798 803 def clear(self, targets=None, block=None):
799 804 """Clear the namespace in target(s)."""
800 805 block = self.block if block is None else block
801 806 targets = self._build_targets(targets)[0]
802 807 for t in targets:
803 808 self.session.send(self._control_socket, 'clear_request', content={}, ident=t)
804 809 error = False
805 810 if block:
806 811 self._flush_ignored_control()
807 812 for i in range(len(targets)):
808 813 idents,msg = self.session.recv(self._control_socket,0)
809 814 if self.debug:
810 815 pprint(msg)
811 816 if msg['content']['status'] != 'ok':
812 817 error = self._unwrap_exception(msg['content'])
813 818 else:
814 819 self._ignored_control_replies += len(targets)
815 820 if error:
816 821 raise error
817 822
818 823
819 824 @spin_first
820 825 def abort(self, jobs=None, targets=None, block=None):
821 826 """Abort specific jobs from the execution queues of target(s).
822 827
823 828 This is a mechanism to prevent jobs that have already been submitted
824 829 from executing.
825 830
826 831 Parameters
827 832 ----------
828 833
829 834 jobs : msg_id, list of msg_ids, or AsyncResult
830 835 The jobs to be aborted
831 836
832 837
833 838 """
834 839 block = self.block if block is None else block
835 840 targets = self._build_targets(targets)[0]
836 841 msg_ids = []
837 842 if isinstance(jobs, (basestring,AsyncResult)):
838 843 jobs = [jobs]
839 844 bad_ids = filter(lambda obj: not isinstance(obj, (basestring, AsyncResult)), jobs)
840 845 if bad_ids:
841 846 raise TypeError("Invalid msg_id type %r, expected str or AsyncResult"%bad_ids[0])
842 847 for j in jobs:
843 848 if isinstance(j, AsyncResult):
844 849 msg_ids.extend(j.msg_ids)
845 850 else:
846 851 msg_ids.append(j)
847 852 content = dict(msg_ids=msg_ids)
848 853 for t in targets:
849 854 self.session.send(self._control_socket, 'abort_request',
850 855 content=content, ident=t)
851 856 error = False
852 857 if block:
853 858 self._flush_ignored_control()
854 859 for i in range(len(targets)):
855 860 idents,msg = self.session.recv(self._control_socket,0)
856 861 if self.debug:
857 862 pprint(msg)
858 863 if msg['content']['status'] != 'ok':
859 864 error = self._unwrap_exception(msg['content'])
860 865 else:
861 866 self._ignored_control_replies += len(targets)
862 867 if error:
863 868 raise error
864 869
865 870 @spin_first
866 871 def shutdown(self, targets=None, restart=False, hub=False, block=None):
867 872 """Terminates one or more engine processes, optionally including the hub."""
868 873 block = self.block if block is None else block
869 874 if hub:
870 875 targets = 'all'
871 876 targets = self._build_targets(targets)[0]
872 877 for t in targets:
873 878 self.session.send(self._control_socket, 'shutdown_request',
874 879 content={'restart':restart},ident=t)
875 880 error = False
876 881 if block or hub:
877 882 self._flush_ignored_control()
878 883 for i in range(len(targets)):
879 884 idents,msg = self.session.recv(self._control_socket, 0)
880 885 if self.debug:
881 886 pprint(msg)
882 887 if msg['content']['status'] != 'ok':
883 888 error = self._unwrap_exception(msg['content'])
884 889 else:
885 890 self._ignored_control_replies += len(targets)
886 891
887 892 if hub:
888 893 time.sleep(0.25)
889 894 self.session.send(self._query_socket, 'shutdown_request')
890 895 idents,msg = self.session.recv(self._query_socket, 0)
891 896 if self.debug:
892 897 pprint(msg)
893 898 if msg['content']['status'] != 'ok':
894 899 error = self._unwrap_exception(msg['content'])
895 900
896 901 if error:
897 902 raise error
898 903
899 904 #--------------------------------------------------------------------------
900 905 # Execution related methods
901 906 #--------------------------------------------------------------------------
902 907
903 908 def _maybe_raise(self, result):
904 909 """wrapper for maybe raising an exception if apply failed."""
905 910 if isinstance(result, error.RemoteError):
906 911 raise result
907 912
908 913 return result
909 914
910 915 def send_apply_message(self, socket, f, args=None, kwargs=None, subheader=None, track=False,
911 916 ident=None):
912 917 """construct and send an apply message via a socket.
913 918
914 919 This is the principal method with which all engine execution is performed by views.
915 920 """
916 921
917 922 assert not self._closed, "cannot use me anymore, I'm closed!"
918 923 # defaults:
919 924 args = args if args is not None else []
920 925 kwargs = kwargs if kwargs is not None else {}
921 926 subheader = subheader if subheader is not None else {}
922 927
923 928 # validate arguments
924 929 if not callable(f):
925 930 raise TypeError("f must be callable, not %s"%type(f))
926 931 if not isinstance(args, (tuple, list)):
927 932 raise TypeError("args must be tuple or list, not %s"%type(args))
928 933 if not isinstance(kwargs, dict):
929 934 raise TypeError("kwargs must be dict, not %s"%type(kwargs))
930 935 if not isinstance(subheader, dict):
931 936 raise TypeError("subheader must be dict, not %s"%type(subheader))
932 937
933 938 bufs = util.pack_apply_message(f,args,kwargs)
934 939
935 940 msg = self.session.send(socket, "apply_request", buffers=bufs, ident=ident,
936 941 subheader=subheader, track=track)
937 942
938 943 msg_id = msg['msg_id']
939 944 self.outstanding.add(msg_id)
940 945 if ident:
941 946 # possibly routed to a specific engine
942 947 if isinstance(ident, list):
943 948 ident = ident[-1]
944 949 if ident in self._engines.values():
945 950 # save for later, in case of engine death
946 951 self._outstanding_dict[ident].add(msg_id)
947 952 self.history.append(msg_id)
948 953 self.metadata[msg_id]['submitted'] = datetime.now()
949 954
950 955 return msg
951 956
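# A hedged sketch only -- views normally call this for you, and it touches
# semi-private attributes (`rc`/`f` are placeholders):
#
# msg = rc.send_apply_message(rc._task_socket, f, args=(1,), kwargs={})
# msg_id = msg['msg_id']  # track via rc.outstanding / rc.results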
952 957 #--------------------------------------------------------------------------
953 958 # construct a View object
954 959 #--------------------------------------------------------------------------
955 960
956 961 def load_balanced_view(self, targets=None):
957 962 """construct a DirectView object.
958 963
959 964 If no arguments are specified, create a LoadBalancedView
960 965 using all engines.
961 966
962 967 Parameters
963 968 ----------
964 969
965 970 targets: list,slice,int,etc. [default: use all engines]
966 971 The subset of engines across which to load-balance
967 972 """
968 973 if targets is not None:
969 974 targets = self._build_targets(targets)[1]
970 975 return LoadBalancedView(client=self, socket=self._task_socket, targets=targets)
971 976
972 977 def direct_view(self, targets='all'):
973 978 """construct a DirectView object.
974 979
975 980 If no targets are specified, create a DirectView
976 981 using all engines.
977 982
978 983 Parameters
979 984 ----------
980 985
981 986 targets: list,slice,int,etc. [default: use all engines]
982 987 The engines to use for the View
983 988 """
984 989 single = isinstance(targets, int)
985 990 targets = self._build_targets(targets)[1]
986 991 if single:
987 992 targets = targets[0]
988 993 return DirectView(client=self, socket=self._mux_socket, targets=targets)
989 994
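# A hedged usage sketch: the usual ways to build views from a connected Client.
#
# rc = Client()
# dview = rc[:]                    # DirectView on all engines, via __getitem__
# pair = rc.direct_view([0, 1])    # DirectView on engines 0 and 1
# lview = rc.load_balanced_view()  # LoadBalancedView across all engines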
990 995 #--------------------------------------------------------------------------
991 996 # Query methods
992 997 #--------------------------------------------------------------------------
993 998
994 999 @spin_first
995 1000 def get_result(self, indices_or_msg_ids=None, block=None):
996 1001 """Retrieve a result by msg_id or history index, wrapped in an AsyncResult object.
997 1002
998 1003 If the client already has the results, no request to the Hub will be made.
999 1004
1000 1005 This is a convenient way to construct AsyncResult objects, which are wrappers
1001 1006 that include metadata about execution, and allow for awaiting results that
1002 1007 were not submitted by this Client.
1003 1008
1004 1009 It can also be a convenient way to retrieve the metadata associated with
1005 1010 blocking execution, since it always retrieves
1006 1011
1007 1012 Examples
1008 1013 --------
1009 1014 ::
1010 1015
1011 1016             In [10]: ar = client.get_result(msg_id)  # a msg_id or history index, e.g. -1
1012 1017
1013 1018 Parameters
1014 1019 ----------
1015 1020
1016 1021 indices_or_msg_ids : integer history index, str msg_id, or list of either
1017 1022         The history indices or msg_ids of the results to be retrieved
1018 1023
1019 1024 block : bool
1020 1025 Whether to wait for the result to be done
1021 1026
1022 1027 Returns
1023 1028 -------
1024 1029
1025 1030 AsyncResult
1026 1031 A single AsyncResult object will always be returned.
1027 1032
1028 1033 AsyncHubResult
1029 1034 A subclass of AsyncResult that retrieves results from the Hub
1030 1035
1031 1036 """
1032 1037 block = self.block if block is None else block
1033 1038 if indices_or_msg_ids is None:
1034 1039 indices_or_msg_ids = -1
1035 1040
1036 1041 if not isinstance(indices_or_msg_ids, (list,tuple)):
1037 1042 indices_or_msg_ids = [indices_or_msg_ids]
1038 1043
1039 1044 theids = []
1040 1045 for id in indices_or_msg_ids:
1041 1046 if isinstance(id, int):
1042 1047 id = self.history[id]
1043 1048 if not isinstance(id, str):
1044 1049 raise TypeError("indices must be str or int, not %r"%id)
1045 1050 theids.append(id)
1046 1051
1047 1052 local_ids = filter(lambda msg_id: msg_id in self.history or msg_id in self.results, theids)
1048 1053 remote_ids = filter(lambda msg_id: msg_id not in local_ids, theids)
1049 1054
1050 1055 if remote_ids:
1051 1056 ar = AsyncHubResult(self, msg_ids=theids)
1052 1057 else:
1053 1058 ar = AsyncResult(self, msg_ids=theids)
1054 1059
1055 1060 if block:
1056 1061 ar.wait()
1057 1062
1058 1063 return ar
1059 1064
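A sketch of `get_result` used to re-fetch results and metadata, assuming a connected Client `rc` with at least one completed task::

    ar = rc[:].apply_async(lambda: 42)   # submit something
    ar.wait()
    ar2 = rc.get_result(-1)              # -1: most recent entry in rc.history
    print ar2.get(), ar2.metadata        # results plus execution metadata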
1060 1065 @spin_first
1061 1066 def resubmit(self, indices_or_msg_ids=None, subheader=None, block=None):
1062 1067 """Resubmit one or more tasks.
1063 1068
1064 1069 In-flight tasks may not be resubmitted.
1065 1070
1066 1071 Parameters
1067 1072 ----------
1068 1073
1069 1074 indices_or_msg_ids : integer history index, str msg_id, or list of either
1070 1075 The history indices or msg_ids of the results to be resubmitted
1071 1076
1072 1077 block : bool
1073 1078 Whether to wait for the result to be done
1074 1079
1075 1080 Returns
1076 1081 -------
1077 1082
1078 1083 AsyncHubResult
1079 1084 A subclass of AsyncResult that retrieves results from the Hub
1080 1085
1081 1086 """
1082 1087 block = self.block if block is None else block
1083 1088 if indices_or_msg_ids is None:
1084 1089 indices_or_msg_ids = -1
1085 1090
1086 1091 if not isinstance(indices_or_msg_ids, (list,tuple)):
1087 1092 indices_or_msg_ids = [indices_or_msg_ids]
1088 1093
1089 1094 theids = []
1090 1095 for id in indices_or_msg_ids:
1091 1096 if isinstance(id, int):
1092 1097 id = self.history[id]
1093 1098 if not isinstance(id, basestring):
1094 1099 raise TypeError("indices must be str or int, not %r"%id)
1095 1100 theids.append(id)
1096 1101
1097 1102 for msg_id in theids:
1098 1103 self.outstanding.discard(msg_id)
1099 1104 if msg_id in self.history:
1100 1105 self.history.remove(msg_id)
1101 1106 self.results.pop(msg_id, None)
1102 1107 self.metadata.pop(msg_id, None)
1103 1108 content = dict(msg_ids = theids)
1104 1109
1105 1110 self.session.send(self._query_socket, 'resubmit_request', content)
1106 1111
1107 1112 zmq.select([self._query_socket], [], [])
1108 1113 idents,msg = self.session.recv(self._query_socket, zmq.NOBLOCK)
1109 1114 if self.debug:
1110 1115 pprint(msg)
1111 1116 content = msg['content']
1112 1117 if content['status'] != 'ok':
1113 1118 raise self._unwrap_exception(content)
1114 1119
1115 1120 ar = AsyncHubResult(self, msg_ids=theids)
1116 1121
1117 1122 if block:
1118 1123 ar.wait()
1119 1124
1120 1125 return ar
1121 1126
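A sketch of resubmission, assuming a connected Client `rc` and a *completed* AsyncResult `ar` (in-flight tasks cannot be resubmitted)::

    ar2 = rc.resubmit(ar.msg_ids)   # re-run the same task(s)
    ar2.get()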
1122 1127 @spin_first
1123 1128 def result_status(self, msg_ids, status_only=True):
1124 1129 """Check on the status of the result(s) of the apply request with `msg_ids`.
1125 1130
1126 1131 If status_only is False, then the actual results will be retrieved, else
1127 1132 only the status of the results will be checked.
1128 1133
1129 1134 Parameters
1130 1135 ----------
1131 1136
1132 1137 msg_ids : list of msg_ids or ints
1133 1138 if int:
1134 1139 Passed as index to self.history for convenience.
1135 1140 status_only : bool (default: True)
1136 1141 if False:
1137 1142 Retrieve the actual results of completed tasks.
1138 1143
1139 1144 Returns
1140 1145 -------
1141 1146
1142 1147 results : dict
1143 1148 There will always be the keys 'pending' and 'completed', which will
1144 1149 be lists of msg_ids that are incomplete or complete. If `status_only`
1145 1150 is False, then completed results will be keyed by their `msg_id`.
1146 1151 """
1147 1152 if not isinstance(msg_ids, (list,tuple)):
1148 1153 msg_ids = [msg_ids]
1149 1154
1150 1155 theids = []
1151 1156 for msg_id in msg_ids:
1152 1157 if isinstance(msg_id, int):
1153 1158 msg_id = self.history[msg_id]
1154 1159 if not isinstance(msg_id, basestring):
1155 1160 raise TypeError("msg_ids must be str, not %r"%msg_id)
1156 1161 theids.append(msg_id)
1157 1162
1158 1163 completed = []
1159 1164 local_results = {}
1160 1165
1161 1166 # comment this block out to temporarily disable local shortcut:
1162 1167 for msg_id in theids[:]: # iterate over a copy, since we mutate theids
1163 1168 if msg_id in self.results:
1164 1169 completed.append(msg_id)
1165 1170 local_results[msg_id] = self.results[msg_id]
1166 1171 theids.remove(msg_id)
1167 1172
1168 1173 if theids: # some not locally cached
1169 1174 content = dict(msg_ids=theids, status_only=status_only)
1170 1175 msg = self.session.send(self._query_socket, "result_request", content=content)
1171 1176 zmq.select([self._query_socket], [], [])
1172 1177 idents,msg = self.session.recv(self._query_socket, zmq.NOBLOCK)
1173 1178 if self.debug:
1174 1179 pprint(msg)
1175 1180 content = msg['content']
1176 1181 if content['status'] != 'ok':
1177 1182 raise self._unwrap_exception(content)
1178 1183 buffers = msg['buffers']
1179 1184 else:
1180 1185 content = dict(completed=[],pending=[])
1181 1186
1182 1187 content['completed'].extend(completed)
1183 1188
1184 1189 if status_only:
1185 1190 return content
1186 1191
1187 1192 failures = []
1188 1193 # load cached results into result:
1189 1194 content.update(local_results)
1190 1195
1191 1196 # update cache with results:
1192 1197 for msg_id in sorted(theids):
1193 1198 if msg_id in content['completed']:
1194 1199 rec = content[msg_id]
1195 1200 parent = rec['header']
1196 1201 header = rec['result_header']
1197 1202 rcontent = rec['result_content']
1198 1203 iodict = rec['io']
1199 1204 if isinstance(rcontent, str):
1200 1205 rcontent = self.session.unpack(rcontent)
1201 1206
1202 1207 md = self.metadata[msg_id]
1203 1208 md.update(self._extract_metadata(header, parent, rcontent))
1204 1209 md.update(iodict)
1205 1210
1206 1211 if rcontent['status'] == 'ok':
1207 1212 res,buffers = util.unserialize_object(buffers)
1208 1213 else:
1209 1214 print rcontent
1210 1215 res = self._unwrap_exception(rcontent)
1211 1216 failures.append(res)
1212 1217
1213 1218 self.results[msg_id] = res
1214 1219 content[msg_id] = res
1215 1220
1216 1221 if len(theids) == 1 and failures:
1217 1222 raise failures[0]
1218 1223
1219 1224 error.collect_exceptions(failures, "result_status")
1220 1225 return content
1221 1226
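A sketch of a status-only query, assuming a connected Client `rc` with some history::

    status = rc.result_status(rc.history, status_only=True)
    print status['pending']     # msg_ids still in flight
    print status['completed']   # msg_ids that have finished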
1222 1227 @spin_first
1223 1228 def queue_status(self, targets='all', verbose=False):
1224 1229 """Fetch the status of engine queues.
1225 1230
1226 1231 Parameters
1227 1232 ----------
1228 1233
1229 1234 targets : int/str/list of ints/strs
1230 1235 the engines whose states are to be queried.
1231 1236 default : all
1232 1237 verbose : bool
1233 1238 Whether to return lengths only, or lists of ids for each element
1234 1239 """
1235 1240 engine_ids = self._build_targets(targets)[1]
1236 1241 content = dict(targets=engine_ids, verbose=verbose)
1237 1242 self.session.send(self._query_socket, "queue_request", content=content)
1238 1243 idents,msg = self.session.recv(self._query_socket, 0)
1239 1244 if self.debug:
1240 1245 pprint(msg)
1241 1246 content = msg['content']
1242 1247 status = content.pop('status')
1243 1248 if status != 'ok':
1244 1249 raise self._unwrap_exception(content)
1245 1250 content = util.rekey(content)
1246 1251 if isinstance(targets, int):
1247 1252 return content[targets]
1248 1253 else:
1249 1254 return content
1250 1255
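A sketch of the queue query, assuming a connected Client `rc`::

    print rc.queue_status()              # dict keyed by engine id
    print rc.queue_status(0)             # int target: just that engine's dict
    print rc.queue_status(verbose=True)  # lists of msg_ids, not just lengths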
1251 1256 @spin_first
1252 1257 def purge_results(self, jobs=[], targets=[]):
1253 1258 """Tell the Hub to forget results.
1254 1259
1255 1260 Individual results can be purged by msg_id, or the entire
1256 1261 history of specific targets can be purged.
1257 1262
1258 1263 Parameters
1259 1264 ----------
1260 1265
1261 1266 jobs : str or list of str or AsyncResult objects
1262 1267 the msg_ids whose results should be forgotten.
1263 1268 targets : int/str/list of ints/strs
1264 1269 The targets, by uuid or int_id, whose entire history is to be purged.
1265 1270 Use `targets='all'` to scrub everything from the Hub's memory.
1266 1271
1267 1272 default : None
1268 1273 """
1269 1274 if not targets and not jobs:
1270 1275 raise ValueError("Must specify at least one of `targets` and `jobs`")
1271 1276 if targets:
1272 1277 targets = self._build_targets(targets)[1]
1273 1278
1274 1279 # construct msg_ids from jobs
1275 1280 msg_ids = []
1276 1281 if isinstance(jobs, (basestring,AsyncResult)):
1277 1282 jobs = [jobs]
1278 1283 bad_ids = filter(lambda obj: not isinstance(obj, (basestring, AsyncResult)), jobs)
1279 1284 if bad_ids:
1280 1285 raise TypeError("Invalid msg_id type %r, expected str or AsyncResult"%bad_ids[0])
1281 1286 for j in jobs:
1282 1287 if isinstance(j, AsyncResult):
1283 1288 msg_ids.extend(j.msg_ids)
1284 1289 else:
1285 1290 msg_ids.append(j)
1286 1291
1287 1292 content = dict(targets=targets, msg_ids=msg_ids)
1288 1293 self.session.send(self._query_socket, "purge_request", content=content)
1289 1294 idents, msg = self.session.recv(self._query_socket, 0)
1290 1295 if self.debug:
1291 1296 pprint(msg)
1292 1297 content = msg['content']
1293 1298 if content['status'] != 'ok':
1294 1299 raise self._unwrap_exception(content)
1295 1300
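A sketch of the purge modes, assuming a connected Client `rc` and an AsyncResult `ar`::

    rc.purge_results(jobs=ar)         # forget specific results by AsyncResult
    rc.purge_results(targets=[0, 1])  # forget everything run on engines 0 and 1
    rc.purge_results(targets='all')   # scrub the Hub's entire memory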
1296 1301 @spin_first
1297 1302 def hub_history(self):
1298 1303 """Get the Hub's history
1299 1304
1300 1305 Just like the Client, the Hub has a history, which is a list of msg_ids.
1301 1306 This will contain the history of all clients, and, depending on configuration,
1302 1307 may contain history across multiple cluster sessions.
1303 1308
1304 1309 Any msg_id returned here is a valid argument to `get_result`.
1305 1310
1306 1311 Returns
1307 1312 -------
1308 1313
1309 1314 msg_ids : list of strs
1310 1315 list of all msg_ids, ordered by task submission time.
1311 1316 """
1312 1317
1313 1318 self.session.send(self._query_socket, "history_request", content={})
1314 1319 idents, msg = self.session.recv(self._query_socket, 0)
1315 1320
1316 1321 if self.debug:
1317 1322 pprint(msg)
1318 1323 content = msg['content']
1319 1324 if content['status'] != 'ok':
1320 1325 raise self._unwrap_exception(content)
1321 1326 else:
1322 1327 return content['history']
1323 1328
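A sketch combining `hub_history` with `get_result`, assuming a connected Client `rc`::

    msg_ids = rc.hub_history()
    if msg_ids:
        ar = rc.get_result(msg_ids[-1])  # any returned id is a valid argument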
1324 1329 @spin_first
1325 1330 def db_query(self, query, keys=None):
1326 1331 """Query the Hub's TaskRecord database
1327 1332
1328 1333 This will return a list of task record dicts that match `query`
1329 1334
1330 1335 Parameters
1331 1336 ----------
1332 1337
1333 1338 query : mongodb query dict
1334 1339 The search dict. See mongodb query docs for details.
1335 1340 keys : list of strs [optional]
1336 1341 The subset of keys to be returned. The default is to fetch everything but buffers.
1337 1342 'msg_id' will *always* be included.
1338 1343 """
1339 1344 if isinstance(keys, basestring):
1340 1345 keys = [keys]
1341 1346 content = dict(query=query, keys=keys)
1342 1347 self.session.send(self._query_socket, "db_request", content=content)
1343 1348 idents, msg = self.session.recv(self._query_socket, 0)
1344 1349 if self.debug:
1345 1350 pprint(msg)
1346 1351 content = msg['content']
1347 1352 if content['status'] != 'ok':
1348 1353 raise self._unwrap_exception(content)
1349 1354
1350 1355 records = content['records']
1351 1356
1352 1357 buffer_lens = content['buffer_lens']
1353 1358 result_buffer_lens = content['result_buffer_lens']
1354 1359 buffers = msg['buffers']
1355 1360 has_bufs = buffer_lens is not None
1356 1361 has_rbufs = result_buffer_lens is not None
1357 1362 for i,rec in enumerate(records):
1358 1363 # relink buffers
1359 1364 if has_bufs:
1360 1365 blen = buffer_lens[i]
1361 1366 rec['buffers'], buffers = buffers[:blen],buffers[blen:]
1362 1367 if has_rbufs:
1363 1368 blen = result_buffer_lens[i]
1364 1369 rec['result_buffers'], buffers = buffers[:blen],buffers[blen:]
1365 1370
1366 1371 return records
1367 1372
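A sketch of a TaskRecord query, assuming a connected Client `rc`; the operators follow MongoDB syntax, and the keys shown ('completed', 'engine_uuid') are illustrative TaskRecord fields::

    records = rc.db_query({'completed': {'$ne': None}},
                          keys=['msg_id', 'completed', 'engine_uuid'])
    for rec in records:
        print rec['msg_id'], rec['completed']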
1368 1373 __all__ = [ 'Client' ]
@@ -1,158 +1,165 b''
1 1 # encoding: utf-8
2 2
3 3 """Classes used in scattering and gathering sequences.
4 4
5 5 Scattering consists of partitioning a sequence and sending the various
6 6 pieces to individual nodes in a cluster.
7
8
9 Authors:
10
11 * Brian Granger
12 * MinRK
13
7 14 """
8 15
9 16 __docformat__ = "restructuredtext en"
10 17
11 18 #-------------------------------------------------------------------------------
12 # Copyright (C) 2008 The IPython Development Team
19 # Copyright (C) 2008-2011 The IPython Development Team
13 20 #
14 21 # Distributed under the terms of the BSD License. The full license is in
15 22 # the file COPYING, distributed as part of this software.
16 23 #-------------------------------------------------------------------------------
17 24
18 25 #-------------------------------------------------------------------------------
19 26 # Imports
20 27 #-------------------------------------------------------------------------------
21 28
22 29 import types
23 30
24 31 from IPython.utils.data import flatten as utils_flatten
25 32
26 33 #-------------------------------------------------------------------------------
27 34 # Figure out which array packages are present and their array types
28 35 #-------------------------------------------------------------------------------
29 36
30 37 arrayModules = []
31 38 try:
32 39 import Numeric
33 40 except ImportError:
34 41 pass
35 42 else:
36 43 arrayModules.append({'module':Numeric, 'type':Numeric.arraytype})
37 44 try:
38 45 import numpy
39 46 except ImportError:
40 47 pass
41 48 else:
42 49 arrayModules.append({'module':numpy, 'type':numpy.ndarray})
43 50 try:
44 51 import numarray
45 52 except ImportError:
46 53 pass
47 54 else:
48 55 arrayModules.append({'module':numarray,
49 56 'type':numarray.numarraycore.NumArray})
50 57
51 58 class Map:
52 59 """A class for partitioning a sequence using a map."""
53 60
54 61 def getPartition(self, seq, p, q):
55 62 """Returns the pth partition of q partitions of seq."""
56 63
57 64 # Test for error conditions here
58 65 if p<0 or p>=q:
59 66 print "No partition exists."
60 67 return
61 68
62 69 remainder = len(seq)%q
63 70 basesize = len(seq)/q
64 71 hi = []
65 72 lo = []
66 73 for n in range(q):
67 74 if n < remainder:
68 75 lo.append(n * (basesize + 1))
69 76 hi.append(lo[-1] + basesize + 1)
70 77 else:
71 78 lo.append(n*basesize + remainder)
72 79 hi.append(lo[-1] + basesize)
73 80
74 81
75 82 result = seq[lo[p]:hi[p]]
76 83 return result
77 84
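A quick illustration of the contiguous partitioning above: ten elements split into q=3 partitions of sizes 4, 3, 3, and reassembled by joinPartitions::

    m = Map()
    parts = [m.getPartition(range(10), p, 3) for p in range(3)]
    # parts == [[0, 1, 2, 3], [4, 5, 6], [7, 8, 9]]
    assert m.joinPartitions(parts) == range(10)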
78 85 def joinPartitions(self, listOfPartitions):
79 86 return self.concatenate(listOfPartitions)
80 87
81 88 def concatenate(self, listOfPartitions):
82 89 testObject = listOfPartitions[0]
83 90 # First see if we have a known array type
84 91 for m in arrayModules:
85 92 #print m
86 93 if isinstance(testObject, m['type']):
87 94 return m['module'].concatenate(listOfPartitions)
88 95 # Next try for Python sequence types
89 96 if isinstance(testObject, (types.ListType, types.TupleType)):
90 97 return utils_flatten(listOfPartitions)
91 98 # If we have scalars, just return listOfPartitions
92 99 return listOfPartitions
93 100
94 101 class RoundRobinMap(Map):
95 102 """Partitions a sequence in a round-robin fashion.
96 103
97 104 This currently does not work!
98 105 """
99 106
100 107 def getPartition(self, seq, p, q):
101 108 # if not isinstance(seq,(list,tuple)):
102 109 # raise NotImplementedError("cannot RR partition type %s"%type(seq))
103 110 return seq[p:len(seq):q]
104 111 #result = []
105 112 #for i in range(p,len(seq),q):
106 113 # result.append(seq[i])
107 114 #return result
108 115
109 116 def joinPartitions(self, listOfPartitions):
110 117 testObject = listOfPartitions[0]
111 118 # First see if we have a known array type
112 119 for m in arrayModules:
113 120 #print m
114 121 if isinstance(testObject, m['type']):
115 122 return self.flatten_array(m['type'], listOfPartitions)
116 123 if isinstance(testObject, (types.ListType, types.TupleType)):
117 124 return self.flatten_list(listOfPartitions)
118 125 return listOfPartitions
119 126
120 127 def flatten_array(self, klass, listOfPartitions):
121 128 test = listOfPartitions[0]
122 129 shape = list(test.shape)
123 130 shape[0] = sum([ p.shape[0] for p in listOfPartitions])
124 131 A = klass(shape)
125 132 N = shape[0]
126 133 q = len(listOfPartitions)
127 134 for p,part in enumerate(listOfPartitions):
128 135 A[p:N:q] = part
129 136 return A
130 137
131 138 def flatten_list(self, listOfPartitions):
132 139 flat = []
133 140 for i in range(len(listOfPartitions[0])):
134 141 flat.extend([ part[i] for part in listOfPartitions if len(part) > i ])
135 142 return flat
136 143 #lengths = [len(x) for x in listOfPartitions]
137 144 #maxPartitionLength = len(listOfPartitions[0])
138 145 #numberOfPartitions = len(listOfPartitions)
139 146 #concat = self.concatenate(listOfPartitions)
140 147 #totalLength = len(concat)
141 148 #result = []
142 149 #for i in range(maxPartitionLength):
143 150 # result.append(concat[i:totalLength:maxPartitionLength])
144 151 # return self.concatenate(listOfPartitions)
145 152
146 153 def mappable(obj):
147 154 """return whether an object is mappable or not."""
148 155 if isinstance(obj, (tuple,list)):
149 156 return True
150 157 for m in arrayModules:
151 158 if isinstance(obj,m['type']):
152 159 return True
153 160 return False
154 161
155 162 dists = {'b':Map,'r':RoundRobinMap}
156 163
157 164
158 165
@@ -1,200 +1,206 b''
1 """Remote Functions and decorators for Views."""
1 """Remote Functions and decorators for Views.
2
3 Authors:
4
5 * Brian Granger
6 * Min RK
7 """
2 8 #-----------------------------------------------------------------------------
3 # Copyright (C) 2010 The IPython Development Team
9 # Copyright (C) 2010-2011 The IPython Development Team
4 10 #
5 11 # Distributed under the terms of the BSD License. The full license is in
6 12 # the file COPYING, distributed as part of this software.
7 13 #-----------------------------------------------------------------------------
8 14
9 15 #-----------------------------------------------------------------------------
10 16 # Imports
11 17 #-----------------------------------------------------------------------------
12 18
13 19 import warnings
14 20
15 21 from IPython.testing.skipdoctest import skip_doctest
16 22
17 23 from . import map as Map
18 24 from .asyncresult import AsyncMapResult
19 25
20 26 #-----------------------------------------------------------------------------
21 27 # Decorators
22 28 #-----------------------------------------------------------------------------
23 29
24 30 @skip_doctest
25 31 def remote(view, block=None, **flags):
26 32 """Turn a function into a remote function.
27 33
28 34 This method can be used for map:
29 35
30 36 In [1]: @remote(view,block=True)
31 37 ...: def func(a):
32 38 ...: pass
33 39 """
34 40
35 41 def remote_function(f):
36 42 return RemoteFunction(view, f, block=block, **flags)
37 43 return remote_function
38 44
39 45 @skip_doctest
40 46 def parallel(view, dist='b', block=None, **flags):
41 47 """Turn a function into a parallel remote function.
42 48
43 49 This method can be used for map:
44 50
45 51 In [1]: @parallel(view, block=True)
46 52 ...: def func(a):
47 53 ...: pass
48 54 """
49 55
50 56 def parallel_function(f):
51 57 return ParallelFunction(view, f, dist=dist, block=block, **flags)
52 58 return parallel_function
53 59
54 60 #--------------------------------------------------------------------------
55 61 # Classes
56 62 #--------------------------------------------------------------------------
57 63
58 64 class RemoteFunction(object):
59 65 """Turn an existing function into a remote function.
60 66
61 67 Parameters
62 68 ----------
63 69
64 70 view : View instance
65 71 The view to be used for execution
66 72 f : callable
67 73 The function to be wrapped into a remote function
68 74 block : bool [default: None]
69 75 Whether to wait for results or not. The default behavior is
70 76 to use the current `block` attribute of `view`
71 77
72 78 **flags : remaining kwargs are passed to View.temp_flags
73 79 """
74 80
75 81 view = None # the remote connection
76 82 func = None # the wrapped function
77 83 block = None # whether to block
78 84 flags = None # dict of extra kwargs for temp_flags
79 85
80 86 def __init__(self, view, f, block=None, **flags):
81 87 self.view = view
82 88 self.func = f
83 89 self.block=block
84 90 self.flags=flags
85 91
86 92 def __call__(self, *args, **kwargs):
87 93 block = self.view.block if self.block is None else self.block
88 94 with self.view.temp_flags(block=block, **self.flags):
89 95 return self.view.apply(self.func, *args, **kwargs)
90 96
91 97
92 98 class ParallelFunction(RemoteFunction):
93 99 """Class for mapping a function to sequences.
94 100
95 101 This will distribute the sequences according to a mapper, and call
96 102 the function on each sub-sequence. If called via map, then the function
97 103 will be called once on each element, rather than on each sub-sequence.
98 104
99 105 Parameters
100 106 ----------
101 107
102 108 view : View instance
103 109 The view to be used for execution
104 110 f : callable
105 111 The function to be wrapped into a remote function
106 112 dist : str [default: 'b']
107 113 The key for which mapObject to use to distribute sequences
108 114 options are:
109 115 * 'b' : use contiguous chunks in order
110 116 * 'r' : use round-robin striping
111 117 block : bool [default: None]
112 118 Whether to wait for results or not. The default behavior is
113 119 to use the current `block` attribute of `view`
114 120 chunksize : int or None
115 121 The size of chunk to use when breaking up sequences in a load-balanced manner
116 122 **flags : remaining kwargs are passed to View.temp_flags
117 123 """
118 124
119 125 chunksize=None
120 126 mapObject=None
121 127
122 128 def __init__(self, view, f, dist='b', block=None, chunksize=None, **flags):
123 129 super(ParallelFunction, self).__init__(view, f, block=block, **flags)
124 130 self.chunksize = chunksize
125 131
126 132 mapClass = Map.dists[dist]
127 133 self.mapObject = mapClass()
128 134
129 135 def __call__(self, *sequences):
130 136 # check that the length of sequences match
131 137 len_0 = len(sequences[0])
132 138 for s in sequences:
133 139 if len(s)!=len_0:
134 140 msg = 'all sequences must have equal length, but %i!=%i'%(len_0,len(s))
135 141 raise ValueError(msg)
136 142 balanced = 'Balanced' in self.view.__class__.__name__
137 143 if balanced:
138 144 if self.chunksize:
139 145 nparts = len_0/self.chunksize + int(len_0%self.chunksize > 0)
140 146 else:
141 147 nparts = len_0
142 148 targets = [None]*nparts
143 149 else:
144 150 if self.chunksize:
145 151 warnings.warn("`chunksize` is ignored unless load balancing", UserWarning)
146 152 # multiplexed:
147 153 targets = self.view.targets
148 154 nparts = len(targets)
149 155
150 156 msg_ids = []
151 157 # my_f = lambda *a: map(self.func, *a)
152 158 client = self.view.client
153 159 for index, t in enumerate(targets):
154 160 args = []
155 161 for seq in sequences:
156 162 part = self.mapObject.getPartition(seq, index, nparts)
157 163 if len(part) == 0:
158 164 continue
159 165 else:
160 166 args.append(part)
161 167 if not args:
162 168 continue
163 169
164 170 # print (args)
165 171 if hasattr(self, '_map'):
166 172 f = map
167 173 args = [self.func]+args
168 174 else:
169 175 f=self.func
170 176
171 177 view = self.view if balanced else client[t]
172 178 with view.temp_flags(block=False, **self.flags):
173 179 ar = view.apply(f, *args)
174 180
175 181 msg_ids.append(ar.msg_ids[0])
176 182
177 183 r = AsyncMapResult(self.view.client, msg_ids, self.mapObject, fname=self.func.__name__)
178 184
179 185 if self.block:
180 186 try:
181 187 return r.get()
182 188 except KeyboardInterrupt:
183 189 return r
184 190 else:
185 191 return r
186 192
187 193 def map(self, *sequences):
188 194 """call a function on each element of a sequence remotely.
189 195 This should behave very much like the builtin map, but return an AsyncMapResult
190 196 if self.block is False.
191 197 """
192 198 # set _map as a flag for use inside self.__call__
193 199 self._map = True
194 200 try:
195 201 ret = self.__call__(*sequences)
196 202 finally:
197 203 del self._map
198 204 return ret
199 205
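A sketch of both wrappers in use, assuming a DirectView `view` obtained from an existing Client::

    @remote(view, block=True)
    def getpid():
        import os
        return os.getpid()

    @parallel(view, block=True)
    def echo(x):
        return x            # called once per sub-sequence

    pids = getpid()         # the whole call runs on each engine
    echo(range(8))          # each engine receives a contiguous chunk
    echo.map(range(8))      # elementwise, like the builtin map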
200 206 __all__ = ['remote', 'parallel', 'RemoteFunction', 'ParallelFunction']
@@ -1,1041 +1,1046 b''
1 """Views of remote engines."""
1 """Views of remote engines.
2
3 Authors:
4
5 * Min RK
6 """
2 7 #-----------------------------------------------------------------------------
3 # Copyright (C) 2010 The IPython Development Team
8 # Copyright (C) 2010-2011 The IPython Development Team
4 9 #
5 10 # Distributed under the terms of the BSD License. The full license is in
6 11 # the file COPYING, distributed as part of this software.
7 12 #-----------------------------------------------------------------------------
8 13
9 14 #-----------------------------------------------------------------------------
10 15 # Imports
11 16 #-----------------------------------------------------------------------------
12 17
13 18 import imp
14 19 import sys
15 20 import warnings
16 21 from contextlib import contextmanager
17 22 from types import ModuleType
18 23
19 24 import zmq
20 25
21 26 from IPython.testing.skipdoctest import skip_doctest
22 27 from IPython.utils.traitlets import HasTraits, Any, Bool, List, Dict, Set, Int, Instance, CFloat, CInt
23 28 from IPython.external.decorator import decorator
24 29
25 30 from IPython.parallel import util
26 31 from IPython.parallel.controller.dependency import Dependency, dependent
27 32
28 33 from . import map as Map
29 34 from .asyncresult import AsyncResult, AsyncMapResult
30 35 from .remotefunction import ParallelFunction, parallel, remote
31 36
32 37 #-----------------------------------------------------------------------------
33 38 # Decorators
34 39 #-----------------------------------------------------------------------------
35 40
36 41 @decorator
37 42 def save_ids(f, self, *args, **kwargs):
38 43 """Keep our history and outstanding attributes up to date after a method call."""
39 44 n_previous = len(self.client.history)
40 45 try:
41 46 ret = f(self, *args, **kwargs)
42 47 finally:
43 48 nmsgs = len(self.client.history) - n_previous
44 49 msg_ids = self.client.history[-nmsgs:]
45 50 self.history.extend(msg_ids)
46 51 map(self.outstanding.add, msg_ids)
47 52 return ret
48 53
49 54 @decorator
50 55 def sync_results(f, self, *args, **kwargs):
51 56 """sync relevant results from self.client to our results attribute."""
52 57 ret = f(self, *args, **kwargs)
53 58 delta = self.outstanding.difference(self.client.outstanding)
54 59 completed = self.outstanding.intersection(delta)
55 60 self.outstanding = self.outstanding.difference(completed)
56 61 for msg_id in completed:
57 62 self.results[msg_id] = self.client.results[msg_id]
58 63 return ret
59 64
60 65 @decorator
61 66 def spin_after(f, self, *args, **kwargs):
62 67 """call spin after the method."""
63 68 ret = f(self, *args, **kwargs)
64 69 self.spin()
65 70 return ret
66 71
67 72 #-----------------------------------------------------------------------------
68 73 # Classes
69 74 #-----------------------------------------------------------------------------
70 75
71 76 @skip_doctest
72 77 class View(HasTraits):
73 78 """Base View class for more convenient apply(f,*args,**kwargs) syntax via attributes.
74 79
75 80 Don't use this class, use subclasses.
76 81
77 82 Methods
78 83 -------
79 84
80 85 spin
81 86 flushes incoming results and registration state changes
82 87 control methods spin as well, and requesting `ids` also ensures the state is up to date
83 88
84 89 wait
85 90 wait on one or more msg_ids
86 91
87 92 execution methods
88 93 apply
89 94 legacy: execute, run
90 95
91 96 data movement
92 97 push, pull, scatter, gather
93 98
94 99 query methods
95 100 get_result, queue_status, purge_results, result_status
96 101
97 102 control methods
98 103 abort, shutdown
99 104
100 105 """
101 106 # flags
102 107 block=Bool(False)
103 108 track=Bool(True)
104 109 targets = Any()
105 110
106 111 history=List()
107 112 outstanding = Set()
108 113 results = Dict()
109 114 client = Instance('IPython.parallel.Client')
110 115
111 116 _socket = Instance('zmq.Socket')
112 117 _flag_names = List(['targets', 'block', 'track'])
113 118 _targets = Any()
114 119 _idents = Any()
115 120
116 121 def __init__(self, client=None, socket=None, **flags):
117 122 super(View, self).__init__(client=client, _socket=socket)
118 123 self.block = client.block
119 124
120 125 self.set_flags(**flags)
121 126
122 127 assert not self.__class__ is View, "Don't use base View objects, use subclasses"
123 128
124 129
125 130 def __repr__(self):
126 131 strtargets = str(self.targets)
127 132 if len(strtargets) > 16:
128 133 strtargets = strtargets[:12]+'...]'
129 134 return "<%s %s>"%(self.__class__.__name__, strtargets)
130 135
131 136 def set_flags(self, **kwargs):
132 137 """set my attribute flags by keyword.
133 138
134 139 Views determine behavior with a few attributes (`block`, `track`, etc.).
135 140 These attributes can be set all at once by name with this method.
136 141
137 142 Parameters
138 143 ----------
139 144
140 145 block : bool
141 146 whether to wait for results
142 147 track : bool
143 148 whether to create a MessageTracker to allow the user to
144 149 safely edit arrays and buffers after non-copying
145 150 sends.
146 151 """
147 152 for name, value in kwargs.iteritems():
148 153 if name not in self._flag_names:
149 154 raise KeyError("Invalid name: %r"%name)
150 155 else:
151 156 setattr(self, name, value)
152 157
153 158 @contextmanager
154 159 def temp_flags(self, **kwargs):
155 160 """temporarily set flags, for use in `with` statements.
156 161
157 162 See set_flags for permanent setting of flags
158 163
159 164 Examples
160 165 --------
161 166
162 167 >>> view.track=False
163 168 ...
164 169 >>> with view.temp_flags(track=True):
165 170 ... ar = view.apply(dostuff, my_big_array)
166 171 ... ar.tracker.wait() # wait for send to finish
167 172 >>> view.track
168 173 False
169 174
170 175 """
171 176 # preflight: save flags, and set temporaries
172 177 saved_flags = {}
173 178 for f in self._flag_names:
174 179 saved_flags[f] = getattr(self, f)
175 180 self.set_flags(**kwargs)
176 181 # yield to the with-statement block
177 182 try:
178 183 yield
179 184 finally:
180 185 # postflight: restore saved flags
181 186 self.set_flags(**saved_flags)
182 187
183 188
184 189 #----------------------------------------------------------------
185 190 # apply
186 191 #----------------------------------------------------------------
187 192
188 193 @sync_results
189 194 @save_ids
190 195 def _really_apply(self, f, args, kwargs, block=None, **options):
191 196 """wrapper for client.send_apply_message"""
192 197 raise NotImplementedError("Implement in subclasses")
193 198
194 199 def apply(self, f, *args, **kwargs):
195 200 """calls f(*args, **kwargs) on remote engines, returning the result.
196 201
197 202 This method sets all apply flags via this View's attributes.
198 203
199 204 if self.block is False:
200 205 returns AsyncResult
201 206 else:
202 207 returns actual result of f(*args, **kwargs)
203 208 """
204 209 return self._really_apply(f, args, kwargs)
205 210
206 211 def apply_async(self, f, *args, **kwargs):
207 212 """calls f(*args, **kwargs) on remote engines in a nonblocking manner.
208 213
209 214 returns AsyncResult
210 215 """
211 216 return self._really_apply(f, args, kwargs, block=False)
212 217
213 218 @spin_after
214 219 def apply_sync(self, f, *args, **kwargs):
215 220 """calls f(*args, **kwargs) on remote engines in a blocking manner,
216 221 returning the result.
217 222
218 223 returns: actual result of f(*args, **kwargs)
219 224 """
220 225 return self._really_apply(f, args, kwargs, block=True)
221 226
222 227 #----------------------------------------------------------------
223 228 # wrappers for client and control methods
224 229 #----------------------------------------------------------------
225 230 @sync_results
226 231 def spin(self):
227 232 """spin the client, and sync"""
228 233 self.client.spin()
229 234
230 235 @sync_results
231 236 def wait(self, jobs=None, timeout=-1):
232 237 """waits on one or more `jobs`, for up to `timeout` seconds.
233 238
234 239 Parameters
235 240 ----------
236 241
237 242 jobs : int, str, or list of ints and/or strs, or one or more AsyncResult objects
238 243 ints are indices to self.history
239 244 strs are msg_ids
240 245 default: wait on all outstanding messages
241 246 timeout : float
242 247 a time in seconds, after which to give up.
243 248 default is -1, which means no timeout
244 249
245 250 Returns
246 251 -------
247 252
248 253 True : when all msg_ids are done
249 254 False : timeout reached, some msg_ids still outstanding
250 255 """
251 256 if jobs is None:
252 257 jobs = self.history
253 258 return self.client.wait(jobs, timeout)
254 259
255 260 def abort(self, jobs=None, targets=None, block=None):
256 261 """Abort jobs on my engines.
257 262
258 263 Parameters
259 264 ----------
260 265
261 266 jobs : None, str, list of strs, optional
262 267 if None: abort all jobs.
263 268 else: abort specific msg_id(s).
264 269 """
265 270 block = block if block is not None else self.block
266 271 targets = targets if targets is not None else self.targets
267 272 return self.client.abort(jobs=jobs, targets=targets, block=block)
268 273
269 274 def queue_status(self, targets=None, verbose=False):
270 275 """Fetch the Queue status of my engines"""
271 276 targets = targets if targets is not None else self.targets
272 277 return self.client.queue_status(targets=targets, verbose=verbose)
273 278
274 279 def purge_results(self, jobs=[], targets=[]):
275 280 """Instruct the controller to forget specific results."""
276 281 if targets is None or targets == 'all':
277 282 targets = self.targets
278 283 return self.client.purge_results(jobs=jobs, targets=targets)
279 284
280 285 def shutdown(self, targets=None, restart=False, hub=False, block=None):
281 286 """Terminates one or more engine processes, optionally including the hub.
282 287 """
283 288 block = self.block if block is None else block
284 289 if targets is None or targets == 'all':
285 290 targets = self.targets
286 291 return self.client.shutdown(targets=targets, restart=restart, hub=hub, block=block)
287 292
288 293 @spin_after
289 294 def get_result(self, indices_or_msg_ids=None):
290 295 """return one or more results, specified by history index or msg_id.
291 296
292 297 See client.get_result for details.
293 298
294 299 """
295 300
296 301 if indices_or_msg_ids is None:
297 302 indices_or_msg_ids = -1
298 303 if isinstance(indices_or_msg_ids, int):
299 304 indices_or_msg_ids = self.history[indices_or_msg_ids]
300 305 elif isinstance(indices_or_msg_ids, (list,tuple,set)):
301 306 indices_or_msg_ids = list(indices_or_msg_ids)
302 307 for i,index in enumerate(indices_or_msg_ids):
303 308 if isinstance(index, int):
304 309 indices_or_msg_ids[i] = self.history[index]
305 310 return self.client.get_result(indices_or_msg_ids)
306 311
307 312 #-------------------------------------------------------------------
308 313 # Map
309 314 #-------------------------------------------------------------------
310 315
311 316 def map(self, f, *sequences, **kwargs):
312 317 """override in subclasses"""
313 318 raise NotImplementedError
314 319
315 320 def map_async(self, f, *sequences, **kwargs):
316 321 """Parallel version of builtin `map`, using this view's engines.
317 322
318 323 This is equivalent to map(...block=False)
319 324
320 325 See `self.map` for details.
321 326 """
322 327 if 'block' in kwargs:
323 328 raise TypeError("map_async doesn't take a `block` keyword argument.")
324 329 kwargs['block'] = False
325 330 return self.map(f,*sequences,**kwargs)
326 331
327 332 def map_sync(self, f, *sequences, **kwargs):
328 333 """Parallel version of builtin `map`, using this view's engines.
329 334
330 335 This is equivalent to map(...block=True)
331 336
332 337 See `self.map` for details.
333 338 """
334 339 if 'block' in kwargs:
335 340 raise TypeError("map_sync doesn't take a `block` keyword argument.")
336 341 kwargs['block'] = True
337 342 return self.map(f,*sequences,**kwargs)
338 343
339 344 def imap(self, f, *sequences, **kwargs):
340 345 """Parallel version of `itertools.imap`.
341 346
342 347 See `self.map` for details.
343 348
344 349 """
345 350
346 351 return iter(self.map_async(f,*sequences, **kwargs))
347 352
348 353 #-------------------------------------------------------------------
349 354 # Decorators
350 355 #-------------------------------------------------------------------
351 356
352 357 def remote(self, block=True, **flags):
353 358 """Decorator for making a RemoteFunction"""
354 359 block = self.block if block is None else block
355 360 return remote(self, block=block, **flags)
356 361
357 362 def parallel(self, dist='b', block=None, **flags):
358 363 """Decorator for making a ParallelFunction"""
359 364 block = self.block if block is None else block
360 365 return parallel(self, dist=dist, block=block, **flags)
361 366
362 367 @skip_doctest
363 368 class DirectView(View):
364 369 """Direct Multiplexer View of one or more engines.
365 370
366 371 These are created via indexed access to a client:
367 372
368 373 >>> dv_1 = client[1]
369 374 >>> dv_all = client[:]
370 375 >>> dv_even = client[::2]
371 376 >>> dv_some = client[1:3]
372 377
373 378 This object provides dictionary access to engine namespaces:
374 379
375 380 # push a=5:
376 381 >>> dv['a'] = 5
377 382 # pull 'foo':
378 383 >>> dv['foo']
379 384
380 385 """
381 386
382 387 def __init__(self, client=None, socket=None, targets=None):
383 388 super(DirectView, self).__init__(client=client, socket=socket, targets=targets)
384 389
385 390 @property
386 391 def importer(self):
387 392 """sync_imports(local=True) as a property.
388 393
389 394 See sync_imports for details.
390 395
391 396 """
392 397 return self.sync_imports(True)
393 398
394 399 @contextmanager
395 400 def sync_imports(self, local=True):
396 401 """Context Manager for performing simultaneous local and remote imports.
397 402
398 403 'import x as y' will *not* work. The 'as y' part will simply be ignored.
399 404
400 405 >>> with view.sync_imports():
401 406 ... from numpy import recarray
402 407 importing recarray from numpy on engine(s)
403 408
404 409 """
405 410 import __builtin__
406 411 local_import = __builtin__.__import__
407 412 modules = set()
408 413 results = []
409 414 @util.interactive
410 415 def remote_import(name, fromlist, level):
411 416 """the function to be passed to apply, that actually performs the import
412 417 on the engine, and loads up the user namespace.
413 418 """
414 419 import sys
415 420 user_ns = globals()
416 421 mod = __import__(name, fromlist=fromlist, level=level)
417 422 if fromlist:
418 423 for key in fromlist:
419 424 user_ns[key] = getattr(mod, key)
420 425 else:
421 426 user_ns[name] = sys.modules[name]
422 427
423 428 def view_import(name, globals={}, locals={}, fromlist=[], level=-1):
424 429 """the drop-in replacement for __import__, that optionally imports
425 430 locally as well.
426 431 """
427 432 # don't override nested imports
428 433 save_import = __builtin__.__import__
429 434 __builtin__.__import__ = local_import
430 435
431 436 if imp.lock_held():
432 437 # this is a side-effect import, don't do it remotely, or even
433 438 # ignore the local effects
434 439 return local_import(name, globals, locals, fromlist, level)
435 440
436 441 imp.acquire_lock()
437 442 if local:
438 443 mod = local_import(name, globals, locals, fromlist, level)
439 444 else:
440 445 raise NotImplementedError("remote-only imports not yet implemented")
441 446 imp.release_lock()
442 447
443 448 key = name+':'+','.join(fromlist or [])
444 449 if level == -1 and key not in modules:
445 450 modules.add(key)
446 451 if fromlist:
447 452 print "importing %s from %s on engine(s)"%(','.join(fromlist), name)
448 453 else:
449 454 print "importing %s on engine(s)"%name
450 455 results.append(self.apply_async(remote_import, name, fromlist, level))
451 456 # restore override
452 457 __builtin__.__import__ = save_import
453 458
454 459 return mod
455 460
456 461 # override __import__
457 462 __builtin__.__import__ = view_import
458 463 try:
459 464 # enter the block
460 465 yield
461 466 except ImportError:
462 467 if not local:
463 468 # ignore import errors if not doing local imports
464 469 pass
465 470 finally:
466 471 # always restore __import__
467 472 __builtin__.__import__ = local_import
468 473
469 474 for r in results:
470 475 # raise possible remote ImportErrors here
471 476 r.get()
472 477
473 478
474 479 @sync_results
475 480 @save_ids
476 481 def _really_apply(self, f, args=None, kwargs=None, targets=None, block=None, track=None):
477 482 """calls f(*args, **kwargs) on remote engines, returning the result.
478 483
479 484 This method sets all of `apply`'s flags via this View's attributes.
480 485
481 486 Parameters
482 487 ----------
483 488
484 489 f : callable
485 490
486 491 args : list [default: empty]
487 492
488 493 kwargs : dict [default: empty]
489 494
490 495 targets : target list [default: self.targets]
491 496 where to run
492 497 block : bool [default: self.block]
493 498 whether to block
494 499 track : bool [default: self.track]
495 500 whether to ask zmq to track the message, for safe non-copying sends
496 501
497 502 Returns
498 503 -------
499 504
500 505 if self.block is False:
501 506 returns AsyncResult
502 507 else:
503 508 returns actual result of f(*args, **kwargs) on the engine(s)
504 509 This will be a list if self.targets is also a list (even of length 1), or
505 510 the single result if self.targets is an integer engine id
506 511 """
507 512 args = [] if args is None else args
508 513 kwargs = {} if kwargs is None else kwargs
509 514 block = self.block if block is None else block
510 515 track = self.track if track is None else track
511 516 targets = self.targets if targets is None else targets
512 517
513 518 _idents = self.client._build_targets(targets)[0]
514 519 msg_ids = []
515 520 trackers = []
516 521 for ident in _idents:
517 522 msg = self.client.send_apply_message(self._socket, f, args, kwargs, track=track,
518 523 ident=ident)
519 524 if track:
520 525 trackers.append(msg['tracker'])
521 526 msg_ids.append(msg['msg_id'])
522 527 tracker = None if track is False else zmq.MessageTracker(*trackers)
523 528 ar = AsyncResult(self.client, msg_ids, fname=f.__name__, targets=targets, tracker=tracker)
524 529 if block:
525 530 try:
526 531 return ar.get()
527 532 except KeyboardInterrupt:
528 533 pass
529 534 return ar
530 535
531 536 @spin_after
532 537 def map(self, f, *sequences, **kwargs):
533 538 """view.map(f, *sequences, block=self.block) => list|AsyncMapResult
534 539
535 540 Parallel version of builtin `map`, using this View's `targets`.
536 541
537 542 There will be one task per target, so work will be chunked
538 543 if the sequences are longer than `targets`.
539 544
540 545 Results can be iterated as they are ready, but will become available in chunks.
541 546
542 547 Parameters
543 548 ----------
544 549
545 550 f : callable
546 551 function to be mapped
547 552 *sequences: one or more sequences of matching length
548 553 the sequences to be distributed and passed to `f`
549 554 block : bool
550 555 whether to wait for the result or not [default self.block]
551 556
552 557 Returns
553 558 -------
554 559
555 560 if block=False:
556 561 AsyncMapResult
557 562 An object like AsyncResult, but which reassembles the sequence of results
558 563 into a single list. AsyncMapResults can be iterated through before all
559 564 results are complete.
560 565 else:
561 566 list
562 567 the result of map(f,*sequences)
563 568 """
564 569
565 570 block = kwargs.pop('block', self.block)
566 571 for k in kwargs.keys():
567 572 if k not in ['block', 'track']:
568 573 raise TypeError("invalid keyword arg, %r"%k)
569 574
570 575 assert len(sequences) > 0, "must have some sequences to map onto!"
571 576 pf = ParallelFunction(self, f, block=block, **kwargs)
572 577 return pf.map(*sequences)
573 578
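A sketch of the chunked map above, assuming a DirectView `dview` spanning several engines::

    squares = dview.map_sync(lambda x: x ** 2, range(32))  # one chunk per engine
    amr = dview.map_async(lambda x: x ** 2, range(32))
    for value in amr:        # results become available chunk by chunk
        print value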
574 579 def execute(self, code, targets=None, block=None):
575 580 """Executes `code` on `targets` in blocking or nonblocking manner.
576 581
577 582 ``execute`` is always `bound` (affects engine namespace)
578 583
579 584 Parameters
580 585 ----------
581 586
582 587 code : str
583 588 the code string to be executed
584 589 block : bool
585 590 whether or not to wait until done to return
586 591 default: self.block
587 592 """
588 593 return self._really_apply(util._execute, args=(code,), block=block, targets=targets)
589 594
590 595 def run(self, filename, targets=None, block=None):
591 596 """Execute contents of `filename` on my engine(s).
592 597
593 598 This simply reads the contents of the file and calls `execute`.
594 599
595 600 Parameters
596 601 ----------
597 602
598 603 filename : str
599 604 The path to the file
600 605 targets : int/str/list of ints/strs
601 606 the engines on which to execute
602 607 default : all
603 608 block : bool
604 609 whether or not to wait until done
605 610 default: self.block
606 611
607 612 """
608 613 with open(filename, 'r') as f:
609 614 # add newline in case of trailing indented whitespace
610 615 # which will cause SyntaxError
611 616 code = f.read()+'\n'
612 617 return self.execute(code, block=block, targets=targets)
613 618
614 619 def update(self, ns):
615 620 """update remote namespace with dict `ns`
616 621
617 622 See `push` for details.
618 623 """
619 624 return self.push(ns, block=self.block, track=self.track)
620 625
621 626 def push(self, ns, targets=None, block=None, track=None):
622 627 """update remote namespace with dict `ns`
623 628
624 629 Parameters
625 630 ----------
626 631
627 632 ns : dict
628 633 dict of keys with which to update engine namespace(s)
629 634 block : bool [default : self.block]
630 635 whether to wait to be notified of engine receipt
631 636
632 637 """
633 638
634 639 block = block if block is not None else self.block
635 640 track = track if track is not None else self.track
636 641 targets = targets if targets is not None else self.targets
637 642 # applier = self.apply_sync if block else self.apply_async
638 643 if not isinstance(ns, dict):
639 644 raise TypeError("Must be a dict, not %s"%type(ns))
640 645 return self._really_apply(util._push, (ns,), block=block, track=track, targets=targets)
641 646
642 647 def get(self, key_s):
643 648 """get object(s) by `key_s` from remote namespace
644 649
645 650 see `pull` for details.
646 651 """
647 652 # block = block if block is not None else self.block
648 653 return self.pull(key_s, block=True)
649 654
650 655 def pull(self, names, targets=None, block=None):
651 656 """get object(s) by `name` from remote namespace
652 657
653 658 will return one object if it is a key.
654 659 can also take a list of keys, in which case it will return a list of objects.
655 660 """
656 661 block = block if block is not None else self.block
657 662 targets = targets if targets is not None else self.targets
658 663 applier = self.apply_sync if block else self.apply_async
659 664 if isinstance(names, basestring):
660 665 pass
661 666 elif isinstance(names, (list,tuple,set)):
662 667 for key in names:
663 668 if not isinstance(key, basestring):
664 669 raise TypeError("keys must be str, not type %r"%type(key))
665 670 else:
666 671 raise TypeError("names must be strs, not %r"%names)
667 672 return self._really_apply(util._pull, (names,), block=block, targets=targets)
668 673
669 674 def scatter(self, key, seq, dist='b', flatten=False, targets=None, block=None, track=None):
670 675 """
671 676 Partition a Python sequence and send the partitions to a set of engines.
672 677 """
673 678 block = block if block is not None else self.block
674 679 track = track if track is not None else self.track
675 680 targets = targets if targets is not None else self.targets
676 681
677 682 mapObject = Map.dists[dist]()
678 683 nparts = len(targets)
679 684 msg_ids = []
680 685 trackers = []
681 686 for index, engineid in enumerate(targets):
682 687 partition = mapObject.getPartition(seq, index, nparts)
683 688 if flatten and len(partition) == 1:
684 689 ns = {key: partition[0]}
685 690 else:
686 691 ns = {key: partition}
687 692 r = self.push(ns, block=False, track=track, targets=engineid)
688 693 msg_ids.extend(r.msg_ids)
689 694 if track:
690 695 trackers.append(r._tracker)
691 696
692 697 if track:
693 698 tracker = zmq.MessageTracker(*trackers)
694 699 else:
695 700 tracker = None
696 701
697 702 r = AsyncResult(self.client, msg_ids, fname='scatter', targets=targets, tracker=tracker)
698 703 if block:
699 704 r.wait()
700 705 else:
701 706 return r
702 707
703 708 @sync_results
704 709 @save_ids
705 710 def gather(self, key, dist='b', targets=None, block=None):
706 711 """
707 712 Gather a partitioned sequence on a set of engines as a single local seq.
708 713 """
709 714 block = block if block is not None else self.block
710 715 targets = targets if targets is not None else self.targets
711 716 mapObject = Map.dists[dist]()
712 717 msg_ids = []
713 718
714 719 for index, engineid in enumerate(targets):
715 720 msg_ids.extend(self.pull(key, block=False, targets=engineid).msg_ids)
716 721
717 722 r = AsyncMapResult(self.client, msg_ids, mapObject, fname='gather')
718 723
719 724 if block:
720 725 try:
721 726 return r.get()
722 727 except KeyboardInterrupt:
723 728 pass
724 729 return r
725 730
726 731 def __getitem__(self, key):
727 732 return self.get(key)
728 733
729 734 def __setitem__(self,key, value):
730 735 self.update({key:value})
731 736
732 737 def clear(self, targets=None, block=None):
733 738 """Clear the remote namespaces on my engines."""
734 739 block = block if block is not None else self.block
735 740 targets = targets if targets is not None else self.targets
736 741 return self.client.clear(targets=targets, block=block)
737 742
738 743 def kill(self, targets=None, block=None):
739 744 """Kill my engines."""
740 745 block = block if block is not None else self.block
741 746 targets = targets if targets is not None else self.targets
742 747 return self.client.kill(targets=targets, block=block)
743 748
744 749 #----------------------------------------
745 750 # activate for %px,%autopx magics
746 751 #----------------------------------------
747 752 def activate(self):
748 753 """Make this `View` active for parallel magic commands.
749 754
750 755 IPython has a magic command syntax to work with `MultiEngineClient` objects.
751 756 In a given IPython session there is a single active one. While
752 757 there can be many `Views` created and used by the user,
753 758 there is only one active one. The active `View` is used whenever
754 759 the magic commands %px and %autopx are used.
755 760
756 761 The activate() method is called on a given `View` to make it
757 762 active. Once this has been done, the magic commands can be used.
758 763 """
759 764
760 765 try:
761 766 # This is injected into __builtins__.
762 767 ip = get_ipython()
763 768 except NameError:
764 769 print "The IPython parallel magics (%result, %px, %autopx) only work within IPython."
765 770 else:
766 771 pmagic = ip.plugin_manager.get_plugin('parallelmagic')
767 772 if pmagic is None:
768 773 ip.magic_load_ext('parallelmagic')
769 774 pmagic = ip.plugin_manager.get_plugin('parallelmagic')
770 775
771 776 pmagic.active_view = self
772 777
773 778
774 779 @skip_doctest
775 780 class LoadBalancedView(View):
776 781 """A load-balancing View that only executes via the Task scheduler.
777 782
778 783 Load-balanced views can be created with the client's `view` method:
779 784
780 785 >>> v = client.load_balanced_view()
781 786
782 787 or targets can be specified, to restrict the potential destinations:
783 788
784 789 >>> v = client.load_balanced_view([1,3])
785 790
786 791 which would restrict load-balancing to engines 1 and 3.
787 792
788 793 """
789 794
790 795 follow=Any()
791 796 after=Any()
792 797 timeout=CFloat()
793 798 retries = CInt(0)
794 799
795 800 _task_scheme = Any()
796 801 _flag_names = List(['targets', 'block', 'track', 'follow', 'after', 'timeout', 'retries'])
797 802
798 803 def __init__(self, client=None, socket=None, **flags):
799 804 super(LoadBalancedView, self).__init__(client=client, socket=socket, **flags)
800 805 self._task_scheme=client._task_scheme
801 806
802 807 def _validate_dependency(self, dep):
803 808 """validate a dependency.
804 809
805 810 For use in `set_flags`.
806 811 """
807 812 if dep is None or isinstance(dep, (str, AsyncResult, Dependency)):
808 813 return True
809 814 elif isinstance(dep, (list,set, tuple)):
810 815 for d in dep:
811 816 if not isinstance(d, (str, AsyncResult)):
812 817 return False
813 818 elif isinstance(dep, dict):
814 819 if set(dep.keys()) != set(Dependency().as_dict().keys()):
815 820 return False
816 821 if not isinstance(dep['msg_ids'], list):
817 822 return False
818 823 for d in dep['msg_ids']:
819 824 if not isinstance(d, str):
820 825 return False
821 826 else:
822 827 return False
823 828
824 829 return True
825 830
826 831 def _render_dependency(self, dep):
827 832 """helper for building jsonable dependencies from various input forms."""
828 833 if isinstance(dep, Dependency):
829 834 return dep.as_dict()
830 835 elif isinstance(dep, AsyncResult):
831 836 return dep.msg_ids
832 837 elif dep is None:
833 838 return []
834 839 else:
835 840 # pass to Dependency constructor
836 841 return list(Dependency(dep))
837 842
838 843 def set_flags(self, **kwargs):
839 844 """set my attribute flags by keyword.
840 845
841 846 A View is a wrapper for the Client's apply method, but with attributes
842 847 that specify keyword arguments, those attributes can be set by keyword
843 848 argument with this method.
844 849
845 850 Parameters
846 851 ----------
847 852
848 853 block : bool
849 854 whether to wait for results
850 855 track : bool
851 856 whether to create a MessageTracker to allow the user to
852 857 safely edit arrays and buffers after non-copying
853 858 sends.
854 859
855 860 after : Dependency or collection of msg_ids
856 861 Only for load-balanced execution (targets=None)
857 862 Specify a list of msg_ids as a time-based dependency.
858 863 This job will only be run *after* the dependencies
859 864 have been met.
860 865
861 866 follow : Dependency or collection of msg_ids
862 867 Only for load-balanced execution (targets=None)
863 868 Specify a list of msg_ids as a location-based dependency.
864 869 This job will only be run on an engine where this dependency
865 870 is met.
866 871
867 872 timeout : float/int or None
868 873 Only for load-balanced execution (targets=None)
869 874 Specify an amount of time (in seconds) for the scheduler to
870 875 wait for dependencies to be met before failing with a
871 876 DependencyTimeout.
872 877
873 878 retries : int
874 879 Number of times a task will be retried on failure.
875 880 """
876 881
877 882 super(LoadBalancedView, self).set_flags(**kwargs)
878 883 for name in ('follow', 'after'):
879 884 if name in kwargs:
880 885 value = kwargs[name]
881 886 if self._validate_dependency(value):
882 887 setattr(self, name, value)
883 888 else:
884 889 raise ValueError("Invalid dependency: %r"%value)
885 890 if 'timeout' in kwargs:
886 891 t = kwargs['timeout']
887 892 if not isinstance(t, (int, long, float, type(None))):
888 893 raise TypeError("Invalid type for timeout: %r"%type(t))
889 894 if t is not None:
890 895 if t < 0:
891 896 raise ValueError("Invalid timeout: %s"%t)
892 897 self.timeout = t
893 898
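A sketch of the dependency flags, assuming a LoadBalancedView `lview` and two hypothetical task functions `setup` and `process`::

    ar = lview.apply_async(setup)
    lview.set_flags(after=ar, retries=2)    # later tasks wait for `ar`
    with lview.temp_flags(follow=ar, timeout=10.):
        ar2 = lview.apply_async(process)    # must run where `ar` ran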
894 899 @sync_results
895 900 @save_ids
896 901 def _really_apply(self, f, args=None, kwargs=None, block=None, track=None,
897 902 after=None, follow=None, timeout=None,
898 903 targets=None, retries=None):
899 904 """calls f(*args, **kwargs) on a remote engine, returning the result.
900 905
901 906 This method temporarily sets all of `apply`'s flags for a single call.
902 907
903 908 Parameters
904 909 ----------
905 910
906 911 f : callable
907 912
908 913 args : list [default: empty]
909 914
910 915 kwargs : dict [default: empty]
911 916
912 917 block : bool [default: self.block]
913 918 whether to block
914 919 track : bool [default: self.track]
915 920 whether to ask zmq to track the message, for safe non-copying sends
916 921
917 922 after, follow, timeout, retries, targets : as documented in `set_flags`
918 923
919 924 Returns
920 925 -------
921 926
922 927 if self.block is False:
923 928 returns AsyncResult
924 929 else:
925 930 returns actual result of f(*args, **kwargs) on the engine(s)
926 931 This will be a list if self.targets is also a list (even of length 1), or
927 932 the single result if self.targets is an integer engine id
928 933 """
929 934
930 935 # validate whether we can run
931 936 if self._socket.closed:
932 937 msg = "Task farming is disabled"
933 938 if self._task_scheme == 'pure':
934 939 msg += " because the pure ZMQ scheduler cannot handle"
935 940 msg += " disappearing engines."
936 941 raise RuntimeError(msg)
937 942
938 943 if self._task_scheme == 'pure':
939 944 # pure zmq scheme doesn't support extra features
940 945 msg = ("Pure ZMQ scheduler doesn't support the following flags: "
941 946 "follow, after, retries, targets, timeout")
942 947 if (follow or after or retries or targets or timeout):
943 948 # hard fail on Scheduler flags
944 949 raise RuntimeError(msg)
945 950 if isinstance(f, dependent):
946 951 # soft warn on functional dependencies
947 952 warnings.warn(msg, RuntimeWarning)
948 953
949 954 # build args
950 955 args = [] if args is None else args
951 956 kwargs = {} if kwargs is None else kwargs
952 957 block = self.block if block is None else block
953 958 track = self.track if track is None else track
954 959 after = self.after if after is None else after
955 960 retries = self.retries if retries is None else retries
956 961 follow = self.follow if follow is None else follow
957 962 timeout = self.timeout if timeout is None else timeout
958 963 targets = self.targets if targets is None else targets
959 964
960 965 if not isinstance(retries, int):
961 966 raise TypeError('retries must be int, not %r'%type(retries))
962 967
963 968 if targets is None:
964 969 idents = []
965 970 else:
966 971 idents = self.client._build_targets(targets)[0]
967 972
968 973 after = self._render_dependency(after)
969 974 follow = self._render_dependency(follow)
970 975 subheader = dict(after=after, follow=follow, timeout=timeout, targets=idents, retries=retries)
971 976
972 977 msg = self.client.send_apply_message(self._socket, f, args, kwargs, track=track,
973 978 subheader=subheader)
974 979 tracker = None if track is False else msg['tracker']
975 980
976 981 ar = AsyncResult(self.client, msg['msg_id'], fname=f.__name__, targets=None, tracker=tracker)
977 982
978 983 if block:
979 984 try:
980 985 return ar.get()
981 986 except KeyboardInterrupt:
982 987 pass
983 988 return ar
984 989
985 990 @spin_after
986 991 @save_ids
987 992 def map(self, f, *sequences, **kwargs):
988 993 """view.map(f, *sequences, block=self.block, chunksize=1) => list|AsyncMapResult
989 994
990 995 Parallel version of builtin `map`, load-balanced by this View.
991 996
992 997 `block` and `chunksize` can be specified by keyword only.
993 998
994 999 Each `chunksize` elements will be a separate task, and will be
995 1000 load-balanced. This lets individual elements be available for iteration
996 1001 as soon as they arrive.
997 1002
998 1003 Parameters
999 1004 ----------
1000 1005
1001 1006 f : callable
1002 1007 function to be mapped
1003 1008 *sequences: one or more sequences of matching length
1004 1009 the sequences to be distributed and passed to `f`
1005 1010 block : bool
1006 1011 whether to wait for the result or not [default self.block]
1007 1012 track : bool
1008 1013 whether to create a MessageTracker to allow the user to
1009 1014 know when it is safe to edit arrays and buffers again
1010 1015 after a non-copying send.
1011 1016 chunksize : int
1012 1017 how many elements should be in each task [default 1]
1013 1018
1014 1019 Returns
1015 1020 -------
1016 1021
1017 1022 if block=False:
1018 1023 AsyncMapResult
1019 1024 An object like AsyncResult, but which reassembles the sequence of results
1020 1025 into a single list. AsyncMapResults can be iterated through before all
1021 1026 results are complete.
1022 1027 else:
1023 1028 the result of map(f,*sequences)
1024 1029
1025 1030 """
1026 1031
1027 1032 # default
1028 1033 block = kwargs.get('block', self.block)
1029 1034 chunksize = kwargs.get('chunksize', 1)
1030 1035
1031 1036 keyset = set(kwargs.keys())
1032 1037 extra_keys = keyset.difference(set(['block', 'chunksize']))
1033 1038 if extra_keys:
1034 1039 raise TypeError("Invalid kwargs: %s"%list(extra_keys))
1035 1040
1036 1041 assert len(sequences) > 0, "must have some sequences to map onto!"
1037 1042
1038 1043 pf = ParallelFunction(self, f, block=block, chunksize=chunksize)
1039 1044 return pf.map(*sequences)
1040 1045
1041 1046 __all__ = ['LoadBalancedView', 'DirectView']
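A minimal usage sketch for the LoadBalancedView API in the file above (it assumes a running cluster, e.g. started with `ipcluster start`, and the `Client` entry point of this release):

    from IPython.parallel import Client

    rc = Client()                    # connect to the running controller
    view = rc.load_balanced_view()   # a LoadBalancedView over all engines

    # retry failed tasks twice, and give dependencies 30s to be met
    view.set_flags(retries=2, timeout=30.0)

    # blocking map: every chunk of two elements becomes one load-balanced task
    squares = view.map(lambda x: x**2, range(10), block=True, chunksize=2)

    # non-blocking apply returns an AsyncResult
    ar = view.apply(pow, 2, 10)
    print(ar.get())                  # 1024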
@@ -1,196 +1,201 b''
1 """Dependency utilities"""
1 """Dependency utilities
2
3 Authors:
4
5 * Min RK
6 """
2 7 #-----------------------------------------------------------------------------
3 8 # Copyright (C) 2010-2011 The IPython Development Team
4 9 #
5 10 # Distributed under the terms of the BSD License. The full license is in
6 11 # the file COPYING, distributed as part of this software.
7 12 #-----------------------------------------------------------------------------
8 13
9 14 from types import ModuleType
10 15
11 16 from IPython.parallel.client.asyncresult import AsyncResult
12 17 from IPython.parallel.error import UnmetDependency
13 18 from IPython.parallel.util import interactive
14 19
15 20 class depend(object):
16 21 """Dependency decorator, for use with tasks.
17 22
18 23 `@depend` lets you define a function for engine dependencies
19 24 just like you use `apply` for tasks.
20 25
21 26
22 27 Examples
23 28 --------
24 29 ::
25 30
26 31 @depend(df, a,b, c=5)
27 32 def f(m,n,p):
28 33
29 34 view.apply(f, 1,2,3)
30 35
31 36 will call df(a,b,c=5) on the engine, and if it returns False or
32 37 raises an UnmetDependency error, then the task will not be run
33 38 and another engine will be tried.
34 39 """
35 40 def __init__(self, f, *args, **kwargs):
36 41 self.f = f
37 42 self.args = args
38 43 self.kwargs = kwargs
39 44
40 45 def __call__(self, f):
41 46 return dependent(f, self.f, *self.args, **self.kwargs)
42 47
43 48 class dependent(object):
44 49 """A function that depends on another function.
45 50 This is implemented as an object rather than the closure a
46 51 traditional decorator would use, because closures are not picklable.
47 52 """
48 53
49 54 def __init__(self, f, df, *dargs, **dkwargs):
50 55 self.f = f
51 56 self.func_name = getattr(f, '__name__', 'f')
52 57 self.df = df
53 58 self.dargs = dargs
54 59 self.dkwargs = dkwargs
55 60
56 61 def __call__(self, *args, **kwargs):
57 62 # if hasattr(self.f, 'func_globals') and hasattr(self.df, 'func_globals'):
58 63 # self.df.func_globals = self.f.func_globals
59 64 if self.df(*self.dargs, **self.dkwargs) is False:
60 65 raise UnmetDependency()
61 66 return self.f(*args, **kwargs)
62 67
63 68 @property
64 69 def __name__(self):
65 70 return self.func_name
66 71
67 72 @interactive
68 73 def _require(*names):
69 74 """Helper for @require decorator."""
70 75 from IPython.parallel.error import UnmetDependency
71 76 user_ns = globals()
72 77 for name in names:
73 78 if name in user_ns:
74 79 continue
75 80 try:
76 81 exec 'import %s'%name in user_ns
77 82 except ImportError:
78 83 raise UnmetDependency(name)
79 84 return True
80 85
81 86 def require(*mods):
82 87 """Simple decorator for requiring names to be importable.
83 88
84 89 Examples
85 90 --------
86 91
87 92 In [1]: @require('numpy')
88 93 ...: def norm(a):
89 94 ...: import numpy
90 95 ...: return numpy.linalg.norm(a,2)
91 96 """
92 97 names = []
93 98 for mod in mods:
94 99 if isinstance(mod, ModuleType):
95 100 mod = mod.__name__
96 101
97 102 if isinstance(mod, basestring):
98 103 names.append(mod)
99 104 else:
100 105 raise TypeError("names must be modules or module names, not %s"%type(mod))
101 106
102 107 return depend(_require, *names)
103 108
104 109 class Dependency(set):
105 110 """An object for representing a set of msg_id dependencies.
106 111
107 112 Subclassed from set().
108 113
109 114 Parameters
110 115 ----------
111 116 dependencies: list/set of msg_ids or AsyncResult objects or output of Dependency.as_dict()
112 117 The msg_ids to depend on
113 118 all : bool [default True]
114 119 Whether the dependency should be considered met when *all* depended-upon tasks have completed
115 120 or only when *any* have been completed.
116 121 success : bool [default True]
117 122 Whether to consider successes as fulfilling dependencies.
118 123 failure : bool [default False]
119 124 Whether to consider failures as fulfilling dependencies.
120 125
121 126 If `all=success=True` and `failure=False`, then the task will fail with an ImpossibleDependency
122 127 as soon as the first depended-upon task fails.
123 128 """
124 129
125 130 all=True
126 131 success=True
127 132 failure=False
128 133
129 134 def __init__(self, dependencies=[], all=True, success=True, failure=False):
130 135 if isinstance(dependencies, dict):
131 136 # load from dict
132 137 all = dependencies.get('all', all)
133 138 success = dependencies.get('success', success)
134 139 failure = dependencies.get('failure', failure)
135 140 dependencies = dependencies.get('dependencies', [])
136 141 ids = []
137 142
138 143 # extract ids from various sources:
139 144 if isinstance(dependencies, (basestring, AsyncResult)):
140 145 dependencies = [dependencies]
141 146 for d in dependencies:
142 147 if isinstance(d, basestring):
143 148 ids.append(d)
144 149 elif isinstance(d, AsyncResult):
145 150 ids.extend(d.msg_ids)
146 151 else:
147 152 raise TypeError("invalid dependency type: %r"%type(d))
148 153
149 154 set.__init__(self, ids)
150 155 self.all = all
151 156 if not (success or failure):
152 157 raise ValueError("Must depend on at least one of successes or failures!")
153 158 self.success=success
154 159 self.failure = failure
155 160
156 161 def check(self, completed, failed=None):
157 162 """check whether our dependencies have been met."""
158 163 if len(self) == 0:
159 164 return True
160 165 against = set()
161 166 if self.success:
162 167 against = completed
163 168 if failed is not None and self.failure:
164 169 against = against.union(failed)
165 170 if self.all:
166 171 return self.issubset(against)
167 172 else:
168 173 return not self.isdisjoint(against)
169 174
170 175 def unreachable(self, completed, failed=None):
171 176 """return whether this dependency has become impossible."""
172 177 if len(self) == 0:
173 178 return False
174 179 against = set()
175 180 if not self.success:
176 181 against = completed
177 182 if failed is not None and not self.failure:
178 183 against = against.union(failed)
179 184 if self.all:
180 185 return not self.isdisjoint(against)
181 186 else:
182 187 return self.issubset(against)
183 188
184 189
185 190 def as_dict(self):
186 191 """Represent this dependency as a dict. For json compatibility."""
187 192 return dict(
188 193 dependencies=list(self),
189 194 all=self.all,
190 195 success=self.success,
191 196 failure=self.failure
192 197 )
193 198
194 199
195 200 __all__ = ['depend', 'require', 'dependent', 'Dependency']
196 201
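The Dependency semantics above are easy to exercise standalone; a short sketch (the import path is assumed from this source tree):

    from IPython.parallel.controller.dependency import Dependency

    dep = Dependency(['a', 'b'], all=True, success=True, failure=False)

    dep.check(set(['a']))                      # False: 'b' has not completed
    dep.check(set(['a', 'b']))                 # True: all dependencies succeeded

    # with failure=False, one failed dependency makes the job impossible
    dep.unreachable(set(), failed=set(['a']))  # True

    any_dep = Dependency(['a', 'b'], all=False)
    any_dep.check(set(['b']))                  # True: any one dependency suffices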
@@ -1,180 +1,185 b''
1 1 """A Task logger that presents our DB interface,
2 2 but exists entirely in memory and is implemented with dicts.
3 3
4 Authors:
5
6 * Min RK
7
8
4 9 TaskRecords are dicts of the form:
5 10 {
6 11 'msg_id' : str(uuid),
7 12 'client_uuid' : str(uuid),
8 13 'engine_uuid' : str(uuid) or None,
9 14 'header' : dict(header),
10 15 'content': dict(content),
11 16 'buffers': list(buffers),
12 17 'submitted': datetime,
13 18 'started': datetime or None,
14 19 'completed': datetime or None,
15 20 'resubmitted': datetime or None,
16 21 'result_header' : dict(header) or None,
17 22 'result_content' : dict(content) or None,
18 23 'result_buffers' : list(buffers) or None,
19 24 }
20 25 With this info, many of the special categories of tasks can be defined by query:
21 26
22 27 pending: completed is None
23 28 client's outstanding: client_uuid = uuid && completed is None
24 29 MIA: arrived is None (and completed is None)
25 30 etc.
26 31
27 32 EngineRecords are dicts of the form:
28 33 {
29 34 'eid' : int(id),
30 35 'uuid': str(uuid)
31 36 }
32 37 This may be extended, but this is all it currently contains.
33 38
34 39 We support a subset of mongodb operators:
35 40 $lt,$gt,$lte,$gte,$ne,$in,$nin,$all,$mod,$exists
36 41 """
37 42 #-----------------------------------------------------------------------------
38 # Copyright (C) 2010 The IPython Development Team
43 # Copyright (C) 2010-2011 The IPython Development Team
39 44 #
40 45 # Distributed under the terms of the BSD License. The full license is in
41 46 # the file COPYING, distributed as part of this software.
42 47 #-----------------------------------------------------------------------------
43 48
44 49
45 50 from datetime import datetime
46 51
47 52 from IPython.config.configurable import LoggingConfigurable
48 53
49 54 from IPython.utils.traitlets import Dict, Unicode, Instance
50 55
51 56 filters = {
52 57 '$lt' : lambda a,b: a < b,
53 58 '$gt' : lambda a,b: a > b,
54 59 '$eq' : lambda a,b: a == b,
55 60 '$ne' : lambda a,b: a != b,
56 61 '$lte': lambda a,b: a <= b,
57 62 '$gte': lambda a,b: a >= b,
58 63 '$in' : lambda a,b: a in b,
59 64 '$nin': lambda a,b: a not in b,
60 65 '$all': lambda a,b: all([ bb in a for bb in b ]),
61 66 '$mod': lambda a,b: a%b[0] == b[1],
62 67 '$exists' : lambda a,b: (b and a is not None) or (a is None and not b)
63 68 }
64 69
65 70
66 71 class CompositeFilter(object):
67 72 """Composite filter for matching multiple properties."""
68 73
69 74 def __init__(self, dikt):
70 75 self.tests = []
71 76 self.values = []
72 77 for key, value in dikt.iteritems():
73 78 self.tests.append(filters[key])
74 79 self.values.append(value)
75 80
76 81 def __call__(self, value):
77 82 for test,check in zip(self.tests, self.values):
78 83 if not test(value, check):
79 84 return False
80 85 return True
81 86
82 87 class BaseDB(LoggingConfigurable):
83 88 """Empty Parent class so traitlets work on DB."""
84 89 # base configurable traits:
85 90 session = Unicode("")
86 91
87 92 class DictDB(BaseDB):
88 93 """Basic in-memory dict-based object for saving Task Records.
89 94
90 95 This is the first object to present the DB interface
91 96 for logging tasks out of memory.
92 97
93 98 The interface is based on MongoDB, so adding a MongoDB
94 99 backend should be straightforward.
95 100 """
96 101
97 102 _records = Dict()
98 103
99 104 def _match_one(self, rec, tests):
100 105 """Check if a specific record matches tests."""
101 106 for key,test in tests.iteritems():
102 107 if not test(rec.get(key, None)):
103 108 return False
104 109 return True
105 110
106 111 def _match(self, check):
107 112 """Find all the matches for a check dict."""
108 113 matches = []
109 114 tests = {}
110 115 for k,v in check.iteritems():
111 116 if isinstance(v, dict):
112 117 tests[k] = CompositeFilter(v)
113 118 else:
114 119 tests[k] = lambda o, v=v: o==v # bind v per key; a plain closure would see only the last v
115 120
116 121 for rec in self._records.itervalues():
117 122 if self._match_one(rec, tests):
118 123 matches.append(rec)
119 124 return matches
120 125
121 126 def _extract_subdict(self, rec, keys):
122 127 """extract subdict of keys"""
123 128 d = {}
124 129 d['msg_id'] = rec['msg_id']
125 130 for key in keys:
126 131 d[key] = rec[key]
127 132 return d
128 133
129 134 def add_record(self, msg_id, rec):
130 135 """Add a new Task Record, by msg_id."""
131 136 if msg_id in self._records:
132 137 raise KeyError("Already have msg_id %r"%(msg_id))
133 138 self._records[msg_id] = rec
134 139
135 140 def get_record(self, msg_id):
136 141 """Get a specific Task Record, by msg_id."""
137 142 if msg_id not in self._records:
138 143 raise KeyError("No such msg_id %r"%(msg_id))
139 144 return self._records[msg_id]
140 145
141 146 def update_record(self, msg_id, rec):
142 147 """Update the data in an existing record."""
143 148 self._records[msg_id].update(rec)
144 149
145 150 def drop_matching_records(self, check):
146 151 """Remove a record from the DB."""
147 152 matches = self._match(check)
148 153 for m in matches:
149 154 del self._records[m['msg_id']]
150 155
151 156 def drop_record(self, msg_id):
152 157 """Remove a record from the DB."""
153 158 del self._records[msg_id]
154 159
155 160
156 161 def find_records(self, check, keys=None):
157 162 """Find records matching a query dict, optionally extracting subset of keys.
158 163
159 164 Returns dict keyed by msg_id of matching records.
160 165
161 166 Parameters
162 167 ----------
163 168
164 169 check: dict
165 170 mongodb-style query argument
166 171 keys: list of strs [optional]
167 172 if specified, the subset of keys to extract. msg_id will *always* be
168 173 included.
169 174 """
170 175 matches = self._match(check)
171 176 if keys:
172 177 return [ self._extract_subdict(rec, keys) for rec in matches ]
173 178 else:
174 179 return matches
175 180
176 181
177 182 def get_history(self):
178 183 """get all msg_ids, ordered by time submitted."""
179 184 msg_ids = self._records.keys()
180 185 return sorted(msg_ids, key=lambda m: self._records[m]['submitted'])
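A quick sketch of querying a DictDB directly, using the mongodb-style operators from the `filters` table (standalone; no controller required):

    from datetime import datetime
    from IPython.parallel.controller.dictdb import DictDB

    db = DictDB()
    db.add_record('m1', {'msg_id': 'm1', 'submitted': datetime(2011, 1, 1),
                         'completed': None, 'engine_uuid': 'e0'})
    db.add_record('m2', {'msg_id': 'm2', 'submitted': datetime(2011, 1, 2),
                         'completed': datetime(2011, 1, 3), 'engine_uuid': 'e1'})

    db.find_records({'completed': None})       # pending tasks -> [m1's record]
    db.find_records({'submitted': {'$gte': datetime(2011, 1, 2)}},
                    keys=['engine_uuid'])      # msg_id is always included
    db.get_history()                           # ['m1', 'm2'], by submit time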
@@ -1,165 +1,169 b''
1 1 #!/usr/bin/env python
2 2 """
3 3 A multi-heart Heartbeat system using PUB and XREP sockets. Pings are sent out on the PUB,
4 4 and hearts are tracked based on their XREQ identities.
5
6 Authors:
7
8 * Min RK
5 9 """
6 10 #-----------------------------------------------------------------------------
7 11 # Copyright (C) 2010-2011 The IPython Development Team
8 12 #
9 13 # Distributed under the terms of the BSD License. The full license is in
10 14 # the file COPYING, distributed as part of this software.
11 15 #-----------------------------------------------------------------------------
12 16
13 17 from __future__ import print_function
14 18 import time
15 19 import uuid
16 20
17 21 import zmq
18 22 from zmq.devices import ThreadDevice
19 23 from zmq.eventloop import ioloop, zmqstream
20 24
21 25 from IPython.config.configurable import LoggingConfigurable
22 26 from IPython.utils.traitlets import Set, Instance, CFloat
23 27
24 28 class Heart(object):
25 29 """A basic heart object for responding to a HeartMonitor.
26 30 This is a simple wrapper with defaults for the most common
27 31 Device model for responding to heartbeats.
28 32
29 33 It simply builds a threadsafe zmq.FORWARDER Device, defaulting to using
30 34 SUB/XREQ for in/out.
31 35
32 36 You can specify the XREQ's IDENTITY via the optional heart_id argument."""
33 37 device=None
34 38 id=None
35 39 def __init__(self, in_addr, out_addr, in_type=zmq.SUB, out_type=zmq.XREQ, heart_id=None):
36 40 self.device = ThreadDevice(zmq.FORWARDER, in_type, out_type)
37 41 self.device.daemon=True
38 42 self.device.connect_in(in_addr)
39 43 self.device.connect_out(out_addr)
40 44 if in_type == zmq.SUB:
41 45 self.device.setsockopt_in(zmq.SUBSCRIBE, "")
42 46 if heart_id is None:
43 47 heart_id = str(uuid.uuid4())
44 48 self.device.setsockopt_out(zmq.IDENTITY, heart_id)
45 49 self.id = heart_id
46 50
47 51 def start(self):
48 52 return self.device.start()
49 53
50 54 class HeartMonitor(LoggingConfigurable):
51 55 """A basic HeartMonitor class
52 56 pingstream: a PUB stream
53 57 pongstream: an XREP stream
54 58 period: the period of the heartbeat in milliseconds"""
55 59
56 60 period=CFloat(1000, config=True,
57 61 help='The period (in ms) at which the Hub pings the engines for heartbeats '
58 62 '[default: 1000]',
59 63 )
60 64
61 65 pingstream=Instance('zmq.eventloop.zmqstream.ZMQStream')
62 66 pongstream=Instance('zmq.eventloop.zmqstream.ZMQStream')
63 67 loop = Instance('zmq.eventloop.ioloop.IOLoop')
64 68 def _loop_default(self):
65 69 return ioloop.IOLoop.instance()
66 70
67 71 # not settable:
68 72 hearts=Set()
69 73 responses=Set()
70 74 on_probation=Set()
71 75 last_ping=CFloat(0)
72 76 _new_handlers = Set()
73 77 _failure_handlers = Set()
74 78 lifetime = CFloat(0)
75 79 tic = CFloat(0)
76 80
77 81 def __init__(self, **kwargs):
78 82 super(HeartMonitor, self).__init__(**kwargs)
79 83
80 84 self.pongstream.on_recv(self.handle_pong)
81 85
82 86 def start(self):
83 87 self.caller = ioloop.PeriodicCallback(self.beat, self.period, self.loop)
84 88 self.caller.start()
85 89
86 90 def add_new_heart_handler(self, handler):
87 91 """add a new handler for new hearts"""
88 92 self.log.debug("heartbeat::new_heart_handler: %s"%handler)
89 93 self._new_handlers.add(handler)
90 94
91 95 def add_heart_failure_handler(self, handler):
92 96 """add a new handler for heart failure"""
93 97 self.log.debug("heartbeat::new heart failure handler: %s"%handler)
94 98 self._failure_handlers.add(handler)
95 99
96 100 def beat(self):
97 101 self.pongstream.flush()
98 102 self.last_ping = self.lifetime
99 103
100 104 toc = time.time()
101 105 self.lifetime += toc-self.tic
102 106 self.tic = toc
103 107 # self.log.debug("heartbeat::%s"%self.lifetime)
104 108 goodhearts = self.hearts.intersection(self.responses)
105 109 missed_beats = self.hearts.difference(goodhearts)
106 110 heartfailures = self.on_probation.intersection(missed_beats)
107 111 newhearts = self.responses.difference(goodhearts)
108 112 map(self.handle_new_heart, newhearts)
109 113 map(self.handle_heart_failure, heartfailures)
110 114 self.on_probation = missed_beats.intersection(self.hearts)
111 115 self.responses = set()
112 116 # print self.on_probation, self.hearts
113 117 # self.log.debug("heartbeat::beat %.3f, %i beating hearts"%(self.lifetime, len(self.hearts)))
114 118 self.pingstream.send(str(self.lifetime))
115 119
116 120 def handle_new_heart(self, heart):
117 121 if self._new_handlers:
118 122 for handler in self._new_handlers:
119 123 handler(heart)
120 124 else:
121 125 self.log.info("heartbeat::yay, got new heart %s!"%heart)
122 126 self.hearts.add(heart)
123 127
124 128 def handle_heart_failure(self, heart):
125 129 if self._failure_handlers:
126 130 for handler in self._failure_handlers:
127 131 try:
128 132 handler(heart)
129 133 except Exception as e:
130 134 self.log.error("heartbeat::Bad Handler! %s"%handler, exc_info=True)
131 135 pass
132 136 else:
133 137 self.log.info("heartbeat::Heart %s failed :("%heart)
134 138 self.hearts.remove(heart)
135 139
136 140
137 141 def handle_pong(self, msg):
138 142 "a heart just beat"
139 143 if msg[1] == str(self.lifetime):
140 144 delta = time.time()-self.tic
141 145 # self.log.debug("heartbeat::heart %r took %.2f ms to respond"%(msg[0], 1000*delta))
142 146 self.responses.add(msg[0])
143 147 elif msg[1] == str(self.last_ping):
144 148 delta = time.time()-self.tic + (self.lifetime-self.last_ping)
145 149 self.log.warn("heartbeat::heart %r missed a beat, and took %.2f ms to respond"%(msg[0], 1000*delta))
146 150 self.responses.add(msg[0])
147 151 else:
148 152 self.log.warn("heartbeat::got bad heartbeat (possibly old?): %s (current=%.3f)"%
149 153 (msg[1],self.lifetime))
150 154
151 155
152 156 if __name__ == '__main__':
153 157 loop = ioloop.IOLoop.instance()
154 158 context = zmq.Context()
155 159 pub = context.socket(zmq.PUB)
156 160 pub.bind('tcp://127.0.0.1:5555')
157 161 xrep = context.socket(zmq.XREP)
158 162 xrep.bind('tcp://127.0.0.1:5556')
159 163
160 164 outstream = zmqstream.ZMQStream(pub, loop)
161 165 instream = zmqstream.ZMQStream(xrep, loop)
162 166
163 167 hb = HeartMonitor(loop=loop, pingstream=outstream, pongstream=instream)
164 168 hb.start()
165 169 loop.start()
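To exercise the `__main__` demo above, a matching heart can be run in a second process; a minimal sketch against the same ports:

    import time
    from IPython.parallel.controller.heartmonitor import Heart

    # connect to the monitor's PUB (5555) and XREP (5556) sockets
    heart = Heart('tcp://127.0.0.1:5555', 'tcp://127.0.0.1:5556',
                  heart_id='demo-heart-1')
    heart.start()    # the ThreadDevice echoes each ping back with our identity
    time.sleep(30)   # keep the process alive while the heart beats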
@@ -1,1284 +1,1288 b''
1 1 #!/usr/bin/env python
2 2 """The IPython Controller Hub with 0MQ
3 3 This is the master object that handles connections from engines and clients,
4 4 and monitors traffic through the various queues.
5
6 Authors:
7
8 * Min RK
5 9 """
6 10 #-----------------------------------------------------------------------------
7 11 # Copyright (C) 2010 The IPython Development Team
8 12 #
9 13 # Distributed under the terms of the BSD License. The full license is in
10 14 # the file COPYING, distributed as part of this software.
11 15 #-----------------------------------------------------------------------------
12 16
13 17 #-----------------------------------------------------------------------------
14 18 # Imports
15 19 #-----------------------------------------------------------------------------
16 20 from __future__ import print_function
17 21
18 22 import sys
19 23 import time
20 24 from datetime import datetime
21 25
22 26 import zmq
23 27 from zmq.eventloop import ioloop
24 28 from zmq.eventloop.zmqstream import ZMQStream
25 29
26 30 # internal:
27 31 from IPython.utils.importstring import import_item
28 32 from IPython.utils.traitlets import (
29 33 HasTraits, Instance, Int, Unicode, Dict, Set, Tuple, CStr
30 34 )
31 35
32 36 from IPython.parallel import error, util
33 37 from IPython.parallel.factory import RegistrationFactory
34 38
35 39 from IPython.zmq.session import SessionFactory
36 40
37 41 from .heartmonitor import HeartMonitor
38 42
39 43 #-----------------------------------------------------------------------------
40 44 # Code
41 45 #-----------------------------------------------------------------------------
42 46
43 47 def _passer(*args, **kwargs):
44 48 return
45 49
46 50 def _printer(*args, **kwargs):
47 51 print (args)
48 52 print (kwargs)
49 53
50 54 def empty_record():
51 55 """Return an empty dict with all record keys."""
52 56 return {
53 57 'msg_id' : None,
54 58 'header' : None,
55 59 'content': None,
56 60 'buffers': None,
57 61 'submitted': None,
58 62 'client_uuid' : None,
59 63 'engine_uuid' : None,
60 64 'started': None,
61 65 'completed': None,
62 66 'resubmitted': None,
63 67 'result_header' : None,
64 68 'result_content' : None,
65 69 'result_buffers' : None,
66 70 'queue' : None,
67 71 'pyin' : None,
68 72 'pyout': None,
69 73 'pyerr': None,
70 74 'stdout': '',
71 75 'stderr': '',
72 76 }
73 77
74 78 def init_record(msg):
75 79 """Initialize a TaskRecord based on a request."""
76 80 header = msg['header']
77 81 return {
78 82 'msg_id' : header['msg_id'],
79 83 'header' : header,
80 84 'content': msg['content'],
81 85 'buffers': msg['buffers'],
82 86 'submitted': header['date'],
83 87 'client_uuid' : None,
84 88 'engine_uuid' : None,
85 89 'started': None,
86 90 'completed': None,
87 91 'resubmitted': None,
88 92 'result_header' : None,
89 93 'result_content' : None,
90 94 'result_buffers' : None,
91 95 'queue' : None,
92 96 'pyin' : None,
93 97 'pyout': None,
94 98 'pyerr': None,
95 99 'stdout': '',
96 100 'stderr': '',
97 101 }
98 102
99 103
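For reference, a sketch of how `init_record` seeds a TaskRecord from an incoming request (the message dict here is hypothetical, shaped like the Session messages the Hub sees):

    from datetime import datetime

    msg = {
        'header': {'msg_id': 'abc123', 'date': datetime(2011, 6, 1)},
        'content': {},    # the request content
        'buffers': [],    # serialized args/kwargs
    }
    rec = init_record(msg)
    rec['msg_id']        # 'abc123'
    rec['submitted']     # datetime(2011, 6, 1)
    rec['completed']     # None, until a save_*_result handler fills it in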
100 104 class EngineConnector(HasTraits):
101 105 """A simple object for accessing the various zmq connections of an object.
102 106 Attributes are:
103 107 id (int): engine ID
104 108 uuid (str): uuid (unused?)
105 109 queue (str): identity of queue's XREQ socket
106 110 registration (str): identity of registration XREQ socket
107 111 heartbeat (str): identity of heartbeat XREQ socket
108 112 """
109 113 id=Int(0)
110 114 queue=CStr()
111 115 control=CStr()
112 116 registration=CStr()
113 117 heartbeat=CStr()
114 118 pending=Set()
115 119
116 120 class HubFactory(RegistrationFactory):
117 121 """The Configurable for setting up a Hub."""
118 122
119 123 # port-pairs for monitoredqueues:
120 124 hb = Tuple(Int,Int,config=True,
121 125 help="""XREQ/SUB Port pair for Engine heartbeats""")
122 126 def _hb_default(self):
123 127 return tuple(util.select_random_ports(2))
124 128
125 129 mux = Tuple(Int,Int,config=True,
126 130 help="""Engine/Client Port pair for MUX queue""")
127 131
128 132 def _mux_default(self):
129 133 return tuple(util.select_random_ports(2))
130 134
131 135 task = Tuple(Int,Int,config=True,
132 136 help="""Engine/Client Port pair for Task queue""")
133 137 def _task_default(self):
134 138 return tuple(util.select_random_ports(2))
135 139
136 140 control = Tuple(Int,Int,config=True,
137 141 help="""Engine/Client Port pair for Control queue""")
138 142
139 143 def _control_default(self):
140 144 return tuple(util.select_random_ports(2))
141 145
142 146 iopub = Tuple(Int,Int,config=True,
143 147 help="""Engine/Client Port pair for IOPub relay""")
144 148
145 149 def _iopub_default(self):
146 150 return tuple(util.select_random_ports(2))
147 151
148 152 # single ports:
149 153 mon_port = Int(config=True,
150 154 help="""Monitor (SUB) port for queue traffic""")
151 155
152 156 def _mon_port_default(self):
153 157 return util.select_random_ports(1)[0]
154 158
155 159 notifier_port = Int(config=True,
156 160 help="""PUB port for sending engine status notifications""")
157 161
158 162 def _notifier_port_default(self):
159 163 return util.select_random_ports(1)[0]
160 164
161 165 engine_ip = Unicode('127.0.0.1', config=True,
162 166 help="IP on which to listen for engine connections. [default: loopback]")
163 167 engine_transport = Unicode('tcp', config=True,
164 168 help="0MQ transport for engine connections. [default: tcp]")
165 169
166 170 client_ip = Unicode('127.0.0.1', config=True,
167 171 help="IP on which to listen for client connections. [default: loopback]")
168 172 client_transport = Unicode('tcp', config=True,
169 173 help="0MQ transport for client connections. [default : tcp]")
170 174
171 175 monitor_ip = Unicode('127.0.0.1', config=True,
172 176 help="IP on which to listen for monitor messages. [default: loopback]")
173 177 monitor_transport = Unicode('tcp', config=True,
174 178 help="0MQ transport for monitor messages. [default : tcp]")
175 179
176 180 monitor_url = Unicode('')
177 181
178 182 db_class = Unicode('IPython.parallel.controller.dictdb.DictDB', config=True,
179 183 help="""The class to use for the DB backend""")
180 184
181 185 # not configurable
182 186 db = Instance('IPython.parallel.controller.dictdb.BaseDB')
183 187 heartmonitor = Instance('IPython.parallel.controller.heartmonitor.HeartMonitor')
184 188
185 189 def _ip_changed(self, name, old, new):
186 190 self.engine_ip = new
187 191 self.client_ip = new
188 192 self.monitor_ip = new
189 193 self._update_monitor_url()
190 194
191 195 def _update_monitor_url(self):
192 196 self.monitor_url = "%s://%s:%i"%(self.monitor_transport, self.monitor_ip, self.mon_port)
193 197
194 198 def _transport_changed(self, name, old, new):
195 199 self.engine_transport = new
196 200 self.client_transport = new
197 201 self.monitor_transport = new
198 202 self._update_monitor_url()
199 203
200 204 def __init__(self, **kwargs):
201 205 super(HubFactory, self).__init__(**kwargs)
202 206 self._update_monitor_url()
203 207
204 208
205 209 def construct(self):
206 210 self.init_hub()
207 211
208 212 def start(self):
209 213 self.heartmonitor.start()
210 214 self.log.info("Heartmonitor started")
211 215
212 216 def init_hub(self):
213 217 """construct"""
214 218 client_iface = "%s://%s:"%(self.client_transport, self.client_ip) + "%i"
215 219 engine_iface = "%s://%s:"%(self.engine_transport, self.engine_ip) + "%i"
216 220
217 221 ctx = self.context
218 222 loop = self.loop
219 223
220 224 # Registrar socket
221 225 q = ZMQStream(ctx.socket(zmq.XREP), loop)
222 226 q.bind(client_iface % self.regport)
223 227 self.log.info("Hub listening on %s for registration."%(client_iface%self.regport))
224 228 if self.client_ip != self.engine_ip:
225 229 q.bind(engine_iface % self.regport)
226 230 self.log.info("Hub listening on %s for registration."%(engine_iface%self.regport))
227 231
228 232 ### Engine connections ###
229 233
230 234 # heartbeat
231 235 hpub = ctx.socket(zmq.PUB)
232 236 hpub.bind(engine_iface % self.hb[0])
233 237 hrep = ctx.socket(zmq.XREP)
234 238 hrep.bind(engine_iface % self.hb[1])
235 239 self.heartmonitor = HeartMonitor(loop=loop, config=self.config, log=self.log,
236 240 pingstream=ZMQStream(hpub,loop),
237 241 pongstream=ZMQStream(hrep,loop)
238 242 )
239 243
240 244 ### Client connections ###
241 245 # Notifier socket
242 246 n = ZMQStream(ctx.socket(zmq.PUB), loop)
243 247 n.bind(client_iface%self.notifier_port)
244 248
245 249 ### build and launch the queues ###
246 250
247 251 # monitor socket
248 252 sub = ctx.socket(zmq.SUB)
249 253 sub.setsockopt(zmq.SUBSCRIBE, "")
250 254 sub.bind(self.monitor_url)
251 255 sub.bind('inproc://monitor')
252 256 sub = ZMQStream(sub, loop)
253 257
254 258 # connect the db
255 259 self.log.info('Hub using DB backend: %r'%(self.db_class.split('.')[-1]))
256 260 # cdir = self.config.Global.cluster_dir
257 261 self.db = import_item(str(self.db_class))(session=self.session.session,
258 262 config=self.config, log=self.log)
259 263 time.sleep(.25)
260 264 try:
261 265 scheme = self.config.TaskScheduler.scheme_name
262 266 except AttributeError:
263 267 from .scheduler import TaskScheduler
264 268 scheme = TaskScheduler.scheme_name.get_default_value()
265 269 # build connection dicts
266 270 self.engine_info = {
267 271 'control' : engine_iface%self.control[1],
268 272 'mux': engine_iface%self.mux[1],
269 273 'heartbeat': (engine_iface%self.hb[0], engine_iface%self.hb[1]),
270 274 'task' : engine_iface%self.task[1],
271 275 'iopub' : engine_iface%self.iopub[1],
272 276 # 'monitor' : engine_iface%self.mon_port,
273 277 }
274 278
275 279 self.client_info = {
276 280 'control' : client_iface%self.control[0],
277 281 'mux': client_iface%self.mux[0],
278 282 'task' : (scheme, client_iface%self.task[0]),
279 283 'iopub' : client_iface%self.iopub[0],
280 284 'notification': client_iface%self.notifier_port
281 285 }
282 286 self.log.debug("Hub engine addrs: %s"%self.engine_info)
283 287 self.log.debug("Hub client addrs: %s"%self.client_info)
284 288
285 289 # resubmit stream
286 290 r = ZMQStream(ctx.socket(zmq.XREQ), loop)
287 291 url = util.disambiguate_url(self.client_info['task'][-1])
288 292 r.setsockopt(zmq.IDENTITY, self.session.session)
289 293 r.connect(url)
290 294
291 295 self.hub = Hub(loop=loop, session=self.session, monitor=sub, heartmonitor=self.heartmonitor,
292 296 query=q, notifier=n, resubmit=r, db=self.db,
293 297 engine_info=self.engine_info, client_info=self.client_info,
294 298 log=self.log)
295 299
296 300
297 301 class Hub(SessionFactory):
298 302 """The IPython Controller Hub with 0MQ connections
299 303
300 304 Parameters
301 305 ==========
302 306 loop: zmq IOLoop instance
303 307 session: Session object
304 308 <removed> context: zmq context for creating new connections (?)
305 309 queue: ZMQStream for monitoring the command queue (SUB)
306 310 query: ZMQStream for engine registration and client query requests (XREP)
307 311 heartbeat: HeartMonitor object checking the pulse of the engines
308 312 notifier: ZMQStream for broadcasting engine registration changes (PUB)
309 313 db: connection to db for out of memory logging of commands
310 314 NotImplemented
311 315 engine_info: dict of zmq connection information for engines to connect
312 316 to the queues.
313 317 client_info: dict of zmq connection information for clients to connect
314 318 to the queues.
315 319 """
316 320 # internal data structures:
317 321 ids=Set() # engine IDs
318 322 keytable=Dict()
319 323 by_ident=Dict()
320 324 engines=Dict()
321 325 clients=Dict()
322 326 hearts=Dict()
323 327 pending=Set()
324 328 queues=Dict() # pending msg_ids keyed by engine_id
325 329 tasks=Dict() # pending msg_ids submitted as tasks, keyed by client_id
326 330 completed=Dict() # completed msg_ids keyed by engine_id
327 331 all_completed=Set() # set of all completed msg_ids
328 332 dead_engines=Set() # uuids of engines that have unregistered or died
329 333 unassigned=Set() # set of task msg_ids not yet assigned a destination
330 334 incoming_registrations=Dict()
331 335 registration_timeout=Int()
332 336 _idcounter=Int(0)
333 337
334 338 # objects from constructor:
335 339 query=Instance(ZMQStream)
336 340 monitor=Instance(ZMQStream)
337 341 notifier=Instance(ZMQStream)
338 342 resubmit=Instance(ZMQStream)
339 343 heartmonitor=Instance(HeartMonitor)
340 344 db=Instance(object)
341 345 client_info=Dict()
342 346 engine_info=Dict()
343 347
344 348
345 349 def __init__(self, **kwargs):
346 350 """
347 351 # universal:
348 352 loop: IOLoop for creating future connections
349 353 session: streamsession for sending serialized data
350 354 # engine:
351 355 queue: ZMQStream for monitoring queue messages
352 356 query: ZMQStream for engine+client registration and client requests
353 357 heartbeat: HeartMonitor object for tracking engines
354 358 # extra:
355 359 db: ZMQStream for db connection (NotImplemented)
356 360 engine_info: zmq address/protocol dict for engine connections
357 361 client_info: zmq address/protocol dict for client connections
358 362 """
359 363
360 364 super(Hub, self).__init__(**kwargs)
361 365 self.registration_timeout = max(5000, 2*self.heartmonitor.period)
362 366
363 367 # validate connection dicts:
364 368 for k,v in self.client_info.iteritems():
365 369 if k == 'task':
366 370 util.validate_url_container(v[1])
367 371 else:
368 372 util.validate_url_container(v)
369 373 # util.validate_url_container(self.client_info)
370 374 util.validate_url_container(self.engine_info)
371 375
372 376 # register our callbacks
373 377 self.query.on_recv(self.dispatch_query)
374 378 self.monitor.on_recv(self.dispatch_monitor_traffic)
375 379
376 380 self.heartmonitor.add_heart_failure_handler(self.handle_heart_failure)
377 381 self.heartmonitor.add_new_heart_handler(self.handle_new_heart)
378 382
379 383 self.monitor_handlers = { 'in' : self.save_queue_request,
380 384 'out': self.save_queue_result,
381 385 'intask': self.save_task_request,
382 386 'outtask': self.save_task_result,
383 387 'tracktask': self.save_task_destination,
384 388 'incontrol': _passer,
385 389 'outcontrol': _passer,
386 390 'iopub': self.save_iopub_message,
387 391 }
388 392
389 393 self.query_handlers = {'queue_request': self.queue_status,
390 394 'result_request': self.get_results,
391 395 'history_request': self.get_history,
392 396 'db_request': self.db_query,
393 397 'purge_request': self.purge_results,
394 398 'load_request': self.check_load,
395 399 'resubmit_request': self.resubmit_task,
396 400 'shutdown_request': self.shutdown_request,
397 401 'registration_request' : self.register_engine,
398 402 'unregistration_request' : self.unregister_engine,
399 403 'connection_request': self.connection_request,
400 404 }
401 405
402 406 # ignore resubmit replies
403 407 self.resubmit.on_recv(lambda msg: None, copy=False)
404 408
405 409 self.log.info("hub::created hub")
406 410
407 411 @property
408 412 def _next_id(self):
409 413 """gemerate a new ID.
410 414
411 415 No longer reuse old ids, just count from 0."""
412 416 newid = self._idcounter
413 417 self._idcounter += 1
414 418 return newid
415 419 # newid = 0
416 420 # incoming = [id[0] for id in self.incoming_registrations.itervalues()]
417 421 # # print newid, self.ids, self.incoming_registrations
418 422 # while newid in self.ids or newid in incoming:
419 423 # newid += 1
420 424 # return newid
421 425
422 426 #-----------------------------------------------------------------------------
423 427 # message validation
424 428 #-----------------------------------------------------------------------------
425 429
426 430 def _validate_targets(self, targets):
427 431 """turn any valid targets argument into a list of integer ids"""
428 432 if targets is None:
429 433 # default to all
430 434 targets = self.ids
431 435
432 436 if isinstance(targets, (int,str,unicode)):
433 437 # only one target specified
434 438 targets = [targets]
435 439 _targets = []
436 440 for t in targets:
437 441 # map raw identities to ids
438 442 if isinstance(t, (str,unicode)):
439 443 t = self.by_ident.get(t, t)
440 444 _targets.append(t)
441 445 targets = _targets
442 446 bad_targets = [ t for t in targets if t not in self.ids ]
443 447 if bad_targets:
444 448 raise IndexError("No Such Engine: %r"%bad_targets)
445 449 if not targets:
446 450 raise IndexError("No Engines Registered")
447 451 return targets
448 452
449 453 #-----------------------------------------------------------------------------
450 454 # dispatch methods (1 per stream)
451 455 #-----------------------------------------------------------------------------
452 456
453 457
454 458 def dispatch_monitor_traffic(self, msg):
455 459 """all ME and Task queue messages come through here, as well as
456 460 IOPub traffic."""
457 461 self.log.debug("monitor traffic: %r"%msg[:2])
458 462 switch = msg[0]
459 463 try:
460 464 idents, msg = self.session.feed_identities(msg[1:])
461 465 except ValueError:
462 466 idents=[]
463 467 if not idents:
464 468 self.log.error("Bad Monitor Message: %r"%msg)
465 469 return
466 470 handler = self.monitor_handlers.get(switch, None)
467 471 if handler is not None:
468 472 handler(idents, msg)
469 473 else:
470 474 self.log.error("Invalid monitor topic: %r"%switch)
471 475
472 476
473 477 def dispatch_query(self, msg):
474 478 """Route registration requests and queries from clients."""
475 479 try:
476 480 idents, msg = self.session.feed_identities(msg)
477 481 except ValueError:
478 482 idents = []
479 483 if not idents:
480 484 self.log.error("Bad Query Message: %r"%msg)
481 485 return
482 486 client_id = idents[0]
483 487 try:
484 488 msg = self.session.unpack_message(msg, content=True)
485 489 except Exception:
486 490 content = error.wrap_exception()
487 491 self.log.error("Bad Query Message: %r"%msg, exc_info=True)
488 492 self.session.send(self.query, "hub_error", ident=client_id,
489 493 content=content)
490 494 return
491 495 # print client_id, header, parent, content
492 496 #switch on message type:
493 497 msg_type = msg['msg_type']
494 498 self.log.info("client::client %r requested %r"%(client_id, msg_type))
495 499 handler = self.query_handlers.get(msg_type, None)
496 500 try:
497 501 assert handler is not None, "Bad Message Type: %r"%msg_type
498 502 except:
499 503 content = error.wrap_exception()
500 504 self.log.error("Bad Message Type: %r"%msg_type, exc_info=True)
501 505 self.session.send(self.query, "hub_error", ident=client_id,
502 506 content=content)
503 507 return
504 508
505 509 else:
506 510 handler(idents, msg)
507 511
508 512 def dispatch_db(self, msg):
509 513 """"""
510 514 raise NotImplementedError
511 515
512 516 #---------------------------------------------------------------------------
513 517 # handler methods (1 per event)
514 518 #---------------------------------------------------------------------------
515 519
516 520 #----------------------- Heartbeat --------------------------------------
517 521
518 522 def handle_new_heart(self, heart):
519 523 """handler to attach to heartbeater.
520 524 Called when a new heart starts to beat.
521 525 Triggers completion of registration."""
522 526 self.log.debug("heartbeat::handle_new_heart(%r)"%heart)
523 527 if heart not in self.incoming_registrations:
524 528 self.log.info("heartbeat::ignoring new heart: %r"%heart)
525 529 else:
526 530 self.finish_registration(heart)
527 531
528 532
529 533 def handle_heart_failure(self, heart):
530 534 """handler to attach to heartbeater.
531 535 called when a previously registered heart fails to respond to beat request.
532 536 triggers unregistration"""
533 537 self.log.debug("heartbeat::handle_heart_failure(%r)"%heart)
534 538 eid = self.hearts.get(heart, None)
535 539 if eid is None:
536 540 self.log.info("heartbeat::ignoring heart failure %r"%heart)
537 541 else:
538 542 queue = self.engines[eid].queue
539 543 self.unregister_engine(heart, dict(content=dict(id=eid, queue=queue)))
540 544
541 545 #----------------------- MUX Queue Traffic ------------------------------
542 546
543 547 def save_queue_request(self, idents, msg):
544 548 if len(idents) < 2:
545 549 self.log.error("invalid identity prefix: %r"%idents)
546 550 return
547 551 queue_id, client_id = idents[:2]
548 552 try:
549 553 msg = self.session.unpack_message(msg)
550 554 except Exception:
551 555 self.log.error("queue::client %r sent invalid message to %r: %r"%(client_id, queue_id, msg), exc_info=True)
552 556 return
553 557
554 558 eid = self.by_ident.get(queue_id, None)
555 559 if eid is None:
556 560 self.log.error("queue::target %r not registered"%queue_id)
557 561 self.log.debug("queue:: valid are: %r"%(self.by_ident.keys()))
558 562 return
559 563 record = init_record(msg)
560 564 msg_id = record['msg_id']
561 565 record['engine_uuid'] = queue_id
562 566 record['client_uuid'] = client_id
563 567 record['queue'] = 'mux'
564 568
565 569 try:
566 570 # it's possible iopub arrived first:
567 571 existing = self.db.get_record(msg_id)
568 572 for key,evalue in existing.iteritems():
569 573 rvalue = record.get(key, None)
570 574 if evalue and rvalue and evalue != rvalue:
571 575 self.log.warn("conflicting initial state for record: %r:%r <%r> %r"%(msg_id, rvalue, key, evalue))
572 576 elif evalue and not rvalue:
573 577 record[key] = evalue
574 578 try:
575 579 self.db.update_record(msg_id, record)
576 580 except Exception:
577 581 self.log.error("DB Error updating record %r"%msg_id, exc_info=True)
578 582 except KeyError:
579 583 try:
580 584 self.db.add_record(msg_id, record)
581 585 except Exception:
582 586 self.log.error("DB Error adding record %r"%msg_id, exc_info=True)
583 587
584 588
585 589 self.pending.add(msg_id)
586 590 self.queues[eid].append(msg_id)
587 591
588 592 def save_queue_result(self, idents, msg):
589 593 if len(idents) < 2:
590 594 self.log.error("invalid identity prefix: %r"%idents)
591 595 return
592 596
593 597 client_id, queue_id = idents[:2]
594 598 try:
595 599 msg = self.session.unpack_message(msg)
596 600 except Exception:
597 601 self.log.error("queue::engine %r sent invalid message to %r: %r"%(
598 602 queue_id,client_id, msg), exc_info=True)
599 603 return
600 604
601 605 eid = self.by_ident.get(queue_id, None)
602 606 if eid is None:
603 607 self.log.error("queue::unknown engine %r is sending a reply: "%queue_id)
604 608 return
605 609
606 610 parent = msg['parent_header']
607 611 if not parent:
608 612 return
609 613 msg_id = parent['msg_id']
610 614 if msg_id in self.pending:
611 615 self.pending.remove(msg_id)
612 616 self.all_completed.add(msg_id)
613 617 self.queues[eid].remove(msg_id)
614 618 self.completed[eid].append(msg_id)
615 619 elif msg_id not in self.all_completed:
616 620 # it could be a result from a dead engine that died before delivering the
617 621 # result
618 622 self.log.warn("queue:: unknown msg finished %r"%msg_id)
619 623 return
620 624 # update record anyway, because the unregistration could have been premature
621 625 rheader = msg['header']
622 626 completed = rheader['date']
623 627 started = rheader.get('started', None)
624 628 result = {
625 629 'result_header' : rheader,
626 630 'result_content': msg['content'],
627 631 'started' : started,
628 632 'completed' : completed
629 633 }
630 634
631 635 result['result_buffers'] = msg['buffers']
632 636 try:
633 637 self.db.update_record(msg_id, result)
634 638 except Exception:
635 639 self.log.error("DB Error updating record %r"%msg_id, exc_info=True)
636 640
637 641
638 642 #--------------------- Task Queue Traffic ------------------------------
639 643
640 644 def save_task_request(self, idents, msg):
641 645 """Save the submission of a task."""
642 646 client_id = idents[0]
643 647
644 648 try:
645 649 msg = self.session.unpack_message(msg)
646 650 except Exception:
647 651 self.log.error("task::client %r sent invalid task message: %r"%(
648 652 client_id, msg), exc_info=True)
649 653 return
650 654 record = init_record(msg)
651 655
652 656 record['client_uuid'] = client_id
653 657 record['queue'] = 'task'
654 658 header = msg['header']
655 659 msg_id = header['msg_id']
656 660 self.pending.add(msg_id)
657 661 self.unassigned.add(msg_id)
658 662 try:
659 663 # it's possible iopub arrived first:
660 664 existing = self.db.get_record(msg_id)
661 665 if existing['resubmitted']:
662 666 for key in ('submitted', 'client_uuid', 'buffers'):
663 667 # don't clobber these keys on resubmit
664 668 # submitted and client_uuid should be different
665 669 # and buffers might be big, and shouldn't have changed
666 670 record.pop(key)
667 671 # still check content,header which should not change
668 672 # but are not as expensive to compare as buffers are
669 673
670 674 for key,evalue in existing.iteritems():
671 675 if key.endswith('buffers'):
672 676 # don't compare buffers
673 677 continue
674 678 rvalue = record.get(key, None)
675 679 if evalue and rvalue and evalue != rvalue:
676 680 self.log.warn("conflicting initial state for record: %r:%r <%r> %r"%(msg_id, rvalue, key, evalue))
677 681 elif evalue and not rvalue:
678 682 record[key] = evalue
679 683 try:
680 684 self.db.update_record(msg_id, record)
681 685 except Exception:
682 686 self.log.error("DB Error updating record %r"%msg_id, exc_info=True)
683 687 except KeyError:
684 688 try:
685 689 self.db.add_record(msg_id, record)
686 690 except Exception:
687 691 self.log.error("DB Error adding record %r"%msg_id, exc_info=True)
688 692 except Exception:
689 693 self.log.error("DB Error saving task request %r"%msg_id, exc_info=True)
690 694
691 695 def save_task_result(self, idents, msg):
692 696 """save the result of a completed task."""
693 697 client_id = idents[0]
694 698 try:
695 699 msg = self.session.unpack_message(msg)
696 700 except Exception:
697 701 self.log.error("task::invalid task result message sent to %r: %r"%(
698 702 client_id, msg), exc_info=True)
699 703 return
700 704
701 705 parent = msg['parent_header']
702 706 if not parent:
703 707 # print msg
704 708 self.log.warn("Task %r had no parent!"%msg)
705 709 return
706 710 msg_id = parent['msg_id']
707 711 if msg_id in self.unassigned:
708 712 self.unassigned.remove(msg_id)
709 713
710 714 header = msg['header']
711 715 engine_uuid = header.get('engine', None)
712 716 eid = self.by_ident.get(engine_uuid, None)
713 717
714 718 if msg_id in self.pending:
715 719 self.pending.remove(msg_id)
716 720 self.all_completed.add(msg_id)
717 721 if eid is not None:
718 722 self.completed[eid].append(msg_id)
719 723 if msg_id in self.tasks[eid]:
720 724 self.tasks[eid].remove(msg_id)
721 725 completed = header['date']
722 726 started = header.get('started', None)
723 727 result = {
724 728 'result_header' : header,
725 729 'result_content': msg['content'],
726 730 'started' : started,
727 731 'completed' : completed,
728 732 'engine_uuid': engine_uuid
729 733 }
730 734
731 735 result['result_buffers'] = msg['buffers']
732 736 try:
733 737 self.db.update_record(msg_id, result)
734 738 except Exception:
735 739 self.log.error("DB Error saving task request %r"%msg_id, exc_info=True)
736 740
737 741 else:
738 742 self.log.debug("task::unknown task %r finished"%msg_id)
739 743
740 744 def save_task_destination(self, idents, msg):
741 745 try:
742 746 msg = self.session.unpack_message(msg, content=True)
743 747 except Exception:
744 748 self.log.error("task::invalid task tracking message", exc_info=True)
745 749 return
746 750 content = msg['content']
747 751 # print (content)
748 752 msg_id = content['msg_id']
749 753 engine_uuid = content['engine_id']
750 754 eid = self.by_ident[engine_uuid]
751 755
752 756 self.log.info("task::task %r arrived on %r"%(msg_id, eid))
753 757 if msg_id in self.unassigned:
754 758 self.unassigned.remove(msg_id)
755 759 # else:
756 760 # self.log.debug("task::task %r not listed as MIA?!"%(msg_id))
757 761
758 762 self.tasks[eid].append(msg_id)
759 763 # self.pending[msg_id][1].update(received=datetime.now(),engine=(eid,engine_uuid))
760 764 try:
761 765 self.db.update_record(msg_id, dict(engine_uuid=engine_uuid))
762 766 except Exception:
763 767 self.log.error("DB Error saving task destination %r"%msg_id, exc_info=True)
764 768
765 769
766 770 def mia_task_request(self, idents, msg):
767 771 raise NotImplementedError
768 772 client_id = idents[0]
769 773 # content = dict(mia=self.mia,status='ok')
770 774 # self.session.send('mia_reply', content=content, idents=client_id)
771 775
772 776
773 777 #--------------------- IOPub Traffic ------------------------------
774 778
775 779 def save_iopub_message(self, topics, msg):
776 780 """save an iopub message into the db"""
777 781 # print (topics)
778 782 try:
779 783 msg = self.session.unpack_message(msg, content=True)
780 784 except Exception:
781 785 self.log.error("iopub::invalid IOPub message", exc_info=True)
782 786 return
783 787
784 788 parent = msg['parent_header']
785 789 if not parent:
786 790 self.log.error("iopub::invalid IOPub message: %r"%msg)
787 791 return
788 792 msg_id = parent['msg_id']
789 793 msg_type = msg['msg_type']
790 794 content = msg['content']
791 795
792 796 # ensure msg_id is in db
793 797 try:
794 798 rec = self.db.get_record(msg_id)
795 799 except KeyError:
796 800 rec = empty_record()
797 801 rec['msg_id'] = msg_id
798 802 self.db.add_record(msg_id, rec)
799 803 # stream
800 804 d = {}
801 805 if msg_type == 'stream':
802 806 name = content['name']
803 807 s = rec[name] or ''
804 808 d[name] = s + content['data']
805 809
806 810 elif msg_type == 'pyerr':
807 811 d['pyerr'] = content
808 812 elif msg_type == 'pyin':
809 813 d['pyin'] = content['code']
810 814 else:
811 815 d[msg_type] = content.get('data', '')
812 816
813 817 try:
814 818 self.db.update_record(msg_id, d)
815 819 except Exception:
816 820 self.log.error("DB Error saving iopub message %r"%msg_id, exc_info=True)
817 821
818 822
819 823
820 824 #-------------------------------------------------------------------------
821 825 # Registration requests
822 826 #-------------------------------------------------------------------------
823 827
824 828 def connection_request(self, client_id, msg):
825 829 """Reply with connection addresses for clients."""
826 830 self.log.info("client::client %r connected"%client_id)
827 831 content = dict(status='ok')
828 832 content.update(self.client_info)
829 833 jsonable = {}
830 834 for k,v in self.keytable.iteritems():
831 835 if v not in self.dead_engines:
832 836 jsonable[str(k)] = v
833 837 content['engines'] = jsonable
834 838 self.session.send(self.query, 'connection_reply', content, parent=msg, ident=client_id)
835 839
836 840 def register_engine(self, reg, msg):
837 841 """Register a new engine."""
838 842 content = msg['content']
839 843 try:
840 844 queue = content['queue']
841 845 except KeyError:
842 846 self.log.error("registration::queue not specified", exc_info=True)
843 847 return
844 848 heart = content.get('heartbeat', None)
845 849 """register a new engine, and create the socket(s) necessary"""
846 850 eid = self._next_id
847 851 # print (eid, queue, reg, heart)
848 852
849 853 self.log.debug("registration::register_engine(%i, %r, %r, %r)"%(eid, queue, reg, heart))
850 854
851 855 content = dict(id=eid,status='ok')
852 856 content.update(self.engine_info)
853 857 # check if requesting available IDs:
854 858 if queue in self.by_ident:
855 859 try:
856 860 raise KeyError("queue_id %r in use"%queue)
857 861 except:
858 862 content = error.wrap_exception()
859 863 self.log.error("queue_id %r in use"%queue, exc_info=True)
860 864 elif heart in self.hearts: # need to check unique hearts?
861 865 try:
862 866 raise KeyError("heart_id %r in use"%heart)
863 867 except:
864 868 self.log.error("heart_id %r in use"%heart, exc_info=True)
865 869 content = error.wrap_exception()
866 870 else:
867 871 for h, pack in self.incoming_registrations.iteritems():
868 872 if heart == h:
869 873 try:
870 874 raise KeyError("heart_id %r in use"%heart)
871 875 except:
872 876 self.log.error("heart_id %r in use"%heart, exc_info=True)
873 877 content = error.wrap_exception()
874 878 break
875 879 elif queue == pack[1]:
876 880 try:
877 881 raise KeyError("queue_id %r in use"%queue)
878 882 except:
879 883 self.log.error("queue_id %r in use"%queue, exc_info=True)
880 884 content = error.wrap_exception()
881 885 break
882 886
883 887 msg = self.session.send(self.query, "registration_reply",
884 888 content=content,
885 889 ident=reg)
886 890
887 891 if content['status'] == 'ok':
888 892 if heart in self.heartmonitor.hearts:
889 893 # already beating
890 894 self.incoming_registrations[heart] = (eid,queue,reg[0],None)
891 895 self.finish_registration(heart)
892 896 else:
893 897 purge = lambda : self._purge_stalled_registration(heart)
894 898 dc = ioloop.DelayedCallback(purge, self.registration_timeout, self.loop)
895 899 dc.start()
896 900 self.incoming_registrations[heart] = (eid,queue,reg[0],dc)
897 901 else:
898 902 self.log.error("registration::registration %i failed: %r"%(eid, content['evalue']))
899 903 return eid
900 904
901 905 def unregister_engine(self, ident, msg):
902 906 """Unregister an engine that explicitly requested to leave."""
903 907 try:
904 908 eid = msg['content']['id']
905 909 except:
906 910 self.log.error("registration::bad engine id for unregistration: %r"%ident, exc_info=True)
907 911 return
908 912 self.log.info("registration::unregister_engine(%r)"%eid)
909 913 # print (eid)
910 914 uuid = self.keytable[eid]
911 915 content=dict(id=eid, queue=uuid)
912 916 self.dead_engines.add(uuid)
913 917 # self.ids.remove(eid)
914 918 # uuid = self.keytable.pop(eid)
915 919 #
916 920 # ec = self.engines.pop(eid)
917 921 # self.hearts.pop(ec.heartbeat)
918 922 # self.by_ident.pop(ec.queue)
919 923 # self.completed.pop(eid)
920 924 handleit = lambda : self._handle_stranded_msgs(eid, uuid)
921 925 dc = ioloop.DelayedCallback(handleit, self.registration_timeout, self.loop)
922 926 dc.start()
923 927 ############## TODO: HANDLE IT ################
924 928
925 929 if self.notifier:
926 930 self.session.send(self.notifier, "unregistration_notification", content=content)
927 931
928 932 def _handle_stranded_msgs(self, eid, uuid):
929 933 """Handle messages known to be on an engine when the engine unregisters.
930 934
931 935 It is possible that this will fire prematurely - that is, an engine will
932 936 go down after completing a result, and the client will be notified
933 937 that the result failed and later receive the actual result.
934 938 """
935 939
936 940 outstanding = self.queues[eid]
937 941
938 942 for msg_id in outstanding:
939 943 self.pending.remove(msg_id)
940 944 self.all_completed.add(msg_id)
941 945 try:
942 946 raise error.EngineError("Engine %r died while running task %r"%(eid, msg_id))
943 947 except:
944 948 content = error.wrap_exception()
945 949 # build a fake header:
946 950 header = {}
947 951 header['engine'] = uuid
948 952 header['date'] = datetime.now()
949 953 rec = dict(result_content=content, result_header=header, result_buffers=[])
950 954 rec['completed'] = header['date']
951 955 rec['engine_uuid'] = uuid
952 956 try:
953 957 self.db.update_record(msg_id, rec)
954 958 except Exception:
955 959 self.log.error("DB Error handling stranded msg %r"%msg_id, exc_info=True)
956 960
957 961
958 962 def finish_registration(self, heart):
959 963 """Second half of engine registration, called after our HeartMonitor
960 964 has received a beat from the Engine's Heart."""
961 965 try:
962 966 (eid,queue,reg,purge) = self.incoming_registrations.pop(heart)
963 967 except KeyError:
964 968 self.log.error("registration::tried to finish nonexistent registration", exc_info=True)
965 969 return
966 970 self.log.info("registration::finished registering engine %i:%r"%(eid,queue))
967 971 if purge is not None:
968 972 purge.stop()
969 973 control = queue
970 974 self.ids.add(eid)
971 975 self.keytable[eid] = queue
972 976 self.engines[eid] = EngineConnector(id=eid, queue=queue, registration=reg,
973 977 control=control, heartbeat=heart)
974 978 self.by_ident[queue] = eid
975 979 self.queues[eid] = list()
976 980 self.tasks[eid] = list()
977 981 self.completed[eid] = list()
978 982 self.hearts[heart] = eid
979 983 content = dict(id=eid, queue=self.engines[eid].queue)
980 984 if self.notifier:
981 985 self.session.send(self.notifier, "registration_notification", content=content)
982 986 self.log.info("engine::Engine Connected: %i"%eid)
983 987
984 988 def _purge_stalled_registration(self, heart):
985 989 if heart in self.incoming_registrations:
986 990 eid = self.incoming_registrations.pop(heart)[0]
987 991 self.log.info("registration::purging stalled registration: %i"%eid)
988 992 else:
989 993 pass
990 994
991 995 #-------------------------------------------------------------------------
992 996 # Client Requests
993 997 #-------------------------------------------------------------------------
994 998
995 999 def shutdown_request(self, client_id, msg):
996 1000 """handle shutdown request."""
997 1001 self.session.send(self.query, 'shutdown_reply', content={'status': 'ok'}, ident=client_id)
998 1002 # also notify other clients of shutdown
999 1003 self.session.send(self.notifier, 'shutdown_notice', content={'status': 'ok'})
1000 1004 dc = ioloop.DelayedCallback(lambda : self._shutdown(), 1000, self.loop)
1001 1005 dc.start()
1002 1006
1003 1007 def _shutdown(self):
1004 1008 self.log.info("hub::hub shutting down.")
1005 1009 time.sleep(0.1)
1006 1010 sys.exit(0)
1007 1011
1008 1012
1009 1013 def check_load(self, client_id, msg):
1010 1014 content = msg['content']
1011 1015 try:
1012 1016 targets = content['targets']
1013 1017 targets = self._validate_targets(targets)
1014 1018 except:
1015 1019 content = error.wrap_exception()
1016 1020 self.session.send(self.query, "hub_error",
1017 1021 content=content, ident=client_id)
1018 1022 return
1019 1023
1020 1024 content = dict(status='ok')
1021 1025 # loads = {}
1022 1026 for t in targets:
1023 1027 content[bytes(t)] = len(self.queues[t])+len(self.tasks[t])
1024 1028 self.session.send(self.query, "load_reply", content=content, ident=client_id)
1025 1029
1026 1030
1027 1031 def queue_status(self, client_id, msg):
1028 1032 """Return the Queue status of one or more targets.
1029 1033 If verbose: return the msg_ids;
1030 1034 else: return the count of each type.
1031 1035 keys: queue (pending MUX jobs)
1032 1036 tasks (pending Task jobs)
1033 1037 completed (finished jobs from both queues)"""
1034 1038 content = msg['content']
1035 1039 targets = content['targets']
1036 1040 try:
1037 1041 targets = self._validate_targets(targets)
1038 1042 except:
1039 1043 content = error.wrap_exception()
1040 1044 self.session.send(self.query, "hub_error",
1041 1045 content=content, ident=client_id)
1042 1046 return
1043 1047 verbose = content.get('verbose', False)
1044 1048 content = dict(status='ok')
1045 1049 for t in targets:
1046 1050 queue = self.queues[t]
1047 1051 completed = self.completed[t]
1048 1052 tasks = self.tasks[t]
1049 1053 if not verbose:
1050 1054 queue = len(queue)
1051 1055 completed = len(completed)
1052 1056 tasks = len(tasks)
1053 1057 content[bytes(t)] = {'queue': queue, 'completed': completed , 'tasks': tasks}
1054 1058 content['unassigned'] = list(self.unassigned) if verbose else len(self.unassigned)
1055 1059
1056 1060 self.session.send(self.query, "queue_reply", content=content, ident=client_id)
1057 1061
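For concreteness, a queue_reply for two engines with verbose=False might carry content shaped like this (structure taken from the code above; the numbers are invented):

    content = {
        'status': 'ok',
        '0': {'queue': 2, 'completed': 40, 'tasks': 1},
        '1': {'queue': 0, 'completed': 38, 'tasks': 3},
        'unassigned': 5,  # tasks not yet assigned to any engine
    }
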
1058 1062 def purge_results(self, client_id, msg):
1059 1063 """Purge results from memory. This method is more valuable before we move
1060 1064 to a DB-based message storage mechanism."""
1061 1065 content = msg['content']
1062 1066 msg_ids = content.get('msg_ids', [])
1063 1067 reply = dict(status='ok')
1064 1068 if msg_ids == 'all':
1065 1069 try:
1066 1070 self.db.drop_matching_records(dict(completed={'$ne':None}))
1067 1071 except Exception:
1068 1072 reply = error.wrap_exception()
1069 1073 else:
1070 1074 pending = filter(lambda m: m in self.pending, msg_ids)
1071 1075 if pending:
1072 1076 try:
1073 1077 raise IndexError("msg pending: %r"%pending[0])
1074 1078 except:
1075 1079 reply = error.wrap_exception()
1076 1080 else:
1077 1081 try:
1078 1082 self.db.drop_matching_records(dict(msg_id={'$in':msg_ids}))
1079 1083 except Exception:
1080 1084 reply = error.wrap_exception()
1081 1085
1082 1086 if reply['status'] == 'ok':
1083 1087 eids = content.get('engine_ids', [])
1084 1088 for eid in eids:
1085 1089 if eid not in self.engines:
1086 1090 try:
1087 1091 raise IndexError("No such engine: %i"%eid)
1088 1092 except:
1089 1093 reply = error.wrap_exception()
1090 1094 break
1091 1095 msg_ids = self.completed.pop(eid)
1092 1096 uid = self.engines[eid].queue
1093 1097 try:
1094 1098 self.db.drop_matching_records(dict(engine_uuid=uid, completed={'$ne':None}))
1095 1099 except Exception:
1096 1100 reply = error.wrap_exception()
1097 1101 break
1098 1102
1099 1103 self.session.send(self.query, 'purge_reply', content=reply, ident=client_id)
1100 1104
1101 1105 def resubmit_task(self, client_id, msg):
1102 1106 """Resubmit one or more tasks."""
1103 1107 def finish(reply):
1104 1108 self.session.send(self.query, 'resubmit_reply', content=reply, ident=client_id)
1105 1109
1106 1110 content = msg['content']
1107 1111 msg_ids = content['msg_ids']
1108 1112 reply = dict(status='ok')
1109 1113 try:
1110 1114 records = self.db.find_records({'msg_id' : {'$in' : msg_ids}}, keys=[
1111 1115 'header', 'content', 'buffers'])
1112 1116 except Exception:
1113 1117 self.log.error('db::db error finding tasks to resubmit', exc_info=True)
1114 1118 return finish(error.wrap_exception())
1115 1119
1116 1120 # validate msg_ids
1117 1121 found_ids = [ rec['msg_id'] for rec in records ]
1118 1122 invalid_ids = filter(lambda m: m in self.pending, found_ids)
1119 1123 if len(records) > len(msg_ids):
1120 1124 try:
1121 1125 raise RuntimeError("DB appears to be in an inconsistent state. "
1122 1126 "More matching records were found than should exist")
1123 1127 except Exception:
1124 1128 return finish(error.wrap_exception())
1125 1129 elif len(records) < len(msg_ids):
1126 1130 missing = [ m for m in msg_ids if m not in found_ids ]
1127 1131 try:
1128 1132 raise KeyError("No such msg(s): %r"%missing)
1129 1133 except KeyError:
1130 1134 return finish(error.wrap_exception())
1131 1135 elif invalid_ids:
1132 1136 msg_id = invalid_ids[0]
1133 1137 try:
1134 1138 raise ValueError("Task %r appears to be inflight"%(msg_id))
1135 1139 except Exception:
1136 1140 return finish(error.wrap_exception())
1137 1141
1138 1142 # clear the existing records
1139 1143 now = datetime.now()
1140 1144 rec = empty_record()
1141 1145 map(rec.pop, ['msg_id', 'header', 'content', 'buffers', 'submitted'])
1142 1146 rec['resubmitted'] = now
1143 1147 rec['queue'] = 'task'
1144 1148 rec['client_uuid'] = client_id[0]
1145 1149 try:
1146 1150 for msg_id in msg_ids:
1147 1151 self.all_completed.discard(msg_id)
1148 1152 self.db.update_record(msg_id, rec)
1149 1153 except Exception:
1150 1154 self.log.error('db::db error updating record', exc_info=True)
1151 1155 reply = error.wrap_exception()
1152 1156 else:
1153 1157 # send the messages
1154 1158 for rec in records:
1155 1159 header = rec['header']
1156 1160 # include resubmitted in header to prevent digest collision
1157 1161 header['resubmitted'] = now
1158 1162 msg = self.session.msg(header['msg_type'])
1159 1163 msg['content'] = rec['content']
1160 1164 msg['header'] = header
1161 1165 msg['msg_id'] = rec['msg_id']
1162 1166 self.session.send(self.resubmit, msg, buffers=rec['buffers'])
1163 1167
1164 1168 finish(dict(status='ok'))
1165 1169
1166 1170
1167 1171 def _extract_record(self, rec):
1168 1172 """decompose a TaskRecord dict into subsection of reply for get_result"""
1169 1173 io_dict = {}
1170 1174 for key in 'pyin pyout pyerr stdout stderr'.split():
1171 1175 io_dict[key] = rec[key]
1172 1176 content = { 'result_content': rec['result_content'],
1173 1177 'header': rec['header'],
1174 1178 'result_header' : rec['result_header'],
1175 1179 'io' : io_dict,
1176 1180 }
1177 1181 if rec['result_buffers']:
1178 1182 buffers = map(str, rec['result_buffers'])
1179 1183 else:
1180 1184 buffers = []
1181 1185
1182 1186 return content, buffers
1183 1187
1184 1188 def get_results(self, client_id, msg):
1185 1189 """Get the result of 1 or more messages."""
1186 1190 content = msg['content']
1187 1191 msg_ids = sorted(set(content['msg_ids']))
1188 1192 statusonly = content.get('status_only', False)
1189 1193 pending = []
1190 1194 completed = []
1191 1195 content = dict(status='ok')
1192 1196 content['pending'] = pending
1193 1197 content['completed'] = completed
1194 1198 buffers = []
1195 1199 if not statusonly:
1196 1200 try:
1197 1201 matches = self.db.find_records(dict(msg_id={'$in':msg_ids}))
1198 1202 # turn match list into dict, for faster lookup
1199 1203 records = {}
1200 1204 for rec in matches:
1201 1205 records[rec['msg_id']] = rec
1202 1206 except Exception:
1203 1207 content = error.wrap_exception()
1204 1208 self.session.send(self.query, "result_reply", content=content,
1205 1209 parent=msg, ident=client_id)
1206 1210 return
1207 1211 else:
1208 1212 records = {}
1209 1213 for msg_id in msg_ids:
1210 1214 if msg_id in self.pending:
1211 1215 pending.append(msg_id)
1212 1216 elif msg_id in self.all_completed:
1213 1217 completed.append(msg_id)
1214 1218 if not statusonly:
1215 1219 c,bufs = self._extract_record(records[msg_id])
1216 1220 content[msg_id] = c
1217 1221 buffers.extend(bufs)
1218 1222 elif msg_id in records:
1219 1223 if records[msg_id]['completed']:
1220 1224 completed.append(msg_id)
1221 1225 c,bufs = self._extract_record(records[msg_id])
1222 1226 content[msg_id] = c
1223 1227 buffers.extend(bufs)
1224 1228 else:
1225 1229 pending.append(msg_id)
1226 1230 else:
1227 1231 try:
1228 1232 raise KeyError('No such message: '+msg_id)
1229 1233 except:
1230 1234 content = error.wrap_exception()
1231 1235 break
1232 1236 self.session.send(self.query, "result_reply", content=content,
1233 1237 parent=msg, ident=client_id,
1234 1238 buffers=buffers)
1235 1239
1236 1240 def get_history(self, client_id, msg):
1237 1241 """Get a list of all msg_ids in our DB records"""
1238 1242 try:
1239 1243 msg_ids = self.db.get_history()
1240 1244 except Exception as e:
1241 1245 content = error.wrap_exception()
1242 1246 else:
1243 1247 content = dict(status='ok', history=msg_ids)
1244 1248
1245 1249 self.session.send(self.query, "history_reply", content=content,
1246 1250 parent=msg, ident=client_id)
1247 1251
1248 1252 def db_query(self, client_id, msg):
1249 1253 """Perform a raw query on the task record database."""
1250 1254 content = msg['content']
1251 1255 query = content.get('query', {})
1252 1256 keys = content.get('keys', None)
1253 1257 buffers = []
1254 1258 empty = list()
1255 1259 try:
1256 1260 records = self.db.find_records(query, keys)
1257 1261 except Exception as e:
1258 1262 content = error.wrap_exception()
1259 1263 else:
1260 1264 # extract buffers from reply content:
1261 1265 if keys is not None:
1262 1266 buffer_lens = [] if 'buffers' in keys else None
1263 1267 result_buffer_lens = [] if 'result_buffers' in keys else None
1264 1268 else:
1265 1269 buffer_lens = []
1266 1270 result_buffer_lens = []
1267 1271
1268 1272 for rec in records:
1269 1273 # buffers may be None, so double check
1270 1274 if buffer_lens is not None:
1271 1275 b = rec.pop('buffers', empty) or empty
1272 1276 buffer_lens.append(len(b))
1273 1277 buffers.extend(b)
1274 1278 if result_buffer_lens is not None:
1275 1279 rb = rec.pop('result_buffers', empty) or empty
1276 1280 result_buffer_lens.append(len(rb))
1277 1281 buffers.extend(rb)
1278 1282 content = dict(status='ok', records=records, buffer_lens=buffer_lens,
1279 1283 result_buffer_lens=result_buffer_lens)
1280 1284
1281 1285 self.session.send(self.query, "db_reply", content=content,
1282 1286 parent=msg, ident=client_id,
1283 1287 buffers=buffers)
1284 1288
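These handlers back the corresponding Client methods. A hedged sketch of driving db_query from the client side of this era, assuming a running cluster (the query uses the same mongodb-style operators the DB backends translate):

    from IPython.parallel import Client

    rc = Client()
    # fetch only two columns for every finished task:
    records = rc.db_query({'completed': {'$ne': None}},
                          keys=['msg_id', 'completed'])
    print(len(records))
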
@@ -1,112 +1,117 b''
1 """A TaskRecord backend using mongodb"""
1 """A TaskRecord backend using mongodb
2
3 Authors:
4
5 * Min RK
6 """
2 7 #-----------------------------------------------------------------------------
3 # Copyright (C) 2010 The IPython Development Team
8 # Copyright (C) 2010-2011 The IPython Development Team
4 9 #
5 10 # Distributed under the terms of the BSD License. The full license is in
6 11 # the file COPYING, distributed as part of this software.
7 12 #-----------------------------------------------------------------------------
8 13
9 14 from pymongo import Connection
10 15 from pymongo.binary import Binary
11 16
12 17 from IPython.utils.traitlets import Dict, List, Unicode, Instance
13 18
14 19 from .dictdb import BaseDB
15 20
16 21 #-----------------------------------------------------------------------------
17 22 # MongoDB class
18 23 #-----------------------------------------------------------------------------
19 24
20 25 class MongoDB(BaseDB):
21 26 """MongoDB TaskRecord backend."""
22 27
23 28 connection_args = List(config=True,
24 29 help="""Positional arguments to be passed to pymongo.Connection. Only
25 30 necessary if the default mongodb configuration does not point to your
26 31 mongod instance.""")
27 32 connection_kwargs = Dict(config=True,
28 33 help="""Keyword arguments to be passed to pymongo.Connection. Only
29 34 necessary if the default mongodb configuration does not point to your
30 35 mongod instance."""
31 36 )
32 37 database = Unicode(config=True,
33 38 help="""The MongoDB database name to use for storing tasks for this session. If unspecified,
34 39 a new database will be created with the Hub's IDENT. Specifying the database will result
35 40 in tasks from previous sessions being available via Clients' db_query and
36 41 get_result methods.""")
37 42
38 43 _connection = Instance(Connection) # pymongo connection
39 44
40 45 def __init__(self, **kwargs):
41 46 super(MongoDB, self).__init__(**kwargs)
42 47 if self._connection is None:
43 48 self._connection = Connection(*self.connection_args, **self.connection_kwargs)
44 49 if not self.database:
45 50 self.database = self.session
46 51 self._db = self._connection[self.database]
47 52 self._records = self._db['task_records']
48 53 self._records.ensure_index('msg_id', unique=True)
49 54 self._records.ensure_index('submitted') # for sorting history
50 55 # for rec in self._records.find
51 56
52 57 def _binary_buffers(self, rec):
53 58 for key in ('buffers', 'result_buffers'):
54 59 if rec.get(key, None):
55 60 rec[key] = map(Binary, rec[key])
56 61 return rec
57 62
58 63 def add_record(self, msg_id, rec):
59 64 """Add a new Task Record, by msg_id."""
60 65 # print rec
61 66 rec = self._binary_buffers(rec)
62 67 self._records.insert(rec)
63 68
64 69 def get_record(self, msg_id):
65 70 """Get a specific Task Record, by msg_id."""
66 71 r = self._records.find_one({'msg_id': msg_id})
67 72 if not r:
68 73 # r will be None if nothing is found
69 74 raise KeyError(msg_id)
70 75 return r
71 76
72 77 def update_record(self, msg_id, rec):
73 78 """Update the data in an existing record."""
74 79 rec = self._binary_buffers(rec)
75 80
76 81 self._records.update({'msg_id':msg_id}, {'$set': rec})
77 82
78 83 def drop_matching_records(self, check):
79 84 """Remove a record from the DB."""
80 85 self._records.remove(check)
81 86
82 87 def drop_record(self, msg_id):
83 88 """Remove a record from the DB."""
84 89 self._records.remove({'msg_id':msg_id})
85 90
86 91 def find_records(self, check, keys=None):
87 92 """Find records matching a query dict, optionally extracting subset of keys.
88 93
89 94 Returns list of matching records.
90 95
91 96 Parameters
92 97 ----------
93 98
94 99 check: dict
95 100 mongodb-style query argument
96 101 keys: list of strs [optional]
97 102 if specified, the subset of keys to extract. msg_id will *always* be
98 103 included.
99 104 """
100 105 if keys and 'msg_id' not in keys:
101 106 keys.append('msg_id')
102 107 matches = list(self._records.find(check,keys))
103 108 for rec in matches:
104 109 rec.pop('_id')
105 110 return matches
106 111
107 112 def get_history(self):
108 113 """get all msg_ids, ordered by time submitted."""
109 114 cursor = self._records.find({},{'msg_id':1}).sort('submitted')
110 115 return [ rec['msg_id'] for rec in cursor ]
111 116
112 117
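To use this backend, point the controller's HubFactory at it from a config file. A minimal sketch (the database name and connection details are invented):

    # in e.g. ipcontroller_config.py
    c = get_config()
    c.HubFactory.db_class = 'IPython.parallel.controller.mongodb.MongoDB'
    c.MongoDB.database = u'ipython_tasks'  # fixed name: reuse across sessions
    c.MongoDB.connection_kwargs = {'host': 'localhost', 'port': 27017}
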
@@ -1,688 +1,692 b''
1 1 """The Python scheduler for rich scheduling.
2 2
3 3 The Pure ZMQ scheduler does not allow routing schemes other than LRU,
4 4 nor does it check msg_id DAG dependencies. For those, a slightly slower
5 5 Python Scheduler exists.
6
7 Authors:
8
9 * Min RK
6 10 """
7 11 #-----------------------------------------------------------------------------
8 12 # Copyright (C) 2010-2011 The IPython Development Team
9 13 #
10 14 # Distributed under the terms of the BSD License. The full license is in
11 15 # the file COPYING, distributed as part of this software.
12 16 #-----------------------------------------------------------------------------
13 17
14 18 #----------------------------------------------------------------------
15 19 # Imports
16 20 #----------------------------------------------------------------------
17 21
18 22 from __future__ import print_function
19 23
20 24 import logging
21 25 import sys
22 26
23 27 from datetime import datetime, timedelta
24 28 from random import randint, random
25 29 from types import FunctionType
26 30
27 31 try:
28 32 import numpy
29 33 except ImportError:
30 34 numpy = None
31 35
32 36 import zmq
33 37 from zmq.eventloop import ioloop, zmqstream
34 38
35 39 # local imports
36 40 from IPython.external.decorator import decorator
37 41 from IPython.config.loader import Config
38 42 from IPython.utils.traitlets import Instance, Dict, List, Set, Int, Str, Enum
39 43
40 44 from IPython.parallel import error
41 45 from IPython.parallel.factory import SessionFactory
42 46 from IPython.parallel.util import connect_logger, local_logger
43 47
44 48 from .dependency import Dependency
45 49
46 50 @decorator
47 51 def logged(f,self,*args,**kwargs):
48 52 # print ("#--------------------")
49 53 self.log.debug("scheduler::%s(*%s,**%s)"%(f.func_name, args, kwargs))
50 54 # print ("#--")
51 55 return f(self,*args, **kwargs)
52 56
53 57 #----------------------------------------------------------------------
54 58 # Chooser functions
55 59 #----------------------------------------------------------------------
56 60
57 61 def plainrandom(loads):
58 62 """Plain random pick."""
59 63 n = len(loads)
60 64 return randint(0,n-1)
61 65
62 66 def lru(loads):
63 67 """Always pick the front of the line.
64 68
65 69 The content of `loads` is ignored.
66 70
67 71 Assumes LRU ordering of loads, with oldest first.
68 72 """
69 73 return 0
70 74
71 75 def twobin(loads):
72 76 """Pick two at random, use the LRU of the two.
73 77
74 78 The content of loads is ignored.
75 79
76 80 Assumes LRU ordering of loads, with oldest first.
77 81 """
78 82 n = len(loads)
79 83 a = randint(0,n-1)
80 84 b = randint(0,n-1)
81 85 return min(a,b)
82 86
83 87 def weighted(loads):
84 88 """Pick two at random using inverse load as weight.
85 89
86 90 Return the less loaded of the two.
87 91 """
88 92 # weight 0 a million times more than 1:
89 93 weights = 1./(1e-6+numpy.array(loads))
90 94 sums = weights.cumsum()
91 95 t = sums[-1]
92 96 x = random()*t
93 97 y = random()*t
94 98 idx = 0
95 99 idy = 0
96 100 while sums[idx] < x:
97 101 idx += 1
98 102 while sums[idy] < y:
99 103 idy += 1
100 104 if weights[idy] > weights[idx]:
101 105 return idy
102 106 else:
103 107 return idx
104 108
105 109 def leastload(loads):
106 110 """Always choose the lowest load.
107 111
108 112 If the lowest load occurs more than once, the first
109 113 occurrence will be used. If loads has LRU ordering, this means
110 114 the LRU of those with the lowest load is chosen.
111 115 """
112 116 return loads.index(min(loads))
113 117
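Each chooser above maps a list of per-engine loads to the index of the engine to pick, which is the whole contract the TaskScheduler relies on. A quick illustration (assumes the functions above are in scope):

    loads = [3, 0, 2, 0]
    assert leastload(loads) == 1            # first occurrence of the minimum
    assert lru(loads) == 0                  # always the head of the line
    assert 0 <= twobin(loads) < len(loads)  # min of two random picks
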
114 118 #---------------------------------------------------------------------
115 119 # Classes
116 120 #---------------------------------------------------------------------
117 121 # store empty default dependency:
118 122 MET = Dependency([])
119 123
120 124 class TaskScheduler(SessionFactory):
121 125 """Python TaskScheduler object.
122 126
123 127 This is the simplest object that supports msg_id based
124 128 DAG dependencies. *Only* task msg_ids are checked, not
125 129 msg_ids of jobs submitted via the MUX queue.
126 130
127 131 """
128 132
129 133 hwm = Int(0, config=True, shortname='hwm',
130 134 help="""specify the High Water Mark (HWM) for the downstream
131 135 socket in the Task scheduler. This is the maximum number
132 136 of allowed outstanding tasks on each engine."""
133 137 )
134 138 scheme_name = Enum(('leastload', 'pure', 'lru', 'plainrandom', 'weighted', 'twobin'),
135 139 'leastload', config=True, shortname='scheme', allow_none=False,
136 140 help="""select the task scheduler scheme [default: Python LRU]
137 141 Options are: 'pure', 'lru', 'plainrandom', 'weighted', 'twobin','leastload'"""
138 142 )
139 143 def _scheme_name_changed(self, old, new):
140 144 self.log.debug("Using scheme %r"%new)
141 145 self.scheme = globals()[new]
142 146
143 147 # input arguments:
144 148 scheme = Instance(FunctionType) # function for determining the destination
145 149 def _scheme_default(self):
146 150 return leastload
147 151 client_stream = Instance(zmqstream.ZMQStream) # client-facing stream
148 152 engine_stream = Instance(zmqstream.ZMQStream) # engine-facing stream
149 153 notifier_stream = Instance(zmqstream.ZMQStream) # hub-facing sub stream
150 154 mon_stream = Instance(zmqstream.ZMQStream) # hub-facing pub stream
151 155
152 156 # internals:
153 157 graph = Dict() # dict by msg_id of [ msg_ids that depend on key ]
154 158 retries = Dict() # dict by msg_id of retries remaining (non-neg ints)
155 159 # waiting = List() # list of msg_ids ready to run, but haven't due to HWM
156 160 depending = Dict() # dict by msg_id of (msg_id, raw_msg, after, follow)
157 161 pending = Dict() # dict by engine_uuid of submitted tasks
158 162 completed = Dict() # dict by engine_uuid of completed tasks
159 163 failed = Dict() # dict by engine_uuid of failed tasks
160 164 destinations = Dict() # dict by msg_id of engine_uuids where jobs ran (reverse of completed+failed)
161 165 clients = Dict() # dict by msg_id for who submitted the task
162 166 targets = List() # list of target IDENTs
163 167 loads = List() # list of engine loads
164 168 # full = Set() # set of IDENTs that have HWM outstanding tasks
165 169 all_completed = Set() # set of all completed tasks
166 170 all_failed = Set() # set of all failed tasks
167 171 all_done = Set() # set of all finished tasks=union(completed,failed)
168 172 all_ids = Set() # set of all submitted task IDs
169 173 blacklist = Dict() # dict by msg_id of locations where a job has encountered UnmetDependency
170 174 auditor = Instance('zmq.eventloop.ioloop.PeriodicCallback')
171 175
172 176
173 177 def start(self):
174 178 self.engine_stream.on_recv(self.dispatch_result, copy=False)
175 179 self._notification_handlers = dict(
176 180 registration_notification = self._register_engine,
177 181 unregistration_notification = self._unregister_engine
178 182 )
179 183 self.notifier_stream.on_recv(self.dispatch_notification)
180 184 self.auditor = ioloop.PeriodicCallback(self.audit_timeouts, 2e3, self.loop) # every 2s (0.5 Hz)
181 185 self.auditor.start()
182 186 self.log.info("Scheduler started [%s]"%self.scheme_name)
183 187
184 188 def resume_receiving(self):
185 189 """Resume accepting jobs."""
186 190 self.client_stream.on_recv(self.dispatch_submission, copy=False)
187 191
188 192 def stop_receiving(self):
189 193 """Stop accepting jobs while there are no engines.
190 194 Leave them in the ZMQ queue."""
191 195 self.client_stream.on_recv(None)
192 196
193 197 #-----------------------------------------------------------------------
194 198 # [Un]Registration Handling
195 199 #-----------------------------------------------------------------------
196 200
197 201 def dispatch_notification(self, msg):
198 202 """dispatch register/unregister events."""
199 203 try:
200 204 idents,msg = self.session.feed_identities(msg)
201 205 except ValueError:
202 206 self.log.warn("task::Invalid Message: %r"%msg)
203 207 return
204 208 try:
205 209 msg = self.session.unpack_message(msg)
206 210 except ValueError:
207 211 self.log.warn("task::Unauthorized message from: %r"%idents)
208 212 return
209 213
210 214 msg_type = msg['msg_type']
211 215
212 216 handler = self._notification_handlers.get(msg_type, None)
213 217 if handler is None:
214 218 self.log.error("Unhandled message type: %r"%msg_type)
215 219 else:
216 220 try:
217 221 handler(str(msg['content']['queue']))
218 222 except KeyError:
219 223 self.log.error("task::Invalid notification msg: %r"%msg)
220 224
221 225 @logged
222 226 def _register_engine(self, uid):
223 227 """New engine with ident `uid` became available."""
224 228 # head of the line:
225 229 self.targets.insert(0,uid)
226 230 self.loads.insert(0,0)
227 231 # initialize sets
228 232 self.completed[uid] = set()
229 233 self.failed[uid] = set()
230 234 self.pending[uid] = {}
231 235 if len(self.targets) == 1:
232 236 self.resume_receiving()
233 237 # rescan the graph:
234 238 self.update_graph(None)
235 239
236 240 def _unregister_engine(self, uid):
237 241 """Existing engine with ident `uid` became unavailable."""
238 242 if len(self.targets) == 1:
239 243 # this was our only engine
240 244 self.stop_receiving()
241 245
242 246 # handle any potentially finished tasks:
243 247 self.engine_stream.flush()
244 248
245 249 # don't pop destinations, because they might be used later
246 250 # map(self.destinations.pop, self.completed.pop(uid))
247 251 # map(self.destinations.pop, self.failed.pop(uid))
248 252
249 253 # prevent this engine from receiving work
250 254 idx = self.targets.index(uid)
251 255 self.targets.pop(idx)
252 256 self.loads.pop(idx)
253 257
254 258 # wait 5 seconds before cleaning up pending jobs, since the results might
255 259 # still be incoming
256 260 if self.pending[uid]:
257 261 dc = ioloop.DelayedCallback(lambda : self.handle_stranded_tasks(uid), 5000, self.loop)
258 262 dc.start()
259 263 else:
260 264 self.completed.pop(uid)
261 265 self.failed.pop(uid)
262 266
263 267
264 268 @logged
265 269 def handle_stranded_tasks(self, engine):
266 270 """Deal with jobs resident in an engine that died."""
267 271 lost = self.pending[engine]
268 272 for msg_id in lost.keys():
269 273 if msg_id not in self.pending[engine]:
270 274 # prevent double-handling of messages
271 275 continue
272 276
273 277 raw_msg = lost[msg_id][0]
274 278 idents,msg = self.session.feed_identities(raw_msg, copy=False)
275 279 parent = self.session.unpack(msg[1].bytes)
276 280 idents = [engine, idents[0]]
277 281
278 282 # build fake error reply
279 283 try:
280 284 raise error.EngineError("Engine %r died while running task %r"%(engine, msg_id))
281 285 except:
282 286 content = error.wrap_exception()
283 287 msg = self.session.msg('apply_reply', content, parent=parent, subheader={'status':'error'})
284 288 raw_reply = map(zmq.Message, self.session.serialize(msg, ident=idents))
285 289 # and dispatch it
286 290 self.dispatch_result(raw_reply)
287 291
288 292 # finally scrub completed/failed lists
289 293 self.completed.pop(engine)
290 294 self.failed.pop(engine)
291 295
292 296
293 297 #-----------------------------------------------------------------------
294 298 # Job Submission
295 299 #-----------------------------------------------------------------------
296 300 @logged
297 301 def dispatch_submission(self, raw_msg):
298 302 """Dispatch job submission to appropriate handlers."""
299 303 # ensure targets up to date:
300 304 self.notifier_stream.flush()
301 305 try:
302 306 idents, msg = self.session.feed_identities(raw_msg, copy=False)
303 307 msg = self.session.unpack_message(msg, content=False, copy=False)
304 308 except Exception:
305 309 self.log.error("task::Invalid task msg: %r"%raw_msg, exc_info=True)
306 310 return
307 311
308 312
309 313 # send to monitor
310 314 self.mon_stream.send_multipart(['intask']+raw_msg, copy=False)
311 315
312 316 header = msg['header']
313 317 msg_id = header['msg_id']
314 318 self.all_ids.add(msg_id)
315 319
316 320 # targets
317 321 targets = set(header.get('targets', []))
318 322 retries = header.get('retries', 0)
319 323 self.retries[msg_id] = retries
320 324
321 325 # time dependencies
322 326 after = Dependency(header.get('after', []))
323 327 if after.all:
324 328 if after.success:
325 329 after.difference_update(self.all_completed)
326 330 if after.failure:
327 331 after.difference_update(self.all_failed)
328 332 if after.check(self.all_completed, self.all_failed):
329 333 # recast as empty set, if `after` already met,
330 334 # to prevent unnecessary set comparisons
331 335 after = MET
332 336
333 337 # location dependencies
334 338 follow = Dependency(header.get('follow', []))
335 339
336 340 # turn timeouts into datetime objects:
337 341 timeout = header.get('timeout', None)
338 342 if timeout:
339 343 timeout = datetime.now() + timedelta(0,timeout,0)
340 344
341 345 args = [raw_msg, targets, after, follow, timeout]
342 346
343 347 # validate and reduce dependencies:
344 348 for dep in after,follow:
345 349 # check valid:
346 350 if msg_id in dep or dep.difference(self.all_ids):
347 351 self.depending[msg_id] = args
348 352 return self.fail_unreachable(msg_id, error.InvalidDependency)
349 353 # check if unreachable:
350 354 if dep.unreachable(self.all_completed, self.all_failed):
351 355 self.depending[msg_id] = args
352 356 return self.fail_unreachable(msg_id)
353 357
354 358 if after.check(self.all_completed, self.all_failed):
355 359 # time deps already met, try to run
356 360 if not self.maybe_run(msg_id, *args):
357 361 # can't run yet
358 362 if msg_id not in self.all_failed:
359 363 # could have failed as unreachable
360 364 self.save_unmet(msg_id, *args)
361 365 else:
362 366 self.save_unmet(msg_id, *args)
363 367
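The after/follow headers consumed above are set on the client side. A hedged sketch using the LoadBalancedView API of the same era, assuming a running cluster:

    from IPython.parallel import Client

    rc = Client()
    view = rc.load_balanced_view()

    def f():
        return 2

    ar = view.apply_async(f)
    # run the second task only after ar succeeds, on the engine where ar ran:
    with view.temp_flags(after=[ar], follow=[ar]):
        ar2 = view.apply_async(f)
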
364 368 # @logged
365 369 def audit_timeouts(self):
366 370 """Audit all waiting tasks for expired timeouts."""
367 371 now = datetime.now()
368 372 for msg_id in self.depending.keys():
369 373 # must recheck, in case one failure cascaded to another:
370 374 if msg_id in self.depending:
371 375 raw,targets,after,follow,timeout = self.depending[msg_id]
372 376 if timeout and timeout < now:
373 377 self.fail_unreachable(msg_id, error.TaskTimeout)
374 378
375 379 @logged
376 380 def fail_unreachable(self, msg_id, why=error.ImpossibleDependency):
377 381 """a task has become unreachable, send a reply with an ImpossibleDependency
378 382 error."""
379 383 if msg_id not in self.depending:
380 384 self.log.error("msg %r already failed!"%msg_id)
381 385 return
382 386 raw_msg,targets,after,follow,timeout = self.depending.pop(msg_id)
383 387 for mid in follow.union(after):
384 388 if mid in self.graph:
385 389 self.graph[mid].remove(msg_id)
386 390
387 391 # FIXME: unpacking a message I've already unpacked, but didn't save:
388 392 idents,msg = self.session.feed_identities(raw_msg, copy=False)
389 393 header = self.session.unpack(msg[1].bytes)
390 394
391 395 try:
392 396 raise why()
393 397 except:
394 398 content = error.wrap_exception()
395 399
396 400 self.all_done.add(msg_id)
397 401 self.all_failed.add(msg_id)
398 402
399 403 msg = self.session.send(self.client_stream, 'apply_reply', content,
400 404 parent=header, ident=idents)
401 405 self.session.send(self.mon_stream, msg, ident=['outtask']+idents)
402 406
403 407 self.update_graph(msg_id, success=False)
404 408
405 409 @logged
406 410 def maybe_run(self, msg_id, raw_msg, targets, after, follow, timeout):
407 411 """check location dependencies, and run if they are met."""
408 412 blacklist = self.blacklist.setdefault(msg_id, set())
409 413 if follow or targets or blacklist or self.hwm:
410 414 # we need a can_run filter
411 415 def can_run(idx):
412 416 # check hwm
413 417 if self.hwm and self.loads[idx] == self.hwm:
414 418 return False
415 419 target = self.targets[idx]
416 420 # check blacklist
417 421 if target in blacklist:
418 422 return False
419 423 # check targets
420 424 if targets and target not in targets:
421 425 return False
422 426 # check follow
423 427 return follow.check(self.completed[target], self.failed[target])
424 428
425 429 indices = filter(can_run, range(len(self.targets)))
426 430
427 431 if not indices:
428 432 # couldn't run
429 433 if follow.all:
430 434 # check follow for impossibility
431 435 dests = set()
432 436 relevant = set()
433 437 if follow.success:
434 438 relevant = self.all_completed
435 439 if follow.failure:
436 440 relevant = relevant.union(self.all_failed)
437 441 for m in follow.intersection(relevant):
438 442 dests.add(self.destinations[m])
439 443 if len(dests) > 1:
440 444 self.depending[msg_id] = (raw_msg, targets, after, follow, timeout)
441 445 self.fail_unreachable(msg_id)
442 446 return False
443 447 if targets:
444 448 # check blacklist+targets for impossibility
445 449 targets.difference_update(blacklist)
446 450 if not targets or not targets.intersection(self.targets):
447 451 self.depending[msg_id] = (raw_msg, targets, after, follow, timeout)
448 452 self.fail_unreachable(msg_id)
449 453 return False
450 454 return False
451 455 else:
452 456 indices = None
453 457
454 458 self.submit_task(msg_id, raw_msg, targets, follow, timeout, indices)
455 459 return True
456 460
457 461 @logged
458 462 def save_unmet(self, msg_id, raw_msg, targets, after, follow, timeout):
459 463 """Save a message for later submission when its dependencies are met."""
460 464 self.depending[msg_id] = [raw_msg,targets,after,follow,timeout]
461 465 # track the ids in follow or after, but not those already finished
462 466 for dep_id in after.union(follow).difference(self.all_done):
463 467 if dep_id not in self.graph:
464 468 self.graph[dep_id] = set()
465 469 self.graph[dep_id].add(msg_id)
466 470
467 471 @logged
468 472 def submit_task(self, msg_id, raw_msg, targets, follow, timeout, indices=None):
469 473 """Submit a task to any of a subset of our targets."""
470 474 if indices:
471 475 loads = [self.loads[i] for i in indices]
472 476 else:
473 477 loads = self.loads
474 478 idx = self.scheme(loads)
475 479 if indices:
476 480 idx = indices[idx]
477 481 target = self.targets[idx]
478 482 # print (target, map(str, msg[:3]))
479 483 # send job to the engine
480 484 self.engine_stream.send(target, flags=zmq.SNDMORE, copy=False)
481 485 self.engine_stream.send_multipart(raw_msg, copy=False)
482 486 # update load
483 487 self.add_job(idx)
484 488 self.pending[target][msg_id] = (raw_msg, targets, MET, follow, timeout)
485 489 # notify Hub
486 490 content = dict(msg_id=msg_id, engine_id=target)
487 491 self.session.send(self.mon_stream, 'task_destination', content=content,
488 492 ident=['tracktask',self.session.session])
489 493
490 494
491 495 #-----------------------------------------------------------------------
492 496 # Result Handling
493 497 #-----------------------------------------------------------------------
494 498 @logged
495 499 def dispatch_result(self, raw_msg):
496 500 """dispatch method for result replies"""
497 501 try:
498 502 idents,msg = self.session.feed_identities(raw_msg, copy=False)
499 503 msg = self.session.unpack_message(msg, content=False, copy=False)
500 504 engine = idents[0]
501 505 try:
502 506 idx = self.targets.index(engine)
503 507 except ValueError:
504 508 pass # skip load-update for dead engines
505 509 else:
506 510 self.finish_job(idx)
507 511 except Exception:
508 512 self.log.error("task::Invalid result: %r"%raw_msg, exc_info=True)
509 513 return
510 514
511 515 header = msg['header']
512 516 parent = msg['parent_header']
513 517 if header.get('dependencies_met', True):
514 518 success = (header['status'] == 'ok')
515 519 msg_id = parent['msg_id']
516 520 retries = self.retries[msg_id]
517 521 if not success and retries > 0:
518 522 # failed
519 523 self.retries[msg_id] = retries - 1
520 524 self.handle_unmet_dependency(idents, parent)
521 525 else:
522 526 del self.retries[msg_id]
523 527 # relay to client and update graph
524 528 self.handle_result(idents, parent, raw_msg, success)
525 529 # send to Hub monitor
526 530 self.mon_stream.send_multipart(['outtask']+raw_msg, copy=False)
527 531 else:
528 532 self.handle_unmet_dependency(idents, parent)
529 533
530 534 @logged
531 535 def handle_result(self, idents, parent, raw_msg, success=True):
532 536 """handle a real task result, either success or failure"""
533 537 # first, relay result to client
534 538 engine = idents[0]
535 539 client = idents[1]
536 540 # swap_ids for XREP-XREP mirror
537 541 raw_msg[:2] = [client,engine]
538 542 # print (map(str, raw_msg[:4]))
539 543 self.client_stream.send_multipart(raw_msg, copy=False)
540 544 # now, update our data structures
541 545 msg_id = parent['msg_id']
542 546 self.blacklist.pop(msg_id, None)
543 547 self.pending[engine].pop(msg_id)
544 548 if success:
545 549 self.completed[engine].add(msg_id)
546 550 self.all_completed.add(msg_id)
547 551 else:
548 552 self.failed[engine].add(msg_id)
549 553 self.all_failed.add(msg_id)
550 554 self.all_done.add(msg_id)
551 555 self.destinations[msg_id] = engine
552 556
553 557 self.update_graph(msg_id, success)
554 558
555 559 @logged
556 560 def handle_unmet_dependency(self, idents, parent):
557 561 """handle an unmet dependency"""
558 562 engine = idents[0]
559 563 msg_id = parent['msg_id']
560 564
561 565 if msg_id not in self.blacklist:
562 566 self.blacklist[msg_id] = set()
563 567 self.blacklist[msg_id].add(engine)
564 568
565 569 args = self.pending[engine].pop(msg_id)
566 570 raw,targets,after,follow,timeout = args
567 571
568 572 if self.blacklist[msg_id] == targets:
569 573 self.depending[msg_id] = args
570 574 self.fail_unreachable(msg_id)
571 575 elif not self.maybe_run(msg_id, *args):
572 576 # resubmit failed
573 577 if msg_id not in self.all_failed:
574 578 # put it back in our dependency tree
575 579 self.save_unmet(msg_id, *args)
576 580
577 581 if self.hwm:
578 582 try:
579 583 idx = self.targets.index(engine)
580 584 except ValueError:
581 585 pass # skip load-update for dead engines
582 586 else:
583 587 if self.loads[idx] == self.hwm-1:
584 588 self.update_graph(None)
585 589
586 590
587 591
588 592 @logged
589 593 def update_graph(self, dep_id=None, success=True):
590 594 """dep_id just finished. Update our dependency
591 595 graph and submit any jobs that just became runnable.
592 596
593 597 Called with dep_id=None to update entire graph for hwm, but without finishing
594 598 a task.
595 599 """
596 600 # print ("\n\n***********")
597 601 # pprint (dep_id)
598 602 # pprint (self.graph)
599 603 # pprint (self.depending)
600 604 # pprint (self.all_completed)
601 605 # pprint (self.all_failed)
602 606 # print ("\n\n***********\n\n")
603 607 # update any jobs that depended on the dependency
604 608 jobs = self.graph.pop(dep_id, [])
605 609
606 610 # recheck *all* jobs if
607 611 # a) we have HWM and an engine just became no longer full
608 612 # or b) dep_id was given as None
609 613 if dep_id is None or self.hwm and any( [ load==self.hwm-1 for load in self.loads ]):
610 614 jobs = self.depending.keys()
611 615
612 616 for msg_id in jobs:
613 617 raw_msg, targets, after, follow, timeout = self.depending[msg_id]
614 618
615 619 if after.unreachable(self.all_completed, self.all_failed)\
616 620 or follow.unreachable(self.all_completed, self.all_failed):
617 621 self.fail_unreachable(msg_id)
618 622
619 623 elif after.check(self.all_completed, self.all_failed): # time deps met, maybe run
620 624 if self.maybe_run(msg_id, raw_msg, targets, MET, follow, timeout):
621 625
622 626 self.depending.pop(msg_id)
623 627 for mid in follow.union(after):
624 628 if mid in self.graph:
625 629 self.graph[mid].remove(msg_id)
626 630
627 631 #----------------------------------------------------------------------
628 632 # methods to be overridden by subclasses
629 633 #----------------------------------------------------------------------
630 634
631 635 def add_job(self, idx):
632 636 """Called after self.targets[idx] just got the job with header.
633 637 Override in subclasses. The default ordering is simple LRU.
634 638 The default loads are the number of outstanding jobs."""
635 639 self.loads[idx] += 1
636 640 for lis in (self.targets, self.loads):
637 641 lis.append(lis.pop(idx))
638 642
639 643
640 644 def finish_job(self, idx):
641 645 """Called after self.targets[idx] just finished a job.
642 646 Override in subclasses."""
643 647 self.loads[idx] -= 1
644 648
645 649
646 650
647 651 def launch_scheduler(in_addr, out_addr, mon_addr, not_addr, config=None,
648 652 logname='root', log_url=None, loglevel=logging.DEBUG,
649 653 identity=b'task'):
650 654 from zmq.eventloop import ioloop
651 655 from zmq.eventloop.zmqstream import ZMQStream
652 656
653 657 if config:
654 658 # unwrap dict back into Config
655 659 config = Config(config)
656 660
657 661 ctx = zmq.Context()
658 662 loop = ioloop.IOLoop()
659 663 ins = ZMQStream(ctx.socket(zmq.XREP),loop)
660 664 ins.setsockopt(zmq.IDENTITY, identity)
661 665 ins.bind(in_addr)
662 666
663 667 outs = ZMQStream(ctx.socket(zmq.XREP),loop)
664 668 outs.setsockopt(zmq.IDENTITY, identity)
665 669 outs.bind(out_addr)
666 670 mons = ZMQStream(ctx.socket(zmq.PUB),loop)
667 671 mons.connect(mon_addr)
668 672 nots = ZMQStream(ctx.socket(zmq.SUB),loop)
669 673 nots.setsockopt(zmq.SUBSCRIBE, '')
670 674 nots.connect(not_addr)
671 675
672 676 # setup logging. Note that these will not work in-process, because they clobber
673 677 # existing loggers.
674 678 if log_url:
675 679 log = connect_logger(logname, ctx, log_url, root="scheduler", loglevel=loglevel)
676 680 else:
677 681 log = local_logger(logname, loglevel)
678 682
679 683 scheduler = TaskScheduler(client_stream=ins, engine_stream=outs,
680 684 mon_stream=mons, notifier_stream=nots,
681 685 loop=loop, log=log,
682 686 config=config)
683 687 scheduler.start()
684 688 try:
685 689 loop.start()
686 690 except KeyboardInterrupt:
687 691 print ("interrupted, exiting...", file=sys.__stderr__)
688 692
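Since scheme_name and hwm are configurable traits on TaskScheduler, a controller config file can select them without touching this module. A minimal sketch:

    # in e.g. ipcontroller_config.py
    c = get_config()
    c.TaskScheduler.scheme_name = 'weighted'
    c.TaskScheduler.hwm = 2  # at most 2 outstanding tasks per engine
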
@@ -1,386 +1,391 b''
1 """A TaskRecord backend using sqlite3"""
1 """A TaskRecord backend using sqlite3
2
3 Authors:
4
5 * Min RK
6 """
2 7 #-----------------------------------------------------------------------------
3 8 # Copyright (C) 2011 The IPython Development Team
4 9 #
5 10 # Distributed under the terms of the BSD License. The full license is in
6 11 # the file COPYING, distributed as part of this software.
7 12 #-----------------------------------------------------------------------------
8 13
9 14 import json
10 15 import os
11 16 import cPickle as pickle
12 17 from datetime import datetime
13 18
14 19 import sqlite3
15 20
16 21 from zmq.eventloop import ioloop
17 22
18 23 from IPython.utils.traitlets import Unicode, Instance, List, Dict
19 24 from .dictdb import BaseDB
20 25 from IPython.utils.jsonutil import date_default, extract_dates, squash_dates
21 26
22 27 #-----------------------------------------------------------------------------
23 28 # SQLite operators, adapters, and converters
24 29 #-----------------------------------------------------------------------------
25 30
26 31 operators = {
27 32 '$lt' : "<",
28 33 '$gt' : ">",
29 34 # NULL is handled weirdly with ==, !=
30 35 '$eq' : "=",
31 36 '$ne' : "!=",
32 37 '$lte': "<=",
33 38 '$gte': ">=",
34 39 '$in' : ('=', ' OR '),
35 40 '$nin': ('!=', ' AND '),
36 41 # '$all': None,
37 42 # '$mod': None,
38 43 # '$exists' : None
39 44 }
40 45 null_operators = {
41 46 '=' : "IS NULL",
42 47 '!=' : "IS NOT NULL",
43 48 }
44 49
45 50 def _adapt_dict(d):
46 51 return json.dumps(d, default=date_default)
47 52
48 53 def _convert_dict(ds):
49 54 if ds is None:
50 55 return ds
51 56 else:
52 57 return extract_dates(json.loads(ds))
53 58
54 59 def _adapt_bufs(bufs):
55 60 # this is *horrible*
56 61 # copy buffers into single list and pickle it:
57 62 if bufs and isinstance(bufs[0], (bytes, buffer)):
58 63 return sqlite3.Binary(pickle.dumps(map(bytes, bufs),-1))
59 64 elif bufs:
60 65 return bufs
61 66 else:
62 67 return None
63 68
64 69 def _convert_bufs(bs):
65 70 if bs is None:
66 71 return []
67 72 else:
68 73 return pickle.loads(bytes(bs))
69 74
70 75 #-----------------------------------------------------------------------------
71 76 # SQLiteDB class
72 77 #-----------------------------------------------------------------------------
73 78
74 79 class SQLiteDB(BaseDB):
75 80 """SQLite3 TaskRecord backend."""
76 81
77 82 filename = Unicode('tasks.db', config=True,
78 83 help="""The filename of the sqlite task database. [default: 'tasks.db']""")
79 84 location = Unicode('', config=True,
80 85 help="""The directory containing the sqlite task database. The default
81 86 is to use the cluster_dir location.""")
82 87 table = Unicode("", config=True,
83 88 help="""The SQLite Table to use for storing tasks for this session. If unspecified,
84 89 a new table will be created with the Hub's IDENT. Specifying the table will result
85 90 in tasks from previous sessions being available via Clients' db_query and
86 91 get_result methods.""")
87 92
88 93 _db = Instance('sqlite3.Connection')
89 94 # the ordered list of column names
90 95 _keys = List(['msg_id' ,
91 96 'header' ,
92 97 'content',
93 98 'buffers',
94 99 'submitted',
95 100 'client_uuid' ,
96 101 'engine_uuid' ,
97 102 'started',
98 103 'completed',
99 104 'resubmitted',
100 105 'result_header' ,
101 106 'result_content' ,
102 107 'result_buffers' ,
103 108 'queue' ,
104 109 'pyin' ,
105 110 'pyout',
106 111 'pyerr',
107 112 'stdout',
108 113 'stderr',
109 114 ])
110 115 # sqlite datatypes for checking that db is current format
111 116 _types = Dict({'msg_id' : 'text' ,
112 117 'header' : 'dict text',
113 118 'content' : 'dict text',
114 119 'buffers' : 'bufs blob',
115 120 'submitted' : 'timestamp',
116 121 'client_uuid' : 'text',
117 122 'engine_uuid' : 'text',
118 123 'started' : 'timestamp',
119 124 'completed' : 'timestamp',
120 125 'resubmitted' : 'timestamp',
121 126 'result_header' : 'dict text',
122 127 'result_content' : 'dict text',
123 128 'result_buffers' : 'bufs blob',
124 129 'queue' : 'text',
125 130 'pyin' : 'text',
126 131 'pyout' : 'text',
127 132 'pyerr' : 'text',
128 133 'stdout' : 'text',
129 134 'stderr' : 'text',
130 135 })
131 136
132 137 def __init__(self, **kwargs):
133 138 super(SQLiteDB, self).__init__(**kwargs)
134 139 if not self.table:
135 140 # use session, and prefix _, since starting with # is illegal
136 141 self.table = '_'+self.session.replace('-','_')
137 142 if not self.location:
138 143 # get current profile
139 144 from IPython.core.newapplication import BaseIPythonApplication
140 145 if BaseIPythonApplication.initialized():
141 146 app = BaseIPythonApplication.instance()
142 147 if app.profile_dir is not None:
143 148 self.location = app.profile_dir.location
144 149 else:
145 150 self.location = u'.'
146 151 else:
147 152 self.location = u'.'
148 153 self._init_db()
149 154
150 155 # register db commit as 2s periodic callback
151 156 # to prevent clogging pipes
152 157 # assumes we are being run in a zmq ioloop app
153 158 loop = ioloop.IOLoop.instance()
154 159 pc = ioloop.PeriodicCallback(self._db.commit, 2000, loop)
155 160 pc.start()
156 161
157 162 def _defaults(self, keys=None):
158 163 """create an empty record"""
159 164 d = {}
160 165 keys = self._keys if keys is None else keys
161 166 for key in keys:
162 167 d[key] = None
163 168 return d
164 169
165 170 def _check_table(self):
166 171 """Ensure that an incorrect table doesn't exist
167 172
168 173 If a bad (old) table does exist, return False
169 174 """
170 175 cursor = self._db.execute("PRAGMA table_info(%s)"%self.table)
171 176 lines = cursor.fetchall()
172 177 if not lines:
173 178 # table does not exist
174 179 return True
175 180 types = {}
176 181 keys = []
177 182 for line in lines:
178 183 keys.append(line[1])
179 184 types[line[1]] = line[2]
180 185 if self._keys != keys:
181 186 # key mismatch
182 187 self.log.warn('keys mismatch')
183 188 return False
184 189 for key in self._keys:
185 190 if types[key] != self._types[key]:
186 191 self.log.warn(
187 192 'type mismatch: %s: %s != %s'%(key,types[key],self._types[key])
188 193 )
189 194 return False
190 195 return True
191 196
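For reference, each row that PRAGMA table_info returns has the shape (cid, name, type, notnull, dflt_value, pk), which is why the loop above reads line[1] for the column name and line[2] for its declared type:

    line = (0, u'msg_id', u'text', 0, None, 1)  # invented example row
    name, dtype = line[1], line[2]              # -> u'msg_id', u'text'
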
192 197 def _init_db(self):
193 198 """Connect to the database and get new session number."""
194 199 # register adapters
195 200 sqlite3.register_adapter(dict, _adapt_dict)
196 201 sqlite3.register_converter('dict', _convert_dict)
197 202 sqlite3.register_adapter(list, _adapt_bufs)
198 203 sqlite3.register_converter('bufs', _convert_bufs)
199 204 # connect to the db
200 205 dbfile = os.path.join(self.location, self.filename)
201 206 self._db = sqlite3.connect(dbfile, detect_types=sqlite3.PARSE_DECLTYPES,
202 207 # isolation_level = None)#,
203 208 cached_statements=64)
204 209 # print dir(self._db)
205 210 first_table = self.table
206 211 i=0
207 212 while not self._check_table():
208 213 i+=1
209 214 self.table = first_table+'_%i'%i
210 215 self.log.warn(
211 216 "Table %s exists and doesn't match db format, trying %s"%
212 217 (first_table,self.table)
213 218 )
214 219
215 220 self._db.execute("""CREATE TABLE IF NOT EXISTS %s
216 221 (msg_id text PRIMARY KEY,
217 222 header dict text,
218 223 content dict text,
219 224 buffers bufs blob,
220 225 submitted timestamp,
221 226 client_uuid text,
222 227 engine_uuid text,
223 228 started timestamp,
224 229 completed timestamp,
225 230 resubmitted timestamp,
226 231 result_header dict text,
227 232 result_content dict text,
228 233 result_buffers bufs blob,
229 234 queue text,
230 235 pyin text,
231 236 pyout text,
232 237 pyerr text,
233 238 stdout text,
234 239 stderr text)
235 240 """%self.table)
236 241 self._db.commit()
237 242
238 243 def _dict_to_list(self, d):
239 244 """turn a mongodb-style record dict into a list."""
240 245
241 246 return [ d[key] for key in self._keys ]
242 247
243 248 def _list_to_dict(self, line, keys=None):
244 249 """Inverse of dict_to_list"""
245 250 keys = self._keys if keys is None else keys
246 251 d = self._defaults(keys)
247 252 for key,value in zip(keys, line):
248 253 d[key] = value
249 254
250 255 return d
251 256
252 257 def _render_expression(self, check):
253 258 """Turn a mongodb-style search dict into an SQL query."""
254 259 expressions = []
255 260 args = []
256 261
257 262 skeys = set(check.keys())
258 263 skeys.difference_update(set(self._keys))
259 264 skeys.difference_update(set(['buffers', 'result_buffers']))
260 265 if skeys:
261 266 raise KeyError("Illegal testing key(s): %s"%skeys)
262 267
263 268 for name,sub_check in check.iteritems():
264 269 if isinstance(sub_check, dict):
265 270 for test,value in sub_check.iteritems():
266 271 try:
267 272 op = operators[test]
268 273 except KeyError:
269 274 raise KeyError("Unsupported operator: %r"%test)
270 275 if isinstance(op, tuple):
271 276 op, join = op
272 277
273 278 if value is None and op in null_operators:
274 279 expr = "%s %s"%(name, null_operators[op])
275 280 else:
276 281 expr = "%s %s ?"%(name, op)
277 282 if isinstance(value, (tuple,list)):
278 283 if op in null_operators and any([v is None for v in value]):
279 284 # equality tests don't work with NULL
280 285 raise ValueError("Cannot use %r test with NULL values on SQLite backend"%test)
281 286 expr = '( %s )'%( join.join([expr]*len(value)) )
282 287 args.extend(value)
283 288 else:
284 289 args.append(value)
285 290 expressions.append(expr)
286 291 else:
287 292 # it's an equality check
288 293 if sub_check is None:
289 294 expressions.append("%s IS NULL"%name)
290 295 else:
291 296 expressions.append("%s = ?"%name)
292 297 args.append(sub_check)
293 298
294 299 expr = " AND ".join(expressions)
295 300 return expr, args
296 301
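To make the translation concrete: a check like the one below (values invented) renders to a WHERE clause plus its parameter list, modulo dict ordering:

    check = {'engine_uuid': 'abc', 'completed': {'$ne': None}}
    # _render_expression(check) yields roughly:
    expr = "engine_uuid = ? AND completed IS NOT NULL"
    args = ['abc']
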
297 302 def add_record(self, msg_id, rec):
298 303 """Add a new Task Record, by msg_id."""
299 304 d = self._defaults()
300 305 d.update(rec)
301 306 d['msg_id'] = msg_id
302 307 line = self._dict_to_list(d)
303 308 tups = '(%s)'%(','.join(['?']*len(line)))
304 309 self._db.execute("INSERT INTO %s VALUES %s"%(self.table, tups), line)
305 310 # self._db.commit()
306 311
307 312 def get_record(self, msg_id):
308 313 """Get a specific Task Record, by msg_id."""
309 314 cursor = self._db.execute("""SELECT * FROM %s WHERE msg_id==?"""%self.table, (msg_id,))
310 315 line = cursor.fetchone()
311 316 if line is None:
312 317 raise KeyError("No such msg: %r"%msg_id)
313 318 return self._list_to_dict(line)
314 319
315 320 def update_record(self, msg_id, rec):
316 321 """Update the data in an existing record."""
317 322 query = "UPDATE %s SET "%self.table
318 323 sets = []
319 324 keys = sorted(rec.keys())
320 325 values = []
321 326 for key in keys:
322 327 sets.append('%s = ?'%key)
323 328 values.append(rec[key])
324 329 query += ', '.join(sets)
325 330 query += ' WHERE msg_id == ?'
326 331 values.append(msg_id)
327 332 self._db.execute(query, values)
328 333 # self._db.commit()
329 334
330 335 def drop_record(self, msg_id):
331 336 """Remove a record from the DB."""
332 337 self._db.execute("""DELETE FROM %s WHERE msg_id==?"""%self.table, (msg_id,))
333 338 # self._db.commit()
334 339
335 340 def drop_matching_records(self, check):
336 341 """Remove a record from the DB."""
337 342 expr,args = self._render_expression(check)
338 343 query = "DELETE FROM %s WHERE %s"%(self.table, expr)
339 344 self._db.execute(query,args)
340 345 # self._db.commit()
341 346
342 347 def find_records(self, check, keys=None):
343 348 """Find records matching a query dict, optionally extracting subset of keys.
344 349
345 350 Returns list of matching records.
346 351
347 352 Parameters
348 353 ----------
349 354
350 355 check: dict
351 356 mongodb-style query argument
352 357 keys: list of strs [optional]
353 358 if specified, the subset of keys to extract. msg_id will *always* be
354 359 included.
355 360 """
356 361 if keys:
357 362 bad_keys = [ key for key in keys if key not in self._keys ]
358 363 if bad_keys:
359 364 raise KeyError("Bad record key(s): %s"%bad_keys)
360 365
361 366 if keys:
362 367 # ensure msg_id is present and first:
363 368 if 'msg_id' in keys:
364 369 keys.remove('msg_id')
365 370 keys.insert(0, 'msg_id')
366 371 req = ', '.join(keys)
367 372 else:
368 373 req = '*'
369 374 expr,args = self._render_expression(check)
370 375 query = """SELECT %s FROM %s WHERE %s"""%(req, self.table, expr)
371 376 cursor = self._db.execute(query, args)
372 377 matches = cursor.fetchall()
373 378 records = []
374 379 for line in matches:
375 380 rec = self._list_to_dict(line, keys)
376 381 records.append(rec)
377 382 return records
378 383
379 384 def get_history(self):
380 385 """get all msg_ids, ordered by time submitted."""
381 386 query = """SELECT msg_id FROM %s ORDER by submitted ASC"""%self.table
382 387 cursor = self._db.execute(query)
383 388 # will be a list of length 1 tuples
384 389 return [ tup[0] for tup in cursor.fetchall()]
385 390
386 391 __all__ = ['SQLiteDB'] No newline at end of file
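As with the MongoDB backend, this one is selected via the controller's HubFactory; pinning the table name keeps results queryable across sessions. A minimal sketch (the table name and location are invented):

    # in e.g. ipcontroller_config.py
    c = get_config()
    c.HubFactory.db_class = 'IPython.parallel.controller.sqlitedb.SQLiteDB'
    c.SQLiteDB.table = u'ipython_tasks'
    c.SQLiteDB.location = u'/var/lib/ipython'
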
@@ -1,166 +1,170 b''
1 1 #!/usr/bin/env python
2 2 """A simple engine that talks to a controller over 0MQ.
3 3 it handles registration, etc. and launches a kernel
4 4 connected to the Controller's Schedulers.
5
6 Authors:
7
8 * Min RK
5 9 """
6 10 #-----------------------------------------------------------------------------
7 11 # Copyright (C) 2010-2011 The IPython Development Team
8 12 #
9 13 # Distributed under the terms of the BSD License. The full license is in
10 14 # the file COPYING, distributed as part of this software.
11 15 #-----------------------------------------------------------------------------
12 16
13 17 from __future__ import print_function
14 18
15 19 import sys
16 20 import time
17 21
18 22 import zmq
19 23 from zmq.eventloop import ioloop, zmqstream
20 24
21 25 # internal
22 26 from IPython.utils.traitlets import Instance, Dict, Int, Type, CFloat, Unicode
23 27 # from IPython.utils.localinterfaces import LOCALHOST
24 28
25 29 from IPython.parallel.controller.heartmonitor import Heart
26 30 from IPython.parallel.factory import RegistrationFactory
27 31 from IPython.parallel.util import disambiguate_url
28 32
29 33 from IPython.zmq.session import Message
30 34
31 35 from .streamkernel import Kernel
32 36
33 37 class EngineFactory(RegistrationFactory):
34 38 """IPython engine"""
35 39
36 40 # configurables:
37 41 out_stream_factory=Type('IPython.zmq.iostream.OutStream', config=True,
38 42 help="""The OutStream for handling stdout/err.
39 43 Typically 'IPython.zmq.iostream.OutStream'""")
40 44 display_hook_factory=Type('IPython.zmq.displayhook.DisplayHook', config=True,
41 45 help="""The class for handling displayhook.
42 46 Typically 'IPython.zmq.displayhook.DisplayHook'""")
43 47 location=Unicode(config=True,
44 48 help="""The location (an IP address) of the controller. This is
45 49 used for disambiguating URLs, to determine whether
46 50 loopback should be used to connect or the public address.""")
47 51 timeout=CFloat(2,config=True,
48 52 help="""The time (in seconds) to wait for the Controller to respond
49 53 to registration requests before giving up.""")
50 54
51 55 # not configurable:
52 56 user_ns=Dict()
53 57 id=Int(allow_none=True)
54 58 registrar=Instance('zmq.eventloop.zmqstream.ZMQStream')
55 59 kernel=Instance(Kernel)
56 60
57 61
58 62 def __init__(self, **kwargs):
59 63 super(EngineFactory, self).__init__(**kwargs)
60 64 self.ident = self.session.session
61 65 ctx = self.context
62 66
63 67 reg = ctx.socket(zmq.XREQ)
64 68 reg.setsockopt(zmq.IDENTITY, self.ident)
65 69 reg.connect(self.url)
66 70 self.registrar = zmqstream.ZMQStream(reg, self.loop)
67 71
68 72 def register(self):
69 73 """send the registration_request"""
70 74
71 75 self.log.info("registering")
72 76 content = dict(queue=self.ident, heartbeat=self.ident, control=self.ident)
73 77 self.registrar.on_recv(self.complete_registration)
74 78 # print (self.session.key)
75 79 self.session.send(self.registrar, "registration_request",content=content)
76 80
77 81 def complete_registration(self, msg):
78 82 # print msg
79 83 self._abort_dc.stop()
80 84 ctx = self.context
81 85 loop = self.loop
82 86 identity = self.ident
83 87
84 88 idents,msg = self.session.feed_identities(msg)
85 89 msg = Message(self.session.unpack_message(msg))
86 90
87 91 if msg.content.status == 'ok':
88 92 self.id = int(msg.content.id)
89 93
90 94 # create Shell Streams (MUX, Task, etc.):
91 95 queue_addr = msg.content.mux
92 96 shell_addrs = [ str(queue_addr) ]
93 97 task_addr = msg.content.task
94 98 if task_addr:
95 99 shell_addrs.append(str(task_addr))
96 100
97 101 # Uncomment this to go back to two-socket model
98 102 # shell_streams = []
99 103 # for addr in shell_addrs:
100 104 # stream = zmqstream.ZMQStream(ctx.socket(zmq.XREP), loop)
101 105 # stream.setsockopt(zmq.IDENTITY, identity)
102 106 # stream.connect(disambiguate_url(addr, self.location))
103 107 # shell_streams.append(stream)
104 108
105 109 # Now use only one shell stream for mux and tasks
106 110 stream = zmqstream.ZMQStream(ctx.socket(zmq.XREP), loop)
107 111 stream.setsockopt(zmq.IDENTITY, identity)
108 112 shell_streams = [stream]
109 113 for addr in shell_addrs:
110 114 stream.connect(disambiguate_url(addr, self.location))
111 115 # end single stream-socket
112 116
113 117 # control stream:
114 118 control_addr = str(msg.content.control)
115 119 control_stream = zmqstream.ZMQStream(ctx.socket(zmq.XREP), loop)
116 120 control_stream.setsockopt(zmq.IDENTITY, identity)
117 121 control_stream.connect(disambiguate_url(control_addr, self.location))
118 122
119 123 # create iopub stream:
120 124 iopub_addr = msg.content.iopub
121 125 iopub_stream = zmqstream.ZMQStream(ctx.socket(zmq.PUB), loop)
122 126 iopub_stream.setsockopt(zmq.IDENTITY, identity)
123 127 iopub_stream.connect(disambiguate_url(iopub_addr, self.location))
124 128
125 129 # launch heartbeat
126 130 hb_addrs = msg.content.heartbeat
127 131 # print (hb_addrs)
128 132
129 133         # Redirect output streams (stdout/stderr) and set a display hook.
130 134 if self.out_stream_factory:
131 135 sys.stdout = self.out_stream_factory(self.session, iopub_stream, u'stdout')
132 136 sys.stdout.topic = 'engine.%i.stdout'%self.id
133 137 sys.stderr = self.out_stream_factory(self.session, iopub_stream, u'stderr')
134 138 sys.stderr.topic = 'engine.%i.stderr'%self.id
135 139 if self.display_hook_factory:
136 140 sys.displayhook = self.display_hook_factory(self.session, iopub_stream)
137 141 sys.displayhook.topic = 'engine.%i.pyout'%self.id
138 142
139 143 self.kernel = Kernel(config=self.config, int_id=self.id, ident=self.ident, session=self.session,
140 144 control_stream=control_stream, shell_streams=shell_streams, iopub_stream=iopub_stream,
141 145 loop=loop, user_ns = self.user_ns, log=self.log)
142 146 self.kernel.start()
143 147 hb_addrs = [ disambiguate_url(addr, self.location) for addr in hb_addrs ]
144 148 heart = Heart(*map(str, hb_addrs), heart_id=identity)
145 149 heart.start()
146 150
147 151
148 152 else:
149 153 self.log.fatal("Registration Failed: %s"%msg)
150 154 raise Exception("Registration Failed: %s"%msg)
151 155
152 156 self.log.info("Completed registration with id %i"%self.id)
153 157
154 158
155 159 def abort(self):
156 160 self.log.fatal("Registration timed out after %.1f seconds"%self.timeout)
157 161 self.session.send(self.registrar, "unregistration_request", content=dict(id=self.id))
158 162 time.sleep(1)
159 163 sys.exit(255)
160 164
161 165 def start(self):
162 166 dc = ioloop.DelayedCallback(self.register, 0, self.loop)
163 167 dc.start()
164 168 self._abort_dc = ioloop.DelayedCallback(self.abort, self.timeout*1000, self.loop)
165 169 self._abort_dc.start()
166 170
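
# A sketch of the registration handshake, reconstructed from the fields
# complete_registration() reads above; the concrete idents and addresses
# are hypothetical examples, not values this module defines.
request_content = dict(queue='engine-ident', heartbeat='engine-ident',
                       control='engine-ident')
reply_content = dict(status='ok', id=0,
                     mux='tcp://127.0.0.1:5555',
                     task='tcp://127.0.0.1:5556',
                     control='tcp://127.0.0.1:5557',
                     iopub='tcp://127.0.0.1:5558',
                     heartbeat=['tcp://127.0.0.1:5559',
                                'tcp://127.0.0.1:5560'])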
@@ -1,225 +1,230 b''
1 """KernelStarter class that intercepts Control Queue messages, and handles process management."""
1 """KernelStarter class that intercepts Control Queue messages, and handles process management.
2
3 Authors:
4
5 * Min RK
6 """
2 7 #-----------------------------------------------------------------------------
3 8 # Copyright (C) 2010-2011 The IPython Development Team
4 9 #
5 10 # Distributed under the terms of the BSD License. The full license is in
6 11 # the file COPYING, distributed as part of this software.
7 12 #-----------------------------------------------------------------------------
8 13
9 14 import zmq
from zmq.eventloop import ioloop, zmqstream
10 15
11 16 from IPython.zmq.session import Session
12 17
13 18 class KernelStarter(object):
14 19 """Object for resetting/killing the Kernel."""
15 20
16 21
17 22 def __init__(self, session, upstream, downstream, *kernel_args, **kernel_kwargs):
18 23 self.session = session
19 24 self.upstream = upstream
20 25 self.downstream = downstream
21 26 self.kernel_args = kernel_args
22 27 self.kernel_kwargs = kernel_kwargs
23 28 self.handlers = {}
24 29 for method in 'shutdown_request shutdown_reply'.split():
25 30 self.handlers[method] = getattr(self, method)
26 31
27 32 def start(self):
28 33 self.upstream.on_recv(self.dispatch_request)
29 34 self.downstream.on_recv(self.dispatch_reply)
30 35
31 36 #--------------------------------------------------------------------------
32 37 # Dispatch methods
33 38 #--------------------------------------------------------------------------
34 39
35 40 def dispatch_request(self, raw_msg):
36 41         idents, msg = self.session.feed_identities(raw_msg)
37 42 try:
38 43 msg = self.session.unpack_message(msg, content=False)
39 44 except:
40 45 print ("bad msg: %s"%msg)
41 46
42 47 msgtype = msg['msg_type']
43 48 handler = self.handlers.get(msgtype, None)
44 49 if handler is None:
45 50 self.downstream.send_multipart(raw_msg, copy=False)
46 51 else:
47 52 handler(msg)
48 53
49 54 def dispatch_reply(self, raw_msg):
50 55         idents, msg = self.session.feed_identities(raw_msg)
51 56 try:
52 57 msg = self.session.unpack_message(msg, content=False)
53 58 except:
54 59 print ("bad msg: %s"%msg)
55 60
56 61 msgtype = msg['msg_type']
57 62 handler = self.handlers.get(msgtype, None)
58 63 if handler is None:
59 64 self.upstream.send_multipart(raw_msg, copy=False)
60 65 else:
61 66 handler(msg)
62 67
63 68 #--------------------------------------------------------------------------
64 69 # Handlers
65 70 #--------------------------------------------------------------------------
66 71
67 72 def shutdown_request(self, msg):
68 73         """Forward a shutdown request downstream to the kernel process."""
69 74 self.downstream.send_multipart(msg)
70 75
71 76 #--------------------------------------------------------------------------
72 77 # Kernel process management methods, from KernelManager:
73 78 #--------------------------------------------------------------------------
74 79
75 80 def _check_local(addr):
76 81 if isinstance(addr, tuple):
77 82 addr = addr[0]
78 83 return addr in LOCAL_IPS
79 84
80 85 def start_kernel(self, **kw):
81 86 """Starts a kernel process and configures the manager to use it.
82 87
83 88 If random ports (port=0) are being used, this method must be called
84 89 before the channels are created.
85 90
86 91         Parameters
87 92         ----------
88 93 ipython : bool, optional (default True)
89 94 Whether to use an IPython kernel instead of a plain Python kernel.
90 95 """
91 96 self.kernel = Process(target=make_kernel, args=self.kernel_args,
92 97 kwargs=self.kernel_kwargs)
93 98
94 99 def shutdown_kernel(self, restart=False):
95 100         """ Attempts to stop the kernel process cleanly. If the kernel
96 101         cannot be stopped cleanly, it is killed, if possible.
97 102 """
98 103 # FIXME: Shutdown does not work on Windows due to ZMQ errors!
99 104 if sys.platform == 'win32':
100 105 self.kill_kernel()
101 106 return
102 107
103 108 # Don't send any additional kernel kill messages immediately, to give
104 109 # the kernel a chance to properly execute shutdown actions. Wait for at
105 110 # most 1s, checking every 0.1s.
106 111 self.xreq_channel.shutdown(restart=restart)
107 112 for i in range(10):
108 113 if self.is_alive:
109 114 time.sleep(0.1)
110 115 else:
111 116 break
112 117 else:
113 118 # OK, we've waited long enough.
114 119 if self.has_kernel:
115 120 self.kill_kernel()
116 121
117 122 def restart_kernel(self, now=False):
118 123 """Restarts a kernel with the same arguments that were used to launch
119 124 it. If the old kernel was launched with random ports, the same ports
120 125 will be used for the new kernel.
121 126
122 127 Parameters
123 128 ----------
124 129 now : bool, optional
125 130 If True, the kernel is forcefully restarted *immediately*, without
126 131 having a chance to do any cleanup action. Otherwise the kernel is
127 132 given 1s to clean up before a forceful restart is issued.
128 133
129 134 In all cases the kernel is restarted, the only difference is whether
130 135 it is given a chance to perform a clean shutdown or not.
131 136 """
132 137 if self._launch_args is None:
133 138 raise RuntimeError("Cannot restart the kernel. "
134 139 "No previous call to 'start_kernel'.")
135 140 else:
136 141 if self.has_kernel:
137 142 if now:
138 143 self.kill_kernel()
139 144 else:
140 145 self.shutdown_kernel(restart=True)
141 146 self.start_kernel(**self._launch_args)
142 147
143 148 # FIXME: Messages get dropped in Windows due to probable ZMQ bug
144 149 # unless there is some delay here.
145 150 if sys.platform == 'win32':
146 151 time.sleep(0.2)
147 152
148 153 @property
149 154 def has_kernel(self):
150 155 """Returns whether a kernel process has been specified for the kernel
151 156 manager.
152 157 """
153 158 return self.kernel is not None
154 159
155 160 def kill_kernel(self):
156 161 """ Kill the running kernel. """
157 162 if self.has_kernel:
158 163 # Pause the heart beat channel if it exists.
159 164 if self._hb_channel is not None:
160 165 self._hb_channel.pause()
161 166
162 167 # Attempt to kill the kernel.
163 168 try:
164 169 self.kernel.kill()
165 170 except OSError, e:
166 171 # In Windows, we will get an Access Denied error if the process
167 172 # has already terminated. Ignore it.
168 173 if not (sys.platform == 'win32' and e.winerror == 5):
169 174 raise
170 175 self.kernel = None
171 176 else:
172 177 raise RuntimeError("Cannot kill kernel. No kernel is running!")
173 178
174 179 def interrupt_kernel(self):
175 180 """ Interrupts the kernel. Unlike ``signal_kernel``, this operation is
176 181 well supported on all platforms.
177 182 """
178 183 if self.has_kernel:
179 184 if sys.platform == 'win32':
180 185 from parentpoller import ParentPollerWindows as Poller
181 186 Poller.send_interrupt(self.kernel.win32_interrupt_event)
182 187 else:
183 188 self.kernel.send_signal(signal.SIGINT)
184 189 else:
185 190 raise RuntimeError("Cannot interrupt kernel. No kernel is running!")
186 191
187 192 def signal_kernel(self, signum):
188 193 """ Sends a signal to the kernel. Note that since only SIGTERM is
189 194 supported on Windows, this function is only useful on Unix systems.
190 195 """
191 196 if self.has_kernel:
192 197 self.kernel.send_signal(signum)
193 198 else:
194 199 raise RuntimeError("Cannot signal kernel. No kernel is running!")
195 200
196 201 @property
197 202 def is_alive(self):
198 203 """Is the kernel process still running?"""
199 204 # FIXME: not using a heartbeat means this method is broken for any
200 205 # remote kernel, it's only capable of handling local kernels.
201 206 if self.has_kernel:
202 207 if self.kernel.poll() is None:
203 208 return True
204 209 else:
205 210 return False
206 211 else:
207 212 # We didn't start the kernel with this KernelManager so we don't
208 213 # know if it is running. We should use a heartbeat for this case.
209 214 return True
210 215
211 216
212 217 def make_starter(up_addr, down_addr, *args, **kwargs):
213 218 """entry point function for launching a kernelstarter in a subprocess"""
214 219 loop = ioloop.IOLoop.instance()
215 220 ctx = zmq.Context()
216 221 session = Session()
217 222 upstream = zmqstream.ZMQStream(ctx.socket(zmq.XREQ),loop)
218 223 upstream.connect(up_addr)
219 224 downstream = zmqstream.ZMQStream(ctx.socket(zmq.XREQ),loop)
220 225 downstream.connect(down_addr)
221 226
222 227 starter = KernelStarter(session, upstream, downstream, *args, **kwargs)
223 228 starter.start()
224 229 loop.start()
225 230 No newline at end of file
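
# A minimal usage sketch for make_starter() above, assuming two XREQ
# endpoints are already bound elsewhere; the addresses are hypothetical.
# make_starter() blocks in loop.start(), which is why it is described as
# a subprocess entry point.
from multiprocessing import Process

p = Process(target=make_starter,
            args=('tcp://127.0.0.1:5670', 'tcp://127.0.0.1:5671'))
p.start()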
@@ -1,422 +1,429 b''
1 1 #!/usr/bin/env python
2 2 """
3 3 Kernel adapted from kernel.py to use ZMQ Streams
4
5 Authors:
6
7 * Min RK
8 * Brian Granger
9 * Fernando Perez
10 * Evan Patterson
4 11 """
5 12 #-----------------------------------------------------------------------------
6 13 # Copyright (C) 2010-2011 The IPython Development Team
7 14 #
8 15 # Distributed under the terms of the BSD License. The full license is in
9 16 # the file COPYING, distributed as part of this software.
10 17 #-----------------------------------------------------------------------------
11 18
12 19 #-----------------------------------------------------------------------------
13 20 # Imports
14 21 #-----------------------------------------------------------------------------
15 22
16 23 # Standard library imports.
17 24 from __future__ import print_function
18 25
19 26 import sys
20 27 import time
21 28
22 29 from code import CommandCompiler
23 30 from datetime import datetime
24 31 from pprint import pprint
25 32
26 33 # System library imports.
27 34 import zmq
28 35 from zmq.eventloop import ioloop, zmqstream
29 36
30 37 # Local imports.
31 38 from IPython.utils.traitlets import Instance, List, Int, Dict, Set, Unicode
32 39 from IPython.zmq.completer import KernelCompleter
33 40
34 41 from IPython.parallel.error import wrap_exception
35 42 from IPython.parallel.factory import SessionFactory
36 43 from IPython.parallel.util import serialize_object, unpack_apply_message
37 44
38 45 def printer(*args):
39 46 pprint(args, stream=sys.__stdout__)
40 47
41 48
42 49 class _Passer(zmqstream.ZMQStream):
43 50 """Empty class that implements `send()` that does nothing.
44 51
45 52 Subclass ZMQStream for Session typechecking
46 53
47 54 """
48 55 def __init__(self, *args, **kwargs):
49 56 pass
50 57
51 58 def send(self, *args, **kwargs):
52 59 pass
53 60 send_multipart = send
54 61
55 62
56 63 #-----------------------------------------------------------------------------
57 64 # Main kernel class
58 65 #-----------------------------------------------------------------------------
59 66
60 67 class Kernel(SessionFactory):
61 68
62 69 #---------------------------------------------------------------------------
63 70 # Kernel interface
64 71 #---------------------------------------------------------------------------
65 72
66 73 # kwargs:
67 74 exec_lines = List(Unicode, config=True,
68 75 help="List of lines to execute")
69 76
70 77 int_id = Int(-1)
71 78 user_ns = Dict(config=True, help="""Set the user's namespace of the Kernel""")
72 79
73 80 control_stream = Instance(zmqstream.ZMQStream)
74 81 task_stream = Instance(zmqstream.ZMQStream)
75 82 iopub_stream = Instance(zmqstream.ZMQStream)
76 83 client = Instance('IPython.parallel.Client')
77 84
78 85 # internals
79 86 shell_streams = List()
80 87 compiler = Instance(CommandCompiler, (), {})
81 88 completer = Instance(KernelCompleter)
82 89
83 90 aborted = Set()
84 91 shell_handlers = Dict()
85 92 control_handlers = Dict()
86 93
87 94 def _set_prefix(self):
88 95 self.prefix = "engine.%s"%self.int_id
89 96
90 97 def _connect_completer(self):
91 98 self.completer = KernelCompleter(self.user_ns)
92 99
93 100 def __init__(self, **kwargs):
94 101 super(Kernel, self).__init__(**kwargs)
95 102 self._set_prefix()
96 103 self._connect_completer()
97 104
98 105 self.on_trait_change(self._set_prefix, 'id')
99 106 self.on_trait_change(self._connect_completer, 'user_ns')
100 107
101 108 # Build dict of handlers for message types
102 109 for msg_type in ['execute_request', 'complete_request', 'apply_request',
103 110 'clear_request']:
104 111 self.shell_handlers[msg_type] = getattr(self, msg_type)
105 112
106 113 for msg_type in ['shutdown_request', 'abort_request']+self.shell_handlers.keys():
107 114 self.control_handlers[msg_type] = getattr(self, msg_type)
108 115
109 116 self._initial_exec_lines()
110 117
111 118 def _wrap_exception(self, method=None):
112 119 e_info = dict(engine_uuid=self.ident, engine_id=self.int_id, method=method)
113 120 content=wrap_exception(e_info)
114 121 return content
115 122
116 123 def _initial_exec_lines(self):
117 124 s = _Passer()
118 125         content = dict(silent=True, user_variables=[], user_expressions=[])
119 126 for line in self.exec_lines:
120 127 self.log.debug("executing initialization: %s"%line)
121 128 content.update({'code':line})
122 129 msg = self.session.msg('execute_request', content)
123 130 self.execute_request(s, [], msg)
124 131
125 132
126 133 #-------------------- control handlers -----------------------------
127 134 def abort_queues(self):
128 135 for stream in self.shell_streams:
129 136 if stream:
130 137 self.abort_queue(stream)
131 138
132 139 def abort_queue(self, stream):
133 140 while True:
134 141 idents,msg = self.session.recv(stream, zmq.NOBLOCK, content=True)
135 142 if msg is None:
136 143 return
137 144
138 145 self.log.info("Aborting:")
139 146 self.log.info(str(msg))
140 147 msg_type = msg['msg_type']
141 148 reply_type = msg_type.split('_')[0] + '_reply'
142 149 # reply_msg = self.session.msg(reply_type, {'status' : 'aborted'}, msg)
143 150 # self.reply_socket.send(ident,zmq.SNDMORE)
144 151 # self.reply_socket.send_json(reply_msg)
145 152 reply_msg = self.session.send(stream, reply_type,
146 153 content={'status' : 'aborted'}, parent=msg, ident=idents)[0]
147 154 self.log.debug(str(reply_msg))
148 155 # We need to wait a bit for requests to come in. This can probably
149 156 # be set shorter for true asynchronous clients.
150 157 time.sleep(0.05)
151 158
152 159 def abort_request(self, stream, ident, parent):
153 160         """abort a specific msg by id"""
154 161 msg_ids = parent['content'].get('msg_ids', None)
155 162 if isinstance(msg_ids, basestring):
156 163 msg_ids = [msg_ids]
157 164 if not msg_ids:
158 165 self.abort_queues()
159 166 for mid in msg_ids:
160 167 self.aborted.add(str(mid))
161 168
162 169 content = dict(status='ok')
163 170 reply_msg = self.session.send(stream, 'abort_reply', content=content,
164 171 parent=parent, ident=ident)
165 172 self.log.debug(str(reply_msg))
166 173
167 174 def shutdown_request(self, stream, ident, parent):
168 175         """Kill ourselves. This should really be handled in an external process."""
169 176 try:
170 177 self.abort_queues()
171 178 except:
172 179 content = self._wrap_exception('shutdown')
173 180 else:
174 181 content = dict(parent['content'])
175 182 content['status'] = 'ok'
176 183 msg = self.session.send(stream, 'shutdown_reply',
177 184 content=content, parent=parent, ident=ident)
178 185 self.log.debug(str(msg))
179 186 dc = ioloop.DelayedCallback(lambda : sys.exit(0), 1000, self.loop)
180 187 dc.start()
181 188
182 189 def dispatch_control(self, msg):
183 190 idents,msg = self.session.feed_identities(msg, copy=False)
184 191 try:
185 192 msg = self.session.unpack_message(msg, content=True, copy=False)
186 193 except:
187 194 self.log.error("Invalid Message", exc_info=True)
188 195 return
189 196
190 197 header = msg['header']
191 198 msg_id = header['msg_id']
192 199
193 200 handler = self.control_handlers.get(msg['msg_type'], None)
194 201 if handler is None:
195 202 self.log.error("UNKNOWN CONTROL MESSAGE TYPE: %r"%msg['msg_type'])
196 203 else:
197 204 handler(self.control_stream, idents, msg)
198 205
199 206
200 207 #-------------------- queue helpers ------------------------------
201 208
202 209 def check_dependencies(self, dependencies):
203 210 if not dependencies:
204 211 return True
205 212 if len(dependencies) == 2 and dependencies[0] in 'any all'.split():
206 213 anyorall = dependencies[0]
207 214 dependencies = dependencies[1]
208 215 else:
209 216 anyorall = 'all'
210 217 results = self.client.get_results(dependencies,status_only=True)
211 218 if results['status'] != 'ok':
212 219 return False
213 220
214 221 if anyorall == 'any':
215 222 if not results['completed']:
216 223 return False
217 224 else:
218 225 if results['pending']:
219 226 return False
220 227
221 228 return True
222 229
223 230 def check_aborted(self, msg_id):
224 231 return msg_id in self.aborted
225 232
226 233 #-------------------- queue handlers -----------------------------
227 234
228 235 def clear_request(self, stream, idents, parent):
229 236 """Clear our namespace."""
230 237 self.user_ns = {}
231 238 msg = self.session.send(stream, 'clear_reply', ident=idents, parent=parent,
232 239 content = dict(status='ok'))
233 240 self._initial_exec_lines()
234 241
235 242 def execute_request(self, stream, ident, parent):
236 243 self.log.debug('execute request %s'%parent)
237 244 try:
238 245 code = parent[u'content'][u'code']
239 246 except:
240 247 self.log.error("Got bad msg: %s"%parent, exc_info=True)
241 248 return
242 249 self.session.send(self.iopub_stream, u'pyin', {u'code':code},parent=parent,
243 250 ident='%s.pyin'%self.prefix)
244 251 started = datetime.now()
245 252 try:
246 253 comp_code = self.compiler(code, '<zmq-kernel>')
247 254 # allow for not overriding displayhook
248 255 if hasattr(sys.displayhook, 'set_parent'):
249 256 sys.displayhook.set_parent(parent)
250 257 sys.stdout.set_parent(parent)
251 258 sys.stderr.set_parent(parent)
252 259 exec comp_code in self.user_ns, self.user_ns
253 260 except:
254 261 exc_content = self._wrap_exception('execute')
255 262 # exc_msg = self.session.msg(u'pyerr', exc_content, parent)
256 263 self.session.send(self.iopub_stream, u'pyerr', exc_content, parent=parent,
257 264 ident='%s.pyerr'%self.prefix)
258 265 reply_content = exc_content
259 266 else:
260 267 reply_content = {'status' : 'ok'}
261 268
262 269 reply_msg = self.session.send(stream, u'execute_reply', reply_content, parent=parent,
263 270 ident=ident, subheader = dict(started=started))
264 271 self.log.debug(str(reply_msg))
265 272 if reply_msg['content']['status'] == u'error':
266 273 self.abort_queues()
267 274
268 275 def complete_request(self, stream, ident, parent):
269 276 matches = {'matches' : self.complete(parent),
270 277 'status' : 'ok'}
271 278 completion_msg = self.session.send(stream, 'complete_reply',
272 279 matches, parent, ident)
273 280 # print >> sys.__stdout__, completion_msg
274 281
275 282 def complete(self, msg):
276 283 return self.completer.complete(msg.content.line, msg.content.text)
277 284
278 285 def apply_request(self, stream, ident, parent):
279 286 # flush previous reply, so this request won't block it
280 287 stream.flush(zmq.POLLOUT)
281 288
282 289 try:
283 290 content = parent[u'content']
284 291 bufs = parent[u'buffers']
285 292 msg_id = parent['header']['msg_id']
286 293 # bound = parent['header'].get('bound', False)
287 294 except:
288 295 self.log.error("Got bad msg: %s"%parent, exc_info=True)
289 296 return
290 297 # pyin_msg = self.session.msg(u'pyin',{u'code':code}, parent=parent)
291 298 # self.iopub_stream.send(pyin_msg)
292 299 # self.session.send(self.iopub_stream, u'pyin', {u'code':code},parent=parent)
293 300 sub = {'dependencies_met' : True, 'engine' : self.ident,
294 301 'started': datetime.now()}
295 302 try:
296 303 # allow for not overriding displayhook
297 304 if hasattr(sys.displayhook, 'set_parent'):
298 305 sys.displayhook.set_parent(parent)
299 306 sys.stdout.set_parent(parent)
300 307 sys.stderr.set_parent(parent)
301 308 # exec "f(*args,**kwargs)" in self.user_ns, self.user_ns
302 309 working = self.user_ns
303 310 # suffix =
304 311 prefix = "_"+str(msg_id).replace("-","")+"_"
305 312
306 313 f,args,kwargs = unpack_apply_message(bufs, working, copy=False)
307 314 # if bound:
308 315 # bound_ns = Namespace(working)
309 316 # args = [bound_ns]+list(args)
310 317
311 318 fname = getattr(f, '__name__', 'f')
312 319
313 320 fname = prefix+"f"
314 321 argname = prefix+"args"
315 322 kwargname = prefix+"kwargs"
316 323 resultname = prefix+"result"
317 324
318 325 ns = { fname : f, argname : args, kwargname : kwargs , resultname : None }
319 326 # print ns
320 327 working.update(ns)
321 328 code = "%s=%s(*%s,**%s)"%(resultname, fname, argname, kwargname)
322 329 try:
323 330 exec code in working,working
324 331 result = working.get(resultname)
325 332 finally:
326 333 for key in ns.iterkeys():
327 334 working.pop(key)
328 335 # if bound:
329 336 # working.update(bound_ns)
330 337
331 338 packed_result,buf = serialize_object(result)
332 339 result_buf = [packed_result]+buf
333 340 except:
334 341 exc_content = self._wrap_exception('apply')
335 342 # exc_msg = self.session.msg(u'pyerr', exc_content, parent)
336 343 self.session.send(self.iopub_stream, u'pyerr', exc_content, parent=parent,
337 344 ident='%s.pyerr'%self.prefix)
338 345 reply_content = exc_content
339 346 result_buf = []
340 347
341 348 if exc_content['ename'] == 'UnmetDependency':
342 349 sub['dependencies_met'] = False
343 350 else:
344 351 reply_content = {'status' : 'ok'}
345 352
346 353 # put 'ok'/'error' status in header, for scheduler introspection:
347 354 sub['status'] = reply_content['status']
348 355
349 356 reply_msg = self.session.send(stream, u'apply_reply', reply_content,
350 357 parent=parent, ident=ident,buffers=result_buf, subheader=sub)
351 358
352 359 # flush i/o
353 360 # should this be before reply_msg is sent, like in the single-kernel code,
354 361 # or should nothing get in the way of real results?
355 362 sys.stdout.flush()
356 363 sys.stderr.flush()
357 364
358 365 def dispatch_queue(self, stream, msg):
359 366 self.control_stream.flush()
360 367 idents,msg = self.session.feed_identities(msg, copy=False)
361 368 try:
362 369 msg = self.session.unpack_message(msg, content=True, copy=False)
363 370 except:
364 371 self.log.error("Invalid Message", exc_info=True)
365 372 return
366 373
367 374
368 375 header = msg['header']
369 376 msg_id = header['msg_id']
370 377 if self.check_aborted(msg_id):
371 378 self.aborted.remove(msg_id)
372 379 # is it safe to assume a msg_id will not be resubmitted?
373 380 reply_type = msg['msg_type'].split('_')[0] + '_reply'
374 381 status = {'status' : 'aborted'}
375 382 reply_msg = self.session.send(stream, reply_type, subheader=status,
376 383 content=status, parent=msg, ident=idents)
377 384 return
378 385 handler = self.shell_handlers.get(msg['msg_type'], None)
379 386 if handler is None:
380 387 self.log.error("UNKNOWN MESSAGE TYPE: %r"%msg['msg_type'])
381 388 else:
382 389 handler(stream, idents, msg)
383 390
384 391 def start(self):
385 392 #### stream mode:
386 393 if self.control_stream:
387 394 self.control_stream.on_recv(self.dispatch_control, copy=False)
388 395 self.control_stream.on_err(printer)
389 396
390 397 def make_dispatcher(stream):
391 398 def dispatcher(msg):
392 399 return self.dispatch_queue(stream, msg)
393 400 return dispatcher
394 401
395 402 for s in self.shell_streams:
396 403 s.on_recv(make_dispatcher(s), copy=False)
397 404 s.on_err(printer)
398 405
399 406 if self.iopub_stream:
400 407 self.iopub_stream.on_err(printer)
401 408
402 409 #### while True mode:
403 410 # while True:
404 411 # idle = True
405 412 # try:
406 413 # msg = self.shell_stream.socket.recv_multipart(
407 414 # zmq.NOBLOCK, copy=False)
408 415 # except zmq.ZMQError, e:
409 416 # if e.errno != zmq.EAGAIN:
410 417 # raise e
411 418 # else:
412 419 # idle=False
413 420 # self.dispatch_queue(self.shell_stream, msg)
414 421 #
415 422 # if not self.task_stream.empty():
416 423 # idle=False
417 424 # msg = self.task_stream.recv_multipart()
418 425 # self.dispatch_queue(self.task_stream, msg)
419 426 # if idle:
420 427 # # don't busywait
421 428 # time.sleep(1e-3)
422 429
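
# A self-contained sketch of the name-mangling trick apply_request()
# uses above: the function and its arguments get collision-safe
# temporary names in the working namespace, the call is exec'd there,
# and the temporaries are removed afterwards. The msg_id and function
# here are hypothetical.
msg_id = 'de305d54-75b4'
working = {'x': 10}                      # stands in for self.user_ns
prefix = "_" + str(msg_id).replace("-", "") + "_"

f, args, kwargs = (lambda a, b=0: a + b), (1,), {'b': 2}
ns = {prefix + "f": f, prefix + "args": args,
      prefix + "kwargs": kwargs, prefix + "result": None}
working.update(ns)
code = "%sresult = %sf(*%sargs, **%skwargs)" % ((prefix,) * 4)
try:
    exec(code, working, working)
    result = working.get(prefix + "result")
finally:
    for key in ns:
        working.pop(key)
print(result)                            # -> 3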
@@ -1,313 +1,319 b''
1 1 # encoding: utf-8
2 2
3 """Classes and functions for kernel related errors and exceptions."""
3 """Classes and functions for kernel related errors and exceptions.
4
5 Authors:
6
7 * Brian Granger
8 * Min RK
9 """
4 10 from __future__ import print_function
5 11
6 12 import sys
7 13 import traceback
8 14
9 15 __docformat__ = "restructuredtext en"
10 16
11 17 # Tell nose to skip this module
12 18 __test__ = {}
13 19
14 20 #-------------------------------------------------------------------------------
15 # Copyright (C) 2008 The IPython Development Team
21 # Copyright (C) 2008-2011 The IPython Development Team
16 22 #
17 23 # Distributed under the terms of the BSD License. The full license is in
18 24 # the file COPYING, distributed as part of this software.
19 25 #-------------------------------------------------------------------------------
20 26
21 27 #-------------------------------------------------------------------------------
22 28 # Error classes
23 29 #-------------------------------------------------------------------------------
24 30 class IPythonError(Exception):
25 31 """Base exception that all of our exceptions inherit from.
26 32
27 33 This can be raised by code that doesn't have any more specific
28 34 information."""
29 35
30 36 pass
31 37
32 38 # Exceptions associated with the controller objects
33 39 class ControllerError(IPythonError): pass
34 40
35 41 class ControllerCreationError(ControllerError): pass
36 42
37 43
38 44 # Exceptions associated with the Engines
39 45 class EngineError(IPythonError): pass
40 46
41 47 class EngineCreationError(EngineError): pass
42 48
43 49 class KernelError(IPythonError):
44 50 pass
45 51
46 52 class NotDefined(KernelError):
47 53 def __init__(self, name):
48 54 self.name = name
49 55 self.args = (name,)
50 56
51 57 def __repr__(self):
52 58 return '<NotDefined: %s>' % self.name
53 59
54 60 __str__ = __repr__
55 61
56 62
57 63 class QueueCleared(KernelError):
58 64 pass
59 65
60 66
61 67 class IdInUse(KernelError):
62 68 pass
63 69
64 70
65 71 class ProtocolError(KernelError):
66 72 pass
67 73
68 74
69 75 class ConnectionError(KernelError):
70 76 pass
71 77
72 78
73 79 class InvalidEngineID(KernelError):
74 80 pass
75 81
76 82
77 83 class NoEnginesRegistered(KernelError):
78 84 pass
79 85
80 86
81 87 class InvalidClientID(KernelError):
82 88 pass
83 89
84 90
85 91 class InvalidDeferredID(KernelError):
86 92 pass
87 93
88 94
89 95 class SerializationError(KernelError):
90 96 pass
91 97
92 98
93 99 class MessageSizeError(KernelError):
94 100 pass
95 101
96 102
97 103 class PBMessageSizeError(MessageSizeError):
98 104 pass
99 105
100 106
101 107 class ResultNotCompleted(KernelError):
102 108 pass
103 109
104 110
105 111 class ResultAlreadyRetrieved(KernelError):
106 112 pass
107 113
108 114 class ClientError(KernelError):
109 115 pass
110 116
111 117
112 118 class TaskAborted(KernelError):
113 119 pass
114 120
115 121
116 122 class TaskTimeout(KernelError):
117 123 pass
118 124
119 125
120 126 class NotAPendingResult(KernelError):
121 127 pass
122 128
123 129
124 130 class UnpickleableException(KernelError):
125 131 pass
126 132
127 133
128 134 class AbortedPendingDeferredError(KernelError):
129 135 pass
130 136
131 137
132 138 class InvalidProperty(KernelError):
133 139 pass
134 140
135 141
136 142 class MissingBlockArgument(KernelError):
137 143 pass
138 144
139 145
140 146 class StopLocalExecution(KernelError):
141 147 pass
142 148
143 149
144 150 class SecurityError(KernelError):
145 151 pass
146 152
147 153
148 154 class FileTimeoutError(KernelError):
149 155 pass
150 156
151 157 class TimeoutError(KernelError):
152 158 pass
153 159
154 160 class UnmetDependency(KernelError):
155 161 pass
156 162
157 163 class ImpossibleDependency(UnmetDependency):
158 164 pass
159 165
160 166 class DependencyTimeout(ImpossibleDependency):
161 167 pass
162 168
163 169 class InvalidDependency(ImpossibleDependency):
164 170 pass
165 171
166 172 class RemoteError(KernelError):
167 173 """Error raised elsewhere"""
168 174 ename=None
169 175 evalue=None
170 176 traceback=None
171 177 engine_info=None
172 178
173 179 def __init__(self, ename, evalue, traceback, engine_info=None):
174 180 self.ename=ename
175 181 self.evalue=evalue
176 182 self.traceback=traceback
177 183 self.engine_info=engine_info or {}
178 184 self.args=(ename, evalue)
179 185
180 186 def __repr__(self):
181 187 engineid = self.engine_info.get('engine_id', ' ')
182 188 return "<Remote[%s]:%s(%s)>"%(engineid, self.ename, self.evalue)
183 189
184 190 def __str__(self):
185 191 sig = "%s(%s)"%(self.ename, self.evalue)
186 192 if self.traceback:
187 193 return sig + '\n' + self.traceback
188 194 else:
189 195 return sig
190 196
191 197
192 198 class TaskRejectError(KernelError):
193 199 """Exception to raise when a task should be rejected by an engine.
194 200
195 201 This exception can be used to allow a task running on an engine to test
196 202 if the engine (or the user's namespace on the engine) has the needed
197 203 task dependencies. If not, the task should raise this exception. For
198 204 the task to be retried on another engine, the task should be created
199 205 with the `retries` argument > 1.
200 206
201 207 The advantage of this approach over our older properties system is that
202 208 tasks have full access to the user's namespace on the engines and the
203 209 properties don't have to be managed or tested by the controller.
204 210 """
205 211
206 212
207 213 class CompositeError(RemoteError):
208 214 """Error for representing possibly multiple errors on engines"""
209 215 def __init__(self, message, elist):
210 216 Exception.__init__(self, *(message, elist))
211 217 # Don't use pack_exception because it will conflict with the .message
212 218 # attribute that is being deprecated in 2.6 and beyond.
213 219 self.msg = message
214 220 self.elist = elist
215 221 self.args = [ e[0] for e in elist ]
216 222
217 223 def _get_engine_str(self, ei):
218 224 if not ei:
219 225 return '[Engine Exception]'
220 226 else:
221 227 return '[%s:%s]: ' % (ei['engine_id'], ei['method'])
222 228
223 229 def _get_traceback(self, ev):
224 230 try:
225 231 tb = ev._ipython_traceback_text
226 232 except AttributeError:
227 233 return 'No traceback available'
228 234 else:
229 235 return tb
230 236
231 237 def __str__(self):
232 238 s = str(self.msg)
233 239 for en, ev, etb, ei in self.elist:
234 240 engine_str = self._get_engine_str(ei)
235 241 s = s + '\n' + engine_str + en + ': ' + str(ev)
236 242 return s
237 243
238 244 def __repr__(self):
239 245 return "CompositeError(%i)"%len(self.elist)
240 246
241 247 def print_tracebacks(self, excid=None):
242 248 if excid is None:
243 249 for (en,ev,etb,ei) in self.elist:
244 250 print (self._get_engine_str(ei))
245 251 print (etb or 'No traceback available')
246 252 print ()
247 253 else:
248 254 try:
249 255 en,ev,etb,ei = self.elist[excid]
250 256 except:
251 257 raise IndexError("an exception with index %i does not exist"%excid)
252 258 else:
253 259 print (self._get_engine_str(ei))
254 260 print (etb or 'No traceback available')
255 261
256 262 def raise_exception(self, excid=0):
257 263 try:
258 264 en,ev,etb,ei = self.elist[excid]
259 265 except:
260 266 raise IndexError("an exception with index %i does not exist"%excid)
261 267 else:
262 268 raise RemoteError(en, ev, etb, ei)
263 269
264 270
265 271 def collect_exceptions(rdict_or_list, method='unspecified'):
266 272 """check a result dict for errors, and raise CompositeError if any exist.
267 273 Passthrough otherwise."""
268 274 elist = []
269 275 if isinstance(rdict_or_list, dict):
270 276 rlist = rdict_or_list.values()
271 277 else:
272 278 rlist = rdict_or_list
273 279 for r in rlist:
274 280 if isinstance(r, RemoteError):
275 281 en, ev, etb, ei = r.ename, r.evalue, r.traceback, r.engine_info
276 282 # Sometimes we could have CompositeError in our list. Just take
277 283 # the errors out of them and put them in our new list. This
278 284 # has the effect of flattening lists of CompositeErrors into one
279 285 # CompositeError
280 286 if en=='CompositeError':
281 287 for e in ev.elist:
282 288 elist.append(e)
283 289 else:
284 290 elist.append((en, ev, etb, ei))
285 291 if len(elist)==0:
286 292 return rdict_or_list
287 293 else:
288 294 msg = "one or more exceptions from call to method: %s" % (method)
289 295 # This silliness is needed so the debugger has access to the exception
290 296 # instance (e in this case)
291 297 try:
292 298 raise CompositeError(msg, elist)
293 299 except CompositeError as e:
294 300 raise e
295 301
296 302 def wrap_exception(engine_info={}):
297 303 etype, evalue, tb = sys.exc_info()
298 304 stb = traceback.format_exception(etype, evalue, tb)
299 305 exc_content = {
300 306 'status' : 'error',
301 307 'traceback' : stb,
302 308 'ename' : unicode(etype.__name__),
303 309 'evalue' : unicode(evalue),
304 310 'engine_info' : engine_info
305 311 }
306 312 return exc_content
307 313
308 314 def unwrap_exception(content):
309 315 err = RemoteError(content['ename'], content['evalue'],
310 316 ''.join(content['traceback']),
311 317 content.get('engine_info', {}))
312 318 return err
313 319
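
# A minimal sketch of the round trip the helpers above provide: an
# exception is captured with wrap_exception() where it is raised, and
# rebuilt as a RemoteError with unwrap_exception() on the other side.
try:
    1 / 0
except:
    content = wrap_exception(dict(engine_id=0, method='execute'))

err = unwrap_exception(content)
print(repr(err))     # -> <Remote[0]:ZeroDivisionError(...)>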
@@ -1,72 +1,77 b''
1 """Base config factories."""
1 """Base config factories.
2
3 Authors:
4
5 * Min RK
6 """
2 7
3 8 #-----------------------------------------------------------------------------
4 9 # Copyright (C) 2010-2011 The IPython Development Team
5 10 #
6 11 # Distributed under the terms of the BSD License. The full license is in
7 12 # the file COPYING, distributed as part of this software.
8 13 #-----------------------------------------------------------------------------
9 14
10 15 #-----------------------------------------------------------------------------
11 16 # Imports
12 17 #-----------------------------------------------------------------------------
13 18
14 19
15 20 import logging
16 21 import os
17 22
18 23 import zmq
19 24 from zmq.eventloop.ioloop import IOLoop
20 25
21 26 from IPython.config.configurable import Configurable
22 27 from IPython.utils.traitlets import Int, Instance, Unicode
23 28
24 29 from IPython.parallel.util import select_random_ports
25 30 from IPython.zmq.session import Session, SessionFactory
26 31
27 32 #-----------------------------------------------------------------------------
28 33 # Classes
29 34 #-----------------------------------------------------------------------------
30 35
31 36
32 37 class RegistrationFactory(SessionFactory):
33 38 """The Base Configurable for objects that involve registration."""
34 39
35 40 url = Unicode('', config=True,
36 41 help="""The 0MQ url used for registration. This sets transport, ip, and port
37 42 in one variable. For example: url='tcp://127.0.0.1:12345' or
38 43 url='epgm://*:90210'""") # url takes precedence over ip,regport,transport
39 44 transport = Unicode('tcp', config=True,
40 45 help="""The 0MQ transport for communications. This will likely be
41 46 the default of 'tcp', but other values include 'ipc', 'epgm', 'inproc'.""")
42 47 ip = Unicode('127.0.0.1', config=True,
43 48 help="""The IP address for registration. This is generally either
44 49 '127.0.0.1' for loopback only or '*' for all interfaces.
45 50 [default: '127.0.0.1']""")
46 51 regport = Int(config=True,
47 52 help="""The port on which the Hub listens for registration.""")
48 53 def _regport_default(self):
49 54 return select_random_ports(1)[0]
50 55
51 56 def __init__(self, **kwargs):
52 57 super(RegistrationFactory, self).__init__(**kwargs)
53 58 self._propagate_url()
54 59 self._rebuild_url()
55 60 self.on_trait_change(self._propagate_url, 'url')
56 61 self.on_trait_change(self._rebuild_url, 'ip')
57 62 self.on_trait_change(self._rebuild_url, 'transport')
58 63 self.on_trait_change(self._rebuild_url, 'regport')
59 64
60 65 def _rebuild_url(self):
61 66 self.url = "%s://%s:%i"%(self.transport, self.ip, self.regport)
62 67
63 68 def _propagate_url(self):
64 69 """Ensure self.url contains full transport://interface:port"""
65 70 if self.url:
66 71 iface = self.url.split('://',1)
67 72 if len(iface) == 2:
68 73 self.transport,iface = iface
69 74 iface = iface.split(':')
70 75 self.ip = iface[0]
71 76 if iface[1]:
72 77 self.regport = int(iface[1])
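
# A self-contained sketch of the url <-> (transport, ip, regport) round
# trip implemented by _propagate_url()/_rebuild_url() above, using plain
# string handling; the address is a hypothetical example.
url = 'tcp://127.0.0.1:12345'
transport, iface = url.split('://', 1)
ip, port = iface.split(':')
print("%s %s %i" % (transport, ip, int(port)))    # -> tcp 127.0.0.1 12345
print("%s://%s:%i" % (transport, ip, int(port)))  # rebuilds the url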
@@ -1,129 +1,134 b''
1 """base class for parallel client tests"""
1 """base class for parallel client tests
2
3 Authors:
4
5 * Min RK
6 """
2 7
3 8 #-------------------------------------------------------------------------------
4 9 # Copyright (C) 2011 The IPython Development Team
5 10 #
6 11 # Distributed under the terms of the BSD License. The full license is in
7 12 # the file COPYING, distributed as part of this software.
8 13 #-------------------------------------------------------------------------------
9 14
10 15 import sys
11 16 import tempfile
12 17 import time
13 18
14 19 from nose import SkipTest
15 20
16 21 import zmq
17 22 from zmq.tests import BaseZMQTestCase
18 23
19 24 from IPython.external.decorator import decorator
20 25
21 26 from IPython.parallel import error
22 27 from IPython.parallel import Client
23 28
24 29 from IPython.parallel.tests import launchers, add_engines
25 30
26 31 # simple tasks for use in apply tests
27 32
28 33 def segfault():
29 34 """this will segfault"""
30 35 import ctypes
31 36 ctypes.memset(-1,0,1)
32 37
33 38 def crash():
34 39 """from stdlib crashers in the test suite"""
35 40 import types
36 41 if sys.platform.startswith('win'):
37 42 import ctypes
38 43 ctypes.windll.kernel32.SetErrorMode(0x0002);
39 44
40 45 co = types.CodeType(0, 0, 0, 0, b'\x04\x71\x00\x00',
41 46 (), (), (), '', '', 1, b'')
42 47 exec(co)
43 48
44 49 def wait(n):
45 50 """sleep for a time"""
46 51 import time
47 52 time.sleep(n)
48 53 return n
49 54
50 55 def raiser(eclass):
51 56 """raise an exception"""
52 57 raise eclass()
53 58
54 59 # test decorator for skipping tests when libraries are unavailable
55 60 def skip_without(*names):
56 61 """skip a test if some names are not importable"""
57 62 @decorator
58 63 def skip_without_names(f, *args, **kwargs):
59 64         """decorator to skip tests when the named modules are missing."""
60 65 for name in names:
61 66 try:
62 67 __import__(name)
63 68 except ImportError:
64 69 raise SkipTest
65 70 return f(*args, **kwargs)
66 71 return skip_without_names
67 72
68 73 class ClusterTestCase(BaseZMQTestCase):
69 74
70 75 def add_engines(self, n=1, block=True):
71 76 """add multiple engines to our cluster"""
72 77 self.engines.extend(add_engines(n))
73 78 if block:
74 79 self.wait_on_engines()
75 80
76 81 def wait_on_engines(self, timeout=5):
77 82 """wait for our engines to connect."""
78 83 n = len(self.engines)+self.base_engine_count
79 84 tic = time.time()
80 85 while time.time()-tic < timeout and len(self.client.ids) < n:
81 86 time.sleep(0.1)
82 87
83 88 assert not len(self.client.ids) < n, "waiting for engines timed out"
84 89
85 90 def connect_client(self):
86 91 """connect a client with my Context, and track its sockets for cleanup"""
87 92 c = Client(profile='iptest', context=self.context)
88 93 for name in filter(lambda n:n.endswith('socket'), dir(c)):
89 94 s = getattr(c, name)
90 95 s.setsockopt(zmq.LINGER, 0)
91 96 self.sockets.append(s)
92 97 return c
93 98
94 99 def assertRaisesRemote(self, etype, f, *args, **kwargs):
95 100 try:
96 101 try:
97 102 f(*args, **kwargs)
98 103 except error.CompositeError as e:
99 104 e.raise_exception()
100 105 except error.RemoteError as e:
101 106 self.assertEquals(etype.__name__, e.ename, "Should have raised %r, but raised %r"%(etype.__name__, e.ename))
102 107 else:
103 108 self.fail("should have raised a RemoteError")
104 109
105 110 def setUp(self):
106 111 BaseZMQTestCase.setUp(self)
107 112 self.client = self.connect_client()
108 113 # start every test with clean engine namespaces:
109 114 self.client.clear(block=True)
110 115 self.base_engine_count=len(self.client.ids)
111 116 self.engines=[]
112 117
113 118 def tearDown(self):
114 119 # self.client.clear(block=True)
115 120 # close fds:
116 121 for e in filter(lambda e: e.poll() is not None, launchers):
117 122 launchers.remove(e)
118 123
119 124 # allow flushing of incoming messages to prevent crash on socket close
120 125 self.client.wait(timeout=2)
121 126 # time.sleep(2)
122 127 self.client.spin()
123 128 self.client.close()
124 129 BaseZMQTestCase.tearDown(self)
125 130 # this will be redundant when pyzmq merges PR #88
126 131 # self.context.term()
127 132 # print tempfile.TemporaryFile().fileno(),
128 133 # sys.stdout.flush()
129 134 No newline at end of file
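
# An illustrative application of the skip_without decorator above;
# 'numpy' is just an example dependency, and this test class is
# hypothetical rather than part of the suite.
class ExampleTests(ClusterTestCase):

    @skip_without('numpy')
    def test_push_array(self):
        import numpy
        view = self.client[:]
        view.push(dict(a=numpy.arange(4)), block=True)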
@@ -1,68 +1,73 b''
1 """Tests for asyncresult.py"""
1 """Tests for asyncresult.py
2
3 Authors:
4
5 * Min RK
6 """
2 7
3 8 #-------------------------------------------------------------------------------
4 9 # Copyright (C) 2011 The IPython Development Team
5 10 #
6 11 # Distributed under the terms of the BSD License. The full license is in
7 12 # the file COPYING, distributed as part of this software.
8 13 #-------------------------------------------------------------------------------
9 14
10 15 #-------------------------------------------------------------------------------
11 16 # Imports
12 17 #-------------------------------------------------------------------------------
13 18
14 19
15 20 from IPython.parallel.error import TimeoutError
16 21
17 22 from IPython.parallel.tests import add_engines
18 23 from .clienttest import ClusterTestCase
19 24
20 25 def setup():
21 26 add_engines(2)
22 27
23 28 def wait(n):
24 29 import time
25 30 time.sleep(n)
26 31 return n
27 32
28 33 class AsyncResultTest(ClusterTestCase):
29 34
30 35 def test_single_result(self):
31 36 eid = self.client.ids[-1]
32 37 ar = self.client[eid].apply_async(lambda : 42)
33 38 self.assertEquals(ar.get(), 42)
34 39 ar = self.client[[eid]].apply_async(lambda : 42)
35 40 self.assertEquals(ar.get(), [42])
36 41 ar = self.client[-1:].apply_async(lambda : 42)
37 42 self.assertEquals(ar.get(), [42])
38 43
39 44 def test_get_after_done(self):
40 45 ar = self.client[-1].apply_async(lambda : 42)
41 46 ar.wait()
42 47 self.assertTrue(ar.ready())
43 48 self.assertEquals(ar.get(), 42)
44 49 self.assertEquals(ar.get(), 42)
45 50
46 51 def test_get_before_done(self):
47 52 ar = self.client[-1].apply_async(wait, 0.1)
48 53 self.assertRaises(TimeoutError, ar.get, 0)
49 54 ar.wait(0)
50 55 self.assertFalse(ar.ready())
51 56 self.assertEquals(ar.get(), 0.1)
52 57
53 58 def test_get_after_error(self):
54 59 ar = self.client[-1].apply_async(lambda : 1/0)
55 60 ar.wait()
56 61 self.assertRaisesRemote(ZeroDivisionError, ar.get)
57 62 self.assertRaisesRemote(ZeroDivisionError, ar.get)
58 63 self.assertRaisesRemote(ZeroDivisionError, ar.get_dict)
59 64
60 65 def test_get_dict(self):
61 66 n = len(self.client)
62 67 ar = self.client[:].apply_async(lambda : 5)
63 68 self.assertEquals(ar.get(), [5]*n)
64 69 d = ar.get_dict()
65 70 self.assertEquals(sorted(d.keys()), sorted(self.client.ids))
66 71 for eid,r in d.iteritems():
67 72 self.assertEquals(r, 5)
68 73
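
# The AsyncResult call sequence the tests above exercise, in the usual
# order; assumes a connected client `rc` (a hypothetical name) and the
# wait() helper defined above.
ar = rc[-1].apply_async(wait, 0.1)   # submit to the last engine
ar.wait()                            # block until the result arrives
assert ar.ready()
print(ar.get())                      # -> 0.1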
@@ -1,244 +1,249 b''
1 """Tests for parallel client.py"""
1 """Tests for parallel client.py
2
3 Authors:
4
5 * Min RK
6 """
2 7
3 8 #-------------------------------------------------------------------------------
4 9 # Copyright (C) 2011 The IPython Development Team
5 10 #
6 11 # Distributed under the terms of the BSD License. The full license is in
7 12 # the file COPYING, distributed as part of this software.
8 13 #-------------------------------------------------------------------------------
9 14
10 15 #-------------------------------------------------------------------------------
11 16 # Imports
12 17 #-------------------------------------------------------------------------------
13 18
14 19 import time
15 20 from datetime import datetime
16 21 from tempfile import mktemp
17 22
18 23 import zmq
19 24
20 25 from IPython.parallel.client import client as clientmod
21 26 from IPython.parallel import error
22 27 from IPython.parallel import AsyncResult, AsyncHubResult
23 28 from IPython.parallel import LoadBalancedView, DirectView
24 29
25 30 from clienttest import ClusterTestCase, segfault, wait, add_engines
26 31
27 32 def setup():
28 33 add_engines(4)
29 34
30 35 class TestClient(ClusterTestCase):
31 36
32 37 def test_ids(self):
33 38 n = len(self.client.ids)
34 39 self.add_engines(3)
35 40 self.assertEquals(len(self.client.ids), n+3)
36 41
37 42 def test_view_indexing(self):
38 43 """test index access for views"""
39 44 self.add_engines(2)
40 45 targets = self.client._build_targets('all')[-1]
41 46 v = self.client[:]
42 47 self.assertEquals(v.targets, targets)
43 48 t = self.client.ids[2]
44 49 v = self.client[t]
45 50 self.assert_(isinstance(v, DirectView))
46 51 self.assertEquals(v.targets, t)
47 52 t = self.client.ids[2:4]
48 53 v = self.client[t]
49 54 self.assert_(isinstance(v, DirectView))
50 55 self.assertEquals(v.targets, t)
51 56 v = self.client[::2]
52 57 self.assert_(isinstance(v, DirectView))
53 58 self.assertEquals(v.targets, targets[::2])
54 59 v = self.client[1::3]
55 60 self.assert_(isinstance(v, DirectView))
56 61 self.assertEquals(v.targets, targets[1::3])
57 62 v = self.client[:-3]
58 63 self.assert_(isinstance(v, DirectView))
59 64 self.assertEquals(v.targets, targets[:-3])
60 65 v = self.client[-1]
61 66 self.assert_(isinstance(v, DirectView))
62 67 self.assertEquals(v.targets, targets[-1])
63 68 self.assertRaises(TypeError, lambda : self.client[None])
64 69
65 70 def test_lbview_targets(self):
66 71 """test load_balanced_view targets"""
67 72 v = self.client.load_balanced_view()
68 73 self.assertEquals(v.targets, None)
69 74 v = self.client.load_balanced_view(-1)
70 75 self.assertEquals(v.targets, [self.client.ids[-1]])
71 76 v = self.client.load_balanced_view('all')
72 77 self.assertEquals(v.targets, self.client.ids)
73 78
74 79 def test_targets(self):
75 80 """test various valid targets arguments"""
76 81 build = self.client._build_targets
77 82 ids = self.client.ids
78 83 idents,targets = build(None)
79 84 self.assertEquals(ids, targets)
80 85
81 86 def test_clear(self):
82 87 """test clear behavior"""
83 88 # self.add_engines(2)
84 89 v = self.client[:]
85 90 v.block=True
86 91 v.push(dict(a=5))
87 92 v.pull('a')
88 93 id0 = self.client.ids[-1]
89 94 self.client.clear(targets=id0, block=True)
90 95 a = self.client[:-1].get('a')
91 96 self.assertRaisesRemote(NameError, self.client[id0].get, 'a')
92 97 self.client.clear(block=True)
93 98 for i in self.client.ids:
94 99 # print i
95 100 self.assertRaisesRemote(NameError, self.client[i].get, 'a')
96 101
97 102 def test_get_result(self):
98 103 """test getting results from the Hub."""
99 104 c = clientmod.Client(profile='iptest')
100 105 # self.add_engines(1)
101 106 t = c.ids[-1]
102 107 ar = c[t].apply_async(wait, 1)
103 108 # give the monitor time to notice the message
104 109 time.sleep(.25)
105 110 ahr = self.client.get_result(ar.msg_ids)
106 111 self.assertTrue(isinstance(ahr, AsyncHubResult))
107 112 self.assertEquals(ahr.get(), ar.get())
108 113 ar2 = self.client.get_result(ar.msg_ids)
109 114 self.assertFalse(isinstance(ar2, AsyncHubResult))
110 115 c.close()
111 116
112 117 def test_ids_list(self):
113 118 """test client.ids"""
114 119 # self.add_engines(2)
115 120 ids = self.client.ids
116 121 self.assertEquals(ids, self.client._ids)
117 122 self.assertFalse(ids is self.client._ids)
118 123 ids.remove(ids[-1])
119 124 self.assertNotEquals(ids, self.client._ids)
120 125
121 126 def test_queue_status(self):
122 127 # self.addEngine(4)
123 128 ids = self.client.ids
124 129 id0 = ids[0]
125 130 qs = self.client.queue_status(targets=id0)
126 131 self.assertTrue(isinstance(qs, dict))
127 132 self.assertEquals(sorted(qs.keys()), ['completed', 'queue', 'tasks'])
128 133 allqs = self.client.queue_status()
129 134 self.assertTrue(isinstance(allqs, dict))
130 135 self.assertEquals(sorted(allqs.keys()), sorted(self.client.ids + ['unassigned']))
131 136 unassigned = allqs.pop('unassigned')
132 137 for eid,qs in allqs.items():
133 138 self.assertTrue(isinstance(qs, dict))
134 139 self.assertEquals(sorted(qs.keys()), ['completed', 'queue', 'tasks'])
135 140
136 141 def test_shutdown(self):
137 142 # self.addEngine(4)
138 143 ids = self.client.ids
139 144 id0 = ids[0]
140 145 self.client.shutdown(id0, block=True)
141 146 while id0 in self.client.ids:
142 147 time.sleep(0.1)
143 148 self.client.spin()
144 149
145 150 self.assertRaises(IndexError, lambda : self.client[id0])
146 151
147 152 def test_result_status(self):
148 153 pass
149 154 # to be written
150 155
151 156 def test_db_query_dt(self):
152 157 """test db query by date"""
153 158 hist = self.client.hub_history()
154 159 middle = self.client.db_query({'msg_id' : hist[len(hist)/2]})[0]
155 160 tic = middle['submitted']
156 161 before = self.client.db_query({'submitted' : {'$lt' : tic}})
157 162 after = self.client.db_query({'submitted' : {'$gte' : tic}})
158 163 self.assertEquals(len(before)+len(after),len(hist))
159 164 for b in before:
160 165 self.assertTrue(b['submitted'] < tic)
161 166 for a in after:
162 167 self.assertTrue(a['submitted'] >= tic)
163 168 same = self.client.db_query({'submitted' : tic})
164 169 for s in same:
165 170 self.assertTrue(s['submitted'] == tic)
166 171
167 172 def test_db_query_keys(self):
168 173 """test extracting subset of record keys"""
169 174 found = self.client.db_query({'msg_id': {'$ne' : ''}},keys=['submitted', 'completed'])
170 175 for rec in found:
171 176 self.assertEquals(set(rec.keys()), set(['msg_id', 'submitted', 'completed']))
172 177
173 178 def test_db_query_msg_id(self):
174 179 """ensure msg_id is always in db queries"""
175 180 found = self.client.db_query({'msg_id': {'$ne' : ''}},keys=['submitted', 'completed'])
176 181 for rec in found:
177 182 self.assertTrue('msg_id' in rec.keys())
178 183 found = self.client.db_query({'msg_id': {'$ne' : ''}},keys=['submitted'])
179 184 for rec in found:
180 185 self.assertTrue('msg_id' in rec.keys())
181 186 found = self.client.db_query({'msg_id': {'$ne' : ''}},keys=['msg_id'])
182 187 for rec in found:
183 188 self.assertTrue('msg_id' in rec.keys())
184 189
185 190 def test_db_query_in(self):
186 191 """test db query with '$in','$nin' operators"""
187 192 hist = self.client.hub_history()
188 193 even = hist[::2]
189 194 odd = hist[1::2]
190 195 recs = self.client.db_query({ 'msg_id' : {'$in' : even}})
191 196 found = [ r['msg_id'] for r in recs ]
192 197 self.assertEquals(set(even), set(found))
193 198 recs = self.client.db_query({ 'msg_id' : {'$nin' : even}})
194 199 found = [ r['msg_id'] for r in recs ]
195 200 self.assertEquals(set(odd), set(found))
196 201
197 202 def test_hub_history(self):
198 203 hist = self.client.hub_history()
199 204 recs = self.client.db_query({ 'msg_id' : {"$ne":''}})
200 205 recdict = {}
201 206 for rec in recs:
202 207 recdict[rec['msg_id']] = rec
203 208
204 209 latest = datetime(1984,1,1)
205 210 for msg_id in hist:
206 211 rec = recdict[msg_id]
207 212 newt = rec['submitted']
208 213 self.assertTrue(newt >= latest)
209 214 latest = newt
210 215 ar = self.client[-1].apply_async(lambda : 1)
211 216 ar.get()
212 217 time.sleep(0.25)
213 218 self.assertEquals(self.client.hub_history()[-1:],ar.msg_ids)
214 219
215 220 def test_resubmit(self):
216 221 def f():
217 222 import random
218 223 return random.random()
219 224 v = self.client.load_balanced_view()
220 225 ar = v.apply_async(f)
221 226 r1 = ar.get(1)
222 227 ahr = self.client.resubmit(ar.msg_ids)
223 228 r2 = ahr.get(1)
224 229 self.assertFalse(r1 == r2)
225 230
226 231 def test_resubmit_inflight(self):
227 232 """ensure ValueError on resubmit of inflight task"""
228 233 v = self.client.load_balanced_view()
229 234 ar = v.apply_async(time.sleep,1)
230 235 # give the message a chance to arrive
231 236 time.sleep(0.2)
232 237 self.assertRaisesRemote(ValueError, self.client.resubmit, ar.msg_ids)
233 238 ar.get(2)
234 239
235 240 def test_resubmit_badkey(self):
236 241 """ensure KeyError on resubmit of nonexistant task"""
237 242 self.assertRaisesRemote(KeyError, self.client.resubmit, ['invalid'])
238 243
239 244 def test_purge_results(self):
240 245 hist = self.client.hub_history()
241 246 self.client.purge_results(hist)
242 247 newhist = self.client.hub_history()
243 248 self.assertTrue(len(newhist) == 0)
244 249
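
For orientation, a minimal sketch of the hub-database query API the client tests above exercise; it assumes a cluster already running under the 'iptest' profile:

    from IPython.parallel import Client

    rc = Client(profile='iptest')      # assumes a running 'iptest' cluster
    hist = rc.hub_history()            # msg_ids ordered by submission time
    # fetch only the timing keys; msg_id is always included in results
    recs = rc.db_query({'msg_id': {'$ne': ''}}, keys=['submitted', 'completed'])
    for rec in recs:
        assert set(rec.keys()) == set(['msg_id', 'submitted', 'completed'])
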
@@ -1,173 +1,178 b''
1 """Tests for db backends"""
1 """Tests for db backends
2
3 Authors:
4
5 * Min RK
6 """
2 7
3 8 #-------------------------------------------------------------------------------
4 9 # Copyright (C) 2011 The IPython Development Team
5 10 #
6 11 # Distributed under the terms of the BSD License. The full license is in
7 12 # the file COPYING, distributed as part of this software.
8 13 #-------------------------------------------------------------------------------
9 14
10 15 #-------------------------------------------------------------------------------
11 16 # Imports
12 17 #-------------------------------------------------------------------------------
13 18
14 19
15 20 import tempfile
16 21 import time
17 22
18 23 from datetime import datetime, timedelta
19 24 from unittest import TestCase
20 25
21 26 from nose import SkipTest
22 27
23 28 from IPython.parallel import error
24 29 from IPython.parallel.controller.dictdb import DictDB
25 30 from IPython.parallel.controller.sqlitedb import SQLiteDB
26 31 from IPython.parallel.controller.hub import init_record, empty_record
27 32
28 33 from IPython.zmq.session import Session
29 34
30 35
31 36 #-------------------------------------------------------------------------------
32 37 # TestCases
33 38 #-------------------------------------------------------------------------------
34 39
35 40 class TestDictBackend(TestCase):
36 41 def setUp(self):
37 42 self.session = Session()
38 43 self.db = self.create_db()
39 44 self.load_records(16)
40 45
41 46 def create_db(self):
42 47 return DictDB()
43 48
44 49 def load_records(self, n=1):
45 50 """load n records for testing"""
46 51 #sleep 1/10 s, to ensure the timestamp differs from previous calls
47 52 time.sleep(0.1)
48 53 msg_ids = []
49 54 for i in range(n):
50 55 msg = self.session.msg('apply_request', content=dict(a=5))
51 56 msg['buffers'] = []
52 57 rec = init_record(msg)
53 58 msg_ids.append(msg['msg_id'])
54 59 self.db.add_record(msg['msg_id'], rec)
55 60 return msg_ids
56 61
57 62 def test_add_record(self):
58 63 before = self.db.get_history()
59 64 self.load_records(5)
60 65 after = self.db.get_history()
61 66 self.assertEquals(len(after), len(before)+5)
62 67 self.assertEquals(after[:-5],before)
63 68
64 69 def test_drop_record(self):
65 70 msg_id = self.load_records()[-1]
66 71 rec = self.db.get_record(msg_id)
67 72 self.db.drop_record(msg_id)
68 73 self.assertRaises(KeyError,self.db.get_record, msg_id)
69 74
70 75 def _round_to_millisecond(self, dt):
71 76 """necessary because mongodb rounds microseconds"""
72 77 micro = dt.microsecond
73 78 extra = int(str(micro)[-3:])
74 79 return dt - timedelta(microseconds=extra)
75 80
76 81 def test_update_record(self):
77 82 now = self._round_to_millisecond(datetime.now())
78 83 #
79 84 msg_id = self.db.get_history()[-1]
80 85 rec1 = self.db.get_record(msg_id)
81 86 data = {'stdout': 'hello there', 'completed' : now}
82 87 self.db.update_record(msg_id, data)
83 88 rec2 = self.db.get_record(msg_id)
84 89 self.assertEquals(rec2['stdout'], 'hello there')
85 90 self.assertEquals(rec2['completed'], now)
86 91 rec1.update(data)
87 92 self.assertEquals(rec1, rec2)
88 93
89 94 # def test_update_record_bad(self):
90 95 # """test updating nonexistant records"""
91 96 # msg_id = str(uuid.uuid4())
92 97 # data = {'stdout': 'hello there'}
93 98 # self.assertRaises(KeyError, self.db.update_record, msg_id, data)
94 99
95 100 def test_find_records_dt(self):
96 101 """test finding records by date"""
97 102 hist = self.db.get_history()
98 103 middle = self.db.get_record(hist[len(hist)/2])
99 104 tic = middle['submitted']
100 105 before = self.db.find_records({'submitted' : {'$lt' : tic}})
101 106 after = self.db.find_records({'submitted' : {'$gte' : tic}})
102 107 self.assertEquals(len(before)+len(after),len(hist))
103 108 for b in before:
104 109 self.assertTrue(b['submitted'] < tic)
105 110 for a in after:
106 111 self.assertTrue(a['submitted'] >= tic)
107 112 same = self.db.find_records({'submitted' : tic})
108 113 for s in same:
109 114 self.assertTrue(s['submitted'] == tic)
110 115
111 116 def test_find_records_keys(self):
112 117 """test extracting subset of record keys"""
113 118 found = self.db.find_records({'msg_id': {'$ne' : ''}},keys=['submitted', 'completed'])
114 119 for rec in found:
115 120 self.assertEquals(set(rec.keys()), set(['msg_id', 'submitted', 'completed']))
116 121
117 122 def test_find_records_msg_id(self):
118 123 """ensure msg_id is always in found records"""
119 124 found = self.db.find_records({'msg_id': {'$ne' : ''}},keys=['submitted', 'completed'])
120 125 for rec in found:
121 126 self.assertTrue('msg_id' in rec.keys())
122 127 found = self.db.find_records({'msg_id': {'$ne' : ''}},keys=['submitted'])
123 128 for rec in found:
124 129 self.assertTrue('msg_id' in rec.keys())
125 130 found = self.db.find_records({'msg_id': {'$ne' : ''}},keys=['msg_id'])
126 131 for rec in found:
127 132 self.assertTrue('msg_id' in rec.keys())
128 133
129 134 def test_find_records_in(self):
130 135 """test finding records with '$in','$nin' operators"""
131 136 hist = self.db.get_history()
132 137 even = hist[::2]
133 138 odd = hist[1::2]
134 139 recs = self.db.find_records({ 'msg_id' : {'$in' : even}})
135 140 found = [ r['msg_id'] for r in recs ]
136 141 self.assertEquals(set(even), set(found))
137 142 recs = self.db.find_records({ 'msg_id' : {'$nin' : even}})
138 143 found = [ r['msg_id'] for r in recs ]
139 144 self.assertEquals(set(odd), set(found))
140 145
141 146 def test_get_history(self):
142 147 msg_ids = self.db.get_history()
143 148 latest = datetime(1984,1,1)
144 149 for msg_id in msg_ids:
145 150 rec = self.db.get_record(msg_id)
146 151 newt = rec['submitted']
147 152 self.assertTrue(newt >= latest)
148 153 latest = newt
149 154 msg_id = self.load_records(1)[-1]
150 155 self.assertEquals(self.db.get_history()[-1],msg_id)
151 156
152 157 def test_datetime(self):
153 158 """get/set timestamps with datetime objects"""
154 159 msg_id = self.db.get_history()[-1]
155 160 rec = self.db.get_record(msg_id)
156 161 self.assertTrue(isinstance(rec['submitted'], datetime))
157 162 self.db.update_record(msg_id, dict(completed=datetime.now()))
158 163 rec = self.db.get_record(msg_id)
159 164 self.assertTrue(isinstance(rec['completed'], datetime))
160 165
161 166 def test_drop_matching(self):
162 167 msg_ids = self.load_records(10)
163 168 query = {'msg_id' : {'$in':msg_ids}}
164 169 self.db.drop_matching_records(query)
165 170 recs = self.db.find_records(query)
166 171 self.assertTrue(len(recs)==0)
167 172
168 173 class TestSQLiteBackend(TestDictBackend):
169 174 def create_db(self):
170 175 return SQLiteDB(location=tempfile.gettempdir())
171 176
172 177 def tearDown(self):
173 178 self.db._db.close()
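
The same query interface can be driven directly against a backend. A minimal sketch against DictDB, using a hand-built record ('msg-1' is a hypothetical id; real records are built by init_record from a message, as in setUp above):

    from datetime import datetime
    from IPython.parallel.controller.dictdb import DictDB

    db = DictDB()
    # a hypothetical minimal record, standing in for init_record output
    db.add_record('msg-1', {'msg_id': 'msg-1', 'submitted': datetime.now()})
    db.update_record('msg-1', {'completed': datetime.now()})
    rec = db.get_record('msg-1')
    assert isinstance(rec['completed'], datetime)
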
@@ -1,101 +1,106 b''
1 """Tests for dependency.py"""
1 """Tests for dependency.py
2
3 Authors:
4
5 * Min RK
6 """
2 7
3 8 __docformat__ = "restructuredtext en"
4 9
5 10 #-------------------------------------------------------------------------------
6 11 # Copyright (C) 2011 The IPython Development Team
7 12 #
8 13 # Distributed under the terms of the BSD License. The full license is in
9 14 # the file COPYING, distributed as part of this software.
10 15 #-------------------------------------------------------------------------------
11 16
12 17 #-------------------------------------------------------------------------------
13 18 # Imports
14 19 #-------------------------------------------------------------------------------
15 20
16 21 # import
17 22 import os
18 23
19 24 from IPython.utils.pickleutil import can, uncan
20 25
21 26 import IPython.parallel as pmod
22 27 from IPython.parallel.util import interactive
23 28
24 29 from IPython.parallel.tests import add_engines
25 30 from .clienttest import ClusterTestCase
26 31
27 32 def setup():
28 33 add_engines(1)
29 34
30 35 @pmod.require('time')
31 36 def wait(n):
32 37 time.sleep(n)
33 38 return n
34 39
35 40 mixed = map(str, range(10))
36 41 completed = map(str, range(0,10,2))
37 42 failed = map(str, range(1,10,2))
38 43
39 44 class DependencyTest(ClusterTestCase):
40 45
41 46 def setUp(self):
42 47 ClusterTestCase.setUp(self)
43 48 self.user_ns = {'__builtins__' : __builtins__}
44 49 self.view = self.client.load_balanced_view()
45 50 self.dview = self.client[-1]
46 51 self.succeeded = set(map(str, range(0,25,2)))
47 52 self.failed = set(map(str, range(1,25,2)))
48 53
49 54 def assertMet(self, dep):
50 55 self.assertTrue(dep.check(self.succeeded, self.failed), "Dependency should be met")
51 56
52 57 def assertUnmet(self, dep):
53 58 self.assertFalse(dep.check(self.succeeded, self.failed), "Dependency should not be met")
54 59
55 60 def assertUnreachable(self, dep):
56 61 self.assertTrue(dep.unreachable(self.succeeded, self.failed), "Dependency should be unreachable")
57 62
58 63 def assertReachable(self, dep):
59 64 self.assertFalse(dep.unreachable(self.succeeded, self.failed), "Dependency should be reachable")
60 65
61 66 def cancan(self, f):
62 67 """decorator to pass through canning into self.user_ns"""
63 68 return uncan(can(f), self.user_ns)
64 69
65 70 def test_require_imports(self):
66 71 """test that @require imports names"""
67 72 @self.cancan
68 73 @pmod.require('urllib')
69 74 @interactive
70 75 def encode(dikt):
71 76 return urllib.urlencode(dikt)
72 77 # must pass through canning to properly connect namespaces
73 78 self.assertEquals(encode(dict(a=5)), 'a=5')
74 79
75 80 def test_success_only(self):
76 81 dep = pmod.Dependency(mixed, success=True, failure=False)
77 82 self.assertUnmet(dep)
78 83 self.assertUnreachable(dep)
79 84 dep.all=False
80 85 self.assertMet(dep)
81 86 self.assertReachable(dep)
82 87 dep = pmod.Dependency(completed, success=True, failure=False)
83 88 self.assertMet(dep)
84 89 self.assertReachable(dep)
85 90 dep.all=False
86 91 self.assertMet(dep)
87 92 self.assertReachable(dep)
88 93
89 94 def test_failure_only(self):
90 95 dep = pmod.Dependency(mixed, success=False, failure=True)
91 96 self.assertUnmet(dep)
92 97 self.assertUnreachable(dep)
93 98 dep.all=False
94 99 self.assertMet(dep)
95 100 self.assertReachable(dep)
96 101 dep = pmod.Dependency(completed, success=False, failure=True)
97 102 self.assertUnmet(dep)
98 103 self.assertUnreachable(dep)
99 104 dep.all=False
100 105 self.assertUnmet(dep)
101 106 self.assertUnreachable(dep)
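
A sketch of how the Dependency objects above behave, assuming the constructor and attributes as used in these tests (success/failure flags, with the 'all' attribute toggling all-vs-any semantics):

    from IPython.parallel import Dependency

    succeeded = set(['a', 'b'])
    failed = set(['c'])
    dep = Dependency(['a', 'c'], success=True, failure=False)
    print dep.check(succeeded, failed)        # False: 'c' has not succeeded
    print dep.unreachable(succeeded, failed)  # True: 'c' already failed
    dep.all = False                           # any single success now suffices
    print dep.check(succeeded, failed)        # True: 'a' succeeded
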
@@ -1,120 +1,125 b''
1 """test LoadBalancedView objects"""
1 """test LoadBalancedView objects
2
3 Authors:
4
5 * Min RK
6 """
2 7 # -*- coding: utf-8 -*-
3 8 #-------------------------------------------------------------------------------
4 9 # Copyright (C) 2011 The IPython Development Team
5 10 #
6 11 # Distributed under the terms of the BSD License. The full license is in
7 12 # the file COPYING, distributed as part of this software.
8 13 #-------------------------------------------------------------------------------
9 14
10 15 #-------------------------------------------------------------------------------
11 16 # Imports
12 17 #-------------------------------------------------------------------------------
13 18
14 19 import sys
15 20 import time
16 21
17 22 import zmq
18 23
19 24 from IPython import parallel as pmod
20 25 from IPython.parallel import error
21 26
22 27 from IPython.parallel.tests import add_engines
23 28
24 29 from .clienttest import ClusterTestCase, crash, wait, skip_without
25 30
26 31 def setup():
27 32 add_engines(3)
28 33
29 34 class TestLoadBalancedView(ClusterTestCase):
30 35
31 36 def setUp(self):
32 37 ClusterTestCase.setUp(self)
33 38 self.view = self.client.load_balanced_view()
34 39
35 40 def test_z_crash_task(self):
36 41 """test graceful handling of engine death (balanced)"""
37 42 # self.add_engines(1)
38 43 ar = self.view.apply_async(crash)
39 44 self.assertRaisesRemote(error.EngineError, ar.get, 10)
40 45 eid = ar.engine_id
41 46 tic = time.time()
42 47 while eid in self.client.ids and time.time()-tic < 5:
43 48 time.sleep(.01)
44 49 self.client.spin()
45 50 self.assertFalse(eid in self.client.ids, "Engine should have died")
46 51
47 52 def test_map(self):
48 53 def f(x):
49 54 return x**2
50 55 data = range(16)
51 56 r = self.view.map_sync(f, data)
52 57 self.assertEquals(r, map(f, data))
53 58
54 59 def test_abort(self):
55 60 view = self.view
56 61 ar = self.client[:].apply_async(time.sleep, .5)
57 62 ar2 = view.apply_async(lambda : 2)
58 63 ar3 = view.apply_async(lambda : 3)
59 64 view.abort(ar2)
60 65 view.abort(ar3.msg_ids)
61 66 self.assertRaises(error.TaskAborted, ar2.get)
62 67 self.assertRaises(error.TaskAborted, ar3.get)
63 68
64 69 def test_retries(self):
65 70 add_engines(3)
66 71 view = self.view
67 72 view.timeout = 1 # prevent hang if this doesn't behave
68 73 def fail():
69 74 assert False
70 75 for r in range(len(self.client)-1):
71 76 with view.temp_flags(retries=r):
72 77 self.assertRaisesRemote(AssertionError, view.apply_sync, fail)
73 78
74 79 with view.temp_flags(retries=len(self.client), timeout=0.25):
75 80 self.assertRaisesRemote(error.TaskTimeout, view.apply_sync, fail)
76 81
77 82 def test_invalid_dependency(self):
78 83 view = self.view
79 84 with view.temp_flags(after='12345'):
80 85 self.assertRaisesRemote(error.InvalidDependency, view.apply_sync, lambda : 1)
81 86
82 87 def test_impossible_dependency(self):
83 88 if len(self.client) < 2:
84 89 add_engines(2)
85 90 view = self.client.load_balanced_view()
86 91 ar1 = view.apply_async(lambda : 1)
87 92 ar1.get()
88 93 e1 = ar1.engine_id
89 94 e2 = e1
90 95 while e2 == e1:
91 96 ar2 = view.apply_async(lambda : 1)
92 97 ar2.get()
93 98 e2 = ar2.engine_id
94 99
95 100 with view.temp_flags(follow=[ar1, ar2]):
96 101 self.assertRaisesRemote(error.ImpossibleDependency, view.apply_sync, lambda : 1)
97 102
98 103
99 104 def test_follow(self):
100 105 ar = self.view.apply_async(lambda : 1)
101 106 ar.get()
102 107 ars = []
103 108 first_id = ar.engine_id
104 109
105 110 self.view.follow = ar
106 111 for i in range(5):
107 112 ars.append(self.view.apply_async(lambda : 1))
108 113 self.view.wait(ars)
109 114 for ar in ars:
110 115 self.assertEquals(ar.engine_id, first_id)
111 116
112 117 def test_after(self):
113 118 view = self.view
114 119 ar = view.apply_async(time.sleep, 0.5)
115 120 with view.temp_flags(after=ar):
116 121 ar2 = view.apply_async(lambda : 1)
117 122
118 123 ar.wait()
119 124 ar2.wait()
120 125 self.assertTrue(ar2.started > ar.completed)
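
A hedged sketch of the load-balanced scheduler flags these tests cover ('after', 'retries', 'timeout'), again assuming a running 'iptest' cluster:

    from IPython.parallel import Client

    rc = Client(profile='iptest')
    v = rc.load_balanced_view()
    ar = v.apply_async(lambda : 1)
    # run a second task only after the first completes, retrying once on error
    with v.temp_flags(after=ar, retries=1, timeout=5):
        ar2 = v.apply_async(lambda : 2)
    print ar2.get()
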
@@ -1,37 +1,42 b''
1 """Tests for mongodb backend"""
1 """Tests for mongodb backend
2
3 Authors:
4
5 * Min RK
6 """
2 7
3 8 #-------------------------------------------------------------------------------
4 9 # Copyright (C) 2011 The IPython Development Team
5 10 #
6 11 # Distributed under the terms of the BSD License. The full license is in
7 12 # the file COPYING, distributed as part of this software.
8 13 #-------------------------------------------------------------------------------
9 14
10 15 #-------------------------------------------------------------------------------
11 16 # Imports
12 17 #-------------------------------------------------------------------------------
13 18
14 19 from nose import SkipTest
15 20
16 21 from pymongo import Connection
17 22 from IPython.parallel.controller.mongodb import MongoDB
18 23
19 24 from . import test_db
20 25
21 26 try:
22 27 c = Connection()
23 28 except Exception:
24 29 c=None
25 30
26 31 class TestMongoBackend(test_db.TestDictBackend):
27 32 """MongoDB backend tests"""
28 33
29 34 def create_db(self):
30 35 try:
31 36 return MongoDB(database='iptestdb', _connection=c)
32 37 except Exception:
33 38 raise SkipTest("Couldn't connect to mongodb")
34 39
35 40 def teardown(self):
36 41 if c is not None:
37 42 c.drop_database('iptestdb')
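
The MongoDB backend is constructed the same way the test above does; a minimal sketch assuming a local mongod is reachable:

    from pymongo import Connection
    from IPython.parallel.controller.mongodb import MongoDB

    c = Connection()                           # assumes mongod on localhost
    db = MongoDB(database='iptestdb', _connection=c)
    print db.get_history()                     # same interface as DictDB
    c.drop_database('iptestdb')                # drop the scratch database
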
@@ -1,108 +1,113 b''
1 """test serialization with newserialized"""
1 """test serialization with newserialized
2
3 Authors:
4
5 * Min RK
6 """
2 7
3 8 #-------------------------------------------------------------------------------
4 9 # Copyright (C) 2011 The IPython Development Team
5 10 #
6 11 # Distributed under the terms of the BSD License. The full license is in
7 12 # the file COPYING, distributed as part of this software.
8 13 #-------------------------------------------------------------------------------
9 14
10 15 #-------------------------------------------------------------------------------
11 16 # Imports
12 17 #-------------------------------------------------------------------------------
13 18
14 19 from unittest import TestCase
15 20
16 21 from IPython.testing.decorators import parametric
17 22 from IPython.utils import newserialized as ns
18 23 from IPython.utils.pickleutil import can, uncan, CannedObject, CannedFunction
19 24 from IPython.parallel.tests.clienttest import skip_without
20 25
21 26
22 27 class CanningTestCase(TestCase):
23 28 def test_canning(self):
24 29 d = dict(a=5,b=6)
25 30 cd = can(d)
26 31 self.assertTrue(isinstance(cd, dict))
27 32
28 33 def test_canned_function(self):
29 34 f = lambda : 7
30 35 cf = can(f)
31 36 self.assertTrue(isinstance(cf, CannedFunction))
32 37
33 38 @parametric
34 39 def test_can_roundtrip(cls):
35 40 objs = [
36 41 dict(),
37 42 set(),
38 43 list(),
39 44 ['a',1,['a',1],u'e'],
40 45 ]
41 46 return map(cls.run_roundtrip, objs)
42 47
43 48 @classmethod
44 49 def run_roundtrip(self, obj):
45 50 o = uncan(can(obj))
46 51 assert o == obj, "failed assertion: %r == %r"%(o,obj)
47 52
48 53 def test_serialized_interfaces(self):
49 54
50 55 us = {'a':10, 'b':range(10)}
51 56 s = ns.serialize(us)
52 57 uus = ns.unserialize(s)
53 58 self.assertTrue(isinstance(s, ns.SerializeIt))
54 59 self.assertEquals(uus, us)
55 60
56 61 def test_pickle_serialized(self):
57 62 obj = {'a':1.45345, 'b':'asdfsdf', 'c':10000L}
58 63 original = ns.UnSerialized(obj)
59 64 originalSer = ns.SerializeIt(original)
60 65 firstData = originalSer.getData()
61 66 firstTD = originalSer.getTypeDescriptor()
62 67 firstMD = originalSer.getMetadata()
63 68 self.assertEquals(firstTD, 'pickle')
64 69 self.assertEquals(firstMD, {})
65 70 unSerialized = ns.UnSerializeIt(originalSer)
66 71 secondObj = unSerialized.getObject()
67 72 for k, v in secondObj.iteritems():
68 73 self.assertEquals(obj[k], v)
69 74 secondSer = ns.SerializeIt(ns.UnSerialized(secondObj))
70 75 self.assertEquals(firstData, secondSer.getData())
71 76 self.assertEquals(firstTD, secondSer.getTypeDescriptor() )
72 77 self.assertEquals(firstMD, secondSer.getMetadata())
73 78
74 79 @skip_without('numpy')
75 80 def test_ndarray_serialized(self):
76 81 import numpy
77 82 a = numpy.linspace(0.0, 1.0, 1000)
78 83 unSer1 = ns.UnSerialized(a)
79 84 ser1 = ns.SerializeIt(unSer1)
80 85 td = ser1.getTypeDescriptor()
81 86 self.assertEquals(td, 'ndarray')
82 87 md = ser1.getMetadata()
83 88 self.assertEquals(md['shape'], a.shape)
84 89 self.assertEquals(md['dtype'], a.dtype.str)
85 90 buff = ser1.getData()
86 91 self.assertEquals(buff, numpy.getbuffer(a))
87 92 s = ns.Serialized(buff, td, md)
88 93 final = ns.unserialize(s)
89 94 self.assertEquals(numpy.getbuffer(a), numpy.getbuffer(final))
90 95 self.assertTrue((a==final).all())
91 96 self.assertEquals(a.dtype.str, final.dtype.str)
92 97 self.assertEquals(a.shape, final.shape)
93 98 # test non-copying:
94 99 a[2] = 1e9
95 100 self.assertTrue((a==final).all())
96 101
97 102 def test_uncan_function_globals(self):
98 103 """test that uncanning a module function restores it into its module"""
99 104 from re import search
100 105 cf = can(search)
101 106 csearch = uncan(cf)
102 107 self.assertEqual(csearch.__module__, search.__module__)
103 108 self.assertNotEqual(csearch('asd', 'asdf'), None)
104 109 csearch = uncan(cf, dict(a=5))
105 110 self.assertEqual(csearch.__module__, search.__module__)
106 111 self.assertNotEqual(csearch('asd', 'asdf'), None)
107 112
108 113 No newline at end of file
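
A short sketch of the serialization round-trips tested above:

    from IPython.utils import newserialized as ns
    from IPython.utils.pickleutil import can, uncan

    obj = {'a': 10, 'b': range(10)}
    s = ns.serialize(obj)              # wraps obj in a SerializeIt
    assert ns.unserialize(s) == obj    # round-trip preserves the value

    f = lambda x: 2 * x
    g = uncan(can(f))                  # functions survive can/uncan
    assert g(3) == 6
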
@@ -1,441 +1,446 b''
1 """test View objects"""
1 """test View objects
2
3 Authors:
4
5 * Min RK
6 """
2 7 # -*- coding: utf-8 -*-
3 8 #-------------------------------------------------------------------------------
4 9 # Copyright (C) 2011 The IPython Development Team
5 10 #
6 11 # Distributed under the terms of the BSD License. The full license is in
7 12 # the file COPYING, distributed as part of this software.
8 13 #-------------------------------------------------------------------------------
9 14
10 15 #-------------------------------------------------------------------------------
11 16 # Imports
12 17 #-------------------------------------------------------------------------------
13 18
14 19 import sys
15 20 import time
16 21 from tempfile import mktemp
17 22 from StringIO import StringIO
18 23
19 24 import zmq
20 25
21 26 from IPython import parallel as pmod
22 27 from IPython.parallel import error
23 28 from IPython.parallel import AsyncResult, AsyncHubResult, AsyncMapResult
24 29 from IPython.parallel import DirectView
25 30 from IPython.parallel.util import interactive
26 31
27 32 from IPython.parallel.tests import add_engines
28 33
29 34 from .clienttest import ClusterTestCase, crash, wait, skip_without
30 35
31 36 def setup():
32 37 add_engines(3)
33 38
34 39 class TestView(ClusterTestCase):
35 40
36 41 def test_z_crash_mux(self):
37 42 """test graceful handling of engine death (direct)"""
38 43 # self.add_engines(1)
39 44 eid = self.client.ids[-1]
40 45 ar = self.client[eid].apply_async(crash)
41 46 self.assertRaisesRemote(error.EngineError, ar.get)
42 47 eid = ar.engine_id
43 48 tic = time.time()
44 49 while eid in self.client.ids and time.time()-tic < 5:
45 50 time.sleep(.01)
46 51 self.client.spin()
47 52 self.assertFalse(eid in self.client.ids, "Engine should have died")
48 53
49 54 def test_push_pull(self):
50 55 """test pushing and pulling"""
51 56 data = dict(a=10, b=1.05, c=range(10), d={'e':(1,2),'f':'hi'})
52 57 t = self.client.ids[-1]
53 58 v = self.client[t]
54 59 push = v.push
55 60 pull = v.pull
56 61 v.block=True
57 62 nengines = len(self.client)
58 63 push({'data':data})
59 64 d = pull('data')
60 65 self.assertEquals(d, data)
61 66 self.client[:].push({'data':data})
62 67 d = self.client[:].pull('data', block=True)
63 68 self.assertEquals(d, nengines*[data])
64 69 ar = push({'data':data}, block=False)
65 70 self.assertTrue(isinstance(ar, AsyncResult))
66 71 r = ar.get()
67 72 ar = self.client[:].pull('data', block=False)
68 73 self.assertTrue(isinstance(ar, AsyncResult))
69 74 r = ar.get()
70 75 self.assertEquals(r, nengines*[data])
71 76 self.client[:].push(dict(a=10,b=20))
72 77 r = self.client[:].pull(('a','b'), block=True)
73 78 self.assertEquals(r, nengines*[[10,20]])
74 79
75 80 def test_push_pull_function(self):
76 81 "test pushing and pulling functions"
77 82 def testf(x):
78 83 return 2.0*x
79 84
80 85 t = self.client.ids[-1]
81 86 v = self.client[t]
82 87 v.block=True
83 88 push = v.push
84 89 pull = v.pull
85 90 execute = v.execute
86 91 push({'testf':testf})
87 92 r = pull('testf')
88 93 self.assertEqual(r(1.0), testf(1.0))
89 94 execute('r = testf(10)')
90 95 r = pull('r')
91 96 self.assertEquals(r, testf(10))
92 97 ar = self.client[:].push({'testf':testf}, block=False)
93 98 ar.get()
94 99 ar = self.client[:].pull('testf', block=False)
95 100 rlist = ar.get()
96 101 for r in rlist:
97 102 self.assertEqual(r(1.0), testf(1.0))
98 103 execute("def g(x): return x*x")
99 104 r = pull(('testf','g'))
100 105 self.assertEquals((r[0](10),r[1](10)), (testf(10), 100))
101 106
102 107 def test_push_function_globals(self):
103 108 """test that pushed functions have access to globals"""
104 109 @interactive
105 110 def geta():
106 111 return a
107 112 # self.add_engines(1)
108 113 v = self.client[-1]
109 114 v.block=True
110 115 v['f'] = geta
111 116 self.assertRaisesRemote(NameError, v.execute, 'b=f()')
112 117 v.execute('a=5')
113 118 v.execute('b=f()')
114 119 self.assertEquals(v['b'], 5)
115 120
116 121 def test_push_function_defaults(self):
117 122 """test that pushed functions preserve default args"""
118 123 def echo(a=10):
119 124 return a
120 125 v = self.client[-1]
121 126 v.block=True
122 127 v['f'] = echo
123 128 v.execute('b=f()')
124 129 self.assertEquals(v['b'], 10)
125 130
126 131 def test_get_result(self):
127 132 """test getting results from the Hub."""
128 133 c = pmod.Client(profile='iptest')
129 134 # self.add_engines(1)
130 135 t = c.ids[-1]
131 136 v = c[t]
132 137 v2 = self.client[t]
133 138 ar = v.apply_async(wait, 1)
134 139 # give the monitor time to notice the message
135 140 time.sleep(.25)
136 141 ahr = v2.get_result(ar.msg_ids)
137 142 self.assertTrue(isinstance(ahr, AsyncHubResult))
138 143 self.assertEquals(ahr.get(), ar.get())
139 144 ar2 = v2.get_result(ar.msg_ids)
140 145 self.assertFalse(isinstance(ar2, AsyncHubResult))
141 146 c.spin()
142 147 c.close()
143 148
144 149 def test_run_newline(self):
145 150 """test that run appends newline to files"""
146 151 tmpfile = mktemp()
147 152 with open(tmpfile, 'w') as f:
148 153 f.write("""def g():
149 154 return 5
150 155 """)
151 156 v = self.client[-1]
152 157 v.run(tmpfile, block=True)
153 158 self.assertEquals(v.apply_sync(lambda f: f(), pmod.Reference('g')), 5)
154 159
155 160 def test_apply_tracked(self):
156 161 """test tracking for apply"""
157 162 # self.add_engines(1)
158 163 t = self.client.ids[-1]
159 164 v = self.client[t]
160 165 v.block=False
161 166 def echo(n=1024*1024, **kwargs):
162 167 with v.temp_flags(**kwargs):
163 168 return v.apply(lambda x: x, 'x'*n)
164 169 ar = echo(1, track=False)
165 170 self.assertTrue(isinstance(ar._tracker, zmq.MessageTracker))
166 171 self.assertTrue(ar.sent)
167 172 ar = echo(track=True)
168 173 self.assertTrue(isinstance(ar._tracker, zmq.MessageTracker))
169 174 self.assertEquals(ar.sent, ar._tracker.done)
170 175 ar._tracker.wait()
171 176 self.assertTrue(ar.sent)
172 177
173 178 def test_push_tracked(self):
174 179 t = self.client.ids[-1]
175 180 ns = dict(x='x'*1024*1024)
176 181 v = self.client[t]
177 182 ar = v.push(ns, block=False, track=False)
178 183 self.assertTrue(isinstance(ar._tracker, zmq.MessageTracker))
179 184 self.assertTrue(ar.sent)
180 185
181 186 ar = v.push(ns, block=False, track=True)
182 187 self.assertTrue(isinstance(ar._tracker, zmq.MessageTracker))
183 188 self.assertEquals(ar.sent, ar._tracker.done)
184 189 ar._tracker.wait()
185 190 self.assertTrue(ar.sent)
186 191 ar.get()
187 192
188 193 def test_scatter_tracked(self):
189 194 t = self.client.ids
190 195 x='x'*1024*1024
191 196 ar = self.client[t].scatter('x', x, block=False, track=False)
192 197 self.assertTrue(isinstance(ar._tracker, zmq.MessageTracker))
193 198 self.assertTrue(ar.sent)
194 199
195 200 ar = self.client[t].scatter('x', x, block=False, track=True)
196 201 self.assertTrue(isinstance(ar._tracker, zmq.MessageTracker))
197 202 self.assertEquals(ar.sent, ar._tracker.done)
198 203 ar._tracker.wait()
199 204 self.assertTrue(ar.sent)
200 205 ar.get()
201 206
202 207 def test_remote_reference(self):
203 208 v = self.client[-1]
204 209 v['a'] = 123
205 210 ra = pmod.Reference('a')
206 211 b = v.apply_sync(lambda x: x, ra)
207 212 self.assertEquals(b, 123)
208 213
209 214
210 215 def test_scatter_gather(self):
211 216 view = self.client[:]
212 217 seq1 = range(16)
213 218 view.scatter('a', seq1)
214 219 seq2 = view.gather('a', block=True)
215 220 self.assertEquals(seq2, seq1)
216 221 self.assertRaisesRemote(NameError, view.gather, 'asdf', block=True)
217 222
218 223 @skip_without('numpy')
219 224 def test_scatter_gather_numpy(self):
220 225 import numpy
221 226 from numpy.testing.utils import assert_array_equal, assert_array_almost_equal
222 227 view = self.client[:]
223 228 a = numpy.arange(64)
224 229 view.scatter('a', a)
225 230 b = view.gather('a', block=True)
226 231 assert_array_equal(b, a)
227 232
228 233 def test_map(self):
229 234 view = self.client[:]
230 235 def f(x):
231 236 return x**2
232 237 data = range(16)
233 238 r = view.map_sync(f, data)
234 239 self.assertEquals(r, map(f, data))
235 240
236 241 def test_scatterGatherNonblocking(self):
237 242 data = range(16)
238 243 view = self.client[:]
239 244 view.scatter('a', data, block=False)
240 245 ar = view.gather('a', block=False)
241 246 self.assertEquals(ar.get(), data)
242 247
243 248 @skip_without('numpy')
244 249 def test_scatter_gather_numpy_nonblocking(self):
245 250 import numpy
246 251 from numpy.testing.utils import assert_array_equal, assert_array_almost_equal
247 252 a = numpy.arange(64)
248 253 view = self.client[:]
249 254 ar = view.scatter('a', a, block=False)
250 255 self.assertTrue(isinstance(ar, AsyncResult))
251 256 amr = view.gather('a', block=False)
252 257 self.assertTrue(isinstance(amr, AsyncMapResult))
253 258 assert_array_equal(amr.get(), a)
254 259
255 260 def test_execute(self):
256 261 view = self.client[:]
257 262 # self.client.debug=True
258 263 execute = view.execute
259 264 ar = execute('c=30', block=False)
260 265 self.assertTrue(isinstance(ar, AsyncResult))
261 266 ar = execute('d=[0,1,2]', block=False)
262 267 self.client.wait(ar, 1)
263 268 self.assertEquals(len(ar.get()), len(self.client))
264 269 for c in view['c']:
265 270 self.assertEquals(c, 30)
266 271
267 272 def test_abort(self):
268 273 view = self.client[-1]
269 274 ar = view.execute('import time; time.sleep(0.25)', block=False)
270 275 ar2 = view.apply_async(lambda : 2)
271 276 ar3 = view.apply_async(lambda : 3)
272 277 view.abort(ar2)
273 278 view.abort(ar3.msg_ids)
274 279 self.assertRaises(error.TaskAborted, ar2.get)
275 280 self.assertRaises(error.TaskAborted, ar3.get)
276 281
277 282 def test_temp_flags(self):
278 283 view = self.client[-1]
279 284 view.block=True
280 285 with view.temp_flags(block=False):
281 286 self.assertFalse(view.block)
282 287 self.assertTrue(view.block)
283 288
284 289 def test_importer(self):
285 290 view = self.client[-1]
286 291 view.clear(block=True)
287 292 with view.importer:
288 293 import re
289 294
290 295 @interactive
291 296 def findall(pat, s):
292 297 # this globals() step isn't necessary in real code
293 298 # only to prevent a closure in the test
294 299 re = globals()['re']
295 300 return re.findall(pat, s)
296 301
297 302 self.assertEquals(view.apply_sync(findall, '\w+', 'hello world'), 'hello world'.split())
298 303
299 304 # parallel magic tests
300 305
301 306 def test_magic_px_blocking(self):
302 307 ip = get_ipython()
303 308 v = self.client[-1]
304 309 v.activate()
305 310 v.block=True
306 311
307 312 ip.magic_px('a=5')
308 313 self.assertEquals(v['a'], 5)
309 314 ip.magic_px('a=10')
310 315 self.assertEquals(v['a'], 10)
311 316 sio = StringIO()
312 317 savestdout = sys.stdout
313 318 sys.stdout = sio
314 319 ip.magic_px('print a')
315 320 sys.stdout = savestdout
316 321 sio.read()
317 322 self.assertTrue('[stdout:%i]'%v.targets in sio.buf)
318 323 self.assertTrue(sio.buf.rstrip().endswith('10'))
319 324 self.assertRaisesRemote(ZeroDivisionError, ip.magic_px, '1/0')
320 325
321 326 def test_magic_px_nonblocking(self):
322 327 ip = get_ipython()
323 328 v = self.client[-1]
324 329 v.activate()
325 330 v.block=False
326 331
327 332 ip.magic_px('a=5')
328 333 self.assertEquals(v['a'], 5)
329 334 ip.magic_px('a=10')
330 335 self.assertEquals(v['a'], 10)
331 336 sio = StringIO()
332 337 savestdout = sys.stdout
333 338 sys.stdout = sio
334 339 ip.magic_px('print a')
335 340 sys.stdout = savestdout
336 341 sio.read()
337 342 self.assertFalse('[stdout:%i]'%v.targets in sio.buf)
338 343 ip.magic_px('1/0')
339 344 ar = v.get_result(-1)
340 345 self.assertRaisesRemote(ZeroDivisionError, ar.get)
341 346
342 347 def test_magic_autopx_blocking(self):
343 348 ip = get_ipython()
344 349 v = self.client[-1]
345 350 v.activate()
346 351 v.block=True
347 352
348 353 sio = StringIO()
349 354 savestdout = sys.stdout
350 355 sys.stdout = sio
351 356 ip.magic_autopx()
352 357 ip.run_cell('\n'.join(('a=5','b=10','c=0')))
353 358 ip.run_cell('print b')
354 359 ip.run_cell("b/c")
355 360 ip.run_code(compile('b*=2', '', 'single'))
356 361 ip.magic_autopx()
357 362 sys.stdout = savestdout
358 363 sio.read()
359 364 output = sio.buf.strip()
360 365 self.assertTrue(output.startswith('%autopx enabled'))
361 366 self.assertTrue(output.endswith('%autopx disabled'))
362 367 self.assertTrue('RemoteError: ZeroDivisionError' in output)
363 368 ar = v.get_result(-2)
364 369 self.assertEquals(v['a'], 5)
365 370 self.assertEquals(v['b'], 20)
366 371 self.assertRaisesRemote(ZeroDivisionError, ar.get)
367 372
368 373 def test_magic_autopx_nonblocking(self):
369 374 ip = get_ipython()
370 375 v = self.client[-1]
371 376 v.activate()
372 377 v.block=False
373 378
374 379 sio = StringIO()
375 380 savestdout = sys.stdout
376 381 sys.stdout = sio
377 382 ip.magic_autopx()
378 383 ip.run_cell('\n'.join(('a=5','b=10','c=0')))
379 384 ip.run_cell('print b')
380 385 ip.run_cell("b/c")
381 386 ip.run_code(compile('b*=2', '', 'single'))
382 387 ip.magic_autopx()
383 388 sys.stdout = savestdout
384 389 sio.read()
385 390 output = sio.buf.strip()
386 391 self.assertTrue(output.startswith('%autopx enabled'))
387 392 self.assertTrue(output.endswith('%autopx disabled'))
388 393 self.assertFalse('ZeroDivisionError' in output)
389 394 ar = v.get_result(-2)
390 395 self.assertEquals(v['a'], 5)
391 396 self.assertEquals(v['b'], 20)
392 397 self.assertRaisesRemote(ZeroDivisionError, ar.get)
393 398
394 399 def test_magic_result(self):
395 400 ip = get_ipython()
396 401 v = self.client[-1]
397 402 v.activate()
398 403 v['a'] = 111
399 404 ra = v['a']
400 405
401 406 ar = ip.magic_result()
402 407 self.assertEquals(ar.msg_ids, [v.history[-1]])
403 408 self.assertEquals(ar.get(), 111)
404 409 ar = ip.magic_result('-2')
405 410 self.assertEquals(ar.msg_ids, [v.history[-2]])
406 411
407 412 def test_unicode_execute(self):
408 413 """test executing unicode strings"""
409 414 v = self.client[-1]
410 415 v.block=True
411 416 code=u"a=u'é'"
412 417 v.execute(code)
413 418 self.assertEquals(v['a'], u'é')
414 419
415 420 def test_unicode_apply_result(self):
416 421 """test unicode apply results"""
417 422 v = self.client[-1]
418 423 r = v.apply_sync(lambda : u'é')
419 424 self.assertEquals(r, u'é')
420 425
421 426 def test_unicode_apply_arg(self):
422 427 """test passing unicode arguments to apply"""
423 428 v = self.client[-1]
424 429
425 430 @interactive
426 431 def check_unicode(a, check):
427 432 assert isinstance(a, unicode), "%r is not unicode"%a
428 433 assert isinstance(check, bytes), "%r is not bytes"%check
429 434 assert a.encode('utf8') == check, "%s != %s"%(a,check)
430 435
431 436 for s in [ u'é', u'ßø®∫','asdf'.decode() ]:
432 437 try:
433 438 v.apply_sync(check_unicode, s, s.encode('utf8'))
434 439 except error.RemoteError as e:
435 440 if e.ename == 'AssertionError':
436 441 self.fail(e.evalue)
437 442 else:
438 443 raise e
439 444
440 445
441 446
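
Finally, a minimal sketch of the DirectView operations test_view.py exercises (push/pull, scatter/gather, and Reference), assuming a running 'iptest' cluster:

    from IPython.parallel import Client, Reference

    rc = Client(profile='iptest')
    dv = rc[:]                         # a DirectView on all engines
    dv.block = True
    dv.push(dict(a=10))
    print dv.pull('a')                 # one value per engine: [10, 10, ...]
    dv.scatter('x', range(16))         # partition a sequence across engines
    print dv.gather('x')               # gather reassembles: [0, 1, ..., 15]
    print dv.apply_sync(lambda y: y, Reference('a'))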