re-enable log forwarding and iplogger
MinRK
@@ -1,539 +1,544 @@
1 1 #!/usr/bin/env python
2 2 # encoding: utf-8
3 3 """
4 4 The IPython cluster directory
5 5 """
6 6
7 7 #-----------------------------------------------------------------------------
8 8 # Copyright (C) 2008-2009 The IPython Development Team
9 9 #
10 10 # Distributed under the terms of the BSD License. The full license is in
11 11 # the file COPYING, distributed as part of this software.
12 12 #-----------------------------------------------------------------------------
13 13
14 14 #-----------------------------------------------------------------------------
15 15 # Imports
16 16 #-----------------------------------------------------------------------------
17 17
18 18 from __future__ import with_statement
19 19
20 20 import os
21 21 import logging
22 22 import re
23 23 import shutil
24 24 import sys
25 25
26 26 from subprocess import Popen, PIPE
27 27
28 28 from IPython.config.loader import PyFileConfigLoader, Config
29 29 from IPython.config.configurable import Configurable
30 30 from IPython.config.application import Application
31 31 from IPython.core.crashhandler import CrashHandler
32 32 from IPython.core.newapplication import BaseIPythonApplication
33 33 from IPython.core import release
34 34 from IPython.utils.path import (
35 35 get_ipython_package_dir,
36 36 get_ipython_dir,
37 37 expand_path
38 38 )
39 39 from IPython.utils.traitlets import Unicode, Bool, Instance, Dict
40 40
41 41 #-----------------------------------------------------------------------------
42 42 # Module errors
43 43 #-----------------------------------------------------------------------------
44 44
45 45 class ClusterDirError(Exception):
46 46 pass
47 47
48 48
49 49 class PIDFileError(Exception):
50 50 pass
51 51
52 52
53 53 #-----------------------------------------------------------------------------
54 54 # Class for managing cluster directories
55 55 #-----------------------------------------------------------------------------
56 56
57 57 class ClusterDir(Configurable):
58 58 """An object to manage the cluster directory and its resources.
59 59
60 60 The cluster directory is used by :command:`ipengine`,
61 61 :command:`ipcontroller` and :command:`ipcluster` to manage the
62 62 configuration, logging and security of these applications.
63 63
64 64 This object knows how to find, create and manage these directories. This
65 65 should be used by any code that wants to handle cluster directories.
66 66 """
67 67
68 68 security_dir_name = Unicode('security')
69 69 log_dir_name = Unicode('log')
70 70 pid_dir_name = Unicode('pid')
71 71 security_dir = Unicode(u'')
72 72 log_dir = Unicode(u'')
73 73 pid_dir = Unicode(u'')
74 74
75 75 auto_create = Bool(False,
76 76 help="""Whether to automatically create the ClusterDirectory if it does
77 77 not exist""")
78 78 overwrite = Bool(False,
79 79 help="""Whether to overwrite existing config files""")
80 80 location = Unicode(u'', config=True,
81 81 help="""Set the cluster dir. This overrides the logic used by the
82 82 `profile` option.""",
83 83 )
84 84 profile = Unicode(u'default', config=True,
85 85 help="""The string name of the profile to be used. This determines the name
86 86 of the cluster dir as: cluster_<profile>. The default profile is named
87 87 'default'. The cluster directory is resolved this way if the
88 88 `cluster_dir` option is not used."""
89 89 )
90 90
91 91 _location_isset = Bool(False) # flag for detecting multiply set location
92 92 _new_dir = Bool(False) # flag for whether a new dir was created
93 93
94 94 def __init__(self, **kwargs):
95 95 # make sure auto_create,overwrite are set *before* location
96 96 for name in ('auto_create', 'overwrite'):
97 97 v = kwargs.pop(name, None)
98 98 if v is not None:
99 99 setattr(self, name, v)
100 100 super(ClusterDir, self).__init__(**kwargs)
101 101 if not self.location:
102 102 self._profile_changed('profile', 'default', self.profile)
103 103
104 104 def _location_changed(self, name, old, new):
105 105 if self._location_isset:
106 106 raise RuntimeError("Cannot set ClusterDir more than once.")
107 107 self._location_isset = True
108 108 if not os.path.isdir(new):
109 109 if self.auto_create:# or self.config.ClusterDir.auto_create:
110 110 os.makedirs(new)
111 111 self._new_dir = True
112 112 else:
113 113 raise ClusterDirError('Directory not found: %s' % new)
114 114
115 115 # ensure config files exist:
116 116 self.copy_all_config_files(overwrite=self.overwrite)
117 117 self.security_dir = os.path.join(new, self.security_dir_name)
118 118 self.log_dir = os.path.join(new, self.log_dir_name)
119 119 self.pid_dir = os.path.join(new, self.pid_dir_name)
120 120 self.check_dirs()
121 121
122 122 def _profile_changed(self, name, old, new):
123 123 if self._location_isset:
124 124 raise RuntimeError("ClusterDir already set. Cannot set by profile.")
125 125 self.location = os.path.join(get_ipython_dir(), 'cluster_'+new)
126 126
127 127 def _log_dir_changed(self, name, old, new):
128 128 self.check_log_dir()
129 129
130 130 def check_log_dir(self):
131 131 if not os.path.isdir(self.log_dir):
132 132 os.mkdir(self.log_dir)
133 133
134 134 def _security_dir_changed(self, name, old, new):
135 135 self.check_security_dir()
136 136
137 137 def check_security_dir(self):
138 138 if not os.path.isdir(self.security_dir):
139 139 os.mkdir(self.security_dir, 0700)
140 140 os.chmod(self.security_dir, 0700)
141 141
142 142 def _pid_dir_changed(self, name, old, new):
143 143 self.check_pid_dir()
144 144
145 145 def check_pid_dir(self):
146 146 if not os.path.isdir(self.pid_dir):
147 147 os.mkdir(self.pid_dir, 0700)
148 148 os.chmod(self.pid_dir, 0700)
149 149
150 150 def check_dirs(self):
151 151 self.check_security_dir()
152 152 self.check_log_dir()
153 153 self.check_pid_dir()
154 154
155 155 def copy_config_file(self, config_file, path=None, overwrite=False):
156 156 """Copy a default config file into the active cluster directory.
157 157
158 158 Default configuration files are kept in :mod:`IPython.config.default`.
159 159 This function copies them from that location to the working cluster
160 160 directory.
161 161 """
162 162 if path is None:
163 163 import IPython.config.default
164 164 path = IPython.config.default.__file__.split(os.path.sep)[:-1]
165 165 path = os.path.sep.join(path)
166 166 src = os.path.join(path, config_file)
167 167 dst = os.path.join(self.location, config_file)
168 168 if not os.path.isfile(dst) or overwrite:
169 169 shutil.copy(src, dst)
170 170
171 171 def copy_all_config_files(self, path=None, overwrite=False):
172 172 """Copy all config files into the active cluster directory."""
173 173 for f in [u'ipcontroller_config.py', u'ipengine_config.py',
174 174 u'ipcluster_config.py']:
175 175 self.copy_config_file(f, path=path, overwrite=overwrite)
176 176
177 177 @classmethod
178 178 def create_cluster_dir(cls, cluster_dir):
179 179 """Create a new cluster directory given a full path.
180 180
181 181 Parameters
182 182 ----------
183 183 cluster_dir : str
184 184 The full path to the cluster directory. If it does exist, it will
185 185 be used. If not, it will be created.
186 186 """
187 187 return ClusterDir(location=cluster_dir)
188 188
189 189 @classmethod
190 190 def create_cluster_dir_by_profile(cls, path, profile=u'default'):
191 191 """Create a cluster dir by profile name and path.
192 192
193 193 Parameters
194 194 ----------
195 195 path : str
196 196 The path (directory) to put the cluster directory in.
197 197 profile : str
198 198 The name of the profile. The name of the cluster directory will
199 199 be "cluster_<profile>".
200 200 """
201 201 if not os.path.isdir(path):
202 202 raise ClusterDirError('Directory not found: %s' % path)
203 203 cluster_dir = os.path.join(path, u'cluster_' + profile)
204 204 return ClusterDir(location=cluster_dir)
205 205
206 206 @classmethod
207 207 def find_cluster_dir_by_profile(cls, ipython_dir, profile=u'default'):
208 208 """Find an existing cluster dir by profile name, return its ClusterDir.
209 209
210 210 This searches through a sequence of paths for a cluster dir. If it
211 211 is not found, a :class:`ClusterDirError` exception will be raised.
212 212
213 213 The search path algorithm is:
214 214 1. ``os.getcwd()``
215 215 2. ``ipython_dir``
216 216 3. The directories found in the ":" separated
217 217 :env:`IPCLUSTER_DIR_PATH` environment variable.
218 218
219 219 Parameters
220 220 ----------
221 221 ipython_dir : unicode or str
222 222 The IPython directory to use.
223 223 profile : unicode or str
224 224 The name of the profile. The name of the cluster directory
225 225 will be "cluster_<profile>".
226 226 """
227 227 dirname = u'cluster_' + profile
228 228 cluster_dir_paths = os.environ.get('IPCLUSTER_DIR_PATH','')
229 229 if cluster_dir_paths:
230 230 cluster_dir_paths = cluster_dir_paths.split(':')
231 231 else:
232 232 cluster_dir_paths = []
233 233 paths = [os.getcwd(), ipython_dir] + cluster_dir_paths
234 234 for p in paths:
235 235 cluster_dir = os.path.join(p, dirname)
236 236 if os.path.isdir(cluster_dir):
237 237 return ClusterDir(location=cluster_dir)
238 238 else:
239 239 raise ClusterDirError('Cluster directory not found in paths: %s' % dirname)
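A short usage sketch (not part of the diff) of the by-profile lookup described above; the profile name 'mycluster' is a hypothetical example, and the call raises ClusterDirError if no matching directory is found in the cwd, the ipython dir, or IPCLUSTER_DIR_PATH:

    from IPython.utils.path import get_ipython_dir
    from IPython.parallel.apps.clusterdir import ClusterDir

    # locate an existing cluster_mycluster directory and inspect its layout
    cd = ClusterDir.find_cluster_dir_by_profile(get_ipython_dir(), profile=u'mycluster')
    print cd.location, cd.security_dir, cd.log_dir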
240 240
241 241 @classmethod
242 242 def find_cluster_dir(cls, cluster_dir):
243 243 """Find/create a cluster dir and return its ClusterDir.
244 244
245 245 This will create the cluster directory if it doesn't exist.
246 246
247 247 Parameters
248 248 ----------
249 249 cluster_dir : unicode or str
250 250 The path of the cluster directory. This is expanded using
251 251 :func:`IPython.utils.path.expand_path`.
252 252 """
253 253 cluster_dir = expand_path(cluster_dir)
254 254 if not os.path.isdir(cluster_dir):
255 255 raise ClusterDirError('Cluster directory not found: %s' % cluster_dir)
256 256 return ClusterDir(location=cluster_dir)
257 257
258 258
259 259 #-----------------------------------------------------------------------------
260 260 # Crash handler for this application
261 261 #-----------------------------------------------------------------------------
262 262
263 263
264 264 _message_template = """\
265 265 Oops, $self.app_name crashed. We do our best to make it stable, but...
266 266
267 267 A crash report was automatically generated with the following information:
268 268 - A verbatim copy of the crash traceback.
269 269 - Data on your current $self.app_name configuration.
270 270
271 271 It was left in the file named:
272 272 \t'$self.crash_report_fname'
273 273 If you can email this file to the developers, the information in it will help
274 274 them in understanding and correcting the problem.
275 275
276 276 You can mail it to: $self.contact_name at $self.contact_email
277 277 with the subject '$self.app_name Crash Report'.
278 278
279 279 If you want to do it now, the following command will work (under Unix):
280 280 mail -s '$self.app_name Crash Report' $self.contact_email < $self.crash_report_fname
281 281
282 282 To ensure accurate tracking of this issue, please file a report about it at:
283 283 $self.bug_tracker
284 284 """
285 285
286 286 class ClusterDirCrashHandler(CrashHandler):
287 287 """sys.excepthook for IPython itself, leaves a detailed report on disk."""
288 288
289 289 message_template = _message_template
290 290
291 291 def __init__(self, app):
292 292 contact_name = release.authors['Min'][0]
293 293 contact_email = release.authors['Min'][1]
294 294 bug_tracker = 'http://github.com/ipython/ipython/issues'
295 295 super(ClusterDirCrashHandler,self).__init__(
296 296 app, contact_name, contact_email, bug_tracker
297 297 )
298 298
299 299
300 300 #-----------------------------------------------------------------------------
301 301 # Main application
302 302 #-----------------------------------------------------------------------------
303 303 base_aliases = {
304 304 'profile' : "ClusterDir.profile",
305 305 'cluster_dir' : 'ClusterDir.location',
306 306 'auto_create' : 'ClusterDirApplication.auto_create',
307 307 'log_level' : 'ClusterApplication.log_level',
308 308 'work_dir' : 'ClusterApplication.work_dir',
309 309 'log_to_file' : 'ClusterApplication.log_to_file',
310 310 'clean_logs' : 'ClusterApplication.clean_logs',
311 311 'log_url' : 'ClusterApplication.log_url',
312 312 }
313 313
314 314 base_flags = {
315 315 'debug' : ( {"ClusterApplication" : {"log_level" : logging.DEBUG}}, "set loglevel to DEBUG"),
316 316 'quiet' : ( {"ClusterApplication" : {"log_level" : logging.CRITICAL}}, "set loglevel to CRITICAL (minimal output)"),
317 317 'log-to-file' : ( {"ClusterApplication" : {"log_to_file" : True}}, "redirect log output to a file"),
318 318 }
319 319 for k,v in base_flags.iteritems():
320 320 base_flags[k] = (Config(v[0]),v[1])
321 321
322 322 class ClusterApplication(BaseIPythonApplication):
323 323 """An application that puts everything into a cluster directory.
324 324
325 325 Instead of looking for things in the ipython_dir, this type of application
326 326 will use its own private directory called the "cluster directory"
327 327 for things like config files, log files, etc.
328 328
329 329 The cluster directory is resolved as follows:
330 330
331 331 * If the ``--cluster-dir`` option is given, it is used.
332 332 * If ``--cluster-dir`` is not given, the application directory is
333 333 resolved using the profile name as ``cluster_<profile>``. The search
334 334 path for this directory is then i) the cwd, if it is found there,
335 335 and ii) the ipython_dir otherwise.
336 336
337 337 The config file for the application is to be put in the cluster
338 338 dir and named the value of the ``config_file_name`` class attribute.
339 339 """
340 340
341 341 crash_handler_class = ClusterDirCrashHandler
342 342 auto_create_cluster_dir = Bool(True, config=True,
343 343 help="whether to create the cluster_dir if it doesn't exist")
344 344 cluster_dir = Instance(ClusterDir)
345 345 classes = [ClusterDir]
346 346
347 347 def _log_level_default(self):
348 348 # temporarily override default_log_level to INFO
349 349 return logging.INFO
350 350
351 351 work_dir = Unicode(os.getcwdu(), config=True,
352 352 help='Set the working dir for the process.'
353 353 )
354 354 def _work_dir_changed(self, name, old, new):
355 355 self.work_dir = unicode(expand_path(new))
356 356
357 357 log_to_file = Bool(config=True,
358 358 help="whether to log to a file")
359 359
360 360 clean_logs = Bool(False, shortname='--clean-logs', config=True,
361 361 help="whether to cleanup old logfiles before starting")
362 362
363 363 log_url = Unicode('', shortname='--log-url', config=True,
364 364 help="The ZMQ URL of the iplogger to aggregate logging.")
365 365
366 366 config_file = Unicode(u'', config=True,
367 367 help="""Path to ipcontroller configuration file. The default is to use
368 368 <appname>_config.py, as found by cluster-dir."""
369 369 )
370 370
371 371 loop = Instance('zmq.eventloop.ioloop.IOLoop')
372 372 def _loop_default(self):
373 373 from zmq.eventloop.ioloop import IOLoop
374 374 return IOLoop.instance()
375 375
376 376 aliases = Dict(base_aliases)
377 377 flags = Dict(base_flags)
378 378
379 379 def init_clusterdir(self):
380 380 """This resolves the cluster directory.
381 381
382 382 This tries to find the cluster directory, and if successful, it will
383 383 have:
384 384 * Set ``self.cluster_dir`` to the :class:`ClusterDir` object for
385 385 the application.
386 386 * Created the cluster directory, if ``auto_create_cluster_dir`` is
387 387 ``True`` and it did not already exist.
388 388
389 389 The algorithm used for this is as follows:
390 390 1. Try ``ClusterDir.location`` (the ``cluster_dir`` option).
391 391 2. Try using ``ClusterDir.profile``.
392 392 3. If both of these fail and ``self.auto_create_cluster_dir`` is
393 393 ``True``, then create the new cluster dir in the IPython directory.
394 394 4. If all fails, then raise :class:`ClusterDirError`.
395 395 """
396 396 try:
397 397 self.cluster_dir = ClusterDir(auto_create=self.auto_create_cluster_dir, config=self.config)
398 398 except ClusterDirError as e:
399 399 self.log.fatal("Error initializing cluster dir: %s"%e)
400 400 self.log.fatal("A cluster dir must be created before running this command.")
401 401 self.log.fatal("Do 'ipcluster create -h' or 'ipcluster list -h' for more "
402 402 "information about creating and listing cluster dirs."
403 403 )
404 404 self.exit(1)
405 405
406 406 if self.cluster_dir._new_dir:
407 407 self.log.info('Creating new cluster dir: %s' % \
408 408 self.cluster_dir.location)
409 409 else:
410 410 self.log.info('Using existing cluster dir: %s' % \
411 411 self.cluster_dir.location)
412 412
413 413 def initialize(self, argv=None):
414 414 """initialize the app"""
415 415 self.init_crash_handler()
416 416 self.parse_command_line(argv)
417 417 cl_config = self.config
418 418 self.init_clusterdir()
419 419 if self.config_file:
420 420 self.load_config_file(self.config_file)
421 else:
422 self.load_config_file(self.default_config_file_name, path=self.cluster_dir.location)
421 elif self.default_config_file_name:
422 try:
423 self.load_config_file(self.default_config_file_name,
424 path=self.cluster_dir.location)
425 except IOError:
426 self.log.warn("Warning: Default config file not found")
423 427 # command-line should *override* config file, but command-line is necessary
424 428 # to determine clusterdir, etc.
425 429 self.update_config(cl_config)
426 self.reinit_logging()
427
428 430 self.to_work_dir()
431 self.reinit_logging()
429 432
430 433 def to_work_dir(self):
431 434 wd = self.work_dir
432 435 if unicode(wd) != os.getcwdu():
433 436 os.chdir(wd)
434 437 self.log.info("Changing to working dir: %s" % wd)
438 # This is the working dir by now.
439 sys.path.insert(0, '')
435 440
436 441 def load_config_file(self, filename, path=None):
437 442 """Load a .py based config file by filename and path."""
438 443 # use config.application.Application.load_config
439 444 # instead of inflexible core.newapplication.BaseIPythonApplication.load_config
440 445 return Application.load_config_file(self, filename, path=path)
441 446 #
442 447 # def load_default_config_file(self):
443 448 # """Load a .py based config file by filename and path."""
444 449 # return BaseIPythonApplication.load_config_file(self)
445 450
446 451 # disable URL-logging
447 452 def reinit_logging(self):
448 453 # Remove old log files
449 454 log_dir = self.cluster_dir.log_dir
450 455 if self.clean_logs:
451 456 for f in os.listdir(log_dir):
452 457 if re.match(r'%s-\d+\.(log|err|out)'%self.name,f):
453 458 os.remove(os.path.join(log_dir, f))
454 459 if self.log_to_file:
455 460 # Start logging to the new log file
456 461 log_filename = self.name + u'-' + str(os.getpid()) + u'.log'
457 462 logfile = os.path.join(log_dir, log_filename)
458 463 open_log_file = open(logfile, 'w')
459 464 else:
460 465 open_log_file = None
461 466 if open_log_file is not None:
462 467 self.log.removeHandler(self._log_handler)
463 468 self._log_handler = logging.StreamHandler(open_log_file)
464 469 self._log_formatter = logging.Formatter("[%(name)s] %(message)s")
465 470 self._log_handler.setFormatter(self._log_formatter)
466 471 self.log.addHandler(self._log_handler)
467 472
468 473 def write_pid_file(self, overwrite=False):
469 474 """Create a .pid file in the pid_dir with my pid.
470 475
471 476 This must be called after the cluster dir is resolved, since it uses `self.cluster_dir.pid_dir`.
472 477 This raises :exc:`PIDFileError` if the pid file exists already.
473 478 """
474 479 pid_file = os.path.join(self.cluster_dir.pid_dir, self.name + u'.pid')
475 480 if os.path.isfile(pid_file):
476 481 pid = self.get_pid_from_file()
477 482 if not overwrite:
478 483 raise PIDFileError(
479 484 'The pid file [%s] already exists. \nThis could mean that this '
480 485 'server is already running with [pid=%s].' % (pid_file, pid)
481 486 )
482 487 with open(pid_file, 'w') as f:
483 488 self.log.info("Creating pid file: %s" % pid_file)
484 489 f.write(repr(os.getpid())+'\n')
485 490
486 491 def remove_pid_file(self):
487 492 """Remove the pid file.
488 493
489 494 This should be called at shutdown by registering a cleanup
490 495 callback with the event loop. This needs to return
491 496 ``None``.
492 497 """
493 498 pid_file = os.path.join(self.cluster_dir.pid_dir, self.name + u'.pid')
494 499 if os.path.isfile(pid_file):
495 500 try:
496 501 self.log.info("Removing pid file: %s" % pid_file)
497 502 os.remove(pid_file)
498 503 except:
499 504 self.log.warn("Error removing the pid file: %s" % pid_file)
500 505
501 506 def get_pid_from_file(self):
502 507 """Get the pid from the pid file.
503 508
504 509 If the pid file doesn't exist a :exc:`PIDFileError` is raised.
505 510 """
506 511 pid_file = os.path.join(self.cluster_dir.pid_dir, self.name + u'.pid')
507 512 if os.path.isfile(pid_file):
508 513 with open(pid_file, 'r') as f:
509 514 pid = int(f.read().strip())
510 515 return pid
511 516 else:
512 517 raise PIDFileError('pid file not found: %s' % pid_file)
513 518
514 519 def check_pid(self, pid):
515 520 if os.name == 'nt':
516 521 try:
517 522 import ctypes
518 523 # returns 0 if no such process (of ours) exists
519 524 # positive int otherwise
520 525 p = ctypes.windll.kernel32.OpenProcess(1,0,pid)
521 526 except Exception:
522 527 self.log.warn(
523 528 "Could not determine whether pid %i is running via `OpenProcess`. "
524 529 " Making the likely assumption that it is."%pid
525 530 )
526 531 return True
527 532 return bool(p)
528 533 else:
529 534 try:
530 535 p = Popen(['ps','x'], stdout=PIPE, stderr=PIPE)
531 536 output,_ = p.communicate()
532 537 except OSError:
533 538 self.log.warn(
534 539 "Could not determine whether pid %i is running via `ps x`. "
535 540 " Making the likely assumption that it is."%pid
536 541 )
537 542 return True
538 543 pids = map(int, re.findall(r'^\W*\d+', output, re.MULTILINE))
539 544 return pid in pids
@@ -1,401 +1,403 @@
1 1 #!/usr/bin/env python
2 2 # encoding: utf-8
3 3 """
4 4 The IPython controller application.
5 5 """
6 6
7 7 #-----------------------------------------------------------------------------
8 8 # Copyright (C) 2008-2009 The IPython Development Team
9 9 #
10 10 # Distributed under the terms of the BSD License. The full license is in
11 11 # the file COPYING, distributed as part of this software.
12 12 #-----------------------------------------------------------------------------
13 13
14 14 #-----------------------------------------------------------------------------
15 15 # Imports
16 16 #-----------------------------------------------------------------------------
17 17
18 18 from __future__ import with_statement
19 19
20 20 import copy
21 21 import os
22 22 import logging
23 23 import socket
24 24 import stat
25 25 import sys
26 26 import uuid
27 27
28 28 from multiprocessing import Process
29 29
30 30 import zmq
31 31 from zmq.devices import ProcessMonitoredQueue
32 32 from zmq.log.handlers import PUBHandler
33 33 from zmq.utils import jsonapi as json
34 34
35 35 from IPython.config.loader import Config
36 36
37 37 from IPython.parallel import factory
38 38
39 39 from IPython.parallel.apps.clusterdir import (
40 40 ClusterDir,
41 41 ClusterApplication,
42 42 base_flags
43 43 # ClusterDirConfigLoader
44 44 )
45 45 from IPython.utils.importstring import import_item
46 46 from IPython.utils.traitlets import Instance, Unicode, Bool, List, Dict
47 47
48 48 # from IPython.parallel.controller.controller import ControllerFactory
49 49 from IPython.parallel.streamsession import StreamSession
50 50 from IPython.parallel.controller.heartmonitor import HeartMonitor
51 51 from IPython.parallel.controller.hub import Hub, HubFactory
52 52 from IPython.parallel.controller.scheduler import TaskScheduler,launch_scheduler
53 53 from IPython.parallel.controller.sqlitedb import SQLiteDB
54 54
55 55 from IPython.parallel.util import signal_children,disambiguate_ip_address, split_url
56 56
57 57 # conditional import of MongoDB backend class
58 58
59 59 try:
60 60 from IPython.parallel.controller.mongodb import MongoDB
61 61 except ImportError:
62 62 maybe_mongo = []
63 63 else:
64 64 maybe_mongo = [MongoDB]
65 65
66 66
67 67 #-----------------------------------------------------------------------------
68 68 # Module level variables
69 69 #-----------------------------------------------------------------------------
70 70
71 71
72 72 #: The default config file name for this application
73 73 default_config_file_name = u'ipcontroller_config.py'
74 74
75 75
76 76 _description = """Start the IPython controller for parallel computing.
77 77
78 78 The IPython controller provides a gateway between the IPython engines and
79 79 clients. The controller needs to be started before the engines and can be
80 80 configured using command line options or using a cluster directory. Cluster
81 81 directories contain config, log and security files and are usually located in
82 82 your ipython directory and named as "cluster_<profile>". See the --profile
83 83 and --cluster-dir options for details.
84 84 """
85 85
86 86
87 87
88 88
89 89 #-----------------------------------------------------------------------------
90 90 # The main application
91 91 #-----------------------------------------------------------------------------
92 92 flags = {}
93 93 flags.update(base_flags)
94 94 flags.update({
95 95 'usethreads' : ( {'IPControllerApp' : {'usethreads' : True}},
96 96 'Use threads instead of processes for the schedulers'),
97 97 'sqlitedb' : ({'HubFactory' : {'db_class' : 'IPython.parallel.controller.sqlitedb.SQLiteDB'}},
98 98 'use the SQLiteDB backend'),
99 99 'mongodb' : ({'HubFactory' : {'db_class' : 'IPython.parallel.controller.mongodb.MongoDB'}},
100 100 'use the MongoDB backend'),
101 101 'dictdb' : ({'HubFactory' : {'db_class' : 'IPython.parallel.controller.dictdb.DictDB'}},
102 102 'use the in-memory DictDB backend'),
103 103 })
104 104
105 105 flags.update()
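The 'sqlitedb', 'mongodb' and 'dictdb' flags above are shorthand for setting HubFactory.db_class. A hypothetical ipcontroller_config.py fragment that selects a backend explicitly (using the ``c = get_config()`` convention of IPython config files):

    c = get_config()
    # same effect as passing the 'mongodb' flag on the command line
    c.HubFactory.db_class = 'IPython.parallel.controller.mongodb.MongoDB'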
106 106
107 107 class IPControllerApp(ClusterApplication):
108 108
109 109 name = u'ipcontroller'
110 110 description = _description
111 111 # command_line_loader = IPControllerAppConfigLoader
112 112 default_config_file_name = default_config_file_name
113 113 classes = [ClusterDir, StreamSession, HubFactory, TaskScheduler, HeartMonitor, SQLiteDB] + maybe_mongo
114 114
115 115 auto_create_cluster_dir = Bool(True, config=True,
116 116 help="Whether to create cluster_dir if it exists.")
117 117 reuse_files = Bool(False, config=True,
118 118 help='Whether to reuse existing json connection files [default: False]'
119 119 )
120 120 secure = Bool(True, config=True,
121 121 help='Whether to use exec_keys for extra authentication [default: True]'
122 122 )
123 123 ssh_server = Unicode(u'', config=True,
124 124 help="""ssh url for clients to use when connecting to the Controller
125 125 processes. It should be of the form: [user@]server[:port]. The
126 126 Controller\'s listening addresses must be accessible from the ssh server""",
127 127 )
128 128 location = Unicode(u'', config=True,
129 129 help="""The external IP or domain name of the Controller, used for disambiguating
130 130 engine and client connections.""",
131 131 )
132 132 import_statements = List([], config=True,
133 133 help="import statements to be run at startup. Necessary in some environments"
134 134 )
135 135
136 136 usethreads = Bool(False, config=True,
137 137 help='Use threads instead of processes for the schedulers',
138 138 )
139 139
140 140 # internal
141 141 children = List()
142 142 mq_class = Unicode('zmq.devices.ProcessMonitoredQueue')
143 143
144 144 def _usethreads_changed(self, name, old, new):
145 145 self.mq_class = 'zmq.devices.%sMonitoredQueue'%('Thread' if new else 'Process')
146 146
147 147 aliases = Dict(dict(
148 148 config = 'IPControllerApp.config_file',
149 149 # file = 'IPControllerApp.url_file',
150 150 log_level = 'IPControllerApp.log_level',
151 log_url = 'IPControllerApp.log_url',
151 152 reuse_files = 'IPControllerApp.reuse_files',
152 153 secure = 'IPControllerApp.secure',
153 154 ssh = 'IPControllerApp.ssh_server',
154 155 usethreads = 'IPControllerApp.usethreads',
155 156 import_statements = 'IPControllerApp.import_statements',
156 157 location = 'IPControllerApp.location',
157 158
158 159 ident = 'StreamSession.session',
159 160 user = 'StreamSession.username',
160 161 exec_key = 'StreamSession.keyfile',
161 162
162 163 url = 'HubFactory.url',
163 164 ip = 'HubFactory.ip',
164 165 transport = 'HubFactory.transport',
165 166 port = 'HubFactory.regport',
166 167
167 168 ping = 'HeartMonitor.period',
168 169
169 170 scheme = 'TaskScheduler.scheme_name',
170 171 hwm = 'TaskScheduler.hwm',
171 172
172 173
173 174 profile = "ClusterDir.profile",
174 175 cluster_dir = 'ClusterDir.location',
175 176
176 177 ))
177 178 flags = Dict(flags)
178 179
179 180
180 181 def save_connection_dict(self, fname, cdict):
181 182 """save a connection dict to json file."""
182 183 c = self.config
183 184 url = cdict['url']
184 185 location = cdict['location']
185 186 if not location:
186 187 try:
187 188 proto,ip,port = split_url(url)
188 189 except AssertionError:
189 190 pass
190 191 else:
191 192 location = socket.gethostbyname_ex(socket.gethostname())[2][-1]
192 193 cdict['location'] = location
193 194 fname = os.path.join(self.cluster_dir.security_dir, fname)
194 195 with open(fname, 'w') as f:
195 196 f.write(json.dumps(cdict, indent=2))
196 197 os.chmod(fname, stat.S_IRUSR|stat.S_IWUSR)
197 198
198 199 def load_config_from_json(self):
199 200 """load config from existing json connector files."""
200 201 c = self.config
201 202 # load from engine config
202 203 with open(os.path.join(self.cluster_dir.security_dir, 'ipcontroller-engine.json')) as f:
203 204 cfg = json.loads(f.read())
204 205 key = c.StreamSession.key = cfg['exec_key']
205 206 xport,addr = cfg['url'].split('://')
206 207 c.HubFactory.engine_transport = xport
207 208 ip,ports = addr.split(':')
208 209 c.HubFactory.engine_ip = ip
209 210 c.HubFactory.regport = int(ports)
210 211 self.location = cfg['location']
211 212
212 213 # load client config
213 214 with open(os.path.join(self.cluster_dir.security_dir, 'ipcontroller-client.json')) as f:
214 215 cfg = json.loads(f.read())
215 216 assert key == cfg['exec_key'], "exec_key mismatch between engine and client keys"
216 217 xport,addr = cfg['url'].split('://')
217 218 c.HubFactory.client_transport = xport
218 219 ip,ports = addr.split(':')
219 220 c.HubFactory.client_ip = ip
220 221 self.ssh_server = cfg['ssh']
221 222 assert int(ports) == c.HubFactory.regport, "regport mismatch"
222 223
223 224 def init_hub(self):
224 # This is the working dir by now.
225 sys.path.insert(0, '')
226 225 c = self.config
227 226
228 227 self.do_import_statements()
229 228 reusing = self.reuse_files
230 229 if reusing:
231 230 try:
232 231 self.load_config_from_json()
233 232 except (AssertionError,IOError):
234 233 reusing=False
235 234 # check again, because reusing may have failed:
236 235 if reusing:
237 236 pass
238 237 elif self.secure:
239 238 key = str(uuid.uuid4())
240 239 # keyfile = os.path.join(self.cluster_dir.security_dir, self.exec_key)
241 240 # with open(keyfile, 'w') as f:
242 241 # f.write(key)
243 242 # os.chmod(keyfile, stat.S_IRUSR|stat.S_IWUSR)
244 243 c.StreamSession.key = key
245 244 else:
246 245 key = c.StreamSession.key = ''
247 246
248 247 try:
249 248 self.factory = HubFactory(config=c, log=self.log)
250 249 # self.start_logging()
251 250 self.factory.init_hub()
252 251 except:
253 252 self.log.error("Couldn't construct the Controller", exc_info=True)
254 253 self.exit(1)
255 254
256 255 if not reusing:
257 256 # save to new json config files
258 257 f = self.factory
259 258 cdict = {'exec_key' : key,
260 259 'ssh' : self.ssh_server,
261 260 'url' : "%s://%s:%s"%(f.client_transport, f.client_ip, f.regport),
262 261 'location' : self.location
263 262 }
264 263 self.save_connection_dict('ipcontroller-client.json', cdict)
265 264 edict = cdict
266 265 edict['url']="%s://%s:%s"%((f.client_transport, f.client_ip, f.regport))
267 266 self.save_connection_dict('ipcontroller-engine.json', edict)
268 267
269 268 #
270 269 def init_schedulers(self):
271 270 children = self.children
272 mq = import_item(self.mq_class)
271 mq = import_item(str(self.mq_class))
273 272
274 273 hub = self.factory
275 274 # maybe_inproc = 'inproc://monitor' if self.usethreads else self.monitor_url
276 275 # IOPub relay (in a Process)
277 276 q = mq(zmq.PUB, zmq.SUB, zmq.PUB, 'N/A','iopub')
278 277 q.bind_in(hub.client_info['iopub'])
279 278 q.bind_out(hub.engine_info['iopub'])
280 279 q.setsockopt_out(zmq.SUBSCRIBE, '')
281 280 q.connect_mon(hub.monitor_url)
282 281 q.daemon=True
283 282 children.append(q)
284 283
285 284 # Multiplexer Queue (in a Process)
286 285 q = mq(zmq.XREP, zmq.XREP, zmq.PUB, 'in', 'out')
287 286 q.bind_in(hub.client_info['mux'])
288 287 q.setsockopt_in(zmq.IDENTITY, 'mux')
289 288 q.bind_out(hub.engine_info['mux'])
290 289 q.connect_mon(hub.monitor_url)
291 290 q.daemon=True
292 291 children.append(q)
293 292
294 293 # Control Queue (in a Process)
295 294 q = mq(zmq.XREP, zmq.XREP, zmq.PUB, 'incontrol', 'outcontrol')
296 295 q.bind_in(hub.client_info['control'])
297 296 q.setsockopt_in(zmq.IDENTITY, 'control')
298 297 q.bind_out(hub.engine_info['control'])
299 298 q.connect_mon(hub.monitor_url)
300 299 q.daemon=True
301 300 children.append(q)
302 301 try:
303 302 scheme = self.config.TaskScheduler.scheme_name
304 303 except AttributeError:
305 304 scheme = TaskScheduler.scheme_name.get_default_value()
306 305 # Task Queue (in a Process)
307 306 if scheme == 'pure':
308 307 self.log.warn("task::using pure XREQ Task scheduler")
309 308 q = mq(zmq.XREP, zmq.XREQ, zmq.PUB, 'intask', 'outtask')
310 309 # q.setsockopt_out(zmq.HWM, hub.hwm)
311 310 q.bind_in(hub.client_info['task'][1])
312 311 q.setsockopt_in(zmq.IDENTITY, 'task')
313 312 q.bind_out(hub.engine_info['task'])
314 313 q.connect_mon(hub.monitor_url)
315 314 q.daemon=True
316 315 children.append(q)
317 316 elif scheme == 'none':
318 317 self.log.warn("task::using no Task scheduler")
319 318
320 319 else:
321 320 self.log.info("task::using Python %s Task scheduler"%scheme)
322 321 sargs = (hub.client_info['task'][1], hub.engine_info['task'],
323 322 hub.monitor_url, hub.client_info['notification'])
324 kwargs = dict(logname=self.log.name, loglevel=self.log_level,
325 config=dict(self.config))
323 kwargs = dict(logname='scheduler', loglevel=self.log_level,
324 log_url = self.log_url, config=dict(self.config))
326 325 q = Process(target=launch_scheduler, args=sargs, kwargs=kwargs)
327 326 q.daemon=True
328 327 children.append(q)
329 328
330 329
331 330 def save_urls(self):
332 331 """save the registration urls to files."""
333 332 c = self.config
334 333
335 334 sec_dir = self.cluster_dir.security_dir
336 335 cf = self.factory
337 336
338 337 with open(os.path.join(sec_dir, 'ipcontroller-engine.url'), 'w') as f:
339 338 f.write("%s://%s:%s"%(cf.engine_transport, cf.engine_ip, cf.regport))
340 339
341 340 with open(os.path.join(sec_dir, 'ipcontroller-client.url'), 'w') as f:
342 341 f.write("%s://%s:%s"%(cf.client_transport, cf.client_ip, cf.regport))
343 342
344 343
345 344 def do_import_statements(self):
346 345 statements = self.import_statements
347 346 for s in statements:
348 347 try:
349 348 self.log.msg("Executing statement: '%s'" % s)
350 349 exec s in globals(), locals()
351 350 except:
352 351 self.log.msg("Error running statement: %s" % s)
353 352
354 # def start_logging(self):
355 # super(IPControllerApp, self).start_logging()
356 # if self.config.Global.log_url:
357 # context = self.factory.context
358 # lsock = context.socket(zmq.PUB)
359 # lsock.connect(self.config.Global.log_url)
360 # handler = PUBHandler(lsock)
361 # handler.root_topic = 'controller'
362 # handler.setLevel(self.log_level)
363 # self.log.addHandler(handler)
353 def forward_logging(self):
354 if self.log_url:
355 self.log.info("Forwarding logging to %s"%self.log_url)
356 context = zmq.Context.instance()
357 lsock = context.socket(zmq.PUB)
358 lsock.connect(self.log_url)
359 handler = PUBHandler(lsock)
360 self.log.removeHandler(self._log_handler)
361 handler.root_topic = 'controller'
362 handler.setLevel(self.log_level)
363 self.log.addHandler(handler)
364 self._log_handler = handler
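With forward_logging restored, the controller can ship its log records to a running iplogger. A hypothetical ipcontroller_config.py fragment pointing log_url at the LogWatcher's default listening address (shown later in this diff); the engine app grows the same log_url trait below:

    c = get_config()
    # forward this controller's log records to an iplogger listening here
    c.IPControllerApp.log_url = 'tcp://127.0.0.1:20202'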
364 365 # #
365 366
366 367 def initialize(self, argv=None):
367 368 super(IPControllerApp, self).initialize(argv)
369 self.forward_logging()
368 370 self.init_hub()
369 371 self.init_schedulers()
370 372
371 373 def start(self):
372 374 # Start the subprocesses:
373 375 self.factory.start()
374 376 child_procs = []
375 377 for child in self.children:
376 378 child.start()
377 379 if isinstance(child, ProcessMonitoredQueue):
378 380 child_procs.append(child.launcher)
379 381 elif isinstance(child, Process):
380 382 child_procs.append(child)
381 383 if child_procs:
382 384 signal_children(child_procs)
383 385
384 386 self.write_pid_file(overwrite=True)
385 387
386 388 try:
387 389 self.factory.loop.start()
388 390 except KeyboardInterrupt:
389 391 self.log.critical("Interrupted, Exiting...\n")
390 392
391 393
392 394
393 395 def launch_new_instance():
394 396 """Create and run the IPython controller"""
395 397 app = IPControllerApp()
396 398 app.initialize()
397 399 app.start()
398 400
399 401
400 402 if __name__ == '__main__':
401 403 launch_new_instance()
@@ -1,289 +1,277 @@
1 1 #!/usr/bin/env python
2 2 # encoding: utf-8
3 3 """
4 4 The IPython engine application
5 5 """
6 6
7 7 #-----------------------------------------------------------------------------
8 8 # Copyright (C) 2008-2009 The IPython Development Team
9 9 #
10 10 # Distributed under the terms of the BSD License. The full license is in
11 11 # the file COPYING, distributed as part of this software.
12 12 #-----------------------------------------------------------------------------
13 13
14 14 #-----------------------------------------------------------------------------
15 15 # Imports
16 16 #-----------------------------------------------------------------------------
17 17
18 18 import json
19 19 import os
20 20 import sys
21 21
22 22 import zmq
23 23 from zmq.eventloop import ioloop
24 24
25 25 from IPython.parallel.apps.clusterdir import (
26 26 ClusterApplication,
27 27 ClusterDir,
28 base_aliases,
29 28 # ClusterDirConfigLoader
30 29 )
31 30 from IPython.zmq.log import EnginePUBHandler
32 31
33 32 from IPython.config.configurable import Configurable
34 33 from IPython.parallel.streamsession import StreamSession
35 34 from IPython.parallel.engine.engine import EngineFactory
36 35 from IPython.parallel.engine.streamkernel import Kernel
37 36 from IPython.parallel.util import disambiguate_url
38 37
39 38 from IPython.utils.importstring import import_item
40 from IPython.utils.traitlets import Bool, Unicode, Dict, List, CStr
39 from IPython.utils.traitlets import Bool, Unicode, Dict, List
41 40
42 41
43 42 #-----------------------------------------------------------------------------
44 43 # Module level variables
45 44 #-----------------------------------------------------------------------------
46 45
47 46 #: The default config file name for this application
48 47 default_config_file_name = u'ipengine_config.py'
49 48
50 49 _description = """Start an IPython engine for parallel computing.\n\n
51 50
52 51 IPython engines run in parallel and perform computations on behalf of a client
53 52 and controller. A controller needs to be started before the engines. The
54 53 engine can be configured using command line options or using a cluster
55 54 directory. Cluster directories contain config, log and security files and are
56 55 usually located in your ipython directory and named as "cluster_<profile>".
57 56 See the `profile` and `cluster_dir` options for details.
58 57 """
59 58
60 59
61 60 #-----------------------------------------------------------------------------
62 61 # MPI configuration
63 62 #-----------------------------------------------------------------------------
64 63
65 64 mpi4py_init = """from mpi4py import MPI as mpi
66 65 mpi.size = mpi.COMM_WORLD.Get_size()
67 66 mpi.rank = mpi.COMM_WORLD.Get_rank()
68 67 """
69 68
70 69
71 70 pytrilinos_init = """from PyTrilinos import Epetra
72 71 class SimpleStruct:
73 72 pass
74 73 mpi = SimpleStruct()
75 74 mpi.rank = 0
76 75 mpi.size = 0
77 76 """
78 77
79 78 class MPI(Configurable):
80 79 """Configurable for MPI initialization"""
81 80 use = Unicode('', config=True,
82 81 help='How to enable MPI (mpi4py, pytrilinos, or empty string to disable).'
83 82 )
84 83
85 84 def _use_changed(self, name, old, new):
86 85 # load default init script if it's not set
87 86 if not self.init_script:
88 87 self.init_script = self.default_inits.get(new, '')
89 88
90 89 init_script = Unicode('', config=True,
91 90 help="Initialization code for MPI")
92 91
93 92 default_inits = Dict({'mpi4py' : mpi4py_init, 'pytrilinos':pytrilinos_init},
94 93 config=True)
95 94
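A hypothetical ipengine_config.py fragment turning on the mpi4py initialization; the 'mpi' command-line alias defined below maps to the same MPI.use trait:

    c = get_config()
    c.MPI.use = 'mpi4py'    # use the mpi4py_init snippet above at engine startup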
96 95
97 96 #-----------------------------------------------------------------------------
98 97 # Main application
99 98 #-----------------------------------------------------------------------------
100 99
101 100
102 101 class IPEngineApp(ClusterApplication):
103 102
104 103 name = Unicode(u'ipengine')
105 104 description = Unicode(_description)
106 105 default_config_file_name = default_config_file_name
107 106 classes = List([ClusterDir, StreamSession, EngineFactory, Kernel, MPI])
108 107
109 108 auto_create_cluster_dir = Bool(False,
110 109 help="whether to create the cluster_dir if it doesn't exist")
111 110
112 111 startup_script = Unicode(u'', config=True,
113 112 help='specify a script to be run at startup')
114 113 startup_command = Unicode('', config=True,
115 114 help='specify a command to be run at startup')
116 115
117 116 url_file = Unicode(u'', config=True,
118 117 help="""The full location of the file containing the connection information for
119 118 the controller. If this is not given, the file must be in the
120 119 security directory of the cluster directory. This location is
121 120 resolved using the `profile` or `cluster_dir` options.""",
122 121 )
123 122
124 123 url_file_name = Unicode(u'ipcontroller-engine.json')
124 log_url = Unicode('', config=True,
125 help="""The URL for the iploggerapp instance, for forwarding
126 logging to a central location.""")
125 127
126 128 aliases = Dict(dict(
127 129 config = 'IPEngineApp.config_file',
128 130 file = 'IPEngineApp.url_file',
129 131 c = 'IPEngineApp.startup_command',
130 132 s = 'IPEngineApp.startup_script',
131 133
132 134 ident = 'StreamSession.session',
133 135 user = 'StreamSession.username',
134 136 exec_key = 'StreamSession.keyfile',
135 137
136 138 url = 'EngineFactory.url',
137 139 ip = 'EngineFactory.ip',
138 140 transport = 'EngineFactory.transport',
139 141 port = 'EngineFactory.regport',
140 142 location = 'EngineFactory.location',
141 143
142 144 timeout = 'EngineFactory.timeout',
143 145
144 146 profile = "ClusterDir.profile",
145 147 cluster_dir = 'ClusterDir.location',
146 148
147 149 mpi = 'MPI.use',
148 150
149 151 log_level = 'IPEngineApp.log_level',
152 log_url = 'IPEngineApp.log_url'
150 153 ))
151 154
152 155 # def find_key_file(self):
153 156 # """Set the key file.
154 157 #
155 158 # Here we don't try to actually see if it exists for is valid as that
156 159 # is hadled by the connection logic.
157 160 # """
158 161 # config = self.master_config
159 162 # # Find the actual controller key file
160 163 # if not config.Global.key_file:
161 164 # try_this = os.path.join(
162 165 # config.Global.cluster_dir,
163 166 # config.Global.security_dir,
164 167 # config.Global.key_file_name
165 168 # )
166 169 # config.Global.key_file = try_this
167 170
168 171 def find_url_file(self):
169 172 """Set the key file.
170 173
171 174 Here we don't try to actually see if it exists for is valid as that
172 175 is hadled by the connection logic.
173 176 """
174 177 config = self.config
175 178 # Find the actual controller key file
176 179 if not self.url_file:
177 180 self.url_file = os.path.join(
178 181 self.cluster_dir.security_dir,
179 182 self.url_file_name
180 183 )
181 184 def init_engine(self):
182 185 # This is the working dir by now.
183 186 sys.path.insert(0, '')
184 187 config = self.config
185 188 # print config
186 189 self.find_url_file()
187 190
188 191 # if os.path.exists(config.Global.key_file) and config.Global.secure:
189 192 # config.SessionFactory.exec_key = config.Global.key_file
190 193 if os.path.exists(self.url_file):
191 194 with open(self.url_file) as f:
192 195 d = json.loads(f.read())
193 196 for k,v in d.iteritems():
194 197 if isinstance(v, unicode):
195 198 d[k] = v.encode()
196 199 if d['exec_key']:
197 200 config.StreamSession.key = d['exec_key']
198 201 d['url'] = disambiguate_url(d['url'], d['location'])
199 202 config.EngineFactory.url = d['url']
200 203 config.EngineFactory.location = d['location']
201 204
202 205 try:
203 206 exec_lines = config.Kernel.exec_lines
204 207 except AttributeError:
205 208 config.Kernel.exec_lines = []
206 209 exec_lines = config.Kernel.exec_lines
207 210
208 211 if self.startup_script:
209 212 enc = sys.getfilesystemencoding() or 'utf8'
210 213 cmd="execfile(%r)"%self.startup_script.encode(enc)
211 214 exec_lines.append(cmd)
212 215 if self.startup_command:
213 216 exec_lines.append(self.startup_command)
214 217
215 218 # Create the underlying shell class and Engine
216 219 # shell_class = import_item(self.master_config.Global.shell_class)
217 220 # print self.config
218 221 try:
219 222 self.engine = EngineFactory(config=config, log=self.log)
220 223 except:
221 224 self.log.error("Couldn't start the Engine", exc_info=True)
222 225 self.exit(1)
223 226
224 # self.start_logging()
225
226 # Create the service hierarchy
227 # self.main_service = service.MultiService()
228 # self.engine_service.setServiceParent(self.main_service)
229 # self.tub_service = Tub()
230 # self.tub_service.setServiceParent(self.main_service)
231 # # This needs to be called before the connection is initiated
232 # self.main_service.startService()
233
234 # This initiates the connection to the controller and calls
235 # register_engine to tell the controller we are ready to do work
236 # self.engine_connector = EngineConnector(self.tub_service)
237
238 # self.log.info("Using furl file: %s" % self.master_config.Global.furl_file)
239
240 # reactor.callWhenRunning(self.call_connect)
241
242 # def start_logging(self):
243 # super(IPEngineApp, self).start_logging()
244 # if self.master_config.Global.log_url:
245 # context = self.engine.context
246 # lsock = context.socket(zmq.PUB)
247 # lsock.connect(self.master_config.Global.log_url)
248 # handler = EnginePUBHandler(self.engine, lsock)
249 # handler.setLevel(self.log_level)
250 # self.log.addHandler(handler)
227 def forward_logging(self):
228 if self.log_url:
229 self.log.info("Forwarding logging to %s"%self.log_url)
230 context = self.engine.context
231 lsock = context.socket(zmq.PUB)
232 lsock.connect(self.log_url)
233 self.log.removeHandler(self._log_handler)
234 handler = EnginePUBHandler(self.engine, lsock)
235 handler.setLevel(self.log_level)
236 self.log.addHandler(handler)
237 self._log_handler = handler
251 238 #
252 239 def init_mpi(self):
253 240 global mpi
254 241 self.mpi = MPI(config=self.config)
255 242
256 243 mpi_import_statement = self.mpi.init_script
257 244 if mpi_import_statement:
258 245 try:
259 246 self.log.info("Initializing MPI:")
260 247 self.log.info(mpi_import_statement)
261 248 exec mpi_import_statement in globals()
262 249 except:
263 250 mpi = None
264 251 else:
265 252 mpi = None
266 253
267 254 def initialize(self, argv=None):
268 255 super(IPEngineApp, self).initialize(argv)
269 256 self.init_mpi()
270 257 self.init_engine()
258 self.forward_logging()
271 259
272 260 def start(self):
273 261 self.engine.start()
274 262 try:
275 263 self.engine.loop.start()
276 264 except KeyboardInterrupt:
277 265 self.log.critical("Engine Interrupted, shutting down...\n")
278 266
279 267
280 268 def launch_new_instance():
281 269 """Create and run the IPython engine"""
282 270 app = IPEngineApp()
283 271 app.initialize()
284 272 app.start()
285 273
286 274
287 275 if __name__ == '__main__':
288 276 launch_new_instance()
289 277
@@ -1,132 +1,97 @@
1 1 #!/usr/bin/env python
2 2 # encoding: utf-8
3 3 """
4 4 A simple IPython logger application
5 5 """
6 6
7 7 #-----------------------------------------------------------------------------
8 8 # Copyright (C) 2011 The IPython Development Team
9 9 #
10 10 # Distributed under the terms of the BSD License. The full license is in
11 11 # the file COPYING, distributed as part of this software.
12 12 #-----------------------------------------------------------------------------
13 13
14 14 #-----------------------------------------------------------------------------
15 15 # Imports
16 16 #-----------------------------------------------------------------------------
17 17
18 18 import os
19 19 import sys
20 20
21 21 import zmq
22 22
23 from IPython.utils.traitlets import Bool, Dict
24
23 25 from IPython.parallel.apps.clusterdir import (
24 26 ClusterApplication,
25 ClusterDirConfigLoader
27 ClusterDir,
28 base_aliases
26 29 )
27 30 from IPython.parallel.apps.logwatcher import LogWatcher
28 31
29 32 #-----------------------------------------------------------------------------
30 33 # Module level variables
31 34 #-----------------------------------------------------------------------------
32 35
33 36 #: The default config file name for this application
34 37 default_config_file_name = u'iplogger_config.py'
35 38
36 39 _description = """Start an IPython logger for parallel computing.\n\n
37 40
38 41 IPython controllers and engines (and your own processes) can broadcast log messages
39 42 by registering a `zmq.log.handlers.PUBHandler` with the `logging` module. The
40 43 logger can be configured using command line options or using a cluster
41 44 directory. Cluster directories contain config, log and security files and are
42 45 usually located in your ipython directory and named as "cluster_<profile>".
43 46 See the --profile and --cluster-dir options for details.
44 47 """
45 48
46 #-----------------------------------------------------------------------------
47 # Command line options
48 #-----------------------------------------------------------------------------
49
50
51 class IPLoggerAppConfigLoader(ClusterDirConfigLoader):
52
53 def _add_arguments(self):
54 super(IPLoggerAppConfigLoader, self)._add_arguments()
55 paa = self.parser.add_argument
56 # Controller config
57 paa('--url',
58 type=str, dest='LogWatcher.url',
59 help='The url the LogWatcher will listen on',
60 )
61 # MPI
62 paa('--topics',
63 type=str, dest='LogWatcher.topics', nargs='+',
64 help='What topics to subscribe to',
65 metavar='topics')
66 # Global config
67 paa('--log-to-file',
68 action='store_true', dest='Global.log_to_file',
69 help='Log to a file in the log directory (default is stdout)')
70
71 49
72 50 #-----------------------------------------------------------------------------
73 51 # Main application
74 52 #-----------------------------------------------------------------------------
75
53 aliases = {}
54 aliases.update(base_aliases)
55 aliases.update(dict(url='LogWatcher.url', topics='LogWatcher.topics'))
76 56
77 57 class IPLoggerApp(ClusterApplication):
78 58
79 59 name = u'iplogger'
80 60 description = _description
81 command_line_loader = IPLoggerAppConfigLoader
82 61 default_config_file_name = default_config_file_name
83 auto_create_cluster_dir = True
84
85 def create_default_config(self):
86 super(IPLoggerApp, self).create_default_config()
87
88 # The engine should not clean logs as we don't want to remove the
89 # active log files of other running engines.
90 self.default_config.Global.clean_logs = False
91
92 # If given, this is the actual location of the logger's URL file.
93 # If not, this is computed using the profile, app_dir and furl_file_name
94 self.default_config.Global.url_file_name = u'iplogger.url'
95 self.default_config.Global.url_file = u''
96
97 def post_load_command_line_config(self):
98 pass
99
100 def pre_construct(self):
101 super(IPLoggerApp, self).pre_construct()
102
103 def construct(self):
104 # This is the working dir by now.
105 sys.path.insert(0, '')
106
107 self.start_logging()
108
62 auto_create_cluster_dir = Bool(False)
63
64 classes = [LogWatcher, ClusterDir]
65 aliases = Dict(aliases)
66
67 def initialize(self, argv=None):
68 super(IPLoggerApp, self).initialize(argv)
69 self.init_watcher()
70
71 def init_watcher(self):
109 72 try:
110 self.watcher = LogWatcher(config=self.master_config, logname=self.log.name)
73 self.watcher = LogWatcher(config=self.config, logname=self.log.name)
111 74 except:
112 75 self.log.error("Couldn't start the LogWatcher", exc_info=True)
113 76 self.exit(1)
77 self.log.info("Listening for log messages on %r"%self.watcher.url)
114 78
115 79
116 def start_app(self):
80 def start(self):
81 self.watcher.start()
117 82 try:
118 self.watcher.start()
119 83 self.watcher.loop.start()
120 84 except KeyboardInterrupt:
121 85 self.log.critical("Logging Interrupted, shutting down...\n")
122 86
123 87
124 88 def launch_new_instance():
125 89 """Create and run the IPython LogWatcher"""
126 90 app = IPLoggerApp()
91 app.initialize()
127 92 app.start()
128 93
129 94
130 95 if __name__ == '__main__':
131 96 launch_new_instance()
132 97
@@ -1,98 +1,108 @@
1 1 #!/usr/bin/env python
2 2 """A simple logger object that consolidates messages incoming from ipcluster processes."""
3 3
4 4 #-----------------------------------------------------------------------------
5 5 # Copyright (C) 2011 The IPython Development Team
6 6 #
7 7 # Distributed under the terms of the BSD License. The full license is in
8 8 # the file COPYING, distributed as part of this software.
9 9 #-----------------------------------------------------------------------------
10 10
11 11 #-----------------------------------------------------------------------------
12 12 # Imports
13 13 #-----------------------------------------------------------------------------
14 14
15 15
16 16 import logging
17 17 import sys
18 18
19 19 import zmq
20 20 from zmq.eventloop import ioloop, zmqstream
21 21
22 22 from IPython.utils.traitlets import Int, Unicode, Instance, List
23 23
24 24 from IPython.parallel.factory import LoggingFactory
25 25
26 26 #-----------------------------------------------------------------------------
27 27 # Classes
28 28 #-----------------------------------------------------------------------------
29 29
30 30
31 31 class LogWatcher(LoggingFactory):
32 32 """A simple class that receives messages on a SUB socket, as published
33 33 by subclasses of `zmq.log.handlers.PUBHandler`, and logs them itself.
34 34
35 35 This can subscribe to multiple topics, but defaults to all topics.
36 36 """
37 37 # configurables
38 topics = List([''], config=True)
39 url = Unicode('tcp://127.0.0.1:20202', config=True)
38 topics = List([''], config=True,
39 help="The ZMQ topics to subscribe to. Default is to subscribe to all messages")
40 url = Unicode('tcp://127.0.0.1:20202', config=True,
41 help="ZMQ url on which to listen for log messages")
40 42
41 43 # internals
42 context = Instance(zmq.Context, (), {})
43 44 stream = Instance('zmq.eventloop.zmqstream.ZMQStream')
44 loop = Instance('zmq.eventloop.ioloop.IOLoop')
45
46 context = Instance(zmq.Context)
47 def _context_default(self):
48 return zmq.Context.instance()
49
50 loop = Instance(zmq.eventloop.ioloop.IOLoop)
45 51 def _loop_default(self):
46 52 return ioloop.IOLoop.instance()
47 53
48 54 def __init__(self, **kwargs):
49 55 super(LogWatcher, self).__init__(**kwargs)
50 56 s = self.context.socket(zmq.SUB)
51 57 s.bind(self.url)
52 58 self.stream = zmqstream.ZMQStream(s, self.loop)
53 59 self.subscribe()
54 60 self.on_trait_change(self.subscribe, 'topics')
55 61
56 62 def start(self):
57 63 self.stream.on_recv(self.log_message)
58 64
59 65 def stop(self):
60 66 self.stream.stop_on_recv()
61 67
62 68 def subscribe(self):
63 69 """Update our SUB socket's subscriptions."""
64 70 self.stream.setsockopt(zmq.UNSUBSCRIBE, '')
65 for topic in self.topics:
66 self.log.debug("Subscribing to: %r"%topic)
67 self.stream.setsockopt(zmq.SUBSCRIBE, topic)
71 if '' in self.topics:
72 self.log.debug("Subscribing to: everything")
73 self.stream.setsockopt(zmq.SUBSCRIBE, '')
74 else:
75 for topic in self.topics:
76 self.log.debug("Subscribing to: %r"%(topic))
77 self.stream.setsockopt(zmq.SUBSCRIBE, topic)
68 78
69 79 def _extract_level(self, topic_str):
70 80 """Turn 'engine.0.INFO.extra' into (logging.INFO, 'engine.0.extra')"""
71 81 topics = topic_str.split('.')
72 82 for idx,t in enumerate(topics):
73 83 level = getattr(logging, t, None)
74 84 if level is not None:
75 85 break
76 86
77 87 if level is None:
78 88 level = logging.INFO
79 89 else:
80 90 topics.pop(idx)
81 91
82 92 return level, '.'.join(topics)
83 93
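# --- Editor's note: a worked example of the parsing above. The first topic
# --- component that names a logging level is removed and returned numerically:
# ---     _extract_level('engine.0.INFO.extra')   -> (20, 'engine.0.extra')
# ---     _extract_level('controller.heartbeat')  -> (20, 'controller.heartbeat')
# --- (logging.INFO == 20; when no level is found, it defaults to INFO.)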
84 94
85 95 def log_message(self, raw):
86 96 """receive and parse a message, then log it."""
87 97 if len(raw) != 2 or '.' not in raw[0]:
88 98 self.log.error("Invalid log message: %s"%raw)
89 99 return
90 100 else:
91 101 topic, msg = raw
92 102 # don't newline, since log messages always newline:
93 103 topic,level_name = topic.rsplit('.',1)
94 104 level,topic = self._extract_level(topic)
95 105 if msg[-1] == '\n':
96 106 msg = msg[:-1]
97 logging.log(level, "[%s] %s" % (topic, msg))
107 self.log.log(level, "[%s] %s" % (topic, msg))
98 108
@@ -1,677 +1,679 b''
1 1 """The Python scheduler for rich scheduling.
2 2
3 3 The Pure ZMQ scheduler does not allow routing schemes other than LRU,
4 4 nor does it check msg_id DAG dependencies. For those, a slightly slower
5 5 Python Scheduler exists.
6 6 """
7 7 #-----------------------------------------------------------------------------
8 8 # Copyright (C) 2010-2011 The IPython Development Team
9 9 #
10 10 # Distributed under the terms of the BSD License. The full license is in
11 11 # the file COPYING, distributed as part of this software.
12 12 #-----------------------------------------------------------------------------
13 13
14 14 #----------------------------------------------------------------------
15 15 # Imports
16 16 #----------------------------------------------------------------------
17 17
18 18 from __future__ import print_function
19 19
20 20 import logging
21 21 import sys
22 22
23 23 from datetime import datetime, timedelta
24 24 from random import randint, random
25 25 from types import FunctionType
26 26
27 27 try:
28 28 import numpy
29 29 except ImportError:
30 30 numpy = None
31 31
32 32 import zmq
33 33 from zmq.eventloop import ioloop, zmqstream
34 34
35 35 # local imports
36 36 from IPython.external.decorator import decorator
37 37 from IPython.config.loader import Config
38 38 from IPython.utils.traitlets import Instance, Dict, List, Set, Int, Str, Enum
39 39
40 40 from IPython.parallel import error
41 41 from IPython.parallel.factory import SessionFactory
42 42 from IPython.parallel.util import connect_logger, local_logger
43 43
44 44 from .dependency import Dependency
45 45
46 46 @decorator
47 47 def logged(f,self,*args,**kwargs):
48 48 # print ("#--------------------")
49 49 self.log.debug("scheduler::%s(*%s,**%s)"%(f.func_name, args, kwargs))
50 50 # print ("#--")
51 51 return f(self,*args, **kwargs)
52 52
53 53 #----------------------------------------------------------------------
54 54 # Chooser functions
55 55 #----------------------------------------------------------------------
56 56
57 57 def plainrandom(loads):
58 58 """Plain random pick."""
59 59 n = len(loads)
60 60 return randint(0,n-1)
61 61
62 62 def lru(loads):
63 63 """Always pick the front of the line.
64 64
65 65 The content of `loads` is ignored.
66 66
67 67 Assumes LRU ordering of loads, with oldest first.
68 68 """
69 69 return 0
70 70
71 71 def twobin(loads):
72 72 """Pick two at random, use the LRU of the two.
73 73
74 74 The content of loads is ignored.
75 75
76 76 Assumes LRU ordering of loads, with oldest first.
77 77 """
78 78 n = len(loads)
79 79 a = randint(0,n-1)
80 80 b = randint(0,n-1)
81 81 return min(a,b)
82 82
83 83 def weighted(loads):
84 84 """Pick two at random using inverse load as weight.
85 85
86 86 Return the less loaded of the two.
87 87 """
88 88 # weight 0 a million times more than 1:
89 89 weights = 1./(1e-6+numpy.array(loads))
90 90 sums = weights.cumsum()
91 91 t = sums[-1]
92 92 x = random()*t
93 93 y = random()*t
94 94 idx = 0
95 95 idy = 0
96 96 while sums[idx] < x:
97 97 idx += 1
98 98 while sums[idy] < y:
99 99 idy += 1
100 100 if weights[idy] > weights[idx]:
101 101 return idy
102 102 else:
103 103 return idx
104 104
105 105 def leastload(loads):
106 106 """Always choose the lowest load.
107 107
108 108 If the lowest load occurs more than once, the first
109 109 occurance will be used. If loads has LRU ordering, this means
110 110 the LRU of those with the lowest load is chosen.
111 111 """
112 112 return loads.index(min(loads))
113 113
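# --- Editor's note: a worked example of the chooser functions above, on an
# --- LRU-ordered load list (outstanding tasks per engine, oldest-idle first):
# ---     loads = [2, 0, 1, 0]
# ---     plainrandom(loads) -> a uniformly random index
# ---     lru(loads)         -> 0  (always the head of the line)
# ---     twobin(loads)      -> the lower (longer-idle) of two random indices
# ---     weighted(loads)    -> a random index biased toward light loads (needs numpy)
# ---     leastload(loads)   -> 1  (first occurrence of the minimum load)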
114 114 #---------------------------------------------------------------------
115 115 # Classes
116 116 #---------------------------------------------------------------------
117 117 # store empty default dependency:
118 118 MET = Dependency([])
119 119
120 120 class TaskScheduler(SessionFactory):
121 121 """Python TaskScheduler object.
122 122
123 123 This is the simplest object that supports msg_id based
124 124 DAG dependencies. *Only* task msg_ids are checked, not
125 125 msg_ids of jobs submitted via the MUX queue.
126 126
127 127 """
128 128
129 129 hwm = Int(0, config=True, shortname='hwm',
130 130 help="""specify the High Water Mark (HWM) for the downstream
131 131 socket in the Task scheduler. This is the maximum number
132 132 of allowed outstanding tasks on each engine."""
133 133 )
134 134 scheme_name = Enum(('leastload', 'pure', 'lru', 'plainrandom', 'weighted', 'twobin'),
135 135 'leastload', config=True, shortname='scheme', allow_none=False,
136 136 help="""select the task scheduler scheme [default: leastload]
137 137 Options are: 'pure', 'lru', 'plainrandom', 'weighted', 'twobin', 'leastload'"""
138 138 )
139 139 def _scheme_name_changed(self, old, new):
140 140 self.log.debug("Using scheme %r"%new)
141 141 self.scheme = globals()[new]
142 142
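# --- Editor's sketch (assumed profile snippet, not part of this diff): both traits
# --- above are configurable, so a cluster profile could select the scheme and cap
# --- outstanding tasks per engine, e.g. in an ipcontroller_config.py:
# ---     c = get_config()
# ---     c.TaskScheduler.scheme_name = 'weighted'
# ---     c.TaskScheduler.hwm = 2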
143 143 # input arguments:
144 scheme = Instance(FunctionType, default=leastload) # function for determining the destination
144 scheme = Instance(FunctionType) # function for determining the destination
145 def _scheme_default(self):
146 return leastload
145 147 client_stream = Instance(zmqstream.ZMQStream) # client-facing stream
146 148 engine_stream = Instance(zmqstream.ZMQStream) # engine-facing stream
147 149 notifier_stream = Instance(zmqstream.ZMQStream) # hub-facing sub stream
148 150 mon_stream = Instance(zmqstream.ZMQStream) # hub-facing pub stream
149 151
150 152 # internals:
151 153 graph = Dict() # dict by msg_id of [ msg_ids that depend on key ]
152 154 retries = Dict() # dict by msg_id of retries remaining (non-neg ints)
153 155 # waiting = List() # list of msg_ids ready to run, but haven't due to HWM
154 156 depending = Dict() # dict by msg_id of (msg_id, raw_msg, after, follow)
155 157 pending = Dict() # dict by engine_uuid of submitted tasks
156 158 completed = Dict() # dict by engine_uuid of completed tasks
157 159 failed = Dict() # dict by engine_uuid of failed tasks
158 160 destinations = Dict() # dict by msg_id of engine_uuids where jobs ran (reverse of completed+failed)
159 161 clients = Dict() # dict by msg_id for who submitted the task
160 162 targets = List() # list of target IDENTs
161 163 loads = List() # list of engine loads
162 164 # full = Set() # set of IDENTs that have HWM outstanding tasks
163 165 all_completed = Set() # set of all completed tasks
164 166 all_failed = Set() # set of all failed tasks
165 167 all_done = Set() # set of all finished tasks=union(completed,failed)
166 168 all_ids = Set() # set of all submitted task IDs
167 169 blacklist = Dict() # dict by msg_id of locations where a job has encountered UnmetDependency
168 170 auditor = Instance('zmq.eventloop.ioloop.PeriodicCallback')
169 171
170 172
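# --- Editor's illustration of the bookkeeping above, with assumed sample values:
# ---     graph     = {'msg-1': {'msg-2'}}    # msg-2 is waiting on msg-1
# ---     depending = {'msg-2': [raw_msg, targets, after, follow, timeout]}
# ---     pending   = {'<engine-uuid>': {'msg-3': (raw_msg, targets, MET, follow, timeout)}}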
171 173 def start(self):
172 174 self.engine_stream.on_recv(self.dispatch_result, copy=False)
173 175 self._notification_handlers = dict(
174 176 registration_notification = self._register_engine,
175 177 unregistration_notification = self._unregister_engine
176 178 )
177 179 self.notifier_stream.on_recv(self.dispatch_notification)
178 180 self.auditor = ioloop.PeriodicCallback(self.audit_timeouts, 2e3, self.loop) # every 2 seconds
179 181 self.auditor.start()
180 182 self.log.info("Scheduler started...%r"%self)
181 183
182 184 def resume_receiving(self):
183 185 """Resume accepting jobs."""
184 186 self.client_stream.on_recv(self.dispatch_submission, copy=False)
185 187
186 188 def stop_receiving(self):
187 189 """Stop accepting jobs while there are no engines.
188 190 Leave them in the ZMQ queue."""
189 191 self.client_stream.on_recv(None)
190 192
191 193 #-----------------------------------------------------------------------
192 194 # [Un]Registration Handling
193 195 #-----------------------------------------------------------------------
194 196
195 197 def dispatch_notification(self, msg):
196 198 """dispatch register/unregister events."""
197 199 idents,msg = self.session.feed_identities(msg)
198 200 msg = self.session.unpack_message(msg)
199 201 msg_type = msg['msg_type']
200 202 handler = self._notification_handlers.get(msg_type, None)
201 203 if handler is None:
202 204 raise Exception("Unhandled message type: %s"%msg_type)
203 205 else:
204 206 try:
205 207 handler(str(msg['content']['queue']))
206 208 except KeyError:
207 209 self.log.error("task::Invalid notification msg: %s"%msg)
208 210
209 211 @logged
210 212 def _register_engine(self, uid):
211 213 """New engine with ident `uid` became available."""
212 214 # head of the line:
213 215 self.targets.insert(0,uid)
214 216 self.loads.insert(0,0)
215 217 # initialize sets
216 218 self.completed[uid] = set()
217 219 self.failed[uid] = set()
218 220 self.pending[uid] = {}
219 221 if len(self.targets) == 1:
220 222 self.resume_receiving()
221 223 # rescan the graph:
222 224 self.update_graph(None)
223 225
224 226 def _unregister_engine(self, uid):
225 227 """Existing engine with ident `uid` became unavailable."""
226 228 if len(self.targets) == 1:
227 229 # this was our only engine
228 230 self.stop_receiving()
229 231
230 232 # handle any potentially finished tasks:
231 233 self.engine_stream.flush()
232 234
233 235 # don't pop destinations, because they might be used later
234 236 # map(self.destinations.pop, self.completed.pop(uid))
235 237 # map(self.destinations.pop, self.failed.pop(uid))
236 238
237 239 # prevent this engine from receiving work
238 240 idx = self.targets.index(uid)
239 241 self.targets.pop(idx)
240 242 self.loads.pop(idx)
241 243
242 244 # wait 5 seconds before cleaning up pending jobs, since the results might
243 245 # still be incoming
244 246 if self.pending[uid]:
245 247 dc = ioloop.DelayedCallback(lambda : self.handle_stranded_tasks(uid), 5000, self.loop)
246 248 dc.start()
247 249 else:
248 250 self.completed.pop(uid)
249 251 self.failed.pop(uid)
250 252
251 253
252 254 @logged
253 255 def handle_stranded_tasks(self, engine):
254 256 """Deal with jobs resident in an engine that died."""
255 257 lost = self.pending[engine]
256 258 for msg_id in lost.keys():
257 259 if msg_id not in self.pending[engine]:
258 260 # prevent double-handling of messages
259 261 continue
260 262
261 263 raw_msg = lost[msg_id][0]
262 264
263 265 idents,msg = self.session.feed_identities(raw_msg, copy=False)
264 266 msg = self.session.unpack_message(msg, copy=False, content=False)
265 267 parent = msg['header']
266 268 idents = [engine, idents[0]]
267 269
268 270 # build fake error reply
269 271 try:
270 272 raise error.EngineError("Engine %r died while running task %r"%(engine, msg_id))
271 273 except:
272 274 content = error.wrap_exception()
273 275 msg = self.session.msg('apply_reply', content, parent=parent, subheader={'status':'error'})
274 276 raw_reply = map(zmq.Message, self.session.serialize(msg, ident=idents))
275 277 # and dispatch it
276 278 self.dispatch_result(raw_reply)
277 279
278 280 # finally scrub completed/failed lists
279 281 self.completed.pop(engine)
280 282 self.failed.pop(engine)
281 283
282 284
283 285 #-----------------------------------------------------------------------
284 286 # Job Submission
285 287 #-----------------------------------------------------------------------
286 288 @logged
287 289 def dispatch_submission(self, raw_msg):
288 290 """Dispatch job submission to appropriate handlers."""
289 291 # ensure targets up to date:
290 292 self.notifier_stream.flush()
291 293 try:
292 294 idents, msg = self.session.feed_identities(raw_msg, copy=False)
293 295 msg = self.session.unpack_message(msg, content=False, copy=False)
294 296 except Exception:
295 297 self.log.error("task::Invalid task: %s"%raw_msg, exc_info=True)
296 298 return
297 299
298 300 # send to monitor
299 301 self.mon_stream.send_multipart(['intask']+raw_msg, copy=False)
300 302
301 303 header = msg['header']
302 304 msg_id = header['msg_id']
303 305 self.all_ids.add(msg_id)
304 306
305 307 # targets
306 308 targets = set(header.get('targets', []))
307 309 retries = header.get('retries', 0)
308 310 self.retries[msg_id] = retries
309 311
310 312 # time dependencies
311 313 after = Dependency(header.get('after', []))
312 314 if after.all:
313 315 if after.success:
314 316 after.difference_update(self.all_completed)
315 317 if after.failure:
316 318 after.difference_update(self.all_failed)
317 319 if after.check(self.all_completed, self.all_failed):
318 320 # recast as empty set, if `after` already met,
319 321 # to prevent unnecessary set comparisons
320 322 after = MET
321 323
322 324 # location dependencies
323 325 follow = Dependency(header.get('follow', []))
324 326
325 327 # turn timeouts into datetime objects:
326 328 timeout = header.get('timeout', None)
327 329 if timeout:
328 330 timeout = datetime.now() + timedelta(0,timeout,0)
329 331
330 332 args = [raw_msg, targets, after, follow, timeout]
331 333
332 334 # validate and reduce dependencies:
333 335 for dep in after,follow:
334 336 # check valid:
335 337 if msg_id in dep or dep.difference(self.all_ids):
336 338 self.depending[msg_id] = args
337 339 return self.fail_unreachable(msg_id, error.InvalidDependency)
338 340 # check if unreachable:
339 341 if dep.unreachable(self.all_completed, self.all_failed):
340 342 self.depending[msg_id] = args
341 343 return self.fail_unreachable(msg_id)
342 344
343 345 if after.check(self.all_completed, self.all_failed):
344 346 # time deps already met, try to run
345 347 if not self.maybe_run(msg_id, *args):
346 348 # can't run yet
347 349 if msg_id not in self.all_failed:
348 350 # could have failed as unreachable
349 351 self.save_unmet(msg_id, *args)
350 352 else:
351 353 self.save_unmet(msg_id, *args)
352 354
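# --- Editor's sketch (assumed values, not part of the changeset): the header fields
# --- consumed by dispatch_submission above. A submitted task might carry:
# ---     {'msg_id':  '<msg-id-3>',
# ---      'after':   ['<msg-id-1>'],   # time dependencies (msg_ids)
# ---      'follow':  ['<msg-id-2>'],   # location dependencies (msg_ids)
# ---      'targets': [],               # restrict to specific engine uuids
# ---      'retries': 1,                # resubmission budget on failure
# ---      'timeout': 30}               # seconds; converted to a datetime above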
353 355 # @logged
354 356 def audit_timeouts(self):
355 357 """Audit all waiting tasks for expired timeouts."""
356 358 now = datetime.now()
357 359 for msg_id in self.depending.keys():
358 360 # must recheck, in case one failure cascaded to another:
359 361 if msg_id in self.depending:
360 362 raw,targets,after,follow,timeout = self.depending[msg_id]
361 363 if timeout and timeout < now:
362 364 self.fail_unreachable(msg_id, error.TaskTimeout)
363 365
364 366 @logged
365 367 def fail_unreachable(self, msg_id, why=error.ImpossibleDependency):
366 368 """a task has become unreachable, send a reply with an ImpossibleDependency
367 369 error."""
368 370 if msg_id not in self.depending:
369 371 self.log.error("msg %r already failed!"%msg_id)
370 372 return
371 373 raw_msg,targets,after,follow,timeout = self.depending.pop(msg_id)
372 374 for mid in follow.union(after):
373 375 if mid in self.graph:
374 376 self.graph[mid].remove(msg_id)
375 377
376 378 # FIXME: unpacking a message I've already unpacked, but didn't save:
377 379 idents,msg = self.session.feed_identities(raw_msg, copy=False)
378 380 msg = self.session.unpack_message(msg, copy=False, content=False)
379 381 header = msg['header']
380 382
381 383 try:
382 384 raise why()
383 385 except:
384 386 content = error.wrap_exception()
385 387
386 388 self.all_done.add(msg_id)
387 389 self.all_failed.add(msg_id)
388 390
389 391 msg = self.session.send(self.client_stream, 'apply_reply', content,
390 392 parent=header, ident=idents)
391 393 self.session.send(self.mon_stream, msg, ident=['outtask']+idents)
392 394
393 395 self.update_graph(msg_id, success=False)
394 396
395 397 @logged
396 398 def maybe_run(self, msg_id, raw_msg, targets, after, follow, timeout):
397 399 """check location dependencies, and run if they are met."""
398 400 blacklist = self.blacklist.setdefault(msg_id, set())
399 401 if follow or targets or blacklist or self.hwm:
400 402 # we need a can_run filter
401 403 def can_run(idx):
402 404 # check hwm
403 405 if self.hwm and self.loads[idx] == self.hwm:
404 406 return False
405 407 target = self.targets[idx]
406 408 # check blacklist
407 409 if target in blacklist:
408 410 return False
409 411 # check targets
410 412 if targets and target not in targets:
411 413 return False
412 414 # check follow
413 415 return follow.check(self.completed[target], self.failed[target])
414 416
415 417 indices = filter(can_run, range(len(self.targets)))
416 418
417 419 if not indices:
418 420 # couldn't run
419 421 if follow.all:
420 422 # check follow for impossibility
421 423 dests = set()
422 424 relevant = set()
423 425 if follow.success:
424 426 relevant = self.all_completed
425 427 if follow.failure:
426 428 relevant = relevant.union(self.all_failed)
427 429 for m in follow.intersection(relevant):
428 430 dests.add(self.destinations[m])
429 431 if len(dests) > 1:
430 432 self.depending[msg_id] = (raw_msg, targets, after, follow, timeout)
431 433 self.fail_unreachable(msg_id)
432 434 return False
433 435 if targets:
434 436 # check blacklist+targets for impossibility
435 437 targets.difference_update(blacklist)
436 438 if not targets or not targets.intersection(self.targets):
437 439 self.depending[msg_id] = (raw_msg, targets, after, follow, timeout)
438 440 self.fail_unreachable(msg_id)
439 441 return False
440 442 return False
441 443 else:
442 444 indices = None
443 445
444 446 self.submit_task(msg_id, raw_msg, targets, follow, timeout, indices)
445 447 return True
446 448
447 449 @logged
448 450 def save_unmet(self, msg_id, raw_msg, targets, after, follow, timeout):
449 451 """Save a message for later submission when its dependencies are met."""
450 452 self.depending[msg_id] = [raw_msg,targets,after,follow,timeout]
451 453 # track the ids in follow or after, but not those already finished
452 454 for dep_id in after.union(follow).difference(self.all_done):
453 455 if dep_id not in self.graph:
454 456 self.graph[dep_id] = set()
455 457 self.graph[dep_id].add(msg_id)
456 458
457 459 @logged
458 460 def submit_task(self, msg_id, raw_msg, targets, follow, timeout, indices=None):
459 461 """Submit a task to any of a subset of our targets."""
460 462 if indices:
461 463 loads = [self.loads[i] for i in indices]
462 464 else:
463 465 loads = self.loads
464 466 idx = self.scheme(loads)
465 467 if indices:
466 468 idx = indices[idx]
467 469 target = self.targets[idx]
468 470 # print (target, map(str, msg[:3]))
469 471 # send job to the engine
470 472 self.engine_stream.send(target, flags=zmq.SNDMORE, copy=False)
471 473 self.engine_stream.send_multipart(raw_msg, copy=False)
472 474 # update load
473 475 self.add_job(idx)
474 476 self.pending[target][msg_id] = (raw_msg, targets, MET, follow, timeout)
475 477 # notify Hub
476 478 content = dict(msg_id=msg_id, engine_id=target)
477 479 self.session.send(self.mon_stream, 'task_destination', content=content,
478 480 ident=['tracktask',self.session.session])
479 481
480 482
481 483 #-----------------------------------------------------------------------
482 484 # Result Handling
483 485 #-----------------------------------------------------------------------
484 486 @logged
485 487 def dispatch_result(self, raw_msg):
486 488 """dispatch method for result replies"""
487 489 try:
488 490 idents,msg = self.session.feed_identities(raw_msg, copy=False)
489 491 msg = self.session.unpack_message(msg, content=False, copy=False)
490 492 engine = idents[0]
491 493 try:
492 494 idx = self.targets.index(engine)
493 495 except ValueError:
494 496 pass # skip load-update for dead engines
495 497 else:
496 498 self.finish_job(idx)
497 499 except Exception:
498 500 self.log.error("task::Invalid result: %s"%raw_msg, exc_info=True)
499 501 return
500 502
501 503 header = msg['header']
502 504 parent = msg['parent_header']
503 505 if header.get('dependencies_met', True):
504 506 success = (header['status'] == 'ok')
505 507 msg_id = parent['msg_id']
506 508 retries = self.retries[msg_id]
507 509 if not success and retries > 0:
508 510 # failed
509 511 self.retries[msg_id] = retries - 1
510 512 self.handle_unmet_dependency(idents, parent)
511 513 else:
512 514 del self.retries[msg_id]
513 515 # relay to client and update graph
514 516 self.handle_result(idents, parent, raw_msg, success)
515 517 # send to Hub monitor
516 518 self.mon_stream.send_multipart(['outtask']+raw_msg, copy=False)
517 519 else:
518 520 self.handle_unmet_dependency(idents, parent)
519 521
520 522 @logged
521 523 def handle_result(self, idents, parent, raw_msg, success=True):
522 524 """handle a real task result, either success or failure"""
523 525 # first, relay result to client
524 526 engine = idents[0]
525 527 client = idents[1]
526 528 # swap_ids for XREP-XREP mirror
527 529 raw_msg[:2] = [client,engine]
528 530 # print (map(str, raw_msg[:4]))
529 531 self.client_stream.send_multipart(raw_msg, copy=False)
530 532 # now, update our data structures
531 533 msg_id = parent['msg_id']
532 534 self.blacklist.pop(msg_id, None)
533 535 self.pending[engine].pop(msg_id)
534 536 if success:
535 537 self.completed[engine].add(msg_id)
536 538 self.all_completed.add(msg_id)
537 539 else:
538 540 self.failed[engine].add(msg_id)
539 541 self.all_failed.add(msg_id)
540 542 self.all_done.add(msg_id)
541 543 self.destinations[msg_id] = engine
542 544
543 545 self.update_graph(msg_id, success)
544 546
545 547 @logged
546 548 def handle_unmet_dependency(self, idents, parent):
547 549 """handle an unmet dependency"""
548 550 engine = idents[0]
549 551 msg_id = parent['msg_id']
550 552
551 553 if msg_id not in self.blacklist:
552 554 self.blacklist[msg_id] = set()
553 555 self.blacklist[msg_id].add(engine)
554 556
555 557 args = self.pending[engine].pop(msg_id)
556 558 raw,targets,after,follow,timeout = args
557 559
558 560 if self.blacklist[msg_id] == targets:
559 561 self.depending[msg_id] = args
560 562 self.fail_unreachable(msg_id)
561 563 elif not self.maybe_run(msg_id, *args):
562 564 # resubmit failed
563 565 if msg_id not in self.all_failed:
564 566 # put it back in our dependency tree
565 567 self.save_unmet(msg_id, *args)
566 568
567 569 if self.hwm:
568 570 try:
569 571 idx = self.targets.index(engine)
570 572 except ValueError:
571 573 pass # skip load-update for dead engines
572 574 else:
573 575 if self.loads[idx] == self.hwm-1:
574 576 self.update_graph(None)
575 577
576 578
577 579
578 580 @logged
579 581 def update_graph(self, dep_id=None, success=True):
580 582 """dep_id just finished. Update our dependency
581 583 graph and submit any jobs that just became runnable.
582 584
583 585 Called with dep_id=None to update entire graph for hwm, but without finishing
584 586 a task.
585 587 """
586 588 # print ("\n\n***********")
587 589 # pprint (dep_id)
588 590 # pprint (self.graph)
589 591 # pprint (self.depending)
590 592 # pprint (self.all_completed)
591 593 # pprint (self.all_failed)
592 594 # print ("\n\n***********\n\n")
593 595 # update any jobs that depended on the dependency
594 596 jobs = self.graph.pop(dep_id, [])
595 597
596 598 # recheck *all* jobs if
597 599 # a) we have HWM and an engine just became no longer full
598 600 # or b) dep_id was given as None
599 601 if dep_id is None or self.hwm and any( [ load==self.hwm-1 for load in self.loads ]):
600 602 jobs = self.depending.keys()
601 603
602 604 for msg_id in jobs:
603 605 raw_msg, targets, after, follow, timeout = self.depending[msg_id]
604 606
605 607 if after.unreachable(self.all_completed, self.all_failed) or follow.unreachable(self.all_completed, self.all_failed):
606 608 self.fail_unreachable(msg_id)
607 609
608 610 elif after.check(self.all_completed, self.all_failed): # time deps met, maybe run
609 611 if self.maybe_run(msg_id, raw_msg, targets, MET, follow, timeout):
610 612
611 613 self.depending.pop(msg_id)
612 614 for mid in follow.union(after):
613 615 if mid in self.graph:
614 616 self.graph[mid].remove(msg_id)
615 617
616 618 #----------------------------------------------------------------------
617 619 # methods to be overridden by subclasses
618 620 #----------------------------------------------------------------------
619 621
620 622 def add_job(self, idx):
621 623 """Called after self.targets[idx] just got the job with header.
622 624 Override in subclasses. The default ordering is simple LRU.
623 625 The default loads are the number of outstanding jobs."""
624 626 self.loads[idx] += 1
625 627 for lis in (self.targets, self.loads):
626 628 lis.append(lis.pop(idx))
627 629
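# --- Editor's note: a worked example of the LRU bookkeeping above. After the engine
# --- at index idx takes a job, it moves to the back of the line with its load bumped:
# ---     targets = ['a', 'b', 'c'];  loads = [0, 1, 0]
# ---     add_job(0)   # engine 'a' receives the task
# ---     # now targets == ['b', 'c', 'a'] and loads == [1, 0, 1]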
628 630
629 631 def finish_job(self, idx):
630 632 """Called after self.targets[idx] just finished a job.
631 633 Override in subclasses."""
632 634 self.loads[idx] -= 1
633 635
634 636
635 637
636 638 def launch_scheduler(in_addr, out_addr, mon_addr, not_addr, config=None,logname='ZMQ',
637 log_addr=None, loglevel=logging.DEBUG,
639 log_url=None, loglevel=logging.DEBUG,
638 640 identity=b'task'):
639 641 from zmq.eventloop import ioloop
640 642 from zmq.eventloop.zmqstream import ZMQStream
641 643
642 644 if config:
643 645 # unwrap dict back into Config
644 646 config = Config(config)
645 647
646 648 ctx = zmq.Context()
647 649 loop = ioloop.IOLoop()
648 650 ins = ZMQStream(ctx.socket(zmq.XREP),loop)
649 651 ins.setsockopt(zmq.IDENTITY, identity)
650 652 ins.bind(in_addr)
651 653
652 654 outs = ZMQStream(ctx.socket(zmq.XREP),loop)
653 655 outs.setsockopt(zmq.IDENTITY, identity)
654 656 outs.bind(out_addr)
655 657 mons = ZMQStream(ctx.socket(zmq.PUB),loop)
656 658 mons.connect(mon_addr)
657 659 nots = ZMQStream(ctx.socket(zmq.SUB),loop)
658 660 nots.setsockopt(zmq.SUBSCRIBE, '')
659 661 nots.connect(not_addr)
660 662
661 # scheme = globals().get(scheme, None)
662 # setup logging
663 if log_addr:
664 connect_logger(logname, ctx, log_addr, root="scheduler", loglevel=loglevel)
663 # setup logging. Note that these will not work in-process, because they clobber
664 # existing loggers.
665 if log_url:
666 connect_logger(logname, ctx, log_url, root="scheduler", loglevel=loglevel)
665 667 else:
666 668 local_logger(logname, loglevel)
667 669
668 670 scheduler = TaskScheduler(client_stream=ins, engine_stream=outs,
669 671 mon_stream=mons, notifier_stream=nots,
670 672 loop=loop, logname=logname,
671 673 config=config)
672 674 scheduler.start()
673 675 try:
674 676 loop.start()
675 677 except KeyboardInterrupt:
676 678 print ("interrupted, exiting...", file=sys.__stderr__)
677 679
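# --- Editor's sketch (not part of this diff): launching a standalone scheduler
# --- process. All addresses below are hypothetical; in practice ipcontroller
# --- computes them and forwards the hub's log_url so scheduler output is forwarded.
def _example_launch():
    launch_scheduler(
        in_addr='tcp://127.0.0.1:10101',    # client-facing XREP
        out_addr='tcp://127.0.0.1:10102',   # engine-facing XREP
        mon_addr='tcp://127.0.0.1:10103',   # hub monitor PUB
        not_addr='tcp://127.0.0.1:10104',   # hub notification SUB
        log_url=None,                       # None -> local_logger; else connect_logger
        loglevel=logging.DEBUG,
    )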