upstream/ipython Commit - r4725:7bde2f38

use ROUTER/DEALER socket names instead of XREP/XREQ...

MinRK -

r4725:7bde2f38

parent child

IPython/parallel/__init__.py

0 +5 -11

             """The IPython ZMQ-based parallel computing interface.
             Authors:
             * MinRK
             """
             #-----------------------------------------------------------------------------
             #  Copyright (C) 2011 The IPython Development Team
             #
             #  Distributed under the terms of the BSD License.  The full license is in
             #  the file COPYING, distributed as part of this software.
             #-----------------------------------------------------------------------------
             #-----------------------------------------------------------------------------
             # Imports
             #-----------------------------------------------------------------------------
             import os
             import warnings
             import zmq
+            from IPython.zmq import check_for_zmq
             if os.name == 'nt':
-                if zmq.__version__ < '2.1.7':
+                min_pyzmq = '2.1.7'
-                    raise ImportError("IPython.parallel requires pyzmq/0MQ >= 2.1.7 on Windows, "
+            else:
-                    "and you appear to have %s"%zmq.__version__)
+                min_pyzmq = '2.1.4'
-            elif zmq.__version__ < '2.1.4':
-                raise ImportError("IPython.parallel requires pyzmq/0MQ >= 2.1.4, you appear to have %s"%zmq.__version__)
-            if zmq.zmq_version() >= '3.0.0':
-                warnings.warn("""libzmq 3 detected.
-                It is unlikely that IPython's zmq code will work properly.
-                Please install libzmq stable, which is 2.1.x or 2.2.x""",
-                RuntimeWarning)
+            check_for_zmq(min_pyzmq, 'IPython.parallel')
             from IPython.utils.pickleutil import Reference
             from .client.asyncresult import *
             from .client.client import Client
             from .client.remotefunction import *
             from .client.view import *
             from .controller.dependency import *

IPython/parallel/apps/ipcontrollerapp.py

0 +3 -3

             #!/usr/bin/env python
             # encoding: utf-8
             """
             The IPython controller application.
             Authors:
             * Brian Granger
             * MinRK
             """
             #-----------------------------------------------------------------------------
             #  Copyright (C) 2008-2011  The IPython Development Team
             #
             #  Distributed under the terms of the BSD License.  The full license is in
             #  the file COPYING, distributed as part of this software.
             #-----------------------------------------------------------------------------
             #-----------------------------------------------------------------------------
             # Imports
             #-----------------------------------------------------------------------------
             from __future__ import with_statement
             import os
             import socket
             import stat
             import sys
             import uuid
             from multiprocessing import Process
             import zmq
             from zmq.devices import ProcessMonitoredQueue
             from zmq.log.handlers import PUBHandler
             from zmq.utils import jsonapi as json
             from IPython.config.application import boolean_flag
             from IPython.core.profiledir import ProfileDir
             from IPython.parallel.apps.baseapp import (
                 BaseParallelApplication,
                 base_aliases,
                 base_flags,
             )
             from IPython.utils.importstring import import_item
             from IPython.utils.traitlets import Instance, Unicode, Bool, List, Dict
             # from IPython.parallel.controller.controller import ControllerFactory
             from IPython.zmq.session import Session
             from IPython.parallel.controller.heartmonitor import HeartMonitor
             from IPython.parallel.controller.hub import HubFactory
             from IPython.parallel.controller.scheduler import TaskScheduler,launch_scheduler
             from IPython.parallel.controller.sqlitedb import SQLiteDB
             from IPython.parallel.util import signal_children, split_url, asbytes
             # conditional import of MongoDB backend class
             try:
                 from IPython.parallel.controller.mongodb import MongoDB
             except ImportError:
                 maybe_mongo = []
             else:
                 maybe_mongo = [MongoDB]
             #-----------------------------------------------------------------------------
             # Module level variables
             #-----------------------------------------------------------------------------
             #: The default config file name for this application
             default_config_file_name = u'ipcontroller_config.py'
             _description = """Start the IPython controller for parallel computing.
             The IPython controller provides a gateway between the IPython engines and
             clients. The controller needs to be started before the engines and can be
             configured using command line options or using a cluster directory. Cluster
             directories contain config, log and security files and are usually located in
             your ipython directory and named as "profile_name". See the `profile`
             and `profile-dir` options for details.
             """
             _examples = """
             ipcontroller --ip=192.168.0.1 --port=1000  # listen on ip, port for engines
             ipcontroller --scheme=pure  # use the pure zeromq scheduler
             """
             #-----------------------------------------------------------------------------
             # The main application
             #-----------------------------------------------------------------------------
             # Command-line flags: start from the flags shared by all parallel apps and
             # add the controller-specific switches on top.
             flags = dict(base_flags)
             flags['usethreads'] = (
                 {'IPControllerApp' : {'use_threads' : True}},
                 'Use threads instead of processes for the schedulers',
             )
             flags['sqlitedb'] = (
                 {'HubFactory' : {'db_class' : 'IPython.parallel.controller.sqlitedb.SQLiteDB'}},
                 'use the SQLiteDB backend',
             )
             flags['mongodb'] = (
                 {'HubFactory' : {'db_class' : 'IPython.parallel.controller.mongodb.MongoDB'}},
                 'use the MongoDB backend',
             )
             flags['dictdb'] = (
                 {'HubFactory' : {'db_class' : 'IPython.parallel.controller.dictdb.DictDB'}},
                 'use the in-memory DictDB backend',
             )
             flags['reuse'] = (
                 {'IPControllerApp' : {'reuse_files' : True}},
                 'reuse existing json connection files',
             )
             # paired flags for switching IPControllerApp.secure on and off
             flags.update(boolean_flag(
                 'secure', 'IPControllerApp.secure',
                 "Use HMAC digests for authentication of messages.",
                 "Don't authenticate messages.",
             ))
             # Command-line aliases: short option name -> configurable trait.
             # Entries from base_aliases are applied last and therefore win on conflict.
             aliases = {
                 'secure' : 'IPControllerApp.secure',
                 'ssh' : 'IPControllerApp.ssh_server',
                 'enginessh' : 'IPControllerApp.engine_ssh_server',
                 'location' : 'IPControllerApp.location',
                 'ident' : 'Session.session',
                 'user' : 'Session.username',
                 'keyfile' : 'Session.keyfile',
                 'url' : 'HubFactory.url',
                 'ip' : 'HubFactory.ip',
                 'transport' : 'HubFactory.transport',
                 'port' : 'HubFactory.regport',
                 'ping' : 'HeartMonitor.period',
                 'scheme' : 'TaskScheduler.scheme_name',
                 'hwm' : 'TaskScheduler.hwm',
             }
             aliases.update(base_aliases)
             class IPControllerApp(BaseParallelApplication):
                 name = u'ipcontroller'
                 description = _description
                 examples = _examples
                 config_file_name = Unicode(default_config_file_name)
                 classes = [ProfileDir, Session, HubFactory, TaskScheduler, HeartMonitor, SQLiteDB] + maybe_mongo
                 # change default to True
                 auto_create = Bool(True, config=True,
                     help="""Whether to create profile dir if it doesn't exist.""")
                 reuse_files = Bool(False, config=True,
                     help='Whether to reuse existing json connection files.'
                 )
                 secure = Bool(True, config=True,
                     help='Whether to use HMAC digests for extra message authentication.'
                 )
                 ssh_server = Unicode(u'', config=True,
                     help="""ssh url for clients to use when connecting to the Controller
                     processes. It should be of the form: [user@]server[:port]. The
                     Controller's listening addresses must be accessible from the ssh server""",
                 )
                 engine_ssh_server = Unicode(u'', config=True,
                     help="""ssh url for engines to use when connecting to the Controller
                     processes. It should be of the form: [user@]server[:port]. The
                     Controller's listening addresses must be accessible from the ssh server""",
                 )
                 location = Unicode(u'', config=True,
                     help="""The external IP or domain name of the Controller, used for disambiguating
                     engine and client connections.""",
                 )
                 import_statements = List([], config=True,
                     help="import statements to be run at startup.  Necessary in some environments"
                 )
                 use_threads = Bool(False, config=True,
                     help='Use threads instead of processes for the schedulers',
                     )
                 # internal
                 children = List()
                 mq_class = Unicode('zmq.devices.ProcessMonitoredQueue')
                 def _use_threads_changed(self, name, old, new):
                     """Point `mq_class` at the Thread or Process flavour of MonitoredQueue.

                     Presumably invoked by the traitlets machinery when `use_threads`
                     changes (naming convention; not visible here).  Only `new` is used.
                     """
                     flavour = 'Thread' if new else 'Process'
                     self.mq_class = 'zmq.devices.%sMonitoredQueue' % flavour
                 aliases = Dict(aliases)
                 flags = Dict(flags)
                 def save_connection_dict(self, fname, cdict):
                     """Write the connection dict `cdict` as JSON into the security dir.

                     If `cdict['location']` is empty and `cdict['url']` is accepted by
                     `split_url`, the location is filled in (in `cdict` itself) with an
                     address looked up for this host, falling back to '127.0.0.1' with a
                     warning.  The file is created as `fname` inside
                     `self.profile_dir.security_dir` and then restricted to owner
                     read/write.
                     """
                     url = cdict['url']
                     where = cdict['location']
                     if not where:
                         try:
                             # called for validation only; the parsed pieces are not needed
                             split_url(url)
                         except AssertionError:
                             # url rejected by split_url: leave the location untouched
                             pass
                         else:
                             try:
                                 # last address reported for our own hostname
                                 addresses = socket.gethostbyname_ex(socket.gethostname())[2]
                                 where = addresses[-1]
                             except (socket.gaierror, IndexError):
                                 self.log.warn("Could not identify this machine's IP, assuming 127.0.0.1."
                                 " You may need to specify '--location=<external_ip_address>' to help"
                                 " IPython decide when to connect via loopback.")
                                 where = '127.0.0.1'
                         cdict['location'] = where
                     path = os.path.join(self.profile_dir.security_dir, fname)
                     with open(path, 'wb') as f:
                         f.write(json.dumps(cdict, indent=2))
                     # connection files contain the exec key: owner-only access
                     os.chmod(path, stat.S_IRUSR|stat.S_IWUSR)
                 def load_config_from_json(self):
                     """Populate the config from previously written JSON connection files.

                     Reads 'ipcontroller-engine.json' and then 'ipcontroller-client.json'
                     from the profile's security dir, copying the exec key, transports,
                     IPs, registration port, location and (unless already set) the ssh
                     servers into `self.config` / `self`.

                     Raises AssertionError if the two files disagree on the exec key or
                     on the registration port.  Errors from opening the files are not
                     handled here.
                     """
                     config = self.config
                     sec_dir = self.profile_dir.security_dir

                     # --- engine-side connection info ---
                     with open(os.path.join(sec_dir, 'ipcontroller-engine.json')) as f:
                         engine_cfg = json.loads(f.read())
                     key = asbytes(engine_cfg['exec_key'])
                     config.Session.key = key
                     transport, address = engine_cfg['url'].split('://')
                     config.HubFactory.engine_transport = transport
                     host, port = address.split(':')
                     config.HubFactory.engine_ip = host
                     config.HubFactory.regport = int(port)
                     self.location = engine_cfg['location']
                     if not self.engine_ssh_server:
                         self.engine_ssh_server = engine_cfg['ssh']

                     # --- client-side connection info ---
                     with open(os.path.join(sec_dir, 'ipcontroller-client.json')) as f:
                         client_cfg = json.loads(f.read())
                     assert key == client_cfg['exec_key'], "exec_key mismatch between engine and client keys"
                     transport, address = client_cfg['url'].split('://')
                     config.HubFactory.client_transport = transport
                     host, port = address.split(':')
                     config.HubFactory.client_ip = host
                     if not self.ssh_server:
                         self.ssh_server = client_cfg['ssh']
                     # both files must point at the same registration port
                     assert int(port) == config.HubFactory.regport, "regport mismatch"
                 def init_hub(self):
                     """Construct the Hub and, unless reusing them, write the connection files.

                     Steps:

                     1. run the configured import statements;
                     2. if `reuse_files` is set, try to reload key and addresses from the
                        existing JSON files; an AssertionError or IOError there silently
                        falls back to generating fresh settings;
                     3. otherwise pick the session key: a random uuid4 string when
                        `secure` is set, an empty key when it is not;
                     4. build the HubFactory and initialise it; any failure is logged and
                        the application exits with status 1;
                     5. when not reusing, save 'ipcontroller-client.json' and
                        'ipcontroller-engine.json' via `save_connection_dict`.
                     """
                     c = self.config
                     self.do_import_statements()
                     reusing = self.reuse_files
                     if reusing:
                         try:
                             self.load_config_from_json()
                         except (AssertionError,IOError):
                             # files missing or inconsistent: generate new ones instead
                             reusing=False
                     # check again, because reusing may have failed:
                     if reusing:
                         pass
                     elif self.secure:
                         key = str(uuid.uuid4())
                         c.Session.key = asbytes(key)
                     else:
                         key = c.Session.key = b''
                     try:
                         self.factory = HubFactory(config=c, log=self.log)
                         self.factory.init_hub()
                     except:
                         # deliberately broad: whatever went wrong, report it and stop
                         self.log.error("Couldn't construct the Controller", exc_info=True)
                         self.exit(1)
                     if not reusing:
                         # save to new json config files
                         f = self.factory
                         cdict = {'exec_key' : key,
                                 'ssh' : self.ssh_server,
                                 'url' : "%s://%s:%s"%(f.client_transport, f.client_ip, f.regport),
                                 'location' : self.location
                                 }
                         self.save_connection_dict('ipcontroller-client.json', cdict)
                         # The engine file shares key and location (including any location
                         # filled in by the call above) but must advertise the *engine*
                         # transport/ip, matching what load_config_from_json reads back
                         # and what save_urls writes.
                         edict = dict(cdict)
                         edict['url'] = "%s://%s:%s"%(f.engine_transport, f.engine_ip, f.regport)
                         edict['ssh'] = self.engine_ssh_server
                         self.save_connection_dict('ipcontroller-engine.json', edict)
                 #
                 def init_schedulers(self):
                     """Set up the relay queues and the task scheduler for the Hub.

                     Creates one monitored queue each for IOPub, the multiplexer (mux)
                     and control channels, plus a task queue or Python scheduler chosen
                     by the `TaskScheduler.scheme_name` setting.  Queues and scheduler
                     processes are appended to `self.children`; nothing appended here is
                     started in this method.  The one exception is the non-Process
                     (threaded) Python scheduler, which is launched immediately via
                     `launch_scheduler`.
                     """
                     children = self.children
                     # queue class named by mq_class (Thread- or Process-MonitoredQueue)
                     mq = import_item(str(self.mq_class))
                     hub = self.factory
                     # maybe_inproc = 'inproc://monitor' if self.use_threads else self.monitor_url
                     # IOPub relay (in a Process)
                     q = mq(zmq.PUB, zmq.SUB, zmq.PUB, b'N/A',b'iopub')
                     q.bind_in(hub.client_info['iopub'])
                     q.bind_out(hub.engine_info['iopub'])
                     # empty prefix: subscribe the SUB side to every message
                     q.setsockopt_out(zmq.SUBSCRIBE, b'')
                     q.connect_mon(hub.monitor_url)
                     q.daemon=True
                     children.append(q)
                     # Multiplexer Queue (in a Process)
-                    q = mq(zmq.XREP, zmq.XREP, zmq.PUB, b'in', b'out')
+                    q = mq(zmq.ROUTER, zmq.ROUTER, zmq.PUB, b'in', b'out')
                     q.bind_in(hub.client_info['mux'])
                     q.setsockopt_in(zmq.IDENTITY, b'mux')
                     q.bind_out(hub.engine_info['mux'])
                     q.connect_mon(hub.monitor_url)
                     q.daemon=True
                     children.append(q)
                     # Control Queue (in a Process)
-                    q = mq(zmq.XREP, zmq.XREP, zmq.PUB, b'incontrol', b'outcontrol')
+                    q = mq(zmq.ROUTER, zmq.ROUTER, zmq.PUB, b'incontrol', b'outcontrol')
                     q.bind_in(hub.client_info['control'])
                     q.setsockopt_in(zmq.IDENTITY, b'control')
                     q.bind_out(hub.engine_info['control'])
                     q.connect_mon(hub.monitor_url)
                     q.daemon=True
                     children.append(q)
                     # scheme comes from the config if set there, else the trait's default
                     try:
                         scheme = self.config.TaskScheduler.scheme_name
                     except AttributeError:
                         scheme = TaskScheduler.scheme_name.get_default_value()
                     # Task Queue (in a Process)
                     if scheme == 'pure':
                         # NOTE(review): the message below still says XREQ although the
                         # socket constant is spelled DEALER after this change.
                         self.log.warn("task::using pure XREQ Task scheduler")
-                        q = mq(zmq.XREP, zmq.XREQ, zmq.PUB, b'intask', b'outtask')
+                        q = mq(zmq.ROUTER, zmq.DEALER, zmq.PUB, b'intask', b'outtask')
                         # q.setsockopt_out(zmq.HWM, hub.hwm)
                         q.bind_in(hub.client_info['task'][1])
                         q.setsockopt_in(zmq.IDENTITY, b'task')
                         q.bind_out(hub.engine_info['task'])
                         q.connect_mon(hub.monitor_url)
                         q.daemon=True
                         children.append(q)
                     elif scheme == 'none':
                         # no task queue or scheduler is created at all
                         self.log.warn("task::using no Task scheduler")
                     else:
                         self.log.info("task::using Python %s Task scheduler"%scheme)
                         # positional args for launch_scheduler: client-side task url,
                         # engine-side task url, monitor url, notification url
                         sargs = (hub.client_info['task'][1], hub.engine_info['task'],
                                             hub.monitor_url, hub.client_info['notification'])
                         kwargs = dict(logname='scheduler', loglevel=self.log_level,
                                         log_url = self.log_url, config=dict(self.config))
                         if 'Process' in self.mq_class:
                             # run the Python scheduler in a Process
                             q = Process(target=launch_scheduler, args=sargs, kwargs=kwargs)
                             q.daemon=True
                             children.append(q)
                         else:
                             # single-threaded Controller
                             kwargs['in_thread'] = True
                             launch_scheduler(*sargs, **kwargs)
                 def save_urls(self):
                     """Write the engine and client registration urls to '.url' files.

                     Each file lands in the profile's security dir and holds a single
                     '<transport>://<ip>:<regport>' string taken from the hub factory.
                     """
                     sec_dir = self.profile_dir.security_dir
                     factory = self.factory
                     # (file name, factory attribute for transport, factory attribute for ip)
                     targets = (
                         ('ipcontroller-engine.url', 'engine_transport', 'engine_ip'),
                         ('ipcontroller-client.url', 'client_transport', 'client_ip'),
                     )
                     for url_file, transport_attr, ip_attr in targets:
                         with open(os.path.join(sec_dir, url_file), 'w') as f:
                             transport = getattr(factory, transport_attr)
                             ip = getattr(factory, ip_attr)
                             f.write("%s://%s:%s"%(transport, ip, factory.regport))
                 def do_import_statements(self):
                     """Execute each configured `import_statements` entry, best effort.

                     Every statement is announced on the application log and then
                     executed against this module's globals and the method's locals.  A
                     failing statement is logged with its traceback and skipped, so one
                     bad entry does not prevent the controller from starting.
                     """
                     for s in self.import_statements:
                         try:
                             # self.log is a logging-style logger (it is used with
                             # info/warn/error elsewhere in this class); it has no `msg`.
                             self.log.info("Executing statement: '%s'" % s)
                             # NOTE: executes arbitrary code taken from the configuration.
                             # Tuple form of exec: valid on both Python 2 and Python 3.
                             exec(s, globals(), locals())
                         except Exception:
                             self.log.error("Error running statement: %s" % s, exc_info=True)
                 def forward_logging(self):
                     """Swap the current log handler for a zmq PUB handler on `log_url`.

                     Does nothing when `log_url` is empty.  Otherwise a PUB socket is
                     connected to `log_url`, wrapped in a PUBHandler with root topic
                     'controller' and the app's log level, and installed in place of
                     `self._log_handler`.
                     """
                     log_url = self.log_url
                     if not log_url:
                         return
                     # announced through the old handler, before it is replaced
                     self.log.info("Forwarding logging to %s"%log_url)
                     pub_socket = zmq.Context.instance().socket(zmq.PUB)
                     pub_socket.connect(log_url)
                     pub_handler = PUBHandler(pub_socket)
                     self.log.removeHandler(self._log_handler)
                     pub_handler.root_topic = 'controller'
                     pub_handler.setLevel(self.log_level)
                     self.log.addHandler(pub_handler)
                     self._log_handler = pub_handler
                 # #
                 def initialize(self, argv=None):
                     """Run the base-class initialisation, then the controller setup steps.

                     After the parent `initialize(argv)`, log forwarding, Hub construction
                     and scheduler setup are performed in that order.
                     """
                     super(IPControllerApp, self).initialize(argv)
                     setup_steps = (self.forward_logging, self.init_hub, self.init_schedulers)
                     for step in setup_steps:
                         step()
                 def start(self):
                     """Start the hub factory and all children, then run the event loop.

                     Children that are ProcessMonitoredQueues (via their `launcher`) or
                     multiprocessing Processes are collected and handed to
                     `signal_children`.  The pid file is (over)written before the loop
                     starts.  A KeyboardInterrupt in the loop is logged, not re-raised.
                     """
                     self.factory.start()
                     # Start the subprocesses, remembering the ones that are real processes
                     procs_to_signal = []
                     for child in self.children:
                         child.start()
                         if isinstance(child, ProcessMonitoredQueue):
                             proc = child.launcher
                         elif isinstance(child, Process):
                             proc = child
                         else:
                             # any other kind of child is not a separate process to signal
                             continue
                         procs_to_signal.append(proc)
                     if procs_to_signal:
                         signal_children(procs_to_signal)
                     self.write_pid_file(overwrite=True)
                     try:
                         self.factory.loop.start()
                     except KeyboardInterrupt:
                         self.log.critical("Interrupted, Exiting...\n")
             def launch_new_instance():
                 """Create, initialize and start the IPython controller application.

                 On Windows this returns immediately, without starting anything, when
                 called from a multiprocessing child process.
                 """
                 if sys.platform == 'win32':
                     # Windows has no proper fork, so a multiprocessing child can end up
                     # back in this entry point; starting a Controller there would spawn
                     # Controllers without end.  This only comes up when IPython has
                     # been installed using vanilla setuptools, and *not* distribute.
                     import multiprocessing
                     # the main process is named 'MainProcess'; children get names
                     # like 'Process-1'
                     in_child = multiprocessing.current_process().name != 'MainProcess'
                     if in_child:
                         return
                 controller = IPControllerApp.instance()
                 controller.initialize()
                 controller.start()
             if __name__ == '__main__':
                 launch_new_instance()

IPython/parallel/client/client.py

0 +5 -5

             """A semi-synchronous Client for the ZMQ cluster
             Authors:
             * MinRK
             """
             #-----------------------------------------------------------------------------
             #  Copyright (C) 2010-2011  The IPython Development Team
             #
             #  Distributed under the terms of the BSD License.  The full license is in
             #  the file COPYING, distributed as part of this software.
             #-----------------------------------------------------------------------------
             #-----------------------------------------------------------------------------
             # Imports
             #-----------------------------------------------------------------------------
             import os
             import json
             import sys
             import time
             import warnings
             from datetime import datetime
             from getpass import getpass
             from pprint import pprint
             pjoin = os.path.join
             import zmq
             # from zmq.eventloop import ioloop, zmqstream
             from IPython.config.configurable import MultipleInstanceError
             from IPython.core.application import BaseIPythonApplication
             from IPython.utils.jsonutil import rekey
             from IPython.utils.localinterfaces import LOCAL_IPS
             from IPython.utils.path import get_ipython_dir
             from IPython.utils.traitlets import (HasTraits, Int, Instance, Unicode,
                                                 Dict, List, Bool, Set)
             from IPython.external.decorator import decorator
             from IPython.external.ssh import tunnel
             from IPython.parallel import error
             from IPython.parallel import util
             from IPython.zmq.session import Session, Message
             from .asyncresult import AsyncResult, AsyncHubResult
             from IPython.core.profiledir import ProfileDir, ProfileDirError
             from .view import DirectView, LoadBalancedView
             if sys.version_info[0] >= 3:
                 # xrange is used in a couple 'isinstance' tests in py2
                 # should be just 'range' in 3k
                 xrange = range
             #--------------------------------------------------------------------------
             # Decorators for Client methods
             #--------------------------------------------------------------------------
             @decorator
             def spin_first(f, self, *args, **kwargs):
                 """Run `self.spin()` before delegating to the wrapped method `f`.

                 Returns whatever `f(self, *args, **kwargs)` returns.
                 """
                 self.spin()
                 result = f(self, *args, **kwargs)
                 return result
             #--------------------------------------------------------------------------
             # Classes
             #--------------------------------------------------------------------------
             class Metadata(dict):
                 """Subclass of dict for initializing metadata values.

                 Every instance starts out with the same fixed set of keys, each set
                 to None (or '' for 'stdout' and 'stderr') unless overridden through the
                 constructor arguments.

                 Attribute access works on keys.

                 These objects have a strict set of keys: assigning to a key that is
                 not already present raises KeyError (item syntax) or AttributeError
                 (attribute syntax).
                 """
                 def __init__(self, *args, **kwargs):
                     """Create the default entries, then apply `dict(*args, **kwargs)`."""
                     dict.__init__(self)
                     md = {'msg_id' : None,
                           'submitted' : None,
                           'started' : None,
                           'completed' : None,
                           'received' : None,
                           'engine_uuid' : None,
                           'engine_id' : None,
                           'follow' : None,
                           'after' : None,
                           'status' : None,
                           'pyin' : None,
                           'pyout' : None,
                           'pyerr' : None,
                           'stdout' : '',
                           'stderr' : '',
                         }
                     self.update(md)
                     self.update(dict(*args, **kwargs))
                 # Membership is tested with `key in self` rather than
                 # `key in self.iterkeys()`: it is a hash lookup instead of a scan, and it
                 # also works on Python 3, where dict has no iterkeys() and looking it up
                 # would re-enter __getattr__ and recurse without end.
                 def __getattr__(self, key):
                     """getattr aliased to getitem; AttributeError for unknown keys"""
                     if key in self:
                         return self[key]
                     else:
                         raise AttributeError(key)
                 def __setattr__(self, key, value):
                     """setattr aliased to setitem, with strict; AttributeError for unknown keys"""
                     if key in self:
                         self[key] = value
                     else:
                         raise AttributeError(key)
                 def __setitem__(self, key, value):
                     """strict static key enforcement; KeyError for unknown keys"""
                     if key in self:
                         dict.__setitem__(self, key, value)
                     else:
                         raise KeyError(key)
             class Client(HasTraits):
                 """A semi-synchronous client to the IPython ZMQ cluster
                 Parameters
                 ----------
                 url_or_file : bytes or unicode; zmq url or path to ipcontroller-client.json
                     Connection information for the Hub's registration.  If a json connector
                     file is given, then likely no further configuration is necessary.
                     [Default: use profile]
                 profile : bytes
                     The name of the Cluster profile to be used to find connector information.
                     If run from an IPython application, the default profile will be the same
                     as the running application, otherwise it will be 'default'.
                 context : zmq.Context
                     Pass an existing zmq.Context instance, otherwise the client will create its own.
                 debug : bool
                     flag for lots of message printing for debug purposes
                 timeout : int/float
                     time (in seconds) to wait for connection replies from the Hub
                     [Default: 10]
                 #-------------- session related args ----------------
                 config : Config object
                     If specified, this will be relayed to the Session for configuration
                 username : str
                     set username for the session object
                 packer : str (import_string) or callable
                     Can be either the simple keyword 'json' or 'pickle', or an import_string to a
                     function to serialize messages. Must support same input as
                     JSON, and output must be bytes.
                     You can pass a callable directly as `pack`
                 unpacker : str (import_string) or callable
                     The inverse of packer.  Only necessary if packer is specified as *not* one
                     of 'json' or 'pickle'.
                 #-------------- ssh related args ----------------
                 # These are args for configuring the ssh tunnel to be used
                 # credentials are used to forward connections over ssh to the Controller
                 # Note that the ip given in `addr` needs to be relative to sshserver
                 # The most basic case is to leave addr as pointing to localhost (127.0.0.1),
                 # and set sshserver as the same machine the Controller is on. However,
                 # the only requirement is that sshserver is able to see the Controller
                 # (i.e. is within the same trusted network).
                 sshserver : str
                     A string of the form passed to ssh, i.e. 'server.tld' or 'user@server.tld:port'
                     If keyfile or password is specified, and this is not, it will default to
                     the ip given in addr.
                 sshkey : str; path to ssh private key file
                     This specifies a key to be used in ssh login, default None.
                     Regular default ssh keys will be used without specifying this argument.
                 password : str
                     Your ssh password to sshserver. Note that if this is left None,
                     you will be prompted for it if passwordless key based login is unavailable.
                 paramiko : bool
                     flag for whether to use paramiko instead of shell ssh for tunneling.
                     [default: True on win32, False else]
                 ------- exec authentication args -------
                 If even localhost is untrusted, you can have some protection against
                 unauthorized execution by signing messages with HMAC digests.
                 Messages are still sent as cleartext, so if someone can snoop your
                 loopback traffic this will not protect your privacy, but will prevent
                 unauthorized execution.
                 exec_key : str
                     an authentication key or file containing a key
                     default: None
                 Attributes
                 ----------
                 ids : list of int engine IDs
                     requesting the ids attribute always synchronizes
                     the registration state. To request ids without synchronization,
                     use semi-private _ids attributes.
                 history : list of msg_ids
                     a list of msg_ids, keeping track of all the execution
                     messages you have submitted in order.
                 outstanding : set of msg_ids
                     a set of msg_ids that have been submitted, but whose
                     results have not yet been received.
                 results : dict
                     a dict of all our results, keyed by msg_id
                 block : bool
                     determines default behavior when block not specified
                     in execution methods
                 Methods
                 -------
                 spin
                     flushes incoming results and registration state changes;
                     control methods spin first, and requesting `ids` also ensures the state is up to date
                 wait
                     wait on one or more msg_ids
                 execution methods
                     apply
                     legacy: execute, run
                 data movement
                     push, pull, scatter, gather
                 query methods
                     queue_status, get_result, purge, result_status
                 control methods
                     abort, shutdown
                 """
                 # default blocking behavior for execution methods when `block` is not given
                 block = Bool(False)
                 # msg_ids that have been submitted but whose results have not yet been received
                 outstanding = Set()
                 # results keyed by msg_id
                 results = Instance('collections.defaultdict', (dict,))
                 # per-message metadata keyed by msg_id
                 # (presumably the tuple is the defaultdict's constructor args, i.e. its factory)
                 metadata = Instance('collections.defaultdict', (Metadata,))
                 # msg_ids of the execution messages submitted so far, in order
                 history = List()
                 # when True, incoming messages are pretty-printed as they are received
                 debug = Bool(False)
                 # IPython profile name; see _profile_default for how the default is chosen
                 profile=Unicode()
                 def _profile_default(self):
                     """Pick the default profile name.

                     Uses the profile of an already-initialized IPython application when
                     one can be obtained, and falls back to u'default' otherwise.
                     """
                     fallback = u'default'
                     if not BaseIPythonApplication.initialized():
                         return fallback
                     # an IPython app *might* be running, try to get its profile
                     try:
                         app = BaseIPythonApplication.instance()
                         return app.profile
                     except (AttributeError, MultipleInstanceError):
                         # could be a *different* subclass of config.Application,
                         # which would raise one of these two errors.
                         return fallback
                 # outstanding msg_ids grouped per engine, looked up by engine uuid
                 _outstanding_dict = Instance('collections.defaultdict', (set,))
                 # sorted list of registered integer engine ids (maintained by _update_engines)
                 _ids = List()
                 # set to True once _connect has run, reset if the hub refuses the connection
                 _connected=Bool(False)
                 # True when connections are tunneled over ssh
                 _ssh=Bool(False)
                 # zmq context used to create every socket of this client
                 _context = Instance('zmq.Context')
                 # connection configuration (url, location, ssh, exec_key, registration reply)
                 _config = Dict()
                 # engine id <-> engine uuid mapping; queried in both directions in this class
                 _engines=Instance(util.ReverseDict, (), {})
                 # _hub_socket=Instance('zmq.Socket')
                 # sockets to the hub and schedulers; those for advertised channels are created in _connect
                 _query_socket=Instance('zmq.Socket')
                 _control_socket=Instance('zmq.Socket')
                 _iopub_socket=Instance('zmq.Socket')
                 _notification_socket=Instance('zmq.Socket')
                 _mux_socket=Instance('zmq.Socket')
                 _task_socket=Instance('zmq.Socket')
                 # task scheduler scheme reported by the hub; 'pure' disables task farming
                 # once an engine unregisters (see _stop_scheduling_tasks)
                 _task_scheme=Unicode()
                 # plain class attribute (not a trait); set to True by close()
                 _closed = False
                 # number of control-channel replies still to be received and discarded
                 _ignored_control_replies=Int(0)
                 # NOTE(review): presumably the hub-channel counterpart of the counter above;
                 # it is not read in this part of the file -- confirm
                 _ignored_hub_replies=Int(0)
                 def __new__(self, *args, **kw):
                     """Allocate the instance without handing positional args to HasTraits.

                     Only keyword arguments are forwarded, so positional arguments
                     (accepted by __init__) do not make HasTraits.__new__ raise.
                     """
                     instance = HasTraits.__new__(self, **kw)
                     return instance
                 def __init__(self, url_or_file=None, profile=None, profile_dir=None, ipython_dir=None,
                         context=None, debug=False, exec_key=None,
                         sshserver=None, sshkey=None, password=None, paramiko=None,
                         timeout=10, **extra_args
                         ):
                     """Resolve the connection info, set up ssh/signing options and connect.

                     The hub is located either from `url_or_file` (a url, or the path of a
                     JSON connection file) or, when that is None, from the
                     'ipcontroller-client.json' file in the profile's security dir.
                     A query socket to the hub is then created and `_connect` performs
                     the rest of the handshake, waiting up to `timeout` seconds.
                     Remaining keyword arguments are passed on to `Session`.
                     """
                     if profile:
                         super(Client, self).__init__(debug=debug, profile=profile)
                     else:
                         super(Client, self).__init__(debug=debug)
                     if context is None:
                         context = zmq.Context.instance()
                     self._context = context
                     self._setup_profile_dir(self.profile, profile_dir, ipython_dir)
                     if self._cd is not None:
                         if url_or_file is None:
                             url_or_file = pjoin(self._cd.security_dir, 'ipcontroller-client.json')
                     assert url_or_file is not None, "I can't find enough information to connect to a hub!"\
                         " Please specify at least one of url_or_file or profile."
                     # a valid url is used as-is; anything else is treated as a JSON connection file
                     try:
                         util.validate_url(url_or_file)
                     except AssertionError:
                         if not os.path.exists(url_or_file):
                             # retry relative to the profile's security dir
                             if self._cd:
                                 url_or_file = os.path.join(self._cd.security_dir, url_or_file)
                             assert os.path.exists(url_or_file), "Not a valid connection file or url: %r"%url_or_file
                         with open(url_or_file) as f:
                             cfg = json.loads(f.read())
                     else:
                         cfg = {'url':url_or_file}
                     # sync defaults from args, json:
                     if sshserver:
                         cfg['ssh'] = sshserver
                     if exec_key:
                         cfg['exec_key'] = exec_key
                     # NOTE(review): when cfg was built from a bare url above it only has a
                     # 'url' key, so this lookup (and the cfg['ssh'] lookups below) raises
                     # KeyError unless the matching argument was passed -- confirm whether
                     # cfg.get(...) was intended
                     exec_key = cfg['exec_key']
                     location = cfg.setdefault('location', None)
                     cfg['url'] = util.disambiguate_url(cfg['url'], location)
                     url = cfg['url']
                     proto,addr,port = util.split_url(url)
                     if location is not None and addr == '127.0.0.1':
                         # location specified, and connection is expected to be local
                         if location not in LOCAL_IPS and not sshserver:
                             # load ssh from JSON *only* if the controller is not on
                             # this machine
                             sshserver=cfg['ssh']
                         if location not in LOCAL_IPS and not sshserver:
                             # warn if no ssh specified, but SSH is probably needed
                             # This is only a warning, because the most likely cause
                             # is a local Controller on a laptop whose IP is dynamic
                             warnings.warn("""
                         Controller appears to be listening on localhost, but not on this machine.
                         If this is true, you should specify Client(...,sshserver='you@%s')
                         or instruct your controller to listen on an external IP."""%location,
                             RuntimeWarning)
                     elif not sshserver:
                         # otherwise sync with cfg
                         sshserver = cfg['ssh']
                     self._config = cfg
                     # any ssh-related argument switches tunneling on
                     self._ssh = bool(sshserver or sshkey or password)
                     if self._ssh and sshserver is None:
                         # default to ssh via localhost
                         sshserver = url.split('://')[1].split(':')[0]
                     if self._ssh and password is None:
                         # password=False marks passwordless login as working; otherwise prompt
                         if tunnel.try_passwordless_ssh(sshserver, sshkey, paramiko):
                             password=False
                         else:
                             password = getpass("SSH Password for %s: "%sshserver)
                     ssh_kwargs = dict(keyfile=sshkey, password=password, paramiko=paramiko)
                     # configure and construct the session
                     if exec_key is not None:
                         # exec_key may be the path of a key file, or the key itself
                         if os.path.isfile(exec_key):
                             extra_args['keyfile'] = exec_key
                         else:
                             exec_key = util.asbytes(exec_key)
                             extra_args['key'] = exec_key
                     self.session = Session(**extra_args)
-                    self._query_socket = self._context.socket(zmq.XREQ)
+                    self._query_socket = self._context.socket(zmq.DEALER)
                     # the session id doubles as the zmq identity of the query socket
                     self._query_socket.setsockopt(zmq.IDENTITY, util.asbytes(self.session.session))
                     if self._ssh:
                         tunnel.tunnel_connection(self._query_socket, url, sshserver, **ssh_kwargs)
                     else:
                         self._query_socket.connect(url)
                     self.session.debug = self.debug
                     # dispatch tables: msg_type -> handler, used by the _flush_* methods
                     self._notification_handlers = {'registration_notification' : self._register_engine,
                                                 'unregistration_notification' : self._unregister_engine,
                                                 'shutdown_notification' : lambda msg: self.close(),
                                                 }
                     self._queue_handlers = {'execute_reply' : self._handle_execute_reply,
                                             'apply_reply' : self._handle_apply_reply}
                     self._connect(sshserver, ssh_kwargs, timeout)
                 def __del__(self):
                     """Clean up this client's sockets via close(), but _not_ the zmq context."""
                     self.close()
                 def _setup_profile_dir(self, profile, profile_dir, ipython_dir):
                     if ipython_dir is None:
                         ipython_dir = get_ipython_dir()
                     if profile_dir is not None:
                         try:
                             self._cd = ProfileDir.find_profile_dir(profile_dir)
                             return
                         except ProfileDirError:
                             pass
                     elif profile is not None:
                         try:
                             self._cd = ProfileDir.find_profile_dir_by_name(
                                 ipython_dir, profile)
                             return
                         except ProfileDirError:
                             pass
                     self._cd = None
                 def _update_engines(self, engines):
                     """Update our engines dict and _ids from a dict of the form: {id:uuid}."""
                     for k,v in engines.iteritems():
                         eid = int(k)
                         self._engines[eid] = v
                         self._ids.append(eid)
                     self._ids = sorted(self._ids)
                     if sorted(self._engines.keys()) != range(len(self._engines)) and \
                                     self._task_scheme == 'pure' and self._task_socket:
                         self._stop_scheduling_tasks()
                 def _stop_scheduling_tasks(self):
                     """Stop scheduling tasks because an engine has been unregistered
                     from a pure ZMQ scheduler.
                     """
                     self._task_socket.close()
                     self._task_socket = None
                     msg = "An engine has been unregistered, and we are using pure " +\
                           "ZMQ task scheduling.  Task farming will be disabled."
                     if self.outstanding:
                         msg += " If you were running tasks when this happened, " +\
                                "some `outstanding` msg_ids may never resolve."
                     warnings.warn(msg, RuntimeWarning)
                 def _build_targets(self, targets):
                     """Turn valid target IDs or 'all' into two lists:
                     (idents, int_ids).

                     `idents` holds the engine identities (uuids converted with
                     util.asbytes) and `int_ids` the matching integer engine ids,
                     in the same order.

                     `targets` may be None or 'all' (every registered engine), a single
                     int (negative values index from the end of the id list), a slice
                     over the registered ids, or a tuple/list/xrange of ints.

                     Raises error.NoEnginesRegistered when no engine is registered,
                     TypeError for unsupported target types or strings other than 'all',
                     and IndexError for an unknown integer id.
                     """
                     if not self._ids:
                         # flush notification socket if no engines yet, just in case
                         if not self.ids:
                             raise error.NoEnginesRegistered("Can't build targets without any engines")
                     if targets is None:
                         targets = self._ids
                     elif isinstance(targets, basestring):
                         if targets.lower() == 'all':
                             targets = self._ids
                         else:
                             raise TypeError("%r not valid str target, must be 'all'"%(targets))
                     elif isinstance(targets, int):
                         if targets < 0:
                             # negative ints are positions in the id list, not engine ids
                             targets = self.ids[targets]
                         if targets not in self._ids:
                             raise IndexError("No such engine: %i"%targets)
                         targets = [targets]
                     if isinstance(targets, slice):
                         # apply the slice to positions, then map positions to engine ids
                         indices = range(len(self._ids))[targets]
                         ids = self.ids
                         targets = [ ids[i] for i in indices ]
                     if not isinstance(targets, (tuple, list, xrange)):
                         raise TypeError("targets by int/slice/collection of ints only, not %s"%(type(targets)))
                     # note the order: identities first, integer ids second
                     return [util.asbytes(self._engines[t]) for t in targets], list(targets)
                 def _connect(self, sshserver, ssh_kwargs, timeout):
                     """setup all our socket connections to the cluster. This is called from
                     __init__.

                     Sends a 'connection_request' on the query socket, waits up to
                     `timeout` seconds for the reply, then creates and connects one socket
                     per channel advertised in the reply (mux, task, notification, control,
                     iopub) and records the engines already registered.

                     Raises error.TimeoutError if no reply arrives in time, and Exception
                     if the reply status is not 'ok'.
                     """
                     # Maybe allow reconnecting?
                     if self._connected:
                         return
                     self._connected=True
                     def connect_socket(s, url):
                         # connect `s` to `url`, tunneling over ssh when enabled
                         url = util.disambiguate_url(url, self._config['location'])
                         if self._ssh:
                             return tunnel.tunnel_connection(s, url, sshserver, **ssh_kwargs)
                         else:
                             return s.connect(url)
                     self.session.send(self._query_socket, 'connection_request')
                     # use Poller because zmq.select has wrong units in pyzmq 2.1.7
                     poller = zmq.Poller()
                     poller.register(self._query_socket, zmq.POLLIN)
                     # poll expects milliseconds, timeout is seconds
                     evts = poller.poll(timeout*1000)
                     if not evts:
                         raise error.TimeoutError("Hub connection request timed out")
                     idents,msg = self.session.recv(self._query_socket,mode=0)
                     if self.debug:
                         pprint(msg)
                     # wrap the reply so its fields can be read as attributes below
                     msg = Message(msg)
                     content = msg.content
                     self._config['registration'] = dict(content)
                     if content.status == 'ok':
                         # every socket that sets an identity uses the session id
                         ident = util.asbytes(self.session.session)
                         if content.mux:
-                            self._mux_socket = self._context.socket(zmq.XREQ)
+                            self._mux_socket = self._context.socket(zmq.DEALER)
                             self._mux_socket.setsockopt(zmq.IDENTITY, ident)
                             connect_socket(self._mux_socket, content.mux)
                         if content.task:
                             # content.task is a (scheme, address) pair
                             self._task_scheme, task_addr = content.task
-                            self._task_socket = self._context.socket(zmq.XREQ)
+                            self._task_socket = self._context.socket(zmq.DEALER)
                             self._task_socket.setsockopt(zmq.IDENTITY, ident)
                             connect_socket(self._task_socket, task_addr)
                         if content.notification:
                             self._notification_socket = self._context.socket(zmq.SUB)
                             connect_socket(self._notification_socket, content.notification)
                             # empty prefix: subscribe to every notification
                             self._notification_socket.setsockopt(zmq.SUBSCRIBE, b'')
                         # if content.query:
-                        #     self._query_socket = self._context.socket(zmq.XREQ)
+                        #     self._query_socket = self._context.socket(zmq.DEALER)
                         #     self._query_socket.setsockopt(zmq.IDENTITY, self.session.session)
                         #     connect_socket(self._query_socket, content.query)
                         if content.control:
-                            self._control_socket = self._context.socket(zmq.XREQ)
+                            self._control_socket = self._context.socket(zmq.DEALER)
                             self._control_socket.setsockopt(zmq.IDENTITY, ident)
                             connect_socket(self._control_socket, content.control)
                         if content.iopub:
                             self._iopub_socket = self._context.socket(zmq.SUB)
                             self._iopub_socket.setsockopt(zmq.SUBSCRIBE, b'')
                             self._iopub_socket.setsockopt(zmq.IDENTITY, ident)
                             connect_socket(self._iopub_socket, content.iopub)
                         self._update_engines(dict(content.engines))
                     else:
                         # allow a later attempt: the early return above checks this flag
                         self._connected = False
                         raise Exception("Failed to connect!")
                 #--------------------------------------------------------------------------
                 # handlers and callbacks for incoming messages
                 #--------------------------------------------------------------------------
                 def _unwrap_exception(self, content):
                     """Rebuild the exception described by `content`, adding the int engine id.

                     When the unwrapped exception carries engine_info, its 'engine_uuid'
                     is looked up in self._engines and stored under 'engine_id'.
                     """
                     remote_err = error.unwrap_exception(content)
                     if not remote_err.engine_info:
                         return remote_err
                     engine_uuid = remote_err.engine_info['engine_uuid']
                     remote_err.engine_info['engine_id'] = self._engines[engine_uuid]
                     return remote_err
                 def _extract_metadata(self, header, parent, content):
                     md = {'msg_id' : parent['msg_id'],
                           'received' : datetime.now(),
                           'engine_uuid' : header.get('engine', None),
                           'follow' : parent.get('follow', []),
                           'after' : parent.get('after', []),
                           'status' : content['status'],
                         }
                     if md['engine_uuid'] is not None:
                         md['engine_id'] = self._engines.get(md['engine_uuid'], None)
                     if 'date' in parent:
                         md['submitted'] = parent['date']
                     if 'started' in header:
                         md['started'] = header['started']
                     if 'date' in header:
                         md['completed'] = header['date']
                     return md
                 def _register_engine(self, msg):
                     """Register a new engine, and update our connection info."""
                     content = msg['content']
                     eid = content['id']
                     d = {eid : content['queue']}
                     self._update_engines(d)
                 def _unregister_engine(self, msg):
                     """Unregister an engine that has died."""
                     content = msg['content']
                     eid = int(content['id'])
                     if eid in self._ids:
                         self._ids.remove(eid)
                         uuid = self._engines.pop(eid)
                         self._handle_stranded_msgs(eid, uuid)
                     if self._task_socket and self._task_scheme == 'pure':
                         self._stop_scheduling_tasks()
                 def _handle_stranded_msgs(self, eid, uuid):
                     """Fail the messages still outstanding on an engine that unregistered.

                     For every such msg_id without a result, a fake reply carrying an
                     EngineError is built and passed to _handle_apply_reply.

                     This can fire prematurely: an engine may go down right after
                     completing a result, so the client sees the unregistration first
                     and receives the successful result later.
                     """
                     stranded = list(self._outstanding_dict[uuid])
                     for msg_id in stranded:
                         if msg_id in self.results:
                             # a result was already recorded for this message
                             continue
                         try:
                             raise error.EngineError("Engine %r died while running task %r"%(eid, msg_id))
                         except:
                             # presumably wrap_exception() picks up the exception being handled
                             content = error.wrap_exception()
                         # build a fake message:
                         fake_reply = dict(
                             parent_header={'msg_id' : msg_id},
                             header={'engine' : uuid, 'date' : datetime.now()},
                             content=content
                         )
                         self._handle_apply_reply(fake_reply)
                 def _handle_execute_reply(self, msg):
                     """Save the reply to an execute_request into our results.
                     execute messages are never actually used. apply is used instead.
                     """
                     parent = msg['parent_header']
                     msg_id = parent['msg_id']
                     if msg_id not in self.outstanding:
                         if msg_id in self.history:
                             print ("got stale result: %s"%msg_id)
                         else:
                             print ("got unknown result: %s"%msg_id)
                     else:
                         self.outstanding.remove(msg_id)
                     self.results[msg_id] = self._unwrap_exception(msg['content'])
                 def _handle_apply_reply(self, msg):
                     """Save the reply to an apply_request into our results."""
                     parent = msg['parent_header']
                     msg_id = parent['msg_id']
                     if msg_id not in self.outstanding:
                         if msg_id in self.history:
                             print ("got stale result: %s"%msg_id)
                             print self.results[msg_id]
                             print msg
                         else:
                             print ("got unknown result: %s"%msg_id)
                     else:
                         self.outstanding.remove(msg_id)
                     content = msg['content']
                     header = msg['header']
                     # construct metadata:
                     md = self.metadata[msg_id]
                     md.update(self._extract_metadata(header, parent, content))
                     # is this redundant?
                     self.metadata[msg_id] = md
                     e_outstanding = self._outstanding_dict[md['engine_uuid']]
                     if msg_id in e_outstanding:
                         e_outstanding.remove(msg_id)
                     # construct result:
                     if content['status'] == 'ok':
                         self.results[msg_id] = util.unserialize_object(msg['buffers'])[0]
                     elif content['status'] == 'aborted':
                         self.results[msg_id] = error.TaskAborted(msg_id)
                     elif content['status'] == 'resubmitted':
                         # TODO: handle resubmission
                         pass
                     else:
                         self.results[msg_id] = self._unwrap_exception(content)
                 def _flush_notifications(self):
                     """Flush notifications of engine registrations waiting
                     in ZMQ queue.

                     Each pending message is dispatched to the handler registered for its
                     msg_type in self._notification_handlers.

                     Raises Exception when a message type has no handler.
                     """
                     idents,msg = self.session.recv(self._notification_socket, mode=zmq.NOBLOCK)
                     while msg is not None:
                         if self.debug:
                             pprint(msg)
                         msg_type = msg['header']['msg_type']
                         handler = self._notification_handlers.get(msg_type, None)
                         if handler is None:
                             # msg is subscripted like a dict here, so it has no .msg_type
                             # attribute; report the type we just looked up
                             raise Exception("Unhandled message type: %s"%msg_type)
                         handler(msg)
                         idents,msg = self.session.recv(self._notification_socket, mode=zmq.NOBLOCK)
                 def _flush_results(self, sock):
                     """Flush task or queue results waiting in ZMQ queue.

                     Each pending message on `sock` is dispatched to the handler
                     registered for its msg_type in self._queue_handlers.

                     Raises Exception when a message type has no handler.
                     """
                     idents,msg = self.session.recv(sock, mode=zmq.NOBLOCK)
                     while msg is not None:
                         if self.debug:
                             pprint(msg)
                         msg_type = msg['header']['msg_type']
                         handler = self._queue_handlers.get(msg_type, None)
                         if handler is None:
                             # msg is subscripted like a dict here, so it has no .msg_type
                             # attribute; report the type we just looked up
                             raise Exception("Unhandled message type: %s"%msg_type)
                         handler(msg)
                         idents,msg = self.session.recv(sock, mode=zmq.NOBLOCK)
                 def _flush_control(self, sock):
                     """Flush replies from the control channel waiting
                     in the ZMQ queue.
                     Currently: ignore them."""
                     if self._ignored_control_replies <= 0:
                         return
                     idents,msg = self.session.recv(sock, mode=zmq.NOBLOCK)
                     while msg is not None:
                         self._ignored_control_replies -= 1
                         if self.debug:
                             pprint(msg)
                         idents,msg = self.session.recv(sock, mode=zmq.NOBLOCK)
                 def _flush_ignored_control(self):
                     """flush ignored control replies"""
                     while self._ignored_control_replies > 0:
                         self.session.recv(self._control_socket)
                         self._ignored_control_replies -= 1
                 def _flush_ignored_hub_replies(self):
                     """Discard every reply currently waiting on the hub query socket."""
                     while True:
                         ident,msg = self.session.recv(self._query_socket, mode=zmq.NOBLOCK)
                         if msg is None:
                             break
                 def _flush_iopub(self, sock):
                     """Flush replies from the iopub channel waiting
                     in the ZMQ queue.

                     Each message is folded into the metadata of its parent msg_id:
                     'stream' data is appended to the named stream, 'pyerr' stores the
                     unwrapped exception, 'pyin' stores the code, and any other type
                     stores the content's 'data' under the message type.
                     """
                     while True:
                         idents,msg = self.session.recv(sock, mode=zmq.NOBLOCK)
                         if msg is None:
                             break
                         if self.debug:
                             pprint(msg)
                         msg_id = msg['parent_header']['msg_id']
                         content = msg['content']
                         msg_type = msg['header']['msg_type']
                         # init metadata:
                         md = self.metadata[msg_id]
                         if msg_type == 'stream':
                             name = content['name']
                             previous = md[name] or ''
                             md[name] = previous + content['data']
                         else:
                             if msg_type == 'pyerr':
                                 update = {'pyerr' : self._unwrap_exception(content)}
                             elif msg_type == 'pyin':
                                 update = {'pyin' : content['code']}
                             else:
                                 update = {msg_type : content.get('data', '')}
                             md.update(update)
                         # redundant?
                         self.metadata[msg_id] = md
                 #--------------------------------------------------------------------------
                 # len, getitem
                 #--------------------------------------------------------------------------
                 def __len__(self):
                     """len(client) returns # of engines.

                     The count comes from the `ids` property, so pending registration
                     notifications are flushed first.
                     """
                     return len(self.ids)
                 def __getitem__(self, key):
                     """Index access returns the result of direct_view(key)
                     (a DirectView multiplexer object).

                     `key` must be an int, a slice, or a list/tuple/xrange of ints;
                     anything else raises TypeError.
                     """
                     accepted = (int, slice, tuple, list, xrange)
                     if isinstance(key, accepted):
                         return self.direct_view(key)
                     raise TypeError("key by int/slice/iterable of ints only, not %s"%(type(key)))
                 #--------------------------------------------------------------------------
                 # Begin public methods
                 #--------------------------------------------------------------------------
                 @property
                 def ids(self):
                     """Always up-to-date ids property.

                     Pending notifications are flushed before reading, and a new list is
                     returned so callers cannot mutate the internal `_ids`.
                     """
                     self._flush_notifications()
                     # always copy:
                     return list(self._ids)
                 def close(self):
                     """Close every open zmq socket held in an attribute whose name ends
                     with 'socket'.  Calling close() again is a no-op."""
                     if self._closed:
                         return
                     candidates = [getattr(self, name) for name in dir(self)
                                   if name.endswith('socket')]
                     for sock in candidates:
                         if isinstance(sock, zmq.Socket) and not sock.closed:
                             sock.close()
                     self._closed = True
                 def spin(self):
                     """Flush any registration notifications and execution results
                     waiting in the ZMQ queue.

                     Channels are processed in a fixed order (notification, mux, task,
                     control, iopub, hub query); a channel without a socket is skipped.
                     """
                     # each socket attribute is read just before its own flush, since an
                     # earlier flush may replace or drop a later socket
                     steps = (
                         ('_notification_socket', lambda sock: self._flush_notifications()),
                         ('_mux_socket', self._flush_results),
                         ('_task_socket', self._flush_results),
                         ('_control_socket', self._flush_control),
                         ('_iopub_socket', self._flush_iopub),
                         ('_query_socket', lambda sock: self._flush_ignored_hub_replies()),
                     )
                     for attr, flush in steps:
                         sock = getattr(self, attr)
                         if sock:
                             flush(sock)
                 def wait(self, jobs=None, timeout=-1):
                     """waits on one or more `jobs`, for up to `timeout` seconds.

                     Parameters
                     ----------
                     jobs : int, str, or list of ints and/or strs, or one or more AsyncResult objects
                             ints are indices to self.history
                             strs are msg_ids
                             default: wait on all outstanding messages
                     timeout : float
                             a time in seconds, after which to give up.
                             default is -1, which means no timeout

                     Returns
                     -------
                     True : when all msg_ids are done
                     False : timeout reached, some msg_ids still outstanding
                     """
                     tic = time.time()
                     if jobs is None:
                         theids = self.outstanding
                     else:
                         if isinstance(jobs, (int, basestring, AsyncResult)):
                             jobs = [jobs]
                         theids = set()
                         for job in jobs:
                             if isinstance(job, int):
                                 # index access
                                 job = self.history[job]
                             elif isinstance(job, AsyncResult):
                                 # add all msg_ids of the result directly; a map() call used
                                 # only for its side effects does nothing when map is lazy
                                 theids.update(job.msg_ids)
                                 continue
                             theids.add(job)
                     if not theids.intersection(self.outstanding):
                         return True
                     self.spin()
                     # poll: spin roughly every millisecond until done or timed out
                     while theids.intersection(self.outstanding):
                         if timeout >= 0 and ( time.time()-tic ) > timeout:
                             break
                         time.sleep(1e-3)
                         self.spin()
                     return len(theids.intersection(self.outstanding)) == 0
                 #--------------------------------------------------------------------------
                 # Control methods
                 #--------------------------------------------------------------------------
                 @spin_first
                 def clear(self, targets=None, block=None):
                     """Clear the namespace in target(s).
                     A 'clear_request' is sent on the control socket for each ident
                     produced by `self._build_targets(targets)[0]`.
                     When blocking (`block`, falling back to `self.block`), one reply per
                     request is read and the last non-'ok' reply is raised as an exception.
                     Otherwise the replies are only counted in
                     `self._ignored_control_replies`.
                     """
                     if block is None:
                         block = self.block
                     engine_idents = self._build_targets(targets)[0]
                     for engine_ident in engine_idents:
                         self.session.send(self._control_socket, 'clear_request', content={}, ident=engine_ident)
                     failure = False
                     if not block:
                         # nobody will read these replies now; remember how many to discard
                         self._ignored_control_replies += len(engine_idents)
                     else:
                         self._flush_ignored_control()
                         for _ in range(len(engine_idents)):
                             idents, reply = self.session.recv(self._control_socket, 0)
                             if self.debug:
                                 pprint(reply)
                             reply_content = reply['content']
                             if reply_content['status'] != 'ok':
                                 failure = self._unwrap_exception(reply_content)
                     if failure:
                         raise failure
                 @spin_first
                 def abort(self, jobs=None, targets=None, block=None):
                     """Abort specific jobs from the execution queues of target(s).
                     This is a mechanism to prevent jobs that have already been submitted
                     from executing.
                     Parameters
                     ----------
                     jobs : msg_id, list of msg_ids, or AsyncResult
                         The jobs to be aborted.
                         If None (the default), every msg_id in `self.outstanding` is aborted.
                     targets : passed to `self._build_targets`
                         The engines whose queues receive the abort request.
                     block : bool
                         Whether to wait for the replies; defaults to `self.block`.
                     Raises
                     ------
                     TypeError : if an entry of `jobs` is neither a str nor an AsyncResult
                     """
                     block = self.block if block is None else block
                     targets = self._build_targets(targets)[0]
                     if jobs is None:
                         # the default used to fail with "NoneType is not iterable";
                         # treat it as "everything still outstanding"
                         jobs = list(self.outstanding)
                     if isinstance(jobs, (basestring,AsyncResult)):
                         jobs = [jobs]
                     # validate and flatten in one pass; nothing is sent until all jobs are valid
                     msg_ids = []
                     for j in jobs:
                         if isinstance(j, AsyncResult):
                             msg_ids.extend(j.msg_ids)
                         elif isinstance(j, basestring):
                             msg_ids.append(j)
                         else:
                             # wrap in a tuple so a tuple-valued `j` cannot break the formatting
                             raise TypeError("Invalid msg_id type %r, expected str or AsyncResult"%(j,))
                     content = dict(msg_ids=msg_ids)
                     for t in targets:
                         self.session.send(self._control_socket, 'abort_request',
                                 content=content, ident=t)
                     error = False
                     if block:
                         self._flush_ignored_control()
                         for _ in range(len(targets)):
                             idents,msg = self.session.recv(self._control_socket,0)
                             if self.debug:
                                 pprint(msg)
                             if msg['content']['status'] != 'ok':
                                 error = self._unwrap_exception(msg['content'])
                     else:
                         # replies will arrive later; count them so they can be discarded
                         self._ignored_control_replies += len(targets)
                     if error:
                         raise error
                 @spin_first
                 def shutdown(self, targets=None, restart=False, hub=False, block=None):
                     """Terminates one or more engine processes, optionally including the hub.
                     A 'shutdown_request' carrying `restart` is sent on the control socket
                     for each target. With `hub=True` the targets are forced to 'all', the
                     engine replies are always awaited, and after a 0.25 second pause a
                     'shutdown_request' is also sent on the query socket.
                     The last non-'ok' reply seen is raised as an exception.
                     """
                     if block is None:
                         block = self.block
                     if hub:
                         targets = 'all'
                     engine_idents = self._build_targets(targets)[0]
                     for engine_ident in engine_idents:
                         self.session.send(self._control_socket, 'shutdown_request',
                                     content={'restart':restart}, ident=engine_ident)
                     failure = False
                     if not (block or hub):
                         # replies are not read here; remember how many to discard later
                         self._ignored_control_replies += len(engine_idents)
                     else:
                         self._flush_ignored_control()
                         for _ in range(len(engine_idents)):
                             idents, reply = self.session.recv(self._control_socket, 0)
                             if self.debug:
                                 pprint(reply)
                             reply_content = reply['content']
                             if reply_content['status'] != 'ok':
                                 failure = self._unwrap_exception(reply_content)
                     if hub:
                         time.sleep(0.25)
                         self.session.send(self._query_socket, 'shutdown_request')
                         idents, reply = self.session.recv(self._query_socket, 0)
                         if self.debug:
                             pprint(reply)
                         reply_content = reply['content']
                         if reply_content['status'] != 'ok':
                             failure = self._unwrap_exception(reply_content)
                     if failure:
                         raise failure
                 #--------------------------------------------------------------------------
                 # Execution related methods
                 #--------------------------------------------------------------------------
                 def _maybe_raise(self, result):
                     """Return `result` unchanged, unless it is an `error.RemoteError`,
                     in which case raise it."""
                     if not isinstance(result, error.RemoteError):
                         return result
                     raise result
                 def send_apply_message(self, socket, f, args=None, kwargs=None, subheader=None, track=False,
                                         ident=None):
                     """Build an apply request for `f(*args, **kwargs)` and send it on `socket`.
                     This is the principal method with which all engine execution is performed by views.
                     The new msg_id is added to `self.outstanding` and `self.history`, and its
                     submission time is stored in `self.metadata`. Returns the sent message.
                     Raises TypeError when `f` is not callable, `args` is not a tuple or list,
                     or `kwargs`/`subheader` is not a dict.
                     """
                     assert not self._closed, "cannot use me anymore, I'm closed!"
                     # fill in fresh containers for anything left unspecified
                     if args is None:
                         args = []
                     if kwargs is None:
                         kwargs = {}
                     if subheader is None:
                         subheader = {}
                     # check argument types before anything is packed or sent
                     if not callable(f):
                         raise TypeError("f must be callable, not %s"%type(f))
                     if not isinstance(args, (tuple, list)):
                         raise TypeError("args must be tuple or list, not %s"%type(args))
                     if not isinstance(kwargs, dict):
                         raise TypeError("kwargs must be dict, not %s"%type(kwargs))
                     if not isinstance(subheader, dict):
                         raise TypeError("subheader must be dict, not %s"%type(subheader))
                     packed = util.pack_apply_message(f,args,kwargs)
                     msg = self.session.send(socket, "apply_request", buffers=packed, ident=ident,
                                         subheader=subheader, track=track)
                     msg_id = msg['header']['msg_id']
                     self.outstanding.add(msg_id)
                     if ident:
                         # possibly routed to a specific engine: for a list of idents, use the last
                         engine_ident = ident[-1] if isinstance(ident, list) else ident
                         if engine_ident in self._engines.values():
                             # save for later, in case of engine death
                             self._outstanding_dict[engine_ident].add(msg_id)
                     self.history.append(msg_id)
                     self.metadata[msg_id]['submitted'] = datetime.now()
                     return msg
                 #--------------------------------------------------------------------------
                 # construct a View object
                 #--------------------------------------------------------------------------
                 def load_balanced_view(self, targets=None):
                     """Construct a LoadBalancedView object on the task socket.
                     If no arguments are specified, create a LoadBalancedView
                     using all engines.
                     Parameters
                     ----------
                     targets: list,slice,int,etc. [default: use all engines]
                         The subset of engines across which to load-balance.
                         'all' is treated the same as None.
                     """
                     if targets == 'all' or targets is None:
                         # no restriction: the view receives targets=None
                         targets = None
                     else:
                         targets = self._build_targets(targets)[1]
                     return LoadBalancedView(client=self, socket=self._task_socket, targets=targets)
                 def direct_view(self, targets='all'):
                     """Construct a DirectView object on the mux socket.
                     If no targets are specified, create a DirectView
                     using all engines.
                     Parameters
                     ----------
                     targets: list,slice,int,etc. [default: use all engines]
                         The engines to use for the View. A single int yields a view on
                         that one engine rather than on a one-element list.
                     """
                     wants_single = isinstance(targets, int)
                     # allow 'all' to be lazily evaluated at each execution
                     if targets != 'all':
                         resolved = self._build_targets(targets)[1]
                         targets = resolved[0] if wants_single else resolved
                     return DirectView(client=self, socket=self._mux_socket, targets=targets)
                 #--------------------------------------------------------------------------
                 # Query methods
                 #--------------------------------------------------------------------------
                 @spin_first
                 def get_result(self, indices_or_msg_ids=None, block=None):
                     """Retrieve a result by msg_id or history index, wrapped in an AsyncResult object.
                     If the client already has the results, no request to the Hub will be made.
                     This is a convenient way to construct AsyncResult objects, which are wrappers
                     that include metadata about execution, and allow for awaiting results that
                     were not submitted by this Client.
                     It can also be a convenient way to retrieve the metadata associated with
                     blocking execution, since the result is always returned wrapped in an
                     AsyncResult.
                     Examples
                     --------
                     ::
                         In [10]: r = client.apply()
                     Parameters
                     ----------
                     indices_or_msg_ids : integer history index, str msg_id, or list of either
                         The indices or msg_ids of indices to be retrieved
                         (default: the last entry of self.history)
                     block : bool
                         Whether to wait for the result to be done
                     Returns
                     -------
                     AsyncResult
                         A single AsyncResult object will always be returned.
                     AsyncHubResult
                         A subclass of AsyncResult that retrieves results from the Hub
                     Raises
                     ------
                     TypeError : if an entry is neither an int nor a str
                     """
                     block = self.block if block is None else block
                     if indices_or_msg_ids is None:
                         indices_or_msg_ids = -1
                     if not isinstance(indices_or_msg_ids, (list,tuple)):
                         indices_or_msg_ids = [indices_or_msg_ids]
                     theids = []
                     # `msg_id` rather than `id`, so the builtin is not shadowed
                     for msg_id in indices_or_msg_ids:
                         if isinstance(msg_id, int):
                             msg_id = self.history[msg_id]
                         if not isinstance(msg_id, basestring):
                             raise TypeError("indices must be str or int, not %r"%msg_id)
                         theids.append(msg_id)
                     # one set build instead of a list scan per requested id
                     submitted_here = set(self.history)
                     needs_hub = any(
                         msg_id not in submitted_here and msg_id not in self.results
                         for msg_id in theids
                     )
                     if needs_hub:
                         # at least one id is unknown locally, so the Hub has to be asked
                         ar = AsyncHubResult(self, msg_ids=theids)
                     else:
                         ar = AsyncResult(self, msg_ids=theids)
                     if block:
                         ar.wait()
                     return ar
                 @spin_first
                 def resubmit(self, indices_or_msg_ids=None, subheader=None, block=None):
                     """Resubmit one or more tasks.
                     in-flight tasks may not be resubmitted.
                     Local bookkeeping for the given msg_ids (outstanding, history, results,
                     metadata) is dropped before the 'resubmit_request' is sent on the
                     query socket.
                     Parameters
                     ----------
                     indices_or_msg_ids : integer history index, str msg_id, or list of either
                         The indices or msg_ids of the tasks to be resubmitted
                         (default: the last entry of self.history)
                     block : bool
                         Whether to wait for the result to be done
                     Returns
                     -------
                     AsyncHubResult
                         A subclass of AsyncResult that retrieves results from the Hub
                     """
                     if block is None:
                         block = self.block
                     requested = -1 if indices_or_msg_ids is None else indices_or_msg_ids
                     if not isinstance(requested, (list,tuple)):
                         requested = [requested]
                     theids = []
                     for entry in requested:
                         # ints index into the local history, anything else must already be a msg_id
                         msg_id = self.history[entry] if isinstance(entry, int) else entry
                         if not isinstance(msg_id, basestring):
                             raise TypeError("indices must be str or int, not %r"%msg_id)
                         theids.append(msg_id)
                     # forget everything known locally about these tasks
                     for msg_id in theids:
                         self.outstanding.discard(msg_id)
                         if msg_id in self.history:
                             self.history.remove(msg_id)
                         self.results.pop(msg_id, None)
                         self.metadata.pop(msg_id, None)
                     request = dict(msg_ids = theids)
                     self.session.send(self._query_socket, 'resubmit_request', request)
                     # wait until the query socket is readable, then read without blocking
                     zmq.select([self._query_socket], [], [])
                     idents, reply = self.session.recv(self._query_socket, zmq.NOBLOCK)
                     if self.debug:
                         pprint(reply)
                     reply_content = reply['content']
                     if reply_content['status'] != 'ok':
                         raise self._unwrap_exception(reply_content)
                     ar = AsyncHubResult(self, msg_ids=theids)
                     if block:
                         ar.wait()
                     return ar
                 @spin_first
                 def result_status(self, msg_ids, status_only=True):
                     """Check on the status of the result(s) of the apply request with `msg_ids`.
                     If status_only is False, then the actual results will be retrieved, else
                     only the status of the results will be checked.
                     Results already present in `self.results` are served locally; only the
                     remaining msg_ids are requested on the query socket.
                     Parameters
                     ----------
                     msg_ids : list of msg_ids
                         if int:
                             Passed as index to self.history for convenience.
                     status_only : bool (default: True)
                         if False:
                             Retrieve the actual results of completed tasks.
                     Returns
                     -------
                     results : dict
                         There will always be the keys 'pending' and 'completed', which will
                         be lists of msg_ids that are incomplete or complete. If `status_only`
                         is False, then completed results will be keyed by their `msg_id`.
                     Raises
                     ------
                     TypeError : if an entry is neither an int nor a str
                     """
                     if not isinstance(msg_ids, (list,tuple)):
                         msg_ids = [msg_ids]
                     theids = []
                     for msg_id in msg_ids:
                         if isinstance(msg_id, int):
                             msg_id = self.history[msg_id]
                         if not isinstance(msg_id, basestring):
                             raise TypeError("msg_ids must be str, not %r"%msg_id)
                         theids.append(msg_id)
                     completed = []
                     local_results = {}
                     # Split into locally cached ids and ids the Hub must be asked about.
                     # A second list is built because removing from `theids` while
                     # iterating over it skips the element after each removal.
                     remote_ids = []
                     for msg_id in theids:
                         if msg_id in self.results:
                             completed.append(msg_id)
                             local_results[msg_id] = self.results[msg_id]
                         else:
                             remote_ids.append(msg_id)
                     theids = remote_ids
                     if theids: # some not locally cached
                         content = dict(msg_ids=theids, status_only=status_only)
                         self.session.send(self._query_socket, "result_request", content=content)
                         # wait until the query socket is readable, then read without blocking
                         zmq.select([self._query_socket], [], [])
                         idents,msg = self.session.recv(self._query_socket, zmq.NOBLOCK)
                         if self.debug:
                             pprint(msg)
                         content = msg['content']
                         if content['status'] != 'ok':
                             raise self._unwrap_exception(content)
                         buffers = msg['buffers']
                     else:
                         content = dict(completed=[],pending=[])
                     content['completed'].extend(completed)
                     if status_only:
                         return content
                     failures = []
                     # load cached results into result:
                     content.update(local_results)
                     # update cache with results:
                     for msg_id in sorted(theids):
                         if msg_id in content['completed']:
                             rec = content[msg_id]
                             parent = rec['header']
                             header = rec['result_header']
                             rcontent = rec['result_content']
                             iodict = rec['io']
                             if isinstance(rcontent, str):
                                 rcontent = self.session.unpack(rcontent)
                             md = self.metadata[msg_id]
                             md.update(self._extract_metadata(header, parent, rcontent))
                             md.update(iodict)
                             if rcontent['status'] == 'ok':
                                 # each call consumes this record's share of the reply buffers
                                 res,buffers = util.unserialize_object(buffers)
                             else:
                                 # failure content is shown only in debug mode, like the other replies
                                 if self.debug:
                                     pprint(rcontent)
                                 res = self._unwrap_exception(rcontent)
                                 failures.append(res)
                             self.results[msg_id] = res
                             content[msg_id] = res
                     if len(theids) == 1 and failures:
                             raise failures[0]
                     error.collect_exceptions(failures, "result_status")
                     return content
                 @spin_first
                 def queue_status(self, targets='all', verbose=False):
                     """Fetch the status of engine queues.
                     Sends a 'queue_request' on the query socket and returns the re-keyed
                     reply content; when `targets` is a single int, only that entry is
                     returned.
                     Parameters
                     ----------
                     targets : int/str/list of ints/strs
                             the engines whose states are to be queried.
                             default : all
                     verbose : bool
                             Whether to return lengths only, or lists of ids for each element
                     """
                     engine_ids = self._build_targets(targets)[1]
                     request = dict(targets=engine_ids, verbose=verbose)
                     self.session.send(self._query_socket, "queue_request", content=request)
                     idents, reply = self.session.recv(self._query_socket, 0)
                     if self.debug:
                         pprint(reply)
                     reply_content = reply['content']
                     # 'status' is removed so that only queue entries remain in the result
                     if reply_content.pop('status') != 'ok':
                         raise self._unwrap_exception(reply_content)
                     by_engine = rekey(reply_content)
                     if not isinstance(targets, int):
                         return by_engine
                     return by_engine[targets]
                 @spin_first
                 def purge_results(self, jobs=[], targets=[]):
                     """Tell the Hub to forget results.
                     Individual results can be purged by msg_id, or the entire
                     history of specific targets can be purged.
                     Use `purge_results('all')` to scrub everything from the Hub's db.
                     Parameters
                     ----------
                     jobs : str or list of str or AsyncResult objects
                             the msg_ids whose results should be forgotten.
                     targets : int/str/list of ints/strs
                             The targets, by int_id, whose entire history is to be purged.
                             default : empty (no targets)
                     Raises
                     ------
                     ValueError : if neither `jobs` nor `targets` is given
                     TypeError : if an entry of `jobs` is neither a str nor an AsyncResult
                     """
                     # the list defaults are only read, never mutated
                     if not (targets or jobs):
                         raise ValueError("Must specify at least one of `targets` and `jobs`")
                     if targets:
                         targets = self._build_targets(targets)[1]
                     # construct msg_ids from jobs
                     if jobs == 'all':
                         msg_ids = jobs
                     else:
                         if isinstance(jobs, (basestring,AsyncResult)):
                             jobs = [jobs]
                         invalid = [job for job in jobs
                                    if not isinstance(job, (basestring, AsyncResult))]
                         if invalid:
                             raise TypeError("Invalid msg_id type %r, expected str or AsyncResult"%invalid[0])
                         msg_ids = []
                         for job in jobs:
                             if not isinstance(job, AsyncResult):
                                 msg_ids.append(job)
                             else:
                                 # an AsyncResult stands for all of its msg_ids
                                 msg_ids.extend(job.msg_ids)
                     request = dict(engine_ids=targets, msg_ids=msg_ids)
                     self.session.send(self._query_socket, "purge_request", content=request)
                     idents, reply = self.session.recv(self._query_socket, 0)
                     if self.debug:
                         pprint(reply)
                     reply_content = reply['content']
                     if reply_content['status'] != 'ok':
                         raise self._unwrap_exception(reply_content)
                 @spin_first
                 def hub_history(self):
                     """Get the Hub's history
                     Just like the Client, the Hub has a history, which is a list of msg_ids.
                     This will contain the history of all clients, and, depending on configuration,
                     may contain history across multiple cluster sessions.
                     Any msg_id returned here is a valid argument to `get_result`.
                     Returns
                     -------
                     msg_ids : list of strs
                             list of all msg_ids, ordered by task submission time.
                     """
                     self.session.send(self._query_socket, "history_request", content={})
                     idents, reply = self.session.recv(self._query_socket, 0)
                     if self.debug:
                         pprint(reply)
                     reply_content = reply['content']
                     if reply_content['status'] == 'ok':
                         return reply_content['history']
                     raise self._unwrap_exception(reply_content)
                 @spin_first
                 def db_query(self, query, keys=None):
                     """Query the Hub's TaskRecord database
                     This will return a list of task record dicts that match `query`
                     Parameters
                     ----------
                     query : mongodb query dict
                         The search dict. See mongodb query docs for details.
                     keys : list of strs [optional]
                         The subset of keys to be returned.  The default is to fetch everything but buffers.
                         'msg_id' will *always* be included.
                         A single str is treated as a one-element list.
                     """
                     if isinstance(keys, basestring):
                         keys = [keys]
                     request = dict(query=query, keys=keys)
                     self.session.send(self._query_socket, "db_request", content=request)
                     idents, reply = self.session.recv(self._query_socket, 0)
                     if self.debug:
                         pprint(reply)
                     reply_content = reply['content']
                     if reply_content['status'] != 'ok':
                         raise self._unwrap_exception(reply_content)
                     records = reply_content['records']
                     buffer_lens = reply_content['buffer_lens']
                     result_buffer_lens = reply_content['result_buffer_lens']
                     remaining = reply['buffers']
                     # relink buffers: the reply carries one flat buffer list, and the
                     # per-record lengths say how many leading buffers belong to each record
                     for index, rec in enumerate(records):
                         if buffer_lens is not None:
                             count = buffer_lens[index]
                             taken, remaining = remaining[:count], remaining[count:]
                             rec['buffers'] = taken
                         if result_buffer_lens is not None:
                             count = result_buffer_lens[index]
                             taken, remaining = remaining[:count], remaining[count:]
                             rec['result_buffers'] = taken
                     return records
             # `from <this module> import *` exposes only the Client class
             __all__ = [ 'Client' ]

IPython/parallel/controller/heartmonitor.py

0 +2 -2

             #!/usr/bin/env python
             """
             A multi-heart Heartbeat system using PUB and XREP sockets. pings are sent out on the PUB,
             and hearts are tracked based on their XREQ identities.
             Authors:
             * Min RK
             """
             #-----------------------------------------------------------------------------
             #  Copyright (C) 2010-2011  The IPython Development Team
             #
             #  Distributed under the terms of the BSD License.  The full license is in
             #  the file COPYING, distributed as part of this software.
             #-----------------------------------------------------------------------------
             from __future__ import print_function
             import time
             import uuid
             import zmq
             from zmq.devices import ThreadDevice
             from zmq.eventloop import ioloop, zmqstream
             from IPython.config.configurable import LoggingConfigurable
             from IPython.utils.traitlets import Set, Instance, CFloat
             from IPython.parallel.util import asbytes
             class Heart(object):
                 """A basic heart object for responding to a HeartMonitor.
                 This is a simple wrapper with defaults for the most common
                 Device model for responding to heartbeats.
                 It simply builds a threadsafe zmq.FORWARDER Device, defaulting to using
                 SUB/XREQ for in/out.
                 You can specify the XREQ's IDENTITY via the optional heart_id argument."""
                 # the ThreadDevice built in __init__ (None until then)
                 device=None
                 # the IDENTITY set on the device's outgoing socket (None until __init__ runs)
                 id=None
-                def __init__(self, in_addr, out_addr, in_type=zmq.SUB, out_type=zmq.XREQ, heart_id=None):
+                def __init__(self, in_addr, out_addr, in_type=zmq.SUB, out_type=zmq.DEALER, heart_id=None):
                     # FORWARDER device in a daemon thread, connected (not bound) to both addresses
                     self.device = ThreadDevice(zmq.FORWARDER, in_type, out_type)
                     self.device.daemon=True
                     self.device.connect_in(in_addr)
                     self.device.connect_out(out_addr)
                     if in_type == zmq.SUB:
                         # an empty prefix subscribes the incoming SUB socket to every message
                         self.device.setsockopt_in(zmq.SUBSCRIBE, b"")
                     if heart_id is None:
                         # no identity supplied: use the 16 raw bytes of a random UUID
                         heart_id = uuid.uuid4().bytes
                     self.device.setsockopt_out(zmq.IDENTITY, heart_id)
                     self.id = heart_id
                 def start(self):
                     # start the underlying device; returns whatever ThreadDevice.start() returns
                     return self.device.start()
             class HeartMonitor(LoggingConfigurable):
                 """Ping engines over a PUB stream and track which of them answer.
                 pingstream: a PUB stream
                 pongstream: a ROUTER stream (the socket type formerly named XREP)
                 period: the period of the heartbeat in milliseconds"""
                 period=CFloat(1000, config=True,
                     help='The frequency at which the Hub pings the engines for heartbeats '
                     ' (in ms) [default: 1000]',
                 )
                 pingstream=Instance('zmq.eventloop.zmqstream.ZMQStream')
                 pongstream=Instance('zmq.eventloop.zmqstream.ZMQStream')
                 loop = Instance('zmq.eventloop.ioloop.IOLoop')
                 def _loop_default(self):
                     """Default to the global IOLoop instance."""
                     return ioloop.IOLoop.instance()
                 # not settable:
                 hearts=Set()  # hearts currently accepted as alive
                 responses=Set()  # hearts that answered since the last beat
                 on_probation=Set()  # known hearts that missed the most recent beat
                 last_ping=CFloat(0)  # value of `lifetime` sent with the previous ping
                 _new_handlers = Set()
                 _failure_handlers = Set()
                 lifetime = CFloat(0)  # running total of time between beats; doubles as the ping payload
                 tic = CFloat(0)  # time.time() of the most recent beat
                 def __init__(self, **kwargs):
                     """Accept trait values as keyword arguments and subscribe to incoming pongs."""
                     super(HeartMonitor, self).__init__(**kwargs)
                     self.pongstream.on_recv(self.handle_pong)
                 def start(self):
                     """Schedule `beat` to run every `period` milliseconds on `loop`."""
                     self.caller = ioloop.PeriodicCallback(self.beat, self.period, self.loop)
                     self.caller.start()
                 def add_new_heart_handler(self, handler):
                     """add a new handler for new hearts"""
                     self.log.debug("heartbeat::new_heart_handler: %s"%handler)
                     self._new_handlers.add(handler)
                 def add_heart_failure_handler(self, handler):
                     """add a new handler for heart failure"""
                     self.log.debug("heartbeat::new heart failure handler: %s"%handler)
                     self._failure_handlers.add(handler)
                 def beat(self):
                     """Evaluate the pongs collected since the previous ping, then send the next ping.
                     A responder that is not yet in `hearts` is reported as a new heart; a known
                     heart that misses two consecutive beats is reported as a failure."""
                     self.pongstream.flush()
                     self.last_ping = self.lifetime
                     toc = time.time()
                     self.lifetime += toc-self.tic
                     self.tic = toc
                     goodhearts = self.hearts.intersection(self.responses)
                     missed_beats = self.hearts.difference(goodhearts)
                     heartfailures = self.on_probation.intersection(missed_beats)
                     newhearts = self.responses.difference(goodhearts)
                     # Explicit loops: map() is lazy on Python 3, so calling it only for
                     # its side effects would silently skip every handler.
                     for heart in newhearts:
                         self.handle_new_heart(heart)
                     for heart in heartfailures:
                         self.handle_heart_failure(heart)
                     # failed hearts were just removed from self.hearts, so they drop out here
                     self.on_probation = missed_beats.intersection(self.hearts)
                     self.responses = set()
                     self.pingstream.send(asbytes(str(self.lifetime)))
                 def handle_new_heart(self, heart):
                     """Notify the new-heart handlers (or just log) and start tracking `heart`."""
                     if self._new_handlers:
                         for handler in self._new_handlers:
                             handler(heart)
                     else:
                         self.log.info("heartbeat::yay, got new heart %s!"%heart)
                     self.hearts.add(heart)
                 def handle_heart_failure(self, heart):
                     """Notify the failure handlers (or just log) and stop tracking `heart`.
                     A handler that raises is logged and does not prevent the remaining
                     handlers from running."""
                     if self._failure_handlers:
                         for handler in self._failure_handlers:
                             try:
                                 handler(heart)
                             except Exception:
                                 self.log.error("heartbeat::Bad Handler! %s"%handler, exc_info=True)
                     else:
                         self.log.info("heartbeat::Heart %s failed :("%heart)
                     self.hearts.remove(heart)
                 def handle_pong(self, msg):
                     """a heart just beat
                     msg[0] is the identity of the responding heart and msg[1] is the ping
                     payload it echoes back."""
                     current = asbytes(str(self.lifetime))
                     last = asbytes(str(self.last_ping))
                     if msg[1] == current:
                         self.responses.add(msg[0])
                     elif msg[1] == last:
                         # the reply is to the previous ping: still counted, but reported as late
                         delta = time.time()-self.tic + (self.lifetime-self.last_ping)
                         self.log.warn("heartbeat::heart %r missed a beat, and took %.2f ms to respond"%(msg[0], 1000*delta))
                         self.responses.add(msg[0])
                     else:
                         self.log.warn("heartbeat::got bad heartbeat (possibly old?): %s (current=%.3f)"%
                         (msg[1],self.lifetime))
             if __name__ == '__main__':
                 loop = ioloop.IOLoop.instance()
                 context = zmq.Context()
                 pub = context.socket(zmq.PUB)
                 pub.bind('tcp://127.0.0.1:5555')
-                xrep = context.socket(zmq.XREP)
+                xrep = context.socket(zmq.ROUTER)
                 xrep.bind('tcp://127.0.0.1:5556')
                 outstream = zmqstream.ZMQStream(pub, loop)
                 instream = zmqstream.ZMQStream(xrep, loop)
                 hb = HeartMonitor(loop, outstream, instream)
                 loop.start()

IPython/parallel/controller/hub.py

0 +3 -3

             """The IPython Controller Hub with 0MQ
             This is the master object that handles connections from engines and clients,
             and monitors traffic through the various queues.
             Authors:
             * Min RK
             """
             #-----------------------------------------------------------------------------
             #  Copyright (C) 2010  The IPython Development Team
             #
             #  Distributed under the terms of the BSD License.  The full license is in
             #  the file COPYING, distributed as part of this software.
             #-----------------------------------------------------------------------------
             #-----------------------------------------------------------------------------
             # Imports
             #-----------------------------------------------------------------------------
             from __future__ import print_function
             import sys
             import time
             from datetime import datetime
             import zmq
             from zmq.eventloop import ioloop
             from zmq.eventloop.zmqstream import ZMQStream
             # internal:
             from IPython.utils.importstring import import_item
             from IPython.utils.traitlets import (
                     HasTraits, Instance, Int, Unicode, Dict, Set, Tuple, CBytes, DottedObjectName
                     )
             from IPython.parallel import error, util
             from IPython.parallel.factory import RegistrationFactory
             from IPython.zmq.session import SessionFactory
             from .heartmonitor import HeartMonitor
             #-----------------------------------------------------------------------------
             # Code
             #-----------------------------------------------------------------------------
             def _passer(*args, **kwargs):
                 return
             def _printer(*args, **kwargs):
                 print (args)
                 print (kwargs)
             def empty_record():
                 """Return a fresh record dict holding every record key in its blank state."""
                 unset_keys = (
                     'msg_id', 'header', 'content', 'buffers', 'submitted',
                     'client_uuid', 'engine_uuid', 'started', 'completed',
                     'resubmitted', 'result_header', 'result_content',
                     'result_buffers', 'queue', 'pyin', 'pyout', 'pyerr',
                 )
                 record = dict.fromkeys(unset_keys)
                 # the two output streams start as empty strings rather than None
                 record['stdout'] = ''
                 record['stderr'] = ''
                 return record
             def init_record(msg):
                 """Build the initial TaskRecord dict for a request message.
                 The id, header, content, buffers and submission date are copied from
                 `msg`; every other field starts blank."""
                 header = msg['header']
                 record = dict.fromkeys((
                     'client_uuid', 'engine_uuid', 'started', 'completed',
                     'resubmitted', 'result_header', 'result_content',
                     'result_buffers', 'queue', 'pyin', 'pyout', 'pyerr',
                 ))
                 record.update(
                     msg_id=header['msg_id'],
                     header=header,
                     content=msg['content'],
                     buffers=msg['buffers'],
                     submitted=header['date'],
                     stdout='',
                     stderr='',
                 )
                 return record
             class EngineConnector(HasTraits):
                 """A simple object for accessing the various zmq connections of an object.
                 Attributes are:
                 id (int): engine ID
                 queue (bytes): identity of queue's XREQ (DEALER) socket
                 control (bytes): identity of the control socket -- presumably also XREQ (DEALER); TODO confirm
                 registration (bytes): identity of registration XREQ (DEALER) socket
                 heartbeat (bytes): identity of heartbeat XREQ (DEALER) socket
                 pending (set): not described by earlier docs -- presumably outstanding msg_ids; TODO confirm
                 NOTE(review): earlier docs also listed a ``uuid`` attribute, but no such
                 trait is declared on this class.
                 """
                 id=Int(0)
                 queue=CBytes()
                 control=CBytes()
                 registration=CBytes()
                 heartbeat=CBytes()
                 pending=Set()
             class HubFactory(RegistrationFactory):
                 """The Configurable for setting up a Hub."""
                 # port-pairs for monitoredqueues:
                 hb = Tuple(Int,Int,config=True,
                     help="""XREQ/SUB Port pair for Engine heartbeats""")
                 def _hb_default(self):
                     return tuple(util.select_random_ports(2))
                 mux = Tuple(Int,Int,config=True,
                     help="""Engine/Client Port pair for MUX queue""")
                 def _mux_default(self):
                     return tuple(util.select_random_ports(2))
                 task = Tuple(Int,Int,config=True,
                     help="""Engine/Client Port pair for Task queue""")
                 def _task_default(self):
                     return tuple(util.select_random_ports(2))
                 control = Tuple(Int,Int,config=True,
                     help="""Engine/Client Port pair for Control queue""")
                 def _control_default(self):
                     return tuple(util.select_random_ports(2))
                 iopub = Tuple(Int,Int,config=True,
                     help="""Engine/Client Port pair for IOPub relay""")
                 def _iopub_default(self):
                     return tuple(util.select_random_ports(2))
                 # single ports:
                 mon_port = Int(config=True,
                     help="""Monitor (SUB) port for queue traffic""")
                 def _mon_port_default(self):
                     return util.select_random_ports(1)[0]
                 notifier_port = Int(config=True,
                     help="""PUB port for sending engine status notifications""")
                 def _notifier_port_default(self):
                     return util.select_random_ports(1)[0]
                 engine_ip = Unicode('127.0.0.1', config=True,
                     help="IP on which to listen for engine connections. [default: loopback]")
                 engine_transport = Unicode('tcp', config=True,
                     help="0MQ transport for engine connections. [default: tcp]")
                 client_ip = Unicode('127.0.0.1', config=True,
                     help="IP on which to listen for client connections. [default: loopback]")
                 client_transport = Unicode('tcp', config=True,
                     help="0MQ transport for client connections. [default : tcp]")
                 monitor_ip = Unicode('127.0.0.1', config=True,
                     help="IP on which to listen for monitor messages. [default: loopback]")
                 monitor_transport = Unicode('tcp', config=True,
                     help="0MQ transport for monitor messages. [default : tcp]")
                 monitor_url = Unicode('')
                 db_class = DottedObjectName('IPython.parallel.controller.dictdb.DictDB',
                     config=True, help="""The class to use for the DB backend""")
                 # not configurable
                 db = Instance('IPython.parallel.controller.dictdb.BaseDB')
                 heartmonitor = Instance('IPython.parallel.controller.heartmonitor.HeartMonitor')
                 def _ip_changed(self, name, old, new):
                     self.engine_ip = new
                     self.client_ip = new
                     self.monitor_ip = new
                     self._update_monitor_url()
                 def _update_monitor_url(self):
                     self.monitor_url = "%s://%s:%i"%(self.monitor_transport, self.monitor_ip, self.mon_port)
                 def _transport_changed(self, name, old, new):
                     self.engine_transport = new
                     self.client_transport = new
                     self.monitor_transport = new
                     self._update_monitor_url()
                 def __init__(self, **kwargs):
                     super(HubFactory, self).__init__(**kwargs)
                     self._update_monitor_url()
                 def construct(self):
                     self.init_hub()
                 def start(self):
                     self.heartmonitor.start()
                     self.log.info("Heartmonitor started")
                 def init_hub(self):
                     """construct"""
                     client_iface = "%s://%s:"%(self.client_transport, self.client_ip) + "%i"
                     engine_iface = "%s://%s:"%(self.engine_transport, self.engine_ip) + "%i"
                     ctx = self.context
                     loop = self.loop
                     # Registrar socket
-                    q = ZMQStream(ctx.socket(zmq.XREP), loop)
+                    q = ZMQStream(ctx.socket(zmq.ROUTER), loop)
                     q.bind(client_iface % self.regport)
                     self.log.info("Hub listening on %s for registration."%(client_iface%self.regport))
                     if self.client_ip != self.engine_ip:
                         q.bind(engine_iface % self.regport)
                         self.log.info("Hub listening on %s for registration."%(engine_iface%self.regport))
                     ### Engine connections ###
                     # heartbeat
                     hpub = ctx.socket(zmq.PUB)
                     hpub.bind(engine_iface % self.hb[0])
-                    hrep = ctx.socket(zmq.XREP)
+                    hrep = ctx.socket(zmq.ROUTER)
                     hrep.bind(engine_iface % self.hb[1])
                     self.heartmonitor = HeartMonitor(loop=loop, config=self.config, log=self.log,
                                             pingstream=ZMQStream(hpub,loop),
                                             pongstream=ZMQStream(hrep,loop)
                                         )
                     ### Client connections ###
                     # Notifier socket
                     n = ZMQStream(ctx.socket(zmq.PUB), loop)
                     n.bind(client_iface%self.notifier_port)
                     ### build and launch the queues ###
                     # monitor socket
                     sub = ctx.socket(zmq.SUB)
                     sub.setsockopt(zmq.SUBSCRIBE, b"")
                     sub.bind(self.monitor_url)
                     sub.bind('inproc://monitor')
                     sub = ZMQStream(sub, loop)
                     # connect the db
                     self.log.info('Hub using DB backend: %r'%(self.db_class.split()[-1]))
                     # cdir = self.config.Global.cluster_dir
                     self.db = import_item(str(self.db_class))(session=self.session.session,
                                                         config=self.config, log=self.log)
                     time.sleep(.25)
                     try:
                         scheme = self.config.TaskScheduler.scheme_name
                     except AttributeError:
                         from .scheduler import TaskScheduler
                         scheme = TaskScheduler.scheme_name.get_default_value()
                     # build connection dicts
                     self.engine_info = {
                         'control' : engine_iface%self.control[1],
                         'mux': engine_iface%self.mux[1],
                         'heartbeat': (engine_iface%self.hb[0], engine_iface%self.hb[1]),
                         'task' : engine_iface%self.task[1],
                         'iopub' : engine_iface%self.iopub[1],
                         # 'monitor' : engine_iface%self.mon_port,
                         }
                     self.client_info = {
                         'control' : client_iface%self.control[0],
                         'mux': client_iface%self.mux[0],
                         'task' : (scheme, client_iface%self.task[0]),
                         'iopub' : client_iface%self.iopub[0],
                         'notification': client_iface%self.notifier_port
                         }
                     self.log.debug("Hub engine addrs: %s"%self.engine_info)
                     self.log.debug("Hub client addrs: %s"%self.client_info)
                     # resubmit stream
-                    r = ZMQStream(ctx.socket(zmq.XREQ), loop)
+                    r = ZMQStream(ctx.socket(zmq.DEALER), loop)
                     url = util.disambiguate_url(self.client_info['task'][-1])
                     r.setsockopt(zmq.IDENTITY, util.asbytes(self.session.session))
                     r.connect(url)
                     self.hub = Hub(loop=loop, session=self.session, monitor=sub, heartmonitor=self.heartmonitor,
                             query=q, notifier=n, resubmit=r, db=self.db,
                             engine_info=self.engine_info, client_info=self.client_info,
                             log=self.log)
             class Hub(SessionFactory):
                 """The IPython Controller Hub with 0MQ connections
                 Parameters
                 ==========
                 loop: zmq IOLoop instance
                 session: Session object
                 <removed> context: zmq context for creating new connections (?)
                 queue: ZMQStream for monitoring the command queue (SUB)
                 query: ZMQStream for engine registration and client query requests (ROUTER, formerly XREP)
                 heartbeat: HeartMonitor object checking the pulse of the engines
                 notifier: ZMQStream for broadcasting engine registration changes (PUB)
                 db: connection to db for out of memory logging of commands
                             NotImplemented
                 engine_info: dict of zmq connection information for engines to connect
                             to the queues.
                 client_info: dict of zmq connection information for clients to connect
                             to the queues.
                 """
                 # internal data structures:
                 ids=Set() # engine IDs
                 keytable=Dict()
                 by_ident=Dict() # engine ID keyed by queue identity
                 engines=Dict() # per-engine connection objects (read via `.queue`), keyed by engine ID
                 clients=Dict()
                 hearts=Dict() # engine ID keyed by heart identity
                 pending=Set() # msg_ids that have been submitted but not yet completed
                 queues=Dict()  # pending msg_ids keyed by engine_id
                 tasks=Dict() # pending msg_ids submitted as tasks, keyed by client_id
                 completed=Dict() # completed msg_ids keyed by engine_id
                 all_completed=Set() # set of all completed msg_ids
                 dead_engines=Set() # presumably identifies engines that have died -- TODO confirm against its users
                 unassigned=Set() # set of task msg_ids not yet assigned a destination
                 incoming_registrations=Dict() # registrations awaiting a first heartbeat, keyed by heart identity
                 registration_timeout=Int() # computed in __init__ from the heartbeat period
                 _idcounter=Int(0) # next engine ID to hand out (see _next_id)
                 # objects from constructor:
                 query=Instance(ZMQStream)
                 monitor=Instance(ZMQStream)
                 notifier=Instance(ZMQStream)
                 resubmit=Instance(ZMQStream)
                 heartmonitor=Instance(HeartMonitor)
                 db=Instance(object)
                 client_info=Dict()
                 engine_info=Dict()
                 def __init__(self, **kwargs):
                     """Wire the Hub's streams to their handlers.
                     All keyword arguments are forwarded to the parent constructor. The
                     values this method then reads are:
                     # streams / helpers:
                     query: ZMQStream for engine+client registration and client requests
                     monitor: ZMQStream carrying the monitored queue traffic
                     resubmit: ZMQStream whose replies are discarded
                     heartmonitor: HeartMonitor object for tracking engines
                     # connection info:
                     engine_info: zmq address/protocol dict for engine connections
                     client_info: zmq address/protocol dict for client connections
                     """
                     super(Hub, self).__init__(**kwargs)
                     self.registration_timeout = max(5000, 2*self.heartmonitor.period)
                     # validate connection dicts:
                     for name, entry in self.client_info.iteritems():
                         # for 'task' only the second element of the entry is a url container
                         target = entry[1] if name == 'task' else entry
                         util.validate_url_container(target)
                     util.validate_url_container(self.engine_info)
                     # register our callbacks
                     self.query.on_recv(self.dispatch_query)
                     self.monitor.on_recv(self.dispatch_monitor_traffic)
                     self.heartmonitor.add_heart_failure_handler(self.handle_heart_failure)
                     self.heartmonitor.add_new_heart_handler(self.handle_new_heart)
                     # monitor traffic is dispatched on its (bytes) topic prefix
                     monitor_table = {}
                     monitor_table[b'in'] = self.save_queue_request
                     monitor_table[b'out'] = self.save_queue_result
                     monitor_table[b'intask'] = self.save_task_request
                     monitor_table[b'outtask'] = self.save_task_result
                     monitor_table[b'tracktask'] = self.save_task_destination
                     monitor_table[b'incontrol'] = _passer
                     monitor_table[b'outcontrol'] = _passer
                     monitor_table[b'iopub'] = self.save_iopub_message
                     self.monitor_handlers = monitor_table
                     # queries are dispatched on the msg_type found in the message header
                     query_table = {}
                     query_table['queue_request'] = self.queue_status
                     query_table['result_request'] = self.get_results
                     query_table['history_request'] = self.get_history
                     query_table['db_request'] = self.db_query
                     query_table['purge_request'] = self.purge_results
                     query_table['load_request'] = self.check_load
                     query_table['resubmit_request'] = self.resubmit_task
                     query_table['shutdown_request'] = self.shutdown_request
                     query_table['registration_request'] = self.register_engine
                     query_table['unregistration_request'] = self.unregister_engine
                     query_table['connection_request'] = self.connection_request
                     self.query_handlers = query_table
                     # ignore resubmit replies
                     self.resubmit.on_recv(lambda msg: None, copy=False)
                     self.log.info("hub::created hub")
                 @property
                 def _next_id(self):
                     """gemerate a new ID.
                     No longer reuse old ids, just count from 0."""
                     newid = self._idcounter
                     self._idcounter += 1
                     return newid
                     # newid = 0
                     # incoming = [id[0] for id in self.incoming_registrations.itervalues()]
                     # # print newid, self.ids, self.incoming_registrations
                     # while newid in self.ids or newid in incoming:
                     #     newid += 1
                     # return newid
                 #-----------------------------------------------------------------------------
                 # message validation
                 #-----------------------------------------------------------------------------
                 def _validate_targets(self, targets):
                     """turn any valid targets argument into a list of integer ids"""
                     if targets is None:
                         # default to all
                         targets = self.ids
                     if isinstance(targets, (int,str,unicode)):
                         # only one target specified
                         targets = [targets]
                     _targets = []
                     for t in targets:
                         # map raw identities to ids
                         if isinstance(t, (str,unicode)):
                             t = self.by_ident.get(t, t)
                         _targets.append(t)
                     targets = _targets
                     bad_targets = [ t for t in targets if t not in self.ids ]
                     if bad_targets:
                         raise IndexError("No Such Engine: %r"%bad_targets)
                     if not targets:
                         raise IndexError("No Engines Registered")
                     return targets
                 #-----------------------------------------------------------------------------
                 # dispatch methods (1 per stream)
                 #-----------------------------------------------------------------------------
                 def dispatch_monitor_traffic(self, msg):
                     """Dispatch one message from the monitor stream.
                     All ME and Task queue messages come through here, as well as IOPub
                     traffic. msg[0] is the topic that selects the handler; the rest is
                     split into identities and message parts. Messages without identities
                     and unknown topics are logged as errors and dropped."""
                     self.log.debug("monitor traffic: %r"%msg[:2])
                     topic = msg[0]
                     try:
                         idents, msg = self.session.feed_identities(msg[1:])
                     except ValueError:
                         idents=[]
                     if not idents:
                         self.log.error("Bad Monitor Message: %r"%msg)
                         return
                     handler = self.monitor_handlers.get(topic, None)
                     if handler is None:
                         self.log.error("Invalid monitor topic: %r"%topic)
                         return
                     handler(idents, msg)
                 def dispatch_query(self, msg):
                     """Route registration requests and queries from clients.
                     `msg` is the raw multipart message from the query stream. The first
                     identity is taken as the requesting client. A message that cannot be
                     unserialized, or whose msg_type has no registered handler, is answered
                     with a "hub_error" reply; otherwise the handler registered for the
                     msg_type is called with (idents, msg)."""
                     try:
                         idents, msg = self.session.feed_identities(msg)
                     except ValueError:
                         idents = []
                     if not idents:
                         self.log.error("Bad Query Message: %r"%msg)
                         return
                     client_id = idents[0]
                     try:
                         msg = self.session.unserialize(msg, content=True)
                     except Exception:
                         content = error.wrap_exception()
                         self.log.error("Bad Query Message: %r"%msg, exc_info=True)
                         self.session.send(self.query, "hub_error", ident=client_id,
                                 content=content)
                         return
                     #switch on message type:
                     msg_type = msg['header']['msg_type']
                     self.log.info("client::client %r requested %r"%(client_id, msg_type))
                     handler = self.query_handlers.get(msg_type, None)
                     if handler is None:
                         # Raise explicitly rather than `assert`: asserts are stripped under
                         # -O, which would let the None handler be called. An exception must
                         # be active so that wrap_exception() and exc_info=True have one to
                         # report; the type stays AssertionError as before.
                         try:
                             raise AssertionError("Bad Message Type: %r"%msg_type)
                         except AssertionError:
                             content = error.wrap_exception()
                             self.log.error("Bad Message Type: %r"%msg_type, exc_info=True)
                             self.session.send(self.query, "hub_error", ident=client_id,
                                     content=content)
                         return
                     handler(idents, msg)
                 def dispatch_db(self, msg):
                     """Placeholder for dispatching DB messages; always raises NotImplementedError."""
                     raise NotImplementedError()
                 #---------------------------------------------------------------------------
                 # handler methods (1 per event)
                 #---------------------------------------------------------------------------
                 #----------------------- Heartbeat --------------------------------------
                 def handle_new_heart(self, heart):
                     """Heart monitor callback, called when a new heart starts to beat.
                     Completes the registration waiting on `heart`; a heart with no
                     incoming registration is logged and ignored."""
                     self.log.debug("heartbeat::handle_new_heart(%r)"%heart)
                     if heart in self.incoming_registrations:
                         self.finish_registration(heart)
                         return
                     self.log.info("heartbeat::ignoring new heart: %r"%heart)
                 def handle_heart_failure(self, heart):
                     """Heart monitor callback, called when a previously registered heart
                     fails to respond to a beat request.
                     Triggers unregistration of the engine that owns `heart`; a heart that
                     is not associated with any engine is logged and ignored."""
                     self.log.debug("heartbeat::handle_heart_failure(%r)"%heart)
                     eid = self.hearts.get(heart, None)
                     if eid is None:
                         self.log.info("heartbeat::ignoring heart failure %r"%heart)
                         return
                     # look the engine up only once eid is known to be valid:
                     # self.engines[None] would raise KeyError for an unknown heart
                     queue = self.engines[eid].queue
                     self.unregister_engine(heart, dict(content=dict(id=eid, queue=queue)))
                 #----------------------- MUX Queue Traffic ------------------------------
                 def save_queue_request(self, idents, msg):
                     """Record a request seen on the MUX queue (monitor topic b'in').
                     idents: identity prefix; its first two entries are read as the target
                         engine's queue identity and the submitting client's identity.
                     msg: the still-serialized message parts.
                     Stores (or merges) a record for the request in the db and marks its
                     msg_id as pending for the target engine. Malformed prefixes, messages
                     that fail to unserialize and unregistered targets are logged and dropped."""
                     if len(idents) < 2:
                         self.log.error("invalid identity prefix: %r"%idents)
                         return
                     queue_id, client_id = idents[:2]
                     try:
                         msg = self.session.unserialize(msg)
                     except Exception:
                         self.log.error("queue::client %r sent invalid message to %r: %r"%(client_id, queue_id, msg), exc_info=True)
                         return
                     # translate the queue identity into an engine id
                     eid = self.by_ident.get(queue_id, None)
                     if eid is None:
                         self.log.error("queue::target %r not registered"%queue_id)
                         self.log.debug("queue::    valid are: %r"%(self.by_ident.keys()))
                         return
                     record = init_record(msg)
                     msg_id = record['msg_id']
                     # Unicode in records
                     record['engine_uuid'] = queue_id.decode('ascii')
                     record['client_uuid'] = client_id.decode('ascii')
                     record['queue'] = 'mux'
                     try:
                         # it's possible iopub arrived first:
                         existing = self.db.get_record(msg_id)
                         # merge: keep stored values the new record lacks, warn on conflicts
                         for key,evalue in existing.iteritems():
                             rvalue = record.get(key, None)
                             if evalue and rvalue and evalue != rvalue:
                                 self.log.warn("conflicting initial state for record: %r:%r <%r> %r"%(msg_id, rvalue, key, evalue))
                             elif evalue and not rvalue:
                                 record[key] = evalue
                         try:
                             self.db.update_record(msg_id, record)
                         except Exception:
                             self.log.error("DB Error updating record %r"%msg_id, exc_info=True)
                     except KeyError:
                         # a KeyError is taken to mean that no record exists yet: create one
                         try:
                             self.db.add_record(msg_id, record)
                         except Exception:
                             self.log.error("DB Error adding record %r"%msg_id, exc_info=True)
                     # tracked as pending even if the db write failed (failures are only logged)
                     self.pending.add(msg_id)
                     self.queues[eid].append(msg_id)
                 def save_queue_result(self, idents, msg):
                     """Save the reply an engine sent back through the MUX queue.

                     `idents` must hold at least two entries, unpacked as
                     (client identity, engine queue identity).  A reply to a pending
                     request moves the msg_id from the engine's queue to its completed
                     list; the result header, content, buffers and timestamps are then
                     written to the request's DB record.
                     """
                     if len(idents) < 2:
                         self.log.error("invalid identity prefix: %r"%idents)
                         return

                     client_id, queue_id = idents[:2]
                     try:
                         msg = self.session.unserialize(msg)
                     except Exception:
                         self.log.error("queue::engine %r sent invalid message to %r: %r"%(
                                 queue_id,client_id, msg), exc_info=True)
                         return

                     eid = self.by_ident.get(queue_id, None)
                     if eid is None:
                         self.log.error("queue::unknown engine %r is sending a reply: "%queue_id)
                         return

                     parent_header = msg['parent_header']
                     if not parent_header:
                         return
                     msg_id = parent_header['msg_id']

                     was_pending = msg_id in self.pending
                     if not was_pending and msg_id not in self.all_completed:
                         # it could be a result from a dead engine that died before
                         # delivering the result
                         self.log.warn("queue:: unknown msg finished %r"%msg_id)
                         return
                     if was_pending:
                         self.pending.remove(msg_id)
                         self.all_completed.add(msg_id)
                         self.queues[eid].remove(msg_id)
                         self.completed[eid].append(msg_id)

                     # update record anyway, because the unregistration could have been premature
                     reply_header = msg['header']
                     finished_at = reply_header['date']
                     started_at = reply_header.get('started', None)
                     result = {
                         'result_header': reply_header,
                         'result_content': msg['content'],
                         'started': started_at,
                         'completed': finished_at,
                         'result_buffers': msg['buffers'],
                     }
                     try:
                         self.db.update_record(msg_id, result)
                     except Exception:
                         self.log.error("DB Error updating record %r"%msg_id, exc_info=True)
                 #--------------------- Task Queue Traffic ------------------------------
                 def save_task_request(self, idents, msg):
                     """Save the submission of a task.

                     The first entry of `idents` is used as the submitting client's
                     identity.  The msg_id is marked pending and unassigned, then the
                     request is merged into an existing DB record (IOPub output may have
                     arrived first, or the task may be a resubmission) or stored as a new
                     record.  DB failures are logged, not raised.
                     """
                     client_id = idents[0]
                     try:
                         msg = self.session.unserialize(msg)
                     except Exception:
                         self.log.error("task::client %r sent invalid task message: %r"%(
                                 client_id, msg), exc_info=True)
                         return
                     record = init_record(msg)
                     record['client_uuid'] = client_id
                     record['queue'] = 'task'
                     header = msg['header']
                     msg_id = header['msg_id']
                     self.pending.add(msg_id)
                     self.unassigned.add(msg_id)

                     # Only the lookup itself may signal "no record yet" with a KeyError.
                     # The merge further down is kept out of this try so that a KeyError
                     # raised there is not mistaken for a missing record (which would
                     # call add_record for a msg_id that is already stored).
                     try:
                         existing = self.db.get_record(msg_id)
                     except KeyError:
                         try:
                             self.db.add_record(msg_id, record)
                         except Exception:
                             self.log.error("DB Error adding record %r"%msg_id, exc_info=True)
                         return
                     except Exception:
                         self.log.error("DB Error saving task request %r"%msg_id, exc_info=True)
                         return

                     # a record already exists: it's possible iopub arrived first,
                     # or the task is being resubmitted
                     try:
                         if existing.get('resubmitted'):
                             for key in ('submitted', 'client_uuid', 'buffers'):
                                 # don't clobber these keys on resubmit
                                 # submitted and client_uuid should be different
                                 # and buffers might be big, and shouldn't have changed
                                 record.pop(key, None)
                                 # still check content,header which should not change
                                 # but are not expensive to compare as buffers
                         for key,evalue in existing.iteritems():
                             if key.endswith('buffers'):
                                 # don't compare buffers
                                 continue
                             rvalue = record.get(key, None)
                             if evalue and rvalue and evalue != rvalue:
                                 self.log.warn("conflicting initial state for record: %r:%r <%r> %r"%(msg_id, rvalue, key, evalue))
                             elif evalue and not rvalue:
                                 record[key] = evalue
                     except Exception:
                         self.log.error("DB Error saving task request %r"%msg_id, exc_info=True)
                         return

                     try:
                         self.db.update_record(msg_id, record)
                     except Exception:
                         self.log.error("DB Error updating record %r"%msg_id, exc_info=True)
                 def save_task_result(self, idents, msg):
                     """Save the result of a completed task.

                     The first entry of `idents` is only used for logging.  The reply's
                     parent header names the task; its own header may carry the uuid of
                     the engine that ran it under 'engine'.  A pending task is moved to
                     the completed bookkeeping and its result is written to the DB
                     record; a task that is not pending is only logged at debug level.
                     """
                     client_id = idents[0]
                     try:
                         msg = self.session.unserialize(msg)
                     except Exception:
                         self.log.error("task::invalid task result message send to %r: %r"%(
                                 client_id, msg), exc_info=True)
                         return

                     parent = msg['parent_header']
                     if not parent:
                         self.log.warn("Task %r had no parent!"%msg)
                         return
                     msg_id = parent['msg_id']
                     # a task with a result is no longer waiting for an engine
                     self.unassigned.discard(msg_id)

                     header = msg['header']
                     engine_uuid = header.get('engine', None)
                     # eid stays None when the engine is not (or no longer) registered
                     eid = self.by_ident.get(engine_uuid, None)

                     if msg_id not in self.pending:
                         self.log.debug("task::unknown task %r finished"%msg_id)
                         return

                     self.pending.remove(msg_id)
                     self.all_completed.add(msg_id)
                     if eid is not None:
                         self.completed[eid].append(msg_id)
                         if msg_id in self.tasks[eid]:
                             self.tasks[eid].remove(msg_id)
                     completed = header['date']
                     started = header.get('started', None)
                     result = {
                         'result_header' : header,
                         'result_content': msg['content'],
                         'started' : started,
                         'completed' : completed,
                         'engine_uuid': engine_uuid,
                         'result_buffers': msg['buffers'],
                     }
                     try:
                         self.db.update_record(msg_id, result)
                     except Exception:
                         # this is the *result* being saved, not the request
                         self.log.error("DB Error saving task result %r"%msg_id, exc_info=True)
                 def save_task_destination(self, idents, msg):
                     """Record which engine a task has been assigned to.

                     The unserialized message's content provides `msg_id` and
                     `engine_id`.  The task is dropped from the unassigned set, appended
                     to that engine's task list, and the engine uuid is written to the
                     task's DB record.
                     """
                     try:
                         msg = self.session.unserialize(msg, content=True)
                     except Exception:
                         self.log.error("task::invalid task tracking message", exc_info=True)
                         return

                     tracking = msg['content']
                     msg_id = tracking['msg_id']
                     engine_uuid = tracking['engine_id']
                     eid = self.by_ident[util.asbytes(engine_uuid)]
                     self.log.info("task::task %r arrived on %r"%(msg_id, eid))

                     # the task now has a home, so it is no longer unassigned
                     self.unassigned.discard(msg_id)
                     self.tasks[eid].append(msg_id)

                     try:
                         self.db.update_record(msg_id, {'engine_uuid': engine_uuid})
                     except Exception:
                         self.log.error("DB Error saving task destination %r"%msg_id, exc_info=True)
                 def mia_task_request(self, idents, msg):
                     """Handle a 'mia' task request -- not implemented.

                     Always raises NotImplementedError; `idents` and `msg` are unused.
                     """
                     # Sketch of the intended reply, never enabled:
                     #   content = dict(mia=self.mia,status='ok')
                     #   self.session.send('mia_reply', content=content, idents=idents[0])
                     raise NotImplementedError
                 #--------------------- IOPub Traffic ------------------------------
                 def save_iopub_message(self, topics, msg):
                     """Store an IOPub message in the DB record of its parent request.

                     Stream output is appended to what the record already holds under
                     the stream's name; 'pyerr' stores the whole content, 'pyin' stores
                     the code, and any other message type stores content['data'] (or ''
                     when absent) under the message type.  A record is created first if
                     the parent msg_id is not in the DB yet.
                     """
                     try:
                         msg = self.session.unserialize(msg, content=True)
                     except Exception:
                         self.log.error("iopub::invalid IOPub message", exc_info=True)
                         return

                     parent = msg['parent_header']
                     if not parent:
                         self.log.error("iopub::invalid IOPub message: %r"%msg)
                         return

                     msg_id = parent['msg_id']
                     msg_type = msg['header']['msg_type']
                     content = msg['content']

                     # make sure there is a record to update
                     try:
                         rec = self.db.get_record(msg_id)
                     except KeyError:
                         rec = empty_record()
                         rec['msg_id'] = msg_id
                         self.db.add_record(msg_id, rec)

                     if msg_type == 'stream':
                         name = content['name']
                         so_far = rec[name] or ''
                         update = {name: so_far + content['data']}
                     elif msg_type == 'pyerr':
                         update = {'pyerr': content}
                     elif msg_type == 'pyin':
                         update = {'pyin': content['code']}
                     else:
                         update = {msg_type: content.get('data', '')}

                     try:
                         self.db.update_record(msg_id, update)
                     except Exception:
                         self.log.error("DB Error saving iopub message %r"%msg_id, exc_info=True)
                 #-------------------------------------------------------------------------
                 # Registration requests
                 #-------------------------------------------------------------------------
                 def connection_request(self, client_id, msg):
                     """Reply with connection addresses for clients.

                     The reply carries everything in `self.client_info` plus an
                     'engines' table mapping str(engine id) to the ascii-decoded uuid of
                     every engine in `self.keytable` that is not in `self.dead_engines`.
                     """
                     self.log.info("client::client %r connected"%client_id)
                     reply = dict(status='ok')
                     reply.update(self.client_info)
                     reply['engines'] = dict(
                         (str(eid), uuid.decode('ascii'))
                         for eid, uuid in self.keytable.iteritems()
                         if uuid not in self.dead_engines
                     )
                     self.session.send(self.query, 'connection_reply', reply, parent=msg, ident=client_id)
                 def register_engine(self, reg, msg):
                     """Register a new engine.

                     Reads the engine's queue identity (required) and heartbeat identity
                     from the message content, refuses either one if it is already in
                     use by a registered or half-registered engine, and sends a
                     'registration_reply' to `reg`.  On success the registration is
                     finished at once when the heart is already beating; otherwise it is
                     parked in `self.incoming_registrations` together with a delayed
                     callback that purges it after `self.registration_timeout`.

                     Returns the engine id that was reserved (also when the registration
                     was refused), or None when no queue was specified.
                     """
                     request = msg['content']
                     try:
                         queue = util.asbytes(request['queue'])
                     except KeyError:
                         self.log.error("registration::queue not specified", exc_info=True)
                         return
                     heart = request.get('heartbeat', None)
                     if heart:
                         heart = util.asbytes(heart)

                     eid = self._next_id
                     self.log.debug("registration::register_engine(%i, %r, %r, %r)"%(eid, queue, reg, heart))

                     reply = dict(id=eid,status='ok')
                     reply.update(self.engine_info)

                     # look for an identity clash, first among registered engines,
                     # then among registrations still waiting for a heartbeat
                     conflict = None
                     if queue in self.by_ident:
                         conflict = "queue_id %r in use"%queue
                     elif heart in self.hearts:
                         conflict = "heart_id %r in use"%heart
                     else:
                         for waiting_heart, pack in self.incoming_registrations.iteritems():
                             if heart == waiting_heart:
                                 conflict = "heart_id %r in use"%heart
                                 break
                             if queue == pack[1]:
                                 conflict = "queue_id %r in use"%queue
                                 break

                     if conflict is not None:
                         # raise-and-catch so that wrap_exception has a live exception
                         try:
                             raise KeyError(conflict)
                         except KeyError:
                             self.log.error(conflict, exc_info=True)
                             reply = error.wrap_exception()

                     self.session.send(self.query, "registration_reply",
                             content=reply,
                             ident=reg)

                     if reply['status'] != 'ok':
                         self.log.error("registration::registration %i failed: %r"%(eid, reply['evalue']))
                     elif heart in self.heartmonitor.hearts:
                         # already beating
                         self.incoming_registrations[heart] = (eid,queue,reg[0],None)
                         self.finish_registration(heart)
                     else:
                         def purge():
                             self._purge_stalled_registration(heart)
                         dc = ioloop.DelayedCallback(purge, self.registration_timeout, self.loop)
                         dc.start()
                         self.incoming_registrations[heart] = (eid,queue,reg[0],dc)
                     return eid
                 def unregister_engine(self, ident, msg):
                     """Unregister an engine that explicitly requested to leave.

                     The engine's uuid is added to `self.dead_engines`, a delayed call
                     to `_handle_stranded_msgs` is scheduled after
                     `self.registration_timeout`, and an 'unregistration_notification'
                     is sent when a notifier is available.
                     """
                     try:
                         eid = msg['content']['id']
                     except:
                         self.log.error("registration::bad engine id for unregistration: %r"%ident, exc_info=True)
                         return
                     self.log.info("registration::unregister_engine(%r)"%eid)

                     uuid = self.keytable[eid]
                     notice = dict(id=eid, queue=uuid.decode('ascii'))
                     self.dead_engines.add(uuid)
                     # TODO: the engine's entries in self.ids, self.keytable,
                     # self.engines, self.hearts, self.by_ident and self.completed
                     # are not removed yet.

                     def handle_stranded():
                         self._handle_stranded_msgs(eid, uuid)
                     dc = ioloop.DelayedCallback(handle_stranded, self.registration_timeout, self.loop)
                     dc.start()

                     if self.notifier:
                         self.session.send(self.notifier, "unregistration_notification", content=notice)
                 def _handle_stranded_msgs(self, eid, uuid):
                     """Fail every message still listed in an unregistered engine's queue.

                     Each msg_id in `self.queues[eid]` is moved from pending to
                     completed, and its DB record receives a wrapped EngineError as
                     result content together with a fabricated result header.

                     It is possible that this will fire prematurely - that is, an engine
                     will go down after completing a result, and the client will be
                     notified that the result failed and later receive the actual result.
                     """
                     for msg_id in self.queues[eid]:
                         self.pending.remove(msg_id)
                         self.all_completed.add(msg_id)
                         # raise-and-catch so that wrap_exception has a live exception
                         try:
                             raise error.EngineError("Engine %r died while running task %r"%(eid, msg_id))
                         except:
                             failure = error.wrap_exception()
                         # build a fake header:
                         died_at = datetime.now()
                         fake_header = {'engine': uuid, 'date': died_at}
                         rec = {
                             'result_content': failure,
                             'result_header': fake_header,
                             'result_buffers': [],
                             'completed': died_at,
                             'engine_uuid': uuid,
                         }
                         try:
                             self.db.update_record(msg_id, rec)
                         except Exception:
                             self.log.error("DB Error handling stranded msg %r"%msg_id, exc_info=True)
                 def finish_registration(self, heart):
                     """Second half of engine registration, called after our HeartMonitor
                     has received a beat from the Engine's Heart.

                     Pops the pending registration stored under `heart`, stops its purge
                     callback if it has one, fills in the hub's per-engine tables and
                     sends a 'registration_notification' when a notifier is available.
                     """
                     try:
                         eid, queue, reg, purge = self.incoming_registrations.pop(heart)
                     except KeyError:
                         self.log.error("registration::tried to finish nonexistant registration", exc_info=True)
                         return
                     self.log.info("registration::finished registering engine %i:%r"%(eid,queue))
                     if purge is not None:
                         purge.stop()

                     self.ids.add(eid)
                     self.keytable[eid] = queue
                     # the control identity is the same as the queue identity
                     self.engines[eid] = EngineConnector(id=eid, queue=queue, registration=reg,
                                                 control=queue, heartbeat=heart)
                     self.by_ident[queue] = eid
                     # fresh, independent job lists for the new engine
                     self.queues[eid] = []
                     self.tasks[eid] = []
                     self.completed[eid] = []
                     self.hearts[heart] = eid

                     notice = dict(id=eid, queue=self.engines[eid].queue.decode('ascii'))
                     if self.notifier:
                         self.session.send(self.notifier, "registration_notification", content=notice)
                     self.log.info("engine::Engine Connected: %i"%eid)
                 def _purge_stalled_registration(self, heart):
                     """Drop the pending registration stored under `heart`, if there is one."""
                     try:
                         stalled = self.incoming_registrations.pop(heart)
                     except KeyError:
                         # nothing is waiting under this heart
                         return
                     self.log.info("registration::purging stalled registration: %i"%stalled[0])
                 #-------------------------------------------------------------------------
                 # Client Requests
                 #-------------------------------------------------------------------------
                 def shutdown_request(self, client_id, msg):
                     """Handle a shutdown request.

                     Replies 'ok' to the requesting client, broadcasts a
                     'shutdown_notice' when a notifier is available, and schedules
                     `_shutdown` to run after a 1000 ms delay on `self.loop`.
                     """
                     self.session.send(self.query, 'shutdown_reply', content={'status': 'ok'}, ident=client_id)
                     # also notify other clients of shutdown; guarded like the other
                     # notifier uses in this class, so that a missing notifier cannot
                     # abort the handler before the shutdown has been scheduled
                     if self.notifier:
                         self.session.send(self.notifier, 'shutdown_notice', content={'status': 'ok'})
                     dc = ioloop.DelayedCallback(lambda : self._shutdown(), 1000, self.loop)
                     dc.start()
                 def _shutdown(self):
                     """Log the shutdown, sleep for 0.1 s, then exit with status 0."""
                     self.log.info("hub::hub shutting down.")
                     # NOTE(review): the short pause presumably lets pending output
                     # flush before the process exits -- confirm
                     time.sleep(0.1)
                     raise SystemExit(0)
                 def check_load(self, client_id, msg):
                     """Reply with the number of outstanding jobs on each requested target.

                     The load of a target is the length of its MUX queue plus the length
                     of its task list.  If the targets are missing or fail validation, a
                     'hub_error' is sent instead of a 'load_reply'.
                     """
                     request = msg['content']
                     try:
                         targets = self._validate_targets(request['targets'])
                     except:
                         self.session.send(self.query, "hub_error",
                                 content=error.wrap_exception(), ident=client_id)
                         return

                     loads = dict(status='ok')
                     for target in targets:
                         outstanding = len(self.queues[target]) + len(self.tasks[target])
                         loads[bytes(target)] = outstanding
                     self.session.send(self.query, "load_reply", content=loads, ident=client_id)
                 def queue_status(self, client_id, msg):
                     """Return the Queue status of one or more targets.

                     if verbose: return the msg_ids
                     else: return len of each type.

                     keys: queue (pending MUX jobs)
                         tasks (pending Task jobs)
                         completed (finished jobs from both queues)

                     The reply also carries 'unassigned': the unassigned task ids when
                     verbose, otherwise how many there are.
                     """
                     request = msg['content']
                     targets = request['targets']
                     try:
                         targets = self._validate_targets(targets)
                     except:
                         self.session.send(self.query, "hub_error",
                                 content=error.wrap_exception(), ident=client_id)
                         return

                     verbose = request.get('verbose', False)
                     reply = dict(status='ok')
                     for target in targets:
                         jobs = {
                             'queue': self.queues[target],
                             'completed': self.completed[target],
                             'tasks': self.tasks[target],
                         }
                         if not verbose:
                             # only report how many there are of each kind
                             jobs = dict((kind, len(ids)) for kind, ids in jobs.items())
                         reply[str(target)] = jobs
                     if verbose:
                         reply['unassigned'] = list(self.unassigned)
                     else:
                         reply['unassigned'] = len(self.unassigned)
                     self.session.send(self.query, "queue_reply", content=reply, ident=client_id)
                 def purge_results(self, client_id, msg):
                     """Drop stored records on a client's request.

                     content['msg_ids'] is either the string 'all' (drop every record
                     that has a completion time) or a list of msg_ids, none of which may
                     still be pending.  After a successful msg_id purge, the completed
                     records of every engine in content['engine_ids'] are dropped too.
                     The outcome is sent back as a 'purge_reply'.
                     """
                     request = msg['content']
                     self.log.info("Dropping records with %s", request)
                     msg_ids = request.get('msg_ids', [])
                     reply = dict(status='ok')
                     if msg_ids == 'all':
                         try:
                             self.db.drop_matching_records({'completed': {'$ne': None}})
                         except Exception:
                             reply = error.wrap_exception()
                     else:
                         inflight = [m for m in msg_ids if m in self.pending]
                         if not inflight:
                             try:
                                 self.db.drop_matching_records({'msg_id': {'$in': msg_ids}})
                             except Exception:
                                 reply = error.wrap_exception()
                         else:
                             # raise-and-catch so that wrap_exception has a live exception
                             try:
                                 raise IndexError("msg pending: %r"%inflight[0])
                             except:
                                 reply = error.wrap_exception()

                         if reply['status'] == 'ok':
                             for eid in request.get('engine_ids', []):
                                 if eid in self.engines:
                                     uid = self.engines[eid].queue
                                     try:
                                         self.db.drop_matching_records(
                                             {'engine_uuid': uid, 'completed': {'$ne': None}})
                                     except Exception:
                                         reply = error.wrap_exception()
                                         break
                                 else:
                                     try:
                                         raise IndexError("No such engine: %i"%eid)
                                     except:
                                         reply = error.wrap_exception()
                                     break

                     self.session.send(self.query, 'purge_reply', content=reply, ident=client_id)
                 def resubmit_task(self, client_id, msg):
                     """Resubmit one or more tasks.

                     content['msg_ids'] lists the tasks.  Every id must match exactly one
                     DB record and none may still be pending; otherwise an error reply
                     is sent and nothing is resubmitted.  The stored records are reset,
                     the original requests are sent out again on `self.resubmit`, and a
                     'resubmit_reply' reports the outcome to the client.
                     """
                     def finish(reply):
                         self.session.send(self.query, 'resubmit_reply', content=reply, ident=client_id)

                     content = msg['content']
                     msg_ids = content['msg_ids']
                     reply = dict(status='ok')
                     try:
                         records = self.db.find_records({'msg_id' : {'$in' : msg_ids}}, keys=[
                             'header', 'content', 'buffers'])
                     except Exception:
                         self.log.error('db::db error finding tasks to resubmit', exc_info=True)
                         return finish(error.wrap_exception())

                     # validate msg_ids
                     found_ids = [ rec['msg_id'] for rec in records ]
                     invalid_ids = [ m for m in found_ids if m in self.pending ]
                     # each failure is raised and caught so that wrap_exception has a
                     # live exception to serialize
                     if len(records) > len(msg_ids):
                         try:
                             raise RuntimeError("DB appears to be in an inconsistent state."
                                 "More matching records were found than should exist")
                         except Exception:
                             return finish(error.wrap_exception())
                     elif len(records) < len(msg_ids):
                         missing = [ m for m in msg_ids if m not in found_ids ]
                         try:
                             raise KeyError("No such msg(s): %r"%missing)
                         except KeyError:
                             return finish(error.wrap_exception())
                     elif invalid_ids:
                         msg_id = invalid_ids[0]
                         try:
                             raise ValueError("Task %r appears to be inflight"%(msg_id))
                         except Exception:
                             return finish(error.wrap_exception())

                     # clear the existing records
                     now = datetime.now()
                     rec = empty_record()
                     # these keys keep the values of the original submission
                     for key in ('msg_id', 'header', 'content', 'buffers', 'submitted'):
                         rec.pop(key)
                     rec['resubmitted'] = now
                     rec['queue'] = 'task'
                     rec['client_uuid'] = client_id[0]
                     try:
                         for msg_id in msg_ids:
                             self.all_completed.discard(msg_id)
                             self.db.update_record(msg_id, rec)
                     except Exception:
                         self.log.error('db::db error upating record', exc_info=True)
                         reply = error.wrap_exception()
                     else:
                         # send the messages
                         for rec in records:
                             header = rec['header']
                             # include resubmitted in header to prevent digest collision
                             header['resubmitted'] = now
                             msg = self.session.msg(header['msg_type'])
                             msg['content'] = rec['content']
                             msg['header'] = header
                             msg['header']['msg_id'] = rec['msg_id']
                             self.session.send(self.resubmit, msg, buffers=rec['buffers'])

                     # report the real outcome: `reply` holds the wrapped error when the
                     # record update failed, and status 'ok' otherwise
                     finish(reply)
                 def _extract_record(self, rec):
                     """Split a TaskRecord dict into the pieces of a get_result reply.

                     Returns a (content, buffers) pair: `content` holds the record's
                     result content, request header, result header and captured io
                     (pyin/pyout/pyerr/stdout/stderr); `buffers` is the record's result
                     buffers converted with bytes(), or [] when it has none.
                     """
                     captured_io = dict(
                         (key, rec[key])
                         for key in ('pyin', 'pyout', 'pyerr', 'stdout', 'stderr')
                     )
                     content = {
                         'result_content': rec['result_content'],
                         'header': rec['header'],
                         'result_header': rec['result_header'],
                         'io': captured_io,
                     }
                     raw_buffers = rec['result_buffers']
                     if not raw_buffers:
                         return content, []
                     return content, [bytes(buf) for buf in raw_buffers]
                 def get_results(self, client_id, msg):
                     """Get the result of 1 or more messages.

                     content['msg_ids'] lists the requests of interest; with
                     content['status_only'] set, only the pending/completed
                     classification is reported and the DB is not queried.  The
                     'result_reply' lists the ids under 'pending' and 'completed' and,
                     for completed ones, carries the extracted record under the msg_id
                     with its buffers appended to the reply.  An unknown msg_id turns
                     the whole reply into a wrapped KeyError.
                     """
                     content = msg['content']
                     msg_ids = sorted(set(content['msg_ids']))
                     statusonly = content.get('status_only', False)
                     pending = []
                     completed = []
                     content = dict(status='ok')
                     content['pending'] = pending
                     content['completed'] = completed
                     buffers = []
                     if not statusonly:
                         try:
                             matches = self.db.find_records(dict(msg_id={'$in':msg_ids}))
                             # turn match list into dict, for faster lookup
                             records = dict((match['msg_id'], match) for match in matches)
                         except Exception:
                             content = error.wrap_exception()
                             self.session.send(self.query, "result_reply", content=content,
                                                                 parent=msg, ident=client_id)
                             return
                     else:
                         records = {}
                     for msg_id in msg_ids:
                         if msg_id in self.pending:
                             pending.append(msg_id)
                         elif msg_id in self.all_completed:
                             completed.append(msg_id)
                             if not statusonly:
                                 c,bufs = self._extract_record(records[msg_id])
                                 content[msg_id] = c
                                 buffers.extend(bufs)
                         elif msg_id in records:
                             # known only to the DB: judge completion from this
                             # message's own record, not from whichever record the
                             # lookup loop happened to visit last
                             record = records[msg_id]
                             if record['completed']:
                                 completed.append(msg_id)
                                 c,bufs = self._extract_record(record)
                                 content[msg_id] = c
                                 buffers.extend(bufs)
                             else:
                                 pending.append(msg_id)
                         else:
                             # raise-and-catch so that wrap_exception has a live exception
                             try:
                                 raise KeyError('No such message: '+msg_id)
                             except:
                                 content = error.wrap_exception()
                             break
                     self.session.send(self.query, "result_reply", content=content,
                                                         parent=msg, ident=client_id,
                                                         buffers=buffers)
                 def get_history(self, client_id, msg):
                     """Reply with the msg_ids of every record in the task database.

                     Sends a ``history_reply`` on the query socket; if the database call
                     raises, the reply content is the wrapped exception instead.
                     """
                     try:
                         reply = dict(status='ok', history=self.db.get_history())
                     except Exception:
                         reply = error.wrap_exception()
                     self.session.send(
                         self.query, "history_reply",
                         content=reply, parent=msg, ident=client_id,
                     )
                 def db_query(self, client_id, msg):
                     """Run a raw query against the task record database and reply.

                     The request content may carry ``query`` (defaults to ``{}``) and
                     ``keys`` (defaults to None).  Buffers are stripped out of the
                     returned records and attached to the ``db_reply`` message; the
                     content reports how many buffers each record contributed in
                     ``buffer_lens`` and ``result_buffer_lens``.  A length list is None
                     when ``keys`` was given and does not name that buffer field.
                     """
                     request = msg['content']
                     query = request.get('query', {})
                     keys = request.get('keys', None)
                     buffers = []
                     try:
                         records = self.db.find_records(query, keys)
                     except Exception:
                         content = error.wrap_exception()
                     else:
                         # only collect the buffer fields that the query asked for
                         buffer_lens = [] if keys is None or 'buffers' in keys else None
                         result_buffer_lens = [] if keys is None or 'result_buffers' in keys else None
                         fields = (('buffers', buffer_lens),
                                   ('result_buffers', result_buffer_lens))
                         for rec in records:
                             for field, lens in fields:
                                 if lens is None:
                                     continue
                                 # the stored value may be None, so fall back to empty
                                 found = rec.pop(field, None) or []
                                 lens.append(len(found))
                                 buffers.extend(found)
                         content = dict(status='ok', records=records, buffer_lens=buffer_lens,
                                        result_buffer_lens=result_buffer_lens)
                     self.session.send(self.query, "db_reply", content=content,
                                       parent=msg, ident=client_id,
                                       buffers=buffers)

IPython/parallel/controller/scheduler.py

0 +2 -2

             """The Python scheduler for rich scheduling.
             The Pure ZMQ scheduler does not allow routing schemes other than LRU,
             nor does it check msg_id DAG dependencies. For those, a slightly slower
             Python Scheduler exists.
             Authors:
             * Min RK
             """
             #-----------------------------------------------------------------------------
             #  Copyright (C) 2010-2011  The IPython Development Team
             #
             #  Distributed under the terms of the BSD License.  The full license is in
             #  the file COPYING, distributed as part of this software.
             #-----------------------------------------------------------------------------
             #----------------------------------------------------------------------
             # Imports
             #----------------------------------------------------------------------
             from __future__ import print_function
             import logging
             import sys
             from datetime import datetime, timedelta
             from random import randint, random
             from types import FunctionType
             try:
                 import numpy
             except ImportError:
                 numpy = None
             import zmq
             from zmq.eventloop import ioloop, zmqstream
             # local imports
             from IPython.external.decorator import decorator
             from IPython.config.application import Application
             from IPython.config.loader import Config
             from IPython.utils.traitlets import Instance, Dict, List, Set, Int, Enum, CBytes
             from IPython.parallel import error
             from IPython.parallel.factory import SessionFactory
             from IPython.parallel.util import connect_logger, local_logger, asbytes
             from .dependency import Dependency
             @decorator
             def logged(f,self,*args,**kwargs):
                 """Log a debug line naming the wrapped method and its arguments, then call it.

                 `f` is the wrapped function and `self` the instance it is called on;
                 the return value of `f` is passed through unchanged.
                 """
                 # __name__ rather than func_name: func_name is a Python-2-only alias
                 # and is missing on callables that are not plain functions
                 self.log.debug("scheduler::%s(*%s,**%s)", f.__name__, args, kwargs)
                 return f(self,*args, **kwargs)
             #----------------------------------------------------------------------
             # Chooser functions
             #----------------------------------------------------------------------
             def plainrandom(loads):
                 """Pick an index of `loads` uniformly at random.

                 Only the length of `loads` is used; the load values are ignored.
                 """
                 last = len(loads) - 1
                 return randint(0, last)
             def lru(loads):
                 """Choose the front of the line.

                 `loads` is assumed to be in LRU order with the oldest entry first,
                 so the answer is always position 0; the values are never inspected.
                 """
                 head_of_line = 0
                 return head_of_line
             def twobin(loads):
                 """Draw two random positions and return the smaller one.

                 `loads` is assumed to be in LRU order with the oldest entry first,
                 so the smaller index is the less recently used of the two.  The
                 load values themselves are ignored.
                 """
                 last = len(loads) - 1
                 first_pick = randint(0, last)
                 second_pick = randint(0, last)
                 if second_pick < first_pick:
                     return second_pick
                 return first_pick
             def weighted(loads):
                 """Pick two positions at random, weighted by inverse load.

                 Returns whichever of the two has the larger weight, i.e. the less
                 loaded one; the first pick is kept when the weights tie.
                 """
                 # the 1e-6 offset weights a load of 0 a million times more than 1
                 weights = 1./(1e-6+numpy.array(loads))
                 cumulative = weights.cumsum()
                 total = cumulative[-1]

                 def locate(threshold):
                     # first position whose cumulative weight is not below threshold
                     pos = 0
                     while cumulative[pos] < threshold:
                         pos += 1
                     return pos

                 first = locate(random()*total)
                 second = locate(random()*total)
                 if weights[second] > weights[first]:
                     return second
                 return first
             def leastload(loads):
                 """Return the position of the smallest load.

                 When the minimum occurs more than once the first occurrence wins,
                 so with LRU-ordered loads the least recently used of the least
                 loaded entries is chosen.
                 """
                 lightest = min(loads)
                 return loads.index(lightest)
             #---------------------------------------------------------------------
             # Classes
             #---------------------------------------------------------------------
             # Shared empty Dependency, built once from an empty list.  The scheduler
             # substitutes it wherever a task has no outstanding time dependencies.
             MET = Dependency([])
             class TaskScheduler(SessionFactory):
                 """Python TaskScheduler object.
                 This is the simplest object that supports msg_id based
                 DAG dependencies. *Only* task msg_ids are checked, not
                 msg_ids of jobs submitted via the MUX queue.
                 """
                 # Configurable cap on outstanding tasks per engine.  The default 0 is
                 # falsy, so the `self.hwm` checks in this class skip the limit.
                 hwm = Int(0, config=True, shortname='hwm',
                     help="""specify the High Water Mark (HWM) for the downstream
                     socket in the Task scheduler. This is the maximum number
                     of allowed outstanding tasks on each engine."""
                 )
                 # Configurable name of the engine-choosing scheme; declared default
                 # is 'leastload'.
                 # NOTE(review): the help text says "[default: Python LRU]" while the
                 # default value here is 'leastload' -- confirm which is intended.
                 scheme_name = Enum(('leastload', 'pure', 'lru', 'plainrandom', 'weighted', 'twobin'),
                     'leastload', config=True, shortname='scheme', allow_none=False,
                     help="""select the task scheduler scheme  [default: Python LRU]
                     Options are: 'pure', 'lru', 'plainrandom', 'weighted', 'twobin','leastload'"""
                 )
                 def _scheme_name_changed(self, old, new):
                     """Point `self.scheme` at the module-level function named `new`.

                     `old` is accepted but not used.
                     """
                     message = "Using scheme %r"%new
                     self.log.debug(message)
                     chooser = globals()[new]
                     self.scheme = chooser
                 # input arguments:
                 # `scheme` is called with a list of loads and returns the position of
                 # the engine to use (see submit_task).
                 scheme = Instance(FunctionType) # function for determining the destination
                 def _scheme_default(self):
                     """Supply the initial value of `scheme`: the `leastload` chooser."""
                     default_chooser = leastload
                     return default_chooser
                 client_stream = Instance(zmqstream.ZMQStream) # client-facing stream
                 engine_stream = Instance(zmqstream.ZMQStream) # engine-facing stream
                 notifier_stream = Instance(zmqstream.ZMQStream) # hub-facing sub stream
                 mon_stream = Instance(zmqstream.ZMQStream) # hub-facing pub stream
                 # internals:
                 graph = Dict() # dict by msg_id of [ msg_ids that depend on key ]
                 retries = Dict() # dict by msg_id of retries remaining (non-neg ints)
                 # waiting = List() # list of msg_ids ready to run, but haven't due to HWM
                 depending = Dict() # dict by msg_id of [raw_msg, targets, after, follow, timeout]
                 pending = Dict() # dict by engine_uuid of {msg_id: (raw_msg, targets, MET, follow, timeout)}
                 completed = Dict() # dict by engine_uuid of completed tasks
                 failed = Dict() # dict by engine_uuid of failed tasks
                 destinations = Dict() # dict by msg_id of engine_uuids where jobs ran (reverse of completed+failed)
                 clients = Dict() # dict by msg_id for who submitted the task
                 targets = List() # list of target IDENTs
                 loads = List() # list of engine loads, kept index-aligned with `targets`
                 # full = Set() # set of IDENTs that have HWM outstanding tasks
                 all_completed = Set() # set of all completed tasks
                 all_failed = Set() # set of all failed tasks
                 all_done = Set() # set of all finished tasks=union(completed,failed)
                 all_ids = Set() # set of all submitted task IDs
                 blacklist = Dict() # dict by msg_id of locations where a job has encountered UnmetDependency
                 auditor = Instance('zmq.eventloop.ioloop.PeriodicCallback') # created in start(); runs audit_timeouts
                 ident = CBytes() # ZMQ identity. This should just be self.session.session
                                  # but ensure Bytes
                 def _ident_default(self):
                     """Supply the default `ident`: the session id passed through `asbytes`."""
                     session_id = self.session.session
                     return asbytes(session_id)
                 def start(self):
                     """Attach the stream handlers, start the timeout auditor and log startup.

                     The client stream is not attached here; `resume_receiving` does
                     that.
                     """
                     self.engine_stream.on_recv(self.dispatch_result, copy=False)
                     # notification msg_type -> handler, used by dispatch_notification
                     self._notification_handlers = {
                         'registration_notification': self._register_engine,
                         'unregistration_notification': self._unregister_engine,
                     }
                     self.notifier_stream.on_recv(self.dispatch_notification)
                     # audit waiting tasks for expired timeouts at an interval of 2e3
                     # (PeriodicCallback takes its interval in milliseconds)
                     timeout_auditor = ioloop.PeriodicCallback(self.audit_timeouts, 2e3, self.loop)
                     self.auditor = timeout_auditor
                     self.auditor.start()
                     self.log.info("Scheduler started [%s]"%self.scheme_name)
                 def resume_receiving(self):
                     """Hand client submissions to `dispatch_submission` again."""
                     on_submission = self.dispatch_submission
                     self.client_stream.on_recv(on_submission, copy=False)
                 def stop_receiving(self):
                     """Detach the client stream handler while there are no engines.

                     Submissions that arrive meanwhile are left in the ZMQ queue.
                     """
                     no_handler = None
                     self.client_stream.on_recv(no_handler)
                 #-----------------------------------------------------------------------
                 # [Un]Registration Handling
                 #-----------------------------------------------------------------------
                 def dispatch_notification(self, msg):
                     """Dispatch register/unregister events.

                     The message is split from its identities and unserialized, then
                     routed by its header's ``msg_type`` through
                     `self._notification_handlers`.  The handler receives the
                     ``queue`` entry of the message content, passed through `asbytes`.

                     Messages that cannot be parsed are logged as warnings; unknown
                     message types and handler failures are logged as errors.  Nothing
                     is raised to the caller.
                     """
                     try:
                         idents,msg = self.session.feed_identities(msg)
                     except ValueError:
                         self.log.warn("task::Invalid Message: %r",msg)
                         return
                     try:
                         msg = self.session.unserialize(msg)
                     except ValueError:
                         self.log.warn("task::Unauthorized message from: %r"%idents)
                         return
                     msg_type = msg['header']['msg_type']
                     handler = self._notification_handlers.get(msg_type, None)
                     if handler is None:
                         self.log.error("Unhandled message type: %r"%msg_type)
                         return
                     try:
                         handler(asbytes(msg['content']['queue']))
                     except Exception:
                         # keep the traceback: the failure may be a bug inside the
                         # handler rather than a malformed notification
                         self.log.error("task::Invalid notification msg: %r", msg, exc_info=True)
                 def _register_engine(self, uid):
                     """Start scheduling onto the newly available engine `uid`."""
                     # the new engine goes to the head of the line, with no load
                     self.targets.insert(0,uid)
                     self.loads.insert(0,0)
                     # empty bookkeeping for the engine's tasks
                     self.completed[uid] = set()
                     self.failed[uid] = set()
                     self.pending[uid] = {}
                     is_first_engine = (len(self.targets) == 1)
                     if is_first_engine:
                         # there is somewhere to send work again
                         self.resume_receiving()
                     # rescan the whole graph now that capacity has changed
                     self.update_graph(None)
                 def _unregister_engine(self, uid):
                     """Stop scheduling onto engine `uid`, which became unavailable."""
                     if len(self.targets) == 1:
                         # the last engine is leaving
                         self.stop_receiving()
                     # process any results that are already waiting on the stream
                     self.engine_stream.flush()
                     # self.destinations is deliberately left alone: its entries
                     # may still be needed later
                     # take the engine out of rotation so it gets no more work
                     position = self.targets.index(uid)
                     del self.targets[position]
                     del self.loads[position]
                     if not self.pending[uid]:
                         # nothing outstanding: drop the engine's result sets now
                         self.completed.pop(uid)
                         self.failed.pop(uid)
                         return
                     # results may still be incoming, so wait 5 seconds before
                     # cleaning up the jobs that are still pending
                     dc = ioloop.DelayedCallback(lambda : self.handle_stranded_tasks(uid), 5000, self.loop)
                     dc.start()
                 def handle_stranded_tasks(self, engine):
                     """Deal with jobs resident in an engine that died.

                     For every task still pending on `engine`, an ``apply_reply``
                     wrapping an `error.EngineError` is built and fed through
                     `dispatch_result` as though the engine had sent it.  Afterwards
                     the engine's completed and failed sets are dropped.
                     """
                     lost = self.pending[engine]
                     # iterate over a snapshot: dispatching a reply pops entries
                     # from the pending dict while we loop
                     for msg_id in list(lost):
                         if msg_id not in self.pending[engine]:
                             # prevent double-handling of messages
                             continue
                         raw_msg = lost[msg_id][0]
                         idents,msg = self.session.feed_identities(raw_msg, copy=False)
                         parent = self.session.unpack(msg[1].bytes)
                         # reply identities: the dead engine first, then the client
                         idents = [engine, idents[0]]
                         # build fake error reply; raise and catch so that
                         # wrap_exception has a live exception to wrap
                         try:
                             raise error.EngineError("Engine %r died while running task %r"%(engine, msg_id))
                         except Exception:
                             content = error.wrap_exception()
                         msg = self.session.msg('apply_reply', content, parent=parent, subheader={'status':'error'})
                         # must be a real list: handle_result assigns to a slice of it
                         raw_reply = [zmq.Message(part)
                                      for part in self.session.serialize(msg, ident=idents)]
                         # and dispatch it
                         self.dispatch_result(raw_reply)
                     # finally scrub completed/failed lists
                     self.completed.pop(engine)
                     self.failed.pop(engine)
                 #-----------------------------------------------------------------------
                 # Job Submission
                 #-----------------------------------------------------------------------
                 def dispatch_submission(self, raw_msg):
                     """Dispatch job submission to appropriate handlers.

                     Unpacks the task header, relays the raw message to the monitor
                     stream, and reads the header's `targets`, `retries`, `after`,
                     `follow` and `timeout` entries.  The task is then either failed
                     as unreachable, handed to `maybe_run`, or stored with
                     `save_unmet` until its dependencies are met.

                     `raw_msg` is the multipart message received on the client stream.
                     A message that cannot be unpacked is logged and dropped.
                     """
                     # ensure targets up to date:
                     self.notifier_stream.flush()
                     try:
                         idents, msg = self.session.feed_identities(raw_msg, copy=False)
                         msg = self.session.unserialize(msg, content=False, copy=False)
                     except Exception:
                         self.log.error("task::Invaid task msg: %r"%raw_msg, exc_info=True)
                         return
                     # send to monitor
                     self.mon_stream.send_multipart([b'intask']+raw_msg, copy=False)
                     header = msg['header']
                     msg_id = header['msg_id']
                     self.all_ids.add(msg_id)
                     # get targets as a set of bytes objects
                     # from a list of unicode objects
                     targets = header.get('targets', [])
                     targets = map(asbytes, targets)
                     targets = set(targets)
                     # number of times a failed task may be resubmitted (see dispatch_result)
                     retries = header.get('retries', 0)
                     self.retries[msg_id] = retries
                     # time dependencies
                     after = header.get('after', None)
                     if after:
                         after = Dependency(after)
                         if after.all:
                             # when every dependency is required, drop the ones that
                             # have already finished in an accepted way
                             if after.success:
                                 after = Dependency(after.difference(self.all_completed),
                                             success=after.success,
                                             failure=after.failure,
                                             all=after.all,
                                 )
                             if after.failure:
                                 after = Dependency(after.difference(self.all_failed),
                                             success=after.success,
                                             failure=after.failure,
                                             all=after.all,
                                 )
                         if after.check(self.all_completed, self.all_failed):
                             # recast as empty set, if `after` already met,
                             # to prevent unnecessary set comparisons
                             after = MET
                     else:
                         after = MET
                     # location dependencies
                     follow = Dependency(header.get('follow', []))
                     # turn timeouts into datetime objects:
                     timeout = header.get('timeout', None)
                     if timeout:
                         # timedelta(days, seconds, microseconds): timeout is in seconds
                         timeout = datetime.now() + timedelta(0,timeout,0)
                     # same layout that save_unmet stores in self.depending
                     args = [raw_msg, targets, after, follow, timeout]
                     # validate and reduce dependencies:
                     for dep in after,follow:
                         if not dep: # empty dependency
                             continue
                         # check valid:
                         # a task may not depend on itself or on an id never submitted here
                         if msg_id in dep or dep.difference(self.all_ids):
                             # fail_unreachable only acts on tasks found in self.depending
                             self.depending[msg_id] = args
                             return self.fail_unreachable(msg_id, error.InvalidDependency)
                         # check if unreachable:
                         if dep.unreachable(self.all_completed, self.all_failed):
                             self.depending[msg_id] = args
                             return self.fail_unreachable(msg_id)
                     if after.check(self.all_completed, self.all_failed):
                         # time deps already met, try to run
                         if not self.maybe_run(msg_id, *args):
                             # can't run yet
                             if msg_id not in self.all_failed:
                                 # could have failed as unreachable
                                 self.save_unmet(msg_id, *args)
                     else:
                         self.save_unmet(msg_id, *args)
                 def audit_timeouts(self):
                     """Audit all waiting tasks for expired timeouts.

                     Every task in `self.depending` whose timeout is set and lies in
                     the past is failed with `error.TaskTimeout`.
                     """
                     now = datetime.now()
                     # snapshot the ids: failing a task pops entries from
                     # self.depending while we loop
                     for msg_id in list(self.depending):
                         # must recheck, in case one failure cascaded to another:
                         if msg_id not in self.depending:
                             continue
                         # entries are [raw_msg, targets, after, follow, timeout];
                         # only the trailing timeout matters here
                         timeout = self.depending[msg_id][-1]
                         if timeout and timeout < now:
                             self.fail_unreachable(msg_id, error.TaskTimeout)
                 def fail_unreachable(self, msg_id, why=error.ImpossibleDependency):
                     """Fail a waiting task that can no longer run.

                     The task is removed from `self.depending` and from the dependency
                     graph, recorded as done and failed, and an ``apply_reply`` wrapping
                     an instance of `why` is sent to the client and relayed to the
                     monitor stream.  The graph is then updated for the failure.

                     Parameters
                     ----------
                     msg_id : id of the task to fail; logged and ignored if it is not
                         in `self.depending`
                     why : exception class to raise and wrap in the reply
                         (default: error.ImpossibleDependency)
                     """
                     if msg_id not in self.depending:
                         self.log.error("msg %r already failed!", msg_id)
                         return
                     raw_msg,targets,after,follow,timeout = self.depending.pop(msg_id)
                     for mid in follow.union(after):
                         if mid in self.graph:
                             # discard rather than remove: callers put a task into
                             # self.depending and fail it straight away, without
                             # save_unmet ever adding it to the graph
                             self.graph[mid].discard(msg_id)
                     # FIXME: unpacking a message I've already unpacked, but didn't save:
                     idents,msg = self.session.feed_identities(raw_msg, copy=False)
                     header = self.session.unpack(msg[1].bytes)
                     # raise and catch so that wrap_exception has a live exception
                     try:
                         raise why()
                     except Exception:
                         content = error.wrap_exception()
                     self.all_done.add(msg_id)
                     self.all_failed.add(msg_id)
                     msg = self.session.send(self.client_stream, 'apply_reply', content,
                                             parent=header, ident=idents)
                     self.session.send(self.mon_stream, msg, ident=[b'outtask']+idents)
                     self.update_graph(msg_id, success=False)
                 def maybe_run(self, msg_id, raw_msg, targets, after, follow, timeout):
                     """Submit the task if some engine satisfies its location constraints.

                     Returns True when the task was handed to `submit_task`, False
                     otherwise.  When no engine qualifies and the constraints can be
                     seen to be unsatisfiable, the task is failed through
                     `fail_unreachable` before returning False.
                     """
                     excluded = self.blacklist.setdefault(msg_id, set())
                     if not (follow or targets or excluded or self.hwm):
                         # unconstrained: any engine will do
                         self.submit_task(msg_id, raw_msg, targets, follow, timeout, None)
                         return True

                     def can_run(idx):
                         # engine already holds its maximum number of tasks
                         if self.hwm and self.loads[idx] == self.hwm:
                             return False
                         target = self.targets[idx]
                         # engine is blacklisted for this task
                         if target in excluded:
                             return False
                         # engine is not among the requested targets
                         if targets and target not in targets:
                             return False
                         # location dependency, judged on this engine's own results
                         return follow.check(self.completed[target], self.failed[target])

                     indices = [idx for idx in range(len(self.targets)) if can_run(idx)]
                     if indices:
                         self.submit_task(msg_id, raw_msg, targets, follow, timeout, indices)
                         return True

                     # nothing can take the task now; see whether anything ever could
                     if follow.all:
                         # the relevant `follow` results must not be spread over
                         # more than one engine
                         relevant = set()
                         if follow.success:
                             relevant = self.all_completed
                         if follow.failure:
                             relevant = relevant.union(self.all_failed)
                         dests = set(self.destinations[m] for m in follow.intersection(relevant))
                         if len(dests) > 1:
                             self.depending[msg_id] = (raw_msg, targets, after, follow, timeout)
                             self.fail_unreachable(msg_id)
                             return False
                     if targets:
                         # impossible if every target is blacklisted or unregistered
                         targets.difference_update(excluded)
                         if not targets or not targets.intersection(self.targets):
                             self.depending[msg_id] = (raw_msg, targets, after, follow, timeout)
                             self.fail_unreachable(msg_id)
                             return False
                     return False
                 def save_unmet(self, msg_id, raw_msg, targets, after, follow, timeout):
                     """Park a task until its dependencies are met.

                     The task's arguments are stored in `self.depending`, and the task
                     is registered in `self.graph` under every dependency that has not
                     finished yet.
                     """
                     self.depending[msg_id] = [raw_msg,targets,after,follow,timeout]
                     # ids from `after` or `follow` that are not already done
                     unfinished = after.union(follow).difference(self.all_done)
                     for dep_id in unfinished:
                         self.graph.setdefault(dep_id, set()).add(msg_id)
                 def submit_task(self, msg_id, raw_msg, targets, follow, timeout, indices=None):
                     """Send a task to one engine and record where it went.

                     `indices`, when given and non-empty, restricts the choice to those
                     positions of `self.targets`; otherwise every engine is a candidate.
                     The engine is chosen by `self.scheme`.
                     """
                     if indices:
                         # the scheme answers with a position inside the subset,
                         # which is mapped back to a position in self.targets
                         candidate_loads = [self.loads[i] for i in indices]
                         idx = indices[self.scheme(candidate_loads)]
                     else:
                         idx = self.scheme(self.loads)
                     target = self.targets[idx]
                     # the engine identity goes first, followed by the task itself
                     self.engine_stream.send(target, flags=zmq.SNDMORE, copy=False)
                     self.engine_stream.send_multipart(raw_msg, copy=False)
                     # account for the new job on that engine
                     self.add_job(idx)
                     self.pending[target][msg_id] = (raw_msg, targets, MET, follow, timeout)
                     # tell the Hub where the task went
                     content = dict(msg_id=msg_id, engine_id=target.decode('ascii'))
                     self.session.send(self.mon_stream, 'task_destination', content=content,
                                       ident=[b'tracktask',self.ident])
                 #-----------------------------------------------------------------------
                 # Result Handling
                 #-----------------------------------------------------------------------
                 def dispatch_result(self, raw_msg):
                     """Route a reply coming back from an engine.

                     A real result is relayed to the client and the monitor, unless the
                     task failed and still has retries left.  In that case, or when the
                     engine reports unmet dependencies, the task goes to
                     `handle_unmet_dependency`.
                     """
                     try:
                         idents,msg = self.session.feed_identities(raw_msg, copy=False)
                         msg = self.session.unserialize(msg, content=False, copy=False)
                         engine = idents[0]
                         # engines that are no longer registered get no load update
                         if engine in self.targets:
                             self.finish_job(self.targets.index(engine))
                     except Exception:
                         self.log.error("task::Invaid result: %r", raw_msg, exc_info=True)
                         return
                     header = msg['header']
                     parent = msg['parent_header']
                     if not header.get('dependencies_met', True):
                         self.handle_unmet_dependency(idents, parent)
                         return
                     success = (header['status'] == 'ok')
                     msg_id = parent['msg_id']
                     retries = self.retries[msg_id]
                     if not success and retries > 0:
                         # failed with retries left: use one up and try again
                         self.retries[msg_id] = retries - 1
                         self.handle_unmet_dependency(idents, parent)
                         return
                     del self.retries[msg_id]
                     # relay to client and update graph
                     self.handle_result(idents, parent, raw_msg, success)
                     # send to Hub monitor
                     self.mon_stream.send_multipart([b'outtask']+raw_msg, copy=False)
                 def handle_result(self, idents, parent, raw_msg, success=True):
                     """Relay a finished task to its client and record the outcome.

                     `idents` holds the engine identity followed by the client identity.
                     `success` selects whether the task is recorded as completed or as
                     failed.
                     """
                     engine, client = idents[0], idents[1]
                     # swap the two leading identities so the reply routes back to
                     # the client (ROUTER-ROUTER mirror)
                     raw_msg[:2] = [client,engine]
                     self.client_stream.send_multipart(raw_msg, copy=False)
                     # bookkeeping: the task is no longer outstanding anywhere
                     msg_id = parent['msg_id']
                     self.blacklist.pop(msg_id, None)
                     self.pending[engine].pop(msg_id)
                     if success:
                         per_engine, overall = self.completed, self.all_completed
                     else:
                         per_engine, overall = self.failed, self.all_failed
                     per_engine[engine].add(msg_id)
                     overall.add(msg_id)
                     self.all_done.add(msg_id)
                     self.destinations[msg_id] = engine
                     self.update_graph(msg_id, success)
                 def handle_unmet_dependency(self, idents, parent):
                     """Handle an engine reporting that it could not run a task.
                     The engine is added to the task's blacklist and the task is taken out
                     of that engine's pending jobs.  If every allowed target is now
                     blacklisted the task is failed as unreachable; otherwise it is
                     resubmitted, and parked again as an unmet job if that does not work.
                     With a high-water mark set, the graph is rechecked when this engine's
                     load is exactly hwm-1.
                     """
                     engine = idents[0]
                     msg_id = parent['msg_id']
                     # remember that this engine refused the task
                     self.blacklist.setdefault(msg_id, set()).add(engine)
                     job = self.pending[engine].pop(msg_id)
                     raw, targets, after, follow, timeout = job
                     if self.blacklist[msg_id] == targets:
                         # nobody left to try
                         self.depending[msg_id] = job
                         self.fail_unreachable(msg_id)
                     elif not self.maybe_run(msg_id, *job):
                         # resubmit failed: put it back in our dependency tree,
                         # unless it has already been recorded as failed
                         if msg_id not in self.all_failed:
                             self.save_unmet(msg_id, *job)
                     if not self.hwm:
                         return
                     try:
                         idx = self.targets.index(engine)
                     except ValueError:
                         # skip load-update for dead engines
                         return
                     if self.loads[idx] == self.hwm-1:
                         self.update_graph(None)
                 def update_graph(self, dep_id=None, success=True):
                     """dep_id just finished. Update our dependency
                     graph and submit any jobs that just became runnable.
                     Called with dep_id=None to update entire graph for hwm, but without finishing
                     a task.
                     `success` is accepted for interface compatibility; this method does not
                     read it.
                     """
                     # jobs that were waiting specifically on dep_id
                     jobs = self.graph.pop(dep_id, [])
                     # recheck *all* jobs if
                     # a) we have HWM and an engine just become no longer full
                     # or b) dep_id was given as None
                     if dep_id is None or self.hwm and any(load == self.hwm-1 for load in self.loads):
                         jobs = self.depending.keys()
                     # Iterate over a snapshot: entries are popped from self.depending inside
                     # the loop, and on Python 3 keys() is a live view that raises
                     # RuntimeError when the dict changes size during iteration.
                     for msg_id in list(jobs):
                         raw_msg, targets, after, follow, timeout = self.depending[msg_id]
                         if after.unreachable(self.all_completed, self.all_failed)\
                                 or follow.unreachable(self.all_completed, self.all_failed):
                             self.fail_unreachable(msg_id)
                         elif after.check(self.all_completed, self.all_failed): # time deps met, maybe run
                             if self.maybe_run(msg_id, raw_msg, targets, MET, follow, timeout):
                                 # submitted: stop tracking it as a waiting job
                                 self.depending.pop(msg_id)
                                 for mid in follow.union(after):
                                     if mid in self.graph:
                                         self.graph[mid].remove(msg_id)
                 #----------------------------------------------------------------------
                 # methods to be overridden by subclasses
                 #----------------------------------------------------------------------
                 def add_job(self, idx):
                     """Book-keeping hook run after self.targets[idx] was handed a job.
                     Subclasses may override.  By default the load is the count of
                     outstanding jobs and ordering is simple LRU: the engine that just
                     received work moves to the back of both parallel lists.
                     """
                     self.loads[idx] += 1
                     # rotate the engine and its load to the end, keeping the lists aligned
                     self.targets.append(self.targets.pop(idx))
                     self.loads.append(self.loads.pop(idx))
                 def finish_job(self, idx):
                     """Book-keeping hook run after self.targets[idx] completed a job.
                     Subclasses may override.  The default just lowers that engine's
                     outstanding-job count by one.
                     """
                     self.loads[idx] = self.loads[idx] - 1
             def launch_scheduler(in_addr, out_addr, mon_addr, not_addr, config=None,
                                     logname='root', log_url=None, loglevel=logging.DEBUG,
                                     identity=b'task', in_thread=False):
                 # Entry point that wires up and starts a TaskScheduler.
                 #   in_addr / out_addr : addresses the client-facing and engine-facing
                 #                        ROUTER sockets are bound to
                 #   mon_addr           : address the PUB monitor socket connects to
                 #   not_addr           : address the SUB notification socket connects to
                 #   config             : optional dict, wrapped back into a Config
                 #   identity           : socket IDENTITY set on both ROUTER sockets
                 #   in_thread          : when true, share the process-wide Context/IOLoop
                 #                        and leave running the loop to the caller
                 ZMQStream = zmqstream.ZMQStream
                 if config:
                     # unwrap dict back into Config
                     config = Config(config)
                 if in_thread:
                     # use instance() to get the same Context/Loop as our parent
                     ctx = zmq.Context.instance()
                     loop = ioloop.IOLoop.instance()
                 else:
                     # in a process, don't use instance()
                     # for safety with multiprocessing
                     ctx = zmq.Context()
                     loop = ioloop.IOLoop()
                 # client-facing socket (passed to the scheduler as client_stream)
-                ins = ZMQStream(ctx.socket(zmq.XREP),loop)
+                ins = ZMQStream(ctx.socket(zmq.ROUTER),loop)
                 ins.setsockopt(zmq.IDENTITY, identity)
                 ins.bind(in_addr)
                 # engine-facing socket (passed to the scheduler as engine_stream)
-                outs = ZMQStream(ctx.socket(zmq.XREP),loop)
+                outs = ZMQStream(ctx.socket(zmq.ROUTER),loop)
                 outs.setsockopt(zmq.IDENTITY, identity)
                 outs.bind(out_addr)
                 # monitor (PUB) and notification (SUB, subscribed to every topic) sockets
                 mons = zmqstream.ZMQStream(ctx.socket(zmq.PUB),loop)
                 mons.connect(mon_addr)
                 nots = zmqstream.ZMQStream(ctx.socket(zmq.SUB),loop)
                 nots.setsockopt(zmq.SUBSCRIBE, b'')
                 nots.connect(not_addr)
                 # setup logging.
                 if in_thread:
                     # reuse the running Application's logger
                     log = Application.instance().log
                 else:
                     if log_url:
                         log = connect_logger(logname, ctx, log_url, root="scheduler", loglevel=loglevel)
                     else:
                         log = local_logger(logname, loglevel)
                 scheduler = TaskScheduler(client_stream=ins, engine_stream=outs,
                                         mon_stream=mons, notifier_stream=nots,
                                         loop=loop, log=log,
                                         config=config)
                 scheduler.start()
                 if not in_thread:
                     # own process: run the private event loop here until interrupted
                     try:
                         loop.start()
                     except KeyboardInterrupt:
                         print ("interrupted, exiting...", file=sys.__stderr__)

IPython/parallel/engine/engine.py

0 +4 -4

             """A simple engine that talks to a controller over 0MQ.
             it handles registration, etc. and launches a kernel
             connected to the Controller's Schedulers.
             Authors:
             * Min RK
             """
             #-----------------------------------------------------------------------------
             #  Copyright (C) 2010-2011  The IPython Development Team
             #
             #  Distributed under the terms of the BSD License.  The full license is in
             #  the file COPYING, distributed as part of this software.
             #-----------------------------------------------------------------------------
             from __future__ import print_function
             import sys
             import time
             from getpass import getpass
             import zmq
             from zmq.eventloop import ioloop, zmqstream
             from IPython.external.ssh import tunnel
             # internal
             from IPython.utils.traitlets import (
                 Instance, Dict, Int, Type, CFloat, Unicode, CBytes, Bool
             )
             # from IPython.utils.localinterfaces import LOCALHOST
             from IPython.parallel.controller.heartmonitor import Heart
             from IPython.parallel.factory import RegistrationFactory
             from IPython.parallel.util import disambiguate_url, asbytes
             from IPython.zmq.session import Message
             from .streamkernel import Kernel
             class EngineFactory(RegistrationFactory):
                 """IPython engine"""
                 # Lifecycle as implemented below: start() schedules register() and an abort
                 # timer; register() sends a registration_request to the controller; the
                 # reply is handled by complete_registration(), which cancels the abort
                 # timer, opens the engine's sockets and starts the Kernel.
                 # configurables:
                 out_stream_factory=Type('IPython.zmq.iostream.OutStream', config=True,
                     help="""The OutStream for handling stdout/err.
                     Typically 'IPython.zmq.iostream.OutStream'""")
                 display_hook_factory=Type('IPython.zmq.displayhook.ZMQDisplayHook', config=True,
                     help="""The class for handling displayhook.
                     Typically 'IPython.zmq.displayhook.ZMQDisplayHook'""")
                 location=Unicode(config=True,
                     help="""The location (an IP address) of the controller.  This is
                     used for disambiguating URLs, to determine whether
                     loopback should be used to connect or the public address.""")
                 timeout=CFloat(2,config=True,
                     help="""The time (in seconds) to wait for the Controller to respond
                     to registration requests before giving up.""")
                 sshserver=Unicode(config=True,
                     help="""The SSH server to use for tunneling connections to the Controller.""")
                 sshkey=Unicode(config=True,
                     help="""The SSH private key file to use when tunneling connections to the Controller.""")
                 paramiko=Bool(sys.platform == 'win32', config=True,
                     help="""Whether to use paramiko instead of openssh for tunnels.""")
                 # not configurable:
                 user_ns=Dict()
                 id=Int(allow_none=True)
                 registrar=Instance('zmq.eventloop.zmqstream.ZMQStream')
                 kernel=Instance(Kernel)
                 # bident is the bytes form of ident; it is used as the socket IDENTITY
                 bident = CBytes()
                 ident = Unicode()
                 def _ident_changed(self, name, old, new):
                     # keeps bident in sync with ident
                     # (presumably invoked by traitlets on assignment to `ident` -- confirm)
                     self.bident = asbytes(new)
                 using_ssh=Bool(False)
                 def __init__(self, **kwargs):
                     super(EngineFactory, self).__init__(**kwargs)
                     # the engine's identity is its session's id
                     self.ident = self.session.session
                 def init_connector(self):
                     """construct connection function, which handles tunnels."""
                     # Returns the pair (connect, maybe_tunnel) defined below.
                     self.using_ssh = bool(self.sshkey or self.sshserver)
                     if self.sshkey and not self.sshserver:
                         # We are using ssh directly to the controller, tunneling localhost to localhost
                         self.sshserver = self.url.split('://')[1].split(':')[0]
                     if self.using_ssh:
                         # only prompt for a password when passwordless login does not work
                         if tunnel.try_passwordless_ssh(self.sshserver, self.sshkey, self.paramiko):
                             password=False
                         else:
                             password = getpass("SSH Password for %s: "%self.sshserver)
                     else:
                         password = False
                     def connect(s, url):
                         # connect socket/stream `s` to `url`, through an ssh tunnel if configured
                         url = disambiguate_url(url, self.location)
                         if self.using_ssh:
                             self.log.debug("Tunneling connection to %s via %s"%(url, self.sshserver))
                             return tunnel.tunnel_connection(s, url, self.sshserver,
                                         keyfile=self.sshkey, paramiko=self.paramiko,
                                         password=password,
                             )
                         else:
                             return s.connect(url)
                     def maybe_tunnel(url):
                         """like connect, but don't complete the connection (for use by heartbeat)"""
                         # returns the url to connect to: the tunnel's url when ssh is in use,
                         # otherwise the disambiguated original
                         url = disambiguate_url(url, self.location)
                         if self.using_ssh:
                             self.log.debug("Tunneling connection to %s via %s"%(url, self.sshserver))
                             url,tunnelobj = tunnel.open_tunnel(url, self.sshserver,
                                         keyfile=self.sshkey, paramiko=self.paramiko,
                                         password=password,
                             )
                         return url
                     return connect, maybe_tunnel
                 def register(self):
                     """send the registration_request"""
                     self.log.info("Registering with controller at %s"%self.url)
                     ctx = self.context
                     connect,maybe_tunnel = self.init_connector()
                     # registration socket, identified by bident and connected to self.url
-                    reg = ctx.socket(zmq.XREQ)
+                    reg = ctx.socket(zmq.DEALER)
                     reg.setsockopt(zmq.IDENTITY, self.bident)
                     connect(reg, self.url)
                     self.registrar = zmqstream.ZMQStream(reg, self.loop)
                     # the same identity is announced for the queue, heartbeat and control channels
                     content = dict(queue=self.ident, heartbeat=self.ident, control=self.ident)
                     # the reply is handled by complete_registration, which reuses the connectors
                     self.registrar.on_recv(lambda msg: self.complete_registration(msg, connect, maybe_tunnel))
                     # print (self.session.key)
                     self.session.send(self.registrar, "registration_request",content=content)
                 def complete_registration(self, msg, connect, maybe_tunnel):
                     # Handle the controller's reply to the registration request.  On status
                     # 'ok' this starts the heartbeat, opens the shell/control/iopub streams,
                     # redirects stdout/stderr/displayhook and starts the Kernel; any other
                     # status is logged as fatal and raised as an Exception.
                     # print msg
                     # a reply arrived, so cancel the pending registration-timeout callback
                     self._abort_dc.stop()
                     ctx = self.context
                     loop = self.loop
                     identity = self.bident
                     idents,msg = self.session.feed_identities(msg)
                     msg = Message(self.session.unserialize(msg))
                     if msg.content.status == 'ok':
                         self.id = int(msg.content.id)
                         # launch heartbeat
                         hb_addrs = msg.content.heartbeat
                         # possibly forward hb ports with tunnels
                         hb_addrs = [ maybe_tunnel(addr) for addr in hb_addrs ]
                         heart = Heart(*map(str, hb_addrs), heart_id=identity)
                         heart.start()
                         # create Shell Streams (MUX, Task, etc.):
                         queue_addr = msg.content.mux
                         shell_addrs = [ str(queue_addr) ]
                         task_addr = msg.content.task
                         if task_addr:
                             shell_addrs.append(str(task_addr))
                         # Uncomment this to go back to two-socket model
                         # shell_streams = []
                         # for addr in shell_addrs:
-                        #     stream = zmqstream.ZMQStream(ctx.socket(zmq.XREP), loop)
+                        #     stream = zmqstream.ZMQStream(ctx.socket(zmq.ROUTER), loop)
                         #     stream.setsockopt(zmq.IDENTITY, identity)
                         #     stream.connect(disambiguate_url(addr, self.location))
                         #     shell_streams.append(stream)
                         # Now use only one shell stream for mux and tasks
-                        stream = zmqstream.ZMQStream(ctx.socket(zmq.XREP), loop)
+                        stream = zmqstream.ZMQStream(ctx.socket(zmq.ROUTER), loop)
                         stream.setsockopt(zmq.IDENTITY, identity)
                         shell_streams = [stream]
                         for addr in shell_addrs:
                             connect(stream, addr)
                         # end single stream-socket
                         # control stream:
                         control_addr = str(msg.content.control)
-                        control_stream = zmqstream.ZMQStream(ctx.socket(zmq.XREP), loop)
+                        control_stream = zmqstream.ZMQStream(ctx.socket(zmq.ROUTER), loop)
                         control_stream.setsockopt(zmq.IDENTITY, identity)
                         connect(control_stream, control_addr)
                         # create iopub stream:
                         iopub_addr = msg.content.iopub
                         iopub_stream = zmqstream.ZMQStream(ctx.socket(zmq.PUB), loop)
                         iopub_stream.setsockopt(zmq.IDENTITY, identity)
                         connect(iopub_stream, iopub_addr)
                         # # Redirect input streams and set a display hook.
                         # NOTE: this replaces sys.stdout / sys.stderr / sys.displayhook for the
                         # whole process; topics are tagged with this engine's integer id.
                         if self.out_stream_factory:
                             sys.stdout = self.out_stream_factory(self.session, iopub_stream, u'stdout')
                             sys.stdout.topic = 'engine.%i.stdout'%self.id
                             sys.stderr = self.out_stream_factory(self.session, iopub_stream, u'stderr')
                             sys.stderr.topic = 'engine.%i.stderr'%self.id
                         if self.display_hook_factory:
                             sys.displayhook = self.display_hook_factory(self.session, iopub_stream)
                             sys.displayhook.topic = 'engine.%i.pyout'%self.id
                         self.kernel = Kernel(config=self.config, int_id=self.id, ident=self.ident, session=self.session,
                                 control_stream=control_stream, shell_streams=shell_streams, iopub_stream=iopub_stream,
                                 loop=loop, user_ns = self.user_ns, log=self.log)
                         self.kernel.start()
                     else:
                         self.log.fatal("Registration Failed: %s"%msg)
                         raise Exception("Registration Failed: %s"%msg)
                     # only reached on success: the failure branch above raises
                     self.log.info("Completed registration with id %i"%self.id)
                 def abort(self):
                     # Registration-timeout callback scheduled by start(): log, send an
                     # unregistration_request, wait one second, then exit with status 255.
                     self.log.fatal("Registration timed out after %.1f seconds"%self.timeout)
                     self.session.send(self.registrar, "unregistration_request", content=dict(id=self.id))
                     time.sleep(1)
                     sys.exit(255)
                 def start(self):
                     # schedule register() with a delay of 0 on the engine's loop
                     dc = ioloop.DelayedCallback(self.register, 0, self.loop)
                     dc.start()
                     # schedule abort(); `timeout` is documented in seconds and scaled by 1000 here.
                     # complete_registration() stops this callback when a reply arrives.
                     self._abort_dc = ioloop.DelayedCallback(self.abort, self.timeout*1000, self.loop)
                     self._abort_dc.start()

IPython/parallel/engine/kernelstarter.py

0 +2 -2

             """KernelStarter class that intercepts Control Queue messages, and handles process management.
             Authors:
             * Min RK
             """
             #-----------------------------------------------------------------------------
             #  Copyright (C) 2010-2011  The IPython Development Team
             #
             #  Distributed under the terms of the BSD License.  The full license is in
             #  the file COPYING, distributed as part of this software.
             #-----------------------------------------------------------------------------
             from zmq.eventloop import ioloop
             from IPython.zmq.session import Session
             class KernelStarter(object):
                 """Object for resetting/killing the Kernel.
                 Relays messages between an `upstream` and a `downstream` stream and
                 intercepts the message types registered in `self.handlers`.  The
                 process-management methods were adapted from KernelManager.
                 """
                 def __init__(self, session, upstream, downstream, *kernel_args, **kernel_kwargs):
                     """Store the session, both streams and the arguments used to launch kernels."""
                     self.session = session
                     self.upstream = upstream
                     self.downstream = downstream
                     self.kernel_args = kernel_args
                     self.kernel_kwargs = kernel_kwargs
                     # State read by the process-management methods below.  It was never
                     # initialised, so has_kernel / restart_kernel / kill_kernel raised
                     # AttributeError on a fresh instance.
                     self.kernel = None
                     self._launch_args = None
                     self._hb_channel = None
                     self.handlers = {}
                     for method in 'shutdown_request shutdown_reply'.split():
                         # Register only handlers that exist: `shutdown_reply` is not
                         # defined on this class, and an unconditional getattr made the
                         # constructor always fail.  Unregistered types are relayed.
                         handler = getattr(self, method, None)
                         if handler is not None:
                             self.handlers[method] = handler
                 def start(self):
                     """Attach the dispatchers to the two streams."""
                     self.upstream.on_recv(self.dispatch_request)
                     self.downstream.on_recv(self.dispatch_reply)
                 #--------------------------------------------------------------------------
                 # Dispatch methods
                 #--------------------------------------------------------------------------
                 def _dispatch(self, raw_msg, relay):
                     """Run the handler for raw_msg's type, or forward raw_msg untouched on `relay`."""
                     # feed_identities needs the raw frames; it was previously called with
                     # no argument at all
                     idents, msg = self.session.feed_identities(raw_msg)
                     try:
                         msg = self.session.unserialize(msg, content=False)
                     except Exception:
                         print ("bad msg: %s"%msg)
                         # nothing usable to dispatch on; falling through would index
                         # the unparsed frame list like a dict
                         return
                     msgtype = msg['header']['msg_type']
                     handler = self.handlers.get(msgtype, None)
                     if handler is None:
                         relay.send_multipart(raw_msg, copy=False)
                     else:
                         handler(msg)
                 def dispatch_request(self, raw_msg):
                     """Handle a message received on `upstream`; unhandled types go downstream."""
                     self._dispatch(raw_msg, self.downstream)
                 def dispatch_reply(self, raw_msg):
                     """Handle a message received on `downstream`; unhandled types go upstream."""
                     self._dispatch(raw_msg, self.upstream)
                 #--------------------------------------------------------------------------
                 # Handlers
                 #--------------------------------------------------------------------------
                 def shutdown_request(self, msg):
                     """Forward a shutdown request downstream."""
                     # NOTE(review): `msg` is the unserialized message here, not the raw
                     # frame list that send_multipart is given elsewhere in this class --
                     # confirm this is what the downstream peer expects.
                     self.downstream.send_multipart(msg)
                 #--------------------------------------------------------------------------
                 # Kernel process management methods, from KernelManager:
                 #--------------------------------------------------------------------------
                 @staticmethod
                 def _check_local(addr):
                     """Return whether `addr` (a string, or a tuple whose first item is the address) is in LOCAL_IPS."""
                     # The signature has no `self`, so it must be a staticmethod to be
                     # callable through an instance.
                     # NOTE(review): LOCAL_IPS is not imported by this module -- confirm source.
                     if isinstance(addr, tuple):
                         addr = addr[0]
                     return addr in LOCAL_IPS
                 def start_kernel(self, **kw):
                     """Starts a kernel process and configures the manager to use it.
                     If random ports (port=0) are being used, this method must be called
                     before the channels are created.
                     Parameters:
                     -----------
                     ipython : bool, optional (default True)
                          Whether to use an IPython kernel instead of a plain Python kernel.
                     """
                     # remember the launch arguments: restart_kernel replays them and
                     # refuses to run while they are None
                     self._launch_args = kw.copy()
                     # NOTE(review): Process and make_kernel are not imported by this module,
                     # `kw` is not passed on, and the process object is created but not
                     # started here -- confirm intent.
                     self.kernel = Process(target=make_kernel, args=self.kernel_args,
                                                         kwargs=self.kernel_kwargs)
                 def shutdown_kernel(self, restart=False):
                     """ Attempts to the stop the kernel process cleanly. If the kernel
                     cannot be stopped, it is killed, if possible.
                     """
                     # the module-level imports of this file do not include these
                     import sys
                     import time
                     # FIXME: Shutdown does not work on Windows due to ZMQ errors!
                     if sys.platform == 'win32':
                         self.kill_kernel()
                         return
                     # Don't send any additional kernel kill messages immediately, to give
                     # the kernel a chance to properly execute shutdown actions. Wait for at
                     # most 1s, checking every 0.1s.
                     # NOTE(review): xreq_channel is not set anywhere in this class.
                     self.xreq_channel.shutdown(restart=restart)
                     for i in range(10):
                         if self.is_alive:
                             time.sleep(0.1)
                         else:
                             break
                     else:
                         # OK, we've waited long enough.
                         if self.has_kernel:
                             self.kill_kernel()
                 def restart_kernel(self, now=False):
                     """Restarts a kernel with the same arguments that were used to launch
                     it. If the old kernel was launched with random ports, the same ports
                     will be used for the new kernel.
                     Parameters
                     ----------
                     now : bool, optional
                       If True, the kernel is forcefully restarted *immediately*, without
                       having a chance to do any cleanup action.  Otherwise the kernel is
                       given 1s to clean up before a forceful restart is issued.
                       In all cases the kernel is restarted, the only difference is whether
                       it is given a chance to perform a clean shutdown or not.
                     Raises
                     ------
                     RuntimeError
                       If start_kernel has not been called before.
                     """
                     # the module-level imports of this file do not include these
                     import sys
                     import time
                     if self._launch_args is None:
                         raise RuntimeError("Cannot restart the kernel. "
                                            "No previous call to 'start_kernel'.")
                     if self.has_kernel:
                         if now:
                             self.kill_kernel()
                         else:
                             self.shutdown_kernel(restart=True)
                     self.start_kernel(**self._launch_args)
                     # FIXME: Messages get dropped in Windows due to probable ZMQ bug
                     # unless there is some delay here.
                     if sys.platform == 'win32':
                         time.sleep(0.2)
                 @property
                 def has_kernel(self):
                     """Returns whether a kernel process has been specified for the kernel
                     manager.
                     """
                     return self.kernel is not None
                 def kill_kernel(self):
                     """ Kill the running kernel.
                     Raises RuntimeError when no kernel is set.
                     """
                     import sys  # not imported at module level in this file
                     if not self.has_kernel:
                         raise RuntimeError("Cannot kill kernel. No kernel is running!")
                     # Pause the heart beat channel if it exists.
                     if self._hb_channel is not None:
                         self._hb_channel.pause()
                     # Attempt to kill the kernel.
                     try:
                         self.kernel.kill()
                     except OSError as e:
                         # In Windows, we will get an Access Denied error if the process
                         # has already terminated. Ignore it.
                         if not (sys.platform == 'win32' and e.winerror == 5):
                             raise
                     self.kernel = None
                 def interrupt_kernel(self):
                     """ Interrupts the kernel. Unlike ``signal_kernel``, this operation is
                     well supported on all platforms.
                     Raises RuntimeError when no kernel is set.
                     """
                     # the module-level imports of this file do not include these
                     import signal
                     import sys
                     if not self.has_kernel:
                         raise RuntimeError("Cannot interrupt kernel. No kernel is running!")
                     if sys.platform == 'win32':
                         from parentpoller import ParentPollerWindows as Poller
                         Poller.send_interrupt(self.kernel.win32_interrupt_event)
                     else:
                         self.kernel.send_signal(signal.SIGINT)
                 def signal_kernel(self, signum):
                     """ Sends a signal to the kernel. Note that since only SIGTERM is
                     supported on Windows, this function is only useful on Unix systems.
                     Raises RuntimeError when no kernel is set.
                     """
                     if not self.has_kernel:
                         raise RuntimeError("Cannot signal kernel. No kernel is running!")
                     self.kernel.send_signal(signum)
                 @property
                 def is_alive(self):
                     """Is the kernel process still running?"""
                     # FIXME: not using a heartbeat means this method is broken for any
                     # remote kernel, it's only capable of handling local kernels.
                     if not self.has_kernel:
                         # We didn't start the kernel with this KernelManager so we don't
                         # know if it is running. We should use a heartbeat for this case.
                         return True
                     # poll() returning None means the process has not exited yet
                     return self.kernel.poll() is None
             def make_starter(up_addr, down_addr, *args, **kwargs):
                 """entry point function for launching a kernelstarter in a subprocess"""
                 # Connects one DEALER stream to each of up_addr and down_addr, hands both to
                 # a KernelStarter (extra args/kwargs are passed through) and then runs the
                 # IOLoop, so this call does not return until the loop stops.
                 # NOTE(review): `zmq` and `zmqstream` are not among this module's visible
                 # imports (only ioloop and Session are) -- confirm they are imported.
                 loop = ioloop.IOLoop.instance()
                 ctx = zmq.Context()
                 session = Session()
-                upstream = zmqstream.ZMQStream(ctx.socket(zmq.XREQ),loop)
+                upstream = zmqstream.ZMQStream(ctx.socket(zmq.DEALER),loop)
                 upstream.connect(up_addr)
-                downstream = zmqstream.ZMQStream(ctx.socket(zmq.XREQ),loop)
+                downstream = zmqstream.ZMQStream(ctx.socket(zmq.DEALER),loop)
                 downstream.connect(down_addr)
                 starter = KernelStarter(session, upstream, downstream, *args, **kwargs)
                 starter.start()
                 loop.start()

IPython/zmq/__init__.py

0 +23 -15

             #-----------------------------------------------------------------------------
             #  Copyright (C) 2010  The IPython Development Team
             #
             #  Distributed under the terms of the BSD License.  The full license is in
             #  the file COPYING.txt, distributed as part of this software.
             #-----------------------------------------------------------------------------
             #-----------------------------------------------------------------------------
             # Verify zmq version dependency >= 2.1.4
             #-----------------------------------------------------------------------------
+            import re
             import warnings
-            minimum_pyzmq_version = "2.1.4"
             # check_for_zmq(minimum_version, module): import zmq and raise ImportError if
             # it is missing or its version is below `minimum_version` (a dotted string
             # such as '2.1.4').  `module` only appears in the error text.  The function
             # also adds DEALER/ROUTER aliases to zmq when they are absent and warns when
             # libzmq reports version 4 or later.
+            def check_for_zmq(minimum_version, module='IPython.zmq'):
+                min_vlist = [int(n) for n in minimum_version.split('.')]
-            try:
+                try:
-                import zmq
+                    import zmq
-            except ImportError:
+                except ImportError:
-                raise ImportError("IPython.zmq requires pyzmq >= %s"%minimum_pyzmq_version)
+                    raise ImportError("%s requires pyzmq >= %s"%(module, minimum_version))
-            pyzmq_version = zmq.__version__
+                pyzmq_version = zmq.__version__
                 # compare versions as lists of integers rather than as strings; any version
                 # string containing 'dev' skips the minimum-version check entirely
+                vlist = [int(n) for n in re.findall(r'\d+', pyzmq_version)]
-            if pyzmq_version < minimum_pyzmq_version:
+                if 'dev' not in pyzmq_version and vlist < min_vlist:
-                raise ImportError("IPython.zmq requires pyzmq >= %s, but you have %s"%(
+                    raise ImportError("%s requires pyzmq >= %s, but you have %s"%(
-                                minimum_pyzmq_version, pyzmq_version))
+                                    module, minimum_version, pyzmq_version))
-            del pyzmq_version
+                # fix missing DEALER/ROUTER aliases in pyzmq < 2.1.9
+                if not hasattr(zmq, 'DEALER'):
+                    zmq.DEALER = zmq.XREQ
+                if not hasattr(zmq, 'ROUTER'):
+                    zmq.ROUTER = zmq.XREP
                 # NOTE(review): the libzmq check below compares against a string literal, so
                 # assuming zmq_version() returns a string the ordering is lexicographic
                 # (e.g. '10.0.0' sorts before '4.0.0') -- confirm this is acceptable.
-            if zmq.zmq_version() >= '3.0.0':
+                if zmq.zmq_version() >= '4.0.0':
-                warnings.warn("""libzmq 3 detected.
+                    warnings.warn("""libzmq 4 detected.
-                It is unlikely that IPython's zmq code will work properly.
+                    It is unlikely that IPython's zmq code will work properly.
-                Please install libzmq stable, which is 2.1.x or 2.2.x""",
+                    Please install libzmq stable, which is 2.1.x or 2.2.x""",
-                RuntimeWarning)
+                    RuntimeWarning)
             # run the check once at import time with IPython.zmq's own minimum version
+            check_for_zmq('2.1.4')

IPython/zmq/frontend.py

0 +1 -1

             #!/usr/bin/env python
             """A simple interactive frontend that talks to a kernel over 0MQ.
             """
             #-----------------------------------------------------------------------------
             # Imports
             #-----------------------------------------------------------------------------
             # stdlib
             import cPickle as pickle
             import code
             import readline
             import sys
             import time
             import uuid
             # our own
             import zmq
             import session
             import completer
             from IPython.utils.localinterfaces import LOCALHOST
             #-----------------------------------------------------------------------------
             # Classes and functions
             #-----------------------------------------------------------------------------
             class Console(code.InteractiveConsole):
                 def __init__(self, locals=None, filename="<console>",
                              session = session,
                              request_socket=None,
                              sub_socket=None):
                     code.InteractiveConsole.__init__(self, locals, filename)
                     self.session = session
                     self.request_socket = request_socket
                     self.sub_socket = sub_socket
                     self.backgrounded = 0
                     self.messages = {}
                     # Set tab completion
                     self.completer = completer.ClientCompleter(self, session, request_socket)
                     readline.parse_and_bind('tab: complete')
                     readline.parse_and_bind('set show-all-if-ambiguous on')
                     readline.set_completer(self.completer.complete)
                     # Set system prompts
                     sys.ps1 = 'Py>>> '
                     sys.ps2 = '  ... '
                     sys.ps3 = 'Out : '
                     # Build dict of handlers for message types
                     self.handlers = {}
                     for msg_type in ['pyin', 'pyout', 'pyerr', 'stream']:
                         self.handlers[msg_type] = getattr(self, 'handle_%s' % msg_type)
                 def handle_pyin(self, omsg):
                     if omsg.parent_header.session == self.session.session:
                         return
                     c = omsg.content.code.rstrip()
                     if c:
                         print '[IN from %s]' % omsg.parent_header.username
                         print c
                 def handle_pyout(self, omsg):
                     #print omsg # dbg
                     if omsg.parent_header.session == self.session.session:
                         print "%s%s" % (sys.ps3, omsg.content.data)
                     else:
                         print '[Out from %s]' % omsg.parent_header.username
                         print omsg.content.data
                 def print_pyerr(self, err):
                     print >> sys.stderr, err.etype,':', err.evalue
                     print >> sys.stderr, ''.join(err.traceback)
                 def handle_pyerr(self, omsg):
                     if omsg.parent_header.session == self.session.session:
                         return
                     print >> sys.stderr, '[ERR from %s]' % omsg.parent_header.username
                     self.print_pyerr(omsg.content)
                 def handle_stream(self, omsg):
                     if omsg.content.name == 'stdout':
                         outstream = sys.stdout
                     else:
                         outstream = sys.stderr
                         print >> outstream, '*ERR*',
                     print >> outstream, omsg.content.data,
                 def handle_output(self, omsg):
                     handler = self.handlers.get(omsg.msg_type, None)
                     if handler is not None:
                         handler(omsg)
                 def recv_output(self):
                     while True:
                         ident,msg = self.session.recv(self.sub_socket)
                         if msg is None:
                             break
                         self.handle_output(Message(msg))
                 def handle_reply(self, rep):
                     # Handle any side effects on output channels
                     self.recv_output()
                     # Now, dispatch on the possible reply types we must handle
                     if rep is None:
                         return
                     if rep.content.status == 'error':
                         self.print_pyerr(rep.content)
                     elif rep.content.status == 'aborted':
                         print >> sys.stderr, "ERROR: ABORTED"
                         ab = self.messages[rep.parent_header.msg_id].content
                         if 'code' in ab:
                             print >> sys.stderr, ab.code
                         else:
                             print >> sys.stderr, ab
                 def recv_reply(self):
                     ident,rep = self.session.recv(self.request_socket)
                     mrep = Message(rep)
                     self.handle_reply(mrep)
                     return mrep
                 def runcode(self, code):
                     # We can't pickle code objects, so fetch the actual source
                     src = '\n'.join(self.buffer)
                     # for non-background inputs, if we do have previoiusly backgrounded
                     # jobs, check to see if they've produced results
                     if not src.endswith(';'):
                         while self.backgrounded > 0:
                             #print 'checking background'
                             rep = self.recv_reply()
                             if rep:
                                 self.backgrounded -= 1
                             time.sleep(0.05)
                     # Send code execution message to kernel
                     omsg = self.session.send(self.request_socket,
                                              'execute_request', dict(code=src))
                     self.messages[omsg.header.msg_id] = omsg
                     # Fake asynchronicity by letting the user put ';' at the end of the line
                     if src.endswith(';'):
                         self.backgrounded += 1
                         return
                     # For foreground jobs, wait for reply
                     while True:
                         rep = self.recv_reply()
                         if rep is not None:
                             break
                         self.recv_output()
                         time.sleep(0.05)
                     else:
                         # We exited without hearing back from the kernel!
                         print >> sys.stderr, 'ERROR!!! kernel never got back to us!!!'
             class InteractiveClient(object):
                 """Pair a session and its two sockets with a :class:`Console`."""
                 def __init__(self, session, request_socket, sub_socket):
                     """Keep the connection objects and build the console on top of them."""
                     self.console = Console(locals=None,
                                            filename='<zmq-console>',
                                            session=session,
                                            request_socket=request_socket,
                                            sub_socket=sub_socket)
                     self.sub_socket = sub_socket
                     self.request_socket = request_socket
                     self.session = session
                 def interact(self):
                     """Run the console's interactive loop."""
                     self.console.interact()
             def main():
                 """Connect to a kernel on LOCALHOST and start an interactive client.
                 The request socket connects to port 5575 and the SUB socket to the
                 next port up.
                 """
                 # Defaults
                 #ip = '192.168.2.109'
                 ip = LOCALHOST
                 #ip = '99.146.222.252'
                 port_base = 5575
                 # the ip is filled in now; ':%i' is left as a placeholder for the port
                 connection = ('tcp://%s' % ip) + ':%i'
                 req_conn = connection % port_base
                 sub_conn = connection % (port_base+1)
                 # Create initial sockets
                 c = zmq.Context()
-                request_socket = c.socket(zmq.XREQ)
+                request_socket = c.socket(zmq.DEALER)
                 request_socket.connect(req_conn)
                 sub_socket = c.socket(zmq.SUB)
                 sub_socket.connect(sub_conn)
                 # an empty prefix subscribes to every message
                 sub_socket.setsockopt(zmq.SUBSCRIBE, '')
                 # Make session and user-facing client
                 sess = session.Session()
                 client = InteractiveClient(sess, request_socket, sub_socket)
                 client.interact()
             if __name__ == '__main__':
                 main()

IPython/zmq/kernelapp.py

0 +2 -2

             """An Application for launching a kernel
             Authors
             -------
             * MinRK
             """
             #-----------------------------------------------------------------------------
             #  Copyright (C) 2011  The IPython Development Team
             #
             #  Distributed under the terms of the BSD License.  The full license is in
             #  the file COPYING.txt, distributed as part of this software.
             #-----------------------------------------------------------------------------
             #-----------------------------------------------------------------------------
             # Imports
             #-----------------------------------------------------------------------------
             # Standard library imports.
             import os
             import sys
             # System library imports.
             import zmq
             # IPython imports.
             from IPython.core.ultratb import FormattedTB
             from IPython.core.application import (
                 BaseIPythonApplication, base_flags, base_aliases
             )
             from IPython.utils import io
             from IPython.utils.localinterfaces import LOCALHOST
             from IPython.utils.traitlets import (Any, Instance, Dict, Unicode, Int, Bool,
                                                     DottedObjectName)
             from IPython.utils.importstring import import_item
             # local imports
             from IPython.zmq.heartbeat import Heartbeat
             from IPython.zmq.parentpoller import ParentPollerUnix, ParentPollerWindows
             from IPython.zmq.session import Session
             #-----------------------------------------------------------------------------
             # Flags and Aliases
             #-----------------------------------------------------------------------------
             # Aliases: everything the base application offers, plus the kernel's
             # connection options.
             kernel_aliases = dict(
                 base_aliases,
                 ip='KernelApp.ip',
                 hb='KernelApp.hb_port',
                 shell='KernelApp.shell_port',
                 iopub='KernelApp.iopub_port',
                 stdin='KernelApp.stdin_port',
                 parent='KernelApp.parent'
             )
             # the interrupt alias is only registered on Windows
             if sys.platform.startswith('win'):
                 kernel_aliases['interrupt'] = 'KernelApp.interrupt'
             # Flags: the base application's, plus switches that silence stdout/stderr.
             kernel_flags = dict(base_flags)
             kernel_flags['no-stdout'] = (
                 {'KernelApp' : {'no_stdout' : True}},
                 "redirect stdout to the null device")
             kernel_flags['no-stderr'] = (
                 {'KernelApp' : {'no_stderr' : True}},
                 "redirect stderr to the null device")
             #-----------------------------------------------------------------------------
             # Application class for starting a Kernel
             #-----------------------------------------------------------------------------
             class KernelApp(BaseIPythonApplication):
                 """Application that creates the kernel's sockets and starts a kernel.
                 `initialize` builds the session, parent poller, sockets, IO
                 redirection and the kernel object; `start` then runs them.
                 """
                 name='pykernel'
                 aliases = Dict(kernel_aliases)
                 flags = Dict(kernel_flags)
                 classes = [Session]
                 # the kernel class, as an importstring
                 kernel_class = DottedObjectName('IPython.zmq.pykernel.Kernel')
                 kernel = Any()
                 poller = Any() # don't restrict this even though current pollers are all Threads
                 heartbeat = Instance(Heartbeat)
                 session = Instance('IPython.zmq.session.Session')
                 ports = Dict()
                 # inherit config file name from parent:
                 parent_appname = Unicode(config=True)
                 def _parent_appname_changed(self, name, old, new):
                     """Derive the config file name from the parent application's name.
                     Does nothing when a config file was specified explicitly.
                     Presumably invoked by traitlets when `parent_appname` changes
                     -- TODO confirm.
                     """
                     if self.config_file_specified:
                         # it was manually specified, ignore
                         return
                     self.config_file_name = new.replace('-','_') + u'_config.py'
                     # don't let this count as specifying the config file
                     self.config_file_specified = False
                 # connection info:
                 ip = Unicode(LOCALHOST, config=True,
                     help="Set the IP or interface on which the kernel will listen.")
                 hb_port = Int(0, config=True, help="set the heartbeat port [default: random]")
                 # NOTE(review): the help strings below still say XREP/XREQ although
                 # init_sockets creates the shell socket as ROUTER -- confirm wording
                 shell_port = Int(0, config=True, help="set the shell (XREP) port [default: random]")
                 iopub_port = Int(0, config=True, help="set the iopub (PUB) port [default: random]")
                 stdin_port = Int(0, config=True, help="set the stdin (XREQ) port [default: random]")
                 # streams, etc.
                 no_stdout = Bool(False, config=True, help="redirect stdout to the null device")
                 no_stderr = Bool(False, config=True, help="redirect stderr to the null device")
                 outstream_class = DottedObjectName('IPython.zmq.iostream.OutStream',
                     config=True, help="The importstring for the OutStream factory")
                 displayhook_class = DottedObjectName('IPython.zmq.displayhook.ZMQDisplayHook',
                     config=True, help="The importstring for the DisplayHook factory")
                 # polling
                 parent = Int(0, config=True,
                     help="""kill this process if its parent dies.  On Windows, the argument
                     specifies the HANDLE of the parent process, otherwise it is simply boolean.
                     """)
                 interrupt = Int(0, config=True,
                     help="""ONLY USED ON WINDOWS
                     Interrupt this process when the parent is signalled.
                     """)
                 def init_crash_handler(self):
                     """Install a verbose, uncoloured traceback printer as sys.excepthook."""
                     # Install minimal exception handling
                     sys.excepthook = FormattedTB(mode='Verbose', color_scheme='NoColor',
                                                  ostream=sys.__stdout__)
                 def init_poller(self):
                     """Create the parent poller, if one is requested.
                     On win32 a poller is created when `interrupt` or `parent` is set;
                     elsewhere only when `parent` is set.  Otherwise `poller` is left
                     untouched.
                     """
                     if sys.platform == 'win32':
                         if self.interrupt or self.parent:
                             self.poller = ParentPollerWindows(self.interrupt, self.parent)
                     elif self.parent:
                         self.poller = ParentPollerUnix()
                 def _bind_socket(self, s, port):
                     """Bind socket `s` on `self.ip` and return the port actually used.
                     A `port` of zero or less selects a random port.
                     """
                     iface = 'tcp://%s' % self.ip
                     if port <= 0:
                         port = s.bind_to_random_port(iface)
                     else:
                         s.bind(iface + ':%i'%port)
                     return port
                 def init_sockets(self):
                     """Create and bind the shell, iopub, stdin and heartbeat channels.
                     The resulting port numbers are stored on the instance, collected
                     in `self.ports`, and logged at critical level.
                     """
                     # Create a context, a session, and the kernel sockets.
                     self.log.info("Starting the kernel at pid: %i", os.getpid())
                     context = zmq.Context.instance()
                     # Uncomment this to try closing the context.
                     # atexit.register(context.term)
-                    self.shell_socket = context.socket(zmq.XREP)
+                    self.shell_socket = context.socket(zmq.ROUTER)
                     self.shell_port = self._bind_socket(self.shell_socket, self.shell_port)
-                    self.log.debug("shell XREP Channel on port: %i"%self.shell_port)
+                    self.log.debug("shell ROUTER Channel on port: %i"%self.shell_port)
                     self.iopub_socket = context.socket(zmq.PUB)
                     self.iopub_port = self._bind_socket(self.iopub_socket, self.iopub_port)
                     self.log.debug("iopub PUB Channel on port: %i"%self.iopub_port)
                     # NOTE(review): stdin is still created and logged as XREQ while the
                     # shell socket uses the new ROUTER name -- confirm this is intended
                     self.stdin_socket = context.socket(zmq.XREQ)
                     self.stdin_port = self._bind_socket(self.stdin_socket, self.stdin_port)
                     self.log.debug("stdin XREQ Channel on port: %i"%self.stdin_port)
                     self.heartbeat = Heartbeat(context, (self.ip, self.hb_port))
                     self.hb_port = self.heartbeat.port
                     self.log.debug("Heartbeat REP Channel on port: %i"%self.hb_port)
                     # Helper to make it easier to connect to an existing kernel, until we have
                     # single-port connection negotiation fully implemented.
                     # set log-level to critical, to make sure it is output
                     self.log.critical("To connect another client to this kernel, use:")
                     self.log.critical("--existing --shell={0} --iopub={1} --stdin={2} --hb={3}".format(
                         self.shell_port, self.iopub_port, self.stdin_port, self.hb_port))
                     self.ports = dict(shell=self.shell_port, iopub=self.iopub_port,
                                             stdin=self.stdin_port, hb=self.hb_port)
                 def init_session(self):
                     """create our session object"""
                     self.session = Session(config=self.config, username=u'kernel')
                 def init_blackhole(self):
                     """redirects stdout/stderr to devnull if necessary"""
                     if self.no_stdout or self.no_stderr:
                         # one shared handle on the null device serves both streams
                         blackhole = file(os.devnull, 'w')
                         if self.no_stdout:
                             sys.stdout = sys.__stdout__ = blackhole
                         if self.no_stderr:
                             sys.stderr = sys.__stderr__ = blackhole
                 def init_io(self):
                     """Redirect input streams and set a display hook."""
                     if self.outstream_class:
                         outstream_factory = import_item(str(self.outstream_class))
                         sys.stdout = outstream_factory(self.session, self.iopub_socket, u'stdout')
                         sys.stderr = outstream_factory(self.session, self.iopub_socket, u'stderr')
                     if self.displayhook_class:
                         displayhook_factory = import_item(str(self.displayhook_class))
                         sys.displayhook = displayhook_factory(self.session, self.iopub_socket)
                 def init_kernel(self):
                     """Create the Kernel object itself"""
                     kernel_factory = import_item(str(self.kernel_class))
                     self.kernel = kernel_factory(config=self.config, session=self.session,
                                             shell_socket=self.shell_socket,
                                             iopub_socket=self.iopub_socket,
                                             stdin_socket=self.stdin_socket,
                                             log=self.log
                     )
                     self.kernel.record_ports(self.ports)
                 def initialize(self, argv=None):
                     """Run the base initialization, then each init_* step in order."""
                     super(KernelApp, self).initialize(argv)
                     self.init_blackhole()
                     self.init_session()
                     self.init_poller()
                     self.init_sockets()
                     self.init_io()
                     self.init_kernel()
                 def start(self):
                     """Start the heartbeat, the poller (if any) and then the kernel.
                     A KeyboardInterrupt raised by the kernel's start() is swallowed.
                     """
                     self.heartbeat.start()
                     if self.poller is not None:
                         self.poller.start()
                     try:
                         self.kernel.start()
                     except KeyboardInterrupt:
                         pass

IPython/zmq/kernelmanager.py

0 +2 -2

             """Base classes to manage the interaction with a running kernel.
             TODO
             * Create logger to handle debugging and console messages.
             """
             #-----------------------------------------------------------------------------
             #  Copyright (C) 2008-2010  The IPython Development Team
             #
             #  Distributed under the terms of the BSD License.  The full license is in
             #  the file COPYING, distributed as part of this software.
             #-----------------------------------------------------------------------------
             #-----------------------------------------------------------------------------
             # Imports
             #-----------------------------------------------------------------------------
             # Standard library imports.
             import atexit
             import errno
             from Queue import Queue, Empty
             from subprocess import Popen
             import signal
             import sys
             from threading import Thread
             import time
             import logging
             # System library imports.
             import zmq
             from zmq import POLLIN, POLLOUT, POLLERR
             from zmq.eventloop import ioloop
             # Local imports.
             from IPython.config.loader import Config
             from IPython.utils import io
             from IPython.utils.localinterfaces import LOCALHOST, LOCAL_IPS
             from IPython.utils.traitlets import HasTraits, Any, Instance, Type, TCPAddress
             from session import Session, Message
             #-----------------------------------------------------------------------------
             # Constants and exceptions
             #-----------------------------------------------------------------------------
             class InvalidPortNumber(Exception):
                 """Raised when a channel is given a port number it cannot use."""
             #-----------------------------------------------------------------------------
             # Utility functions
             #-----------------------------------------------------------------------------
             # some utilities to validate message structure, these might get moved elsewhere
             # if they prove to have more generic utility
             def validate_string_list(lst):
                 """Validate that the input is a list of strings.
                 Parameters
                 ----------
                 lst : object
                     The value to check.
                 Raises
                 ------
                 ValueError
                     If `lst` is not a list, or any element is not a string.
                 """
                 # The offending value is wrapped in a 1-tuple before formatting:
                 # with a bare tuple operand, '%' would unpack it and raise TypeError
                 # instead of the ValueError promised above.
                 if not isinstance(lst, list):
                     raise ValueError('input %r must be a list' % (lst,))
                 for x in lst:
                     if not isinstance(x, basestring):
                         raise ValueError('element %r in list must be a string' % (x,))
             def validate_string_dict(dct):
                 """Validate that the input is a dict with string keys and values.
                 Parameters
                 ----------
                 dct : dict
                     The mapping to check; it is walked with ``iteritems()``.
                 Raises
                 ------
                 ValueError
                     If any key or any value is not a string.
                 """
                 # Keys and values are wrapped in a 1-tuple before formatting: with a
                 # bare tuple operand, '%' would unpack it and raise TypeError instead
                 # of the ValueError promised above.
                 for k,v in dct.iteritems():
                     if not isinstance(k, basestring):
                         raise ValueError('key %r in dict must be a string' % (k,))
                     if not isinstance(v, basestring):
                         raise ValueError('value %r in dict must be a string' % (v,))
             #-----------------------------------------------------------------------------
             # ZMQ Socket Channel classes
             #-----------------------------------------------------------------------------
             class ZMQSocketChannel(Thread):
                 """Thread base class for the channels that talk over a ZMQ socket.
                 This class stores the connection parameters and offers helpers for
                 running the event loop and changing the polled IO state.  The
                 ``socket``, ``ioloop`` and ``iostate`` attributes start out as None.
                 """
                 context = None
                 session = None
                 socket = None
                 ioloop = None
                 iostate = None
                 _address = None
                 def __init__(self, context, session, address):
                     """Create a channel
                     Parameters
                     ----------
                     context : :class:`zmq.Context`
                         The ZMQ context to use.
                     session : :class:`session.Session`
                         The session to use.
                     address : tuple
                         Standard (ip, port) tuple that the kernel is listening on.
                     Raises
                     ------
                     InvalidPortNumber
                         If the port in `address` is 0.
                     """
                     super(ZMQSocketChannel, self).__init__()
                     self.daemon = True
                     self.context = context
                     self.session = session
                     if address[1] == 0:
                         raise InvalidPortNumber('The port number for a channel cannot be 0.')
                     self._address = address
                 def _run_loop(self):
                     """Run the ioloop until it returns, restarting it after EINTR."""
                     while True:
                         try:
                             self.ioloop.start()
                         except zmq.ZMQError as err:
                             if e_is_fatal(err):
                                 raise
                             # interrupted system call: go round and start again
                         else:
                             return
                 def stop(self):
                     """Wait for the channel's thread to finish.
                     This simply calls ``join()`` on the thread.
                     """
                     self.join()
                 @property
                 def address(self):
                     """The (ip, port) tuple this channel was created with."""
                     return self._address
                 def add_io_state(self, state):
                     """Add IO state to the eventloop.
                     Parameters
                     ----------
                     state : zmq.POLLIN|zmq.POLLOUT|zmq.POLLERR
                         The IO state flag to set.
                     The change is not made directly; it is handed to the ioloop
                     through ``add_callback``.
                     """
                     def _set_flag():
                         if self.iostate & state:
                             # already being polled for this state
                             return
                         self.iostate |= state
                         self.ioloop.update_handler(self.socket, self.iostate)
                     self.ioloop.add_callback(_set_flag)
                 def drop_io_state(self, state):
                     """Drop IO state from the eventloop.
                     Parameters
                     ----------
                     state : zmq.POLLIN|zmq.POLLOUT|zmq.POLLERR
                         The IO state flag to clear.
                     The change is not made directly; it is handed to the ioloop
                     through ``add_callback``.
                     """
                     def _clear_flag():
                         if not self.iostate & state:
                             # not being polled for this state, nothing to drop
                             return
                         self.iostate &= ~state
                         self.ioloop.update_handler(self.socket, self.iostate)
                     self.ioloop.add_callback(_clear_flag)
             def e_is_fatal(err):
                 """Return True unless `err` is an interrupted-system-call error."""
                 return err.errno != errno.EINTR
             class ShellSocketChannel(ZMQSocketChannel):
                 """The XREQ channel for issues request/replies to the kernel.
                 """
                 command_queue = None
                 def __init__(self, context, session, address):
                     """Create the channel with its own ioloop and an empty command queue."""
                     super(ShellSocketChannel, self).__init__(context, session, address)
                     self.ioloop = ioloop.IOLoop()
                     self.command_queue = Queue()
                 def run(self):
                     """The thread's main activity.  Call start() instead."""
-                    self.socket = self.context.socket(zmq.XREQ)
+                    self.socket = self.context.socket(zmq.DEALER)
                     # the session id doubles as the socket identity
                     self.socket.setsockopt(zmq.IDENTITY, self.session.session)
                     self.socket.connect('tcp://%s:%i' % self.address)
                     # start out polling for incoming data and errors only
                     self.iostate = POLLERR|POLLIN
                     self.ioloop.add_handler(self.socket, self._handle_events,
                                             self.iostate)
                     self._run_loop()
                 def stop(self):
                     """Stop the ioloop, then let the base class stop the channel."""
                     self.ioloop.stop()
                     super(ShellSocketChannel, self).stop()
                 def call_handlers(self, msg):
                     """Hook called in the ioloop thread whenever a message arrives.
                     Subclasses must override this method to handle incoming messages.
                     Because it runs in the channel's thread, an override has to
                     arrange for application-level handlers to be called in the
                     application thread.
                     """
                     raise NotImplementedError('call_handlers must be defined in a subclass.')
                 def execute(self, code, silent=False,
                             user_variables=None, user_expressions=None):
                     """Execute code in the kernel.
                     Parameters
                     ----------
                     code : str
                         A string of Python code.
                     silent : bool, optional (default False)
                         If set, the kernel will execute the code as quietly as possible.
                     user_variables : list, optional
                         A list of variable names to pull from the user's namespace.  They
                         will come back as a dict with these names as keys and their
                         :func:`repr` as values.
                     user_expressions : dict, optional
                         A dict with string keys and string values, to be evaluated in
                         the user's namespace.  They will come back as a dict with these
                         names as keys and their :func:`repr` as values.
                     Returns
                     -------
                     The msg_id of the message sent.
                     Raises
                     ------
                     ValueError
                         If `code` is not a string, or the two optional arguments fail
                         validation.
                     """
                     if user_variables is None:
                         user_variables = []
                     if user_expressions is None:
                         user_expressions = {}
                     # Don't waste network traffic if inputs are invalid
                     if not isinstance(code, basestring):
                         # wrap in a 1-tuple so a tuple `code` is reported with a
                         # ValueError rather than a formatting TypeError
                         raise ValueError('code %r must be a string' % (code,))
                     validate_string_list(user_variables)
                     validate_string_dict(user_expressions)
                     # Create class for content/msg creation. Related to, but possibly
                     # not in Session.
                     content = dict(code=code, silent=silent,
                                    user_variables=user_variables,
                                    user_expressions=user_expressions)
                     msg = self.session.msg('execute_request', content)
                     self._queue_request(msg)
                     return msg['header']['msg_id']
                 def complete(self, text, line, cursor_pos, block=None):
                     """Queue a tab-completion request for the kernel's namespace.
                     Parameters
                     ----------
                     text : str
                         The text to complete.
                     line : str
                         The whole line surrounding ``text``, used as context for the
                         completion.
                     cursor_pos : int
                         Where in ``line`` the cursor was when completion was requested.
                     block : str, optional
                         The whole block of code in which the completion is requested.
                     Returns
                     -------
                     The msg_id of the message sent.
                     """
                     payload = {
                         'text': text,
                         'line': line,
                         'block': block,
                         'cursor_pos': cursor_pos,
                     }
                     request = self.session.msg('complete_request', payload)
                     # The message is only queued here, not sent synchronously.
                     self._queue_request(request)
                     header = request['header']
                     return header['msg_id']
                 def object_info(self, oname):
                     """Queue a request for metadata about a named object.
                     Parameters
                     ----------
                     oname : str
                         The name of the object to look up.
                     Returns
                     -------
                     The msg_id of the message sent.
                     """
                     request = self.session.msg('object_info_request', {'oname': oname})
                     self._queue_request(request)
                     header = request['header']
                     return header['msg_id']
                 def history(self, raw=True, output=False, hist_access_type='range', **kwargs):
                     """Queue a request for entries from the kernel's history list.
                     Parameters
                     ----------
                     raw : bool
                         If True, return the raw input.
                     output : bool
                         If True, then return the output as well.
                     hist_access_type : str
                         'range' (fill in session, start and stop params), 'tail' (fill in n)
                          or 'search' (fill in pattern param).
                     session : int
                         For a range request, the session from which to get lines. Session
                         numbers are positive integers; negative ones count back from the
                         current session.
                     start : int
                         The first line number of a history range.
                     stop : int
                         The final (excluded) line number of a history range.
                     n : int
                         The number of lines of history to get for a tail request.
                     pattern : str
                         The glob-syntax pattern for a search request.
                     Returns
                     -------
                     The msg_id of the message sent.
                     """
                     # The named options come first; every extra keyword argument is
                     # forwarded verbatim as part of the request content.
                     payload = {
                         'raw': raw,
                         'output': output,
                         'hist_access_type': hist_access_type,
                     }
                     payload.update(kwargs)
                     request = self.session.msg('history_request', payload)
                     self._queue_request(request)
                     header = request['header']
                     return header['msg_id']
                 def shutdown(self, restart=False):
                     """Request an immediate kernel shutdown.
                     Upon receipt of the (empty) reply, client code can safely assume that
                     the kernel has shut down and it's safe to forcefully terminate it if
                     it's still alive.
                     The kernel will send the reply via a function registered with Python's
                     atexit module, ensuring it's truly done as the kernel is done with all
                     normal operation.
                     Parameters
                     ----------
                     restart : bool, optional (default False)
                         Sent to the kernel as the ``restart`` field of the request.
                     Returns
                     -------
                     The msg_id of the message sent.
                     """
                     # Send quit message to kernel. Once we implement kernel-side setattr,
                     # this should probably be done that way, but for now this will do.
                     payload = dict(restart=restart)
                     request = self.session.msg('shutdown_request', payload)
                     self._queue_request(request)
                     header = request['header']
                     return header['msg_id']
                 def _handle_events(self, socket, events):
                     """Dispatch a poll event mask to the matching handlers.
                     The error handler runs first, then the send handler, then the receive
                     handler; ``socket`` is accepted but not used here.
                     """
                     dispatch = (
                         (POLLERR, '_handle_err'),
                         (POLLOUT, '_handle_send'),
                         (POLLIN, '_handle_recv'),
                     )
                     for flag, handler_name in dispatch:
                         if events & flag:
                             getattr(self, handler_name)()
                 def _handle_recv(self):
                     ident,msg = self.session.recv(self.socket, 0)
                     self.call_handlers(msg)
                 def _handle_send(self):
                     """Send at most one queued request, then stop polling for POLLOUT
                     once the queue is empty.
                     """
                     pending = self.command_queue
                     try:
                         # Non-blocking get: raises Empty when nothing is queued.
                         outgoing = pending.get(False)
                     except Empty:
                         pass
                     else:
                         self.session.send(self.socket, outgoing)
                     if not pending.empty():
                         return
                     self.drop_io_state(POLLOUT)
                 def _handle_err(self):
                     """Raise a bare ``zmq.ZMQError`` when the poller reports an error."""
                     # We don't want to let this go silently, so eventually we should log.
                     error = zmq.ZMQError()
                     raise error
                 def _queue_request(self, msg):
                     """Put ``msg`` on the command queue and start polling for POLLOUT."""
                     pending = self.command_queue
                     pending.put(msg)
                     # Ask to be woken when the socket is writable so the queued
                     # message can be sent by _handle_send.
                     self.add_io_state(POLLOUT)
             class SubSocketChannel(ZMQSocketChannel):
                 """The SUB channel which listens for messages that the kernel publishes.
                 Messages are read on the channel's own IOLoop and handed to
                 :meth:`call_handlers`, which subclasses must implement.
                 """
                 def __init__(self, context, session, address):
                     super(SubSocketChannel, self).__init__(context, session, address)
                     self.ioloop = ioloop.IOLoop()
                 def run(self):
                     """The thread's main activity.  Call start() instead."""
                     self.socket = self.context.socket(zmq.SUB)
                     # An empty prefix subscribes to every published message.  A bytes
                     # literal is used, like the heartbeat's b'ping', so the option
                     # value has the same type on every Python version.
                     self.socket.setsockopt(zmq.SUBSCRIBE, b'')
                     self.socket.setsockopt(zmq.IDENTITY, self.session.session)
                     self.socket.connect('tcp://%s:%i' % self.address)
                     # This channel only receives, so POLLOUT is never registered.
                     self.iostate = POLLIN|POLLERR
                     self.ioloop.add_handler(self.socket, self._handle_events,
                                             self.iostate)
                     self._run_loop()
                 def stop(self):
                     """Stop the IOLoop, then run the base class stop logic."""
                     self.ioloop.stop()
                     super(SubSocketChannel, self).stop()
                 def call_handlers(self, msg):
                     """This method is called in the ioloop thread when a message arrives.
                     Subclasses should override this method to handle incoming messages.
                     It is important to remember that this method is called in the thread
                     so that some logic must be done to ensure that the application level
                     handlers are called in the application thread.
                     """
                     raise NotImplementedError('call_handlers must be defined in a subclass.')
                 def flush(self, timeout=1.0):
                     """Immediately processes all pending messages on the SUB channel.
                     Callers should use this method to ensure that :meth:`call_handlers`
                     has been called for all messages that have been received on the
                     0MQ SUB socket of this channel.
                     This method is thread safe.
                     Parameters
                     ----------
                     timeout : float, optional
                         The maximum amount of time to spend flushing, in seconds. The
                         default is one second.
                     """
                     # We do the IOLoop callback process twice to ensure that the IOLoop
                     # gets to perform at least one full poll.
                     stop_time = time.time() + timeout
                     for _ in range(2):
                         self._flushed = False
                         self.ioloop.add_callback(self._flush)
                         # Wait until the IOLoop has run the callback or the overall
                         # deadline has passed, whichever comes first.
                         while not self._flushed and time.time() < stop_time:
                             time.sleep(0.01)
                 def _handle_events(self, socket, events):
                     """Dispatch a poll event mask: errors first, then incoming data."""
                     if events & POLLERR:
                         self._handle_err()
                     if events & POLLIN:
                         self._handle_recv()
                 def _handle_err(self):
                     """Raise a bare ``zmq.ZMQError`` when the poller reports an error."""
                     # We don't want to let this go silently, so eventually we should log.
                     raise zmq.ZMQError()
                 def _handle_recv(self):
                     """Drain the socket, passing every message to call_handlers."""
                     # Get all of the messages we can
                     while True:
                         try:
                             ident,msg = self.session.recv(self.socket)
                         except zmq.ZMQError:
                             # Check the errno?
                             # Will this trigger POLLERR?
                             break
                         else:
                             # A None message means there is nothing more to read.
                             if msg is None:
                                 break
                             self.call_handlers(msg)
                 def _flush(self):
                     """Callback for :meth:`flush`."""
                     self._flushed = True
             class StdInSocketChannel(ZMQSocketChannel):
                 """A reply channel to handle raw_input requests that the kernel makes."""
                 # Queue of reply messages waiting to be sent; a fresh Queue is created
                 # for every instance in __init__.
                 msg_queue = None
                 def __init__(self, context, session, address):
                     super(StdInSocketChannel, self).__init__(context, session, address)
                     self.ioloop = ioloop.IOLoop()
                     self.msg_queue = Queue()
                 def run(self):
                     """The thread's main activity.  Call start() instead."""
-                    self.socket = self.context.socket(zmq.XREQ)
+                    self.socket = self.context.socket(zmq.DEALER)
                     self.socket.setsockopt(zmq.IDENTITY, self.session.session)
                     self.socket.connect('tcp://%s:%i' % self.address)
                     # POLLOUT is only added while a reply is queued (see _queue_reply).
                     self.iostate = POLLERR|POLLIN
                     self.ioloop.add_handler(self.socket, self._handle_events,
                                             self.iostate)
                     self._run_loop()
                 def stop(self):
                     """Stop the IOLoop, then run the base class stop logic."""
                     self.ioloop.stop()
                     super(StdInSocketChannel, self).stop()
                 def call_handlers(self, msg):
                     """This method is called in the ioloop thread when a message arrives.
                     Subclasses should override this method to handle incoming messages.
                     It is important to remember that this method is called in the thread
                     so that some logic must be done to ensure that the application level
                     handlers are called in the application thread.
                     """
                     raise NotImplementedError('call_handlers must be defined in a subclass.')
                 def input(self, string):
                     """Send a string of raw input to the kernel."""
                     content = dict(value=string)
                     msg = self.session.msg('input_reply', content)
                     # The reply is queued here and sent later by _handle_send.
                     self._queue_reply(msg)
                 def _handle_events(self, socket, events):
                     """Dispatch a poll event mask: errors, then sends, then receives."""
                     if events & POLLERR:
                         self._handle_err()
                     if events & POLLOUT:
                         self._handle_send()
                     if events & POLLIN:
                         self._handle_recv()
                 def _handle_recv(self):
                     """Receive one message from the socket and pass it to call_handlers."""
                     ident,msg = self.session.recv(self.socket, 0)
                     self.call_handlers(msg)
                 def _handle_send(self):
                     """Send at most one queued reply, then stop polling for POLLOUT
                     once the queue is empty.
                     """
                     try:
                         # Non-blocking get: raises Empty when nothing is queued.
                         msg = self.msg_queue.get(False)
                     except Empty:
                         pass
                     else:
                         self.session.send(self.socket,msg)
                     if self.msg_queue.empty():
                         self.drop_io_state(POLLOUT)
                 def _handle_err(self):
                     """Raise a bare ``zmq.ZMQError`` when the poller reports an error."""
                     # We don't want to let this go silently, so eventually we should log.
                     raise zmq.ZMQError()
                 def _queue_reply(self, msg):
                     """Put ``msg`` on the reply queue and start polling for POLLOUT."""
                     self.msg_queue.put(msg)
                     self.add_io_state(POLLOUT)
             class HBSocketChannel(ZMQSocketChannel):
                 """The heartbeat channel which monitors the kernel heartbeat.
                 Note that the heartbeat channel is paused by default. As long as you start
                 this channel, the kernel manager will ensure that it is paused and un-paused
                 as appropriate.
                 """
                 # Seconds to wait for a reply to a ping before call_handlers is invoked;
                 # also the sleep interval while the channel is paused.
                 time_to_dead = 3.0
                 socket = None
                 poller = None
                 _running = None
                 _pause = None
                 def __init__(self, context, session, address):
                     super(HBSocketChannel, self).__init__(context, session, address)
                     self._running = False
                     self._pause = True
                 def _create_socket(self):
                     """(Re)create the REQ socket and the poller that watches it."""
                     if self.socket is not None:
                         # run() calls this again to recover from an EFSM error; close
                         # the stale socket instead of leaking one per missed heartbeat.
                         self.socket.close()
                     self.socket = self.context.socket(zmq.REQ)
                     self.socket.setsockopt(zmq.IDENTITY, self.session.session)
                     self.socket.connect('tcp://%s:%i' % self.address)
                     self.poller = zmq.Poller()
                     self.poller.register(self.socket, zmq.POLLIN)
                 def run(self):
                     """The thread's main activity.  Call start() instead."""
                     self._create_socket()
                     self._running = True
                     while self._running:
                         if self._pause:
                             time.sleep(self.time_to_dead)
                             continue
                         request_time = time.time()
                         try:
                             self.socket.send(b'ping')
                         except zmq.ZMQError as e:
                             if e.errno != zmq.EFSM:
                                 raise
                             # The REQ socket is still waiting for the previous reply:
                             # wait, then start over with a fresh socket.
                             time.sleep(self.time_to_dead)
                             self._create_socket()
                             continue
                         # The ping was sent; wait for the reply until time_to_dead
                         # seconds have passed since request_time.
                         while True:
                             try:
                                 self.socket.recv(zmq.NOBLOCK)
                             except zmq.ZMQError as e:
                                 if e.errno != zmq.EAGAIN:
                                     # FIXME: We should probably log this instead.
                                     raise
                                 before_poll = time.time()
                                 until_dead = self.time_to_dead - (before_poll -
                                                                   request_time)
                                 # When the return value of poll() is an empty
                                 # list, that is when things have gone wrong
                                 # (zeromq bug). As long as it is not an empty
                                 # list, poll is working correctly even if it
                                 # returns quickly. Note: poll timeout is in
                                 # milliseconds.
                                 if until_dead > 0.0:
                                     while True:
                                         try:
                                             self.poller.poll(1000 * until_dead)
                                         except zmq.ZMQError as poll_err:
                                             # Retry when the poll was interrupted.
                                             if poll_err.errno == errno.EINTR:
                                                 continue
                                             else:
                                                 raise
                                         else:
                                             break
                                 since_last_heartbeat = time.time()-request_time
                                 if since_last_heartbeat > self.time_to_dead:
                                     # No reply in time: report the elapsed time.
                                     self.call_handlers(since_last_heartbeat)
                                     break
                             else:
                                 # Reply received; sleep out the rest of the interval
                                 # before sending the next ping.
                                 until_dead = self.time_to_dead - (time.time() -
                                                                   request_time)
                                 if until_dead > 0.0:
                                     time.sleep(until_dead)
                                 break
                 def pause(self):
                     """Pause the heartbeat."""
                     self._pause = True
                 def unpause(self):
                     """Unpause the heartbeat."""
                     self._pause = False
                 def is_beating(self):
                     """Is the heartbeat running and not paused."""
                     return self.is_alive() and not self._pause
                 def stop(self):
                     """Make the run() loop exit, then run the base class stop logic."""
                     self._running = False
                     super(HBSocketChannel, self).stop()
                 def call_handlers(self, since_last_heartbeat):
                     """This method is called in the channel's thread when no heartbeat
                     reply was received within ``time_to_dead`` seconds.
                     Subclasses should override this method to react to the missed
                     heartbeat; ``since_last_heartbeat`` is the number of seconds since
                     the unanswered ping was sent.
                     It is important to remember that this method is called in the thread
                     so that some logic must be done to ensure that the application level
                     handlers are called in the application thread.
                     """
                     raise NotImplementedError('call_handlers must be defined in a subclass.')
             #-----------------------------------------------------------------------------
             # Main kernel manager class
             #-----------------------------------------------------------------------------
             class KernelManager(HasTraits):
                 """ Manages a kernel for a frontend.
                 The SUB channel is for the frontend to receive messages published by the
                 kernel.
                 The REQ channel is for the frontend to make requests of the kernel.
                 The REP channel is for the kernel to request stdin (raw_input) from the
                 frontend.
                 """
                 # config object for passing to child configurables
                 config = Instance(Config)
                 # The PyZMQ Context to use for communication with the kernel.
                 context = Instance(zmq.Context)
                 def _context_default(self):
                     """Supply the default value for the ``context`` trait."""
                     shared_context = zmq.Context.instance()
                     return shared_context
                 # The Session to use for communication with the kernel.
                 session = Instance(Session)
                 # The kernel process with which the KernelManager is communicating.
                 kernel = Instance(Popen)
                 # The addresses for the communication channels.
                 shell_address = TCPAddress((LOCALHOST, 0))
                 sub_address = TCPAddress((LOCALHOST, 0))
                 stdin_address = TCPAddress((LOCALHOST, 0))
                 hb_address = TCPAddress((LOCALHOST, 0))
                 # The classes to use for the various channels.
                 shell_channel_class = Type(ShellSocketChannel)
                 sub_channel_class = Type(SubSocketChannel)
                 stdin_channel_class = Type(StdInSocketChannel)
                 hb_channel_class = Type(HBSocketChannel)
                 # Protected traits.
                 _launch_args = Any
                 _shell_channel = Any
                 _sub_channel = Any
                 _stdin_channel = Any
                 _hb_channel = Any
                 def __init__(self, **kwargs):
                     """Initialise the manager and make sure it has a Session.
                     All keyword arguments are forwarded to the parent constructor.  If
                     ``session`` is still None afterwards, a new :class:`Session` is built
                     from ``self.config``.
                     """
                     super(KernelManager, self).__init__(**kwargs)
                     session_missing = self.session is None
                     if session_missing:
                         self.session = Session(config=self.config)
                     # Uncomment this to try closing the context.
                     # atexit.register(self.context.term)
                 #--------------------------------------------------------------------------
                 # Channel management methods:
                 #--------------------------------------------------------------------------
                 def start_channels(self, shell=True, sub=True, stdin=True, hb=True):
                     """Starts the channels for this kernel.
                     This will create the channels if they do not exist and then start
                     them. If port numbers of 0 are being used (random ports) then you
                     must first call :meth:`start_kernel`. If the channels have been
                     stopped and you call this, :class:`RuntimeError` will be raised.
                     Each boolean argument selects whether the channel of the same name
                     is started.
                     """
                     requested = (
                         (shell, 'shell_channel'),
                         (sub, 'sub_channel'),
                         (stdin, 'stdin_channel'),
                         (hb, 'hb_channel'),
                     )
                     for wanted, attr in requested:
                         # Only touch the channel attribute when it was asked for.
                         if wanted:
                             getattr(self, attr).start()
                 def stop_channels(self):
                     """Stops all the running channels for this kernel.
                     Channels that are not alive are left untouched.
                     """
                     names = ('shell_channel', 'sub_channel', 'stdin_channel', 'hb_channel')
                     for attr in names:
                         if getattr(self, attr).is_alive():
                             getattr(self, attr).stop()
                 @property
                 def channels_running(self):
                     """Are any of the channels created and running?"""
                     names = ('shell_channel', 'sub_channel', 'stdin_channel', 'hb_channel')
                     alive = False
                     for attr in names:
                         # Stop at the first live channel; later ones are not touched.
                         alive = getattr(self, attr).is_alive()
                         if alive:
                             break
                     return alive
                 #--------------------------------------------------------------------------
                 # Kernel process management methods:
                 #--------------------------------------------------------------------------
                 def start_kernel(self, **kw):
                     """Starts a kernel process and configures the manager to use it.
                     If random ports (port=0) are being used, this method must be called
                     before the channels are created.
                     Parameters
                     ----------
                     ipython : bool, optional (default True)
                          Whether to use an IPython kernel instead of a plain Python kernel.
                          Only consulted when no ``launcher`` is given.
                     launcher : callable, optional (default None)
                          A custom function for launching the kernel process (generally a
                          wrapper around ``entry_point.base_launch_kernel``). In most cases,
                          it should not be necessary to use this parameter.
                     **kw : optional
                          See respective options for IPython and Python kernels.
                     Raises
                     ------
                     RuntimeError
                          If any of the four channel addresses is not on a local interface.
                     """
                     shell = self.shell_address
                     sub = self.sub_address
                     stdin = self.stdin_address
                     hb = self.hb_address
                     if any(addr[0] not in LOCAL_IPS for addr in (shell, sub, stdin, hb)):
                         raise RuntimeError("Can only launch a kernel on a local interface. "
                                            "Make sure that the '*_address' attributes are "
                                            "configured properly. "
                                            "Currently valid addresses are: %s"%LOCAL_IPS
                                            )
                     # Remember the original arguments (including 'launcher' and
                     # 'ipython') before they are popped below.
                     self._launch_args = kw.copy()
                     launch_kernel = kw.pop('launcher', None)
                     if launch_kernel is None:
                         use_ipython = kw.pop('ipython', True)
                         if use_ipython:
                             from ipkernel import launch_kernel
                         else:
                             from pykernel import launch_kernel
                     launched = launch_kernel(
                         shell_port=shell[1], iopub_port=sub[1],
                         stdin_port=stdin[1], hb_port=hb[1], **kw)
                     self.kernel, shell_port, iopub_port, stdin_port, hb_port = launched
                     # Record the ports reported by the launcher, keeping each host.
                     self.shell_address = (shell[0], shell_port)
                     self.sub_address = (sub[0], iopub_port)
                     self.stdin_address = (stdin[0], stdin_port)
                     self.hb_address = (hb[0], hb_port)
                 def shutdown_kernel(self, restart=False):
                     """Attempt to stop the kernel process cleanly.
                     A shutdown request is sent on the shell channel; if the kernel is
                     still alive about one second later it is killed, if possible.
                     Parameters
                     ----------
                     restart : bool, optional (default False)
                         Passed on to the shell channel's ``shutdown`` request.
                     """
                     # FIXME: Shutdown does not work on Windows due to ZMQ errors!
                     if sys.platform == 'win32':
                         self.kill_kernel()
                         return
                     # Pause the heart beat channel if it exists.
                     heartbeat = self._hb_channel
                     if heartbeat is not None:
                         heartbeat.pause()
                     # Don't send any additional kernel kill messages immediately, to give
                     # the kernel a chance to properly execute shutdown actions. Wait for at
                     # most 1s, checking every 0.1s.
                     self.shell_channel.shutdown(restart=restart)
                     checks = 0
                     while checks < 10 and self.is_alive:
                         time.sleep(0.1)
                         checks += 1
                     # OK, we've waited long enough.
                     if checks == 10 and self.has_kernel:
                         self.kill_kernel()
                 def restart_kernel(self, now=False, **kw):
                     """Restarts a kernel with the arguments that were used to launch it.
                     If the old kernel was launched with random ports, the same ports will be
                     used for the new kernel.
                     Parameters
                     ----------
                     now : bool, optional
                         If True, the kernel is forcefully restarted *immediately*, without
                         having a chance to do any cleanup action.  Otherwise the kernel is
                         given 1s to clean up before a forceful restart is issued.
                         In all cases the kernel is restarted, the only difference is whether
                         it is given a chance to perform a clean shutdown or not.
                     **kw : optional
                         Any options specified here will replace those used to launch the
                         kernel.
                     Raises
                     ------
                     RuntimeError
                         If ``start_kernel`` has not been called before.
                     """
                     if self._launch_args is None:
                         raise RuntimeError("Cannot restart the kernel. "
                                            "No previous call to 'start_kernel'.")
                     # Stop currently running kernel.
                     if self.has_kernel:
                         if now:
                             self.kill_kernel()
                         else:
                             self.shutdown_kernel(restart=True)
                     # Start new kernel.
                     launch_args = self._launch_args
                     launch_args.update(kw)
                     self.start_kernel(**launch_args)
                     # FIXME: Messages get dropped in Windows due to probable ZMQ bug
                     # unless there is some delay here.
                     if sys.platform == 'win32':
                         time.sleep(0.2)
                 @property
                 def has_kernel(self):
                     """Whether a kernel process has been specified for this kernel
                     manager, i.e. whether ``self.kernel`` is set.
                     """
                     process = self.kernel
                     return process is not None
                 def kill_kernel(self):
                     """Kill the running kernel.
                     The heartbeat channel, if one exists, is paused first.  An error from
                     the kill call that only means the process has already terminated is
                     ignored.  Afterwards ``self.kernel`` is reset to None.
                     Raises
                     ------
                     RuntimeError
                         If this manager has no kernel process.
                     OSError
                         If killing the process fails for any other reason.
                     """
                     if not self.has_kernel:
                         raise RuntimeError("Cannot kill kernel. No kernel is running!")
                     # Pause the heart beat channel if it exists.
                     if self._hb_channel is not None:
                         self._hb_channel.pause()
                     # Attempt to kill the kernel.
                     try:
                         self.kernel.kill()
                     except OSError as e:
                         # In Windows, we will get an Access Denied error if the process
                         # has already terminated. Ignore it.
                         if sys.platform == 'win32':
                             if e.winerror != 5:
                                 raise
                         # On Unix, we may get an ESRCH error if the process has already
                         # terminated. Ignore it.
                         else:
                             from errno import ESRCH
                             if e.errno != ESRCH:
                                 raise
                     self.kernel = None
                 def interrupt_kernel(self):
                     """Interrupt the kernel.
                     Unlike ``signal_kernel``, this operation is well supported on all
                     platforms: Windows goes through the kernel's interrupt event, other
                     platforms send SIGINT to the process.
                     Raises
                     ------
                     RuntimeError
                         If this manager has no kernel process.
                     """
                     if not self.has_kernel:
                         raise RuntimeError("Cannot interrupt kernel. No kernel is running!")
                     if sys.platform != 'win32':
                         self.kernel.send_signal(signal.SIGINT)
                         return
                     from parentpoller import ParentPollerWindows as Poller
                     Poller.send_interrupt(self.kernel.win32_interrupt_event)
                 def signal_kernel(self, signum):
                     """Send the signal ``signum`` to the kernel process.

                     Since only SIGTERM is supported on Windows, this method is only
                     useful on Unix systems.

                     Raises RuntimeError if no kernel process is attached.
                     """
                     if not self.has_kernel:
                         raise RuntimeError("Cannot signal kernel. No kernel is running!")
                     self.kernel.send_signal(signum)
                 @property
                 def is_alive(self):
                     """Whether the kernel process is still running.

                     Returns True while ``self.kernel.poll()`` reports no exit status.
                     When no kernel process is attached, True is returned as well.
                     """
                     # FIXME: not using a heartbeat means this method is broken for any
                     # remote kernel, it's only capable of handling local kernels.
                     if not self.has_kernel:
                         # We didn't start the kernel with this KernelManager so we don't
                         # know if it is running. We should use a heartbeat for this case.
                         return True
                     # poll() yields None for as long as the process has not exited.
                     return self.kernel.poll() is None
                 #--------------------------------------------------------------------------
                 # Channels used for communication with the kernel:
                 #--------------------------------------------------------------------------
                 @property
                 def shell_channel(self):
                     """Return the shell channel used to make requests of the kernel.

                     The channel is built with ``shell_channel_class`` on first access
                     and the same object is returned afterwards.
                     """
                     channel = self._shell_channel
                     if channel is None:
                         channel = self.shell_channel_class(
                             self.context, self.session, self.shell_address)
                         self._shell_channel = channel
                     return channel
                 @property
                 def sub_channel(self):
                     """Return the SUB socket channel object.

                     The channel is built with ``sub_channel_class`` on first access
                     and the same object is returned afterwards.
                     """
                     channel = self._sub_channel
                     if channel is None:
                         channel = self.sub_channel_class(
                             self.context, self.session, self.sub_address)
                         self._sub_channel = channel
                     return channel
                 @property
                 def stdin_channel(self):
                     """Return the channel object that handles stdin (raw_input).

                     The channel is built with ``stdin_channel_class`` on first access
                     and the same object is returned afterwards.
                     """
                     channel = self._stdin_channel
                     if channel is None:
                         channel = self.stdin_channel_class(
                             self.context, self.session, self.stdin_address)
                         self._stdin_channel = channel
                     return channel
                 @property
                 def hb_channel(self):
                     """Return the heartbeat channel used to check that the kernel is
                     alive.

                     The channel is built with ``hb_channel_class`` on first access and
                     the same object is returned afterwards.
                     """
                     channel = self._hb_channel
                     if channel is None:
                         channel = self.hb_channel_class(
                             self.context, self.session, self.hb_address)
                         self._hb_channel = channel
                     return channel

docs/source/development/ipython_qt.txt

0 +1 -1

             .. _ipython_qt:
             ====================
             IPython Qt interface
             ====================
             Abstract
             --------
             This is about the implementation of a Qt-based Graphical User Interface (GUI)
             to execute Python code with an interpreter that runs in a separate process and
             the two systems (GUI frontend and interpreter kernel) communicating via the
             ZeroMQ Messaging library.  The bulk of the implementation will be done without
             dependencies on IPython (only on Zmq). Once the key features are ready,
             IPython-specific features can be added using the IPython codebase.
             Project details
             ---------------
             For a long time there has been demand for a graphical user interface for
             IPython, and the project already ships Wx-based prototypes thereof.  But these
             run all code in a single process, making them extremely brittle, as a crash of
             the Python interpreter kills the entire user session.  Here I propose to build
             a Qt-based GUI that will communicate with a separate process for the code
             execution, so that if the interpreter kernel dies, the frontend can continue to
             function after restarting a new kernel (and offering the user the option to
             re-execute all inputs, which the frontend can know).
             This GUI will allow for the easy editing of multi-line input and the convenient
             re-editing of previous blocks of input, which can be displayed in a 2-d
             workspace instead of a line-driven one like today's IPython. This makes it much
             easier to incrementally build and tune a code, by combining the rapid feedback
             cycle of IPython with the ability to edit multiline code with good graphical
             support.
             2-process model pyzmq base
             ~~~~~~~~~~~~~~~~~~~~~~~~~~
             Because users need to keep their data safe, the design is based on a
             2-process model that will be achieved with a simple client/server system with
             `pyzmq <http://www.zeromq.org/bindings:python>`_, so the GUI session does not
             crash if the kernel process does. This will be achieved using this test
             `code
             <http://github.com/fperez/pyzmq/blob/completer/examples/kernel/kernel.py>`_ and
             customizing it to the necessities of the GUI such as queue management with
             discrimination for different frontends connected to the same kernel and tab
             completion. A piece of drafted code for the kernel (server) should look like
             this::
                 def main():
                     c = zmq.Context(1, 1)
                     rep_conn = connection % port_base
                     pub_conn = connection % (port_base+1)
                     print >>sys.__stdout__, "Starting the kernel..."
                     print >>sys.__stdout__, "On:",rep_conn, pub_conn
                     session = Session(username=u'kernel')
-                    reply_socket = c.socket(zmq.XREP)
+                    reply_socket = c.socket(zmq.ROUTER)
                     reply_socket.bind(rep_conn)
                     pub_socket = c.socket(zmq.PUB)
                     pub_socket.bind(pub_conn)
                     stdout = OutStream(session, pub_socket, u'stdout')
                     stderr = OutStream(session, pub_socket, u'stderr')
                     sys.stdout = stdout
                     sys.stderr = stderr
                     display_hook = DisplayHook(session, pub_socket)
                     sys.displayhook = display_hook
                     kernel = Kernel(session, reply_socket, pub_socket)
             This kernel will use two queues (output and input), the input queue will have
             the id of the process(frontend) making the request, type(execute, complete,
             help, etc) and id of the request itself and the string of code to be executed,
             the output queue will have basically the same information just that the string
             is the one to be displayed. This model is used because the kernel needs to maintain
             control of timeouts when multiple requests are sent and keep them indexed.
             Qt based GUI
             ~~~~~~~~~~~~
             Design of the interface is going to be based in cells of code executed on the
             previously defined kernel. It will also have GUI facilities such as toolboxes,
             tooltips to autocomplete code and function summary, highlighting and
             autoindentation.  It will have the cell kind of multiline edition mode so each
             block of code can be edited and executed independently, this can be achieved
             queuing QTextEdit objects (the cell) giving them format so we can discriminate
             outputs from inputs.  One of the main characteristics will be the debug support
             that will show the requested outputs as the debugger (that will be on a popup
             widget) "walks" through the code, this design is to be reviewed with the
             mentor.  `This <http://gfif.udea.edu.co/IPythonQt_snapshot.png>`_ is a
             tentative view of the main window.
             The GUI will check continuously the output queue from the kernel for new
             information to handle. This information has to be handled with care since any
             output will come at anytime and possibly in a different order than requested or
             maybe not appear at all, this could be possible due to a variety of reasons(for
             example tab completion request while the kernel is busy processing another
             frontend's request). This is, if the kernel is busy it won't be possible to
             fulfill the request for a while so the GUI will be prepared to abandon waiting
             for the reply if the user moves on or a certain timeout expires.
             POSSIBLE FUTURE DIRECTIONS
             ---------------------------
             The near future will bring the feature of saving and loading sessions, also
             importing and exporting to different formats like rst, html, pdf and
             python/ipython code, a discussion about this is taking place in the ipython-dev
             mailing list. Also the interaction with a remote kernel and distributed
             computation which is an IPython's project already in development.
             The idea of a mathematica-like help widget (i.e. there will be parts of it that
             will execute as a native session of IPythonQt) is still to be discussed in the
             development mailing list but it's definitively a great idea.

docs/source/development/messaging.txt

0 +8 -8

             .. _messaging:
             ======================
              Messaging in IPython
             ======================
             Introduction
             ============
             This document explains the basic communications design and messaging
             specification for how the various IPython objects interact over a network
             transport.  The current implementation uses the ZeroMQ_ library for messaging
             within and between hosts.
             .. Note::
                This document should be considered the authoritative description of the
                IPython messaging protocol, and all developers are strongly encouraged to
                keep it updated as the implementation evolves, so that we have a single
                common reference for all protocol details.
             The basic design is explained in the following diagram:
             .. image:: figs/frontend-kernel.png
                :width: 450px
                :alt: IPython kernel/frontend messaging architecture.
                :align: center
                :target: ../_images/frontend-kernel.png
             A single kernel can be simultaneously connected to one or more frontends.  The
             kernel has three sockets that serve the following functions:
             1. REQ: this socket is connected to a *single* frontend at a time, and it allows
                the kernel to request input from a frontend when :func:`raw_input` is called.
                The frontend holding the matching REP socket acts as a 'virtual keyboard'
                for the kernel while this communication is happening (illustrated in the
                figure by the black outline around the central keyboard).  In practice,
                frontends may display such kernel requests using a special input widget or
                otherwise indicating that the user is to type input for the kernel instead
                of normal commands in the frontend.
-            2. XREP: this single sockets allows multiple incoming connections from
+            2. ROUTER: this single sockets allows multiple incoming connections from
                frontends, and this is the socket where requests for code execution, object
                information, prompts, etc. are made to the kernel by any frontend.  The
                communication on this socket is a sequence of request/reply actions from
                each frontend and the kernel.
             3. PUB: this socket is the 'broadcast channel' where the kernel publishes all
                side effects (stdout, stderr, etc.) as well as the requests coming from any
-               client over the XREP socket and its own requests on the REP socket.  There
+               client over the ROUTER socket and its own requests on the REP socket.  There
                are a number of actions in Python which generate side effects: :func:`print`
                writes to ``sys.stdout``, errors generate tracebacks, etc.  Additionally, in
                a multi-client scenario, we want all frontends to be able to know what each
                other has sent to the kernel (this can be useful in collaborative scenarios,
                for example).  This socket allows both side effects and the information
-               about communications taking place with one client over the XREQ/XREP channel
+               about communications taking place with one client over the ROUTER/DEALER channel
                to be made available to all clients in a uniform manner.
                All messages are tagged with enough information (details below) for clients
                to know which messages come from their own interaction with the kernel and
                which ones are from other clients, so they can display each type
                appropriately.
             The actual format of the messages allowed on each of these channels is
             specified below.  Messages are dicts of dicts with string keys and values that
             are reasonably representable in JSON.  Our current implementation uses JSON
             explicitly as its message format, but this shouldn't be considered a permanent
             feature.  As we've discovered that JSON has non-trivial performance issues due
             to excessive copying, we may in the future move to a pure pickle-based raw
             message format.  However, it should be possible to easily convert from the raw
             objects to JSON, since we may have non-python clients (e.g. a web frontend).
             As long as it's easy to make a JSON version of the objects that is a faithful
             representation of all the data, we can communicate with such clients.
             .. Note::
                Not all of these have yet been fully fleshed out, but the key ones are, see
                kernel and frontend files for actual implementation details.
             Python functional API
             =====================
             As messages are dicts, they map naturally to a ``func(**kw)`` call form.  We
             should develop, at a few key points, functional forms of all the requests that
             take arguments in this manner and automatically construct the necessary dict
             for sending.
             General Message Format
             ======================
             All messages sent or received by any IPython process should have the following
             generic structure::
                 {
                   # The message header contains a pair of unique identifiers for the
                   # originating session and the actual message id, in addition to the
                   # username for the process that generated the message.  This is useful in
                   # collaborative settings where multiple users may be interacting with the
                   # same kernel simultaneously, so that frontends can label the various
                   # messages in a meaningful way.
                   'header' : {
                                 'msg_id' : uuid,
                                 'username' : str,
                                 'session' : uuid
                                 # All recognized message type strings are listed below.
                                 'msg_type' : str,
                      },
                   # In a chain of messages, the header from the parent is copied so that
                   # clients can track where messages come from.
                   'parent_header' : dict,
                   # The actual content of the message must be a dict, whose structure
                   # depends on the message type.
                   'content' : dict,
                 }
             For each message type, the actual content will differ and all existing message
             types are specified in what follows of this document.
-            Messages on the XREP/XREQ socket
+            Messages on the ROUTER/DEALER socket
             ====================================
             .. _execute:
             Execute
             -------
             This message type is used by frontends to ask the kernel to execute code on
             behalf of the user, in a namespace reserved to the user's variables (and thus
             separate from the kernel's own internal code and variables).
             Message type: ``execute_request``::
                 content = {
                     # Source code to be executed by the kernel, one or more lines.
                 'code' : str,
                 # A boolean flag which, if True, signals the kernel to execute this
                 # code as quietly as possible.  This means that the kernel will compile
                 # the code with 'exec' instead of 'single' (so
                 # sys.displayhook will not fire), and will *not*:
                 #   - broadcast exceptions on the PUB socket
                 #   - do any logging
                 #   - populate any history
                 #
                 # The default is False.
                 'silent' : bool,
                 # A list of variable names from the user's namespace to be retrieved.  What
                 # returns is a JSON string of the variable's repr(), not a python object.
                 'user_variables' : list,
                 # Similarly, a dict mapping names to expressions to be evaluated in the
                 # user's dict.
                 'user_expressions' : dict,
                 }
             The ``code`` field contains a single string (possibly multiline).  The kernel
             is responsible for splitting this into one or more independent execution blocks
             and deciding whether to compile these in 'single' or 'exec' mode (see below for
             detailed execution semantics).
             The ``user_`` fields deserve a detailed explanation.  In the past, IPython had
             the notion of a prompt string that allowed arbitrary code to be evaluated, and
             this was put to good use by many in creating prompts that displayed system
             status, path information, and even more esoteric uses like remote instrument
             status acquired over the network.  But now that IPython has a clean separation
             between the kernel and the clients, the kernel has no prompt knowledge; prompts
             are a frontend-side feature, and it should be even possible for different
             frontends to display different prompts while interacting with the same kernel.
             The kernel now provides the ability to retrieve data from the user's namespace
             after the execution of the main ``code``, thanks to two fields in the
             ``execute_request`` message:
             - ``user_variables``: If only variables from the user's namespace are needed, a
               list of variable names can be passed and a dict with these names as keys and
               their :func:`repr()` as values will be returned.
             - ``user_expressions``: For more complex expressions that require function
               evaluations, a dict can be provided with string keys and arbitrary python
               expressions as values.  The return message will contain also a dict with the
               same keys and the :func:`repr()` of the evaluated expressions as value.
             With this information, frontends can display any status information they wish
             in the form that best suits each frontend (a status line, a popup, inline for a
             terminal, etc).
             .. Note::
                In order to obtain the current execution counter for the purposes of
                displaying input prompts, frontends simply make an execution request with an
                empty code string and ``silent=True``.
             Execution semantics
             ~~~~~~~~~~~~~~~~~~~
             When the silent flag is false, the execution of user code consists of the
             following phases (in silent mode, only the ``code`` field is executed):
             1. Run the ``pre_runcode_hook``.
             2. Execute the ``code`` field, see below for details.
             3. If #2 succeeds, ``user_variables`` and ``user_expressions`` are
                computed.  This ensures that any error in the latter doesn't harm the main
                code execution.
             4. Call any method registered with :meth:`register_post_execute`.
             .. warning::
                The API for running code before/after the main code block is likely to
                change soon.  Both the ``pre_runcode_hook`` and the
                :meth:`register_post_execute` are susceptible to modification, as we find a
                consistent model for both.
             To understand how the ``code`` field is executed, one must know that Python
             code can be compiled in one of three modes (controlled by the ``mode`` argument
             to the :func:`compile` builtin):
             *single*
               Valid for a single interactive statement (though the source can contain
               multiple lines, such as a for loop).  When compiled in this mode, the
               generated bytecode contains special instructions that trigger the calling of
               :func:`sys.displayhook` for any expression in the block that returns a value.
               This means that a single statement can actually produce multiple calls to
               :func:`sys.displayhook`.  For example, a loop where each iteration
               computes an unassigned expression would generate 10 calls::
                   for i in range(10):
                       i**2
             *exec*
               An arbitrary amount of source code, this is how modules are compiled.
               :func:`sys.displayhook` is *never* implicitly called.
             *eval*
               A single expression that returns a value.  :func:`sys.displayhook` is *never*
               implicitly called.
             The ``code`` field is split into individual blocks each of which is valid for
             execution in 'single' mode, and then:
             - If there is only a single block: it is executed in 'single' mode.
             - If there is more than one block:
               * if the last one is a single line long, run all but the last in 'exec' mode
                 and the very last one in 'single' mode.  This makes it easy to type simple
                 expressions at the end to see computed values.
               * if the last one is no more than two lines long, run all but the last in
                 'exec' mode and the very last one in 'single' mode.  This makes it easy to
                 type simple expressions at the end to see computed values.
               * otherwise (last one is also multiline), run all in 'exec' mode as a single
                 unit.
             Any error in retrieving the ``user_variables`` or evaluating the
             ``user_expressions`` will result in a simple error message in the return fields
             of the form::
                [ERROR] ExceptionType: Exception message
             The user can simply send the same variable name or expression for evaluation to
             see a regular traceback.
             Errors in any registered post_execute functions are also reported similarly,
             and the failing function is removed from the post_execution set so that it does
             not continue triggering failures.
             Upon completion of the execution request, the kernel *always* sends a reply,
             with a status code indicating what happened and additional data depending on
             the outcome.  See :ref:`below <execution_results>` for the possible return
             codes and associated data.
             Execution counter (old prompt number)
             ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
             The kernel has a single, monotonically increasing counter of all execution
             requests that are made with ``silent=False``.  This counter is used to populate
             the ``In[n]``, ``Out[n]`` and ``_n`` variables, so clients will likely want to
             display it in some form to the user, which will typically (but not necessarily)
             be done in the prompts.  The value of this counter will be returned as the
             ``execution_count`` field of all ``execute_reply`` messages.
             .. _execution_results:
             Execution results
             ~~~~~~~~~~~~~~~~~
             Message type: ``execute_reply``::
                 content = {
                   # One of: 'ok' OR 'error' OR 'abort'
                   'status' : str,
                   # The global kernel counter that increases by one with each non-silent
                   # executed request.  This will typically be used by clients to display
                   # prompt numbers to the user.  If the request was a silent one, this will
                   # be the current value of the counter in the kernel.
                   'execution_count' : int,
                 }
             When status is 'ok', the following extra fields are present::
                 {
                   # The execution payload is a dict with string keys that may have been
                   # produced by the code being executed.  It is retrieved by the kernel at
                   # the end of the execution and sent back to the front end, which can take
                   # action on it as needed.  See main text for further details.
                   'payload' : dict,
                   # Results for the user_variables and user_expressions.
                   'user_variables' : dict,
                   'user_expressions' : dict,
                   # The kernel will often transform the input provided to it.  If the
                   # '---->' transform had been applied, this is filled, otherwise it's the
                   # empty string.  So transformations like magics don't appear here, only
                   # autocall ones.
                   'transformed_code' : str,
                   }
             .. admonition:: Execution payloads
                The notion of an 'execution payload' is different from a return value of a
                given set of code, which normally is just displayed on the pyout stream
                through the PUB socket.  The idea of a payload is to allow special types of
                code, typically magics, to populate a data container in the IPython kernel
                that will be shipped back to the caller via this channel.  The kernel will
                have an API for this, probably something along the lines of::
                    ip.exec_payload_add(key, value)
                though this API is still in the design stages.  The data returned in this
                payload will allow frontends to present special views of what just happened.
             When status is 'error', the following extra fields are present::
                 {
                   'exc_name' : str,   # Exception name, as a string
                   'exc_value' : str,  # Exception value, as a string
                   # The traceback will contain a list of frames, represented each as a
                   # string.  For now we'll stick to the existing design of ultraTB, which
                   # controls exception level of detail statefully.  But eventually we'll
                   # want to grow into a model where more information is collected and
                   # packed into the traceback object, with clients deciding how little or
                   # how much of it to unpack.  But for now, let's start with a simple list
                   # of strings, since that requires only minimal changes to ultratb as
                   # written.
                   'traceback' : list,
                 }
             When status is 'abort', there are for now no additional data fields.  This
             happens when the kernel was interrupted by a signal.
             Kernel attribute access
             -----------------------
             .. warning::
                This part of the messaging spec is not actually implemented in the kernel
                yet.
             While this protocol does not specify full RPC access to arbitrary methods of
             the kernel object, the kernel does allow read (and in some cases write) access
             to certain attributes.
             The policy for which attributes can be read is: any attribute of the kernel, or
             its sub-objects, that belongs to a :class:`Configurable` object and has been
             declared at the class-level with Traits validation, is in principle accessible
             as long as its name does not begin with a leading underscore.  The attribute
             itself will have metadata indicating whether it allows remote read and/or write
             access.  The message spec follows for attribute read and write requests.
             Message type: ``getattr_request``::
                 content = {
                     # The (possibly dotted) name of the attribute
                     'name' : str,
                 }
             When a ``getattr_request`` fails, there are two possible error types:
             - AttributeError: this type of error was raised when trying to access the
               given name by the kernel itself.  This means that the attribute likely
               doesn't exist.
             - AccessError: the attribute exists but its value is not readable remotely.
             Message type: ``getattr_reply``::
                 content = {
                     # One of ['ok', 'AttributeError', 'AccessError'].
                     'status' : str,
                     # If status is 'ok', a JSON object.
                     'value' : object,
                 }
             Message type: ``setattr_request``::
                 content = {
                     # The (possibly dotted) name of the attribute
                     'name' : str,
                     # A JSON-encoded object, that will be validated by the Traits
                     # information in the kernel
                     'value' : object,
                 }
             When a ``setattr_request`` fails, there are also two possible error types with
             similar meanings  as those of the ``getattr_request`` case, but for writing.
             Message type: ``setattr_reply``::
                 content = {
                     # One of ['ok', 'AttributeError', 'AccessError'].
                     'status' : str,
                 }
             Object information
             ------------------
             One of IPython's most used capabilities is the introspection of Python objects
             in the user's namespace, typically invoked via the ``?`` and ``??`` characters
             (which in reality are shorthands for the ``%pinfo`` magic).  This is used often
             enough that it warrants an explicit message type, especially because frontends
             may want to get object information in response to user keystrokes (like Tab or
             F1) in addition to the user explicitly typing code like ``x??``.
             Message type: ``object_info_request``::
                 content = {
                     # The (possibly dotted) name of the object to be searched in all
                     # relevant namespaces
                     'name' : str,
                     # The level of detail desired.  The default (0) is equivalent to typing
                     # 'x?' at the prompt, 1 is equivalent to 'x??'.
                     'detail_level' : int,
                 }
             The returned information will be a dictionary with keys very similar to the
             field names that IPython prints at the terminal.
             Message type: ``object_info_reply``::
                 content = {
                 # The name the object was requested under
                 'name' : str,
                 # Boolean flag indicating whether the named object was found or not.  If
                 # it's false, all other fields will be empty.
                 'found' : bool,
                 # Flags for magics and system aliases
                 'ismagic' : bool,
                 'isalias' : bool,
                 # The name of the namespace where the object was found ('builtin',
                 # 'magics', 'alias', 'interactive', etc.)
                 'namespace' : str,
                 # The type name will be type.__name__ for normal Python objects, but it
                 # can also be a string like 'Magic function' or 'System alias'
                 'type_name' : str,
                 # The string form of the object, possibly truncated for length if
                 # detail_level is 0
                 'string_form' : str,
                 # For objects with a __class__ attribute this will be set
                 'base_class' : str,
                 # For objects with a __len__ attribute this will be set
                 'length' : int,
                 # If the object is a function, class or method whose file we can find,
                 # we give its full path
                 'file' : str,
                 # For pure Python callable objects, we can reconstruct the object
                 # definition line which provides its call signature.  For convenience this
                 # is returned as a single 'definition' field, but below the raw parts that
                 # compose it are also returned as the argspec field.
                 'definition' : str,
                 # The individual parts that together form the definition string.  Clients
                 # with rich display capabilities may use this to provide a richer and more
                 # precise representation of the definition line (e.g. by highlighting
                 # arguments based on the user's cursor position).  For non-callable
                 # objects, this field is empty.
                 'argspec' : { # The names of all the arguments
                               args : list,
             		  # The name of the varargs (*args), if any
                               varargs : str,
             		  # The name of the varkw (**kw), if any
             		  varkw : str,
             		  # The values (as strings) of all default arguments.  Note
             		  # that these must be matched *in reverse* with the 'args'
             		  # list above, since the first positional args have no default
             		  # value at all.
             		  defaults : list,
             		  },
                 # For instances, provide the constructor signature (the definition of
                 # the __init__ method):
                 'init_definition' : str,
                 # Docstrings: for any object (function, method, module, package) with a
                 # docstring, we show it.  But in addition, we may provide additional
                 # docstrings.  For example, for instances we will show the constructor
                 # and class docstrings as well, if available.
                 'docstring' : str,
                 # For instances, provide the constructor and class docstrings
                 'init_docstring' : str,
                 'class_docstring' : str,
                 # If it's a callable object whose call method has a separate docstring and
                 # definition line:
                 'call_def' : str,
                 'call_docstring' : str,
                 # If detail_level was 1, we also try to find the source code that
                 # defines the object, if possible.  The string 'None' will indicate
                 # that no source was found.
                 'source' : str,
                 }
             Complete
             --------
             Message type: ``complete_request``::
                 content = {
                     # The text to be completed, such as 'a.is'
                 'text' : str,
                 # The full line, such as 'print a.is'.  This allows completers to
                 # make decisions that may require information about more than just the
                 # current word.
                 'line' : str,
                 # The entire block of text where the line is.  This may be useful in the
                 # case of multiline completions where more context may be needed.  Note: if
                 # in practice this field proves unnecessary, remove it to lighten the
                 # messages.
                 'block' : str,
                 # The position of the cursor where the user hit 'TAB' on the line.
                 'cursor_pos' : int,
                 }
             Message type: ``complete_reply``::
                 content = {
                     # The list of all matches to the completion request, such as
                 # ['a.isalnum', 'a.isalpha'] for the above example.
                 'matches' : list
                 }
             History
             -------
             For clients to explicitly request history from a kernel.  The kernel has all
             the actual execution history stored in a single location, so clients can
             request it from the kernel when needed.
             Message type: ``history_request``::
                 content = {
                   # If True, also return output history in the resulting dict.
                   'output' : bool,
                   # If True, return the raw input history, else the transformed input.
                   'raw' : bool,
                   # So far, this can be 'range', 'tail' or 'search'.
                   'hist_access_type' : str,
                   # If hist_access_type is 'range', get a range of input cells. session can
                   # be a positive session number, or a negative number to count back from
                   # the current session.
                   'session' : int,
                   # start and stop are line numbers within that session.
                   'start' : int,
                   'stop' : int,
                   # If hist_access_type is 'tail', get the last n cells.
                   'n' : int,
                   # If hist_access_type is 'search', get cells matching the specified glob
                   # pattern (with * and ? as wildcards).
                   'pattern' : str,
                 }
             Message type: ``history_reply``::
                 content = {
                   # A list of 3-tuples, either:
                   # (session, line_number, input) or
                   # (session, line_number, (input, output)),
                   # depending on whether output was False or True, respectively.
                   'history' : list,
                 }
             Connect
             -------
             When a client connects to the request/reply socket of the kernel, it can issue
             a connect request to get basic information about the kernel, such as the ports
             the other ZeroMQ sockets are listening on. This allows clients to only have
-            to know about a single port (the XREQ/XREP channel) to connect to a kernel.
+            to know about a single port (the DEALER/ROUTER channel) to connect to a kernel.
             Message type: ``connect_request``::
                 content = {
                 }
             Message type: ``connect_reply``::
                 content = {
-                    'xrep_port' : int  # The port the XREP socket is listening on.
+                    'xrep_port' : int  # The port the ROUTER socket is listening on.
                     'pub_port' : int   # The port the PUB socket is listening on.
                     'req_port' : int   # The port the REQ socket is listening on.
                     'hb_port' : int    # The port the heartbeat socket is listening on.
                 }
             Kernel shutdown
             ---------------
             The clients can request the kernel to shut itself down; this is used in
             multiple cases:
             - when the user chooses to close the client application via a menu or window
               control.
             - when the user types 'exit' or 'quit' (or their uppercase magic equivalents).
             - when the user chooses a GUI method (like the 'Ctrl-C' shortcut in the
               IPythonQt client) to force a kernel restart to get a clean kernel without
               losing client-side state like history or inlined figures.
             The client sends a shutdown request to the kernel, and once it receives the
             reply message (which is otherwise empty), it can assume that the kernel has
             completed shutdown safely.
             Upon their own shutdown, client applications will typically execute a last
             minute sanity check and forcefully terminate any kernel that is still alive, to
             avoid leaving stray processes in the user's machine.
             For both shutdown request and reply, the only content is a ``restart`` flag
             indicating whether the shutdown is final or precedes a restart.
             Message type: ``shutdown_request``::
                 content = {
                     'restart' : bool # whether the shutdown is final, or precedes a restart
                 }
             Message type: ``shutdown_reply``::
                 content = {
                     'restart' : bool # whether the shutdown is final, or precedes a restart
                 }
             .. Note::
                When the clients detect a dead kernel thanks to inactivity on the heartbeat
                socket, they simply send a forceful process termination signal, since a dead
                process is unlikely to respond in any useful way to messages.
             Messages on the PUB/SUB socket
             ==============================
             Streams (stdout,  stderr, etc)
             ------------------------------
             Message type: ``stream``::
                 content = {
                     # The name of the stream is one of 'stdin', 'stdout', 'stderr'
                     'name' : str,
                     # The data is an arbitrary string to be written to that stream
                     'data' : str,
                 }
             When a kernel receives a raw_input call, it should also broadcast it on the pub
             socket with the names 'stdin' and 'stdin_reply'.  This will allow other clients
             to monitor/display kernel interactions and possibly replay them to their user
             or otherwise expose them.
             Display Data
             ------------
             This type of message is used to bring back data that should be displayed (text,
             html, svg, etc.) in the frontends. This data is published to all frontends.
             Each message can have multiple representations of the data; it is up to the
             frontend to decide which to use and how. A single message should contain all
             possible representations of the same information. Each representation should
             be a JSON'able data structure, and should be a valid MIME type.
             Some questions remain about this design:
             * Do we use this message type for pyout/displayhook? Probably not, because
               the displayhook also has to handle the Out prompt display. On the other hand
               we could put that information into the metadata section.
             Message type: ``display_data``::
                 content = {
                     # Who created the data
                     'source' : str,
                     # The data dict contains key/value pairs, where the keys are MIME
                     # types and the values are the raw data of the representation in that
                     # format. The data dict must minimally contain the ``text/plain``
                     # MIME type which is used as a backup representation.
                     'data' : dict,
                     # Any metadata that describes the data
                     'metadata' : dict
                 }
             Python inputs
             -------------
             These messages are the re-broadcast of the ``execute_request``.
             Message type: ``pyin``::
                 content = {
                     'code' : str  # Source code to be executed, one or more lines
                 }
             Python outputs
             --------------
             When Python produces output from code that has been compiled in with the
             'single' flag to :func:`compile`, any expression that produces a value (such as
             ``1+1``) is passed to ``sys.displayhook``, which is a callable that can do with
             this value whatever it wants.  The default behavior of ``sys.displayhook`` in
             the Python interactive prompt is to print to ``sys.stdout`` the :func:`repr` of
             the value as long as it is not ``None`` (which isn't printed at all).  In our
             case, the kernel instantiates as ``sys.displayhook`` an object which has
             similar behavior, but which instead of printing to stdout, broadcasts these
             values as ``pyout`` messages for clients to display appropriately.
             IPython's displayhook can handle multiple simultaneous formats depending on its
             configuration. The default pretty-printed repr text is always given with the
             ``data`` entry in this message. Any other formats are provided in the
             ``extra_formats`` list. Frontends are free to display any or all of these
             according to their capabilities. The ``extra_formats`` list contains 3-tuples of an ID
             string, a type string, and the data. The ID is unique to the formatter
             implementation that created the data. Frontends will typically ignore the ID
             unless they have requested a particular formatter. The type string tells the
             frontend how to interpret the data. It is often, but not always, a MIME type.
             Frontends should ignore types that they do not understand. The data itself is
             any JSON object and depends on the format. It is often, but not always, a string.
             Message type: ``pyout``::
                 content = {
                     # The counter for this execution is also provided so that clients can
                     # display it, since IPython automatically creates variables called _N
                     # (for prompt N).
                     'execution_count' : int,
                     # The data dict contains key/value pairs, where the keys are MIME
                     # types and the values are the raw data of the representation in that
                     # format. The data dict must minimally contain the ``text/plain``
                     # MIME type which is used as a backup representation.
                     'data' : dict,
                 }
             Python errors
             -------------
             When an error occurs during code execution, the kernel broadcasts a ``pyerr``
             message describing it.
             Message type: ``pyerr``::
                 content = {
                    # Similar content to the execute_reply messages for the 'error' case,
                    # except the 'status' field is omitted.
                 }
             Kernel status
             -------------
             This message type is used by frontends to monitor the status of the kernel.
             Message type: ``status``::
                 content = {
                     # When the kernel starts to execute code, it will enter the 'busy'
                     # state and when it finishes, it will enter the 'idle' state.
                     execution_state : ('busy', 'idle')
                 }
             Kernel crashes
             --------------
             When the kernel has an unexpected exception, caught by the last-resort
             sys.excepthook, we should broadcast the crash handler's output before exiting.
             This will allow clients to notice that a kernel died, inform the user and
             propose further actions.
             Message type: ``crash``::
                 content = {
                    # Similarly to the 'error' case for execute_reply messages, this will
                    # contain exc_name, exc_type and traceback fields.
                    # An additional field with supplementary information such as where to
                    # send the crash message
                    'info' : str,
                 }
             Future ideas
             ------------
             Other potential message types, currently unimplemented, listed below as ideas.
             Message type: ``file``::
                 content = {
                 'path' : 'cool.jpg',
                 'mimetype' : str,
                 'data' : str,
                 }
             Messages on the REQ/REP socket
             ==============================
             This is a socket that goes in the opposite direction: from the kernel to a
             *single* frontend, and its purpose is to allow ``raw_input`` and similar
             operations that read from ``sys.stdin`` on the kernel to be fulfilled by the
             client.  For now we will keep these messages as simple as possible, since they
             basically only mean to convey the ``raw_input(prompt)`` call.
             Message type: ``input_request``::
                 content = { 'prompt' : str }
             Message type: ``input_reply``::
                 content = { 'value' : str }
             .. Note::
                We do not explicitly try to forward the raw ``sys.stdin`` object, because in
                practice the kernel should behave like an interactive program.  When a
                program is opened on the console, the keyboard effectively takes over the
                ``stdin`` file descriptor, and it can't be used for raw reading anymore.
                Since the IPython kernel effectively behaves like a console program (albeit
                one whose "keyboard" is actually living in a separate process and
                transported over the zmq connection), raw ``stdin`` isn't expected to be
                available.
             Heartbeat for kernels
             =====================
             Initially we had considered using messages like those above over ZMQ for a
             kernel 'heartbeat' (a way to detect quickly and reliably whether a kernel is
             alive at all, even if it may be busy executing user code).  But this has the
             problem that if the kernel is locked inside extension code, it wouldn't execute
             the python heartbeat code.  But it turns out that we can implement a basic
             heartbeat with pure ZMQ, without using any Python messaging at all.
             The monitor sends out a single zmq message (right now, it is a str of the
             monitor's lifetime in seconds), and gets the same message right back, prefixed
-            with the zmq identity of the XREQ socket in the heartbeat process. This can be
+            with the zmq identity of the DEALER socket in the heartbeat process. This can be
             a uuid, or even a full message, but there doesn't seem to be a need for packing
             up a message when the sender and receiver are the exact same Python object.
             The model is this::
                 monitor.send(str(self.lifetime)) # '1.2345678910'
             and the monitor receives some number of messages of the form::
                 ['uuid-abcd-dead-beef', '1.2345678910']
-            where the first part is the zmq.IDENTITY of the heart's XREQ on the engine, and
+            where the first part is the zmq.IDENTITY of the heart's DEALER on the engine, and
             the rest is the message sent by the monitor.  No Python code ever has any
             access to the message between the monitor's send, and the monitor's recv.
             ToDo
             ====
             Missing things include:
             * Important: finish thinking through the payload concept and API.
             * Important: ensure that we have a good solution for magics like %edit.  It's
               likely that with the payload concept we can build a full solution, but not
               100% clear yet.
             * Finishing the details of the heartbeat protocol.
             * Signal handling: specify what kind of information kernel should broadcast (or
               not) when it receives signals.
             .. include:: ../links.rst

docs/source/development/parallel_connections.txt

0 +16 -16

             .. _parallel_connections:
             ==============================================
             Connection Diagrams of The IPython ZMQ Cluster
             ==============================================
             This is a quick summary and illustration of the connections involved in the ZeroMQ based
             IPython cluster for parallel computing.
             All Connections
             ===============
             The IPython cluster consists of a Controller, and one or more each of clients and engines.
             The goal of the Controller is to manage and monitor the connections and communications
             between the clients and the engines.  The Controller is no longer a single process entity,
             but rather a collection of processes - specifically one Hub, and 4 (or more) Schedulers.
             It is important for security/practicality reasons that all connections be inbound to the
             controller processes. The arrows in the figures indicate the direction of the
             connection.
             .. figure:: figs/allconnections.png
                 :width: 432px
                 :alt: IPython cluster connections
                 :align: center
                 All the connections involved in connecting one client to one engine.
             The Controller consists of 1-4 processes. Central to the cluster is the **Hub**, which monitors
             engine state, execution traffic, and handles registration and notification. The Hub includes a
             Heartbeat Monitor for keeping track of engines that are alive. Outside the Hub are 4
             **Schedulers**. These devices are very small pure-C MonitoredQueue processes (or optionally
             threads) that relay messages very fast, but also send a copy of each message along a side socket
             to the Hub. The MUX queue and Control queue are MonitoredQueue ØMQ devices which relay
             explicitly addressed messages from clients to engines, and their replies back up. The Balanced
             queue performs load-balancing destination-agnostic scheduling. It may be a MonitoredQueue
             device, but may also be a Python Scheduler that behaves externally in an identical fashion to MQ
             devices, but with additional internal logic. stdout/err are also propagated from the Engines to
             the clients via a PUB/SUB MonitoredQueue.
             Registration
             ------------
             .. figure:: figs/queryfade.png
                 :width: 432px
                 :alt: IPython Registration connections
                 :align: center
-                Engines and Clients only need to know where the Query ``XREP`` is located to start
+                Engines and Clients only need to know where the Query ``ROUTER`` is located to start
                 connecting.
             Once a controller is launched, the only information needed for connecting clients and/or
-            engines is the IP/port of the Hub's ``XREP`` socket called the Registrar. This socket
+            engines is the IP/port of the Hub's ``ROUTER`` socket called the Registrar. This socket
             handles connections from both clients and engines, and replies with the remaining
             information necessary to establish the remaining connections. Clients use this same socket for
             querying the Hub for state information.
             Heartbeat
             ---------
             .. figure:: figs/hbfade.png
                 :width: 432px
                 :alt: IPython Heartbeat connections
                 :align: center
                 The heartbeat sockets.
             The heartbeat process has been described elsewhere. To summarize: the Heartbeat Monitor
             publishes a distinct message periodically via a ``PUB`` socket. Each engine has a
-            ``zmq.FORWARDER`` device with a ``SUB`` socket for input, and ``XREQ`` socket for output.
+            ``zmq.FORWARDER`` device with a ``SUB`` socket for input, and ``DEALER`` socket for output.
-            The ``SUB`` socket is connected to the ``PUB`` socket labeled *ping*, and the ``XREQ`` is
+            The ``SUB`` socket is connected to the ``PUB`` socket labeled *ping*, and the ``DEALER`` is
-            connected to the ``XREP`` labeled *pong*. This results in the same message being relayed
+            connected to the ``ROUTER`` labeled *pong*. This results in the same message being relayed
-            back to the Heartbeat Monitor with the addition of the ``XREQ`` prefix. The Heartbeat
+            back to the Heartbeat Monitor with the addition of the ``DEALER`` prefix. The Heartbeat
-            Monitor receives all the replies via an ``XREP`` socket, and identifies which hearts are
+            Monitor receives all the replies via a ``ROUTER`` socket, and identifies which hearts are
-            still beating by the ``zmq.IDENTITY`` prefix of the ``XREQ`` sockets, which information
+            still beating by the ``zmq.IDENTITY`` prefix of the ``DEALER`` sockets, which information
             the Hub uses to notify clients of any changes in the available engines.
             Schedulers
             ----------
             .. figure:: figs/queuefade.png
                 :width: 432px
                 :alt: IPython Queue connections
                 :align: center
                 Control message scheduler on the left, execution (apply) schedulers on the right.
             The controller has at least three Schedulers. These devices are primarily for
             relaying messages between clients and engines, but the Hub needs to see those
             messages for its own purposes. Since no Python code may exist between the two sockets in a
             queue, all messages sent through these queues (both directions) are also sent via a
             ``PUB`` socket to a monitor, which allows the Hub to monitor queue traffic without
             interfering with it.
-            For tasks, the engine need not be specified. Messages sent to the ``XREP`` socket from the
+            For tasks, the engine need not be specified. Messages sent to the ``ROUTER`` socket from the
-            client side are assigned to an engine via ZMQ's ``XREQ`` round-robin load balancing.
+            client side are assigned to an engine via ZMQ's ``DEALER`` round-robin load balancing.
             Engine replies are directed to specific clients via the IDENTITY of the client, which is
             received as a prefix at the Engine.
-            For Multiplexing, ``XREP`` is used for both in and output sockets in the device. Clients must
+            For Multiplexing, ``ROUTER`` is used for both in and output sockets in the device. Clients must
-            specify the destination by the ``zmq.IDENTITY`` of the ``XREP`` socket connected to
+            specify the destination by the ``zmq.IDENTITY`` of the ``ROUTER`` socket connected to
             the downstream end of the device.
-            At the Kernel level, both of these ``XREP`` sockets are treated in the same way as the ``REP``
+            At the Kernel level, both of these ``ROUTER`` sockets are treated in the same way as the ``REP``
             socket in the serial version (except using ZMQStreams instead of explicit sockets).
             Execution can be done in a load-balanced (engine-agnostic) or multiplexed (engine-specified)
             manner. The sockets on the Client and Engine are the same for these two actions, but the
             scheduler used determines the actual behavior. This routing is done via the ``zmq.IDENTITY`` of
             the upstream sockets in each MonitoredQueue.
             IOPub
             -----
             .. figure:: figs/iopubfade.png
                 :width: 432px
                 :alt: IOPub connections
                 :align: center
                 stdout/err are published via a ``PUB/SUB`` MonitoredQueue
             On the kernels, stdout/stderr are captured and published via a ``PUB`` socket. These ``PUB``
             sockets all connect to a ``SUB`` socket input of a MonitoredQueue, which subscribes to all
             messages. They are then republished via another ``PUB`` socket, which can be
             subscribed by the clients.
             Client connections
             ------------------
             .. figure:: figs/queryfade.png
                 :width: 432px
                 :alt: IPython client query connections
                 :align: center
-                Clients connect to an ``XREP`` socket to query the hub.
+                Clients connect to a ``ROUTER`` socket to query the hub.
-            The hub's registrar ``XREP`` socket also listens for queries from clients as to queue status,
+            The hub's registrar ``ROUTER`` socket also listens for queries from clients as to queue status,
-            and control instructions. Clients connect to this socket via an ``XREQ`` during registration.
+            and control instructions. Clients connect to this socket via a ``DEALER`` during registration.
             .. figure:: figs/notiffade.png
                 :width: 432px
                 :alt: IPython Registration connections
                 :align: center
                 Engine registration events are published via a ``PUB`` socket.
             The Hub publishes all registration/unregistration events via a ``PUB`` socket. This
             allows clients to stay up to date with what engines are available by subscribing to the
             feed with a ``SUB`` socket. Other processes could selectively subscribe to just
             registration or unregistration events.

docs/source/development/parallel_messages.txt

0 +9 -9

             .. _parallel_messages:
             Messaging for Parallel Computing
             ================================
             This is an extension of the :ref:`messaging <messaging>` doc. Diagrams of the connections
             can be found in the :ref:`parallel connections <parallel_connections>` doc.
             ZMQ messaging is also used in the parallel computing IPython system. All messages to/from
             kernels remain the same as the single kernel model, and are forwarded through a ZMQ Queue
             device. The controller receives all messages and replies in these channels, and saves
             results for future use.
             The Controller
             --------------
             The controller is the central collection of processes in the IPython parallel computing
             model. It has two major components:
                 * The Hub
                 * A collection of Schedulers
             The Hub
             -------
             The Hub is the central process for monitoring the state of the engines, and all task
             requests and results.  It has no role in execution and does no relay of messages, so
             large blocking requests or database actions in the Hub do not have the ability to impede
             job submission and results.
-            Registration (``XREP``)
+            Registration (``ROUTER``)
             *************************
             The first function of the Hub is to facilitate and monitor connections of clients
             and engines. Both client and engine registration are handled by the same socket, so only
             one ip/port pair is needed to connect any number of connections and clients.
-            Engines register with the ``zmq.IDENTITY`` of their two ``XREQ`` sockets, one for the
+            Engines register with the ``zmq.IDENTITY`` of their two ``DEALER`` sockets, one for the
             queue, which receives execute requests, and one for the heartbeat, which is used to
             monitor the survival of the Engine process.
             Message type: ``registration_request``::
                 content = {
                     'queue'   : 'abcd-1234-...', # the MUX queue zmq.IDENTITY
                     'control'   : 'abcd-1234-...', # the control queue zmq.IDENTITY
                     'heartbeat' : 'abcd-1234-...' # the heartbeat zmq.IDENTITY
                 }
             .. note::
                 these are always the same, at least for now.
             The Controller replies to an Engine's registration request with the engine's integer ID,
             and all the remaining connection information for connecting the heartbeat process, and
             kernel queue socket(s). The message status will be an error if the Engine requests IDs that
             are already in use.
             Message type: ``registration_reply``::
                 content = {
                     'status' : 'ok', # or 'error'
                     # if ok:
                     'id' : 0, # int, the engine id
                     'queue' : 'tcp://127.0.0.1:12345', # connection for engine side of the queue
                     'control' : 'tcp://...', # addr for control queue
                     'heartbeat' : ('tcp://...','tcp://...'), # tuple containing two interfaces needed for heartbeat
                     'task' : 'tcp://...', # addr for task queue, or None if no task queue running
                 }
             Clients use the same socket as engines to start their connections. Connection requests
             from clients need no information:
             Message type: ``connection_request``::
                 content = {}
             The reply to a Client registration request contains the connection information for the
             multiplexer and load balanced queues, as well as the address for direct hub
             queries. If any of these addresses is `None`, that functionality is not available.
             Message type: ``connection_reply``::
                 content = {
                     'status' : 'ok', # or 'error'
                     # if ok:
                     'queue' : 'tcp://127.0.0.1:12345', # connection for client side of the MUX queue
                     'task' : ('lru','tcp...'), # routing scheme and addr for task queue (len 2 tuple)
                     'query' : 'tcp...', # addr for methods to query the hub, like queue_request, etc.
                     'control' : 'tcp...', # addr for control methods, like abort, etc.
                 }
             Heartbeat
             *********
             The hub uses a heartbeat system to monitor engines, and track when they become
             unresponsive. This is described in :ref:`messaging <messaging>`, and shown in :ref:`connections
             <parallel_connections>`.
             Notification (``PUB``)
             **********************
             The hub publishes all engine registration/unregistration events on a ``PUB`` socket.
             This allows clients to have up-to-date engine ID sets without polling. Registration
             notifications contain both the integer engine ID and the queue ID, which is necessary for
             sending messages via the Multiplexer Queue and Control Queues.
             Message type: ``registration_notification``::
                 content = {
                     'id' : 0, # engine ID that has been registered
                     'queue' : 'engine_id' # the IDENT for the engine's queue
                 }
             Message type : ``unregistration_notification``::
                 content = {
                     'id' : 0 # engine ID that has been unregistered
                 }
-            Client Queries (``XREP``)
+            Client Queries (``ROUTER``)
             ***************************
             The hub monitors and logs all queue traffic, so that clients can retrieve past
             results or monitor pending tasks. This information may reside in-memory on the Hub, or
             on disk in a database (SQLite and MongoDB are currently supported).  These requests are
             handled by the same socket as registration.
             :func:`queue_request` requests can specify multiple engines to query via the `targets`
             element. A verbose flag can be passed, to determine whether the result should be the list
             of `msg_ids` in the queue or simply the length of each list.
             Message type: ``queue_request``::
                 content = {
                     'verbose' : True, # whether return should be lists themselves or just lens
                     'targets' : [0,3,1] # list of ints
                 }
             The content of a reply to a :func:`queue_request` request is a dict, keyed by the engine
             IDs. Note that they will be the string representation of the integer keys, since JSON
             cannot handle number keys.  The three keys of each dict are::
                 'completed' :  messages submitted via any queue that ran on the engine
                 'queue' : jobs submitted via MUX queue, whose results have not been received
                 'tasks' : tasks that are known to have been submitted to the engine, but
                             have not completed.  Note that with the pure zmq scheduler, this will
                             always be 0/[].
             Message type: ``queue_reply``::
                 content = {
                     'status' : 'ok', # or 'error'
                     # if verbose=False:
                     '0' : {'completed' : 1, 'queue' : 7, 'tasks' : 0},
                     # if verbose=True:
                     '1' : {'completed' : ['abcd-...','1234-...'], 'queue' : ['58008-'], 'tasks' : []},
                 }
             Clients can request individual results directly from the hub. This is primarily for
             gathering results of executions not submitted by the requesting client, as the client
             will have all its own results already. Requests are made by msg_id, and can contain one or
             more msg_id. An additional boolean key 'statusonly' can be used to not request the
             results, but simply poll the status of the jobs.
             Message type: ``result_request``::
                 content = {
                     'msg_ids' : ['uuid','...'], # list of strs
                     'targets' : [1,2,3], # list of int ids or uuids
                     'statusonly' : False, # bool
                 }
             The :func:`result_request` reply contains the content objects of the actual execution
             reply messages. If `statusonly=True`, then there will be only the 'pending' and
             'completed' lists.
             Message type: ``result_reply``::
                 content = {
                     'status' : 'ok', # else error
                     # if ok:
                     'acbd-...' : msg, # the content dict is keyed by msg_ids,
                                      # values are the result messages
                                     # there will be none of these if `statusonly=True`
                     'pending' : ['msg_id','...'], # msg_ids still pending
                     'completed' : ['msg_id','...'], # list of completed msg_ids
                 }
                 buffers = ['bufs','...'] # the buffers that contained the results of the objects.
                                         # this will be empty if no messages are complete, or if
                                         # statusonly is True.
             For memory management purposes, Clients can also instruct the hub to forget the
             results of messages. This can be done by message ID or engine ID. Individual messages are
             dropped by msg_id, and all messages completed on an engine are dropped by engine ID. This
             may no longer be necessary with the mongodb-based message logging backend.
             If the msg_ids element is the string ``'all'`` instead of a list, then all completed
             results are forgotten.
             Message type: ``purge_request``::
                 content = {
                     'msg_ids' : ['id1', 'id2',...], # list of msg_ids or 'all'
                     'engine_ids' : [0,2,4] # list of engine IDs
                 }
             The reply to a purge request is simply the status 'ok' if the request succeeded, or an
             explanation of why it failed, such as requesting the purge of a nonexistent or pending
             message.
             Message type: ``purge_reply``::
                 content = {
                     'status' : 'ok', # or 'error'
                 }
             Schedulers
             ----------
             There are three basic schedulers:
               * Task Scheduler
               * MUX Scheduler
               * Control Scheduler
-            The MUX and Control schedulers are simple MonitoredQueue ØMQ devices, with ``XREP``
+            The MUX and Control schedulers are simple MonitoredQueue ØMQ devices, with ``ROUTER``
             sockets on either side. This allows the queue to relay individual messages to particular
             targets via ``zmq.IDENTITY`` routing. The Task scheduler may be a MonitoredQueue ØMQ
-            device, in which case the client-facing socket is ``XREP``, and the engine-facing socket
+            device, in which case the client-facing socket is ``ROUTER``, and the engine-facing socket
-            is ``XREQ``.  The result of this is that client-submitted messages are load-balanced via
+            is ``DEALER``.  The result of this is that client-submitted messages are load-balanced via
-            the ``XREQ`` socket, but the engine's replies to each message go to the requesting client.
+            the ``DEALER`` socket, but the engine's replies to each message go to the requesting client.
-            Raw ``XREQ`` scheduling is quite primitive, and doesn't allow message introspection, so
+            Raw ``DEALER`` scheduling is quite primitive, and doesn't allow message introspection, so
             there are also Python Schedulers that can be used. These Schedulers behave in much the
             same way as a MonitoredQueue does from the outside, but have rich internal logic to
             determine destinations, as well as handle dependency graphs. Their sockets are always
-            ``XREP`` on both sides.
+            ``ROUTER`` on both sides.
             The Python task schedulers have an additional message type, which informs the Hub of
             the destination of a task as soon as that destination is known.
             Message type: ``task_destination``::
                 content = {
                     'msg_id' : 'abcd-1234-...', # the msg's uuid
                     'engine_id' : '1234-abcd-...', # the destination engine's zmq.IDENTITY
                 }
             :func:`apply` and :func:`apply_bound`
             *************************************
             In terms of message classes, the MUX scheduler and Task scheduler relay the exact same
             message types.  Their only difference lies in how the destination is selected.
             The `Namespace <http://gist.github.com/483294>`_ model suggests that execution be able to
             use the model::
                 ns.apply(f, *args, **kwargs)
             which takes `f`, a function in the user's namespace, and executes ``f(*args, **kwargs)``
             on a remote engine, returning the result (or, for non-blocking, information facilitating
             later retrieval of the result). This model, unlike the execute message which just uses a
             code string, must be able to send arbitrary (pickleable) Python objects. And ideally, copy
             as little data as we can. The `buffers` property of a Message was introduced for this
             purpose.
             Utility method :func:`build_apply_message` in :mod:`IPython.zmq.streamsession` wraps a
             function signature and builds a sendable buffer format for minimal data copying (exactly
             zero copies of numpy array data or buffers or large strings).
             Message type: ``apply_request``::
                 content = {
                     'bound' : True, # whether to execute in the engine's namespace or unbound
                     'after' : ['msg_id',...], # list of msg_ids or output of Dependency.as_dict()
                     'follow' : ['msg_id',...], # list of msg_ids or output of Dependency.as_dict()
                 }
                 buffers = ['...'] # at least 3 in length
                                 # as built by build_apply_message(f,args,kwargs)
             after/follow represent task dependencies. 'after' corresponds to a time dependency. The
             request will not arrive at an engine until the 'after' dependency tasks have completed.
             'follow' corresponds to a location dependency. The task will be submitted to the same
             engine as these msg_ids (see :class:`Dependency` docs for details).
             Message type: ``apply_reply``::
                 content = {
                     'status' : 'ok' # 'ok' or 'error'
                     # other error info here, as in other messages
                 }
                 buffers = ['...'] # either 1 or 2 in length
                                 # a serialization of the return value of f(*args,**kwargs)
                                 # only populated if status is 'ok'
             All engine execution and data movement is performed via apply messages.
             Control Messages
             ----------------
             Messages that interact with the engines, but are not meant to execute code, are submitted
             via the Control queue. These messages have high priority, and are thus received and
             handled before any execution requests.
             Clients may want to clear the namespace on the engine. There are no arguments nor
             information involved in this request, so the content is empty.
             Message type: ``clear_request``::
                 content = {}
             Message type: ``clear_reply``::
                 content = {
                     'status' : 'ok' # 'ok' or 'error'
                     # other error info here, as in other messages
                 }
             Clients may want to abort tasks that have not yet run. This can be done by message id, or
             all enqueued messages can be aborted if None is specified.
             Message type: ``abort_request``::
                 content = {
                     'msg_ids' : ['1234-...', '...'] # list of msg_ids or None
                 }
             Message type: ``abort_reply``::
                 content = {
                     'status' : 'ok' # 'ok' or 'error'
                     # other error info here, as in other messages
                 }
             The last action a client may want to do is shutdown the kernel. If a kernel receives a
             shutdown request, then it aborts all queued messages, replies to the request, and exits.
             Message type: ``shutdown_request``::
                 content = {}
             Message type: ``shutdown_reply``::
                 content = {
                     'status' : 'ok' # 'ok' or 'error'
                     # other error info here, as in other messages
                 }
             Implementation
             --------------
             There are a few differences in implementation between the `StreamSession` object used in
             the newparallel branch and the `Session` object, the main one being that messages are
             sent in parts, rather than as a single serialized object. `StreamSession` objects also
             take pack/unpack functions, which are to be used when serializing/deserializing objects.
             These can be any functions that translate to/from formats that ZMQ sockets can send
             (buffers, bytes, etc.).
             Split Sends
             ***********
             Previously, messages were bundled as a single json object and one call to
             :func:`socket.send_json`. Since the hub inspects all messages, and doesn't need to
             see the content of the messages, which can be large, messages are now serialized and sent in
             pieces. All messages are sent in at least 3 parts: the header, the parent header, and the
             content. This allows the controller to unpack and inspect the (always small) header,
             without spending time unpacking the content unless the message is bound for the
             controller. Buffers are added on to the end of the message, and can be any objects that
             present the buffer interface.

docs/source/parallel/parallel_task.txt

0 +1 -1

             .. _parallel_task:
             ==========================
             The IPython task interface
             ==========================
             The task interface to the cluster presents the engines as a fault tolerant,
             dynamic load-balanced system of workers. Unlike the multiengine interface, in
             the task interface the user has no direct access to individual engines. By
             allowing the IPython scheduler to assign work, this interface is simultaneously
             simpler and more powerful.
             Best of all, the user can use both of these interfaces running at the same time
             to take advantage of their respective strengths. When the user can break up
             the user's work into segments that do not depend on previous execution, the
             task interface is ideal. But it also has more power and flexibility, allowing
             the user to guide the distribution of jobs, without having to assign tasks to
             engines explicitly.
             Starting the IPython controller and engines
             ===========================================
             To follow along with this tutorial, you will need to start the IPython
             controller and four IPython engines. The simplest way of doing this is to use
             the :command:`ipcluster` command::
             	$ ipcluster start -n 4
             For more detailed information about starting the controller and engines, see
             our :ref:`introduction <parallel_overview>` to using IPython for parallel computing.
             Creating a ``Client`` instance
             ==============================
             The first step is to import the IPython :mod:`IPython.parallel`
             module and then create a :class:`.Client` instance, and we will also be using
             a :class:`LoadBalancedView`, here called `lview`:
             .. sourcecode:: ipython
                 In [1]: from IPython.parallel import Client
                 In [2]: rc = Client()
             This form assumes that the controller was started on localhost with default
             configuration. If not, the location of the controller must be given as an
             argument to the constructor:
             .. sourcecode:: ipython
                 # for a visible LAN controller listening on an external port:
                 In [2]: rc = Client('tcp://192.168.1.16:10101')
                 # or to connect with a specific profile you have set up:
                 In [3]: rc = Client(profile='mpi')
             For load-balanced execution, we will make use of a :class:`LoadBalancedView` object, which can
             be constructed via the client's :meth:`load_balanced_view` method:
             .. sourcecode:: ipython
                 In [4]: lview = rc.load_balanced_view() # default load-balanced view
             .. seealso::
                 For more information, see the in-depth explanation of :ref:`Views <parallel_details>`.
             Quick and easy parallelism
             ==========================
             In many cases, you simply want to apply a Python function to a sequence of
             objects, but *in parallel*. Like the multiengine interface, these can be
             implemented via the task interface. The exact same tools can perform these
             actions in load-balanced ways as well as multiplexed ways: a parallel version
             of :func:`map` and :func:`@parallel` function decorator. If one specifies the
             argument `balanced=True`, then they are dynamically load balanced. Thus, if the
             execution time per item varies significantly, you should use the versions in
             the task interface.
             Parallel map
             ------------
             To load-balance :meth:`map`, simply use a LoadBalancedView:
             .. sourcecode:: ipython
                 In [62]: lview.block = True
                 In [63]: serial_result = map(lambda x:x**10, range(32))
                 In [64]: parallel_result = lview.map(lambda x:x**10, range(32))
                 In [65]: serial_result==parallel_result
                 Out[65]: True
             Parallel function decorator
             ---------------------------
             Parallel functions are just like normal functions, but they can be called on
             sequences and *in parallel*. The multiengine interface provides a decorator
             that turns any Python function into a parallel function:
             .. sourcecode:: ipython
                 In [10]: @lview.parallel()
                    ....: def f(x):
                    ....:     return 10.0*x**4
                    ....:
                 In [11]: f.map(range(32))    # this is done in parallel
                 Out[11]: [0.0,10.0,160.0,...]
             .. _parallel_dependencies:
             Dependencies
             ============
             Often, pure atomic load-balancing is too primitive for your work. In these cases, you
             may want to associate some kind of `Dependency` that describes when, where, or whether
             a task can be run.  In IPython, we provide two types of dependencies:
             `Functional Dependencies`_ and `Graph Dependencies`_
             .. note::
                 It is important to note that the pure ZeroMQ scheduler does not support dependencies,
                 and you will see errors or warnings if you try to use dependencies with the pure
                 scheduler.
             Functional Dependencies
             -----------------------
             Functional dependencies are used to determine whether a given engine is capable of running
             a particular task.  This is implemented via a special :class:`Exception` class,
             :class:`UnmetDependency`, found in `IPython.parallel.error`.  Its use is very simple:
             if a task fails with an UnmetDependency exception, then the scheduler, instead of relaying
             the error up to the client like any other error, catches the error, and submits the task
             to a different engine.  This will repeat indefinitely, and a task will never be submitted
             to a given engine a second time.
             You can manually raise the :class:`UnmetDependency` yourself, but IPython has provided
             some decorators for facilitating this behavior.
             There are two decorators and a class used for functional dependencies:
             .. sourcecode:: ipython
                 In [9]: from IPython.parallel import depend, require, dependent
             @require
             ********
             The simplest sort of dependency is requiring that a Python module is available. The
             ``@require`` decorator lets you define a function that will only run on engines where names
             you specify are importable:
             .. sourcecode:: ipython
                 In [10]: @require('numpy', 'zmq')
                     ...: def myfunc():
                     ...:     return dostuff()
             Now, any time you apply :func:`myfunc`, the task will only run on a machine that has
             numpy and pyzmq available, and when :func:`myfunc` is called, numpy and zmq will be imported.
             @depend
             *******
             The ``@depend`` decorator lets you decorate any function with any *other* function to
             evaluate the dependency. The dependency function will be called at the start of the task,
             and if it returns ``False``, then the dependency will be considered unmet, and the task
             will be assigned to another engine. If the dependency returns *anything other than
             ``False``*, the rest of the task will continue.
             .. sourcecode:: ipython
                 In [10]: def platform_specific(plat):
                     ...:    import sys
                     ...:    return sys.platform == plat
                 In [11]: @depend(platform_specific, 'darwin')
                     ...: def mactask():
                     ...:    do_mac_stuff()
                 In [12]: @depend(platform_specific, 'nt')
                     ...: def wintask():
                     ...:    do_windows_stuff()
             In this case, any time you apply ``mactask``, it will only run on an OSX machine.
             ``@depend`` is just like ``apply``, in that it has a ``@depend(f,*args,**kwargs)``
             signature.
             dependents
             **********
             You don't have to use the decorators on your tasks. If, for instance, you want
             to run tasks with a single function but varying dependencies, you can directly construct
             the :class:`dependent` object that the decorators use:
             .. sourcecode:: ipython
                 In [13]: def mytask(*args):
                     ...:    dostuff()
                 In [14]: mactask = dependent(mytask, platform_specific, 'darwin')
                 # this is the same as decorating the declaration of mytask with @depend
                 # but you can do it again:
                 In [15]: wintask = dependent(mytask, platform_specific, 'nt')
                 # in general:
                 In [16]: t = dependent(f, g, *dargs, **dkwargs)
                 # is equivalent to:
                 In [17]: @depend(g, *dargs, **dkwargs)
                     ...: def t(a,b,c):
                     ...:     # contents of f
             Graph Dependencies
             ------------------
             Sometimes you want to restrict the time and/or location to run a given task as a function
             of the time and/or location of other tasks. This is implemented via a subclass of
             :class:`set`, called a :class:`Dependency`. A Dependency is just a set of `msg_ids`
             corresponding to tasks, and a few attributes to guide how to decide when the Dependency
             has been met.
             The switches we provide for interpreting whether a given dependency set has been met:
             any|all
                 Whether the dependency is considered met if *any* of the dependencies are done, or
                 only after *all* of them have finished.  This is set by a Dependency's :attr:`all`
                 boolean attribute, which defaults to ``True``.
             success [default: True]
                 Whether to consider tasks that succeeded as fulfilling dependencies.
             failure [default : False]
                 Whether to consider tasks that failed as fulfilling dependencies.
                 using `failure=True,success=False` is useful for setting up cleanup tasks, to be run
                 only when tasks have failed.
             Sometimes you want to run a task after another, but only if that task succeeded. In this case,
             ``success`` should be ``True`` and ``failure`` should be ``False``. However sometimes you may
             not care whether the task succeeds, and always want the second task to run, in which case you
             should use `success=failure=True`. The default behavior is to only use successes.
             There are other switches for interpretation that are made at the *task* level.  These are
             specified via keyword arguments to the client's :meth:`apply` method.
             after,follow
                 You may want to run a task *after* a given set of dependencies have been run and/or
                 run it *where* another set of dependencies are met. To support this, every task has an
                 `after` dependency to restrict time, and a `follow` dependency to restrict
                 destination.
             timeout
                 You may also want to set a time-limit for how long the scheduler should wait before a
                 task's dependencies are met. This is done via a `timeout`, which defaults to 0, which
                 indicates that the task should never timeout. If the timeout is reached, and the
                 scheduler still hasn't been able to assign the task to an engine, the task will fail
                 with a :class:`DependencyTimeout`.
             .. note::
                 Dependencies only work within the task scheduler. You cannot instruct a load-balanced
                 task to run after a job submitted via the MUX interface.
             The simplest form of Dependencies is with `all=True,success=True,failure=False`. In these cases,
             you can skip using Dependency objects, and just pass msg_ids or AsyncResult objects as the
             `follow` and `after` keywords to :meth:`client.apply`:
             .. sourcecode:: ipython
                 In [14]: client.block=False
                 In [15]: ar = lview.apply(f, args, kwargs)
                 In [16]: ar2 = lview.apply(f2)
                 In [17]: ar3 = lview.apply_with_flags(f3, after=[ar,ar2])
                 In [18]: ar4 = lview.apply_with_flags(f3, follow=[ar], timeout=2.5)
             .. seealso::
                 Some parallel workloads can be described as a `Directed Acyclic Graph
                 <http://en.wikipedia.org/wiki/Directed_acyclic_graph>`_, or DAG. See :ref:`DAG
                 Dependencies <dag_dependencies>` for an example demonstrating how to map a NetworkX DAG
                 onto task dependencies.
             Impossible Dependencies
             ***********************
             The schedulers do perform some analysis on graph dependencies to determine whether they
             are impossible to meet. If the scheduler does discover that a dependency cannot be
             met, then the task will fail with an :class:`ImpossibleDependency` error. This way, if the
             scheduler realizes that a task can never be run, the task won't sit indefinitely in the
             scheduler clogging the pipeline.
             The basic cases that are checked:
             * depending on nonexistent messages
             * `follow` dependencies were run on more than one machine and `all=True`
             * any dependencies failed and `all=True,success=True,failure=False`
             * all dependencies failed and `all=False,success=True,failure=False`
             .. warning::
                 This analysis has not been proven to be rigorous, so it is likely possible for tasks
                 to become impossible to run in obscure situations; setting a timeout may therefore be a good choice.
             Retries and Resubmit
             ====================
             Retries
             -------
             Another flag for tasks is `retries`.  This is an integer, specifying how many times
             a task should be resubmitted after failure.  This is useful for tasks that should still run
             if their engine was shut down, or may have some statistical chance of failing.  The default
             is to not retry tasks.
             Resubmit
             --------
             Sometimes you may want to re-run a task. This could be because it failed for some reason, and
             you have fixed the error, or because you want to restore the cluster to an interrupted state.
             For this, the :class:`Client` has a :meth:`rc.resubmit` method.  This simply takes one or more
             msg_ids, and returns an :class:`AsyncHubResult` for the result(s).  You cannot resubmit
             a task that is pending - only those that have finished, either successfully or unsuccessfully.
             .. _parallel_schedulers:
             Schedulers
             ==========
             There are a variety of valid ways to determine where jobs should be assigned in a
             load-balancing situation.  In IPython, we support several standard schemes, and
             even make it easy to define your own.  The scheme can be selected via the ``scheme``
             argument to :command:`ipcontroller`, or in the :attr:`TaskScheduler.schemename` attribute
             of a controller config object.
             The built-in routing schemes:
             To select one of these schemes, simply do::
                 $ ipcontroller --scheme=<schemename>
                 for instance:
                 $ ipcontroller --scheme=lru
             lru: Least Recently Used
                 Always assign work to the least-recently-used engine.  A close relative of
                 round-robin, it will be fair with respect to the number of tasks, agnostic
                 with respect to runtime of each task.
             plainrandom: Plain Random
                 Randomly picks an engine on which to run.
             twobin: Two-Bin Random
                 **Requires numpy**
                 Pick two engines at random, and use the LRU of the two. This is known to be better
                 than plain random in many cases, but requires a small amount of computation.
             leastload: Least Load
                 **This is the default scheme**
                 Always assign tasks to the engine with the fewest outstanding tasks (LRU breaks tie).
             weighted: Weighted Two-Bin Random
                 **Requires numpy**
                 Pick two engines at random using the number of outstanding tasks as inverse weights,
                 and use the one with the lower load.
             Pure ZMQ Scheduler
             ------------------
             For maximum throughput, the 'pure' scheme is not Python at all, but a C-level
-            :class:`MonitoredQueue` from PyZMQ, which uses a ZeroMQ ``XREQ`` socket to perform all
+            :class:`MonitoredQueue` from PyZMQ, which uses a ZeroMQ ``DEALER`` socket to perform all
             load-balancing. This scheduler does not support any of the advanced features of the Python
             :class:`.Scheduler`.
             Disabled features when using the ZMQ Scheduler:
             * Engine unregistration
                 Task farming will be disabled if an engine unregisters.
                 Further, if an engine is unregistered during computation, the scheduler may not recover.
             * Dependencies
                 Since there is no Python logic inside the Scheduler, routing decisions cannot be made
                 based on message content.
             * Early destination notification
                 The Python schedulers know which engine gets which task, and notify the Hub.  This
                 allows graceful handling of Engines coming and going.  There is no way to know
                 where ZeroMQ messages have gone, so there is no way to know what tasks are on which
                 engine until they *finish*.  This makes recovery from engine shutdown very difficult.
             .. note::
                 TODO: performance comparisons
             More details
             ============
             The :class:`LoadBalancedView` has many more powerful features that allow quite a bit
             of flexibility in how tasks are defined and run. The next places to look are
             in the following classes:
             * :class:`~IPython.parallel.client.view.LoadBalancedView`
             * :class:`~IPython.parallel.client.asyncresult.AsyncResult`
             * :meth:`~IPython.parallel.client.view.LoadBalancedView.apply`
             * :mod:`~IPython.parallel.controller.dependency`
             The following is an overview of how to use these classes together:
             1. Create a :class:`Client` and :class:`LoadBalancedView`
             2. Define some functions to be run as tasks
             3. Submit your tasks using the :meth:`apply` method of your
                :class:`LoadBalancedView` instance.
             4. Use :meth:`Client.get_result` to get the results of the
                tasks, or use the :meth:`AsyncResult.get` method of the results to wait
                for and then receive the results.
             .. seealso::
                 A demo of :ref:`DAG Dependencies <dag_dependencies>` with NetworkX and IPython.

General Comments 0

Write
Preview

You need to be logged in to leave comments. Login now

No TODOs yet

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages