##// END OF EJS Templates
Merge with upstream
Fernando Perez -
r1405:dc02b179 merge
parent child Browse files
Show More
@@ -0,0 +1,233 b''
1 # encoding: utf-8
2
3 """A parallelized version of Python's builtin map."""
4
5 __docformat__ = "restructuredtext en"
6
7 #----------------------------------------------------------------------------
8 # Copyright (C) 2008 The IPython Development Team
9 #
10 # Distributed under the terms of the BSD License. The full license is in
11 # the file COPYING, distributed as part of this software.
12 #----------------------------------------------------------------------------
13
14 #----------------------------------------------------------------------------
15 # Imports
16 #----------------------------------------------------------------------------
17
18 from types import FunctionType
19 from zope.interface import Interface, implements
20 from IPython.kernel.task import MapTask
21 from IPython.kernel.twistedutil import DeferredList, gatherBoth
22 from IPython.kernel.util import printer
23 from IPython.kernel.error import collect_exceptions
24
25 #----------------------------------------------------------------------------
26 # Code
27 #----------------------------------------------------------------------------
28
class IMapper(Interface):
    """The basic interface for a Mapper.

    This defines a generic interface for mapping.  The idea of this is
    similar to that of Python's builtin `map` function, which applies a
    function elementwise to a sequence.
    """

    def map(func, *seqs):
        """Do map in parallel.

        Equivalent to map(func, *seqs) or:

        [func(seqs[0][0], seqs[1][0],...), func(seqs[0][1], seqs[1][1],...),...]

        :Parameters:
            func : FunctionType
                The function to apply to the sequence
            sequences : tuple of iterables
                A sequence of iterables that are used for successive function
                arguments.  This works just like the builtin `map`.
        """
51
class IMultiEngineMapperFactory(Interface):
    """
    An interface for something that creates `IMapper` instances.
    """

    def mapper(dist='b', targets='all', block=True):
        """
        Create an `IMapper` implementer with a given set of arguments.

        The `IMapper` created using a multiengine controller is
        not load balanced.

        :Parameters:
            dist : str
                The decomposition to use; only block ('b') is supported
            targets : str, int or sequence of ints
                Which engines the mapper will use
            block : boolean
                Whether calls to the mapper's `map` method should block
        """
64
class ITaskMapperFactory(Interface):
    """
    An interface for something that creates `IMapper` instances.
    """

    def mapper(clear_before=False, clear_after=False, retries=0,
               recovery_task=None, depend=None, block=True):
        """
        Create an `IMapper` implementer with a given set of arguments.

        The `IMapper` created using a task controller is load balanced.

        See the documentation for `IPython.kernel.task.BaseTask` for
        documentation on the arguments to this method.
        """
80
81
class MultiEngineMapper(object):
    """
    A Mapper for `IMultiEngine` implementers.
    """

    implements(IMapper)

    def __init__(self, multiengine, dist='b', targets='all', block=True):
        """
        Create a Mapper for a multiengine.

        The value of all arguments are used for all calls to `map`.  This
        class allows these arguments to be set for a series of map calls.

        :Parameters:
            multiengine : `IMultiEngine` implementer
                The multiengine to use for running the map commands
            dist : str
                The type of decomposition to use.  Only block ('b') is
                supported currently
            targets : (str, int, tuple of ints)
                The engines to use in the map
            block : boolean
                Whether to block when the map is applied
        """
        self.multiengine = multiengine
        self.dist = dist
        self.targets = targets
        self.block = block

    def map(self, func, *sequences):
        """
        Apply func to *sequences elementwise.  Like Python's builtin map.

        This version is not load balanced.

        :Parameters:
            func : str or function
                The function to apply, or the name of a callable defined
                on the engines.
            sequences : one or more equal-length sequences
                Successive elements of each sequence become successive
                arguments of func.

        :Raises:
            ValueError : if no sequences are given or lengths differ.
            TypeError : if func is neither a str nor a function.
        """
        if not sequences:
            # Without this guard, max() below raises a confusing
            # "max() arg is an empty sequence" ValueError.
            raise ValueError('at least one sequence is required')
        max_len = max(len(s) for s in sequences)
        for s in sequences:
            if len(s) != max_len:
                raise ValueError('all sequences must have equal length')
        # Raise explicitly rather than assert: asserts are stripped when
        # Python runs with -O, which would silently skip this validation.
        if not isinstance(func, (str, FunctionType)):
            raise TypeError("func must be a function or str")
        return self.multiengine.raw_map(func, sequences, dist=self.dist,
                                        targets=self.targets, block=self.block)
125
class TaskMapper(object):
    """
    Make an `ITaskController` look like an `IMapper`.

    This class provides a load balanced version of `map`.
    """

    def __init__(self, task_controller, clear_before=False, clear_after=False,
                 retries=0, recovery_task=None, depend=None, block=True):
        """
        Create a `IMapper` given a `TaskController` and arguments.

        The additional arguments are those that are common to all types of
        tasks and are described in the documentation for
        `IPython.kernel.task.BaseTask`.

        :Parameters:
            task_controller : an `IBlockingTaskClient` implementer
                The `TaskController` to use for calls to `map`
        """
        self.task_controller = task_controller
        self.clear_before = clear_before
        self.clear_after = clear_after
        self.retries = retries
        self.recovery_task = recovery_task
        self.depend = depend
        self.block = block

    def map(self, func, *sequences):
        """
        Apply func to *sequences elementwise.  Like Python's builtin map.

        This version is load balanced.

        :Parameters:
            func : callable or str
                The function to apply; passed through to `MapTask`.
            sequences : one or more equal-length sequences
                Successive elements of each sequence become successive
                arguments of func.

        :Returns: A deferred that fires with the list of results.
        :Raises: ValueError if no sequences are given or lengths differ.
        """
        if not sequences:
            # max() on an empty generator raises a confusing message.
            raise ValueError('at least one sequence is required')
        max_len = max(len(s) for s in sequences)
        for s in sequences:
            if len(s) != max_len:
                raise ValueError('all sequences must have equal length')
        task_args = zip(*sequences)
        dlist = []
        for ta in task_args:
            task = MapTask(func, ta, clear_before=self.clear_before,
                           clear_after=self.clear_after, retries=self.retries,
                           recovery_task=self.recovery_task, depend=self.depend)
            dlist.append(self.task_controller.run(task))
        dlist = gatherBoth(dlist, consumeErrors=1)
        dlist.addCallback(collect_exceptions, 'map')
        if self.block:
            def get_results(task_ids):
                # task_ids here is the gathered list of ids returned by
                # the run() calls above (NOT a local list).
                d = self.task_controller.barrier(task_ids)
                d.addCallback(lambda _: gatherBoth(
                    [self.task_controller.get_task_result(tid)
                     for tid in task_ids],
                    consumeErrors=1))
                d.addCallback(collect_exceptions, 'map')
                return d
            dlist.addCallback(get_results)
        return dlist
182
class SynchronousTaskMapper(object):
    """
    Make an `IBlockingTaskClient` look like an `IMapper`.

    This class provides a load balanced version of `map`.
    """

    def __init__(self, task_controller, clear_before=False, clear_after=False,
                 retries=0, recovery_task=None, depend=None, block=True):
        """
        Create a `IMapper` given a `IBlockingTaskClient` and arguments.

        The additional arguments are those that are common to all types of
        tasks and are described in the documentation for
        `IPython.kernel.task.BaseTask`.

        :Parameters:
            task_controller : an `IBlockingTaskClient` implementer
                The `TaskController` to use for calls to `map`
        """
        self.task_controller = task_controller
        self.clear_before = clear_before
        self.clear_after = clear_after
        self.retries = retries
        self.recovery_task = recovery_task
        self.depend = depend
        self.block = block

    def map(self, func, *sequences):
        """
        Apply func to *sequences elementwise.  Like Python's builtin map.

        This version is load balanced.

        :Parameters:
            func : callable or str
                The function to apply; passed through to `MapTask`.
            sequences : one or more equal-length sequences
                Successive elements of each sequence become successive
                arguments of func.

        :Returns: The list of results if blocking, else the task ids.
        :Raises: ValueError if no sequences are given or lengths differ.
        """
        if not sequences:
            # max() on an empty generator raises a confusing message.
            raise ValueError('at least one sequence is required')
        max_len = max(len(s) for s in sequences)
        for s in sequences:
            if len(s) != max_len:
                raise ValueError('all sequences must have equal length')
        task_args = zip(*sequences)
        task_ids = []
        for ta in task_args:
            task = MapTask(func, ta, clear_before=self.clear_before,
                           clear_after=self.clear_after, retries=self.retries,
                           recovery_task=self.recovery_task, depend=self.depend)
            task_ids.append(self.task_controller.run(task))
        if self.block:
            # Wait for every submitted task, then collect results in
            # submission order so output lines up with the input.
            self.task_controller.barrier(task_ids)
            task_results = [self.task_controller.get_task_result(tid)
                            for tid in task_ids]
            return task_results
        else:
            return task_ids
1 NO CONTENT: new file 100644
@@ -0,0 +1,18 b''
# Example: three ways to run a parallel map with a MultiEngineClient.
from IPython.kernel import client

# Connect to a running controller (requires an ipcluster to be up).
mec = client.MultiEngineClient()

# 1. Simplest form: blocking map, same call shape as the builtin map.
result = mec.map(lambda x: 2*x, range(10))
print "Simple, default map: ", result

# 2. Explicit mapper object: block=False makes map return a
#    PendingResult; the actual values are fetched via its .r attribute.
m = mec.mapper(block=False)
pr = m.map(lambda x: 2*x, range(10))
print "Submitted map, got PendingResult: ", pr
result = pr.r
print "Using a mapper: ", result

# 3. The @parallel decorator turns f into a parallel function that
#    maps itself over the sequence it is called with.
@mec.parallel()
def f(x): return 2*x

result = f(range(10))
print "Using a parallel function: ", result
@@ -0,0 +1,19 b''
# Example: three ways to run a load-balanced parallel map with a TaskClient.
from IPython.kernel import client

# Connect to a running controller (requires an ipcluster to be up).
tc = client.TaskClient()

# 1. Simplest form: blocking, load-balanced map.
result = tc.map(lambda x: 2*x, range(10))
print "Simple, default map: ", result

# 2. Explicit mapper object: block=False returns task ids; wait on them
#    with barrier() and then fetch each result by id.
m = tc.mapper(block=False, clear_after=True, clear_before=True)
tids = m.map(lambda x: 2*x, range(10))
print "Submitted tasks, got ids: ", tids
tc.barrier(tids)
result = [tc.get_task_result(tid) for tid in tids]
print "Using a mapper: ", result

# 3. The @parallel decorator turns f into a parallel function that
#    maps itself over the sequence it is called with.
@tc.parallel()
def f(x): return 2*x

result = f(range(10))
print "Using a parallel function: ", result
@@ -83,7 +83,7 b' class TestAsyncFrontendBase(unittest.TestCase):'
83 83 d.addCallback(self.checkBlockID, expected='TEST_ID')
84 84
85 85 def test_blockID_added_to_failure(self):
86 block = "raise Exception()"
86 block = "raise Exception()"
87 87
88 88 d = self.fb.execute(block,blockID='TEST_ID')
89 89 d.addErrback(self.checkFailureID, expected='TEST_ID')
@@ -27,7 +27,7 b' from IPython.kernel import codeutil'
27 27 from IPython.kernel.clientconnector import ClientConnector
28 28
29 29 # Other things that the user will need
30 from IPython.kernel.task import Task
30 from IPython.kernel.task import MapTask, StringTask
31 31 from IPython.kernel.error import CompositeError
32 32
33 33 #-------------------------------------------------------------------------------
@@ -44,7 +44,7 b' from IPython.kernel import codeutil'
44 44 import IPython.kernel.magic
45 45
46 46 # Other things that the user will need
47 from IPython.kernel.task import Task
47 from IPython.kernel.task import MapTask, StringTask
48 48 from IPython.kernel.error import CompositeError
49 49
50 50 #-------------------------------------------------------------------------------
@@ -141,46 +141,3 b' class RemoteMultiEngine(RemoteContextBase):'
141 141 def __enter__(self):
142 142 src = self.findsource(sys._getframe(1))
143 143 return self.mec.execute(src)
144
145
146 # XXX - Temporary hackish testing, we'll move this into proper tests right
147 # away
148
149 if __name__ == '__main__':
150
151 # XXX - for now, we need a running cluster to be started separately. The
152 # daemon work is almost finished, and will make much of this unnecessary.
153 from IPython.kernel import client
154 mec = client.MultiEngineClient(('127.0.0.1',10105))
155
156 try:
157 mec.get_ids()
158 except ConnectionRefusedError:
159 import os, time
160 os.system('ipcluster -n 2 &')
161 time.sleep(2)
162 mec = client.MultiEngineClient(('127.0.0.1',10105))
163
164 mec.block = False
165
166 import itertools
167 c = itertools.count()
168
169 parallel = RemoteMultiEngine(mec)
170
171 mec.pushAll()
172
173 with parallel as pr:
174 # A comment
175 remote() # this means the code below only runs remotely
176 print 'Hello remote world'
177 x = range(10)
178 # Comments are OK
179 # Even misindented.
180 y = x+1
181
182
183 with pfor('i',sequence) as pr:
184 print x[i]
185
186 print pr.x + pr.y
@@ -79,7 +79,7 b" def magic_px(self,parameter_s=''):"
79 79 except AttributeError:
80 80 print NO_ACTIVE_CONTROLLER
81 81 else:
82 print "Executing command on Controller"
82 print "Parallel execution on engines: %s" % activeController.targets
83 83 result = activeController.execute(parameter_s)
84 84 return result
85 85
@@ -115,7 +115,7 b' class RoundRobinMap(Map):'
115 115 # result.append(concat[i:totalLength:maxPartitionLength])
116 116 return self.concatenate(listOfPartitions)
117 117
118 styles = {'basic':Map}
118 dists = {'b':Map}
119 119
120 120
121 121
@@ -653,67 +653,55 b' components.registerAdapter(SynchronousMultiEngine, IMultiEngine, ISynchronousMul'
653 653 class IMultiEngineCoordinator(Interface):
654 654 """Methods that work on multiple engines explicitly."""
655 655
656 def scatter(key, seq, style='basic', flatten=False, targets='all'):
657 """Partition and distribute a sequence to targets.
656 def scatter(key, seq, dist='b', flatten=False, targets='all'):
657 """Partition and distribute a sequence to targets."""
658 658
659 :Parameters:
660 key : str
661 The variable name to call the scattered sequence.
662 seq : list, tuple, array
663 The sequence to scatter. The type should be preserved.
664 style : string
665 A specification of how the sequence is partitioned. Currently
666 only 'basic' is implemented.
667 flatten : boolean
668 Should single element sequences be converted to scalars.
669 """
670
671 def gather(key, style='basic', targets='all'):
672 """Gather object key from targets.
659 def gather(key, dist='b', targets='all'):
660 """Gather object key from targets."""
673 661
674 :Parameters:
675 key : string
676 The name of a sequence on the targets to gather.
677 style : string
678 A specification of how the sequence is partitioned. Currently
679 only 'basic' is implemented.
662 def raw_map(func, seqs, dist='b', targets='all'):
680 663 """
681
682 def map(func, seq, style='basic', targets='all'):
683 """A parallelized version of Python's builtin map.
664 A parallelized version of Python's builtin `map` function.
684 665
685 This function implements the following pattern:
666 This has a slightly different syntax than the builtin `map`.
667 This is needed because we need to have keyword arguments and thus
668 can't use *args to capture all the sequences. Instead, they must
669 be passed in a list or tuple.
686 670
687 1. The sequence seq is scattered to the given targets.
688 2. map(functionSource, seq) is called on each engine.
689 3. The resulting sequences are gathered back to the local machine.
690
691 :Parameters:
692 targets : int, list or 'all'
693 The engine ids the action will apply to. Call `get_ids` to see
694 a list of currently available engines.
695 func : str, function
696 An actual function object or a Python string that names a
697 callable defined on the engines.
698 seq : list, tuple or numpy array
699 The local sequence to be scattered.
700 style : str
701 Only 'basic' is supported for now.
702
703 :Returns: A list of len(seq) with functionSource called on each element
704 of seq.
705
706 Example
707 =======
671 The equivalence is:
708 672
709 >>> rc.mapAll('lambda x: x*x', range(10000))
710 [0,2,4,9,25,36,...]
673 raw_map(func, seqs) -> map(func, seqs[0], seqs[1], ...)
674
675 Most users will want to use parallel functions or the `mapper`
676 and `map` methods for an API that follows that of the builtin
677 `map`.
711 678 """
712 679
713 680
714 681 class ISynchronousMultiEngineCoordinator(IMultiEngineCoordinator):
715 682 """Methods that work on multiple engines explicitly."""
716 pass
683
684 def scatter(key, seq, dist='b', flatten=False, targets='all', block=True):
685 """Partition and distribute a sequence to targets."""
686
687 def gather(key, dist='b', targets='all', block=True):
688 """Gather object key from targets"""
689
690 def raw_map(func, seqs, dist='b', targets='all', block=True):
691 """
692 A parallelized version of Python's builtin map.
693
694 This has a slightly different syntax than the builtin `map`.
695 This is needed because we need to have keyword arguments and thus
696 can't use *args to capture all the sequences. Instead, they must
697 be passed in a list or tuple.
698
699 raw_map(func, seqs) -> map(func, seqs[0], seqs[1], ...)
700
701 Most users will want to use parallel functions or the `mapper`
702 and `map` methods for an API that follows that of the builtin
703 `map`.
704 """
717 705
718 706
719 707 #-------------------------------------------------------------------------------
@@ -722,46 +710,31 b' class ISynchronousMultiEngineCoordinator(IMultiEngineCoordinator):'
722 710
723 711 class IMultiEngineExtras(Interface):
724 712
725 def zip_pull(targets, *keys):
726 """Pull, but return results in a different format from `pull`.
713 def zip_pull(targets, keys):
714 """
715 Pull, but return results in a different format from `pull`.
727 716
728 717 This method basically returns zip(pull(targets, *keys)), with a few
729 718 edge cases handled differently. Users of chainsaw will find this format
730 719 familiar.
731
732 :Parameters:
733 targets : int, list or 'all'
734 The engine ids the action will apply to. Call `get_ids` to see
735 a list of currently available engines.
736 keys: list or tuple of str
737 A list of variable names as string of the Python objects to be pulled
738 back to the client.
739
740 :Returns: A list of pulled Python objects for each target.
741 720 """
742 721
743 722 def run(targets, fname):
744 """Run a .py file on targets.
745
746 :Parameters:
747 targets : int, list or 'all'
748 The engine ids the action will apply to. Call `get_ids` to see
749 a list of currently available engines.
750 fname : str
751 The filename of a .py file on the local system to be sent to and run
752 on the engines.
753 block : boolean
754 Should I block or not. If block=True, wait for the action to
755 complete and return the result. If block=False, return a
756 `PendingResult` object that can be used to later get the
757 result. If block is not specified, the block attribute
758 will be used instead.
759 """
723 """Run a .py file on targets."""
760 724
761 725
762 726 class ISynchronousMultiEngineExtras(IMultiEngineExtras):
763 pass
764
727 def zip_pull(targets, keys, block=True):
728 """
729 Pull, but return results in a different format from `pull`.
730
731 This method basically returns zip(pull(targets, *keys)), with a few
732 edge cases handled differently. Users of chainsaw will find this format
733 familiar.
734 """
735
736 def run(targets, fname, block=True):
737 """Run a .py file on targets."""
765 738
766 739 #-------------------------------------------------------------------------------
767 740 # The full MultiEngine interface
@@ -31,6 +31,11 b' from IPython.ColorANSI import TermColors'
31 31 from IPython.kernel.twistedutil import blockingCallFromThread
32 32 from IPython.kernel import error
33 33 from IPython.kernel.parallelfunction import ParallelFunction
34 from IPython.kernel.mapper import (
35 MultiEngineMapper,
36 IMultiEngineMapperFactory,
37 IMapper
38 )
34 39 from IPython.kernel import map as Map
35 40 from IPython.kernel import multiengine as me
36 41 from IPython.kernel.multiengine import (IFullMultiEngine,
@@ -186,10 +191,14 b' class ResultList(list):'
186 191
187 192 def __repr__(self):
188 193 output = []
189 blue = TermColors.Blue
190 normal = TermColors.Normal
191 red = TermColors.Red
192 green = TermColors.Green
194 # These colored prompts were not working on Windows
195 if sys.platform == 'win32':
196 blue = normal = red = green = ''
197 else:
198 blue = TermColors.Blue
199 normal = TermColors.Normal
200 red = TermColors.Red
201 green = TermColors.Green
193 202 output.append("<Results List>\n")
194 203 for cmd in self:
195 204 if isinstance(cmd, Failure):
@@ -294,28 +303,7 b' class InteractiveMultiEngineClient(object):'
294 303 def __len__(self):
295 304 """Return the number of available engines."""
296 305 return len(self.get_ids())
297
298 def parallelize(self, func, targets=None, block=None):
299 """Build a `ParallelFunction` object for functionName on engines.
300
301 The returned object will implement a parallel version of functionName
302 that takes a local sequence as its only argument and calls (in
303 parallel) functionName on each element of that sequence. The
304 `ParallelFunction` object has a `targets` attribute that controls
305 which engines the function is run on.
306
307 :Parameters:
308 targets : int, list or 'all'
309 The engine ids the action will apply to. Call `get_ids` to see
310 a list of currently available engines.
311 functionName : str
312 A Python string that names a callable defined on the engines.
313
314 :Returns: A `ParallelFunction` object.
315 """
316 targets, block = self._findTargetsAndBlock(targets, block)
317 return ParallelFunction(func, self, targets, block)
318
306
319 307 #---------------------------------------------------------------------------
320 308 # Make this a context manager for with
321 309 #---------------------------------------------------------------------------
@@ -415,7 +403,11 b' class FullBlockingMultiEngineClient(InteractiveMultiEngineClient):'
415 403 engine, run code on it, etc.
416 404 """
417 405
418 implements(IFullBlockingMultiEngineClient)
406 implements(
407 IFullBlockingMultiEngineClient,
408 IMultiEngineMapperFactory,
409 IMapper
410 )
419 411
420 412 def __init__(self, smultiengine):
421 413 self.smultiengine = smultiengine
@@ -772,29 +764,100 b' class FullBlockingMultiEngineClient(InteractiveMultiEngineClient):'
772 764 # IMultiEngineCoordinator
773 765 #---------------------------------------------------------------------------
774 766
775 def scatter(self, key, seq, style='basic', flatten=False, targets=None, block=None):
767 def scatter(self, key, seq, dist='b', flatten=False, targets=None, block=None):
776 768 """
777 769 Partition a Python sequence and send the partitions to a set of engines.
778 770 """
779 771 targets, block = self._findTargetsAndBlock(targets, block)
780 772 return self._blockFromThread(self.smultiengine.scatter, key, seq,
781 style, flatten, targets=targets, block=block)
773 dist, flatten, targets=targets, block=block)
782 774
783 def gather(self, key, style='basic', targets=None, block=None):
775 def gather(self, key, dist='b', targets=None, block=None):
784 776 """
785 777 Gather a partitioned sequence on a set of engines as a single local seq.
786 778 """
787 779 targets, block = self._findTargetsAndBlock(targets, block)
788 return self._blockFromThread(self.smultiengine.gather, key, style,
780 return self._blockFromThread(self.smultiengine.gather, key, dist,
789 781 targets=targets, block=block)
790 782
791 def map(self, func, seq, style='basic', targets=None, block=None):
783 def raw_map(self, func, seq, dist='b', targets=None, block=None):
792 784 """
793 A parallelized version of Python's builtin map
785 A parallelized version of Python's builtin map.
786
787 This has a slightly different syntax than the builtin `map`.
788 This is needed because we need to have keyword arguments and thus
789 can't use *args to capture all the sequences. Instead, they must
790 be passed in a list or tuple.
791
792 raw_map(func, seqs) -> map(func, seqs[0], seqs[1], ...)
793
794 Most users will want to use parallel functions or the `mapper`
795 and `map` methods for an API that follows that of the builtin
796 `map`.
794 797 """
795 798 targets, block = self._findTargetsAndBlock(targets, block)
796 return self._blockFromThread(self.smultiengine.map, func, seq,
797 style, targets=targets, block=block)
799 return self._blockFromThread(self.smultiengine.raw_map, func, seq,
800 dist, targets=targets, block=block)
801
802 def map(self, func, *sequences):
803 """
804 A parallel version of Python's builtin `map` function.
805
806 This method applies a function to sequences of arguments. It
807 follows the same syntax as the builtin `map`.
808
809 This method creates a mapper objects by calling `self.mapper` with
810 no arguments and then uses that mapper to do the mapping. See
811 the documentation of `mapper` for more details.
812 """
813 return self.mapper().map(func, *sequences)
814
815 def mapper(self, dist='b', targets='all', block=None):
816 """
817 Create a mapper object that has a `map` method.
818
819 This method returns an object that implements the `IMapper`
820 interface. This method is a factory that is used to control how
821 the map happens.
822
823 :Parameters:
824 dist : str
825 What decomposition to use, 'b' is the only one supported
826 currently
827 targets : str, int, sequence of ints
828 Which engines to use for the map
829 block : boolean
830 Should calls to `map` block or not
831 """
832 return MultiEngineMapper(self, dist, targets, block)
833
834 def parallel(self, dist='b', targets=None, block=None):
835 """
836 A decorator that turns a function into a parallel function.
837
838 This can be used as:
839
840 @parallel()
841 def f(x, y)
842 ...
843
844 f(range(10), range(10))
845
846 This causes f(0,0), f(1,1), ... to be called in parallel.
847
848 :Parameters:
849 dist : str
850 What decomposition to use, 'b' is the only one supported
851 currently
852 targets : str, int, sequence of ints
853 Which engines to use for the map
854 block : boolean
855 Should calls to `map` block or not
856 """
857 targets, block = self._findTargetsAndBlock(targets, block)
858 mapper = self.mapper(dist, targets, block)
859 pf = ParallelFunction(mapper)
860 return pf
798 861
799 862 #---------------------------------------------------------------------------
800 863 # IMultiEngineExtras
@@ -29,6 +29,12 b' from foolscap import Referenceable'
29 29 from IPython.kernel import error
30 30 from IPython.kernel.util import printer
31 31 from IPython.kernel import map as Map
32 from IPython.kernel.parallelfunction import ParallelFunction
33 from IPython.kernel.mapper import (
34 MultiEngineMapper,
35 IMultiEngineMapperFactory,
36 IMapper
37 )
32 38 from IPython.kernel.twistedutil import gatherBoth
33 39 from IPython.kernel.multiengine import (MultiEngine,
34 40 IMultiEngine,
@@ -280,7 +286,12 b' components.registerAdapter(FCSynchronousMultiEngineFromMultiEngine,'
280 286
281 287 class FCFullSynchronousMultiEngineClient(object):
282 288
283 implements(IFullSynchronousMultiEngine, IBlockingClientAdaptor)
289 implements(
290 IFullSynchronousMultiEngine,
291 IBlockingClientAdaptor,
292 IMultiEngineMapperFactory,
293 IMapper
294 )
284 295
285 296 def __init__(self, remote_reference):
286 297 self.remote_reference = remote_reference
@@ -475,7 +486,7 b' class FCFullSynchronousMultiEngineClient(object):'
475 486 d.addCallback(create_targets)
476 487 return d
477 488
478 def scatter(self, key, seq, style='basic', flatten=False, targets='all', block=True):
489 def scatter(self, key, seq, dist='b', flatten=False, targets='all', block=True):
479 490
480 491 # Note: scatter and gather handle pending deferreds locally through self.pdm.
481 492 # This enables us to collect a bunch of deferred ids and make a secondary
@@ -483,7 +494,7 b' class FCFullSynchronousMultiEngineClient(object):'
483 494 # difficult to get right though.
484 495 def do_scatter(engines):
485 496 nEngines = len(engines)
486 mapClass = Map.styles[style]
497 mapClass = Map.dists[dist]
487 498 mapObject = mapClass()
488 499 d_list = []
489 500 # Loop through and push to each engine in non-blocking mode.
@@ -541,7 +552,7 b' class FCFullSynchronousMultiEngineClient(object):'
541 552 d.addCallback(do_scatter)
542 553 return d
543 554
544 def gather(self, key, style='basic', targets='all', block=True):
555 def gather(self, key, dist='b', targets='all', block=True):
545 556
546 557 # Note: scatter and gather handle pending deferreds locally through self.pdm.
547 558 # This enables us to collect a bunch of deferred ids and make a secondary
@@ -549,7 +560,7 b' class FCFullSynchronousMultiEngineClient(object):'
549 560 # difficult to get right though.
550 561 def do_gather(engines):
551 562 nEngines = len(engines)
552 mapClass = Map.styles[style]
563 mapClass = Map.dists[dist]
553 564 mapObject = mapClass()
554 565 d_list = []
555 566 # Loop through and push to each engine in non-blocking mode.
@@ -604,25 +615,103 b' class FCFullSynchronousMultiEngineClient(object):'
604 615 d.addCallback(do_gather)
605 616 return d
606 617
607 def map(self, func, seq, style='basic', targets='all', block=True):
608 d_list = []
618 def raw_map(self, func, sequences, dist='b', targets='all', block=True):
619 """
620 A parallelized version of Python's builtin map.
621
622 This has a slightly different syntax than the builtin `map`.
623 This is needed because we need to have keyword arguments and thus
624 can't use *args to capture all the sequences. Instead, they must
625 be passed in a list or tuple.
626
627 raw_map(func, seqs) -> map(func, seqs[0], seqs[1], ...)
628
629 Most users will want to use parallel functions or the `mapper`
630 and `map` methods for an API that follows that of the builtin
631 `map`.
632 """
633 if not isinstance(sequences, (list, tuple)):
634 raise TypeError('sequences must be a list or tuple')
635 max_len = max(len(s) for s in sequences)
636 for s in sequences:
637 if len(s)!=max_len:
638 raise ValueError('all sequences must have equal length')
609 639 if isinstance(func, FunctionType):
610 640 d = self.push_function(dict(_ipython_map_func=func), targets=targets, block=False)
611 641 d.addCallback(lambda did: self.get_pending_deferred(did, True))
612 sourceToRun = '_ipython_map_seq_result = map(_ipython_map_func, _ipython_map_seq)'
642 sourceToRun = '_ipython_map_seq_result = map(_ipython_map_func, *zip(*_ipython_map_seq))'
613 643 elif isinstance(func, str):
614 644 d = defer.succeed(None)
615 645 sourceToRun = \
616 '_ipython_map_seq_result = map(%s, _ipython_map_seq)' % func
646 '_ipython_map_seq_result = map(%s, *zip(*_ipython_map_seq))' % func
617 647 else:
618 648 raise TypeError("func must be a function or str")
619 649
620 d.addCallback(lambda _: self.scatter('_ipython_map_seq', seq, style, targets=targets))
650 d.addCallback(lambda _: self.scatter('_ipython_map_seq', zip(*sequences), dist, targets=targets))
621 651 d.addCallback(lambda _: self.execute(sourceToRun, targets=targets, block=False))
622 652 d.addCallback(lambda did: self.get_pending_deferred(did, True))
623 d.addCallback(lambda _: self.gather('_ipython_map_seq_result', style, targets=targets, block=block))
653 d.addCallback(lambda _: self.gather('_ipython_map_seq_result', dist, targets=targets, block=block))
624 654 return d
625 655
656 def map(self, func, *sequences):
657 """
658 A parallel version of Python's builtin `map` function.
659
660 This method applies a function to sequences of arguments. It
661 follows the same syntax as the builtin `map`.
662
663 This method creates a mapper objects by calling `self.mapper` with
664 no arguments and then uses that mapper to do the mapping. See
665 the documentation of `mapper` for more details.
666 """
667 return self.mapper().map(func, *sequences)
668
669 def mapper(self, dist='b', targets='all', block=True):
670 """
671 Create a mapper object that has a `map` method.
672
673 This method returns an object that implements the `IMapper`
674 interface. This method is a factory that is used to control how
675 the map happens.
676
677 :Parameters:
678 dist : str
679 What decomposition to use, 'b' is the only one supported
680 currently
681 targets : str, int, sequence of ints
682 Which engines to use for the map
683 block : boolean
684 Should calls to `map` block or not
685 """
686 return MultiEngineMapper(self, dist, targets, block)
687
688 def parallel(self, dist='b', targets='all', block=True):
689 """
690 A decorator that turns a function into a parallel function.
691
692 This can be used as:
693
694 @parallel()
695 def f(x, y)
696 ...
697
698 f(range(10), range(10))
699
700 This causes f(0,0), f(1,1), ... to be called in parallel.
701
702 :Parameters:
703 dist : str
704 What decomposition to use, 'b' is the only one supported
705 currently
706 targets : str, int, sequence of ints
707 Which engines to use for the map
708 block : boolean
709 Should calls to `map` block or not
710 """
711 mapper = self.mapper(dist, targets, block)
712 pf = ParallelFunction(mapper)
713 return pf
714
626 715 #---------------------------------------------------------------------------
627 716 # ISynchronousMultiEngineExtras related methods
628 717 #---------------------------------------------------------------------------
@@ -16,17 +16,92 b' __docformat__ = "restructuredtext en"'
16 16 #-------------------------------------------------------------------------------
17 17
18 18 from types import FunctionType
19 from zope.interface import Interface, implements
19 20
20 class ParallelFunction:
21 """A function that operates in parallel on sequences."""
22 def __init__(self, func, multiengine, targets, block):
23 """Create a `ParallelFunction`.
21
22 class IMultiEngineParallelDecorator(Interface):
23 """A decorator that creates a parallel function."""
24
25 def parallel(dist='b', targets=None, block=None):
26 """
27 A decorator that turns a function into a parallel function.
28
29 This can be used as:
30
31 @parallel()
32 def f(x, y)
33 ...
34
35 f(range(10), range(10))
36
37 This causes f(0,0), f(1,1), ... to be called in parallel.
38
39 :Parameters:
40 dist : str
41 What decomposition to use, 'b' is the only one supported
42 currently
43 targets : str, int, sequence of ints
44 Which engines to use for the map
45 block : boolean
46 Should calls to `map` block or not
47 """
48
49 class ITaskParallelDecorator(Interface):
50 """A decorator that creates a parallel function."""
51
52 def parallel(clear_before=False, clear_after=False, retries=0,
53 recovery_task=None, depend=None, block=True):
54 """
55 A decorator that turns a function into a parallel function.
56
57 This can be used as:
58
59 @parallel()
60 def f(x, y)
61 ...
62
63 f(range(10), range(10))
64
65 This causes f(0,0), f(1,1), ... to be called in parallel.
66
67 See the documentation for `IPython.kernel.task.BaseTask` for
68 documentation on the arguments to this method.
69 """
70
71 class IParallelFunction(Interface):
72 pass
73
74 class ParallelFunction(object):
75 """
76 The implementation of a parallel function.
77
78 A parallel function is similar to Python's map function:
79
80 map(func, *sequences) -> pfunc(*sequences)
81
82 Parallel functions should be created by using the @parallel decorator.
83 """
84
85 implements(IParallelFunction)
86
87 def __init__(self, mapper):
88 """
89 Create a parallel function from an `IMapper`.
90
91 :Parameters:
92 mapper : an `IMapper` implementer.
93 The mapper to use for the parallel function
94 """
95 self.mapper = mapper
96
97 def __call__(self, func):
98 """
99 Decorate a function to make it run in parallel.
24 100 """
25 101 assert isinstance(func, (str, FunctionType)), "func must be a fuction or str"
26 102 self.func = func
27 self.multiengine = multiengine
28 self.targets = targets
29 self.block = block
30
31 def __call__(self, sequence):
32 return self.multiengine.map(self.func, sequence, targets=self.targets, block=self.block) No newline at end of file
103 def call_function(*sequences):
104 return self.mapper.map(self.func, *sequences)
105 return call_function
106
107 No newline at end of file
This diff has been collapsed as it changes many lines, (682 lines changed) Show them Hide them
@@ -5,117 +5,404 b''
5 5
6 6 __docformat__ = "restructuredtext en"
7 7
8 #-------------------------------------------------------------------------------
8 #-----------------------------------------------------------------------------
9 9 # Copyright (C) 2008 The IPython Development Team
10 10 #
11 11 # Distributed under the terms of the BSD License. The full license is in
12 12 # the file COPYING, distributed as part of this software.
13 #-------------------------------------------------------------------------------
13 #-----------------------------------------------------------------------------
14 14
15 #-------------------------------------------------------------------------------
15 #-----------------------------------------------------------------------------
16 16 # Imports
17 #-------------------------------------------------------------------------------
17 #-----------------------------------------------------------------------------
18 18
19 19 import copy, time
20 from types import FunctionType as function
20 from types import FunctionType
21 21
22 22 import zope.interface as zi, string
23 23 from twisted.internet import defer, reactor
24 24 from twisted.python import components, log, failure
25 25
26 # from IPython.genutils import time
27
26 from IPython.kernel.util import printer
28 27 from IPython.kernel import engineservice as es, error
29 28 from IPython.kernel import controllerservice as cs
30 29 from IPython.kernel.twistedutil import gatherBoth, DeferredList
31 30
32 from IPython.kernel.pickleutil import can,uncan, CannedFunction
33
34 def canTask(task):
35 t = copy.copy(task)
36 t.depend = can(t.depend)
37 if t.recovery_task:
38 t.recovery_task = canTask(t.recovery_task)
39 return t
31 from IPython.kernel.pickleutil import can, uncan, CannedFunction
40 32
41 def uncanTask(task):
42 t = copy.copy(task)
43 t.depend = uncan(t.depend)
44 if t.recovery_task and t.recovery_task is not task:
45 t.recovery_task = uncanTask(t.recovery_task)
46 return t
33 #-----------------------------------------------------------------------------
34 # Definition of the Task objects
35 #-----------------------------------------------------------------------------
47 36
48 37 time_format = '%Y/%m/%d %H:%M:%S'
49 38
50 class Task(object):
51 r"""Our representation of a task for the `TaskController` interface.
52
53 The user should create instances of this class to represent a task that
54 needs to be done.
55
56 :Parameters:
57 expression : str
58 A str that is valid python code that is the task.
59 pull : str or list of str
60 The names of objects to be pulled as results. If not specified,
61 will return {'result', None}
62 push : dict
63 A dict of objects to be pushed into the engines namespace before
64 execution of the expression.
65 clear_before : boolean
66 Should the engine's namespace be cleared before the task is run.
67 Default=False.
68 clear_after : boolean
69 Should the engine's namespace be cleared after the task is run.
70 Default=False.
71 retries : int
72 The number of times to resumbit the task if it fails. Default=0.
73 recovery_task : Task
74 This is the Task to be run when the task has exhausted its retries
75 Default=None.
76 depend : bool function(properties)
77 This is the dependency function for the Task, which determines
78 whether a task can be run on a Worker. `depend` is called with
79 one argument, the worker's properties dict, and should return
80 True if the worker meets the dependencies or False if it does
81 not.
82 Default=None - run on any worker
83 options : dict
84 Any other keyword options for more elaborate uses of tasks
85
86 Examples
87 --------
39 class ITask(zi.Interface):
40 """
41 This interface provides a generic definition of what constitutes a task.
42
43 There are two sides to a task. First a task needs to take input from
44 a user to determine what work is performed by the task. Second, the
45 task needs to have the logic that knows how to turn that information
46 info specific calls to a worker, through the `IQueuedEngine` interface.
47
48 Many method in this class get two things passed to them: a Deferred
49 and an IQueuedEngine implementer. Such methods should register callbacks
50 on the Deferred that use the IQueuedEngine to accomplish something. See
51 the existing task objects for examples.
52 """
53
54 zi.Attribute('retries','How many times to retry the task')
55 zi.Attribute('recovery_task','A task to try if the initial one fails')
56 zi.Attribute('taskid','the id of the task')
57
58 def start_time(result):
59 """
60 Do anything needed to start the timing of the task.
61
62 Must simply return the result after starting the timers.
63 """
88 64
89 >>> t = Task('dostuff(args)')
90 >>> t = Task('a=5', pull='a')
91 >>> t = Task('a=5\nb=4', pull=['a','b'])
92 >>> t = Task('os.kill(os.getpid(),9)', retries=100) # this is a bad idea
65 def stop_time(result):
66 """
67 Do anything needed to stop the timing of the task.
68
69 Must simply return the result after stopping the timers. This
70 method will usually set attributes that are used by `process_result`
71 in building result of the task.
72 """
73
74 def pre_task(d, queued_engine):
75 """Do something with the queued_engine before the task is run.
76
77 This method should simply add callbacks to the input Deferred
78 that do something with the `queued_engine` before the task is run.
79
80 :Parameters:
81 d : Deferred
82 The deferred that actions should be attached to
83 queued_engine : IQueuedEngine implementer
84 The worker that has been allocated to perform the task
85 """
86
87 def post_task(d, queued_engine):
88 """Do something with the queued_engine after the task is run.
89
90 This method should simply add callbacks to the input Deferred
91 that do something with the `queued_engine` before the task is run.
92
93 :Parameters:
94 d : Deferred
95 The deferred that actions should be attached to
96 queued_engine : IQueuedEngine implementer
97 The worker that has been allocated to perform the task
98 """
99
100 def submit_task(d, queued_engine):
101 """Submit a task using the `queued_engine` we have been allocated.
102
103 When a task is ready to run, this method is called. This method
104 must take the internal information of the task and make suitable
105 calls on the queued_engine to have the actual work done.
106
107 This method should simply add callbacks to the input Deferred
108 that do something with the `queued_engine` before the task is run.
109
110 :Parameters:
111 d : Deferred
112 The deferred that actions should be attached to
113 queued_engine : IQueuedEngine implementer
114 The worker that has been allocated to perform the task
115 """
93 116
94 A dependency case:
95 >>> def hasMPI(props):
96 ... return props.get('mpi') is not None
97 >>> t = Task('mpi.send(blah,blah)', depend = hasMPI)
117 def process_result(d, result, engine_id):
118 """Take a raw task result.
119
120 Objects that implement `ITask` can choose how the result of running
121 the task is presented. This method takes the raw result and
122 does this logic. Two example are the `MapTask` which simply returns
123 the raw result or a `Failure` object and the `StringTask` which
124 returns a `TaskResult` object.
125
126 :Parameters:
127 d : Deferred
128 The deferred that actions should be attached to
129 result : object
130 The raw task result that needs to be wrapped
131 engine_id : int
132 The id of the engine that did the task
133
134 :Returns:
135 The result, as a tuple of the form: (success, result).
136 Here, success is a boolean indicating if the task
137 succeeded or failed and result is the result.
138 """
139
140 def check_depend(properties):
141 """Check properties to see if the task should be run.
142
143 :Parameters:
144 properties : dict
145 A dictionary of properties that an engine has set
146
147 :Returns:
148 True if the task should be run, False otherwise
149 """
150
151 def can_task(self):
152 """Serialize (can) any functions in the task for pickling.
153
154 Subclasses must override this method and make sure that all
155 functions in the task are canned by calling `can` on the
156 function.
157 """
158
159 def uncan_task(self):
160 """Unserialize (uncan) any canned function in the task."""
161
162 class BaseTask(object):
163 """
164 Common fuctionality for all objects implementing `ITask`.
98 165 """
99 166
100 def __init__(self, expression, pull=None, push=None,
101 clear_before=False, clear_after=False, retries=0,
102 recovery_task=None, depend=None, **options):
103 self.expression = expression
104 if isinstance(pull, str):
105 self.pull = [pull]
106 else:
107 self.pull = pull
108 self.push = push
167 zi.implements(ITask)
168
169 def __init__(self, clear_before=False, clear_after=False, retries=0,
170 recovery_task=None, depend=None):
171 """
172 Make a generic task.
173
174 :Parameters:
175 clear_before : boolean
176 Should the engines namespace be cleared before the task
177 is run
178 clear_after : boolean
179 Should the engines namespace be clear after the task is run
180 retries : int
181 The number of times a task should be retries upon failure
182 recovery_task : any task object
183 If a task fails and it has a recovery_task, that is run
184 upon a retry
185 depend : FunctionType
186 A function that is called to test for properties. This function
187 must take one argument, the properties dict and return a boolean
188 """
109 189 self.clear_before = clear_before
110 190 self.clear_after = clear_after
111 self.retries=retries
191 self.retries = retries
112 192 self.recovery_task = recovery_task
113 193 self.depend = depend
114 self.options = options
115 194 self.taskid = None
195
196 def start_time(self, result):
197 """
198 Start the basic timers.
199 """
200 self.start = time.time()
201 self.start_struct = time.localtime()
202 return result
203
204 def stop_time(self, result):
205 """
206 Stop the basic timers.
207 """
208 self.stop = time.time()
209 self.stop_struct = time.localtime()
210 self.duration = self.stop - self.start
211 self.submitted = time.strftime(time_format, self.start_struct)
212 self.completed = time.strftime(time_format)
213 return result
214
215 def pre_task(self, d, queued_engine):
216 """
217 Clear the engine before running the task if clear_before is set.
218 """
219 if self.clear_before:
220 d.addCallback(lambda r: queued_engine.reset())
221
222 def post_task(self, d, queued_engine):
223 """
224 Clear the engine after running the task if clear_after is set.
225 """
226 def reseter(result):
227 queued_engine.reset()
228 return result
229 if self.clear_after:
230 d.addBoth(reseter)
231
232 def submit_task(self, d, queued_engine):
233 raise NotImplementedError('submit_task must be implemented in a subclass')
234
235 def process_result(self, result, engine_id):
236 """
237 Process a task result.
238
239 This is the default `process_result` that just returns the raw
240 result or a `Failure`.
241 """
242 if isinstance(result, failure.Failure):
243 return (False, result)
244 else:
245 return (True, result)
246
247 def check_depend(self, properties):
248 """
249 Calls self.depend(properties) to see if a task should be run.
250 """
251 if self.depend is not None:
252 return self.depend(properties)
253 else:
254 return True
255
256 def can_task(self):
257 self.depend = can(self.depend)
258 if isinstance(self.recovery_task, BaseTask):
259 self.recovery_task.can_task()
260
261 def uncan_task(self):
262 self.depend = uncan(self.depend)
263 if isinstance(self.recovery_task, BaseTask):
264 self.recovery_task.uncan_task()
265
266 class MapTask(BaseTask):
267 """
268 A task that consists of a function and arguments.
269 """
270
271 zi.implements(ITask)
272
273 def __init__(self, function, args=None, kwargs=None, clear_before=False,
274 clear_after=False, retries=0, recovery_task=None, depend=None):
275 """
276 Create a task based on a function, args and kwargs.
277
278 This is a simple type of task that consists of calling:
279 function(*args, **kwargs) and wrapping the result in a `TaskResult`.
280
281 The return value of the function, or a `Failure` wrapping an
282 exception is the task result for this type of task.
283 """
284 BaseTask.__init__(self, clear_before, clear_after, retries,
285 recovery_task, depend)
286 if not isinstance(function, FunctionType):
287 raise TypeError('a task function must be a FunctionType')
288 self.function = function
289 if args is None:
290 self.args = ()
291 else:
292 self.args = args
293 if not isinstance(self.args, (list, tuple)):
294 raise TypeError('a task args must be a list or tuple')
295 if kwargs is None:
296 self.kwargs = {}
297 else:
298 self.kwargs = kwargs
299 if not isinstance(self.kwargs, dict):
300 raise TypeError('a task kwargs must be a dict')
301
302 def submit_task(self, d, queued_engine):
303 d.addCallback(lambda r: queued_engine.push_function(
304 dict(_ipython_task_function=self.function))
305 )
306 d.addCallback(lambda r: queued_engine.push(
307 dict(_ipython_task_args=self.args,_ipython_task_kwargs=self.kwargs))
308 )
309 d.addCallback(lambda r: queued_engine.execute(
310 '_ipython_task_result = _ipython_task_function(*_ipython_task_args,**_ipython_task_kwargs)')
311 )
312 d.addCallback(lambda r: queued_engine.pull('_ipython_task_result'))
313
314 def can_task(self):
315 self.function = can(self.function)
316 BaseTask.can_task(self)
317
318 def uncan_task(self):
319 self.function = uncan(self.function)
320 BaseTask.uncan_task(self)
321
322
323 class StringTask(BaseTask):
324 """
325 A task that consists of a string of Python code to run.
326 """
327
328 def __init__(self, expression, pull=None, push=None,
329 clear_before=False, clear_after=False, retries=0,
330 recovery_task=None, depend=None):
331 """
332 Create a task based on a Python expression and variables
333
334 This type of task lets you push a set of variables to the engines
335 namespace, run a Python string in that namespace and then bring back
336 a different set of Python variables as the result.
337
338 Because this type of task can return many results (through the
339 `pull` keyword argument) it returns a special `TaskResult` object
340 that wraps the pulled variables, statistics about the run and
341 any exceptions raised.
342 """
343 if not isinstance(expression, str):
344 raise TypeError('a task expression must be a string')
345 self.expression = expression
346
347 if pull==None:
348 self.pull = ()
349 elif isinstance(pull, str):
350 self.pull = (pull,)
351 elif isinstance(pull, (list, tuple)):
352 self.pull = pull
353 else:
354 raise TypeError('pull must be str or a sequence of strs')
355
356 if push==None:
357 self.push = {}
358 elif isinstance(push, dict):
359 self.push = push
360 else:
361 raise TypeError('push must be a dict')
362
363 BaseTask.__init__(self, clear_before, clear_after, retries,
364 recovery_task, depend)
116 365
117 class ResultNS:
118 """The result namespace object for use in TaskResult objects as tr.ns.
366 def submit_task(self, d, queued_engine):
367 if self.push is not None:
368 d.addCallback(lambda r: queued_engine.push(self.push))
369
370 d.addCallback(lambda r: queued_engine.execute(self.expression))
371
372 if self.pull is not None:
373 d.addCallback(lambda r: queued_engine.pull(self.pull))
374 else:
375 d.addCallback(lambda r: None)
376
377 def process_result(self, result, engine_id):
378 if isinstance(result, failure.Failure):
379 tr = TaskResult(result, engine_id)
380 else:
381 if self.pull is None:
382 resultDict = {}
383 elif len(self.pull) == 1:
384 resultDict = {self.pull[0]:result}
385 else:
386 resultDict = dict(zip(self.pull, result))
387 tr = TaskResult(resultDict, engine_id)
388 # Assign task attributes
389 tr.submitted = self.submitted
390 tr.completed = self.completed
391 tr.duration = self.duration
392 if hasattr(self,'taskid'):
393 tr.taskid = self.taskid
394 else:
395 tr.taskid = None
396 if isinstance(result, failure.Failure):
397 return (False, tr)
398 else:
399 return (True, tr)
400
401 class ResultNS(object):
402 """
403 A dict like object for holding the results of a task.
404
405 The result namespace object for use in `TaskResult` objects as tr.ns.
119 406 It builds an object from a dictionary, such that it has attributes
120 407 according to the key,value pairs of the dictionary.
121 408
@@ -128,15 +415,12 b' class ResultNS:'
128 415 --------
129 416
130 417 >>> ns = ResultNS({'a':17,'foo':range(3)})
131
132 418 >>> print ns
133 NS{'a': 17, 'foo': [0, 1, 2]}
134
419 NS{'a':17,'foo':range(3)}
135 420 >>> ns.a
136 17
137
421 17
138 422 >>> ns['foo']
139 [0, 1, 2]
423 [0,1,2]
140 424 """
141 425 def __init__(self, dikt):
142 426 for k,v in dikt.iteritems():
@@ -156,7 +440,7 b' class ResultNS:'
156 440
157 441 class TaskResult(object):
158 442 """
159 An object for returning task results.
443 An object for returning task results for certain types of tasks.
160 444
161 445 This object encapsulates the results of a task. On task
162 446 success it will have a keys attribute that will have a list
@@ -166,21 +450,21 b' class TaskResult(object):'
166 450
167 451 In task failure, keys will be empty, but failure will contain
168 452 the failure object that encapsulates the remote exception.
169 One can also simply call the raiseException() method of
453 One can also simply call the `raise_exception` method of
170 454 this class to re-raise any remote exception in the local
171 455 session.
172 456
173 The TaskResult has a .ns member, which is a property for access
457 The `TaskResult` has a `.ns` member, which is a property for access
174 458 to the results. If the Task had pull=['a', 'b'], then the
175 Task Result will have attributes tr.ns.a, tr.ns.b for those values.
176 Accessing tr.ns will raise the remote failure if the task failed.
459 Task Result will have attributes `tr.ns.a`, `tr.ns.b` for those values.
460 Accessing `tr.ns` will raise the remote failure if the task failed.
177 461
178 The engineid attribute should have the engineid of the engine
179 that ran the task. But, because engines can come and go in
180 the ipython task system, the engineid may not continue to be
462 The `engineid` attribute should have the `engineid` of the engine
463 that ran the task. But, because engines can come and go,
464 the `engineid` may not continue to be
181 465 valid or accurate.
182 466
183 The taskid attribute simply gives the taskid that the task
467 The `taskid` attribute simply gives the `taskid` that the task
184 468 is tracked under.
185 469 """
186 470 taskid = None
@@ -192,7 +476,7 b' class TaskResult(object):'
192 476 return self._ns
193 477
194 478 def _setNS(self, v):
195 raise Exception("I am protected!")
479 raise Exception("the ns attribute cannot be changed")
196 480
197 481 ns = property(_getNS, _setNS)
198 482
@@ -218,15 +502,19 b' class TaskResult(object):'
218 502
219 503 def __getitem__(self, key):
220 504 if self.failure is not None:
221 self.raiseException()
505 self.raise_exception()
222 506 return self.results[key]
223 507
224 def raiseException(self):
508 def raise_exception(self):
225 509 """Re-raise any remote exceptions in the local python session."""
226 510 if self.failure is not None:
227 511 self.failure.raiseException()
228 512
229 513
514 #-----------------------------------------------------------------------------
515 # The controller side of things
516 #-----------------------------------------------------------------------------
517
230 518 class IWorker(zi.Interface):
231 519 """The Basic Worker Interface.
232 520
@@ -241,12 +529,15 b' class IWorker(zi.Interface):'
241 529 :Parameters:
242 530 task : a `Task` object
243 531
244 :Returns: `Deferred` to a `TaskResult` object.
532 :Returns: `Deferred` to a tuple of (success, result) where
533 success if a boolean that signifies success or failure
534 and result is the task result.
245 535 """
246 536
247 537
248 538 class WorkerFromQueuedEngine(object):
249 539 """Adapt an `IQueuedEngine` to an `IWorker` object"""
540
250 541 zi.implements(IWorker)
251 542
252 543 def __init__(self, qe):
@@ -261,53 +552,27 b' class WorkerFromQueuedEngine(object):'
261 552 def run(self, task):
262 553 """Run task in worker's namespace.
263 554
555 This takes a task and calls methods on the task that actually
556 cause `self.queuedEngine` to do the task. See the methods of
557 `ITask` for more information about how these methods are called.
558
264 559 :Parameters:
265 560 task : a `Task` object
266 561
267 :Returns: `Deferred` to a `TaskResult` object.
562 :Returns: `Deferred` to a tuple of (success, result) where
563 success if a boolean that signifies success or failure
564 and result is the task result.
268 565 """
269 if task.clear_before:
270 d = self.queuedEngine.reset()
271 else:
272 d = defer.succeed(None)
273
274 if task.push is not None:
275 d.addCallback(lambda r: self.queuedEngine.push(task.push))
276
277 d.addCallback(lambda r: self.queuedEngine.execute(task.expression))
278
279 if task.pull is not None:
280 d.addCallback(lambda r: self.queuedEngine.pull(task.pull))
281 else:
282 d.addCallback(lambda r: None)
283
284 def reseter(result):
285 self.queuedEngine.reset()
286 return result
287
288 if task.clear_after:
289 d.addBoth(reseter)
290
291 return d.addBoth(self._zipResults, task.pull, time.time(), time.localtime())
292
293 def _zipResults(self, result, names, start, start_struct):
294 """Callback for construting the TaskResult object."""
295 if isinstance(result, failure.Failure):
296 tr = TaskResult(result, self.queuedEngine.id)
297 else:
298 if names is None:
299 resultDict = {}
300 elif len(names) == 1:
301 resultDict = {names[0]:result}
302 else:
303 resultDict = dict(zip(names, result))
304 tr = TaskResult(resultDict, self.queuedEngine.id)
305 # the time info
306 tr.submitted = time.strftime(time_format, start_struct)
307 tr.completed = time.strftime(time_format)
308 tr.duration = time.time()-start
309 return tr
310
566 d = defer.succeed(None)
567 d.addCallback(task.start_time)
568 task.pre_task(d, self.queuedEngine)
569 task.submit_task(d, self.queuedEngine)
570 task.post_task(d, self.queuedEngine)
571 d.addBoth(task.stop_time)
572 d.addBoth(task.process_result, self.queuedEngine.id)
573 # At this point, there will be (success, result) coming down the line
574 return d
575
311 576
312 577 components.registerAdapter(WorkerFromQueuedEngine, es.IEngineQueued, IWorker)
313 578
@@ -323,14 +588,14 b' class IScheduler(zi.Interface):'
323 588 """Add a task to the queue of the Scheduler.
324 589
325 590 :Parameters:
326 task : a `Task` object
591 task : an `ITask` implementer
327 592 The task to be queued.
328 593 flags : dict
329 594 General keywords for more sophisticated scheduling
330 595 """
331 596
332 597 def pop_task(id=None):
333 """Pops a Task object.
598 """Pops a task object from the queue.
334 599
335 600 This gets the next task to be run. If no `id` is requested, the highest priority
336 601 task is returned.
@@ -340,7 +605,7 b' class IScheduler(zi.Interface):'
340 605 The id of the task to be popped. The default (None) is to return
341 606 the highest priority task.
342 607
343 :Returns: a `Task` object
608 :Returns: an `ITask` implementer
344 609
345 610 :Exceptions:
346 611 IndexError : raised if no taskid in queue
@@ -350,8 +615,9 b' class IScheduler(zi.Interface):'
350 615 """Add a worker to the worker queue.
351 616
352 617 :Parameters:
353 worker : an IWorker implementing object
354 flags : General keywords for more sophisticated scheduling
618 worker : an `IWorker` implementer
619 flags : dict
620 General keywords for more sophisticated scheduling
355 621 """
356 622
357 623 def pop_worker(id=None):
@@ -374,15 +640,15 b' class IScheduler(zi.Interface):'
374 640 """Returns True if there is something to do, False otherwise"""
375 641
376 642 def schedule():
377 """Returns a tuple of the worker and task pair for the next
378 task to be run.
379 """
643 """Returns (worker,task) pair for the next task to be run."""
380 644
381 645
382 646 class FIFOScheduler(object):
383 """A basic First-In-First-Out (Queue) Scheduler.
384 This is the default Scheduler for the TaskController.
385 See the docstrings for IScheduler for interface details.
647 """
648 A basic First-In-First-Out (Queue) Scheduler.
649
650 This is the default Scheduler for the `TaskController`.
651 See the docstrings for `IScheduler` for interface details.
386 652 """
387 653
388 654 zi.implements(IScheduler)
@@ -439,7 +705,9 b' class FIFOScheduler(object):'
439 705 for t in self.tasks:
440 706 for w in self.workers:
441 707 try:# do not allow exceptions to break this
442 cando = t.depend is None or t.depend(w.properties)
708 # Allow the task to check itself using its
709 # check_depend method.
710 cando = t.check_depend(w.properties)
443 711 except:
444 712 cando = False
445 713 if cando:
@@ -449,9 +717,12 b' class FIFOScheduler(object):'
449 717
450 718
451 719 class LIFOScheduler(FIFOScheduler):
452 """A Last-In-First-Out (Stack) Scheduler. This scheduler should naively
453 reward fast engines by giving them more jobs. This risks starvation, but
454 only in cases with low load, where starvation does not really matter.
720 """
721 A Last-In-First-Out (Stack) Scheduler.
722
723 This scheduler should naively reward fast engines by giving
724 them more jobs. This risks starvation, but only in cases with
725 low load, where starvation does not really matter.
455 726 """
456 727
457 728 def add_task(self, task, **flags):
@@ -466,13 +737,15 b' class LIFOScheduler(FIFOScheduler):'
466 737
467 738
468 739 class ITaskController(cs.IControllerBase):
469 """The Task based interface to a `ControllerService` object
740 """
741 The Task based interface to a `ControllerService` object
470 742
471 743 This adapts a `ControllerService` to the ITaskController interface.
472 744 """
473 745
474 746 def run(task):
475 """Run a task.
747 """
748 Run a task.
476 749
477 750 :Parameters:
478 751 task : an IPython `Task` object
@@ -481,13 +754,14 b' class ITaskController(cs.IControllerBase):'
481 754 """
482 755
483 756 def get_task_result(taskid, block=False):
484 """Get the result of a task by its ID.
757 """
758 Get the result of a task by its ID.
485 759
486 760 :Parameters:
487 761 taskid : int
488 762 the id of the task whose result is requested
489 763
490 :Returns: `Deferred` to (taskid, actualResult) if the task is done, and None
764 :Returns: `Deferred` to the task result if the task is done, and None
491 765 if not.
492 766
493 767 :Exceptions:
@@ -512,23 +786,35 b' class ITaskController(cs.IControllerBase):'
512 786 """
513 787
514 788 def barrier(taskids):
515 """Block until the list of taskids are completed.
789 """
790 Block until the list of taskids are completed.
516 791
517 792 Returns None on success.
518 793 """
519 794
520 795 def spin():
521 """touch the scheduler, to resume scheduling without submitting
522 a task.
796 """
797 Touch the scheduler, to resume scheduling without submitting a task.
523 798 """
524 799
525 def queue_status(self, verbose=False):
526 """Get a dictionary with the current state of the task queue.
800 def queue_status(verbose=False):
801 """
802 Get a dictionary with the current state of the task queue.
527 803
528 804 If verbose is True, then return lists of taskids, otherwise,
529 805 return the number of tasks with each status.
530 806 """
531 807
808 def clear():
809 """
810 Clear all previously run tasks from the task controller.
811
812 This is needed because the task controller keep all task results
813 in memory. This can be a problem is there are many completed
814 tasks. Users should call this periodically to clean out these
815 cached task results.
816 """
817
532 818
533 819 class TaskController(cs.ControllerAdapterBase):
534 820 """The Task based interface to a Controller object.
@@ -565,7 +851,7 b' class TaskController(cs.ControllerAdapterBase):'
565 851 def registerWorker(self, id):
566 852 """Called by controller.register_engine."""
567 853 if self.workers.get(id):
568 raise "We already have one! This should not happen."
854 raise ValueError("worker with id %s already exists. This should not happen." % id)
569 855 self.workers[id] = IWorker(self.controller.engines[id])
570 856 self.workers[id].workerid = id
571 857 if not self.pendingTasks.has_key(id):# if not working
@@ -590,21 +876,25 b' class TaskController(cs.ControllerAdapterBase):'
590 876 #---------------------------------------------------------------------------
591 877
592 878 def run(self, task):
593 """Run a task and return `Deferred` to its taskid."""
879 """
880 Run a task and return `Deferred` to its taskid.
881 """
594 882 task.taskid = self.taskid
595 883 task.start = time.localtime()
596 884 self.taskid += 1
597 885 d = defer.Deferred()
598 886 self.scheduler.add_task(task)
599 # log.msg('Queuing task: %i' % task.taskid)
887 log.msg('Queuing task: %i' % task.taskid)
600 888
601 889 self.deferredResults[task.taskid] = []
602 890 self.distributeTasks()
603 891 return defer.succeed(task.taskid)
604 892
605 893 def get_task_result(self, taskid, block=False):
606 """Returns a `Deferred` to a TaskResult tuple or None."""
607 # log.msg("Getting task result: %i" % taskid)
894 """
895 Returns a `Deferred` to the task result, or None.
896 """
897 log.msg("Getting task result: %i" % taskid)
608 898 if self.finishedResults.has_key(taskid):
609 899 tr = self.finishedResults[taskid]
610 900 return defer.succeed(tr)
@@ -619,7 +909,9 b' class TaskController(cs.ControllerAdapterBase):'
619 909 return defer.fail(IndexError("task ID not registered: %r" % taskid))
620 910
621 911 def abort(self, taskid):
622 """Remove a task from the queue if it has not been run already."""
912 """
913 Remove a task from the queue if it has not been run already.
914 """
623 915 if not isinstance(taskid, int):
624 916 return defer.fail(failure.Failure(TypeError("an integer task id expected: %r" % taskid)))
625 917 try:
@@ -678,8 +970,10 b' class TaskController(cs.ControllerAdapterBase):'
678 970 #---------------------------------------------------------------------------
679 971
680 972 def _doAbort(self, taskid):
681 """Helper function for aborting a pending task."""
682 # log.msg("Task aborted: %i" % taskid)
973 """
974 Helper function for aborting a pending task.
975 """
976 log.msg("Task aborted: %i" % taskid)
683 977 result = failure.Failure(error.TaskAborted())
684 978 self._finishTask(taskid, result)
685 979 if taskid in self.abortPending:
@@ -687,14 +981,16 b' class TaskController(cs.ControllerAdapterBase):'
687 981
688 982 def _finishTask(self, taskid, result):
689 983 dlist = self.deferredResults.pop(taskid)
690 result.taskid = taskid # The TaskResult should save the taskid
984 # result.taskid = taskid # The TaskResult should save the taskid
691 985 self.finishedResults[taskid] = result
692 986 for d in dlist:
693 987 d.callback(result)
694 988
695 989 def distributeTasks(self):
696 """Distribute tasks while self.scheduler has things to do."""
697 # log.msg("distributing Tasks")
990 """
991 Distribute tasks while self.scheduler has things to do.
992 """
993 log.msg("distributing Tasks")
698 994 worker, task = self.scheduler.schedule()
699 995 if not worker and not task:
700 996 if self.idleLater and self.idleLater.called:# we are inside failIdle
@@ -709,7 +1005,7 b' class TaskController(cs.ControllerAdapterBase):'
709 1005 self.pendingTasks[worker.workerid] = task
710 1006 # run/link callbacks
711 1007 d = worker.run(task)
712 # log.msg("Running task %i on worker %i" %(task.taskid, worker.workerid))
1008 log.msg("Running task %i on worker %i" %(task.taskid, worker.workerid))
713 1009 d.addBoth(self.taskCompleted, task.taskid, worker.workerid)
714 1010 worker, task = self.scheduler.schedule()
715 1011 # check for idle timeout:
@@ -731,14 +1027,15 b' class TaskController(cs.ControllerAdapterBase):'
731 1027 t = self.scheduler.pop_task()
732 1028 msg = "task %i failed to execute due to unmet dependencies"%t.taskid
733 1029 msg += " for %i seconds"%self.timeout
734 # log.msg("Task aborted by timeout: %i" % t.taskid)
1030 log.msg("Task aborted by timeout: %i" % t.taskid)
735 1031 f = failure.Failure(error.TaskTimeout(msg))
736 1032 self._finishTask(t.taskid, f)
737 1033 self.idleLater = None
738 1034
739 1035
740 def taskCompleted(self, result, taskid, workerid):
1036 def taskCompleted(self, success_and_result, taskid, workerid):
741 1037 """This is the err/callback for a completed task."""
1038 success, result = success_and_result
742 1039 try:
743 1040 task = self.pendingTasks.pop(workerid)
744 1041 except:
@@ -755,7 +1052,7 b' class TaskController(cs.ControllerAdapterBase):'
755 1052 aborted = True
756 1053
757 1054 if not aborted:
758 if result.failure is not None and isinstance(result.failure, failure.Failure): # we failed
1055 if not success:
759 1056 log.msg("Task %i failed on worker %i"% (taskid, workerid))
760 1057 if task.retries > 0: # resubmit
761 1058 task.retries -= 1
@@ -763,7 +1060,7 b' class TaskController(cs.ControllerAdapterBase):'
763 1060 s = "Resubmitting task %i, %i retries remaining" %(taskid, task.retries)
764 1061 log.msg(s)
765 1062 self.distributeTasks()
766 elif isinstance(task.recovery_task, Task) and \
1063 elif isinstance(task.recovery_task, BaseTask) and \
767 1064 task.recovery_task.retries > -1:
768 1065 # retries = -1 is to prevent infinite recovery_task loop
769 1066 task.retries = -1
@@ -779,17 +1076,18 b' class TaskController(cs.ControllerAdapterBase):'
779 1076 # it may have died, and not yet been unregistered
780 1077 reactor.callLater(self.failurePenalty, self.readmitWorker, workerid)
781 1078 else: # we succeeded
782 # log.msg("Task completed: %i"% taskid)
1079 log.msg("Task completed: %i"% taskid)
783 1080 self._finishTask(taskid, result)
784 1081 self.readmitWorker(workerid)
785 else:# we aborted the task
786 if result.failure is not None and isinstance(result.failure, failure.Failure): # it failed, penalize worker
1082 else: # we aborted the task
1083 if not success:
787 1084 reactor.callLater(self.failurePenalty, self.readmitWorker, workerid)
788 1085 else:
789 1086 self.readmitWorker(workerid)
790 1087
791 1088 def readmitWorker(self, workerid):
792 """Readmit a worker to the scheduler.
1089 """
1090 Readmit a worker to the scheduler.
793 1091
794 1092 This is outside `taskCompleted` because of the `failurePenalty` being
795 1093 implemented through `reactor.callLater`.
@@ -798,6 +1096,18 b' class TaskController(cs.ControllerAdapterBase):'
798 1096 if workerid in self.workers.keys() and workerid not in self.pendingTasks.keys():
799 1097 self.scheduler.add_worker(self.workers[workerid])
800 1098 self.distributeTasks()
1099
1100 def clear(self):
1101 """
1102 Clear all previously run tasks from the task controller.
1103
1104 This is needed because the task controller keeps all task results
1105 in memory. This can be a problem if there are many completed
1106 tasks. Users should call this periodically to clean out these
1107 cached task results.
1108 """
1109 self.finishedResults = {}
1110 return defer.succeed(None)
801 1111
802 1112
803 1113 components.registerAdapter(TaskController, cs.IControllerBase, ITaskController)
@@ -1,9 +1,8 b''
1 1 # encoding: utf-8
2 2 # -*- test-case-name: IPython.kernel.tests.test_taskcontrollerxmlrpc -*-
3 3
4 """The Generic Task Client object.
5
6 This must be subclassed based on your connection method.
4 """
5 A blocking version of the task client.
7 6 """
8 7
9 8 __docformat__ = "restructuredtext en"
@@ -24,119 +23,100 b' from twisted.python import components, log'
24 23
25 24 from IPython.kernel.twistedutil import blockingCallFromThread
26 25 from IPython.kernel import task, error
26 from IPython.kernel.mapper import (
27 SynchronousTaskMapper,
28 ITaskMapperFactory,
29 IMapper
30 )
31 from IPython.kernel.parallelfunction import (
32 ParallelFunction,
33 ITaskParallelDecorator
34 )
27 35
28 36 #-------------------------------------------------------------------------------
29 # Connecting Task Client
37 # The task client
30 38 #-------------------------------------------------------------------------------
31 39
32 class InteractiveTaskClient(object):
33
34 def irun(self, *args, **kwargs):
35 """Run a task on the `TaskController`.
36
37 This method is a shorthand for run(task) and its arguments are simply
38 passed onto a `Task` object:
39
40 irun(*args, **kwargs) -> run(Task(*args, **kwargs))
41
42 :Parameters:
43 expression : str
44 A str that is valid python code that is the task.
45 pull : str or list of str
46 The names of objects to be pulled as results.
47 push : dict
48 A dict of objects to be pushed into the engines namespace before
49 execution of the expression.
50 clear_before : boolean
51 Should the engine's namespace be cleared before the task is run.
52 Default=False.
53 clear_after : boolean
54 Should the engine's namespace be cleared after the task is run.
55 Default=False.
56 retries : int
57 The number of times to resumbit the task if it fails. Default=0.
58 options : dict
59 Any other keyword options for more elaborate uses of tasks
60
61 :Returns: A `TaskResult` object.
62 """
63 block = kwargs.pop('block', False)
64 if len(args) == 1 and isinstance(args[0], task.Task):
65 t = args[0]
66 else:
67 t = task.Task(*args, **kwargs)
68 taskid = self.run(t)
69 print "TaskID = %i"%taskid
70 if block:
71 return self.get_task_result(taskid, block)
72 else:
73 return taskid
74
75 40 class IBlockingTaskClient(Interface):
76 41 """
77 An interface for blocking task clients.
42 A vague interface of the blocking task client
78 43 """
79 44 pass
80 45
81
82 class BlockingTaskClient(InteractiveTaskClient):
46 class BlockingTaskClient(object):
83 47 """
84 This class provides a blocking task client.
48 A blocking task client that adapts a non-blocking one.
85 49 """
86 50
87 implements(IBlockingTaskClient)
51 implements(
52 IBlockingTaskClient,
53 ITaskMapperFactory,
54 IMapper,
55 ITaskParallelDecorator
56 )
88 57
89 58 def __init__(self, task_controller):
90 59 self.task_controller = task_controller
91 60 self.block = True
92 61
93 def run(self, task):
94 """
95 Run a task and return a task id that can be used to get the task result.
62 def run(self, task, block=False):
63 """Run a task on the `TaskController`.
64
65 See the documentation of the `MapTask` and `StringTask` classes for
66 details on how to build a task of different types.
96 67
97 68 :Parameters:
98 task : `Task`
99 The `Task` object to run
69 task : an `ITask` implementer
70
71 :Returns: The int taskid of the submitted task. Pass this to
72 `get_task_result` to get the `TaskResult` object.
100 73 """
101 return blockingCallFromThread(self.task_controller.run, task)
74 tid = blockingCallFromThread(self.task_controller.run, task)
75 if block:
76 return self.get_task_result(tid, block=True)
77 else:
78 return tid
102 79
103 80 def get_task_result(self, taskid, block=False):
104 81 """
105 Get or poll for a task result.
82 Get a task result by taskid.
106 83
107 84 :Parameters:
108 85 taskid : int
109 The id of the task whose result to get
86 The taskid of the task to be retrieved.
110 87 block : boolean
111 If True, wait until the task is done and then result the
112 `TaskResult` object. If False, just poll for the result and
113 return None if the task is not done.
88 Should I block until the task is done?
89
90 :Returns: A `TaskResult` object that encapsulates the task result.
114 91 """
115 92 return blockingCallFromThread(self.task_controller.get_task_result,
116 93 taskid, block)
117 94
118 95 def abort(self, taskid):
119 96 """
120 Abort a task by task id if it has not been started.
97 Abort a task by taskid.
98
99 :Parameters:
100 taskid : int
101 The taskid of the task to be aborted.
121 102 """
122 103 return blockingCallFromThread(self.task_controller.abort, taskid)
123 104
124 105 def barrier(self, taskids):
125 """
126 Wait for a set of tasks to finish.
106 """Block until a set of tasks are completed.
127 107
128 108 :Parameters:
129 taskids : list of ints
130 A list of task ids to wait for.
109 taskids : list, tuple
110 A sequence of taskids to block on.
131 111 """
132 112 return blockingCallFromThread(self.task_controller.barrier, taskids)
133 113
134 114 def spin(self):
135 115 """
136 Cause the scheduler to schedule tasks.
116 Touch the scheduler, to resume scheduling without submitting a task.
137 117
138 118 This method only needs to be called in unusual situations where the
139 scheduler is idle for some reason.
119 scheduler is idle for some reason.
140 120 """
141 121 return blockingCallFromThread(self.task_controller.spin)
142 122
@@ -153,7 +133,46 b' class BlockingTaskClient(InteractiveTaskClient):'
153 133 A dict with the queue status.
154 134 """
155 135 return blockingCallFromThread(self.task_controller.queue_status, verbose)
136
137 def clear(self):
138 """
139 Clear all previously run tasks from the task controller.
140
141 This is needed because the task controller keeps all task results
142 in memory. This can be a problem if there are many completed
143 tasks. Users should call this periodically to clean out these
144 cached task results.
145 """
146 return blockingCallFromThread(self.task_controller.clear)
147
148 def map(self, func, *sequences):
149 """
150 Apply func to *sequences elementwise. Like Python's builtin map.
151
152 This version is load balanced.
153 """
154 return self.mapper().map(func, *sequences)
156 155
156 def mapper(self, clear_before=False, clear_after=False, retries=0,
157 recovery_task=None, depend=None, block=True):
158 """
159 Create an `IMapper` implementer with a given set of arguments.
160
161 The `IMapper` created using a task controller is load balanced.
162
163 See the documentation for `IPython.kernel.task.BaseTask` for
164 documentation on the arguments to this method.
165 """
166 return SynchronousTaskMapper(self, clear_before=clear_before,
167 clear_after=clear_after, retries=retries,
168 recovery_task=recovery_task, depend=depend, block=block)
169
170 def parallel(self, clear_before=False, clear_after=False, retries=0,
171 recovery_task=None, depend=None, block=True):
172 mapper = self.mapper(clear_before, clear_after, retries,
173 recovery_task, depend, block)
174 pf = ParallelFunction(mapper)
175 return pf
157 176
158 177 components.registerAdapter(BlockingTaskClient,
159 178 task.ITaskController, IBlockingTaskClient)
@@ -34,6 +34,15 b' from IPython.kernel.clientinterfaces import ('
34 34 IFCClientInterfaceProvider,
35 35 IBlockingClientAdaptor
36 36 )
37 from IPython.kernel.mapper import (
38 TaskMapper,
39 ITaskMapperFactory,
40 IMapper
41 )
42 from IPython.kernel.parallelfunction import (
43 ParallelFunction,
44 ITaskParallelDecorator
45 )
37 46
38 47 #-------------------------------------------------------------------------------
39 48 # The Controller side of things
@@ -43,32 +52,38 b' from IPython.kernel.clientinterfaces import ('
43 52 class IFCTaskController(Interface):
44 53 """Foolscap interface to task controller.
45 54
46 See the documentation of ITaskController for documentation about the methods.
55 See the documentation of `ITaskController` for more information.
47 56 """
48 def remote_run(request, binTask):
57 def remote_run(binTask):
49 58 """"""
50 59
51 def remote_abort(request, taskid):
60 def remote_abort(taskid):
52 61 """"""
53 62
54 def remote_get_task_result(request, taskid, block=False):
63 def remote_get_task_result(taskid, block=False):
55 64 """"""
56 65
57 def remote_barrier(request, taskids):
66 def remote_barrier(taskids):
67 """"""
68
69 def remote_spin():
58 70 """"""
59 71
60 def remote_spin(request):
72 def remote_queue_status(verbose):
61 73 """"""
62 74
63 def remote_queue_status(request, verbose):
75 def remote_clear():
64 76 """"""
65 77
66 78
67 79 class FCTaskControllerFromTaskController(Referenceable):
68 """XML-RPC attachmeot for controller.
69
70 See IXMLRPCTaskController and ITaskController (and its children) for documentation.
71 80 """
81 Adapt a `TaskController` to an `IFCTaskController`
82
83 This class is used to expose a `TaskController` over the wire using
84 the Foolscap network protocol.
85 """
86
72 87 implements(IFCTaskController, IFCClientInterfaceProvider)
73 88
74 89 def __init__(self, taskController):
@@ -92,8 +107,8 b' class FCTaskControllerFromTaskController(Referenceable):'
92 107
93 108 def remote_run(self, ptask):
94 109 try:
95 ctask = pickle.loads(ptask)
96 task = taskmodule.uncanTask(ctask)
110 task = pickle.loads(ptask)
111 task.uncan_task()
97 112 except:
98 113 d = defer.fail(pickle.UnpickleableError("Could not unmarshal task"))
99 114 else:
@@ -132,6 +147,9 b' class FCTaskControllerFromTaskController(Referenceable):'
132 147 d.addErrback(self.packageFailure)
133 148 return d
134 149
150 def remote_clear(self):
151 return self.taskController.clear()
152
135 153 def remote_get_client_name(self):
136 154 return 'IPython.kernel.taskfc.FCTaskClient'
137 155
@@ -144,13 +162,23 b' components.registerAdapter(FCTaskControllerFromTaskController,'
144 162 #-------------------------------------------------------------------------------
145 163
146 164 class FCTaskClient(object):
147 """XML-RPC based TaskController client that implements ITaskController.
148
149 :Parameters:
150 addr : (ip, port)
151 The ip (str) and port (int) tuple of the `TaskController`.
152 165 """
153 implements(taskmodule.ITaskController, IBlockingClientAdaptor)
166 Client class for Foolscap exposed `TaskController`.
167
168 This class is an adapter that makes a `RemoteReference` to a
169 `TaskController` look like an actual `ITaskController` on the client side.
170
171 This class also implements `IBlockingClientAdaptor` so that clients can
172 automatically get a blocking version of this class.
173 """
174
175 implements(
176 taskmodule.ITaskController,
177 IBlockingClientAdaptor,
178 ITaskMapperFactory,
179 IMapper,
180 ITaskParallelDecorator
181 )
154 182
155 183 def __init__(self, remote_reference):
156 184 self.remote_reference = remote_reference
@@ -168,48 +196,26 b' class FCTaskClient(object):'
168 196 def run(self, task):
169 197 """Run a task on the `TaskController`.
170 198
171 :Parameters:
172 task : a `Task` object
173
174 The Task object is created using the following signature:
175
176 Task(expression, pull=None, push={}, clear_before=False,
177 clear_after=False, retries=0, **options):)
199 See the documentation of the `MapTask` and `StringTask` classes for
200 details on how to build a task of different types.
178 201
179 The meaning of the arguments is as follows:
202 :Parameters:
203 task : an `ITask` implementer
180 204
181 :Task Parameters:
182 expression : str
183 A str that is valid python code that is the task.
184 pull : str or list of str
185 The names of objects to be pulled as results.
186 push : dict
187 A dict of objects to be pushed into the engines namespace before
188 execution of the expression.
189 clear_before : boolean
190 Should the engine's namespace be cleared before the task is run.
191 Default=False.
192 clear_after : boolean
193 Should the engine's namespace be cleared after the task is run.
194 Default=False.
195 retries : int
196 The number of times to resumbit the task if it fails. Default=0.
197 options : dict
198 Any other keyword options for more elaborate uses of tasks
199
200 205 :Returns: The int taskid of the submitted task. Pass this to
201 206 `get_task_result` to get the `TaskResult` object.
202 207 """
203 assert isinstance(task, taskmodule.Task), "task must be a Task object!"
204 ctask = taskmodule.canTask(task) # handles arbitrary function in .depend
205 # as well as arbitrary recovery_task chains
206 ptask = pickle.dumps(ctask, 2)
208 assert isinstance(task, taskmodule.BaseTask), "task must be a Task object!"
209 task.can_task()
210 ptask = pickle.dumps(task, 2)
211 task.uncan_task()
207 212 d = self.remote_reference.callRemote('run', ptask)
208 213 d.addCallback(self.unpackage)
209 214 return d
210 215
211 216 def get_task_result(self, taskid, block=False):
212 """The task result by taskid.
217 """
218 Get a task result by taskid.
213 219
214 220 :Parameters:
215 221 taskid : int
@@ -224,20 +230,19 b' class FCTaskClient(object):'
224 230 return d
225 231
226 232 def abort(self, taskid):
227 """Abort a task by taskid.
233 """
234 Abort a task by taskid.
228 235
229 236 :Parameters:
230 237 taskid : int
231 238 The taskid of the task to be aborted.
232 block : boolean
233 Should I block until the task is aborted.
234 239 """
235 240 d = self.remote_reference.callRemote('abort', taskid)
236 241 d.addCallback(self.unpackage)
237 242 return d
238 243
239 244 def barrier(self, taskids):
240 """Block until all tasks are completed.
245 """Block until a set of tasks are completed.
241 246
242 247 :Parameters:
243 248 taskids : list, tuple
@@ -248,20 +253,77 b' class FCTaskClient(object):'
248 253 return d
249 254
250 255 def spin(self):
251 """touch the scheduler, to resume scheduling without submitting
252 a task.
256 """
257 Touch the scheduler, to resume scheduling without submitting a task.
258
259 This method only needs to be called in unusual situations where the
260 scheduler is idle for some reason.
253 261 """
254 262 d = self.remote_reference.callRemote('spin')
255 263 d.addCallback(self.unpackage)
256 264 return d
257 265
258 266 def queue_status(self, verbose=False):
259 """Return a dict with the status of the task queue."""
267 """
268 Get a dictionary with the current state of the task queue.
269
270 :Parameters:
271 verbose : boolean
272 If True, return a list of taskids. If False, simply give
273 the number of tasks with each status.
274
275 :Returns:
276 A dict with the queue status.
277 """
260 278 d = self.remote_reference.callRemote('queue_status', verbose)
261 279 d.addCallback(self.unpackage)
262 280 return d
263 281
282 def clear(self):
283 """
284 Clear all previously run tasks from the task controller.
285
286 This is needed because the task controller keeps all task results
287 in memory. This can be a problem if there are many completed
288 tasks. Users should call this periodically to clean out these
289 cached task results.
290 """
291 d = self.remote_reference.callRemote('clear')
292 return d
293
264 294 def adapt_to_blocking_client(self):
295 """
296 Wrap self in a blocking version that implements `IBlockingTaskClient`.
297 """
265 298 from IPython.kernel.taskclient import IBlockingTaskClient
266 299 return IBlockingTaskClient(self)
300
301 def map(self, func, *sequences):
302 """
303 Apply func to *sequences elementwise. Like Python's builtin map.
304
305 This version is load balanced.
306 """
307 return self.mapper().map(func, *sequences)
308
309 def mapper(self, clear_before=False, clear_after=False, retries=0,
310 recovery_task=None, depend=None, block=True):
311 """
312 Create an `IMapper` implementer with a given set of arguments.
313
314 The `IMapper` created using a task controller is load balanced.
315
316 See the documentation for `IPython.kernel.task.BaseTask` for
317 documentation on the arguments to this method.
318 """
319 return TaskMapper(self, clear_before=clear_before,
320 clear_after=clear_after, retries=retries,
321 recovery_task=recovery_task, depend=depend, block=block)
322
323 def parallel(self, clear_before=False, clear_after=False, retries=0,
324 recovery_task=None, depend=None, block=True):
325 mapper = self.mapper(clear_before, clear_after, retries,
326 recovery_task, depend, block)
327 pf = ParallelFunction(mapper)
328 return pf
267 329
@@ -163,7 +163,6 b' class IEngineCoreTestCase(object):'
163 163 try:
164 164 import numpy
165 165 except:
166 print 'no numpy, ',
167 166 return
168 167 a = numpy.random.random(1000)
169 168 d = self.engine.push(dict(a=a))
@@ -733,7 +733,7 b' class ISynchronousMultiEngineCoordinatorTestCase(IMultiEngineCoordinatorTestCase'
733 733 d.addCallback(lambda did: self.multiengine.get_pending_deferred(did, True))
734 734 d.addCallback(lambda r: self.assertEquals(r, range(16)))
735 735 return d
736
736
737 737 def testScatterGatherNumpyNonblocking(self):
738 738 try:
739 739 import numpy
@@ -749,17 +749,7 b' class ISynchronousMultiEngineCoordinatorTestCase(IMultiEngineCoordinatorTestCase'
749 749 d.addCallback(lambda did: self.multiengine.get_pending_deferred(did, True))
750 750 d.addCallback(lambda r: assert_array_equal(r, a))
751 751 return d
752
753 def testMapNonblocking(self):
754 self.addEngine(4)
755 def f(x):
756 return x**2
757 data = range(16)
758 d= self.multiengine.map(f, data, block=False)
759 d.addCallback(lambda did: self.multiengine.get_pending_deferred(did, True))
760 d.addCallback(lambda r: self.assertEquals(r,[f(x) for x in data]))
761 return d
762
752
763 753 def test_clear_pending_deferreds(self):
764 754 self.addEngine(4)
765 755 did_list = []
@@ -43,23 +43,23 b' class TaskTestBase(object):'
43 43
44 44 class ITaskControllerTestCase(TaskTestBase):
45 45
46 def testTaskIDs(self):
46 def test_task_ids(self):
47 47 self.addEngine(1)
48 d = self.tc.run(task.Task('a=5'))
48 d = self.tc.run(task.StringTask('a=5'))
49 49 d.addCallback(lambda r: self.assertEquals(r, 0))
50 d.addCallback(lambda r: self.tc.run(task.Task('a=5')))
50 d.addCallback(lambda r: self.tc.run(task.StringTask('a=5')))
51 51 d.addCallback(lambda r: self.assertEquals(r, 1))
52 d.addCallback(lambda r: self.tc.run(task.Task('a=5')))
52 d.addCallback(lambda r: self.tc.run(task.StringTask('a=5')))
53 53 d.addCallback(lambda r: self.assertEquals(r, 2))
54 d.addCallback(lambda r: self.tc.run(task.Task('a=5')))
54 d.addCallback(lambda r: self.tc.run(task.StringTask('a=5')))
55 55 d.addCallback(lambda r: self.assertEquals(r, 3))
56 56 return d
57 57
58 def testAbort(self):
58 def test_abort(self):
59 59 """Cannot do a proper abort test, because blocking execution prevents
60 60 abort from being called before task completes"""
61 61 self.addEngine(1)
62 t = task.Task('a=5')
62 t = task.StringTask('a=5')
63 63 d = self.tc.abort(0)
64 64 d.addErrback(lambda f: self.assertRaises(IndexError, f.raiseException))
65 65 d.addCallback(lambda _:self.tc.run(t))
@@ -67,15 +67,15 b' class ITaskControllerTestCase(TaskTestBase):'
67 67 d.addErrback(lambda f: self.assertRaises(IndexError, f.raiseException))
68 68 return d
69 69
70 def testAbortType(self):
70 def test_abort_type(self):
71 71 self.addEngine(1)
72 72 d = self.tc.abort('asdfadsf')
73 73 d.addErrback(lambda f: self.assertRaises(TypeError, f.raiseException))
74 74 return d
75 75
76 def testClears(self):
76 def test_clear_before_and_after(self):
77 77 self.addEngine(1)
78 t = task.Task('a=1', clear_before=True, pull='b', clear_after=True)
78 t = task.StringTask('a=1', clear_before=True, pull='b', clear_after=True)
79 79 d = self.multiengine.execute('b=1', targets=0)
80 80 d.addCallback(lambda _: self.tc.run(t))
81 81 d.addCallback(lambda tid: self.tc.get_task_result(tid,block=True))
@@ -85,10 +85,10 b' class ITaskControllerTestCase(TaskTestBase):'
85 85 d.addErrback(lambda f: self.assertRaises(NameError, _raise_it, f))
86 86 return d
87 87
88 def testSimpleRetries(self):
88 def test_simple_retries(self):
89 89 self.addEngine(1)
90 t = task.Task("i += 1\nassert i == 16", pull='i',retries=10)
91 t2 = task.Task("i += 1\nassert i == 16", pull='i',retries=10)
90 t = task.StringTask("i += 1\nassert i == 16", pull='i',retries=10)
91 t2 = task.StringTask("i += 1\nassert i == 16", pull='i',retries=10)
92 92 d = self.multiengine.execute('i=0', targets=0)
93 93 d.addCallback(lambda r: self.tc.run(t))
94 94 d.addCallback(self.tc.get_task_result, block=True)
@@ -101,10 +101,10 b' class ITaskControllerTestCase(TaskTestBase):'
101 101 d.addCallback(lambda r: self.assertEquals(r, 16))
102 102 return d
103 103
104 def testRecoveryTasks(self):
104 def test_recovery_tasks(self):
105 105 self.addEngine(1)
106 t = task.Task("i=16", pull='i')
107 t2 = task.Task("raise Exception", recovery_task=t, retries = 2)
106 t = task.StringTask("i=16", pull='i')
107 t2 = task.StringTask("raise Exception", recovery_task=t, retries = 2)
108 108
109 109 d = self.tc.run(t2)
110 110 d.addCallback(self.tc.get_task_result, block=True)
@@ -112,47 +112,76 b' class ITaskControllerTestCase(TaskTestBase):'
112 112 d.addCallback(lambda r: self.assertEquals(r, 16))
113 113 return d
114 114
115 # def testInfiniteRecoveryLoop(self):
116 # self.addEngine(1)
117 # t = task.Task("raise Exception", retries = 5)
118 # t2 = task.Task("assert True", retries = 2, recovery_task = t)
119 # t.recovery_task = t2
120 #
121 # d = self.tc.run(t)
122 # d.addCallback(self.tc.get_task_result, block=True)
123 # d.addCallback(lambda tr: tr.ns.i)
124 # d.addBoth(printer)
125 # d.addErrback(lambda f: self.assertRaises(AssertionError, f.raiseException))
126 # return d
127 #
128 def testSetupNS(self):
115 def test_setup_ns(self):
129 116 self.addEngine(1)
130 117 d = self.multiengine.execute('a=0', targets=0)
131 118 ns = dict(a=1, b=0)
132 t = task.Task("", push=ns, pull=['a','b'])
119 t = task.StringTask("", push=ns, pull=['a','b'])
133 120 d.addCallback(lambda r: self.tc.run(t))
134 121 d.addCallback(self.tc.get_task_result, block=True)
135 122 d.addCallback(lambda tr: {'a':tr.ns.a, 'b':tr['b']})
136 123 d.addCallback(lambda r: self.assertEquals(r, ns))
137 124 return d
138 125
139 def testTaskResults(self):
126 def test_string_task_results(self):
140 127 self.addEngine(1)
141 t1 = task.Task('a=5', pull='a')
128 t1 = task.StringTask('a=5', pull='a')
142 129 d = self.tc.run(t1)
143 130 d.addCallback(self.tc.get_task_result, block=True)
144 d.addCallback(lambda tr: (tr.ns.a,tr['a'],tr.failure, tr.raiseException()))
131 d.addCallback(lambda tr: (tr.ns.a,tr['a'],tr.failure, tr.raise_exception()))
145 132 d.addCallback(lambda r: self.assertEquals(r, (5,5,None,None)))
146 133
147 t2 = task.Task('7=5')
134 t2 = task.StringTask('7=5')
148 135 d.addCallback(lambda r: self.tc.run(t2))
149 136 d.addCallback(self.tc.get_task_result, block=True)
150 137 d.addCallback(lambda tr: tr.ns)
151 138 d.addErrback(lambda f: self.assertRaises(SyntaxError, f.raiseException))
152 139
153 t3 = task.Task('', pull='b')
140 t3 = task.StringTask('', pull='b')
154 141 d.addCallback(lambda r: self.tc.run(t3))
155 142 d.addCallback(self.tc.get_task_result, block=True)
156 143 d.addCallback(lambda tr: tr.ns)
157 144 d.addErrback(lambda f: self.assertRaises(NameError, f.raiseException))
158 145 return d
146
147 def test_map_task(self):
148 self.addEngine(1)
149 t1 = task.MapTask(lambda x: 2*x,(10,))
150 d = self.tc.run(t1)
151 d.addCallback(self.tc.get_task_result, block=True)
152 d.addCallback(lambda r: self.assertEquals(r,20))
153
154 t2 = task.MapTask(lambda : 20)
155 d.addCallback(lambda _: self.tc.run(t2))
156 d.addCallback(self.tc.get_task_result, block=True)
157 d.addCallback(lambda r: self.assertEquals(r,20))
158
159 t3 = task.MapTask(lambda x: x,(),{'x':20})
160 d.addCallback(lambda _: self.tc.run(t3))
161 d.addCallback(self.tc.get_task_result, block=True)
162 d.addCallback(lambda r: self.assertEquals(r,20))
163 return d
164
165 def test_map_task_failure(self):
166 self.addEngine(1)
167 t1 = task.MapTask(lambda x: 1/0,(10,))
168 d = self.tc.run(t1)
169 d.addCallback(self.tc.get_task_result, block=True)
170 d.addErrback(lambda f: self.assertRaises(ZeroDivisionError, f.raiseException))
171 return d
172
173 def test_map_task_args(self):
174 self.assertRaises(TypeError, task.MapTask, 'asdfasdf')
175 self.assertRaises(TypeError, task.MapTask, lambda x: x, 10)
176 self.assertRaises(TypeError, task.MapTask, lambda x: x, (10,),30)
177
178 def test_clear(self):
179 self.addEngine(1)
180 t1 = task.MapTask(lambda x: 2*x,(10,))
181 d = self.tc.run(t1)
182 d.addCallback(lambda _: self.tc.get_task_result(0, block=True))
183 d.addCallback(lambda r: self.assertEquals(r,20))
184 d.addCallback(lambda _: self.tc.clear())
185 d.addCallback(lambda _: self.tc.get_task_result(0, block=True))
186 d.addErrback(lambda f: self.assertRaises(IndexError, f.raiseException))
187 return d
@@ -38,7 +38,7 b' try:'
38 38 IEngineQueuedTestCase
39 39 except ImportError:
40 40 print "we got an error!!!"
41 pass
41 raise
42 42 else:
43 43 class EngineFCTest(DeferredTestCase,
44 44 IEngineCoreTestCase,
@@ -26,9 +26,20 b' try:'
26 26 from IPython.kernel.multienginefc import IFCSynchronousMultiEngine
27 27 from IPython.kernel import multiengine as me
28 28 from IPython.kernel.clientconnector import ClientConnector
29 from IPython.kernel.parallelfunction import ParallelFunction
30 from IPython.kernel.error import CompositeError
31 from IPython.kernel.util import printer
29 32 except ImportError:
30 33 pass
31 34 else:
35
36 def _raise_it(f):
37 try:
38 f.raiseException()
39 except CompositeError, e:
40 e.raise_exception()
41
42
32 43 class FullSynchronousMultiEngineTestCase(DeferredTestCase, IFullSynchronousMultiEngineTestCase):
33 44
34 45 def setUp(self):
@@ -68,3 +79,66 b' else:'
68 79 d.addBoth(lambda _: self.controller.stopService())
69 80 dlist.append(d)
70 81 return defer.DeferredList(dlist)
82
83 def test_mapper(self):
84 self.addEngine(4)
85 m = self.multiengine.mapper()
86 self.assertEquals(m.multiengine,self.multiengine)
87 self.assertEquals(m.dist,'b')
88 self.assertEquals(m.targets,'all')
89 self.assertEquals(m.block,True)
90
91 def test_map_default(self):
92 self.addEngine(4)
93 m = self.multiengine.mapper()
94 d = m.map(lambda x: 2*x, range(10))
95 d.addCallback(lambda r: self.assertEquals(r,[2*x for x in range(10)]))
96 d.addCallback(lambda _: self.multiengine.map(lambda x: 2*x, range(10)))
97 d.addCallback(lambda r: self.assertEquals(r,[2*x for x in range(10)]))
98 return d
99
100 def test_map_noblock(self):
101 self.addEngine(4)
102 m = self.multiengine.mapper(block=False)
103 d = m.map(lambda x: 2*x, range(10))
104 d.addCallback(lambda did: self.multiengine.get_pending_deferred(did, True))
105 d.addCallback(lambda r: self.assertEquals(r,[2*x for x in range(10)]))
106 return d
107
108 def test_mapper_fail(self):
109 self.addEngine(4)
110 m = self.multiengine.mapper()
111 d = m.map(lambda x: 1/0, range(10))
112 d.addBoth(lambda f: self.assertRaises(ZeroDivisionError, _raise_it, f))
113 return d
114
115 def test_parallel(self):
116 self.addEngine(4)
117 p = self.multiengine.parallel()
118 self.assert_(isinstance(p, ParallelFunction))
119 @p
120 def f(x): return 2*x
121 d = f(range(10))
122 d.addCallback(lambda r: self.assertEquals(r,[2*x for x in range(10)]))
123 return d
124
125 def test_parallel_noblock(self):
126 self.addEngine(1)
127 p = self.multiengine.parallel(block=False)
128 self.assert_(isinstance(p, ParallelFunction))
129 @p
130 def f(x): return 2*x
131 d = f(range(10))
132 d.addCallback(lambda did: self.multiengine.get_pending_deferred(did, True))
133 d.addCallback(lambda r: self.assertEquals(r,[2*x for x in range(10)]))
134 return d
135
136 def test_parallel_fail(self):
137 self.addEngine(4)
138 p = self.multiengine.parallel()
139 self.assert_(isinstance(p, ParallelFunction))
140 @p
141 def f(x): return 1/0
142 d = f(range(10))
143 d.addBoth(lambda f: self.assertRaises(ZeroDivisionError, _raise_it, f))
144 return d No newline at end of file
@@ -20,8 +20,6 b' try:'
20 20 from twisted.internet import defer
21 21 from twisted.python import failure
22 22
23 from IPython.testing import tcommon
24 #from IPython.testing.tcommon import *
25 23 from IPython.testing.util import DeferredTestCase
26 24 import IPython.kernel.pendingdeferred as pd
27 25 from IPython.kernel import error
@@ -29,6 +27,11 b' try:'
29 27 except ImportError:
30 28 pass
31 29 else:
30
31 class Foo(object):
32
33 def bar(self, bahz):
34 return defer.succeed('blahblah: %s' % bahz)
32 35
33 36 class TwoPhaseFoo(pd.PendingDeferredManager):
34 37
@@ -181,6 +184,3 b' else:'
181 184 d3 = self.pdm.get_pending_deferred(did,False)
182 185 d3.addCallback(lambda r: self.assertEquals(r,'bar'))
183 186
184
185 # Global object expected by Twisted's trial
186 testSuite = lambda : makeTestSuite(__name__,dt_files,dt_modules)
@@ -30,6 +30,8 b' try:'
30 30 from IPython.kernel.util import printer
31 31 from IPython.kernel.tests.tasktest import ITaskControllerTestCase
32 32 from IPython.kernel.clientconnector import ClientConnector
33 from IPython.kernel.error import CompositeError
34 from IPython.kernel.parallelfunction import ParallelFunction
33 35 except ImportError:
34 36 pass
35 37 else:
@@ -38,6 +40,12 b' else:'
38 40 # Tests
39 41 #-------------------------------------------------------------------------------
40 42
43 def _raise_it(f):
44 try:
45 f.raiseException()
46 except CompositeError, e:
47 e.raise_exception()
48
41 49 class TaskTest(DeferredTestCase, ITaskControllerTestCase):
42 50
43 51 def setUp(self):
@@ -87,4 +95,67 b' else:'
87 95 d.addBoth(lambda _: self.controller.stopService())
88 96 dlist.append(d)
89 97 return defer.DeferredList(dlist)
90
98
99 def test_mapper(self):
100 self.addEngine(1)
101 m = self.tc.mapper()
102 self.assertEquals(m.task_controller,self.tc)
103 self.assertEquals(m.clear_before,False)
104 self.assertEquals(m.clear_after,False)
105 self.assertEquals(m.retries,0)
106 self.assertEquals(m.recovery_task,None)
107 self.assertEquals(m.depend,None)
108 self.assertEquals(m.block,True)
109
110 def test_map_default(self):
111 self.addEngine(1)
112 m = self.tc.mapper()
113 d = m.map(lambda x: 2*x, range(10))
114 d.addCallback(lambda r: self.assertEquals(r,[2*x for x in range(10)]))
115 d.addCallback(lambda _: self.tc.map(lambda x: 2*x, range(10)))
116 d.addCallback(lambda r: self.assertEquals(r,[2*x for x in range(10)]))
117 return d
118
119 def test_map_noblock(self):
120 self.addEngine(1)
121 m = self.tc.mapper(block=False)
122 d = m.map(lambda x: 2*x, range(10))
123 d.addCallback(lambda r: self.assertEquals(r,[x for x in range(10)]))
124 return d
125
126 def test_mapper_fail(self):
127 self.addEngine(1)
128 m = self.tc.mapper()
129 d = m.map(lambda x: 1/0, range(10))
130 d.addBoth(lambda f: self.assertRaises(ZeroDivisionError, _raise_it, f))
131 return d
132
133 def test_parallel(self):
134 self.addEngine(1)
135 p = self.tc.parallel()
136 self.assert_(isinstance(p, ParallelFunction))
137 @p
138 def f(x): return 2*x
139 d = f(range(10))
140 d.addCallback(lambda r: self.assertEquals(r,[2*x for x in range(10)]))
141 return d
142
143 def test_parallel_noblock(self):
144 self.addEngine(1)
145 p = self.tc.parallel(block=False)
146 self.assert_(isinstance(p, ParallelFunction))
147 @p
148 def f(x): return 2*x
149 d = f(range(10))
150 d.addCallback(lambda r: self.assertEquals(r,[x for x in range(10)]))
151 return d
152
153 def test_parallel_fail(self):
154 self.addEngine(1)
155 p = self.tc.parallel()
156 self.assert_(isinstance(p, ParallelFunction))
157 @p
158 def f(x): return 1/0
159 d = f(range(10))
160 d.addBoth(lambda f: self.assertRaises(ZeroDivisionError, _raise_it, f))
161 return d No newline at end of file
@@ -53,7 +53,7 b' class DistributedSpider(object):'
53 53 self.allLinks.append(url)
54 54 if url.startswith(self.site):
55 55 print ' ', url
56 self.linksWorking[url] = self.tc.run(client.Task('links = fetchAndParse(url)', pull=['links'], push={'url': url}))
56 self.linksWorking[url] = self.tc.run(client.StringTask('links = fetchAndParse(url)', pull=['links'], push={'url': url}))
57 57
58 58 def onVisitDone(self, result, url):
59 59 print url, ':'
@@ -8,7 +8,7 b' tc = client.TaskClient()'
8 8 mec = client.MultiEngineClient()
9 9
10 10 mec.execute('import time')
11 hello_taskid = tc.run(client.Task('time.sleep(3) ; word = "Hello,"', pull=('word')))
12 world_taskid = tc.run(client.Task('time.sleep(3) ; word = "World!"', pull=('word')))
11 hello_taskid = tc.run(client.StringTask('time.sleep(3) ; word = "Hello,"', pull=('word')))
12 world_taskid = tc.run(client.StringTask('time.sleep(3) ; word = "World!"', pull=('word')))
13 13 print "Submitted tasks:", hello_taskid, world_taskid
14 14 print tc.get_task_result(hello_taskid,block=True).ns.word, tc.get_task_result(world_taskid,block=True).ns.word
@@ -31,7 +31,7 b' sigma_vals = N.linspace(0.0, 0.2,5)'
31 31 taskids = []
32 32 for K in K_vals:
33 33 for sigma in sigma_vals:
34 t = client.Task(task_string,
34 t = client.StringTask(task_string,
35 35 push=dict(sigma=sigma,K=K),
36 36 pull=('vp','ap','vc','ac','sigma','K'))
37 37 taskids.append(tc.run(t))
@@ -11,8 +11,8 b' b = 10*d'
11 11 c = a*b*d
12 12 """
13 13
14 t1 = client.Task(cmd1, clear_before=False, clear_after=True, pull=['a','b','c'])
14 t1 = client.StringTask(cmd1, clear_before=False, clear_after=True, pull=['a','b','c'])
15 15 tid1 = tc.run(t1)
16 16 tr1 = tc.get_task_result(tid1,block=True)
17 tr1.raiseException()
17 tr1.raise_exception()
18 18 print "a, b: ", tr1.ns.a, tr1.ns.b No newline at end of file
@@ -10,7 +10,7 b' mec = client.MultiEngineClient()'
10 10 mec.execute('import time')
11 11
12 12 for i in range(24):
13 tc.irun('time.sleep(1)')
13 tc.run(client.StringTask('time.sleep(1)'))
14 14
15 15 for i in range(6):
16 16 time.sleep(1.0)
@@ -18,7 +18,7 b' for i in range(6):'
18 18 print tc.queue_status()
19 19
20 20 for i in range(24):
21 tc.irun('time.sleep(1)')
21 tc.run(client.StringTask('time.sleep(1)'))
22 22
23 23 for i in range(6):
24 24 time.sleep(1.0)
@@ -26,7 +26,7 b' for i in range(6):'
26 26 print tc.queue_status(True)
27 27
28 28 for i in range(12):
29 tc.irun('time.sleep(2)')
29 tc.run(client.StringTask('time.sleep(2)'))
30 30
31 31 print "Queue status (vebose=True)"
32 32 print tc.queue_status(True)
@@ -55,7 +55,7 b' def main():'
55 55
56 56 # the jobs should take a random time within a range
57 57 times = [random.random()*(opts.tmax-opts.tmin)+opts.tmin for i in range(opts.n)]
58 tasks = [client.Task("time.sleep(%f)"%t) for t in times]
58 tasks = [client.StringTask("time.sleep(%f)"%t) for t in times]
59 59 stime = sum(times)
60 60
61 61 print "executing %i tasks, totalling %.1f secs on %i engines"%(opts.n, stime, nengines)
@@ -12,6 +12,22 b' Release 0.9'
12 12 New features
13 13 ------------
14 14
15 * The notion of a task has been completely reworked. An `ITask` interface has
16 been created. This interface defines the methods that tasks need to implement.
17 These methods are now responsible for things like submitting tasks and processing
18 results. There are two basic task types: :class:`IPython.kernel.task.StringTask`
19 (this is the old `Task` object, but renamed) and the new
20 :class:`IPython.kernel.task.MapTask`, which is based on a function.
21 * A new interface, :class:`IPython.kernel.mapper.IMapper` has been defined to
22 standardize the idea of a `map` method. This interface has a single
23 `map` method that has the same syntax as the built-in `map`. We have also defined
24 a `mapper` factory interface that creates objects that implement
25 :class:`IPython.kernel.mapper.IMapper` for different controllers. Both
 26 the multiengine and task controller now have mapping capabilities.
 27 * The parallel function capabilities have been reworked. The major changes are that
28 i) there is now an `@parallel` magic that creates parallel functions, ii)
 29 the syntax for multiple variables follows that of `map`, iii) both the
30 multiengine and task controller now have a parallel function implementation.
15 31 * All of the parallel computing capabilities from `ipython1-dev` have been merged into
16 32 IPython proper. This resulted in the following new subpackages:
17 33 :mod:`IPython.kernel`, :mod:`IPython.kernel.core`, :mod:`IPython.config`,
@@ -38,11 +54,11 b' New features'
38 54 when ipcluster is able to start things on other hosts, we will put security
39 55 back.
40 56
41
42
43 57 Bug fixes
44 58 ---------
45 59
 60 * The color escapes in the multiengine client are now turned off on win32 as they
61 don't print correctly.
46 62 * The :mod:`IPython.kernel.scripts.ipengine` script was exec'ing mpi_import_statement
47 63 incorrectly, which was leading the engine to crash when mpi was enabled.
 48 64 * A few subpackages had missing `__init__.py` files.
@@ -52,6 +68,12 b' Bug fixes'
52 68 Backwards incompatible changes
53 69 ------------------------------
54 70
71 * :class:`IPython.kernel.client.Task` has been renamed
72 :class:`IPython.kernel.client.StringTask` to make way for new task types.
73 * The keyword argument `style` has been renamed `dist` in `scatter`, `gather`
74 and `map`.
 75 * Renamed the values that the renamed `dist` keyword argument can have from
76 `'basic'` to `'b'`.
55 77 * IPython has a larger set of dependencies if you want all of its capabilities.
56 78 See the `setup.py` script for details.
57 79 * The constructors for :class:`IPython.kernel.client.MultiEngineClient` and
@@ -1,3 +1,5 b''
1 .. _install_index:
2
1 3 ==================
2 4 Installation
3 5 ==================
@@ -4,18 +4,6 b''
4 4 Introduction
5 5 ============
6 6
7 This is the official documentation for IPython 0.x series (i.e. what
8 we are used to refer to just as "IPython"). The original text of the
9 manual (most of which is still in place) has been authored by Fernando
10 Perez, but as recommended usage patterns and new features have
11 emerged, this manual has been updated to reflect that fact. Most of
12 the additions have been authored by Ville M. Vainio.
13
14 The manual has been generated from reStructuredText source markup with
15 Sphinx, which should make it much easier to keep it up-to-date in the
16 future. Some reST artifacts and bugs may still be apparent in the
17 documentation, but this should improve as the toolchain matures.
18
19 7 Overview
20 8 ========
21 9
@@ -25,8 +13,19 b' creating test files as is typical in most programming languages.'
25 13 However, the interpreter supplied with the standard Python distribution
26 14 is somewhat limited for extended interactive use.
27 15
28 IPython is a free software project (released under the BSD license)
29 which tries to:
16 The goal of IPython is to create a comprehensive environment for
 17 interactive and exploratory computing. To support this goal, IPython
18 has two main components:
19
20 * An enhanced interactive Python shell.
21 * An architecture for interactive parallel computing.
22
23 All of IPython is open source (released under the revised BSD license).
24
25 Enhanced interactive Python shell
26 =================================
27
28 IPython's interactive shell (`ipython`), has the following goals:
30 29
31 30 1. Provide an interactive shell superior to Python's default. IPython
32 31 has many features for object introspection, system shell access,
@@ -50,140 +49,126 b' which tries to:'
50 49 WX applications via special threading flags. The normal Python
51 50 shell can only do this for Tkinter applications.
52 51
53
54 Main features
55 -------------
56
57 * Dynamic object introspection. One can access docstrings, function
58 definition prototypes, source code, source files and other details
59 of any object accessible to the interpreter with a single
60 keystroke ('?', and using '??' provides additional detail).
61 * Searching through modules and namespaces with '*' wildcards, both
62 when using the '?' system and via the %psearch command.
63 * Completion in the local namespace, by typing TAB at the prompt.
64 This works for keywords, modules, methods, variables and files in the
65 current directory. This is supported via the readline library, and
66 full access to configuring readline's behavior is provided.
67 Custom completers can be implemented easily for different purposes
68 (system commands, magic arguments etc.)
69 * Numbered input/output prompts with command history (persistent
70 across sessions and tied to each profile), full searching in this
71 history and caching of all input and output.
72 * User-extensible 'magic' commands. A set of commands prefixed with
73 % is available for controlling IPython itself and provides
74 directory control, namespace information and many aliases to
75 common system shell commands.
76 * Alias facility for defining your own system aliases.
77 * Complete system shell access. Lines starting with ! are passed
78 directly to the system shell, and using !! or var = !cmd
79 captures shell output into python variables for further use.
80 * Background execution of Python commands in a separate thread.
81 IPython has an internal job manager called jobs, and a
82 conveninence backgrounding magic function called %bg.
83 * The ability to expand python variables when calling the system
84 shell. In a shell command, any python variable prefixed with $ is
85 expanded. A double $$ allows passing a literal $ to the shell (for
86 access to shell and environment variables like $PATH).
87 * Filesystem navigation, via a magic %cd command, along with a
88 persistent bookmark system (using %bookmark) for fast access to
89 frequently visited directories.
90 * A lightweight persistence framework via the %store command, which
91 allows you to save arbitrary Python variables. These get restored
92 automatically when your session restarts.
93 * Automatic indentation (optional) of code as you type (through the
94 readline library).
95 * Macro system for quickly re-executing multiple lines of previous
96 input with a single name. Macros can be stored persistently via
97 %store and edited via %edit.
98 * Session logging (you can then later use these logs as code in your
99 programs). Logs can optionally timestamp all input, and also store
100 session output (marked as comments, so the log remains valid
101 Python source code).
102 * Session restoring: logs can be replayed to restore a previous
103 session to the state where you left it.
104 * Verbose and colored exception traceback printouts. Easier to parse
105 visually, and in verbose mode they produce a lot of useful
106 debugging information (basically a terminal version of the cgitb
107 module).
108 * Auto-parentheses: callable objects can be executed without
109 parentheses: 'sin 3' is automatically converted to 'sin(3)'.
110 * Auto-quoting: using ',' or ';' as the first character forces
111 auto-quoting of the rest of the line: ',my_function a b' becomes
112 automatically 'my_function("a","b")', while ';my_function a b'
113 becomes 'my_function("a b")'.
114 * Extensible input syntax. You can define filters that pre-process
115 user input to simplify input in special situations. This allows
116 for example pasting multi-line code fragments which start with
117 '>>>' or '...' such as those from other python sessions or the
118 standard Python documentation.
119 * Flexible configuration system. It uses a configuration file which
120 allows permanent setting of all command-line options, module
121 loading, code and file execution. The system allows recursive file
122 inclusion, so you can have a base file with defaults and layers
123 which load other customizations for particular projects.
124 * Embeddable. You can call IPython as a python shell inside your own
125 python programs. This can be used both for debugging code or for
126 providing interactive abilities to your programs with knowledge
127 about the local namespaces (very useful in debugging and data
128 analysis situations).
129 * Easy debugger access. You can set IPython to call up an enhanced
130 version of the Python debugger (pdb) every time there is an
131 uncaught exception. This drops you inside the code which triggered
132 the exception with all the data live and it is possible to
133 navigate the stack to rapidly isolate the source of a bug. The
134 %run magic command -with the -d option- can run any script under
135 pdb's control, automatically setting initial breakpoints for you.
136 This version of pdb has IPython-specific improvements, including
137 tab-completion and traceback coloring support. For even easier
138 debugger access, try %debug after seeing an exception. winpdb is
139 also supported, see ipy_winpdb extension.
140 * Profiler support. You can run single statements (similar to
141 profile.run()) or complete programs under the profiler's control.
142 While this is possible with standard cProfile or profile modules,
143 IPython wraps this functionality with magic commands (see '%prun'
144 and '%run -p') convenient for rapid interactive work.
145 * Doctest support. The special %doctest_mode command toggles a mode
146 that allows you to paste existing doctests (with leading '>>>'
147 prompts and whitespace) and uses doctest-compatible prompts and
148 output, so you can use IPython sessions as doctest code.
149
52 Main features of the interactive shell
53 --------------------------------------
54
55 * Dynamic object introspection. One can access docstrings, function
56 definition prototypes, source code, source files and other details
57 of any object accessible to the interpreter with a single
58 keystroke (:samp:`?`, and using :samp:`??` provides additional detail).
59 * Searching through modules and namespaces with :samp:`*` wildcards, both
60 when using the :samp:`?` system and via the :samp:`%psearch` command.
61 * Completion in the local namespace, by typing :kbd:`TAB` at the prompt.
62 This works for keywords, modules, methods, variables and files in the
63 current directory. This is supported via the readline library, and
64 full access to configuring readline's behavior is provided.
65 Custom completers can be implemented easily for different purposes
66 (system commands, magic arguments etc.)
67 * Numbered input/output prompts with command history (persistent
68 across sessions and tied to each profile), full searching in this
69 history and caching of all input and output.
70 * User-extensible 'magic' commands. A set of commands prefixed with
71 :samp:`%` is available for controlling IPython itself and provides
72 directory control, namespace information and many aliases to
73 common system shell commands.
74 * Alias facility for defining your own system aliases.
75 * Complete system shell access. Lines starting with :samp:`!` are passed
76 directly to the system shell, and using :samp:`!!` or :samp:`var = !cmd`
77 captures shell output into python variables for further use.
78 * Background execution of Python commands in a separate thread.
79 IPython has an internal job manager called jobs, and a
80 conveninence backgrounding magic function called :samp:`%bg`.
81 * The ability to expand python variables when calling the system
82 shell. In a shell command, any python variable prefixed with :samp:`$` is
83 expanded. A double :samp:`$$` allows passing a literal :samp:`$` to the shell (for
84 access to shell and environment variables like :envvar:`PATH`).
85 * Filesystem navigation, via a magic :samp:`%cd` command, along with a
86 persistent bookmark system (using :samp:`%bookmark`) for fast access to
87 frequently visited directories.
88 * A lightweight persistence framework via the :samp:`%store` command, which
89 allows you to save arbitrary Python variables. These get restored
90 automatically when your session restarts.
91 * Automatic indentation (optional) of code as you type (through the
92 readline library).
93 * Macro system for quickly re-executing multiple lines of previous
94 input with a single name. Macros can be stored persistently via
95 :samp:`%store` and edited via :samp:`%edit`.
96 * Session logging (you can then later use these logs as code in your
97 programs). Logs can optionally timestamp all input, and also store
98 session output (marked as comments, so the log remains valid
99 Python source code).
100 * Session restoring: logs can be replayed to restore a previous
101 session to the state where you left it.
102 * Verbose and colored exception traceback printouts. Easier to parse
103 visually, and in verbose mode they produce a lot of useful
104 debugging information (basically a terminal version of the cgitb
105 module).
106 * Auto-parentheses: callable objects can be executed without
107 parentheses: :samp:`sin 3` is automatically converted to :samp:`sin(3)`.
108 * Auto-quoting: using :samp:`,`, or :samp:`;` as the first character forces
109 auto-quoting of the rest of the line: :samp:`,my_function a b` becomes
110 automatically :samp:`my_function("a","b")`, while :samp:`;my_function a b`
111 becomes :samp:`my_function("a b")`.
112 * Extensible input syntax. You can define filters that pre-process
113 user input to simplify input in special situations. This allows
114 for example pasting multi-line code fragments which start with
115 :samp:`>>>` or :samp:`...` such as those from other python sessions or the
116 standard Python documentation.
117 * Flexible configuration system. It uses a configuration file which
118 allows permanent setting of all command-line options, module
119 loading, code and file execution. The system allows recursive file
120 inclusion, so you can have a base file with defaults and layers
121 which load other customizations for particular projects.
122 * Embeddable. You can call IPython as a python shell inside your own
123 python programs. This can be used both for debugging code or for
124 providing interactive abilities to your programs with knowledge
125 about the local namespaces (very useful in debugging and data
126 analysis situations).
127 * Easy debugger access. You can set IPython to call up an enhanced
128 version of the Python debugger (pdb) every time there is an
129 uncaught exception. This drops you inside the code which triggered
130 the exception with all the data live and it is possible to
131 navigate the stack to rapidly isolate the source of a bug. The
132 :samp:`%run` magic command (with the :samp:`-d` option) can run any script under
133 pdb's control, automatically setting initial breakpoints for you.
134 This version of pdb has IPython-specific improvements, including
135 tab-completion and traceback coloring support. For even easier
136 debugger access, try :samp:`%debug` after seeing an exception. winpdb is
137 also supported, see ipy_winpdb extension.
138 * Profiler support. You can run single statements (similar to
139 :samp:`profile.run()`) or complete programs under the profiler's control.
140 While this is possible with standard cProfile or profile modules,
141 IPython wraps this functionality with magic commands (see :samp:`%prun`
142 and :samp:`%run -p`) convenient for rapid interactive work.
143 * Doctest support. The special :samp:`%doctest_mode` command toggles a mode
144 that allows you to paste existing doctests (with leading :samp:`>>>`
145 prompts and whitespace) and uses doctest-compatible prompts and
146 output, so you can use IPython sessions as doctest code.
147
148 Interactive parallel computing
149 ==============================
150
151 Increasingly, parallel computer hardware, such as multicore CPUs, clusters and supercomputers, is becoming ubiquitous. Over the last 3 years, we have developed an
152 architecture within IPython that allows such hardware to be used quickly and easily
153 from Python. Moreover, this architecture is designed to support interactive and
154 collaborative parallel computing.
155
156 For more information, see our :ref:`overview <parallel_index>` of using IPython for
157 parallel computing.
150 158
151 159 Portability and Python requirements
152 160 -----------------------------------
153 161
154 Python requirements: IPython requires with Python version 2.3 or newer.
155 If you are still using Python 2.2 and can not upgrade, the last version
156 of IPython which worked with Python 2.2 was 0.6.15, so you will have to
157 use that.
158
159 IPython is developed under Linux, but it should work in any reasonable
160 Unix-type system (tested OK under Solaris and the BSD family, for which
161 a port exists thanks to Dryice Liu).
162
163 Mac OS X: it works, apparently without any problems (thanks to Jim Boyle
164 at Lawrence Livermore for the information). Thanks to Andrea Riciputi,
165 Fink support is available.
166
167 CygWin: it works mostly OK, though some users have reported problems
168 with prompt coloring. No satisfactory solution to this has been found so
169 far, you may want to disable colors permanently in the ipythonrc
170 configuration file if you experience problems. If you have proper color
171 support under cygwin, please post to the IPython mailing list so this
172 issue can be resolved for all users.
173
174 Windows: it works well under Windows Vista/XP/2k, and I suspect NT should
175 behave similarly. Section "Installation under windows" describes
176 installation details for Windows, including some additional tools needed
177 on this platform.
178
179 Windows 9x support is present, and has been reported to work fine (at
180 least on WinME).
181
182 Location
183 --------
184
185 IPython is generously hosted at http://ipython.scipy.org by the
186 Enthought, Inc and the SciPy project. This site offers downloads,
187 subversion access, mailing lists and a bug tracking system. I am very
188 grateful to Enthought (http://www.enthought.com) and all of the SciPy
189 team for their contribution. No newline at end of file
162 As of the 0.9 release, IPython requires Python 2.4 or greater. We have
163 not begun to test IPython on Python 2.6 or 3.0, but we expect it will
164 work with some minor changes.
165
166 IPython is known to work on the following operating systems:
167
168 * Linux
169 * AIX
170 * Most other Unix-like OSs (Solaris, BSD, etc.)
171 * Mac OS X
172 * Windows (CygWin, XP, Vista, etc.)
173
174 See :ref:`here <install_index>` for instructions on how to install IPython. No newline at end of file
@@ -1,3 +1,5 b''
1 .. _parallel_index:
2
1 3 ====================================
2 4 Using IPython for Parallel computing
3 5 ====================================
1 NO CONTENT: file was removed
General Comments 0
You need to be logged in to leave comments. Login now