add unordered iteration to AsyncMapResults...
MinRK
@@ -261,12 +261,19 @@ class AsyncMapResult(AsyncResult):
     """Class for representing results of non-blocking gathers.
 
     This will properly reconstruct the gather.
+
+    This class is iterable at any time, and will wait on results as they come.
+
+    If ordered=False, then the first results to arrive will come first, otherwise
+    results will be yielded in the order they were submitted.
+
     """
 
-    def __init__(self, client, msg_ids, mapObject, fname=''):
+    def __init__(self, client, msg_ids, mapObject, fname='', ordered=True):
         AsyncResult.__init__(self, client, msg_ids, fname=fname)
         self._mapObject = mapObject
         self._single_result = False
+        self.ordered = ordered
 
     def _reconstruct_result(self, res):
         """Perform the gather on the actual results."""
@@ -274,6 +281,13 @@ class AsyncMapResult(AsyncResult):
 
     # asynchronous iterator:
     def __iter__(self):
+        it = self._ordered_iter if self.ordered else self._unordered_iter
+        for r in it():
+            yield r
+
+    # asynchronous ordered iterator:
+    def _ordered_iter(self):
+        """iterator for results *as they arrive*, preserving submission order."""
         try:
             rlist = self.get(0)
         except error.TimeoutError:
@@ -294,6 +308,42 @@ class AsyncMapResult(AsyncResult):
             for r in rlist:
                 yield r
 
+    # asynchronous unordered iterator:
+    def _unordered_iter(self):
+        """iterator for results *as they arrive*, on FCFS basis, ignoring submission order."""
+        try:
+            rlist = self.get(0)
+        except error.TimeoutError:
+            pending = set(self.msg_ids)
+            while pending:
+                try:
+                    self._client.wait(pending, 1e-3)
+                except error.TimeoutError:
+                    # ignore timeout error, because that only means
+                    # *some* jobs are outstanding
+                    pass
+                # update ready set with those no longer outstanding:
+                ready = pending.difference(self._client.outstanding)
+                # update pending to exclude those that are finished
+                pending = pending.difference(ready)
+                while ready:
+                    msg_id = ready.pop()
+                    ar = AsyncResult(self._client, msg_id, self._fname)
+                    rlist = ar.get()
+                    try:
+                        for r in rlist:
+                            yield r
+                    except TypeError:
+                        # flattened, not a list
+                        # this could get broken by flattened data that returns iterables
+                        # but most calls to map do not expose the `flatten` argument
+                        yield rlist
+        else:
+            # already done
+            for r in rlist:
+                yield r
+
+
 
 class AsyncHubResult(AsyncResult):
     """Class to wrap pending results that must be requested from the Hub.
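
The `_unordered_iter` generator added here is the core of the change: keep a `pending` set of message ids, wait briefly on the client, peel off whatever is no longer outstanding, and yield those results immediately. The same first-come-first-served drain pattern is sketched below with the standard library's concurrent.futures, purely as an illustration of the technique — none of this is IPython.parallel API:

    from concurrent.futures import ThreadPoolExecutor, wait, FIRST_COMPLETED
    import random
    import time

    def work(x):
        time.sleep(random.random() * 0.1)
        return x * x

    def unordered_results(futures):
        """Yield results first-come-first-served, ignoring submission order."""
        pending = set(futures)
        while pending:
            # Block briefly; a timeout only means *some* tasks are still running.
            done, pending = wait(pending, timeout=1e-3, return_when=FIRST_COMPLETED)
            for f in done:
                yield f.result()

    with ThreadPoolExecutor(max_workers=4) as pool:
        futures = [pool.submit(work, x) for x in range(10)]
        for r in unordered_results(futures):
            print(r)   # arrives as tasks finish, not in submission order

The short timeout plays the same role as the 1e-3 passed to Client.wait above: it keeps the loop responsive without busy-spinning.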
@@ -46,7 +46,7 @@ def remote(view, block=None, **flags):
     return remote_function
 
 @skip_doctest
-def parallel(view, dist='b', block=None, **flags):
+def parallel(view, dist='b', block=None, ordered=True, **flags):
     """Turn a function into a parallel remote function.
 
     This method can be used for map:
@@ -57,7 +57,7 @@ def parallel(view, dist='b', block=None, **flags):
     """
 
     def parallel_function(f):
-        return ParallelFunction(view, f, dist=dist, block=block, **flags)
+        return ParallelFunction(view, f, dist=dist, block=block, ordered=ordered, **flags)
     return parallel_function
 
 #--------------------------------------------------------------------------
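
These two hunks thread the flag through the @parallel decorator factory. A hypothetical end-to-end sketch, assuming the usual view.parallel(...) decorator forwards extra keywords to the parallel() factory patched above, and assuming a running cluster:

    from IPython.parallel import Client

    rc = Client()
    view = rc.load_balanced_view()

    @view.parallel(block=False, ordered=False)
    def echo(x):
        return x

    amr = echo.map(range(32))   # ParallelFunction.map -> AsyncMapResult
    for r in amr:
        print(r)                # first-come-first-served, because ordered=False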
@@ -122,15 +122,19 @@ class ParallelFunction(RemoteFunction):
         to use the current `block` attribute of `view`
     chunksize : int or None
         The size of chunk to use when breaking up sequences in a load-balanced manner
+    ordered : bool [default: True]
+        Whether the results should be yielded in submission order, or as they arrive
     **flags : remaining kwargs are passed to View.temp_flags
     """
 
     chunksize=None
+    ordered=None
     mapObject=None
 
-    def __init__(self, view, f, dist='b', block=None, chunksize=None, **flags):
+    def __init__(self, view, f, dist='b', block=None, chunksize=None, ordered=True, **flags):
         super(ParallelFunction, self).__init__(view, f, block=block, **flags)
         self.chunksize = chunksize
+        self.ordered = ordered
 
         mapClass = Map.dists[dist]
         self.mapObject = mapClass()
@@ -186,7 +190,10 @@ class ParallelFunction(RemoteFunction):
 
             msg_ids.append(ar.msg_ids[0])
 
-        r = AsyncMapResult(self.view.client, msg_ids, self.mapObject, fname=self.func.__name__)
+        r = AsyncMapResult(self.view.client, msg_ids, self.mapObject,
+                           fname=self.func.__name__,
+                           ordered=self.ordered
+                           )
 
         if self.block:
             try:
@@ -992,7 +992,7 @@ class LoadBalancedView(View):
     @spin_after
     @save_ids
     def map(self, f, *sequences, **kwargs):
-        """view.map(f, *sequences, block=self.block, chunksize=1) => list|AsyncMapResult
+        """view.map(f, *sequences, block=self.block, chunksize=1, ordered=True) => list|AsyncMapResult
 
         Parallel version of builtin `map`, load-balanced by this View.
 
@@ -1009,14 +1009,20 @@ class LoadBalancedView(View):
             function to be mapped
         *sequences: one or more sequences of matching length
             the sequences to be distributed and passed to `f`
-        block : bool
-            whether to wait for the result or not [default self.block]
+        block : bool [default self.block]
+            whether to wait for the result or not
         track : bool
            whether to create a MessageTracker to allow the user to
            safely edit after arrays and buffers during non-copying
            sends.
-        chunksize : int
-            how many elements should be in each task [default 1]
+        chunksize : int [default 1]
+            how many elements should be in each task.
+        ordered : bool [default True]
+            Whether the results should be gathered as they arrive, or enforce
+            the order of submission.
+
+            Only applies when iterating through AsyncMapResult as results arrive.
+            Has no effect when block=True.
 
         Returns
         -------
@@ -1034,6 +1040,7 @@ class LoadBalancedView(View):
         # default
         block = kwargs.get('block', self.block)
         chunksize = kwargs.get('chunksize', 1)
+        ordered = kwargs.get('ordered', True)
 
         keyset = set(kwargs.keys())
         extra_keys = keyset.difference_update(set(['block', 'chunksize']))
@@ -1042,7 +1049,7 @@ class LoadBalancedView(View):
 
         assert len(sequences) > 0, "must have some sequences to map onto!"
 
-        pf = ParallelFunction(self, f, block=block, chunksize=chunksize)
+        pf = ParallelFunction(self, f, block=block, chunksize=chunksize, ordered=ordered)
         return pf.map(*sequences)
 
 __all__ = ['LoadBalancedView', 'DirectView']
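
Taken together, the view.py hunks let `ordered` be passed straight to LoadBalancedView.map. A short sketch of the two call styles the updated docstring describes (`lbview` is assumed to be a LoadBalancedView backed by a running cluster):

    def double(x):
        return 2 * x

    r = lbview.map(double, range(10), block=True)      # plain list, submission order
    amr = lbview.map(double, range(10), block=False, ordered=False)
    for item in amr:                                   # yielded as chunks finish
        print(item)
    print(amr.get())                                   # get() still reconstructs submission order

As the new docstring says, the flag only affects iteration over the AsyncMapResult; get() and block=True behave as before.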
@@ -58,6 +58,42 @@ class TestLoadBalancedView(ClusterTestCase):
         r = self.view.map_sync(f, data)
         self.assertEquals(r, map(f, data))
 
+    def test_map_unordered(self):
+        def f(x):
+            return x**2
+        def slow_f(x):
+            import time
+            time.sleep(0.05*x)
+            return x**2
+        data = range(16,0,-1)
+        reference = map(f, data)
+
+        amr = self.view.map_async(slow_f, data, ordered=False)
+        self.assertTrue(isinstance(amr, pmod.AsyncMapResult))
+        # check individual elements, retrieved as they come (uses __iter__)
+        astheycame = list(amr)
+        # Ensure that at least one result came out of order:
+        self.assertNotEquals(astheycame, reference, "should not have preserved order")
+        self.assertEquals(sorted(astheycame, reverse=True), reference, "result corrupted")
+
+    def test_map_ordered(self):
+        def f(x):
+            return x**2
+        def slow_f(x):
+            import time
+            time.sleep(0.05*x)
+            return x**2
+        data = range(16,0,-1)
+        reference = map(f, data)
+
+        amr = self.view.map_async(slow_f, data)
+        self.assertTrue(isinstance(amr, pmod.AsyncMapResult))
+        # check individual elements, retrieved as they come (uses __iter__)
+        astheycame = list(amr)
+        # Ensure that results came in order
+        self.assertEquals(astheycame, reference)
+        self.assertEquals(amr.result, reference)
+
     def test_abort(self):
         view = self.view
         ar = self.client[:].apply_async(time.sleep, .5)
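
A note on why the unordered test's assertions should hold: slow_f sleeps for 0.05*x, and the data are submitted in descending order, so the tasks submitted last are the quickest to finish. A back-of-the-envelope check of that reasoning in plain Python (no cluster needed), assuming the sleeps dominate scheduling noise:

    data = range(16, 0, -1)                   # submission order: 16, 15, ..., 1
    reference = [x ** 2 for x in data]        # what the ordered iterator would yield
    arrival = [x ** 2 for x in sorted(data)]  # smallest x sleeps least, finishes first

    assert arrival != reference                         # at least one result out of order
    assert sorted(arrival, reverse=True) == reference   # same values, nothing corrupted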