upstream/ipython Commit - r10605:9f313b4a

Merge pull request from minrk/mapgenerator...

Brian E. Granger -

r10605:9f313b4a

parent child

IPython/parallel/client/map.py

0 +13 -16

             class Map(object):
                 """A class for partitioning a sequence using a map."""
-                def getPartition(self, seq, p, q):
+                def getPartition(self, seq, p, q, n=None):
-                    """Returns the pth partition of q partitions of seq."""
+                    """Returns the pth partition of q partitions of seq.
+                    The length can be specified as `n`,
+                    otherwise it is the value of `len(seq)`
+                    """
+                    n = len(seq) if n is None else n
                     # Test for error conditions here
                     if p<0 or p>=q:
-                      print "No partition exists."
+                      raise ValueError("must have 0 <= p <= q, but have p=%s,q=%s" % (p, q))
-                      return
-                    N = len(seq)
+                    remainder = n % q
-                    remainder = N % q
+                    basesize = n // q
-                    basesize = N // q
                     if p < remainder:
                         low = p * (basesize + 1)
                     return listOfPartitions
             class RoundRobinMap(Map):
-                """Partitions a sequence in a roun robin fashion.
+                """Partitions a sequence in a round robin fashion.
                 This currently does not work!
                 """
-                def getPartition(self, seq, p, q):
+                def getPartition(self, seq, p, q, n=None):
-                    # if not isinstance(seq,(list,tuple)):
+                    n = len(seq) if n is None else n
-                    #     raise NotImplementedError("cannot RR partition type %s"%type(seq))
+                    return seq[p:n:q]
-                    return seq[p:len(seq):q]
-                    #result = []
-                    #for i in range(p,len(seq),q):
-                    #    result.append(seq[i])
-                    #return result
                 def joinPartitions(self, listOfPartitions):
                     testObject = listOfPartitions[0]

IPython/parallel/client/remotefunction.py

0 +46 -28

                 chunksize : int or None
                     The size of chunk to use when breaking up sequences in a load-balanced manner
                 ordered : bool [default: True]
-                    Whether
+                    Whether the result should be kept in order. If False,
+                    results become available as they arrive, regardless of submission order.
                 **flags : remaining kwargs are passed to View.temp_flags
                 """
-                chunksize=None
+                chunksize = None
-                ordered=None
+                ordered = None
-                mapObject=None
+                mapObject = None
+                _mapping = False
                 def __init__(self, view, f, dist='b', block=None, chunksize=None, ordered=True, **flags):
                     super(ParallelFunction, self).__init__(view, f, block=block, **flags)
                     mapClass = Map.dists[dist]
                     self.mapObject = mapClass()
                 @sync_view_results
                 def __call__(self, *sequences):
                     client = self.view.client
+                    lens = []
+                    maxlen = minlen = -1
+                    for i, seq in enumerate(sequences):
+                        try:
+                            n = len(seq)
+                        except Exception:
+                            seq = list(seq)
+                            if isinstance(sequences, tuple):
+                                # can't alter a tuple
+                                sequences = list(sequences)
+                            sequences[i] = seq
+                            n = len(seq)
+                        if n > maxlen:
+                            maxlen = n
+                        if minlen == -1 or n < minlen:
+                            minlen = n
+                        lens.append(n)
                     # check that the length of sequences match
-                    len_0 = len(sequences[0])
+                    if not self._mapping and minlen != maxlen:
-                    for s in sequences:
+                        msg = 'all sequences must have equal length, but have %s' % lens
-                        if len(s)!=len_0:
+                        raise ValueError(msg)
-                            msg = 'all sequences must have equal length, but %i!=%i'%(len_0,len(s))
-                            raise ValueError(msg)
                     balanced = 'Balanced' in self.view.__class__.__name__
                     if balanced:
                         if self.chunksize:
-                            nparts = len_0//self.chunksize + int(len_0%self.chunksize > 0)
+                            nparts = maxlen // self.chunksize + int(maxlen % self.chunksize > 0)
                         else:
-                            nparts = len_0
+                            nparts = maxlen
                         targets = [None]*nparts
                     else:
                         if self.chunksize:
                     for index, t in enumerate(targets):
                         args = []
                         for seq in sequences:
-                            part = self.mapObject.getPartition(seq, index, nparts)
+                            part = self.mapObject.getPartition(seq, index, nparts, maxlen)
-                            if len(part) == 0:
+                            args.append(part)
-                                continue
+                        if not any(args):
-                            else:
-                                args.append(part)
-                        if not args:
                             continue
-                        # print (args)
+                        if self._mapping:
-                        if hasattr(self, '_map'):
                             if sys.version_info[0] >= 3:
                                 f = lambda f, *sequences: list(map(f, *sequences))
                             else:
                                 f = map
-                            args = [self.func]+args
+                            args = [self.func] + args
                         else:
                             f=self.func
                         with view.temp_flags(block=False, **self.flags):
                             ar = view.apply(f, *args)
-                        msg_ids.append(ar.msg_ids[0])
+                        msg_ids.extend(ar.msg_ids)
                     r = AsyncMapResult(self.view.client, msg_ids, self.mapObject,
                                         fname=getname(self.func),
                                         ordered=self.ordered
                                     )
                         return r
                 def map(self, *sequences):
-                    """call a function on each element of a sequence remotely.
+                    """call a function on each element of one or more sequence(s) remotely.
                     This should behave very much like the builtin map, but return an AsyncMapResult
                     if self.block is False.
+                    That means it can take generators (will be cast to lists locally),
+                    and mismatched sequence lengths will be padded with None.
                     """
-                    # set _map as a flag for use inside self.__call__
+                    # set _mapping as a flag for use inside self.__call__
-                    self._map = True
+                    self._mapping = True
                     try:
-                        ret = self.__call__(*sequences)
+                        ret = self(*sequences)
                     finally:
-                        del self._map
+                        self._mapping = False
                     return ret
             __all__ = ['remote', 'parallel', 'RemoteFunction', 'ParallelFunction']

IPython/parallel/tests/test_lbview.py

0 +34 0

@@ -58,6 +58,40 b' class TestLoadBalancedView(ClusterTestCase):'
58	data = range(16)	58	data = range(16)
59	r = self.view.map_sync(f, data)	59	r = self.view.map_sync(f, data)
60	self.assertEqual(r, map(f, data))	60	self.assertEqual(r, map(f, data))
		61
		62	def test_map_generator(self):
		63	def f(x):
		64	return x**2
		65
		66	data = range(16)
		67	r = self.view.map_sync(f, iter(data))
		68	self.assertEqual(r, map(f, iter(data)))
		69
		70	def test_map_short_first(self):
		71	def f(x,y):
		72	if y is None:
		73	return y
		74	if x is None:
		75	return x
		76	return x*y
		77	data = range(10)
		78	data2 = range(4)
		79
		80	r = self.view.map_sync(f, data, data2)
		81	self.assertEqual(r, map(f, data, data2))
		82
		83	def test_map_short_last(self):
		84	def f(x,y):
		85	if y is None:
		86	return y
		87	if x is None:
		88	return x
		89	return x*y
		90	data = range(4)
		91	data2 = range(10)
		92
		93	r = self.view.map_sync(f, data, data2)
		94	self.assertEqual(r, map(f, data, data2))
61		95
62	def test_map_unordered(self):	96	def test_map_unordered(self):
63	def f(x):	97	def f(x):

General Comments 0

Write
Preview

You need to be logged in to leave comments. Login now

No TODOs yet

	Site-wide shortcuts
/	Use quick search box
g h	Go to home page
g g	Go to my private gists page
g G	Go to my public gists page
g 0-9	Go to bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Go to summary page
g c	Go to changelog page
g f	Go to files page
g F	Go to files page with file search activated
g p	Go to pull requests page
g o	Go to repository settings
g O	Go to repository access permissions settings
t s	Toggle sidebar on some pages