upstream/ipython Commit - r10605:9f313b4a

Merge pull request from minrk/mapgenerator...

Brian E. Granger -

r10605:9f313b4a

parent child

IPython/parallel/client/map.py

0 +13 -16

              class Map(object):
                  """A class for partitioning a sequence using a map."""
-                 def getPartition(self, seq, p, q):
-                     """Returns the pth partition of q partitions of seq."""
+                 def getPartition(self, seq, p, q, n=None):
+                     """Returns the pth partition of q partitions of seq.
+                     The length can be specified as `n`,
+                     otherwise it is the value of `len(seq)`
+                     """
+                     n = len(seq) if n is None else n
                      # Test for error conditions here
                      if p<0 or p>=q:
-                       print "No partition exists."
-                       return
+                       raise ValueError("must have 0 <= p <= q, but have p=%s,q=%s" % (p, q))
-                     N = len(seq)
-                     remainder = N % q
-                     basesize = N // q
+                     remainder = n % q
+                     basesize = n // q
                      if p < remainder:
                          low = p * (basesize + 1)
                      return listOfPartitions
              class RoundRobinMap(Map):
-                 """Partitions a sequence in a roun robin fashion.
+                 """Partitions a sequence in a round robin fashion.
                  This currently does not work!
                  """
-                 def getPartition(self, seq, p, q):
-                     # if not isinstance(seq,(list,tuple)):
-                     #     raise NotImplementedError("cannot RR partition type %s"%type(seq))
-                     return seq[p:len(seq):q]
-                     #result = []
-                     #for i in range(p,len(seq),q):
-                     #    result.append(seq[i])
-                     #return result
+                 def getPartition(self, seq, p, q, n=None):
+                     n = len(seq) if n is None else n
+                     return seq[p:n:q]
                  def joinPartitions(self, listOfPartitions):
                      testObject = listOfPartitions[0]

IPython/parallel/client/remotefunction.py

0 +38 -20

                  chunksize : int or None
                      The size of chunk to use when breaking up sequences in a load-balanced manner
                  ordered : bool [default: True]
-                     Whether
+                     Whether the result should be kept in order. If False,
+                     results become available as they arrive, regardless of submission order.
                  **flags : remaining kwargs are passed to View.temp_flags
                  """
                  chunksize=None
                  ordered=None
                  mapObject=None
+                 _mapping = False
                  def __init__(self, view, f, dist='b', block=None, chunksize=None, ordered=True, **flags):
                      super(ParallelFunction, self).__init__(view, f, block=block, **flags)
                  def __call__(self, *sequences):
                      client = self.view.client
+                     lens = []
+                     maxlen = minlen = -1
+                     for i, seq in enumerate(sequences):
+                         try:
+                             n = len(seq)
+                         except Exception:
+                             seq = list(seq)
+                             if isinstance(sequences, tuple):
+                                 # can't alter a tuple
+                                 sequences = list(sequences)
+                             sequences[i] = seq
+                             n = len(seq)
+                         if n > maxlen:
+                             maxlen = n
+                         if minlen == -1 or n < minlen:
+                             minlen = n
+                         lens.append(n)
                      # check that the length of sequences match
-                     len_0 = len(sequences[0])
-                     for s in sequences:
-                         if len(s)!=len_0:
-                             msg = 'all sequences must have equal length, but %i!=%i'%(len_0,len(s))
+                     if not self._mapping and minlen != maxlen:
+                         msg = 'all sequences must have equal length, but have %s' % lens
-                             raise ValueError(msg)
                      balanced = 'Balanced' in self.view.__class__.__name__
                      if balanced:
                          if self.chunksize:
-                             nparts = len_0//self.chunksize + int(len_0%self.chunksize > 0)
+                             nparts = maxlen // self.chunksize + int(maxlen % self.chunksize > 0)
                          else:
-                             nparts = len_0
+                             nparts = maxlen
                          targets = [None]*nparts
                      else:
                          if self.chunksize:
                      for index, t in enumerate(targets):
                          args = []
                          for seq in sequences:
-                             part = self.mapObject.getPartition(seq, index, nparts)
-                             if len(part) == 0:
-                                 continue
-                             else:
+                             part = self.mapObject.getPartition(seq, index, nparts, maxlen)
-                                 args.append(part)
-                         if not args:
+                         if not any(args):
                              continue
-                         # print (args)
-                         if hasattr(self, '_map'):
+                         if self._mapping:
                              if sys.version_info[0] >= 3:
                                  f = lambda f, *sequences: list(map(f, *sequences))
                              else:
                          with view.temp_flags(block=False, **self.flags):
                              ar = view.apply(f, *args)
-                         msg_ids.append(ar.msg_ids[0])
+                         msg_ids.extend(ar.msg_ids)
-                     r = AsyncMapResult(self.view.client, msg_ids, self.mapObject,
                                          fname=getname(self.func),
                          return r
                  def map(self, *sequences):
-                     """call a function on each element of a sequence remotely.
+                     """call a function on each element of one or more sequence(s) remotely.
                      This should behave very much like the builtin map, but return an AsyncMapResult
                      if self.block is False.
+                     That means it can take generators (will be cast to lists locally),
+                     and mismatched sequence lengths will be padded with None.
                      """
-                     # set _map as a flag for use inside self.__call__
-                     self._map = True
+                     # set _mapping as a flag for use inside self.__call__
+                     self._mapping = True
                      try:
-                         ret = self.__call__(*sequences)
+                         ret = self(*sequences)
                      finally:
-                         del self._map
+                         self._mapping = False
                      return ret
              __all__ = ['remote', 'parallel', 'RemoteFunction', 'ParallelFunction']

IPython/parallel/tests/test_lbview.py

0 +34 0

		@@ -59,6 +59,40 b' class TestLoadBalancedView(ClusterTestCase):'
59	59	r = self.view.map_sync(f, data)
60	60	self.assertEqual(r, map(f, data))
61	61
	62	def test_map_generator(self):
	63	def f(x):
	64	return x**2
	65
	66	data = range(16)
	67	r = self.view.map_sync(f, iter(data))
	68	self.assertEqual(r, map(f, iter(data)))
	69
	70	def test_map_short_first(self):
	71	def f(x,y):
	72	if y is None:
	73	return y
	74	if x is None:
	75	return x
	76	return x*y
	77	data = range(10)
	78	data2 = range(4)
	79
	80	r = self.view.map_sync(f, data, data2)
	81	self.assertEqual(r, map(f, data, data2))
	82
	83	def test_map_short_last(self):
	84	def f(x,y):
	85	if y is None:
	86	return y
	87	if x is None:
	88	return x
	89	return x*y
	90	data = range(4)
	91	data2 = range(10)
	92
	93	r = self.view.map_sync(f, data, data2)
	94	self.assertEqual(r, map(f, data, data2))
	95
62	96	def test_map_unordered(self):
63	97	def f(x):
64	98	return x**2

General Comments 0

Write
Preview

You need to be logged in to leave comments. Log in now

No TODOs yet

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages