bpo-29842: Make Executor.map less eager so it handles large/unbounded… #707


Status: Closed. Wants to merge 6 commits.
Changes from 1 commit
bpo-29842: Make Executor.map less eager so it handles large/unbounded input iterables appropriately
MojoVampire committed Mar 18, 2017
commit fbdb56cda18634fce0882e043ac26acd3d2e17c6
Doc/library/concurrent.futures.rst (9 changes: 7 additions & 2 deletions)
@@ -38,7 +38,7 @@ Executor Objects
        future = executor.submit(pow, 323, 1235)
        print(future.result())

-   .. method:: map(func, *iterables, timeout=None, chunksize=1)
+   .. method:: map(func, *iterables, timeout=None, chunksize=1, prefetch=None)

Equivalent to :func:`map(func, *iterables) <map>` except *func* is executed
asynchronously and several calls to *func* may be made concurrently. The
Expand All @@ -54,11 +54,16 @@ Executor Objects
specified by setting *chunksize* to a positive integer. For very long
iterables, using a large value for *chunksize* can significantly improve
performance compared to the default size of 1. With :class:`ThreadPoolExecutor`,
-   *chunksize* has no effect.
+   *chunksize* has no effect. By default, a reasonable number of tasks are
+   queued beyond the number of workers; an explicit *prefetch* count may be
+   provided to specify how many extra tasks should be queued.
Member:

Using "chunks" here would be more precise than "tasks".

Contributor Author:

The documentation for chunksize uses the phrasing "this method chops iterables into a number of chunks which it submits to the pool as separate tasks", and since not all executors even use chunks (ThreadPoolExecutor ignores the argument), I figured I'd stick with "tasks". It does leave the docs without a term for a single work item; they use "chunks" and "tasks" as synonyms.


.. versionchanged:: 3.5
Added the *chunksize* argument.

.. versionchanged:: 3.7
Added the *prefetch* argument.

.. method:: shutdown(wait=True)

Signal the executor that it should free any resources that it is using
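For context, the documented behavior that this patch leaves unchanged: `map` mirrors the built-in `map` but runs calls concurrently, and *timeout* is a deadline for the whole iteration. A minimal stdlib-only example (note that *prefetch* exists only on this branch, so it is not passed here):

```python
from concurrent.futures import ThreadPoolExecutor

with ThreadPoolExecutor(max_workers=2) as ex:
    # Same results as map(pow, [2, 3, 4], [5, 2, 3]), but the calls
    # may run concurrently; timeout bounds the whole iteration.
    results = list(ex.map(pow, [2, 3, 4], [5, 2, 3], timeout=10))

print(results)  # [32, 9, 64]
```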
Lib/concurrent/futures/_base.py (33 changes: 28 additions & 5 deletions)
@@ -4,6 +4,7 @@
 __author__ = 'Brian Quinlan (brian@sweetapp.com)'

 import collections
+import itertools
 import logging
 import threading
 import time
@@ -520,7 +521,7 @@ def submit(self, fn, *args, **kwargs):
"""
raise NotImplementedError()

-    def map(self, fn, *iterables, timeout=None, chunksize=1):
+    def map(self, fn, *iterables, timeout=None, chunksize=1, prefetch=None):
         """Returns an iterator equivalent to map(fn, iter).

         Args:
@@ -544,18 +545,40 @@ def map(self, fn, *iterables, timeout=None, chunksize=1):
         """
         if timeout is not None:
             end_time = timeout + time.time()
+        if prefetch is None:
+            prefetch = self._max_workers
+        if prefetch < 0:
+            raise ValueError("prefetch count may not be negative")

-        fs = [self.submit(fn, *args) for args in zip(*iterables)]
+        argsiter = zip(*iterables)
+
+        fs = collections.deque(self.submit(fn, *args) for args in itertools.islice(argsiter, self._max_workers + prefetch))

         # Yield must be hidden in closure so that the futures are submitted
         # before the first iterator value is required.
         def result_iterator():
+            nonlocal argsiter
             try:
-                for future in fs:
+                while fs:
                     if timeout is None:
-                        yield future.result()
+                        res = fs[0].result()
                     else:
-                        yield future.result(end_time - time.time())
+                        res = fs[0].result(end_time - time.time())
+
+                    # Got a result, future needn't be cancelled
+                    del fs[0]
+
+                    # Dispatch next task before yielding to keep
+                    # pipeline full
+                    if argsiter:
+                        try:
+                            args = next(argsiter)
+                        except StopIteration:
+                            argsiter = None
+                        else:
+                            fs.append(self.submit(fn, *args))
+
+                    yield res
             finally:
                 for future in fs:
                     future.cancel()
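The bounded-prefetch technique in the hunk above can be replicated today on top of the public Executor API without this patch. A standalone sketch: `lazy_map` is a hypothetical helper name, and reading `executor._max_workers` copies the patch's reliance on a private attribute.

```python
import collections
import itertools
from concurrent.futures import ThreadPoolExecutor

def lazy_map(executor, fn, *iterables, prefetch=None):
    """Like Executor.map, but keeps only a bounded window of tasks queued."""
    if prefetch is None:
        prefetch = executor._max_workers  # private attr, mirroring the patch
    if prefetch < 0:
        raise ValueError("prefetch count may not be negative")
    argsiter = zip(*iterables)
    # Seed the pipeline: one task per worker plus `prefetch` spares.
    fs = collections.deque(
        executor.submit(fn, *args)
        for args in itertools.islice(argsiter, executor._max_workers + prefetch)
    )

    def result_iterator():
        try:
            while fs:
                res = fs[0].result()
                del fs[0]  # got a result, so this future needn't be cancelled
                # Top up the pipeline before yielding, keeping workers busy.
                for args in itertools.islice(argsiter, 1):
                    fs.append(executor.submit(fn, *args))
                yield res
        finally:
            for f in fs:  # drop whatever is still queued
                f.cancel()

    return result_iterator()

with ThreadPoolExecutor(max_workers=2) as ex:
    squares = lazy_map(ex, lambda x: x * x, itertools.count())
    first_five = [next(squares) for _ in range(5)]
    squares.close()  # cancels the outstanding futures

print(first_five)  # [0, 1, 4, 9, 16]
```

Closing the generator (or letting it be garbage-collected) cancels the pending futures, which is exactly the behavior debated in the review thread below.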
Lib/concurrent/futures/process.py (4 changes: 2 additions & 2 deletions)
@@ -455,7 +455,7 @@ def submit(self, fn, *args, **kwargs):
         return f
     submit.__doc__ = _base.Executor.submit.__doc__

-    def map(self, fn, *iterables, timeout=None, chunksize=1):
+    def map(self, fn, *iterables, timeout=None, chunksize=1, prefetch=None):
         """Returns an iterator equivalent to map(fn, iter).

         Args:
@@ -481,7 +481,7 @@ def map(self, fn, *iterables, timeout=None, chunksize=1):

         results = super().map(partial(_process_chunk, fn),
                               _get_chunks(*iterables, chunksize=chunksize),
-                              timeout=timeout)
+                              timeout=timeout, prefetch=prefetch)
         return itertools.chain.from_iterable(results)

     def shutdown(self, wait=True):
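ProcessPoolExecutor.map batches its inputs before delegating to the superclass, so one "task" there is a whole chunk of calls. `_get_chunks` and `_process_chunk` are private helpers, but the batching they perform can be sketched with public itertools only:

```python
import itertools

def get_chunks(iterable, chunksize):
    # Yield successive tuples of up to `chunksize` items, as
    # ProcessPoolExecutor does before submitting each tuple as one task.
    it = iter(iterable)
    while True:
        chunk = tuple(itertools.islice(it, chunksize))
        if not chunk:
            return
        yield chunk

chunks = list(get_chunks(range(10), 4))
print(chunks)  # [(0, 1, 2, 3), (4, 5, 6, 7), (8, 9)]
```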
Lib/test/test_concurrent_futures.py (17 changes: 16 additions & 1 deletion)
@@ -467,7 +467,22 @@ def record_finished(n):

         self.executor.map(record_finished, range(10))
         self.executor.shutdown(wait=True)
-        self.assertCountEqual(finished, range(10))
+        # No guarantees on how many tasks dispatched,
+        # but at least one should have been dispatched
+        self.assertGreater(len(finished), 0)
Member:
I think this change breaks compatibility. The doc for shutdown says:

If wait is True then this method will not return until all the pending futures are done executing and the resources associated with the executor have been freed.

So all futures should have executed, instead of being cancelled.

Contributor Author:

At the time I wrote it, it didn't conflict with the documentation precisely; the original documentation said that map was "Equivalent to map(func, *iterables) except func is executed asynchronously and several calls to func may be made concurrently.", but doesn't guarantee that any actual futures exist (it's implemented in terms of submit and futures, but doesn't actually require such a design).

That said, it looks like you updated the documentation to add "the iterables are collected immediately rather than lazily;", which, if considered a guarantee, rather than a warning, would make this a breaking change even ignoring the "cancel vs. wait" issue.

Do you have any suggestions? If strict adherence to your newly (as of late 2017) documented behavior is needed, I suppose I could change the default behavior from "reasonable prefetch" to "exhaustive prefetch", so when prefetch isn't passed, every task is submitted, but it would be kind of annoying to lose the "good by default" behavior of limited prefetching.

The reason I cancelled rather than waiting on the result is that I was trying to follow the normal use pattern for map; since the results are yielded lazily, if the iterator goes away or is closed explicitly (or you explicitly shut down the executor), you're done; having the outstanding futures complete when you're not able to see the results means you're either:

  1. Expecting the tasks to complete without running out the Executor.map (which doesn't work with Py3's map at all, so the analogy to map should allow it; if you don't run it out, you have no guarantees anything was done)
  2. Not planning to use any further results (in which case running any submitted but unscheduled futures means doing work no one can see the results of)

Member:

Actually, I think there are two problems to discuss:

  1. What happens when shutdown(wait=True) is called. Currently it waits for all outstanding tasks. I don't think we can change that (the explicit wait flag exists for a reason).
  2. Whether map() can be silently switched to a lazy mode of operation. There's a (perhaps minor) problem with that. Currently, if one of iterables raises an error, map() propagates the exception. With your proposal, the exception may be raised later inside the result iterator.

I think 2) might easily be worked around by introducing a separate method (lazy_map?).

It seems it would be good to discuss those questions on the mailing-list.
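The second point is easy to demonstrate with the current eager implementation: an error raised by the input iterable surfaces at the `map()` call itself, not later from the result iterator. A small stdlib-only demo (not part of the patch):

```python
from concurrent.futures import ThreadPoolExecutor

def bad_input():
    yield 1
    raise RuntimeError("boom")

with ThreadPoolExecutor(max_workers=1) as ex:
    try:
        ex.map(str, bad_input())  # input is consumed eagerly, right here
    except RuntimeError:
        raised_at = "call time"
    else:
        raised_at = "result iteration"

print(raised_at)  # "call time" under the eager implementation
```

Under the lazy proposal, only the first window of inputs is consumed up front, so the same error could instead surface during result iteration.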

Contributor Author (MojoVampire, May 6, 2019):

Yeah, the problem with using the "lazy_map" name is that it feels like recreating the same annoying distinctions between map and imap from the Py2 era, and it would actually have Executor.map (which is supposed to match map, which lazily consumes the input(s)) be less similar to map than Executor.lazy_map.

If it's necessary to gain acceptance, I could change the default behavior to use prefetch=sys.maxsize - self._max_workers. It would match the pre-existing behavior for just about anything that conceivably worked before (modulo the tiny differences in memory usage of deque vs. list for storing the futures) since:

  1. All tasks would be submitted fully up front, so shutdown(wait=True) would in fact wait on them (and no further calls to submit would occur in the generator, so nothing would submit post-shutdown, which would otherwise raise a RuntimeError and cause the cancellation)
  2. It wouldn't be lazy for anything by default (it would either work eagerly or crash, in the same manner it currently behaves)

If you passed a reasonable prefetch, you wouldn't have these behaviors (and we should document that interaction), but at least existing code would continue to work identically.

Member:

I don't have a strong opinion. I think discussing those alternatives on the ML, to gather more opinions and arguments, would be useful.


+    def test_infinite_map_input_completes_work(self):
+        import itertools
+        def identity(x):
+            return x
+
+        mapobj = self.executor.map(identity, itertools.count(0))
+        # Get one result, which shows we handle infinite inputs
+        # without waiting for all work to be dispatched
+        res = next(mapobj)
+        mapobj.close()  # Make sure futures cancelled
+
+        self.assertEqual(res, 0)

     def test_default_workers(self):
         executor = self.executor_type()
Misc/NEWS (6 changes: 6 additions & 0 deletions)
@@ -281,6 +281,12 @@ Extension Modules
 Library
 -------

+- bpo-29842: Executor.map no longer creates all futures eagerly prior to
+  yielding any results. This allows it to work with huge or infinite iterables
+  without consuming excessive resources or crashing, making it more suitable
+  as a drop-in replacement for the built-in map.
+  Patch by Josh Rosenberg.
+
 - bpo-29800: Fix crashes in partial.__repr__ if the keys of partial.keywords
   are not strings. Patch by Michael Seifert.