]> granicus.if.org Git - python/commitdiff
Issue #23992: multiprocessing: make MapResult not fail-fast upon exception.
author Charles-François Natali <cf.natali@gmail.com>
Wed, 10 Feb 2016 22:58:18 +0000 (22:58 +0000)
committer Charles-François Natali <cf.natali@gmail.com>
Wed, 10 Feb 2016 22:58:18 +0000 (22:58 +0000)
Lib/multiprocessing/pool.py
Lib/test/_test_multiprocessing.py
Misc/NEWS

index 6d25469e1620c0cae48c70611c1a530a041551f3..ffdf42614d59ebadd021d98c66cfcebdcd5408b1 100644 (file)
--- a/Lib/multiprocessing/pool.py
+++ b/Lib/multiprocessing/pool.py
@@ -638,22 +638,26 @@ class MapResult(ApplyResult):
             self._number_left = length//chunksize + bool(length % chunksize)
 
     def _set(self, i, success_result):
+        self._number_left -= 1
         success, result = success_result
-        if success:
+        if success and self._success:
             self._value[i*self._chunksize:(i+1)*self._chunksize] = result
-            self._number_left -= 1
             if self._number_left == 0:
                 if self._callback:
                     self._callback(self._value)
                 del self._cache[self._job]
                 self._event.set()
         else:
-            self._success = False
-            self._value = result
-            if self._error_callback:
-                self._error_callback(self._value)
-            del self._cache[self._job]
-            self._event.set()
+            if not success and self._success:
+                # only store first exception
+                self._success = False
+                self._value = result
+            if self._number_left == 0:
+                # only consider the result ready once all jobs are done
+                if self._error_callback:
+                    self._error_callback(self._value)
+                del self._cache[self._job]
+                self._event.set()
 
 #
 # Class whose instances are returned by `Pool.imap()`
index e9120abe5d9cc6e45031441cab1f720f64b9f2b2..a59d2ba6692969391cc1b5d2c38bf7f30701ab57 100644 (file)
--- a/Lib/test/_test_multiprocessing.py
+++ b/Lib/test/_test_multiprocessing.py
@@ -1660,6 +1660,10 @@ def sqr(x, wait=0.0):
 def mul(x, y):
     return x*y
 
+def raise_large_valuerror(wait):
+    time.sleep(wait)
+    raise ValueError("x" * 1024**2)
+
 class SayWhenError(ValueError): pass
 
 def exception_throwing_generator(total, when):
@@ -1895,6 +1899,26 @@ class _TestPool(BaseTestCase):
             with self.assertRaises(RuntimeError):
                 p.apply(self._test_wrapped_exception)
 
+    def test_map_no_failfast(self):
+        # Issue #23992: the fail-fast behaviour when an exception is raised
+        # during map() would make Pool.join() deadlock, because a worker
+        # process would fill the result queue (after the result handler thread
+        # terminated, hence not draining it anymore).
+
+        t_start = time.time()
+
+        with self.assertRaises(ValueError):
+            with self.Pool(2) as p:
+                try:
+                    p.map(raise_large_valuerror, [0, 1])
+                finally:
+                    time.sleep(0.5)
+                    p.close()
+                    p.join()
+
+        # check that we indeed waited for all jobs
+        self.assertGreater(time.time() - t_start, 0.9)
+
 
 def raising():
     raise KeyError("key")
index 1ac4ad02b4beb7e4121f1dcfa8f3c908b2e30073..22a392ef69b49871b73146e7318aeff577420d45 100644 (file)
--- a/Misc/NEWS
+++ b/Misc/NEWS
@@ -179,6 +179,8 @@ Core and Builtins
 Library
 -------
 
+- Issue #23992: multiprocessing: make MapResult not fail-fast upon exception.
+
 - Issue #26243: Support keyword arguments to zlib.compress().  Patch by Aviv
   Palivoda.