use a process pool to calculate profile_uncertainty in parallel #223

Open · wants to merge 2 commits into base: master
refl1d/errors.py: 39 additions & 3 deletions
@@ -11,6 +11,8 @@
 
 from __future__ import print_function
 
+import dill
+
 __all__ = [
     "reload_errors",
     "run_errors",
@@ -21,6 +23,7 @@
     "show_residuals",
 ]
 
+import multiprocessing
 import sys
 import os
 
@@ -119,7 +122,19 @@ def _usage():
     print(run_errors.__doc__)
 
 
-def calc_errors(problem, points):
+def _initialize_worker(shared_serialized_problem):
+    global _shared_problem
+    _shared_problem = dill.loads(np.asarray(shared_serialized_problem[:], dtype="uint8").tobytes())
+
+
+_shared_problem = None  # used by multiprocessing pool to hold problem
+
+
+def _worker_eval_point(point):
+    return _eval_point(_shared_problem, point)
+
+
+def calc_errors(problem, points, parallel: int = 0):
     """
     Align the sample profiles and compute the residual difference from the
     measured reflectivity for a set of points.
@@ -128,6 +143,9 @@ def calc_errors(problem, points):
     distribution computed from MCMC, bootstrapping or sampled from
     the error ellipse calculated at the minimum.
 
+    The *parallel* parameter controls the number of worker processes
+    (0, the default, uses all processors; 1 disables the ProcessPoolExecutor).
+
     Each of the returned arguments is a dictionary mapping model number to
     error sample data as follows:
 
Expand Down Expand Up @@ -161,8 +179,26 @@ def calc_errors(problem, points):

# Put best at slot 0, no alignment
data = [_eval_point(problem, problem.getp())]
for p in points:
data.append(_eval_point(problem, p))

if parallel != 1:
import concurrent.futures
from functools import partial

max_workers = parallel if parallel > 0 else None
serialized_problem_array = np.frombuffer(dill.dumps(problem), dtype="uint8")

with multiprocessing.Manager() as manager:
shared_serialized_problem = manager.Array("B", serialized_problem_array)
args = [(shared_serialized_problem, point) for point in points]

with concurrent.futures.ProcessPoolExecutor(
max_workers=max_workers, initializer=_initialize_worker, initargs=(shared_serialized_problem,)
) as executor:
results = executor.map(_worker_eval_point, points)
data.extend(results)
else:
for p in points:
data.append(_eval_point(problem, p))

profiles, slabs, residuals = zip(*data)

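Usage is unchanged apart from the optional argument; a minimal sketch, assuming a FitProblem `problem` and an array of MCMC parameter draws `points` are already in hand (these names are illustrative, not part of this patch):

from refl1d.errors import calc_errors

# `problem` and `points` are assumed to come from an existing fit session.
errs = calc_errors(problem, points)              # parallel=0 (default): use all processors
errs = calc_errors(problem, points, parallel=4)  # cap the pool at 4 worker processes
errs = calc_errors(problem, points, parallel=1)  # serial path, same behaviour as before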
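For readers unfamiliar with the pool set-up above, here is a self-contained sketch of the worker-initializer pattern the patch relies on: serialize the object once with dill, hand the payload to each worker when the pool starts, and deserialize it a single time per process. This simplified version passes the bytes directly through initargs rather than through a multiprocessing.Manager array; it is illustrative only, not refl1d code.

import concurrent.futures

import dill

_worker_state = None  # set once per worker process by the initializer


def _init(payload):
    global _worker_state
    _worker_state = dill.loads(payload)  # one deserialization per worker


def _evaluate(x):
    return _worker_state(x)  # reuse the already-deserialized object


if __name__ == "__main__":
    payload = dill.dumps(lambda x: x * x)  # stand-in for a serialized FitProblem
    with concurrent.futures.ProcessPoolExecutor(
        max_workers=2, initializer=_init, initargs=(payload,)
    ) as executor:
        print(list(executor.map(_evaluate, range(5))))  # -> [0, 1, 4, 9, 16]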