Netflix · npow · Apr 12, 2026 · Mar 6, 2026 · Mar 6, 2026 · Mar 6, 2026
diff --git a/metaflow/datastore/flow_datastore.py b/metaflow/datastore/flow_datastore.py
@@ -241,6 +241,17 @@ def get_task_datastores(
             )
             for v in latest_to_fetch
         ]
+        if pathspecs:
+            # The set operations above (latest_started_attempts & done_attempts)
+            # discard the original pathspecs ordering. Callers that pass pathspecs
+            # expect results back in that same order -- e.g. foreach join inputs
+            # must arrive in split order -- so sort to restore it.
+            # pathspec format: run_id/step_name/task_id[/attempt]; key = (step, task)
+            position = {
+                (ps.split("/")[1], ps.split("/")[2]): i
+                for i, ps in enumerate(pathspecs)
+            }
+            latest_to_fetch.sort(key=lambda v: position[v[1], v[2]])
         return list(itertools.starmap(self.get_task_datastore, latest_to_fetch))
 
     def get_task_datastore(

diff --git a/metaflow/datastore/inputs.py b/metaflow/datastore/inputs.py
@@ -6,7 +6,6 @@ class Inputs(object):
     """
 
     def __init__(self, flows):
-        # TODO sort by foreach index
         self.flows = list(flows)
         for flow in self.flows:
             setattr(self, flow._current_step, flow)

diff --git a/test/core/tests/basic_foreach.py b/test/core/tests/basic_foreach.py
@@ -17,7 +17,41 @@ class BasicForeachTest(MetaflowTest):
     @steps(0, ["foreach-split"], required=True)
     def split(self):
         self.my_index = None
-        self.arr = range(32)
+        # Shuffled permutation of range(32): exposes joins that lose foreach order
+        self.arr = [
+            26,
+            5,
+            10,
+            15,
+            25,
+            11,
+            22,
+            6,
+            19,
+            12,
+            16,
+            9,
+            28,
+            14,
+            24,
+            20,
+            30,
+            1,
+            13,
+            18,
+            2,
+            17,
+            21,
+            3,
+            29,
+            4,
+            27,
+            31,
+            8,
+            23,
+            0,
+            7,
+        ]
 
     @steps(0, ["foreach-inner"], required=True)
     def inner(self):
@@ -30,8 +64,44 @@ def inner(self):
 
     @steps(0, ["foreach-join"], required=True)
     def join(self, inputs):
-        got = sorted([inp.my_input for inp in inputs])
-        assert_equals(list(range(32)), got)
+        got = [inp.my_input for inp in inputs]
+        assert_equals(
+            [
+                26,
+                5,
+                10,
+                15,
+                25,
+                11,
+                22,
+                6,
+                19,
+                12,
+                16,
+                9,
+                28,
+                14,
+                24,
+                20,
+                30,
+                1,
+                13,
+                18,
+                2,
+                17,
+                21,
+                3,
+                29,
+                4,
+                27,
+                31,
+                8,
+                23,
+                0,
+                7,
+            ],
+            got,
+        )
 
     @steps(1, ["all"])
     def step_all(self):

diff --git a/test/core/tests/wide_foreach.py b/test/core/tests/wide_foreach.py
@@ -25,7 +25,7 @@ def inner(self):
 
     @steps(0, ["foreach-join-small"], required=True)
     def join(self, inputs):
-        got = sorted([inp.my_input for inp in inputs])
+        got = [inp.my_input for inp in inputs]
         assert_equals(list(range(1200)), got)
-    def join(self, inputs):
-        got = sorted([inp.my_input for inp in inputs])
-        got = [inp.my_input for inp in inputs]
-        assert_equals(list(range(1200)), got)
+    @steps(0, ["foreach-join-small"], required=True)
+    def join(self, inputs):
+        # arr is range(1200), so each branch's value equals its foreach index.
+        # That makes the assertion an ordering test: any reordering of inputs
+        # leaves some got[i] != i.
+        got = [inp.my_input for inp in inputs]
+        assert_equals(list(range(1200)), got)
-    def join(self, inputs):
-        got = sorted([inp.my_input for inp in inputs])
-        got = [inp.my_input for inp in inputs]
-        assert_equals(list(range(1200)), got)
+    @steps(0, ["foreach-join-small"], required=True)
+    def join(self, inputs):
+        # arr is range(1200), so each branch's value equals its foreach index.
+        # That makes the assertion an ordering test: any reordering of inputs
+        # leaves some got[i] != i.
+        got = [inp.my_input for inp in inputs]
+        assert_equals(list(range(1200)), got)
 
     @steps(1, ["all"])