Fix TASK_SOURCE cache policy for remote execution with cloudpickle

desertaxle · claude · desertaxle · commit 71988fe41161 · 2025-12-22T10:51:00.000-06:00
This PR fixes an issue where the `TASK_SOURCE` cache policy fails when used with remote execution decorators like `@ecs` that use cloudpickle to ship code to remote environments. The problem: `inspect.getsource()` fails on cloudpickled functions because the original source file doesn't exist on the remote machine. The previous fallback to hashing `__code__.co_code` (bytecode) led to inconsistent cache keys because bytecode varies across Python versions and the code object contains unstable attributes like `co_locals` that change between serialization/deserialization cycles. The solution: Store the function's source code on the `Task` object during initialization so it survives cloudpickle serialization. The `TaskSource.compute_key()` method now checks for this stored source code first before falling back to `inspect.getsource()`. This ensures stable, deterministic cache keys regardless of execution environment. 🤖 Generated with [Claude Code](https://claude.com/claude-code) Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
diff --git a/src/prefect/cache_policies.py b/src/prefect/cache_policies.py
@@ -291,6 +291,13 @@ def compute_key(
     ) -> Optional[str]:
         if not task_ctx:
             return None
+
+        # Use stored source code if available (works after cloudpickle serialization)
+        source_code = getattr(task_ctx.task, "source_code", None)
+        if source_code is not None:
+            return hash_objects(source_code, raise_on_failure=True)
+
+        # Fall back to inspect.getsource when no source code was stored on the task
         try:
             lines = inspect.getsource(task_ctx.task)
         except TypeError:
diff --git a/src/prefect/tasks.py b/src/prefect/tasks.py
@@ -456,6 +456,14 @@ def __init__(
         update_wrapper(self, fn)
         self.fn = fn
 
+        # Capture source code for cache key computation
+        # This is stored on the task so it survives cloudpickle serialization
+        # to remote environments where the source file is not available
+        try:
+            self.source_code: str | None = inspect.getsource(fn)
+        except (TypeError, OSError):
+            self.source_code = None
+
         # the task is considered async if its function is async or an async
         # generator
         self.isasync: bool = inspect.iscoroutinefunction(
diff --git a/tests/test_cache_policies.py b/tests/test_cache_policies.py
@@ -283,35 +283,100 @@ def my_func(x):
 
         assert key != new_key
 
-    def test_source_fallback_behavior(self):
+    def test_uses_stored_source_code(self):
+        """Test that TaskSource uses stored source_code attribute when available."""
         policy = TaskSource()
 
-        def task_a_fn():
-            pass
+        mock_task_a = MagicMock()
+        mock_task_b = MagicMock()
+
+        # Set different source code on each mock task
+        mock_task_a.source_code = "def task_a():\n    return 'a'"
+        mock_task_b.source_code = "def task_b():\n    return 'b'"
+
+        task_ctx_a = TaskRunContext.model_construct(task=mock_task_a)
+        task_ctx_b = TaskRunContext.model_construct(task=mock_task_b)
+
+        key_a = policy.compute_key(
+            task_ctx=task_ctx_a, inputs=None, flow_parameters=None
+        )
+        key_b = policy.compute_key(
+            task_ctx=task_ctx_b, inputs=None, flow_parameters=None
+        )
+
+        # Keys should be generated and different for different source code
+        assert key_a is not None
+        assert key_b is not None
+        assert key_a != key_b
+
+    def test_stored_source_code_stability(self):
+        """Test that the same source code produces the same key consistently."""
+        policy = TaskSource()
+
+        mock_task = MagicMock()
+        mock_task.source_code = "def my_task():\n    return 'hello'"
 
-        def task_b_fn():
-            return 1
+        task_ctx = TaskRunContext.model_construct(task=mock_task)
+
+        key1 = policy.compute_key(task_ctx=task_ctx, inputs=None, flow_parameters=None)
+        key2 = policy.compute_key(task_ctx=task_ctx, inputs=None, flow_parameters=None)
+
+        # Same source code should produce same key
+        assert key1 == key2
+
+    def test_fallback_when_source_code_is_none(self):
+        """Test that TaskSource returns None when source_code is None and getsource raises OSError."""
+        policy = TaskSource()
 
         mock_task_a = MagicMock()
         mock_task_b = MagicMock()
 
-        mock_task_a.fn = task_a_fn
-        mock_task_b.fn = task_b_fn
+        mock_task_a.source_code = None
+        mock_task_b.source_code = None
 
         task_ctx_a = TaskRunContext.model_construct(task=mock_task_a)
         task_ctx_b = TaskRunContext.model_construct(task=mock_task_b)
 
+        # When source_code is None and getsource fails, policy returns None
         for os_error_msg in {"could not get source code", "source code not available"}:
-            with patch("inspect.getsource", side_effect=OSError(os_error_msg)):
+            with patch(
+                "prefect.cache_policies.inspect.getsource",
+                side_effect=OSError(os_error_msg),
+            ):
                 fallback_key_a = policy.compute_key(
                     task_ctx=task_ctx_a, inputs=None, flow_parameters=None
                 )
                 fallback_key_b = policy.compute_key(
                     task_ctx=task_ctx_b, inputs=None, flow_parameters=None
                 )
 
-            assert fallback_key_a and fallback_key_b
-            assert fallback_key_a != fallback_key_b
+            # Without stored source and without getsource, returns None
+            assert fallback_key_a is None
+            assert fallback_key_b is None
+
+    def test_returns_none_when_no_source_available(self):
+        """Test that TaskSource returns None when source_code is None and getsource raises TypeError."""
+        policy = TaskSource()
+
+        def task_fn():
+            return "test"
+
+        mock_task = MagicMock()
+        mock_task.source_code = None
+        mock_task.fn = task_fn
+
+        task_ctx = TaskRunContext.model_construct(task=mock_task)
+
+        # When source_code is None and getsource raises TypeError, returns None
+        with patch(
+            "prefect.cache_policies.inspect.getsource",
+            side_effect=TypeError("not a function"),
+        ):
+            key = policy.compute_key(
+                task_ctx=task_ctx, inputs=None, flow_parameters=None
+            )
+
+        assert key is None
 
 
 class TestDefaultPolicy:
diff --git a/tests/test_tasks.py b/tests/test_tasks.py
@@ -161,6 +161,62 @@ def __call__(self, x):
         assert tt.task_key.startswith("Funky-")
 
 
+class TestTaskSourceCode:
+    def test_source_code_captured_for_function(self):
+        @task
+        def my_task():
+            return 42
+
+        assert my_task.source_code is not None
+        assert "def my_task" in my_task.source_code
+        assert "return 42" in my_task.source_code
+
+    def test_source_code_is_none_for_callable_object(self):
+        class MyCallable:
+            def __call__(self):
+                return 42
+
+        callable_obj = MyCallable()
+        my_task = Task(fn=callable_obj)
+
+        # inspect.getsource raises TypeError for callable instances; no source is stored
+        assert my_task.source_code is None
+
+    def test_source_code_survives_cloudpickle(self):
+        import cloudpickle
+
+        @task
+        def my_task():
+            return "hello"
+
+        # Verify source code is captured
+        original_source = my_task.source_code
+        assert original_source is not None
+        assert "def my_task" in original_source
+
+        # Serialize and deserialize the task
+        pickled = cloudpickle.dumps(my_task)
+        restored_task = cloudpickle.loads(pickled)
+
+        # Source code should survive serialization
+        assert restored_task.source_code == original_source
+
+    def test_source_code_different_for_different_tasks(self):
+        @task
+        def task_a():
+            return "a"
+
+        @task
+        def task_b():
+            return "b"
+
+        assert task_a.source_code is not None
+        assert task_b.source_code is not None
+        assert task_a.source_code != task_b.source_code
+        assert "task_a" in task_a.source_code
+        assert "task_b" in task_b.source_code
+
+
 class TestTaskRunName:
     def test_run_name_default(self):
         @task