10 changes: 10 additions & 0 deletions AGENTS.md
@@ -0,0 +1,10 @@
# Overview
* use `just` as the command runner -- `just val` in the backend runs typechecking and testing. Always run it after any change to Python code
* the project is managed by `uv` -- use it for Python-related subcommands, e.g. `uv run pytest` for tests or `uv run ty` for typechecking
* there are two Python modules -- `cascade`, a low-level execution engine, and `earthkit.workflows`, a higher-level abstraction on top of it. Each has its own subdirectory in `tests`
* always use type annotations; they are enforced
* when working with a package with poor typing coverage, such as sqlalchemy, use a `ty: ignore` comment
* likewise use `ty: ignore` when ty itself is not powerful enough
* use `typing.cast` when the code logic implicitly erases type information (see the first sketch below this list)
* prefer `pydantic.BaseModel` or `dataclasses.dataclass` objects for capturing contracts and interfaces (see the second sketch below this list)
* ideally keep them plain, stateless, frozen, and free of methods -- we often serialize these objects over to other Python processes or different languages
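
To illustrate the escape-hatch bullets, a minimal sketch -- not part of this diff; the sqlalchemy query and the exact `ty: ignore` placement are illustrative assumptions:

```python
import typing

from sqlalchemy import create_engine, text  # a package with patchy typing coverage

def user_names() -> list[str]:
    engine = create_engine("sqlite:///:memory:")
    with engine.connect() as conn:
        result = conn.execute(text("select name from users"))  # ty: ignore
        # the driver layer erases the row type; we know each row is a
        # 1-tuple of str here, so typing.cast restores that information
        rows = typing.cast(list[tuple[str]], result.fetchall())
    return [name for (name,) in rows]
```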
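And a sketch of the contract style from the last two bullets; `TaskSpec` and its fields are hypothetical, not names from this repo:

```python
from dataclasses import dataclass

@dataclass(frozen=True)
class TaskSpec:
    """Plain, stateless, frozen, method-free -- cheap to pickle and easy to
    mirror as JSON for other Python processes or other languages."""

    task_id: str
    inputs: tuple[str, ...]  # tuples, not lists: immutable and hashable
    outputs: tuple[str, ...]
```

Freezing makes accidental mutation fail loudly before the object crosses a process boundary, and keeping it method-free means a consumer in another language only has to mirror the fields.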
26 changes: 15 additions & 11 deletions src/cascade/executor/runner/runner.py
@@ -12,6 +12,7 @@
"""

import logging
from collections.abc import Generator
from dataclasses import dataclass
from time import perf_counter_ns
from typing import Any, Callable
@@ -81,19 +82,9 @@ def run(taskId: TaskId, executionContext: ExecutionContext, memory: Memory) -> N

     # invoke
     result = func(*args, **kwargs)
-    if outputsN == 1:
-        mark({"task": taskId, "action": TaskLifecycle.computed})
-        run_end = perf_counter_ns()
 
     # store outputs
-    if outputsN == 1:
-        outputKey, outputSchema = outputs[0]
-        outputId = DatasetId(taskId, outputKey)
-        memory.handle(
-            outputId, outputSchema, result, outputId in executionContext.publish
-        )
-        mark({"task": taskId, "action": TaskLifecycle.published})
-    else:
+    if isinstance(result, Generator):
         outputsI = iter(outputs)
         for (outputKey, outputSchema), outputValue in zip(outputsI, result):
             outputId = DatasetId(taskId, outputKey)
@@ -113,6 +104,19 @@
         mark({"task": taskId, "action": TaskLifecycle.computed})
         run_end = perf_counter_ns()
         mark({"task": taskId, "action": TaskLifecycle.published})
+    else:
+        if outputsN != 1:
+            raise ValueError(
+                f"task {taskId} returned non-generator result but has {outputsN} outputs declared"
+            )
+        mark({"task": taskId, "action": TaskLifecycle.computed})
+        run_end = perf_counter_ns()
+        outputKey, outputSchema = outputs[0]
+        outputId = DatasetId(taskId, outputKey)
+        memory.handle(
+            outputId, outputSchema, result, outputId in executionContext.publish
+        )
+        mark({"task": taskId, "action": TaskLifecycle.published})
     end = perf_counter_ns()
 
     trace(Microtrace.wrk_task, end - start)
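
For context, a self-contained sketch of the dispatch pattern this diff introduces: branch on whether the task function returned a generator and fan yielded values out to the declared outputs, otherwise require exactly one declared output. Names like `store_outputs` and `handle` are hypothetical stand-ins for the runner's `memory.handle` machinery:

```python
from collections.abc import Generator
from typing import Any, Callable

def store_outputs(
    func: Callable[[], Any],
    outputs: list[str],
    handle: Callable[[str, Any], None],
) -> None:
    result = func()
    if isinstance(result, Generator):
        # multi-output task: pair declared outputs with yielded values, lazily
        for key, value in zip(outputs, result):
            handle(key, value)
    else:
        # plain return value: exactly one output must be declared
        if len(outputs) != 1:
            raise ValueError(f"non-generator result but {len(outputs)} outputs declared")
        handle(outputs[0], result)

# usage: a two-output generator task
def task() -> Generator[int, None, None]:
    yield 1
    yield 2

store_outputs(task, ["a", "b"], lambda key, value: print(key, value))  # a 1, then b 2
```

Dispatching on the runtime type rather than on `outputsN` lets a single-output task simply return its value, while multi-output tasks stream their results one at a time instead of materializing them all up front.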