|
15 | 15 |
|
16 | 16 | from configparser import ConfigParser |
17 | 17 | from dataclasses import dataclass |
18 | | -from typing import List, Optional, Union |
| 18 | +from typing import Annotated, List, Optional, Tuple, Union |
19 | 19 | from unittest.mock import Mock, patch |
20 | 20 |
|
21 | 21 | import fiddle as fdl |
@@ -439,9 +439,9 @@ class Model: |
class Optimizer:
    """Dummy optimizer config.

    Every field carries a default, so ``Optimizer()`` is constructible with no
    arguments — entrypoints in this file rely on that to supply a fallback
    optimizer when the caller passes ``None``.
    """

    learning_rate: float = 0.001
    weight_decay: float = 1e-5
    betas: Tuple[float, float] = (0.9, 0.999)
445 | 445 |
|
446 | 446 |
|
447 | 447 | @run.cli.factory |
@@ -506,6 +506,22 @@ def train_model( |
506 | 506 | return {"model": model, "optimizer": optimizer, "epochs": epochs, "batch_size": batch_size} |
507 | 507 |
|
508 | 508 |
|
@run.cli.entrypoint(
    namespace="my_llm",
    skip_confirmation=True,
)
def train_model_default_optimizer(
    model: Model,
    optimizer: Annotated[Optional[Optimizer], run.Config[Optimizer]] = None,
    epochs: int = 10,
    batch_size: int = 32,
):
    """Train ``model``, constructing a default ``Optimizer`` when none is supplied.

    Thin wrapper around ``train_model`` used to exercise the CLI's handling of
    an ``Optional``-annotated config argument left at its ``None`` default.
    """
    resolved_optimizer = Optimizer() if optimizer is None else optimizer
    return train_model(model, resolved_optimizer, epochs, batch_size)
| 524 | + |
509 | 525 | @run.cli.factory(target=train_model) |
510 | 526 | def custom_defaults() -> run.Partial["train_model"]: |
511 | 527 | return run.Partial( |
@@ -585,6 +601,37 @@ def test_with_defaults(self, runner, app): |
585 | 601 | for i in range(1, 31): |
586 | 602 | assert f"Epoch {i}/30" in output |
587 | 603 |
|
| 604 | + def test_with_defaults_no_optimizer(self, runner, app): |
| 605 | + # Test CLI execution with default factory |
| 606 | + result = runner.invoke( |
| 607 | + app, |
| 608 | + [ |
| 609 | + "my_llm", |
| 610 | + "train_model_default_optimizer", |
| 611 | + "model=my_model(hidden_size=1024)", |
| 612 | + "epochs=30", |
| 613 | + "run.skip_confirmation=True", |
| 614 | + ], |
| 615 | + env={"INCLUDE_WORKSPACE_FILE": "false"}, |
| 616 | + ) |
| 617 | + assert result.exit_code == 0 |
| 618 | + |
| 619 | + # Parse the output to check the values |
| 620 | + output = result.stdout |
| 621 | + assert "Training model with the following configuration:" in output |
| 622 | + assert "Model: Model(hidden_size=1024, num_layers=3, activation='relu')" in output |
| 623 | + assert ( |
| 624 | + "Optimizer: Optimizer(learning_rate=0.001, weight_decay=1e-05, betas=(0.9, 0.999))" |
| 625 | + in output |
| 626 | + ) |
| 627 | + assert "Epochs: 30" in output |
| 628 | + assert "Batch size: 32" in output |
| 629 | + assert "Training completed!" in output |
| 630 | + |
| 631 | + # Check that all epochs were simulated |
| 632 | + for i in range(1, 31): |
| 633 | + assert f"Epoch {i}/30" in output |
| 634 | + |
588 | 635 | def test_experiment_entrypoint(self): |
589 | 636 | def dummy_pretrain(log_dir: str): |
590 | 637 | pass |
|
0 commit comments