Skip to content

Commit c16a572

Browse files
Add retry_until_up (#340)
Signed-off-by: Romil Bhardwaj <[email protected]>
1 parent 2caf5d7 commit c16a572

File tree

1 file changed: 2 additions and 1 deletion (+2 −1 lines changed).

nemo_run/core/execution/skypilot.py

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -107,6 +107,7 @@ class SkypilotExecutor(Executor):
107 107   cluster_config_overrides: Optional[dict[str, Any]] = None
108 108   infra: Optional[str] = None
109 109   network_tier: Optional[str] = None
    110 + retry_until_up: bool = False
110 111   packager: Packager = field(default_factory=lambda: GitArchivePackager()) # type: ignore # noqa: F821
111 112
112 113   def __post_init__(self):
@@ -410,7 +411,7 @@ def launch(
410 411   idle_minutes_to_autostop=self.idle_minutes_to_autostop,
411 412   down=self.autodown,
412 413   fast=True,
413     - # retry_until_up=retry_until_up,
    414 + retry_until_up=self.retry_until_up,
414 415   # clone_disk_from=clone_disk_from,
415 416   )
416 417   )

0 commit comments

Comments
 (0)