Skip to content

Commit e149887

Browse files
committed
Upgrade skypilot to 0.7.0
Signed-off-by: Hemil Desai <hemild@nvidia.com>
1 parent 03db88e commit e149887

File tree

2 files changed: +7 additions, -3 deletions

2 files changed: +7 additions, -3 deletions

pyproject.toml

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -47,10 +47,10 @@ dgx_cloud = "nemo_run.run.torchx_backend.schedulers.dgxcloud:create_scheduler"
4747

4848
[project.optional-dependencies]
4949
skypilot = [
50-
"skypilot[kubernetes]>=v0.6.1",
50+
"skypilot[kubernetes]>=v0.7.0",
5151
]
5252
skypilot-all = [
53-
"skypilot[all]>=v0.6.1",
53+
"skypilot[all]>=v0.7.0",
5454
]
5555

5656
[dependency-groups]

src/nemo_run/core/execution/skypilot.py

Lines changed: 5 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -18,7 +18,7 @@
1818
import subprocess
1919
from dataclasses import dataclass, field
2020
from pathlib import Path
21-
from typing import Optional, Type, Union
21+
from typing import Any, Optional, Type, Union
2222

2323
from invoke.context import Context
2424

@@ -104,6 +104,7 @@ class SkypilotExecutor(Executor):
104104
autodown: bool = False
105105
idle_minutes_to_autostop: Optional[int] = None
106106
torchrun_nproc_per_node: Optional[int] = None
107+
cluster_config_overrides: Optional[dict[str, Any]] = None
107108
packager: Packager = field(default_factory=lambda: GitArchivePackager()) # type: ignore # noqa: F821
108109

109110
def __post_init__(self):
@@ -182,6 +183,9 @@ def parse_attr(attr: str):
182183
parse_attr(attr)
183184

184185
resources_cfg["any_of"] = any_of
186+
if self.cluster_config_overrides:
187+
resources_cfg["_cluster_config_overrides"] = self.cluster_config_overrides
188+
185189
resources = Resources.from_yaml_config(resources_cfg)
186190

187191
return resources # type: ignore

0 commit comments

Comments
 (0)