Skip to content

Commit 4cf3936

Browse files
thomasdhc authored and NeMo Bot committed
ci: Add open-clip-torch as vlm dependency (#1329)
* Add open-clip-torch as vlm dependency
  Signed-off-by: Dong Hyuk Chang <donghyukc@nvidia.com>
* Fix vlm typo
  Signed-off-by: Dong Hyuk Chang <donghyukc@nvidia.com>
* Update uv lock
  Signed-off-by: thomasdhc <thomasdhc@users.noreply.github.com>
---------
Signed-off-by: Dong Hyuk Chang <donghyukc@nvidia.com>
Signed-off-by: thomasdhc <thomasdhc@users.noreply.github.com>
Co-authored-by: thomasdhc <thomasdhc@users.noreply.github.com>
Signed-off-by: NeMo Bot <nemo-bot@nvidia.com>
1 parent bc8bfa7 commit 4cf3936

File tree

3 files changed

+60
-12
lines changed

3 files changed

+60
-12
lines changed

docker/common/uv-pytorch.lock

Lines changed: 25 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -3192,6 +3192,7 @@ all = [
31923192
{ name = "numpy", version = "2.4.1", source = { registry = "https://pypi.org/simple" }, marker = "python_full_version >= '3.13'" },
31933193
{ name = "nv-grouped-gemm" },
31943194
{ name = "onnxscript" },
3195+
{ name = "open-clip-torch" },
31953196
{ name = "perceptron" },
31963197
{ name = "pillow" },
31973198
{ name = "qwen-omni-utils" },
@@ -3238,6 +3239,7 @@ vlm = [
32383239
{ name = "numba", version = "0.62.1", source = { registry = "https://pypi.org/simple" }, marker = "python_full_version < '3.13'" },
32393240
{ name = "numpy", version = "1.26.4", source = { registry = "https://pypi.org/simple" }, marker = "python_full_version < '3.13'" },
32403241
{ name = "numpy", version = "2.4.1", source = { registry = "https://pypi.org/simple" }, marker = "python_full_version >= '3.13'" },
3242+
{ name = "open-clip-torch" },
32413243
{ name = "pillow" },
32423244
{ name = "qwen-omni-utils" },
32433245
{ name = "qwen-vl-utils", extra = ["decord"], marker = "platform_machine == 'x86_64' and sys_platform != 'darwin'" },
@@ -3306,6 +3308,7 @@ requires-dist = [
33063308
{ name = "numpy", marker = "extra == 'vlm'" },
33073309
{ name = "nv-grouped-gemm", marker = "extra == 'cuda'" },
33083310
{ name = "onnxscript", marker = "extra == 'cuda'", specifier = ">=0.5.6" },
3311+
{ name = "open-clip-torch", marker = "extra == 'vlm'" },
33093312
{ name = "opencv-python-headless", specifier = "==4.10.0.84" },
33103313
{ name = "perceptron", marker = "extra == 'extra'" },
33113314
{ name = "pillow", marker = "extra == 'vlm'" },
@@ -3754,6 +3757,25 @@ wheels = [
37543757
{ url = "https://files.pythonhosted.org/packages/0c/28/96f946a46b1b5d9ac2cd74f40df17e47e3481aeb469c23d7152d7ba1283f/onnxscript-0.6.0-py3-none-any.whl", hash = "sha256:80ded699e4953b05134e79abf6b77969ad4d66587f532ca583bee382086d1d24", size = 689121, upload-time = "2026-01-29T19:08:59.296Z" },
37553758
]
37563759

3760+
[[package]]
3761+
name = "open-clip-torch"
3762+
version = "3.2.0"
3763+
source = { registry = "https://pypi.org/simple" }
3764+
dependencies = [
3765+
{ name = "ftfy" },
3766+
{ name = "huggingface-hub" },
3767+
{ name = "regex" },
3768+
{ name = "safetensors" },
3769+
{ name = "timm" },
3770+
{ name = "torch", marker = "sys_platform == 'never'" },
3771+
{ name = "torchvision", marker = "sys_platform == 'never'" },
3772+
{ name = "tqdm" },
3773+
]
3774+
sdist = { url = "https://files.pythonhosted.org/packages/30/46/fb8be250fa7fcfc56fbeb41583645e18d868268f67fbbbeb8ed62a8ff18a/open_clip_torch-3.2.0.tar.gz", hash = "sha256:62b7743012ccc40fb7c64819fa762fba0a13dd74585ac733babe58c2974c2506", size = 1502853, upload-time = "2025-09-21T17:32:08.289Z" }
3775+
wheels = [
3776+
{ url = "https://files.pythonhosted.org/packages/94/91/397327cc1597fa317942cc15bef414175eee4b3c2263b34407c57f3521f9/open_clip_torch-3.2.0-py3-none-any.whl", hash = "sha256:e1f5b3ecbadb6d8ea64b1f887db23efee9739e7c0d0075a8a2a3cabae8fed8d1", size = 1546677, upload-time = "2025-09-21T17:32:06.269Z" },
3777+
]
3778+
37573779
[[package]]
37583780
name = "opencv-python-headless"
37593781
version = "4.10.0.84"
@@ -6065,7 +6087,7 @@ wheels = [
60656087

60666088
[[package]]
60676089
name = "timm"
6068-
version = "1.0.16"
6090+
version = "1.0.22"
60696091
source = { registry = "https://pypi.org/simple" }
60706092
dependencies = [
60716093
{ name = "huggingface-hub" },
@@ -6074,9 +6096,9 @@ dependencies = [
60746096
{ name = "torch", marker = "sys_platform == 'never'" },
60756097
{ name = "torchvision", marker = "sys_platform == 'never'" },
60766098
]
6077-
sdist = { url = "https://files.pythonhosted.org/packages/94/f6/4d7a8c261341fa6ad281920618739f2a650f41043afcedb570f24e99a776/timm-1.0.16.tar.gz", hash = "sha256:a3b8130dd2cb8dc3b9f5e3d09ab6d677a6315a8695fd5264eb6d52a4a46c1044", size = 2339999, upload-time = "2025-06-26T17:09:44.208Z" }
6099+
sdist = { url = "https://files.pythonhosted.org/packages/c5/9d/e4670765d1c033f97096c760b3b907eeb659cf80f3678640e5f060b04c6c/timm-1.0.22.tar.gz", hash = "sha256:14fd74bcc17db3856b1a47d26fb305576c98579ab9d02b36714a5e6b25cde422", size = 2382998, upload-time = "2025-11-05T04:06:09.377Z" }
60786100
wheels = [
6079-
{ url = "https://files.pythonhosted.org/packages/3b/14/10d0ea58a7580b8bd7c8d69420b3dc3a1deb890d4ff297deca9717689598/timm-1.0.16-py3-none-any.whl", hash = "sha256:a640e58f4ae41e0445517d1133b34be75bb2bd49cdb830d739925ce1fb7d2526", size = 2485733, upload-time = "2025-06-26T17:09:42.652Z" },
6101+
{ url = "https://files.pythonhosted.org/packages/d6/14/fc04d491527b774ec7479897f5861959209de1480e4c4cd32ed098ff8bea/timm-1.0.22-py3-none-any.whl", hash = "sha256:888981753e65cbaacfc07494370138b1700a27b1f0af587f4f9b47bc024161d0", size = 2530238, upload-time = "2025-11-05T04:06:06.823Z" },
60806102
]
60816103

60826104
[[package]]

pyproject.toml

Lines changed: 7 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -116,16 +116,17 @@ moe = [
116116
"deep_ep",
117117
]
118118
vlm = [
119-
"pillow",
120-
"qwen-vl-utils[decord]; (platform_machine == 'x86_64' and platform_system != 'Darwin')",
121-
"qwen-omni-utils",
122-
"timm<=1.0.22",
119+
"albumentations",
123120
"backoff",
121+
"mistral_common[opencv]>=1.9.0",
124122
"numpy",
125123
"numba",
124+
"open-clip-torch",
125+
"pillow",
126+
"qwen-omni-utils",
127+
"qwen-vl-utils[decord]; (platform_machine == 'x86_64' and platform_system != 'Darwin')",
128+
"timm<=1.0.22",
126129
"torchcodec; (platform_machine == 'x86_64' and platform_system != 'Darwin')",
127-
"mistral_common[opencv]>=1.9.0",
128-
"albumentations"
129130
]
130131
all = [
131132
"nemo_automodel[cuda]",

uv.lock

Lines changed: 28 additions & 3 deletions
Some generated files are not rendered by default. Learn more about customizing how changed files appear on GitHub.

0 commit comments

Comments
 (0)