[slimtensor] Add CUDA slimtensor creation with basic functionality #5314
cuda.yml
on: pull_request
Matrix: export-model-cuda-artifact
Matrix: test-cuda-builds
unittest-cuda / linux-job — 25m 13s
Matrix: test-models-cuda
Matrix: test-model-cuda-e2e
check-all-cuda-builds — 2s
Artifacts
Produced during runtime
| Name | Size | Digest | |
|---|---|---|---|
| google-gemma-3-4b-it-cuda-non-quantized | 7.22 GB | sha256:807c20581ac0e893ab2b4cfe1c55885687a73c3c1d63a2125283658b32d6f0bd | |
| google-gemma-3-4b-it-cuda-quantized-int4-tile-packed | 3.36 GB | sha256:e4a27f92b8a5495bf112df6681496abb80104144fb916e91c03cb812093b7413 | |
| mistralai-Voxtral-Mini-3B-2507-cuda-non-quantized | 6.82 GB | sha256:b445439bc6d21ec30a6ad6a8a0f96aa6361e454f2b0755706bf21eda8bacede8 | |
| mistralai-Voxtral-Mini-3B-2507-cuda-quantized-int4-tile-packed | 2.8 GB | sha256:3643ee654b3d8c706bea3317b42fa38b05d5d92ed55e4ad615064ff6568871ed | |
| mistralai-Voxtral-Mini-3B-2507-cuda-quantized-int4-weight-only | 6.14 GB | sha256:3805a16b9bbadd0b577d28a04184dcbd733c4821e9132a0b0772d19a5d450a7a | |
| openai-whisper-large-v3-turbo-cuda-non-quantized | 1.18 GB | sha256:f34cc596ac08b6b254bbe97db867fa611abb70a140a4a35e08d7b19d1cce3672 | |
| openai-whisper-large-v3-turbo-cuda-quantized-int4-tile-packed | 491 MB | sha256:71f075c4cd426c222177e7c16c97cc5bfc40b57a95dd06d6db528ad3a8ba84d4 | |
| openai-whisper-large-v3-turbo-cuda-quantized-int4-weight-only | 485 MB | sha256:de36adeb072e7721962510dda98cc215aae18a784dd1bda8087e58abd1f1ced2 | |
| openai-whisper-small-cuda-non-quantized | 361 MB | sha256:b10264f6308a0bb88fd69fd36dc0e99d7d917e7b7d8d65342a00651f16479194 | |
| openai-whisper-small-cuda-quantized-int4-tile-packed | 172 MB | sha256:f18cf06eceae7e82c3191308bebdd649e826107efb8034f0ad71ec7fe1f8bdfe | |
| openai-whisper-small-cuda-quantized-int4-weight-only | 270 MB | sha256:c138377a8dca4d813661d0323a82eb45358ed91dc5d77d716036c555a9146b1b | |