[slimtensor] integration into backend #5693
cuda.yml
on: pull_request
Matrix: export-model-cuda-artifact
Matrix: test-cuda-builds
unittest-cuda
/
linux-job
19m 57s
Matrix: test-models-cuda
Matrix: test-model-cuda-e2e
check-all-cuda-builds
2s
Annotations
18 errors
Artifacts
Produced during runtime
| Name | Size | Digest | |
|---|---|---|---|
|
google-gemma-3-4b-it-cuda-non-quantized
|
7.22 GB |
sha256:48473fd0da3e12dee0340c4ebea88e9ee21006f4fef69167fa8318e3dadec157
|
|
|
google-gemma-3-4b-it-cuda-quantized-int4-tile-packed
|
3.36 GB |
sha256:a1cb726ad89cc22687f3f4d3a5fe616ed2a060754bada04c85d5ccf02823ec59
|
|
|
mistralai-Voxtral-Mini-3B-2507-cuda-non-quantized
|
6.82 GB |
sha256:9d13550c9dbf62a27c7421d71e7aec944a048f824981c344255e2ae87a270429
|
|
|
mistralai-Voxtral-Mini-3B-2507-cuda-quantized-int4-tile-packed
|
2.8 GB |
sha256:0cee5809ba176876f7160c64a55db3eb0577d58326a7bbee5d5abc5b8febd664
|
|
|
mistralai-Voxtral-Mini-3B-2507-cuda-quantized-int4-weight-only
|
6.14 GB |
sha256:4d389e693306a2f091ea1ab152d03f551abca0dc12cfb103258896a0e8a5a312
|
|
|
openai-whisper-large-v3-turbo-cuda-non-quantized
|
1.18 GB |
sha256:ee49addda43294a66c0a24676baf7a1b967e100dc4d5bbb66416585c2b6c5e2e
|
|
|
openai-whisper-large-v3-turbo-cuda-quantized-int4-tile-packed
|
491 MB |
sha256:3759d2c52f53823a7dcaaaf4c9e698f7faa4b68cd43c0597f92705281b3d07d9
|
|
|
openai-whisper-large-v3-turbo-cuda-quantized-int4-weight-only
|
485 MB |
sha256:ecb8623df640e0370d267dbc841332fe4c97969b01434d0b952b3edd3cbb06e0
|
|
|
openai-whisper-small-cuda-non-quantized
|
361 MB |
sha256:ad915f6060cc520ce9d0b18e8fba16b482278428ebd86fcb8e73275a47ab4927
|
|
|
openai-whisper-small-cuda-quantized-int4-tile-packed
|
172 MB |
sha256:f990eaf70ddfbfccd2185023c6fe84498a854e0e6aa00296f76cb748b6ffcca8
|
|
|
openai-whisper-small-cuda-quantized-int4-weight-only
|
270 MB |
sha256:20ceda463e0e8bc12ca07ab30e77f00dce8a29d019ac8d6884c1740065180d73
|
|