Custom Triton kernel registration #2927
cuda.yml
on: pull_request
Matrix: export-model-cuda-artifact
Matrix: test-cuda-builds
Matrix: test-models-cuda
Matrix: benchmark-model-cuda
Matrix: test-model-cuda-e2e
check-all-cuda-builds
3s
Annotations
21 errors and 1 warning
Artifacts
Produced during runtime
| Name | Size | Digest | |
|---|---|---|---|
|
google-gemma-3-4b-it-cuda-non-quantized
|
7.22 GB |
sha256:59dcb89cb66b38d5b14f73afd06afb135593eabbb1f3a053ff0d4aa99ca5e0cc
|
|
|
google-gemma-3-4b-it-cuda-quantized-int4-tile-packed
|
4.03 GB |
sha256:b7e125593b412789d2b1f81a20c0456aff5ea31c81217072228ccf386d4360c7
|
|
|
mistralai-Voxtral-Mini-3B-2507-cuda-non-quantized
|
6.82 GB |
sha256:9794e6021ad3ff6ba2990eb0d9dd5b505dc1e7628aca760bfd7c22ec9e3b50b1
|
|
|
mistralai-Voxtral-Mini-3B-2507-cuda-quantized-int4-tile-packed
|
2.89 GB |
sha256:495c8ef817cf33c86367bc94fb7936b469b46c0b89f05531e8586abe32e800f0
|
|
|
mistralai-Voxtral-Mini-3B-2507-cuda-quantized-int4-weight-only
|
6.14 GB |
sha256:8130ac2800b2ef513e75acd72af70fc0c269382ee96c70bc70d33e7b78e812d4
|
|
|
openai-whisper-large-v3-turbo-cuda-non-quantized
|
1.17 GB |
sha256:cd86fb98b528d6a737b3e61075cad3d207a429e4944e6a08a510617aff520b9b
|
|
|
openai-whisper-large-v3-turbo-cuda-quantized-int4-tile-packed
|
490 MB |
sha256:01259bbfc60b8ce94610026994c668eacd54825666a3d088e202636b82dfe5ab
|
|
|
openai-whisper-large-v3-turbo-cuda-quantized-int4-weight-only
|
484 MB |
sha256:4ba51691c78364235a19a03833591e63c10aeb05d046bda419131a7f7d37eeb5
|
|
|
openai-whisper-small-cuda-non-quantized
|
361 MB |
sha256:14ddd38a216faa355f18de0494cfa491dc2219ed223358d0d6ae5b90ea869290
|
|
|
openai-whisper-small-cuda-quantized-int4-tile-packed
|
172 MB |
sha256:dfed81828943aea4080e029e64b2d7081b7a4fba4a389df600cc3de8f1fa0a94
|
|
|
openai-whisper-small-cuda-quantized-int4-weight-only
|
270 MB |
sha256:bf213aa7d111eaa08581d102652a57d35a064dc7b13bce873e85b783fee852ec
|
|