Remove type dispatch for quantized_conv1d ops #10886
cuda.yml
on: pull_request
Matrix: export-model-cuda-artifact
Matrix: test-cuda-builds
unittest-cuda / linux-job (28m 33s)
Matrix: test-models-cuda
Annotations
1 error
test-model-cuda-e2e (mistralai, Voxtral-Mini-4B-Realtime-2602, quantized-int4-tile-packed) / linux-job: Process completed with exit code 1.
Artifacts
Produced during runtime
| Name | Size | Digest | |
|---|---|---|---|
| Qwen-Qwen3-0.6B-cuda-non-quantized | 1.1 GB | sha256:33ebc2435769c765c6326751d1ccfaa9a68dd9ab5488f3a58dc3345934d28916 | |
| Qwen-Qwen3-0.6B-cuda-quantized-int4-tile-packed | 559 MB | sha256:81b6c91d1080f5c47e87ac33a12b61dc15e4fa260225822eda43f9f10c67d631 | |
| Qwen-Qwen3-0.6B-cuda-quantized-int4-weight-only | 1.1 GB | sha256:30fe12b066c95d5ccce132bf2ba22004c034988e2599dd280c810070aaa29cf0 | |
| google-gemma-3-4b-it-cuda-non-quantized | 7.22 GB | sha256:db70f7b8edcf0a4d5aee7235e020b1b7ccb86c98648d72ab5a4bfd43f002485c | |
| google-gemma-3-4b-it-cuda-quantized-int4-tile-packed | 3.36 GB | sha256:b7b7736779bb7c68b505bd853974283142503df1912714585414f817c793b02f | |
| mistralai-Voxtral-Mini-3B-2507-cuda-non-quantized | 6.82 GB | sha256:a064b19195eb2fd30e052ee1db7e9037c6072984bac3cebb95d6ecac3dc93193 | |
| mistralai-Voxtral-Mini-3B-2507-cuda-quantized-int4-tile-packed | 2.8 GB | sha256:d1b577ff9d6081a12b046cdf2a48129eba45d367fcf088dc61635d396c0da711 | |
| mistralai-Voxtral-Mini-3B-2507-cuda-quantized-int4-weight-only | 6.14 GB | sha256:35074f761434fcadab19e5e8677de5b2c6e767c2ef874aefd1dfea229ffebff7 | |
| mistralai-Voxtral-Mini-4B-Realtime-2602-cuda-quantized-int4-tile-packed | 15.5 GB | sha256:cb623044d4a36e2260a6a78821e88210981b1de43364e8ec072c1f7967427cd5 | |
| nvidia-diar_streaming_sortformer_4spk-v2-cuda-non-quantized | 436 MB | sha256:391995cac76c2a26ff74c2b09179aca469aca652c710c4584c920496b02f41fc | |
| nvidia-parakeet-tdt-cuda-non-quantized | 952 MB | sha256:c8a3caad8026fff2271d1be8dded34aed542e9606f3d023409f2fd4aa8479faa | |
| nvidia-parakeet-tdt-cuda-quantized-int4-tile-packed | 443 MB | sha256:cf5f11104da983e02c157bb1d9460efb8c04892f132b91b579020197da14d5a5 | |
| nvidia-parakeet-tdt-cuda-quantized-int4-weight-only | 430 MB | sha256:d9ede62ce8499d85336d109af94ce04669827fe398d6a051b5b3bc6f5e828d07 | |
| openai-whisper-large-v3-turbo-cuda-non-quantized | 1.18 GB | sha256:aff11b09e1b5ecc61e17fc10fc91225dee395ac89e0174c8e1440d27de4aa056 | |
| openai-whisper-large-v3-turbo-cuda-quantized-int4-tile-packed | 491 MB | sha256:a1c40fb1c6155b29b1c96d135787a70fb9fa0655f10403d9abeb3f9ebf947698 | |
| openai-whisper-large-v3-turbo-cuda-quantized-int4-weight-only | 485 MB | sha256:be719c0aa16b64e3913777cd54fb7d7018dff4f98b4056cfb823fef98b5d2531 | |
| openai-whisper-small-cuda-non-quantized | 361 MB | sha256:d26605eab70efa47a423c587aff870ccf8a125f9a007d6ee61955238e13047c5 | |
| openai-whisper-small-cuda-quantized-int4-tile-packed | 172 MB | sha256:54e83d3996f406dad27f5eaaad69a27354c3c5f6ef2596221d3daf9538dc2042 | |
| openai-whisper-small-cuda-quantized-int4-weight-only | 271 MB | sha256:9696fc8cad4291cfb4fe40f6e8fbb37a99d819697209f864e64d50d7e305a49b | |