Arm backend: Update vgf model tests (#16199) #4572
cuda.yml
on: push
Matrix: export-model-cuda-artifact
Matrix: test-cuda-builds
Matrix: test-models-cuda
Matrix: test-model-cuda-e2e
check-all-cuda-builds
3s
Artifacts
Produced during runtime
| Name | Size | Digest | |
|---|---|---|---|
|
google-gemma-3-4b-it-cuda-non-quantized
|
7.22 GB |
sha256:5f2701699b9303922fb06751a637c142faa28957b314f7f1be62031ed890689e
|
|
|
google-gemma-3-4b-it-cuda-quantized-int4-tile-packed
|
3.36 GB |
sha256:74cc939a57539f686eb6a8a3db2f44e3e2e50934414a4411b978e2ceb4783cde
|
|
|
mistralai-Voxtral-Mini-3B-2507-cuda-non-quantized
|
6.82 GB |
sha256:c7669b0981c81a95b542897bd66986506624dba014eab2611ea7549f9295dcec
|
|
|
mistralai-Voxtral-Mini-3B-2507-cuda-quantized-int4-tile-packed
|
2.89 GB |
sha256:ec35bdeabe0a0b33b585b9ae038fcc5732f6ed594fe197c496721a3972242b78
|
|
|
mistralai-Voxtral-Mini-3B-2507-cuda-quantized-int4-weight-only
|
6.14 GB |
sha256:ad0da5e5a41b544db7e240f421b5fddc6203fcc53eee30bc306985af7bc17b3c
|
|
|
openai-whisper-large-v3-turbo-cuda-non-quantized
|
1.18 GB |
sha256:dab18ca7ccbbfb41fc665dc5eac496525c232a41194d9cdff6966d2c2b1850b4
|
|
|
openai-whisper-large-v3-turbo-cuda-quantized-int4-tile-packed
|
491 MB |
sha256:149c36adea5cc2f29522d479f8827725dc6a28ef2970f0b8676bf28437875bc9
|
|
|
openai-whisper-large-v3-turbo-cuda-quantized-int4-weight-only
|
485 MB |
sha256:7799d63f6221519cd55c2e6cd618ae54a3de05c0ffe1f09c85e917b774437939
|
|
|
openai-whisper-small-cuda-non-quantized
|
361 MB |
sha256:1d9c4d17617e81cb4c15aa78034bf3975f7f4f08793d8d50c2cf6a061540b7b9
|
|
|
openai-whisper-small-cuda-quantized-int4-tile-packed
|
172 MB |
sha256:87117181e59344c68267f25e88c493c8b3902ca4db161267462ce868cec194b4
|
|
|
openai-whisper-small-cuda-quantized-int4-weight-only
|
270 MB |
sha256:cc3f22d20e42922f2b62a44222e86423adaaa1d90760617b7be03ad45e484929
|
|