Arm backend: Fix broken index_tensor tests (#16220) #4563
cuda.yml
on: push
Matrix: export-model-cuda-artifact
Matrix: test-cuda-builds
Matrix: test-models-cuda
Matrix: test-model-cuda-e2e
check-all-cuda-builds
3s
Artifacts
Produced during runtime
| Name | Size | Digest | |
|---|---|---|---|
| google-gemma-3-4b-it-cuda-non-quantized | 7.22 GB | sha256:4724316fce35e5cf08b0bb532705c9cf6c931134148e07d0158d5b6d05d7bb17 | |
| google-gemma-3-4b-it-cuda-quantized-int4-tile-packed | 3.36 GB | sha256:16034821f371962c4d50affd201bc29cb5f168bf6a4e017ab211eafd3735edec | |
| mistralai-Voxtral-Mini-3B-2507-cuda-non-quantized | 6.82 GB | sha256:a552c42613237230a5539d09c05092ec965ee6a216508bf700b60f90128c7d3a | |
| mistralai-Voxtral-Mini-3B-2507-cuda-quantized-int4-tile-packed | 2.89 GB | sha256:2dd38158518d6e4eadfd36a59565805d69703cd3d935c4a12445a0e8ef6d4c5c | |
| mistralai-Voxtral-Mini-3B-2507-cuda-quantized-int4-weight-only | 6.14 GB | sha256:e5a7c90d88c99eebb4243a3c3343eca6a32fce0b71641d4ef48b2d9ae93749b4 | |
| openai-whisper-large-v3-turbo-cuda-non-quantized | 1.18 GB | sha256:be5a6678275040d5b1db2e9e13aef959c68459317da8b7c6f141a356e9541171 | |
| openai-whisper-large-v3-turbo-cuda-quantized-int4-tile-packed | 491 MB | sha256:45bbe503131fe051cb480dd39bae67860b663f9d8aac6b8e4786a0eea2a53e2e | |
| openai-whisper-large-v3-turbo-cuda-quantized-int4-weight-only | 485 MB | sha256:822e1e90b4e212c917c1149a82c8c5aa5c64755dd0b60458d71bed0647f896c5 | |
| openai-whisper-small-cuda-non-quantized | 361 MB | sha256:dd8385d4e98d68e453ebdb825b5cb1728b1c868e15422857a322c22a50f62548 | |
| openai-whisper-small-cuda-quantized-int4-tile-packed | 172 MB | sha256:a51436815a4627bfaa4254e7319b19b7164141c9a791fb98d2810794e02bddfb | |
| openai-whisper-small-cuda-quantized-int4-weight-only | 270 MB | sha256:ccf595b6bd7697b7c22a7692f077200e81a2f10c0c3f514b4bb6e91697e6a3b4 | |