[ET-VK] Add fused q8ta_relu unary operator for int8x4 tensors #9365
cuda.yml
on: pull_request
Matrix: export-model-cuda-artifact
Matrix: test-cuda-builds
unittest-cuda
/
linux-job
24m 56s
Matrix: test-models-cuda
Artifacts
Produced during runtime
| Name | Size | Digest | |
|---|---|---|---|
|
google-gemma-3-4b-it-cuda-non-quantized
Expired
|
7.22 GB |
sha256:57576226a133cd58f0975cefd6d08c91d8d4075fa0a6892b05f0cdfa3a373766
|
|
|
google-gemma-3-4b-it-cuda-quantized-int4-tile-packed
Expired
|
3.36 GB |
sha256:c8c15f1a4481edf3af0d4c5a87ab684c0e961adbccaf0cac19bb9265abfcb563
|
|
|
mistralai-Voxtral-Mini-3B-2507-cuda-non-quantized
Expired
|
6.82 GB |
sha256:91a9adc44f9f30170dc0d59c474b9ddb0510570111c12d37b79cad3b2340c84c
|
|
|
mistralai-Voxtral-Mini-3B-2507-cuda-quantized-int4-tile-packed
Expired
|
2.8 GB |
sha256:86da211fa2cd025fe703aa1dd302541c2bb149994de613c644c29e8951313e99
|
|
|
mistralai-Voxtral-Mini-3B-2507-cuda-quantized-int4-weight-only
Expired
|
6.14 GB |
sha256:01d7a21f3692f88b609866d292ca12439847c97673178c27ed7634f50b15280e
|
|
|
nvidia-parakeet-tdt-cuda-non-quantized
Expired
|
952 MB |
sha256:86fd8f3ab36957e2c971016fb081fe659fd0bdc5b9f01c566ac3fdf41beabb18
|
|
|
nvidia-parakeet-tdt-cuda-quantized-int4-tile-packed
Expired
|
443 MB |
sha256:56b3d77c6189ec07ec1dd3379507f6e18c54389a1c162a72fd4a16f7b9a61aec
|
|
|
nvidia-parakeet-tdt-cuda-quantized-int4-weight-only
Expired
|
430 MB |
sha256:81157e1690a81841beb601abfd72c40ce0b0522ce65fc4040249059bd96141ef
|
|
|
openai-whisper-large-v3-turbo-cuda-non-quantized
Expired
|
1.18 GB |
sha256:7249e12e5a1e59fb7da6aedfb0934dae3b0c2131c00098f2a1ee1c9024b37e69
|
|
|
openai-whisper-large-v3-turbo-cuda-quantized-int4-tile-packed
Expired
|
491 MB |
sha256:644037872e9476f0c6c74ba69d80f50a29174e5ebb4049ff768689ce1255bb71
|
|
|
openai-whisper-large-v3-turbo-cuda-quantized-int4-weight-only
Expired
|
485 MB |
sha256:a97f87496f1a383a9e69d76d90f3933b87229d88343f0bee2de137f6efe13756
|
|
|
openai-whisper-small-cuda-non-quantized
Expired
|
361 MB |
sha256:6d07f5859b6d8774622e33e8afe4edb3b04b8401fa980a30e5cba2b4445fa785
|
|
|
openai-whisper-small-cuda-quantized-int4-tile-packed
Expired
|
172 MB |
sha256:24ca86002c0fc8b2b6ceefab37b105c6e81c3e2261f34b736d0be9ab0e2cccb9
|
|
|
openai-whisper-small-cuda-quantized-int4-weight-only
Expired
|
271 MB |
sha256:e611d309a88e68f67203d3c6c4b8ecc544f2aea1411c4f4da8abf0c882ee2e4b
|
|