v0.34.0
Browse files
See https://github.com/quic/ai-hub-models/releases/v0.34.0 for changelog.
- README.md +54 -64
- VIT_w8a16.dlc +1 -1
- VIT_w8a8.dlc +1 -1
- precompiled/qualcomm-qcs6490-proxy/sdk_versions.yml +3 -0
- precompiled/qualcomm-snapdragon-x-elite/VIT.bin +1 -1
- precompiled/qualcomm-snapdragon-x-elite/VIT.onnx.zip +1 -1
- precompiled/qualcomm-snapdragon-x-elite/VIT_w8a16.onnx.zip +1 -1
- precompiled/qualcomm-snapdragon-x-elite/VIT_w8a8.onnx.zip +2 -2
- precompiled/qualcomm-snapdragon-x-elite/sdk_versions.yml +5 -0
README.md
CHANGED
@@ -24,6 +24,7 @@ More details on model performance across various devices, can be found
|
|
24 |
[here](https://aihub.qualcomm.com/models/vit).
|
25 |
|
26 |
|
|
|
27 |
### Model Details
|
28 |
|
29 |
- **Model Type:** Model_use_case.image_classification
|
@@ -37,83 +38,82 @@ More details on model performance across various devices, can be found
|
|
37 |
|
38 |
| Model | Precision | Device | Chipset | Target Runtime | Inference Time (ms) | Peak Memory Range (MB) | Primary Compute Unit | Target Model |
|
39 |
|---|---|---|---|---|---|---|---|---|
|
40 |
-
| VIT | float | QCS8275 (Proxy) | Qualcomm® QCS8275 (Proxy) | TFLITE | 43.
|
41 |
| VIT | float | QCS8275 (Proxy) | Qualcomm® QCS8275 (Proxy) | QNN_DLC | 45.176 ms | 0 - 324 MB | NPU | [VIT.dlc](https://huggingface.co/qualcomm/VIT/blob/main/VIT.dlc) |
|
42 |
-
| VIT | float | QCS8450 (Proxy) | Qualcomm® QCS8450 (Proxy) | TFLITE | 17.
|
43 |
| VIT | float | QCS8450 (Proxy) | Qualcomm® QCS8450 (Proxy) | QNN_DLC | 21.31 ms | 0 - 316 MB | NPU | [VIT.dlc](https://huggingface.co/qualcomm/VIT/blob/main/VIT.dlc) |
|
44 |
-
| VIT | float | QCS8550 (Proxy) | Qualcomm® QCS8550 (Proxy) | TFLITE | 12.
|
45 |
| VIT | float | QCS8550 (Proxy) | Qualcomm® QCS8550 (Proxy) | QNN_DLC | 13.809 ms | 0 - 32 MB | NPU | [VIT.dlc](https://huggingface.co/qualcomm/VIT/blob/main/VIT.dlc) |
|
46 |
-
| VIT | float | QCS9075 (Proxy) | Qualcomm® QCS9075 (Proxy) | TFLITE | 16.
|
47 |
| VIT | float | QCS9075 (Proxy) | Qualcomm® QCS9075 (Proxy) | QNN_DLC | 16.876 ms | 1 - 324 MB | NPU | [VIT.dlc](https://huggingface.co/qualcomm/VIT/blob/main/VIT.dlc) |
|
48 |
-
| VIT | float | SA7255P ADP | Qualcomm® SA7255P | TFLITE | 43.
|
49 |
| VIT | float | SA7255P ADP | Qualcomm® SA7255P | QNN_DLC | 45.176 ms | 0 - 324 MB | NPU | [VIT.dlc](https://huggingface.co/qualcomm/VIT/blob/main/VIT.dlc) |
|
50 |
-
| VIT | float | SA8255 (Proxy) | Qualcomm® SA8255P (Proxy) | TFLITE |
|
51 |
| VIT | float | SA8255 (Proxy) | Qualcomm® SA8255P (Proxy) | QNN_DLC | 13.828 ms | 0 - 31 MB | NPU | [VIT.dlc](https://huggingface.co/qualcomm/VIT/blob/main/VIT.dlc) |
|
52 |
-
| VIT | float | SA8295P ADP | Qualcomm® SA8295P | TFLITE | 20.
|
53 |
| VIT | float | SA8295P ADP | Qualcomm® SA8295P | QNN_DLC | 19.819 ms | 1 - 327 MB | NPU | [VIT.dlc](https://huggingface.co/qualcomm/VIT/blob/main/VIT.dlc) |
|
54 |
-
| VIT | float | SA8650 (Proxy) | Qualcomm® SA8650P (Proxy) | TFLITE | 12.
|
55 |
| VIT | float | SA8650 (Proxy) | Qualcomm® SA8650P (Proxy) | QNN_DLC | 13.893 ms | 0 - 30 MB | NPU | [VIT.dlc](https://huggingface.co/qualcomm/VIT/blob/main/VIT.dlc) |
|
56 |
-
| VIT | float | SA8775P ADP | Qualcomm® SA8775P | TFLITE | 16.
|
57 |
| VIT | float | SA8775P ADP | Qualcomm® SA8775P | QNN_DLC | 16.876 ms | 1 - 324 MB | NPU | [VIT.dlc](https://huggingface.co/qualcomm/VIT/blob/main/VIT.dlc) |
|
58 |
-
| VIT | float | Samsung Galaxy S23 | Snapdragon® 8 Gen 2 Mobile | TFLITE |
|
59 |
| VIT | float | Samsung Galaxy S23 | Snapdragon® 8 Gen 2 Mobile | QNN_DLC | 13.859 ms | 0 - 28 MB | NPU | [VIT.dlc](https://huggingface.co/qualcomm/VIT/blob/main/VIT.dlc) |
|
60 |
| VIT | float | Samsung Galaxy S23 | Snapdragon® 8 Gen 2 Mobile | ONNX | 13.522 ms | 1 - 22 MB | NPU | [VIT.onnx](https://huggingface.co/qualcomm/VIT/blob/main/VIT.onnx) |
|
61 |
-
| VIT | float | Samsung Galaxy S24 | Snapdragon® 8 Gen 3 Mobile | TFLITE | 8.
|
62 |
| VIT | float | Samsung Galaxy S24 | Snapdragon® 8 Gen 3 Mobile | QNN_DLC | 9.587 ms | 38 - 370 MB | NPU | [VIT.dlc](https://huggingface.co/qualcomm/VIT/blob/main/VIT.dlc) |
|
63 |
| VIT | float | Samsung Galaxy S24 | Snapdragon® 8 Gen 3 Mobile | ONNX | 9.342 ms | 1 - 336 MB | NPU | [VIT.onnx](https://huggingface.co/qualcomm/VIT/blob/main/VIT.onnx) |
|
64 |
-
| VIT | float | Snapdragon 8 Elite QRD | Snapdragon® 8 Elite Mobile | TFLITE | 8.262 ms | 0 - 319 MB | NPU | [VIT.tflite](https://huggingface.co/qualcomm/VIT/blob/main/VIT.tflite) |
|
65 |
| VIT | float | Snapdragon 8 Elite QRD | Snapdragon® 8 Elite Mobile | QNN_DLC | 8.024 ms | 1 - 314 MB | NPU | [VIT.dlc](https://huggingface.co/qualcomm/VIT/blob/main/VIT.dlc) |
|
66 |
| VIT | float | Snapdragon 8 Elite QRD | Snapdragon® 8 Elite Mobile | ONNX | 7.694 ms | 1 - 320 MB | NPU | [VIT.onnx](https://huggingface.co/qualcomm/VIT/blob/main/VIT.onnx) |
|
67 |
| VIT | float | Snapdragon X Elite CRD | Snapdragon® X Elite | QNN_DLC | 16.174 ms | 1116 - 1116 MB | NPU | [VIT.dlc](https://huggingface.co/qualcomm/VIT/blob/main/VIT.dlc) |
|
68 |
| VIT | float | Snapdragon X Elite CRD | Snapdragon® X Elite | ONNX | 14.917 ms | 171 - 171 MB | NPU | [VIT.onnx](https://huggingface.co/qualcomm/VIT/blob/main/VIT.onnx) |
|
69 |
-
| VIT | w8a16 | QCS8275 (Proxy) | Qualcomm® QCS8275 (Proxy) | QNN_DLC | 64.
|
70 |
-
| VIT | w8a16 | QCS8450 (Proxy) | Qualcomm® QCS8450 (Proxy) | QNN_DLC |
|
71 |
-
| VIT | w8a16 | QCS8550 (Proxy) | Qualcomm® QCS8550 (Proxy) | QNN_DLC | 25.
|
72 |
-
| VIT | w8a16 | QCS9075 (Proxy) | Qualcomm® QCS9075 (Proxy) | QNN_DLC | 22.
|
73 |
-
| VIT | w8a16 | RB3 Gen 2 (Proxy) | Qualcomm® QCS6490 (Proxy) | QNN_DLC |
|
74 |
-
| VIT | w8a16 | SA7255P ADP | Qualcomm® SA7255P | QNN_DLC | 64.
|
75 |
-
| VIT | w8a16 | SA8255 (Proxy) | Qualcomm® SA8255P (Proxy) | QNN_DLC |
|
76 |
-
| VIT | w8a16 | SA8295P ADP | Qualcomm® SA8295P | QNN_DLC | 37.
|
77 |
-
| VIT | w8a16 | SA8650 (Proxy) | Qualcomm® SA8650P (Proxy) | QNN_DLC | 25.
|
78 |
-
| VIT | w8a16 | SA8775P ADP | Qualcomm® SA8775P | QNN_DLC | 22.
|
79 |
-
| VIT | w8a16 | Samsung Galaxy S23 | Snapdragon® 8 Gen 2 Mobile | QNN_DLC |
|
80 |
| VIT | w8a16 | Samsung Galaxy S23 | Snapdragon® 8 Gen 2 Mobile | ONNX | 157.686 ms | 462 - 586 MB | NPU | [VIT.onnx](https://huggingface.co/qualcomm/VIT/blob/main/VIT_w8a16.onnx) |
|
81 |
-
| VIT | w8a16 | Samsung Galaxy S24 | Snapdragon® 8 Gen 3 Mobile | QNN_DLC | 19.
|
82 |
| VIT | w8a16 | Samsung Galaxy S24 | Snapdragon® 8 Gen 3 Mobile | ONNX | 125.213 ms | 621 - 779 MB | NPU | [VIT.onnx](https://huggingface.co/qualcomm/VIT/blob/main/VIT_w8a16.onnx) |
|
83 |
-
| VIT | w8a16 | Snapdragon 8 Elite QRD | Snapdragon® 8 Elite Mobile | QNN_DLC |
|
84 |
| VIT | w8a16 | Snapdragon 8 Elite QRD | Snapdragon® 8 Elite Mobile | ONNX | 106.961 ms | 489 - 619 MB | NPU | [VIT.onnx](https://huggingface.co/qualcomm/VIT/blob/main/VIT_w8a16.onnx) |
|
85 |
-
| VIT | w8a16 | Snapdragon X Elite CRD | Snapdragon® X Elite | QNN_DLC | 27.
|
86 |
| VIT | w8a16 | Snapdragon X Elite CRD | Snapdragon® X Elite | ONNX | 176.132 ms | 923 - 923 MB | NPU | [VIT.onnx](https://huggingface.co/qualcomm/VIT/blob/main/VIT_w8a16.onnx) |
|
87 |
-
| VIT | w8a8 | QCS8275 (Proxy) | Qualcomm® QCS8275 (Proxy) | TFLITE | 24.
|
88 |
-
| VIT | w8a8 | QCS8275 (Proxy) | Qualcomm® QCS8275 (Proxy) | QNN_DLC | 30.
|
89 |
-
| VIT | w8a8 | QCS8450 (Proxy) | Qualcomm® QCS8450 (Proxy) | TFLITE | 12.
|
90 |
-
| VIT | w8a8 | QCS8450 (Proxy) | Qualcomm® QCS8450 (Proxy) | QNN_DLC |
|
91 |
-
| VIT | w8a8 | QCS8550 (Proxy) | Qualcomm® QCS8550 (Proxy) | TFLITE | 12.
|
92 |
-
| VIT | w8a8 | QCS8550 (Proxy) | Qualcomm® QCS8550 (Proxy) | QNN_DLC | 10.
|
93 |
-
| VIT | w8a8 | QCS9075 (Proxy) | Qualcomm® QCS9075 (Proxy) | TFLITE | 12.
|
94 |
-
| VIT | w8a8 | QCS9075 (Proxy) | Qualcomm® QCS9075 (Proxy) | QNN_DLC | 9.
|
95 |
-
| VIT | w8a8 | RB3 Gen 2 (Proxy) | Qualcomm® QCS6490 (Proxy) | TFLITE |
|
96 |
-
| VIT | w8a8 | RB3 Gen 2 (Proxy) | Qualcomm® QCS6490 (Proxy) | QNN_DLC |
|
97 |
-
| VIT | w8a8 | SA7255P ADP | Qualcomm® SA7255P | TFLITE | 24.
|
98 |
-
| VIT | w8a8 | SA7255P ADP | Qualcomm® SA7255P | QNN_DLC | 30.
|
99 |
-
| VIT | w8a8 | SA8255 (Proxy) | Qualcomm® SA8255P (Proxy) | TFLITE | 12.
|
100 |
-
| VIT | w8a8 | SA8255 (Proxy) | Qualcomm® SA8255P (Proxy) | QNN_DLC | 10.
|
101 |
-
| VIT | w8a8 | SA8295P ADP | Qualcomm® SA8295P | TFLITE | 14.
|
102 |
-
| VIT | w8a8 | SA8295P ADP | Qualcomm® SA8295P | QNN_DLC | 16.
|
103 |
-
| VIT | w8a8 | SA8650 (Proxy) | Qualcomm® SA8650P (Proxy) | TFLITE | 12.
|
104 |
-
| VIT | w8a8 | SA8650 (Proxy) | Qualcomm® SA8650P (Proxy) | QNN_DLC | 10.
|
105 |
-
| VIT | w8a8 | SA8775P ADP | Qualcomm® SA8775P | TFLITE | 12.
|
106 |
-
| VIT | w8a8 | SA8775P ADP | Qualcomm® SA8775P | QNN_DLC | 9.
|
107 |
-
| VIT | w8a8 | Samsung Galaxy S23 | Snapdragon® 8 Gen 2 Mobile | TFLITE | 12.
|
108 |
-
| VIT | w8a8 | Samsung Galaxy S23 | Snapdragon® 8 Gen 2 Mobile | QNN_DLC | 10.
|
109 |
| VIT | w8a8 | Samsung Galaxy S23 | Snapdragon® 8 Gen 2 Mobile | ONNX | 156.848 ms | 462 - 577 MB | NPU | [VIT.onnx](https://huggingface.co/qualcomm/VIT/blob/main/VIT_w8a8.onnx) |
|
110 |
-
| VIT | w8a8 | Samsung Galaxy S24 | Snapdragon® 8 Gen 3 Mobile | TFLITE | 8.
|
111 |
-
| VIT | w8a8 | Samsung Galaxy S24 | Snapdragon® 8 Gen 3 Mobile | QNN_DLC |
|
112 |
| VIT | w8a8 | Samsung Galaxy S24 | Snapdragon® 8 Gen 3 Mobile | ONNX | 127.23 ms | 487 - 644 MB | NPU | [VIT.onnx](https://huggingface.co/qualcomm/VIT/blob/main/VIT_w8a8.onnx) |
|
113 |
-
| VIT | w8a8 | Snapdragon 8 Elite QRD | Snapdragon® 8 Elite Mobile | TFLITE | 7.
|
114 |
-
| VIT | w8a8 | Snapdragon 8 Elite QRD | Snapdragon® 8 Elite Mobile | QNN_DLC | 6.
|
115 |
| VIT | w8a8 | Snapdragon 8 Elite QRD | Snapdragon® 8 Elite Mobile | ONNX | 103.704 ms | 495 - 618 MB | NPU | [VIT.onnx](https://huggingface.co/qualcomm/VIT/blob/main/VIT_w8a8.onnx) |
|
116 |
-
| VIT | w8a8 | Snapdragon X Elite CRD | Snapdragon® X Elite | QNN_DLC | 11.
|
117 |
| VIT | w8a8 | Snapdragon X Elite CRD | Snapdragon® X Elite | ONNX | 180.062 ms | 924 - 924 MB | NPU | [VIT.onnx](https://huggingface.co/qualcomm/VIT/blob/main/VIT_w8a8.onnx) |
|
118 |
|
119 |
|
@@ -172,17 +172,7 @@ device. This script does the following:
|
|
172 |
```bash
|
173 |
python -m qai_hub_models.models.vit.export
|
174 |
```
|
175 |
-
|
176 |
-
Profiling Results
|
177 |
-
------------------------------------------------------------
|
178 |
-
VIT
|
179 |
-
Device : cs_8275 (ANDROID 14)
|
180 |
-
Runtime : TFLITE
|
181 |
-
Estimated inference time (ms) : 43.9
|
182 |
-
Estimated peak memory usage (MB): [0, 315]
|
183 |
-
Total # Ops : 1579
|
184 |
-
Compute Unit(s) : npu (1579 ops) gpu (0 ops) cpu (0 ops)
|
185 |
-
```
|
186 |
|
187 |
|
188 |
## How does this work?
|
|
|
24 |
[here](https://aihub.qualcomm.com/models/vit).
|
25 |
|
26 |
|
27 |
+
|
28 |
### Model Details
|
29 |
|
30 |
- **Model Type:** Model_use_case.image_classification
|
|
|
38 |
|
39 |
| Model | Precision | Device | Chipset | Target Runtime | Inference Time (ms) | Peak Memory Range (MB) | Primary Compute Unit | Target Model |
|
40 |
|---|---|---|---|---|---|---|---|---|
|
41 |
+
| VIT | float | QCS8275 (Proxy) | Qualcomm® QCS8275 (Proxy) | TFLITE | 43.869 ms | 7 - 322 MB | NPU | [VIT.tflite](https://huggingface.co/qualcomm/VIT/blob/main/VIT.tflite) |
|
42 |
| VIT | float | QCS8275 (Proxy) | Qualcomm® QCS8275 (Proxy) | QNN_DLC | 45.176 ms | 0 - 324 MB | NPU | [VIT.dlc](https://huggingface.co/qualcomm/VIT/blob/main/VIT.dlc) |
|
43 |
+
| VIT | float | QCS8450 (Proxy) | Qualcomm® QCS8450 (Proxy) | TFLITE | 17.952 ms | 0 - 317 MB | NPU | [VIT.tflite](https://huggingface.co/qualcomm/VIT/blob/main/VIT.tflite) |
|
44 |
| VIT | float | QCS8450 (Proxy) | Qualcomm® QCS8450 (Proxy) | QNN_DLC | 21.31 ms | 0 - 316 MB | NPU | [VIT.dlc](https://huggingface.co/qualcomm/VIT/blob/main/VIT.dlc) |
|
45 |
+
| VIT | float | QCS8550 (Proxy) | Qualcomm® QCS8550 (Proxy) | TFLITE | 12.713 ms | 0 - 29 MB | NPU | [VIT.tflite](https://huggingface.co/qualcomm/VIT/blob/main/VIT.tflite) |
|
46 |
| VIT | float | QCS8550 (Proxy) | Qualcomm® QCS8550 (Proxy) | QNN_DLC | 13.809 ms | 0 - 32 MB | NPU | [VIT.dlc](https://huggingface.co/qualcomm/VIT/blob/main/VIT.dlc) |
|
47 |
+
| VIT | float | QCS9075 (Proxy) | Qualcomm® QCS9075 (Proxy) | TFLITE | 16.053 ms | 0 - 315 MB | NPU | [VIT.tflite](https://huggingface.co/qualcomm/VIT/blob/main/VIT.tflite) |
|
48 |
| VIT | float | QCS9075 (Proxy) | Qualcomm® QCS9075 (Proxy) | QNN_DLC | 16.876 ms | 1 - 324 MB | NPU | [VIT.dlc](https://huggingface.co/qualcomm/VIT/blob/main/VIT.dlc) |
|
49 |
+
| VIT | float | SA7255P ADP | Qualcomm® SA7255P | TFLITE | 43.869 ms | 7 - 322 MB | NPU | [VIT.tflite](https://huggingface.co/qualcomm/VIT/blob/main/VIT.tflite) |
|
50 |
| VIT | float | SA7255P ADP | Qualcomm® SA7255P | QNN_DLC | 45.176 ms | 0 - 324 MB | NPU | [VIT.dlc](https://huggingface.co/qualcomm/VIT/blob/main/VIT.dlc) |
|
51 |
+
| VIT | float | SA8255 (Proxy) | Qualcomm® SA8255P (Proxy) | TFLITE | 12.704 ms | 0 - 25 MB | NPU | [VIT.tflite](https://huggingface.co/qualcomm/VIT/blob/main/VIT.tflite) |
|
52 |
| VIT | float | SA8255 (Proxy) | Qualcomm® SA8255P (Proxy) | QNN_DLC | 13.828 ms | 0 - 31 MB | NPU | [VIT.dlc](https://huggingface.co/qualcomm/VIT/blob/main/VIT.dlc) |
|
53 |
+
| VIT | float | SA8295P ADP | Qualcomm® SA8295P | TFLITE | 20.083 ms | 0 - 307 MB | NPU | [VIT.tflite](https://huggingface.co/qualcomm/VIT/blob/main/VIT.tflite) |
|
54 |
| VIT | float | SA8295P ADP | Qualcomm® SA8295P | QNN_DLC | 19.819 ms | 1 - 327 MB | NPU | [VIT.dlc](https://huggingface.co/qualcomm/VIT/blob/main/VIT.dlc) |
|
55 |
+
| VIT | float | SA8650 (Proxy) | Qualcomm® SA8650P (Proxy) | TFLITE | 12.698 ms | 0 - 28 MB | NPU | [VIT.tflite](https://huggingface.co/qualcomm/VIT/blob/main/VIT.tflite) |
|
56 |
| VIT | float | SA8650 (Proxy) | Qualcomm® SA8650P (Proxy) | QNN_DLC | 13.893 ms | 0 - 30 MB | NPU | [VIT.dlc](https://huggingface.co/qualcomm/VIT/blob/main/VIT.dlc) |
|
57 |
+
| VIT | float | SA8775P ADP | Qualcomm® SA8775P | TFLITE | 16.053 ms | 0 - 315 MB | NPU | [VIT.tflite](https://huggingface.co/qualcomm/VIT/blob/main/VIT.tflite) |
|
58 |
| VIT | float | SA8775P ADP | Qualcomm® SA8775P | QNN_DLC | 16.876 ms | 1 - 324 MB | NPU | [VIT.dlc](https://huggingface.co/qualcomm/VIT/blob/main/VIT.dlc) |
|
59 |
+
| VIT | float | Samsung Galaxy S23 | Snapdragon® 8 Gen 2 Mobile | TFLITE | 13.128 ms | 0 - 15 MB | NPU | [VIT.tflite](https://huggingface.co/qualcomm/VIT/blob/main/VIT.tflite) |
|
60 |
| VIT | float | Samsung Galaxy S23 | Snapdragon® 8 Gen 2 Mobile | QNN_DLC | 13.859 ms | 0 - 28 MB | NPU | [VIT.dlc](https://huggingface.co/qualcomm/VIT/blob/main/VIT.dlc) |
|
61 |
| VIT | float | Samsung Galaxy S23 | Snapdragon® 8 Gen 2 Mobile | ONNX | 13.522 ms | 1 - 22 MB | NPU | [VIT.onnx](https://huggingface.co/qualcomm/VIT/blob/main/VIT.onnx) |
|
62 |
+
| VIT | float | Samsung Galaxy S24 | Snapdragon® 8 Gen 3 Mobile | TFLITE | 8.998 ms | 0 - 322 MB | NPU | [VIT.tflite](https://huggingface.co/qualcomm/VIT/blob/main/VIT.tflite) |
|
63 |
| VIT | float | Samsung Galaxy S24 | Snapdragon® 8 Gen 3 Mobile | QNN_DLC | 9.587 ms | 38 - 370 MB | NPU | [VIT.dlc](https://huggingface.co/qualcomm/VIT/blob/main/VIT.dlc) |
|
64 |
| VIT | float | Samsung Galaxy S24 | Snapdragon® 8 Gen 3 Mobile | ONNX | 9.342 ms | 1 - 336 MB | NPU | [VIT.onnx](https://huggingface.co/qualcomm/VIT/blob/main/VIT.onnx) |
|
|
|
65 |
| VIT | float | Snapdragon 8 Elite QRD | Snapdragon® 8 Elite Mobile | QNN_DLC | 8.024 ms | 1 - 314 MB | NPU | [VIT.dlc](https://huggingface.co/qualcomm/VIT/blob/main/VIT.dlc) |
|
66 |
| VIT | float | Snapdragon 8 Elite QRD | Snapdragon® 8 Elite Mobile | ONNX | 7.694 ms | 1 - 320 MB | NPU | [VIT.onnx](https://huggingface.co/qualcomm/VIT/blob/main/VIT.onnx) |
|
67 |
| VIT | float | Snapdragon X Elite CRD | Snapdragon® X Elite | QNN_DLC | 16.174 ms | 1116 - 1116 MB | NPU | [VIT.dlc](https://huggingface.co/qualcomm/VIT/blob/main/VIT.dlc) |
|
68 |
| VIT | float | Snapdragon X Elite CRD | Snapdragon® X Elite | ONNX | 14.917 ms | 171 - 171 MB | NPU | [VIT.onnx](https://huggingface.co/qualcomm/VIT/blob/main/VIT.onnx) |
|
69 |
+
| VIT | w8a16 | QCS8275 (Proxy) | Qualcomm® QCS8275 (Proxy) | QNN_DLC | 64.929 ms | 0 - 190 MB | NPU | [VIT.dlc](https://huggingface.co/qualcomm/VIT/blob/main/VIT_w8a16.dlc) |
|
70 |
+
| VIT | w8a16 | QCS8450 (Proxy) | Qualcomm® QCS8450 (Proxy) | QNN_DLC | 54.816 ms | 0 - 209 MB | NPU | [VIT.dlc](https://huggingface.co/qualcomm/VIT/blob/main/VIT_w8a16.dlc) |
|
71 |
+
| VIT | w8a16 | QCS8550 (Proxy) | Qualcomm® QCS8550 (Proxy) | QNN_DLC | 25.79 ms | 0 - 47 MB | NPU | [VIT.dlc](https://huggingface.co/qualcomm/VIT/blob/main/VIT_w8a16.dlc) |
|
72 |
+
| VIT | w8a16 | QCS9075 (Proxy) | Qualcomm® QCS9075 (Proxy) | QNN_DLC | 22.672 ms | 0 - 189 MB | NPU | [VIT.dlc](https://huggingface.co/qualcomm/VIT/blob/main/VIT_w8a16.dlc) |
|
73 |
+
| VIT | w8a16 | RB3 Gen 2 (Proxy) | Qualcomm® QCS6490 (Proxy) | QNN_DLC | 201.193 ms | 0 - 1673 MB | NPU | [VIT.dlc](https://huggingface.co/qualcomm/VIT/blob/main/VIT_w8a16.dlc) |
|
74 |
+
| VIT | w8a16 | SA7255P ADP | Qualcomm® SA7255P | QNN_DLC | 64.929 ms | 0 - 190 MB | NPU | [VIT.dlc](https://huggingface.co/qualcomm/VIT/blob/main/VIT_w8a16.dlc) |
|
75 |
+
| VIT | w8a16 | SA8255 (Proxy) | Qualcomm® SA8255P (Proxy) | QNN_DLC | 25.947 ms | 0 - 47 MB | NPU | [VIT.dlc](https://huggingface.co/qualcomm/VIT/blob/main/VIT_w8a16.dlc) |
|
76 |
+
| VIT | w8a16 | SA8295P ADP | Qualcomm® SA8295P | QNN_DLC | 37.114 ms | 0 - 212 MB | NPU | [VIT.dlc](https://huggingface.co/qualcomm/VIT/blob/main/VIT_w8a16.dlc) |
|
77 |
+
| VIT | w8a16 | SA8650 (Proxy) | Qualcomm® SA8650P (Proxy) | QNN_DLC | 25.936 ms | 0 - 47 MB | NPU | [VIT.dlc](https://huggingface.co/qualcomm/VIT/blob/main/VIT_w8a16.dlc) |
|
78 |
+
| VIT | w8a16 | SA8775P ADP | Qualcomm® SA8775P | QNN_DLC | 22.672 ms | 0 - 189 MB | NPU | [VIT.dlc](https://huggingface.co/qualcomm/VIT/blob/main/VIT_w8a16.dlc) |
|
79 |
+
| VIT | w8a16 | Samsung Galaxy S23 | Snapdragon® 8 Gen 2 Mobile | QNN_DLC | 25.826 ms | 0 - 47 MB | NPU | [VIT.dlc](https://huggingface.co/qualcomm/VIT/blob/main/VIT_w8a16.dlc) |
|
80 |
| VIT | w8a16 | Samsung Galaxy S23 | Snapdragon® 8 Gen 2 Mobile | ONNX | 157.686 ms | 462 - 586 MB | NPU | [VIT.onnx](https://huggingface.co/qualcomm/VIT/blob/main/VIT_w8a16.onnx) |
|
81 |
+
| VIT | w8a16 | Samsung Galaxy S24 | Snapdragon® 8 Gen 3 Mobile | QNN_DLC | 19.399 ms | 0 - 199 MB | NPU | [VIT.dlc](https://huggingface.co/qualcomm/VIT/blob/main/VIT_w8a16.dlc) |
|
82 |
| VIT | w8a16 | Samsung Galaxy S24 | Snapdragon® 8 Gen 3 Mobile | ONNX | 125.213 ms | 621 - 779 MB | NPU | [VIT.onnx](https://huggingface.co/qualcomm/VIT/blob/main/VIT_w8a16.onnx) |
|
83 |
+
| VIT | w8a16 | Snapdragon 8 Elite QRD | Snapdragon® 8 Elite Mobile | QNN_DLC | 16.166 ms | 0 - 187 MB | NPU | [VIT.dlc](https://huggingface.co/qualcomm/VIT/blob/main/VIT_w8a16.dlc) |
|
84 |
| VIT | w8a16 | Snapdragon 8 Elite QRD | Snapdragon® 8 Elite Mobile | ONNX | 106.961 ms | 489 - 619 MB | NPU | [VIT.onnx](https://huggingface.co/qualcomm/VIT/blob/main/VIT_w8a16.onnx) |
|
85 |
+
| VIT | w8a16 | Snapdragon X Elite CRD | Snapdragon® X Elite | QNN_DLC | 27.135 ms | 337 - 337 MB | NPU | [VIT.dlc](https://huggingface.co/qualcomm/VIT/blob/main/VIT_w8a16.dlc) |
|
86 |
| VIT | w8a16 | Snapdragon X Elite CRD | Snapdragon® X Elite | ONNX | 176.132 ms | 923 - 923 MB | NPU | [VIT.onnx](https://huggingface.co/qualcomm/VIT/blob/main/VIT_w8a16.onnx) |
|
87 |
+
| VIT | w8a8 | QCS8275 (Proxy) | Qualcomm® QCS8275 (Proxy) | TFLITE | 24.338 ms | 0 - 49 MB | NPU | [VIT.tflite](https://huggingface.co/qualcomm/VIT/blob/main/VIT_w8a8.tflite) |
|
88 |
+
| VIT | w8a8 | QCS8275 (Proxy) | Qualcomm® QCS8275 (Proxy) | QNN_DLC | 30.29 ms | 0 - 164 MB | NPU | [VIT.dlc](https://huggingface.co/qualcomm/VIT/blob/main/VIT_w8a8.dlc) |
|
89 |
+
| VIT | w8a8 | QCS8450 (Proxy) | Qualcomm® QCS8450 (Proxy) | TFLITE | 12.745 ms | 0 - 58 MB | NPU | [VIT.tflite](https://huggingface.co/qualcomm/VIT/blob/main/VIT_w8a8.tflite) |
|
90 |
+
| VIT | w8a8 | QCS8450 (Proxy) | Qualcomm® QCS8450 (Proxy) | QNN_DLC | 13.785 ms | 0 - 226 MB | NPU | [VIT.dlc](https://huggingface.co/qualcomm/VIT/blob/main/VIT_w8a8.dlc) |
|
91 |
+
| VIT | w8a8 | QCS8550 (Proxy) | Qualcomm® QCS8550 (Proxy) | TFLITE | 12.099 ms | 0 - 94 MB | NPU | [VIT.tflite](https://huggingface.co/qualcomm/VIT/blob/main/VIT_w8a8.tflite) |
|
92 |
+
| VIT | w8a8 | QCS8550 (Proxy) | Qualcomm® QCS8550 (Proxy) | QNN_DLC | 10.539 ms | 0 - 27 MB | NPU | [VIT.dlc](https://huggingface.co/qualcomm/VIT/blob/main/VIT_w8a8.dlc) |
|
93 |
+
| VIT | w8a8 | QCS9075 (Proxy) | Qualcomm® QCS9075 (Proxy) | TFLITE | 12.508 ms | 0 - 49 MB | NPU | [VIT.tflite](https://huggingface.co/qualcomm/VIT/blob/main/VIT_w8a8.tflite) |
|
94 |
+
| VIT | w8a8 | QCS9075 (Proxy) | Qualcomm® QCS9075 (Proxy) | QNN_DLC | 9.603 ms | 0 - 164 MB | NPU | [VIT.dlc](https://huggingface.co/qualcomm/VIT/blob/main/VIT_w8a8.dlc) |
|
95 |
+
| VIT | w8a8 | RB3 Gen 2 (Proxy) | Qualcomm® QCS6490 (Proxy) | TFLITE | 84.469 ms | 2 - 44 MB | NPU | [VIT.tflite](https://huggingface.co/qualcomm/VIT/blob/main/VIT_w8a8.tflite) |
|
96 |
+
| VIT | w8a8 | RB3 Gen 2 (Proxy) | Qualcomm® QCS6490 (Proxy) | QNN_DLC | 79.01 ms | 0 - 408 MB | NPU | [VIT.dlc](https://huggingface.co/qualcomm/VIT/blob/main/VIT_w8a8.dlc) |
|
97 |
+
| VIT | w8a8 | SA7255P ADP | Qualcomm® SA7255P | TFLITE | 24.338 ms | 0 - 49 MB | NPU | [VIT.tflite](https://huggingface.co/qualcomm/VIT/blob/main/VIT_w8a8.tflite) |
|
98 |
+
| VIT | w8a8 | SA7255P ADP | Qualcomm® SA7255P | QNN_DLC | 30.29 ms | 0 - 164 MB | NPU | [VIT.dlc](https://huggingface.co/qualcomm/VIT/blob/main/VIT_w8a8.dlc) |
|
99 |
+
| VIT | w8a8 | SA8255 (Proxy) | Qualcomm® SA8255P (Proxy) | TFLITE | 12.207 ms | 0 - 35 MB | NPU | [VIT.tflite](https://huggingface.co/qualcomm/VIT/blob/main/VIT_w8a8.tflite) |
|
100 |
+
| VIT | w8a8 | SA8255 (Proxy) | Qualcomm® SA8255P (Proxy) | QNN_DLC | 10.547 ms | 0 - 28 MB | NPU | [VIT.dlc](https://huggingface.co/qualcomm/VIT/blob/main/VIT_w8a8.dlc) |
|
101 |
+
| VIT | w8a8 | SA8295P ADP | Qualcomm® SA8295P | TFLITE | 14.655 ms | 0 - 50 MB | NPU | [VIT.tflite](https://huggingface.co/qualcomm/VIT/blob/main/VIT_w8a8.tflite) |
|
102 |
+
| VIT | w8a8 | SA8295P ADP | Qualcomm® SA8295P | QNN_DLC | 16.428 ms | 0 - 170 MB | NPU | [VIT.dlc](https://huggingface.co/qualcomm/VIT/blob/main/VIT_w8a8.dlc) |
|
103 |
+
| VIT | w8a8 | SA8650 (Proxy) | Qualcomm® SA8650P (Proxy) | TFLITE | 12.183 ms | 0 - 85 MB | NPU | [VIT.tflite](https://huggingface.co/qualcomm/VIT/blob/main/VIT_w8a8.tflite) |
|
104 |
+
| VIT | w8a8 | SA8650 (Proxy) | Qualcomm® SA8650P (Proxy) | QNN_DLC | 10.556 ms | 0 - 26 MB | NPU | [VIT.dlc](https://huggingface.co/qualcomm/VIT/blob/main/VIT_w8a8.dlc) |
|
105 |
+
| VIT | w8a8 | SA8775P ADP | Qualcomm® SA8775P | TFLITE | 12.508 ms | 0 - 49 MB | NPU | [VIT.tflite](https://huggingface.co/qualcomm/VIT/blob/main/VIT_w8a8.tflite) |
|
106 |
+
| VIT | w8a8 | SA8775P ADP | Qualcomm® SA8775P | QNN_DLC | 9.603 ms | 0 - 164 MB | NPU | [VIT.dlc](https://huggingface.co/qualcomm/VIT/blob/main/VIT_w8a8.dlc) |
|
107 |
+
| VIT | w8a8 | Samsung Galaxy S23 | Snapdragon® 8 Gen 2 Mobile | TFLITE | 12.209 ms | 0 - 73 MB | NPU | [VIT.tflite](https://huggingface.co/qualcomm/VIT/blob/main/VIT_w8a8.tflite) |
|
108 |
+
| VIT | w8a8 | Samsung Galaxy S23 | Snapdragon® 8 Gen 2 Mobile | QNN_DLC | 10.529 ms | 0 - 25 MB | NPU | [VIT.dlc](https://huggingface.co/qualcomm/VIT/blob/main/VIT_w8a8.dlc) |
|
109 |
| VIT | w8a8 | Samsung Galaxy S23 | Snapdragon® 8 Gen 2 Mobile | ONNX | 156.848 ms | 462 - 577 MB | NPU | [VIT.onnx](https://huggingface.co/qualcomm/VIT/blob/main/VIT_w8a8.onnx) |
|
110 |
+
| VIT | w8a8 | Samsung Galaxy S24 | Snapdragon® 8 Gen 3 Mobile | TFLITE | 8.691 ms | 0 - 53 MB | NPU | [VIT.tflite](https://huggingface.co/qualcomm/VIT/blob/main/VIT_w8a8.tflite) |
|
111 |
+
| VIT | w8a8 | Samsung Galaxy S24 | Snapdragon® 8 Gen 3 Mobile | QNN_DLC | 6.967 ms | 0 - 167 MB | NPU | [VIT.dlc](https://huggingface.co/qualcomm/VIT/blob/main/VIT_w8a8.dlc) |
|
112 |
| VIT | w8a8 | Samsung Galaxy S24 | Snapdragon® 8 Gen 3 Mobile | ONNX | 127.23 ms | 487 - 644 MB | NPU | [VIT.onnx](https://huggingface.co/qualcomm/VIT/blob/main/VIT_w8a8.onnx) |
|
113 |
+
| VIT | w8a8 | Snapdragon 8 Elite QRD | Snapdragon® 8 Elite Mobile | TFLITE | 7.178 ms | 0 - 54 MB | NPU | [VIT.tflite](https://huggingface.co/qualcomm/VIT/blob/main/VIT_w8a8.tflite) |
|
114 |
+
| VIT | w8a8 | Snapdragon 8 Elite QRD | Snapdragon® 8 Elite Mobile | QNN_DLC | 6.089 ms | 0 - 162 MB | NPU | [VIT.dlc](https://huggingface.co/qualcomm/VIT/blob/main/VIT_w8a8.dlc) |
|
115 |
| VIT | w8a8 | Snapdragon 8 Elite QRD | Snapdragon® 8 Elite Mobile | ONNX | 103.704 ms | 495 - 618 MB | NPU | [VIT.onnx](https://huggingface.co/qualcomm/VIT/blob/main/VIT_w8a8.onnx) |
|
116 |
+
| VIT | w8a8 | Snapdragon X Elite CRD | Snapdragon® X Elite | QNN_DLC | 11.726 ms | 415 - 415 MB | NPU | [VIT.dlc](https://huggingface.co/qualcomm/VIT/blob/main/VIT_w8a8.dlc) |
|
117 |
| VIT | w8a8 | Snapdragon X Elite CRD | Snapdragon® X Elite | ONNX | 180.062 ms | 924 - 924 MB | NPU | [VIT.onnx](https://huggingface.co/qualcomm/VIT/blob/main/VIT_w8a8.onnx) |
|
118 |
|
119 |
|
|
|
172 |
```bash
|
173 |
python -m qai_hub_models.models.vit.export
|
174 |
```
|
175 |
+
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
176 |
|
177 |
|
178 |
## How does this work?
|
VIT_w8a16.dlc
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 90398197
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cb6605ac8f250b3abea1daa1237d74c7e1b0fa416476c24667b673729c020f48
|
3 |
size 90398197
|
VIT_w8a8.dlc
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 90020334
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4158e452b163f433d1a69623ad161727480e5f9e95d80000614abb608389fdee
|
3 |
size 90020334
|
precompiled/qualcomm-qcs6490-proxy/sdk_versions.yml
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
sdk_versions:
|
2 |
+
qnn_context_binary:
|
3 |
+
qairt: 2.34.2.250528164111_119506
|
precompiled/qualcomm-snapdragon-x-elite/VIT.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 178936368
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:855f3e912ace5f2b29fbfac4a841a2393512398c30851e4c0a9d6505a01efaa8
|
3 |
size 178936368
|
precompiled/qualcomm-snapdragon-x-elite/VIT.onnx.zip
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 162468018
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ef2d7fc0a077404ced21457be724b54f652ea58e80e1d94cdd80e5dc9b6417bd
|
3 |
size 162468018
|
precompiled/qualcomm-snapdragon-x-elite/VIT_w8a16.onnx.zip
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 78150683
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a016ca8d47544902792a90ce4b0ca481223cb5ab0128a4874d2efa6a6bd518df
|
3 |
size 78150683
|
precompiled/qualcomm-snapdragon-x-elite/VIT_w8a8.onnx.zip
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cb90538f5156885da145068055c3dd53b67b32edfa13f71a555a9fa75f4bb3ec
|
3 |
+
size 77566465
|
precompiled/qualcomm-snapdragon-x-elite/sdk_versions.yml
ADDED
@@ -0,0 +1,5 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
sdk_versions:
|
2 |
+
qnn_context_binary:
|
3 |
+
qairt: 2.34.2.250528164111_119506
|
4 |
+
precompiled_qnn_onnx:
|
5 |
+
qairt: 2.33.2.250410134701_117956
|