v0.36.0
Browse files
See https://github.com/quic/ai-hub-models/releases/v0.36.0 for changelog.
- LeViT.onnx.zip +1 -1
- LeViT.tflite +1 -1
- LeViT_w8a16.dlc +2 -2
- LeViT_w8a16.onnx.zip +2 -2
- README.md +24 -24
- precompiled/qualcomm-qcs6490-proxy/LeViT_w8a16.bin +3 -0
- precompiled/qualcomm-qcs6490-proxy/sdk_versions.yml +3 -0
- precompiled/qualcomm-snapdragon-x-elite/LeViT_w8a16.bin +2 -2
- precompiled/qualcomm-snapdragon-x-elite/LeViT_w8a16.onnx.zip +2 -2
- precompiled/qualcomm-snapdragon-x-elite/sdk_versions.yml +1 -1
- sdk_versions.yml +3 -3
LeViT.onnx.zip
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 27620709
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3e8d0db873c00c754e81c33d73022ff83be4deea4361dfdeff454415b8bbdebc
|
3 |
size 27620709
|
LeViT.tflite
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 31342312
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aea4b43f15d5446e18b1f6d88fdb1a16b68f678f3581ee4711e09d8df54b6450
|
3 |
size 31342312
|
LeViT_w8a16.dlc
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:39e51b6c896ce9ebb04708acc7b3f7576537368df184735773e1e7d0a742e32c
|
3 |
+
size 8619004
|
LeViT_w8a16.onnx.zip
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6f8e4e4a5f312814fa277fc9b3286b12fc5221a74d3280b01759a87405f6365b
|
3 |
+
size 10499358
|
README.md
CHANGED
@@ -36,30 +36,30 @@ More details on model performance across various devices, can be found
|
|
36 |
|
37 |
| Model | Precision | Device | Chipset | Target Runtime | Inference Time (ms) | Peak Memory Range (MB) | Primary Compute Unit | Target Model
|
38 |
|---|---|---|---|---|---|---|---|---|
|
39 |
-
| LeViT | float | QCS8275 (Proxy) | Qualcomm® QCS8275 (Proxy) | TFLITE | 4.
|
40 |
-
| LeViT | float | QCS8450 (Proxy) | Qualcomm® QCS8450 (Proxy) | TFLITE | 1.
|
41 |
-
| LeViT | float | QCS8550 (Proxy) | Qualcomm® QCS8550 (Proxy) | TFLITE | 1.
|
42 |
-
| LeViT | float | QCS9075 (Proxy) | Qualcomm® QCS9075 (Proxy) | TFLITE | 2.
|
43 |
-
| LeViT | float | Samsung Galaxy S23 | Snapdragon® 8 Gen 2 Mobile | TFLITE | 1.
|
44 |
-
| LeViT | float | Samsung Galaxy S23 | Snapdragon® 8 Gen 2 Mobile | ONNX | 1.
|
45 |
-
| LeViT | float | Samsung Galaxy S24 | Snapdragon® 8 Gen 3 Mobile | TFLITE | 1.
|
46 |
-
| LeViT | float | Samsung Galaxy S24 | Snapdragon® 8 Gen 3 Mobile | ONNX | 1.
|
47 |
-
| LeViT | float | Snapdragon 8 Elite QRD | Snapdragon® 8 Elite Mobile | TFLITE |
|
48 |
-
| LeViT | float | Snapdragon 8 Elite QRD | Snapdragon® 8 Elite Mobile | ONNX | 1.
|
49 |
-
| LeViT | float | Snapdragon X Elite CRD | Snapdragon® X Elite | ONNX | 1.
|
50 |
-
| LeViT | w8a16 | QCS8275 (Proxy) | Qualcomm® QCS8275 (Proxy) | QNN_DLC | 2.
|
51 |
-
| LeViT | w8a16 | QCS8450 (Proxy) | Qualcomm® QCS8450 (Proxy) | QNN_DLC | 1.
|
52 |
-
| LeViT | w8a16 | QCS8550 (Proxy) | Qualcomm® QCS8550 (Proxy) | QNN_DLC | 1.
|
53 |
-
| LeViT | w8a16 | QCS9075 (Proxy) | Qualcomm® QCS9075 (Proxy) | QNN_DLC | 1.
|
54 |
-
| LeViT | w8a16 | RB3 Gen 2 (Proxy) | Qualcomm® QCS6490 (Proxy) | QNN_DLC |
|
55 |
-
| LeViT | w8a16 | Samsung Galaxy S23 | Snapdragon® 8 Gen 2 Mobile | QNN_DLC | 1.
|
56 |
-
| LeViT | w8a16 | Samsung Galaxy S23 | Snapdragon® 8 Gen 2 Mobile | ONNX | 3.
|
57 |
-
| LeViT | w8a16 | Samsung Galaxy S24 | Snapdragon® 8 Gen 3 Mobile | QNN_DLC | 0.
|
58 |
-
| LeViT | w8a16 | Samsung Galaxy S24 | Snapdragon® 8 Gen 3 Mobile | ONNX | 2.
|
59 |
-
| LeViT | w8a16 | Snapdragon 8 Elite QRD | Snapdragon® 8 Elite Mobile | QNN_DLC | 0.
|
60 |
-
| LeViT | w8a16 | Snapdragon 8 Elite QRD | Snapdragon® 8 Elite Mobile | ONNX |
|
61 |
-
| LeViT | w8a16 | Snapdragon X Elite CRD | Snapdragon® X Elite | QNN_DLC | 1.
|
62 |
-
| LeViT | w8a16 | Snapdragon X Elite CRD | Snapdragon® X Elite | ONNX |
|
63 |
|
64 |
|
65 |
|
|
|
36 |
|
37 |
| Model | Precision | Device | Chipset | Target Runtime | Inference Time (ms) | Peak Memory Range (MB) | Primary Compute Unit | Target Model
|
38 |
|---|---|---|---|---|---|---|---|---|
|
39 |
+
| LeViT | float | QCS8275 (Proxy) | Qualcomm® QCS8275 (Proxy) | TFLITE | 4.109 ms | 0 - 42 MB | NPU | [LeViT.tflite](https://huggingface.co/qualcomm/LeViT/blob/main/LeViT.tflite) |
|
40 |
+
| LeViT | float | QCS8450 (Proxy) | Qualcomm® QCS8450 (Proxy) | TFLITE | 1.861 ms | 0 - 50 MB | NPU | [LeViT.tflite](https://huggingface.co/qualcomm/LeViT/blob/main/LeViT.tflite) |
|
41 |
+
| LeViT | float | QCS8550 (Proxy) | Qualcomm® QCS8550 (Proxy) | TFLITE | 1.569 ms | 0 - 85 MB | NPU | [LeViT.tflite](https://huggingface.co/qualcomm/LeViT/blob/main/LeViT.tflite) |
|
42 |
+
| LeViT | float | QCS9075 (Proxy) | Qualcomm® QCS9075 (Proxy) | TFLITE | 2.091 ms | 0 - 43 MB | NPU | [LeViT.tflite](https://huggingface.co/qualcomm/LeViT/blob/main/LeViT.tflite) |
|
43 |
+
| LeViT | float | Samsung Galaxy S23 | Snapdragon® 8 Gen 2 Mobile | TFLITE | 1.571 ms | 0 - 88 MB | NPU | [LeViT.tflite](https://huggingface.co/qualcomm/LeViT/blob/main/LeViT.tflite) |
|
44 |
+
| LeViT | float | Samsung Galaxy S23 | Snapdragon® 8 Gen 2 Mobile | ONNX | 1.56 ms | 1 - 51 MB | NPU | [LeViT.onnx.zip](https://huggingface.co/qualcomm/LeViT/blob/main/LeViT.onnx.zip) |
|
45 |
+
| LeViT | float | Samsung Galaxy S24 | Snapdragon® 8 Gen 3 Mobile | TFLITE | 1.056 ms | 0 - 53 MB | NPU | [LeViT.tflite](https://huggingface.co/qualcomm/LeViT/blob/main/LeViT.tflite) |
|
46 |
+
| LeViT | float | Samsung Galaxy S24 | Snapdragon® 8 Gen 3 Mobile | ONNX | 1.04 ms | 0 - 47 MB | NPU | [LeViT.onnx.zip](https://huggingface.co/qualcomm/LeViT/blob/main/LeViT.onnx.zip) |
|
47 |
+
| LeViT | float | Snapdragon 8 Elite QRD | Snapdragon® 8 Elite Mobile | TFLITE | 0.839 ms | 0 - 48 MB | NPU | [LeViT.tflite](https://huggingface.co/qualcomm/LeViT/blob/main/LeViT.tflite) |
|
48 |
+
| LeViT | float | Snapdragon 8 Elite QRD | Snapdragon® 8 Elite Mobile | ONNX | 1.118 ms | 1 - 45 MB | NPU | [LeViT.onnx.zip](https://huggingface.co/qualcomm/LeViT/blob/main/LeViT.onnx.zip) |
|
49 |
+
| LeViT | float | Snapdragon X Elite CRD | Snapdragon® X Elite | ONNX | 1.63 ms | 16 - 16 MB | NPU | [LeViT.onnx.zip](https://huggingface.co/qualcomm/LeViT/blob/main/LeViT.onnx.zip) |
|
50 |
+
| LeViT | w8a16 | QCS8275 (Proxy) | Qualcomm® QCS8275 (Proxy) | QNN_DLC | 2.756 ms | 0 - 26 MB | NPU | [LeViT_w8a16.dlc](https://huggingface.co/qualcomm/LeViT/blob/main/LeViT_w8a16.dlc) |
|
51 |
+
| LeViT | w8a16 | QCS8450 (Proxy) | Qualcomm® QCS8450 (Proxy) | QNN_DLC | 1.575 ms | 0 - 35 MB | NPU | [LeViT_w8a16.dlc](https://huggingface.co/qualcomm/LeViT/blob/main/LeViT_w8a16.dlc) |
|
52 |
+
| LeViT | w8a16 | QCS8550 (Proxy) | Qualcomm® QCS8550 (Proxy) | QNN_DLC | 1.354 ms | 0 - 10 MB | NPU | [LeViT_w8a16.dlc](https://huggingface.co/qualcomm/LeViT/blob/main/LeViT_w8a16.dlc) |
|
53 |
+
| LeViT | w8a16 | QCS9075 (Proxy) | Qualcomm® QCS9075 (Proxy) | QNN_DLC | 1.675 ms | 0 - 25 MB | NPU | [LeViT_w8a16.dlc](https://huggingface.co/qualcomm/LeViT/blob/main/LeViT_w8a16.dlc) |
|
54 |
+
| LeViT | w8a16 | RB3 Gen 2 (Proxy) | Qualcomm® QCS6490 (Proxy) | QNN_DLC | 4.133 ms | 0 - 34 MB | NPU | [LeViT_w8a16.dlc](https://huggingface.co/qualcomm/LeViT/blob/main/LeViT_w8a16.dlc) |
|
55 |
+
| LeViT | w8a16 | Samsung Galaxy S23 | Snapdragon® 8 Gen 2 Mobile | QNN_DLC | 1.371 ms | 0 - 11 MB | NPU | [LeViT_w8a16.dlc](https://huggingface.co/qualcomm/LeViT/blob/main/LeViT_w8a16.dlc) |
|
56 |
+
| LeViT | w8a16 | Samsung Galaxy S23 | Snapdragon® 8 Gen 2 Mobile | ONNX | 3.983 ms | 0 - 41 MB | NPU | [LeViT_w8a16.onnx.zip](https://huggingface.co/qualcomm/LeViT/blob/main/LeViT_w8a16.onnx.zip) |
|
57 |
+
| LeViT | w8a16 | Samsung Galaxy S24 | Snapdragon® 8 Gen 3 Mobile | QNN_DLC | 0.917 ms | 0 - 35 MB | NPU | [LeViT_w8a16.dlc](https://huggingface.co/qualcomm/LeViT/blob/main/LeViT_w8a16.dlc) |
|
58 |
+
| LeViT | w8a16 | Samsung Galaxy S24 | Snapdragon® 8 Gen 3 Mobile | ONNX | 2.881 ms | 0 - 68 MB | NPU | [LeViT_w8a16.onnx.zip](https://huggingface.co/qualcomm/LeViT/blob/main/LeViT_w8a16.onnx.zip) |
|
59 |
+
| LeViT | w8a16 | Snapdragon 8 Elite QRD | Snapdragon® 8 Elite Mobile | QNN_DLC | 0.779 ms | 0 - 25 MB | NPU | [LeViT_w8a16.dlc](https://huggingface.co/qualcomm/LeViT/blob/main/LeViT_w8a16.dlc) |
|
60 |
+
| LeViT | w8a16 | Snapdragon 8 Elite QRD | Snapdragon® 8 Elite Mobile | ONNX | 3.275 ms | 0 - 56 MB | NPU | [LeViT_w8a16.onnx.zip](https://huggingface.co/qualcomm/LeViT/blob/main/LeViT_w8a16.onnx.zip) |
|
61 |
+
| LeViT | w8a16 | Snapdragon X Elite CRD | Snapdragon® X Elite | QNN_DLC | 1.565 ms | 12 - 12 MB | NPU | [LeViT_w8a16.dlc](https://huggingface.co/qualcomm/LeViT/blob/main/LeViT_w8a16.dlc) |
|
62 |
+
| LeViT | w8a16 | Snapdragon X Elite CRD | Snapdragon® X Elite | ONNX | 4.249 ms | 14 - 14 MB | NPU | [LeViT_w8a16.onnx.zip](https://huggingface.co/qualcomm/LeViT/blob/main/LeViT_w8a16.onnx.zip) |
|
63 |
|
64 |
|
65 |
|
precompiled/qualcomm-qcs6490-proxy/LeViT_w8a16.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:64b796e97626d17cd681331b03fc66c50ec3bfeed0502b0e3496bce0340d4f3d
|
3 |
+
size 8826880
|
precompiled/qualcomm-qcs6490-proxy/sdk_versions.yml
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
sdk_versions:
|
2 |
+
qnn_context_binary:
|
3 |
+
qairt: 2.37.0.250724175447_124859
|
precompiled/qualcomm-snapdragon-x-elite/LeViT_w8a16.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5d9640bf7628c439e2a8c1d1f0ba80d21710e6988695aa98657f345303e5b77d
|
3 |
+
size 9048064
|
precompiled/qualcomm-snapdragon-x-elite/LeViT_w8a16.onnx.zip
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:40ec16cc3e7a1f9f6423c831f76ce83ca13198042e71d9dc42f75052e8b1f32d
|
3 |
+
size 5594814
|
precompiled/qualcomm-snapdragon-x-elite/sdk_versions.yml
CHANGED
@@ -1,5 +1,5 @@
|
|
1 |
sdk_versions:
|
2 |
qnn_context_binary:
|
3 |
-
qairt: 2.
|
4 |
precompiled_qnn_onnx:
|
5 |
qairt: 2.33.2.250410134701_117956
|
|
|
1 |
sdk_versions:
|
2 |
qnn_context_binary:
|
3 |
+
qairt: 2.37.0.250724175447_124859
|
4 |
precompiled_qnn_onnx:
|
5 |
qairt: 2.33.2.250410134701_117956
|
sdk_versions.yml
CHANGED
@@ -1,9 +1,9 @@
|
|
1 |
sdk_versions:
|
2 |
tflite:
|
3 |
-
qairt: 2.
|
4 |
tflite: 2.17.0
|
5 |
onnx:
|
6 |
-
qairt: 2.
|
7 |
onnx_runtime: 1.22.0
|
8 |
qnn_dlc:
|
9 |
-
qairt: 2.
|
|
|
1 |
sdk_versions:
|
2 |
tflite:
|
3 |
+
qairt: 2.37.0.250724175447_124859
|
4 |
tflite: 2.17.0
|
5 |
onnx:
|
6 |
+
qairt: 2.33.2.250410134701_117956
|
7 |
onnx_runtime: 1.22.0
|
8 |
qnn_dlc:
|
9 |
+
qairt: 2.37.0.250724175447_124859
|