diff --git a/README.md b/README.md index fba81d9f3263499aed526b33e1dfc4307155016b..dbb9e0a1347b75301685f4173b2347e6cee1449f 100644 --- a/README.md +++ b/README.md @@ -42,6 +42,7 @@ More details on model performance across various devices, can be found | HfWhisperEncoder | float | QCS8275 (Proxy) | Qualcomm® QCS8275 (Proxy) | QNN_CONTEXT_BINARY | 424.037 ms | 1 - 10 MB | NPU | Use Export Script | | HfWhisperEncoder | float | QCS8450 (Proxy) | Qualcomm® QCS8450 (Proxy) | QNN_CONTEXT_BINARY | 314.877 ms | 0 - 18 MB | NPU | Use Export Script | | HfWhisperEncoder | float | QCS8550 (Proxy) | Qualcomm® QCS8550 (Proxy) | QNN_CONTEXT_BINARY | 132.256 ms | 8 - 10 MB | NPU | Use Export Script | +| HfWhisperEncoder | float | QCS8550 (Proxy) | Qualcomm® QCS8550 (Proxy) | PRECOMPILED_QNN_ONNX | 137.915 ms | 0 - 259 MB | NPU | Use Export Script | | HfWhisperEncoder | float | QCS9075 (Proxy) | Qualcomm® QCS9075 (Proxy) | QNN_CONTEXT_BINARY | 154.294 ms | 1 - 10 MB | NPU | Use Export Script | | HfWhisperEncoder | float | SA7255P ADP | Qualcomm® SA7255P | QNN_CONTEXT_BINARY | 424.037 ms | 1 - 10 MB | NPU | Use Export Script | | HfWhisperEncoder | float | SA8255 (Proxy) | Qualcomm® SA8255P (Proxy) | QNN_CONTEXT_BINARY | 136.109 ms | 1 - 3 MB | NPU | Use Export Script | @@ -49,16 +50,17 @@ More details on model performance across various devices, can be found | HfWhisperEncoder | float | SA8650 (Proxy) | Qualcomm® SA8650P (Proxy) | QNN_CONTEXT_BINARY | 138.032 ms | 1 - 3 MB | NPU | Use Export Script | | HfWhisperEncoder | float | SA8775P ADP | Qualcomm® SA8775P | QNN_CONTEXT_BINARY | 154.294 ms | 1 - 10 MB | NPU | Use Export Script | | HfWhisperEncoder | float | Samsung Galaxy S23 | Snapdragon® 8 Gen 2 Mobile | QNN_CONTEXT_BINARY | 134.534 ms | 1 - 3 MB | NPU | Use Export Script | -| HfWhisperEncoder | float | Samsung Galaxy S23 | Snapdragon® 8 Gen 2 Mobile | PRECOMPILED_QNN_ONNX | 138.173 ms | 0 - 258 MB | NPU | Use Export Script | +| HfWhisperEncoder | float | Samsung Galaxy S23 | Snapdragon® 8 Gen 2 Mobile | PRECOMPILED_QNN_ONNX | 136.701 ms | 0 - 258 MB | NPU | Use Export Script | | HfWhisperEncoder | float | Samsung Galaxy S24 | Snapdragon® 8 Gen 3 Mobile | QNN_CONTEXT_BINARY | 102.365 ms | 0 - 19 MB | NPU | Use Export Script | -| HfWhisperEncoder | float | Samsung Galaxy S24 | Snapdragon® 8 Gen 3 Mobile | PRECOMPILED_QNN_ONNX | 105.447 ms | 128 - 147 MB | NPU | Use Export Script | +| HfWhisperEncoder | float | Samsung Galaxy S24 | Snapdragon® 8 Gen 3 Mobile | PRECOMPILED_QNN_ONNX | 103.523 ms | 122 - 141 MB | NPU | Use Export Script | | HfWhisperEncoder | float | Snapdragon 8 Elite QRD | Snapdragon® 8 Elite Mobile | QNN_CONTEXT_BINARY | 86.361 ms | 0 - 14 MB | NPU | Use Export Script | -| HfWhisperEncoder | float | Snapdragon 8 Elite QRD | Snapdragon® 8 Elite Mobile | PRECOMPILED_QNN_ONNX | 89.991 ms | 129 - 143 MB | NPU | Use Export Script | +| HfWhisperEncoder | float | Snapdragon 8 Elite QRD | Snapdragon® 8 Elite Mobile | PRECOMPILED_QNN_ONNX | 90.639 ms | 128 - 141 MB | NPU | Use Export Script | | HfWhisperEncoder | float | Snapdragon X Elite CRD | Snapdragon® X Elite | QNN_CONTEXT_BINARY | 130.698 ms | 0 - 0 MB | NPU | Use Export Script | -| HfWhisperEncoder | float | Snapdragon X Elite CRD | Snapdragon® X Elite | PRECOMPILED_QNN_ONNX | 131.817 ms | 227 - 227 MB | NPU | Use Export Script | +| HfWhisperEncoder | float | Snapdragon X Elite CRD | Snapdragon® X Elite | PRECOMPILED_QNN_ONNX | 132.388 ms | 226 - 226 MB | NPU | Use Export Script | | HfWhisperDecoder | float | QCS8275 (Proxy) | Qualcomm® QCS8275 (Proxy) | QNN_CONTEXT_BINARY | 18.261 ms | 45 - 54 MB | NPU | Use Export Script | | HfWhisperDecoder | float | QCS8450 (Proxy) | Qualcomm® QCS8450 (Proxy) | QNN_CONTEXT_BINARY | 17.513 ms | 52 - 73 MB | NPU | Use Export Script | | HfWhisperDecoder | float | QCS8550 (Proxy) | Qualcomm® QCS8550 (Proxy) | QNN_CONTEXT_BINARY | 12.24 ms | 53 - 55 MB | NPU | Use Export Script | +| HfWhisperDecoder | float | QCS8550 (Proxy) | Qualcomm® QCS8550 (Proxy) | PRECOMPILED_QNN_ONNX | 12.992 ms | 61 - 63 MB | NPU | Use Export Script | | HfWhisperDecoder | float | QCS9075 (Proxy) | Qualcomm® QCS9075 (Proxy) | QNN_CONTEXT_BINARY | 13.211 ms | 45 - 55 MB | NPU | Use Export Script | | HfWhisperDecoder | float | SA7255P ADP | Qualcomm® SA7255P | QNN_CONTEXT_BINARY | 18.261 ms | 45 - 54 MB | NPU | Use Export Script | | HfWhisperDecoder | float | SA8255 (Proxy) | Qualcomm® SA8255P (Proxy) | QNN_CONTEXT_BINARY | 11.863 ms | 66 - 68 MB | NPU | Use Export Script | @@ -66,13 +68,13 @@ More details on model performance across various devices, can be found | HfWhisperDecoder | float | SA8650 (Proxy) | Qualcomm® SA8650P (Proxy) | QNN_CONTEXT_BINARY | 11.818 ms | 64 - 66 MB | NPU | Use Export Script | | HfWhisperDecoder | float | SA8775P ADP | Qualcomm® SA8775P | QNN_CONTEXT_BINARY | 13.211 ms | 45 - 55 MB | NPU | Use Export Script | | HfWhisperDecoder | float | Samsung Galaxy S23 | Snapdragon® 8 Gen 2 Mobile | QNN_CONTEXT_BINARY | 12.05 ms | 65 - 69 MB | NPU | Use Export Script | -| HfWhisperDecoder | float | Samsung Galaxy S23 | Snapdragon® 8 Gen 2 Mobile | PRECOMPILED_QNN_ONNX | 13.294 ms | 0 - 319 MB | NPU | Use Export Script | +| HfWhisperDecoder | float | Samsung Galaxy S23 | Snapdragon® 8 Gen 2 Mobile | PRECOMPILED_QNN_ONNX | 13.626 ms | 0 - 319 MB | NPU | Use Export Script | | HfWhisperDecoder | float | Samsung Galaxy S24 | Snapdragon® 8 Gen 3 Mobile | QNN_CONTEXT_BINARY | 9.634 ms | 55 - 74 MB | NPU | Use Export Script | -| HfWhisperDecoder | float | Samsung Galaxy S24 | Snapdragon® 8 Gen 3 Mobile | PRECOMPILED_QNN_ONNX | 10.846 ms | 75 - 95 MB | NPU | Use Export Script | +| HfWhisperDecoder | float | Samsung Galaxy S24 | Snapdragon® 8 Gen 3 Mobile | PRECOMPILED_QNN_ONNX | 10.913 ms | 75 - 90 MB | NPU | Use Export Script | | HfWhisperDecoder | float | Snapdragon 8 Elite QRD | Snapdragon® 8 Elite Mobile | QNN_CONTEXT_BINARY | 8.157 ms | 60 - 75 MB | NPU | Use Export Script | -| HfWhisperDecoder | float | Snapdragon 8 Elite QRD | Snapdragon® 8 Elite Mobile | PRECOMPILED_QNN_ONNX | 8.731 ms | 73 - 87 MB | NPU | Use Export Script | +| HfWhisperDecoder | float | Snapdragon 8 Elite QRD | Snapdragon® 8 Elite Mobile | PRECOMPILED_QNN_ONNX | 8.816 ms | 74 - 89 MB | NPU | Use Export Script | | HfWhisperDecoder | float | Snapdragon X Elite CRD | Snapdragon® X Elite | QNN_CONTEXT_BINARY | 10.432 ms | 60 - 60 MB | NPU | Use Export Script | -| HfWhisperDecoder | float | Snapdragon X Elite CRD | Snapdragon® X Elite | PRECOMPILED_QNN_ONNX | 10.429 ms | 286 - 286 MB | NPU | Use Export Script | +| HfWhisperDecoder | float | Snapdragon X Elite CRD | Snapdragon® X Elite | PRECOMPILED_QNN_ONNX | 10.144 ms | 286 - 286 MB | NPU | Use Export Script | diff --git a/precompiled/qualcomm-qcs8275-proxy/Whisper-Small_HfWhisperDecoder.bin b/precompiled/qualcomm-qcs8275-proxy/Whisper-Small_HfWhisperDecoder_float.bin similarity index 100% rename from precompiled/qualcomm-qcs8275-proxy/Whisper-Small_HfWhisperDecoder.bin rename to precompiled/qualcomm-qcs8275-proxy/Whisper-Small_HfWhisperDecoder_float.bin diff --git a/precompiled/qualcomm-qcs8275-proxy/Whisper-Small_HfWhisperEncoder.bin b/precompiled/qualcomm-qcs8275-proxy/Whisper-Small_HfWhisperEncoder_float.bin similarity index 100% rename from precompiled/qualcomm-qcs8275-proxy/Whisper-Small_HfWhisperEncoder.bin rename to precompiled/qualcomm-qcs8275-proxy/Whisper-Small_HfWhisperEncoder_float.bin diff --git a/precompiled/qualcomm-qcs8275-proxy/sdk_versions.yml b/precompiled/qualcomm-qcs8275-proxy/tool-versions.yaml similarity index 81% rename from precompiled/qualcomm-qcs8275-proxy/sdk_versions.yml rename to precompiled/qualcomm-qcs8275-proxy/tool-versions.yaml index cf3db9eb5c8793178dd19d986de2ebb9f7dee490..f83be1ae234292df6b302b536309cbf56a9598b0 100644 --- a/precompiled/qualcomm-qcs8275-proxy/sdk_versions.yml +++ b/precompiled/qualcomm-qcs8275-proxy/tool-versions.yaml @@ -1,3 +1,3 @@ -sdk_versions: +tool_versions: qnn_context_binary: qairt: 2.37.0.250724175447_124859-auto diff --git a/precompiled/qualcomm-qcs8450-proxy/Whisper-Small_HfWhisperDecoder.bin b/precompiled/qualcomm-qcs8450-proxy/Whisper-Small_HfWhisperDecoder_float.bin similarity index 100% rename from precompiled/qualcomm-qcs8450-proxy/Whisper-Small_HfWhisperDecoder.bin rename to precompiled/qualcomm-qcs8450-proxy/Whisper-Small_HfWhisperDecoder_float.bin diff --git a/precompiled/qualcomm-qcs8450-proxy/Whisper-Small_HfWhisperEncoder.bin b/precompiled/qualcomm-qcs8450-proxy/Whisper-Small_HfWhisperEncoder_float.bin similarity index 100% rename from precompiled/qualcomm-qcs8450-proxy/Whisper-Small_HfWhisperEncoder.bin rename to precompiled/qualcomm-qcs8450-proxy/Whisper-Small_HfWhisperEncoder_float.bin diff --git a/precompiled/qualcomm-sa8255p-proxy/sdk_versions.yml b/precompiled/qualcomm-qcs8450-proxy/tool-versions.yaml similarity index 80% rename from precompiled/qualcomm-sa8255p-proxy/sdk_versions.yml rename to precompiled/qualcomm-qcs8450-proxy/tool-versions.yaml index 645a4ba899019438314a76813152c259f4f74b92..bb24388e3ba98d34090587000fa8f77ca5b64cf0 100644 --- a/precompiled/qualcomm-sa8255p-proxy/sdk_versions.yml +++ b/precompiled/qualcomm-qcs8450-proxy/tool-versions.yaml @@ -1,3 +1,3 @@ -sdk_versions: +tool_versions: qnn_context_binary: qairt: 2.37.0.250724175447_124859 diff --git a/precompiled/qualcomm-qcs8550-proxy/Whisper-Small_HfWhisperDecoder.bin b/precompiled/qualcomm-qcs8550-proxy/Whisper-Small_HfWhisperDecoder_float.bin similarity index 100% rename from precompiled/qualcomm-qcs8550-proxy/Whisper-Small_HfWhisperDecoder.bin rename to precompiled/qualcomm-qcs8550-proxy/Whisper-Small_HfWhisperDecoder_float.bin diff --git a/precompiled/qualcomm-qcs8550-proxy/Whisper-Small_HfWhisperDecoder_float.onnx.zip b/precompiled/qualcomm-qcs8550-proxy/Whisper-Small_HfWhisperDecoder_float.onnx.zip new file mode 100644 index 0000000000000000000000000000000000000000..1759786eb9485bb93b484941ecfcdffdf8ab52cf --- /dev/null +++ b/precompiled/qualcomm-qcs8550-proxy/Whisper-Small_HfWhisperDecoder_float.onnx.zip @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40bf631247b1430b3cb4084e899b888db5c9817189f6a18acf3262b815084539 +size 330402729 diff --git a/precompiled/qualcomm-qcs8550-proxy/Whisper-Small_HfWhisperEncoder.bin b/precompiled/qualcomm-qcs8550-proxy/Whisper-Small_HfWhisperEncoder_float.bin similarity index 100% rename from precompiled/qualcomm-qcs8550-proxy/Whisper-Small_HfWhisperEncoder.bin rename to precompiled/qualcomm-qcs8550-proxy/Whisper-Small_HfWhisperEncoder_float.bin diff --git a/precompiled/qualcomm-qcs8550-proxy/Whisper-Small_HfWhisperEncoder_float.onnx.zip b/precompiled/qualcomm-qcs8550-proxy/Whisper-Small_HfWhisperEncoder_float.onnx.zip new file mode 100644 index 0000000000000000000000000000000000000000..9ecdf634d49969a4f33aac30baaf8ddf1d0fba6a --- /dev/null +++ b/precompiled/qualcomm-qcs8550-proxy/Whisper-Small_HfWhisperEncoder_float.onnx.zip @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fd9bffaa03a40977856ad4ac62c3d959fa2b0abe286766ae9430f7d04f8c896 +size 197781386 diff --git a/precompiled/qualcomm-qcs8550-proxy/tool-versions.yaml b/precompiled/qualcomm-qcs8550-proxy/tool-versions.yaml new file mode 100644 index 0000000000000000000000000000000000000000..f0a567e21880e5efda78dc062ffeb343dbb1976b --- /dev/null +++ b/precompiled/qualcomm-qcs8550-proxy/tool-versions.yaml @@ -0,0 +1,4 @@ +tool_versions: + precompiled_qnn_onnx: + qairt: 2.36.4.250725200057_123280 + onnx_runtime: 1.22.0 diff --git a/precompiled/qualcomm-qcs9075-proxy/Whisper-Small_HfWhisperDecoder.bin b/precompiled/qualcomm-qcs9075-proxy/Whisper-Small_HfWhisperDecoder_float.bin similarity index 100% rename from precompiled/qualcomm-qcs9075-proxy/Whisper-Small_HfWhisperDecoder.bin rename to precompiled/qualcomm-qcs9075-proxy/Whisper-Small_HfWhisperDecoder_float.bin diff --git a/precompiled/qualcomm-qcs9075-proxy/Whisper-Small_HfWhisperEncoder.bin b/precompiled/qualcomm-qcs9075-proxy/Whisper-Small_HfWhisperEncoder_float.bin similarity index 100% rename from precompiled/qualcomm-qcs9075-proxy/Whisper-Small_HfWhisperEncoder.bin rename to precompiled/qualcomm-qcs9075-proxy/Whisper-Small_HfWhisperEncoder_float.bin diff --git a/precompiled/qualcomm-sa7255p/sdk_versions.yml b/precompiled/qualcomm-qcs9075-proxy/tool-versions.yaml similarity index 81% rename from precompiled/qualcomm-sa7255p/sdk_versions.yml rename to precompiled/qualcomm-qcs9075-proxy/tool-versions.yaml index cf3db9eb5c8793178dd19d986de2ebb9f7dee490..f83be1ae234292df6b302b536309cbf56a9598b0 100644 --- a/precompiled/qualcomm-sa7255p/sdk_versions.yml +++ b/precompiled/qualcomm-qcs9075-proxy/tool-versions.yaml @@ -1,3 +1,3 @@ -sdk_versions: +tool_versions: qnn_context_binary: qairt: 2.37.0.250724175447_124859-auto diff --git a/precompiled/qualcomm-sa7255p/Whisper-Small_HfWhisperDecoder.bin b/precompiled/qualcomm-sa7255p/Whisper-Small_HfWhisperDecoder_float.bin similarity index 100% rename from precompiled/qualcomm-sa7255p/Whisper-Small_HfWhisperDecoder.bin rename to precompiled/qualcomm-sa7255p/Whisper-Small_HfWhisperDecoder_float.bin diff --git a/precompiled/qualcomm-sa7255p/Whisper-Small_HfWhisperEncoder.bin b/precompiled/qualcomm-sa7255p/Whisper-Small_HfWhisperEncoder_float.bin similarity index 100% rename from precompiled/qualcomm-sa7255p/Whisper-Small_HfWhisperEncoder.bin rename to precompiled/qualcomm-sa7255p/Whisper-Small_HfWhisperEncoder_float.bin diff --git a/precompiled/qualcomm-sa8295p/sdk_versions.yml b/precompiled/qualcomm-sa7255p/tool-versions.yaml similarity index 81% rename from precompiled/qualcomm-sa8295p/sdk_versions.yml rename to precompiled/qualcomm-sa7255p/tool-versions.yaml index cf3db9eb5c8793178dd19d986de2ebb9f7dee490..f83be1ae234292df6b302b536309cbf56a9598b0 100644 --- a/precompiled/qualcomm-sa8295p/sdk_versions.yml +++ b/precompiled/qualcomm-sa7255p/tool-versions.yaml @@ -1,3 +1,3 @@ -sdk_versions: +tool_versions: qnn_context_binary: qairt: 2.37.0.250724175447_124859-auto diff --git a/precompiled/qualcomm-sa8255p-proxy/Whisper-Small_HfWhisperDecoder.bin b/precompiled/qualcomm-sa8255p-proxy/Whisper-Small_HfWhisperDecoder_float.bin similarity index 100% rename from precompiled/qualcomm-sa8255p-proxy/Whisper-Small_HfWhisperDecoder.bin rename to precompiled/qualcomm-sa8255p-proxy/Whisper-Small_HfWhisperDecoder_float.bin diff --git a/precompiled/qualcomm-sa8255p-proxy/Whisper-Small_HfWhisperEncoder.bin b/precompiled/qualcomm-sa8255p-proxy/Whisper-Small_HfWhisperEncoder_float.bin similarity index 100% rename from precompiled/qualcomm-sa8255p-proxy/Whisper-Small_HfWhisperEncoder.bin rename to precompiled/qualcomm-sa8255p-proxy/Whisper-Small_HfWhisperEncoder_float.bin diff --git a/precompiled/qualcomm-qcs8450-proxy/sdk_versions.yml b/precompiled/qualcomm-sa8255p-proxy/tool-versions.yaml similarity index 80% rename from precompiled/qualcomm-qcs8450-proxy/sdk_versions.yml rename to precompiled/qualcomm-sa8255p-proxy/tool-versions.yaml index 645a4ba899019438314a76813152c259f4f74b92..bb24388e3ba98d34090587000fa8f77ca5b64cf0 100644 --- a/precompiled/qualcomm-qcs8450-proxy/sdk_versions.yml +++ b/precompiled/qualcomm-sa8255p-proxy/tool-versions.yaml @@ -1,3 +1,3 @@ -sdk_versions: +tool_versions: qnn_context_binary: qairt: 2.37.0.250724175447_124859 diff --git a/precompiled/qualcomm-sa8295p/Whisper-Small_HfWhisperDecoder.bin b/precompiled/qualcomm-sa8295p/Whisper-Small_HfWhisperDecoder_float.bin similarity index 100% rename from precompiled/qualcomm-sa8295p/Whisper-Small_HfWhisperDecoder.bin rename to precompiled/qualcomm-sa8295p/Whisper-Small_HfWhisperDecoder_float.bin diff --git a/precompiled/qualcomm-sa8295p/Whisper-Small_HfWhisperEncoder.bin b/precompiled/qualcomm-sa8295p/Whisper-Small_HfWhisperEncoder_float.bin similarity index 100% rename from precompiled/qualcomm-sa8295p/Whisper-Small_HfWhisperEncoder.bin rename to precompiled/qualcomm-sa8295p/Whisper-Small_HfWhisperEncoder_float.bin diff --git a/precompiled/qualcomm-qcs9075-proxy/sdk_versions.yml b/precompiled/qualcomm-sa8295p/tool-versions.yaml similarity index 81% rename from precompiled/qualcomm-qcs9075-proxy/sdk_versions.yml rename to precompiled/qualcomm-sa8295p/tool-versions.yaml index cf3db9eb5c8793178dd19d986de2ebb9f7dee490..f83be1ae234292df6b302b536309cbf56a9598b0 100644 --- a/precompiled/qualcomm-qcs9075-proxy/sdk_versions.yml +++ b/precompiled/qualcomm-sa8295p/tool-versions.yaml @@ -1,3 +1,3 @@ -sdk_versions: +tool_versions: qnn_context_binary: qairt: 2.37.0.250724175447_124859-auto diff --git a/precompiled/qualcomm-sa8650p-proxy/Whisper-Small_HfWhisperDecoder.bin b/precompiled/qualcomm-sa8650p-proxy/Whisper-Small_HfWhisperDecoder_float.bin similarity index 100% rename from precompiled/qualcomm-sa8650p-proxy/Whisper-Small_HfWhisperDecoder.bin rename to precompiled/qualcomm-sa8650p-proxy/Whisper-Small_HfWhisperDecoder_float.bin diff --git a/precompiled/qualcomm-sa8650p-proxy/Whisper-Small_HfWhisperEncoder.bin b/precompiled/qualcomm-sa8650p-proxy/Whisper-Small_HfWhisperEncoder_float.bin similarity index 100% rename from precompiled/qualcomm-sa8650p-proxy/Whisper-Small_HfWhisperEncoder.bin rename to precompiled/qualcomm-sa8650p-proxy/Whisper-Small_HfWhisperEncoder_float.bin diff --git a/precompiled/qualcomm-sa8650p-proxy/sdk_versions.yml b/precompiled/qualcomm-sa8650p-proxy/sdk_versions.yml deleted file mode 100644 index 645a4ba899019438314a76813152c259f4f74b92..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-sa8650p-proxy/sdk_versions.yml +++ /dev/null @@ -1,3 +0,0 @@ -sdk_versions: - qnn_context_binary: - qairt: 2.37.0.250724175447_124859 diff --git a/precompiled/qualcomm-qcs8550-proxy/sdk_versions.yml b/precompiled/qualcomm-sa8650p-proxy/tool-versions.yaml similarity index 80% rename from precompiled/qualcomm-qcs8550-proxy/sdk_versions.yml rename to precompiled/qualcomm-sa8650p-proxy/tool-versions.yaml index 645a4ba899019438314a76813152c259f4f74b92..bb24388e3ba98d34090587000fa8f77ca5b64cf0 100644 --- a/precompiled/qualcomm-qcs8550-proxy/sdk_versions.yml +++ b/precompiled/qualcomm-sa8650p-proxy/tool-versions.yaml @@ -1,3 +1,3 @@ -sdk_versions: +tool_versions: qnn_context_binary: qairt: 2.37.0.250724175447_124859 diff --git a/precompiled/qualcomm-sa8775p/Whisper-Small_HfWhisperDecoder.bin b/precompiled/qualcomm-sa8775p/Whisper-Small_HfWhisperDecoder_float.bin similarity index 100% rename from precompiled/qualcomm-sa8775p/Whisper-Small_HfWhisperDecoder.bin rename to precompiled/qualcomm-sa8775p/Whisper-Small_HfWhisperDecoder_float.bin diff --git a/precompiled/qualcomm-sa8775p/Whisper-Small_HfWhisperEncoder.bin b/precompiled/qualcomm-sa8775p/Whisper-Small_HfWhisperEncoder_float.bin similarity index 100% rename from precompiled/qualcomm-sa8775p/Whisper-Small_HfWhisperEncoder.bin rename to precompiled/qualcomm-sa8775p/Whisper-Small_HfWhisperEncoder_float.bin diff --git a/precompiled/qualcomm-sa8775p/sdk_versions.yml b/precompiled/qualcomm-sa8775p/sdk_versions.yml deleted file mode 100644 index cf3db9eb5c8793178dd19d986de2ebb9f7dee490..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-sa8775p/sdk_versions.yml +++ /dev/null @@ -1,3 +0,0 @@ -sdk_versions: - qnn_context_binary: - qairt: 2.37.0.250724175447_124859-auto diff --git a/precompiled/qualcomm-sa8775p/tool-versions.yaml b/precompiled/qualcomm-sa8775p/tool-versions.yaml new file mode 100644 index 0000000000000000000000000000000000000000..f83be1ae234292df6b302b536309cbf56a9598b0 --- /dev/null +++ b/precompiled/qualcomm-sa8775p/tool-versions.yaml @@ -0,0 +1,3 @@ +tool_versions: + qnn_context_binary: + qairt: 2.37.0.250724175447_124859-auto diff --git a/precompiled/qualcomm-snapdragon-8-elite/Whisper-Small_HfWhisperDecoder.onnx.zip b/precompiled/qualcomm-snapdragon-8-elite/Whisper-Small_HfWhisperDecoder.onnx.zip deleted file mode 100644 index 9866c6fb13dc393db504fd52dc573fbb39822bda..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-snapdragon-8-elite/Whisper-Small_HfWhisperDecoder.onnx.zip +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:5e6f9e7608a66b9f1d3af0659f51441e5686b403097d368a56f14c7ed9603607 -size 330432535 diff --git a/precompiled/qualcomm-snapdragon-8-elite/Whisper-Small_HfWhisperDecoder.bin b/precompiled/qualcomm-snapdragon-8-elite/Whisper-Small_HfWhisperDecoder_float.bin similarity index 100% rename from precompiled/qualcomm-snapdragon-8-elite/Whisper-Small_HfWhisperDecoder.bin rename to precompiled/qualcomm-snapdragon-8-elite/Whisper-Small_HfWhisperDecoder_float.bin diff --git a/precompiled/qualcomm-snapdragon-8-elite/Whisper-Small_HfWhisperDecoder_float.onnx.zip b/precompiled/qualcomm-snapdragon-8-elite/Whisper-Small_HfWhisperDecoder_float.onnx.zip new file mode 100644 index 0000000000000000000000000000000000000000..7af2e23f363d34aea1827860bf5582598650530b --- /dev/null +++ b/precompiled/qualcomm-snapdragon-8-elite/Whisper-Small_HfWhisperDecoder_float.onnx.zip @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:462ec6a945f5b9ef4525eb6db508b1133f2c2630437d61bf15ed84016ba15ce4 +size 330380681 diff --git a/precompiled/qualcomm-snapdragon-8-elite/Whisper-Small_HfWhisperEncoder.onnx.zip b/precompiled/qualcomm-snapdragon-8-elite/Whisper-Small_HfWhisperEncoder.onnx.zip deleted file mode 100644 index f7d237af41c97015e5fbba2ae833ea06379ff492..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-snapdragon-8-elite/Whisper-Small_HfWhisperEncoder.onnx.zip +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:4504dedf932f69c95aaa30df710e8bdce98787992fd4b6d5bf17d0a215c956ee -size 196175657 diff --git a/precompiled/qualcomm-snapdragon-8-elite/Whisper-Small_HfWhisperEncoder.bin b/precompiled/qualcomm-snapdragon-8-elite/Whisper-Small_HfWhisperEncoder_float.bin similarity index 100% rename from precompiled/qualcomm-snapdragon-8-elite/Whisper-Small_HfWhisperEncoder.bin rename to precompiled/qualcomm-snapdragon-8-elite/Whisper-Small_HfWhisperEncoder_float.bin diff --git a/precompiled/qualcomm-snapdragon-8-elite/Whisper-Small_HfWhisperEncoder_float.onnx.zip b/precompiled/qualcomm-snapdragon-8-elite/Whisper-Small_HfWhisperEncoder_float.onnx.zip new file mode 100644 index 0000000000000000000000000000000000000000..a0211fffc82b2ff0e04cf3ea7ed5146ba75a2269 --- /dev/null +++ b/precompiled/qualcomm-snapdragon-8-elite/Whisper-Small_HfWhisperEncoder_float.onnx.zip @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7865d9114f0987c317a2f00283a481d707b8b6ea2bac1741b1b535861f950fe8 +size 197405579 diff --git a/precompiled/qualcomm-snapdragon-8-elite/sdk_versions.yml b/precompiled/qualcomm-snapdragon-8-elite/sdk_versions.yml deleted file mode 100644 index 609bfba19166f29f971a2e5925e62115df03422c..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-snapdragon-8-elite/sdk_versions.yml +++ /dev/null @@ -1,6 +0,0 @@ -sdk_versions: - qnn_context_binary: - qairt: 2.37.0.250724175447_124859 - precompiled_qnn_onnx: - qairt: 2.33.2.250410134701_117956 - onnx_runtime: 1.22.0 diff --git a/precompiled/qualcomm-snapdragon-8-elite/tool-versions.yaml b/precompiled/qualcomm-snapdragon-8-elite/tool-versions.yaml new file mode 100644 index 0000000000000000000000000000000000000000..f0a567e21880e5efda78dc062ffeb343dbb1976b --- /dev/null +++ b/precompiled/qualcomm-snapdragon-8-elite/tool-versions.yaml @@ -0,0 +1,4 @@ +tool_versions: + precompiled_qnn_onnx: + qairt: 2.36.4.250725200057_123280 + onnx_runtime: 1.22.0 diff --git a/precompiled/qualcomm-snapdragon-8gen2/Whisper-Small_HfWhisperDecoder.onnx.zip b/precompiled/qualcomm-snapdragon-8gen2/Whisper-Small_HfWhisperDecoder.onnx.zip deleted file mode 100644 index a9cd2e720f4efc690c3d288d237fd597e36543b4..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-snapdragon-8gen2/Whisper-Small_HfWhisperDecoder.onnx.zip +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:b04c2fa55da6ceb37c9782f431b4d96e54e9b9566bf6cd2dbac2b7c1b5f61d00 -size 330469625 diff --git a/precompiled/qualcomm-snapdragon-8gen2/Whisper-Small_HfWhisperDecoder.bin b/precompiled/qualcomm-snapdragon-8gen2/Whisper-Small_HfWhisperDecoder_float.bin similarity index 100% rename from precompiled/qualcomm-snapdragon-8gen2/Whisper-Small_HfWhisperDecoder.bin rename to precompiled/qualcomm-snapdragon-8gen2/Whisper-Small_HfWhisperDecoder_float.bin diff --git a/precompiled/qualcomm-snapdragon-8gen2/Whisper-Small_HfWhisperDecoder_float.onnx.zip b/precompiled/qualcomm-snapdragon-8gen2/Whisper-Small_HfWhisperDecoder_float.onnx.zip new file mode 100644 index 0000000000000000000000000000000000000000..4f31ff72758d7ae780fa869f9d9f847cd3fb962f --- /dev/null +++ b/precompiled/qualcomm-snapdragon-8gen2/Whisper-Small_HfWhisperDecoder_float.onnx.zip @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:849b30b9d605b2637bc84cf28ff24cf96c0b0376f4cf8cf3e49d620bcca6fb4f +size 330402720 diff --git a/precompiled/qualcomm-snapdragon-8gen2/Whisper-Small_HfWhisperEncoder.onnx.zip b/precompiled/qualcomm-snapdragon-8gen2/Whisper-Small_HfWhisperEncoder.onnx.zip deleted file mode 100644 index 80ee4d9719920377a6c6b756075bf91714f52474..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-snapdragon-8gen2/Whisper-Small_HfWhisperEncoder.onnx.zip +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:4d8ff7c7f3d4b47231792485ba27b0504d97fed4ba7f63448404a71694648799 -size 197747935 diff --git a/precompiled/qualcomm-snapdragon-8gen2/Whisper-Small_HfWhisperEncoder.bin b/precompiled/qualcomm-snapdragon-8gen2/Whisper-Small_HfWhisperEncoder_float.bin similarity index 100% rename from precompiled/qualcomm-snapdragon-8gen2/Whisper-Small_HfWhisperEncoder.bin rename to precompiled/qualcomm-snapdragon-8gen2/Whisper-Small_HfWhisperEncoder_float.bin diff --git a/precompiled/qualcomm-snapdragon-8gen2/Whisper-Small_HfWhisperEncoder_float.onnx.zip b/precompiled/qualcomm-snapdragon-8gen2/Whisper-Small_HfWhisperEncoder_float.onnx.zip new file mode 100644 index 0000000000000000000000000000000000000000..a86e62c4f873d3ed0cddaf71f3f6ded03a3e2a6c --- /dev/null +++ b/precompiled/qualcomm-snapdragon-8gen2/Whisper-Small_HfWhisperEncoder_float.onnx.zip @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bbc7d5ec1dec2a42cc59957d0f5469bab1077e5ddd15cfcfe06122e93caf588 +size 197781387 diff --git a/precompiled/qualcomm-snapdragon-8gen2/sdk_versions.yml b/precompiled/qualcomm-snapdragon-8gen2/sdk_versions.yml deleted file mode 100644 index 609bfba19166f29f971a2e5925e62115df03422c..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-snapdragon-8gen2/sdk_versions.yml +++ /dev/null @@ -1,6 +0,0 @@ -sdk_versions: - qnn_context_binary: - qairt: 2.37.0.250724175447_124859 - precompiled_qnn_onnx: - qairt: 2.33.2.250410134701_117956 - onnx_runtime: 1.22.0 diff --git a/precompiled/qualcomm-snapdragon-8gen2/tool-versions.yaml b/precompiled/qualcomm-snapdragon-8gen2/tool-versions.yaml new file mode 100644 index 0000000000000000000000000000000000000000..f0a567e21880e5efda78dc062ffeb343dbb1976b --- /dev/null +++ b/precompiled/qualcomm-snapdragon-8gen2/tool-versions.yaml @@ -0,0 +1,4 @@ +tool_versions: + precompiled_qnn_onnx: + qairt: 2.36.4.250725200057_123280 + onnx_runtime: 1.22.0 diff --git a/precompiled/qualcomm-snapdragon-8gen3/Whisper-Small_HfWhisperDecoder.onnx.zip b/precompiled/qualcomm-snapdragon-8gen3/Whisper-Small_HfWhisperDecoder.onnx.zip deleted file mode 100644 index e68a6e98896b4f536252c93392b335e55a542f94..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-snapdragon-8gen3/Whisper-Small_HfWhisperDecoder.onnx.zip +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:7d668ec279ebd2a01525fd320e389fb140b31d1cdc5490cc31fc971de436935e -size 330472065 diff --git a/precompiled/qualcomm-snapdragon-8gen3/Whisper-Small_HfWhisperDecoder.bin b/precompiled/qualcomm-snapdragon-8gen3/Whisper-Small_HfWhisperDecoder_float.bin similarity index 100% rename from precompiled/qualcomm-snapdragon-8gen3/Whisper-Small_HfWhisperDecoder.bin rename to precompiled/qualcomm-snapdragon-8gen3/Whisper-Small_HfWhisperDecoder_float.bin diff --git a/precompiled/qualcomm-snapdragon-8gen3/Whisper-Small_HfWhisperDecoder_float.onnx.zip b/precompiled/qualcomm-snapdragon-8gen3/Whisper-Small_HfWhisperDecoder_float.onnx.zip new file mode 100644 index 0000000000000000000000000000000000000000..fd184b44ea5820c171246a4ee09c5e8390965bcb --- /dev/null +++ b/precompiled/qualcomm-snapdragon-8gen3/Whisper-Small_HfWhisperDecoder_float.onnx.zip @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e3e8f51a9ff3843c43d0fca4939ede91feaece760ddb714a35c6ccdb7287820 +size 330404945 diff --git a/precompiled/qualcomm-snapdragon-8gen3/Whisper-Small_HfWhisperEncoder.onnx.zip b/precompiled/qualcomm-snapdragon-8gen3/Whisper-Small_HfWhisperEncoder.onnx.zip deleted file mode 100644 index 5747e3f4713c160b27244a0dcec738bc6fee33aa..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-snapdragon-8gen3/Whisper-Small_HfWhisperEncoder.onnx.zip +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:2e983757f38c492f2b54de9901d010de394eeda13cd07daa608466401838849b -size 196723296 diff --git a/precompiled/qualcomm-snapdragon-8gen3/Whisper-Small_HfWhisperEncoder.bin b/precompiled/qualcomm-snapdragon-8gen3/Whisper-Small_HfWhisperEncoder_float.bin similarity index 100% rename from precompiled/qualcomm-snapdragon-8gen3/Whisper-Small_HfWhisperEncoder.bin rename to precompiled/qualcomm-snapdragon-8gen3/Whisper-Small_HfWhisperEncoder_float.bin diff --git a/precompiled/qualcomm-snapdragon-8gen3/Whisper-Small_HfWhisperEncoder_float.onnx.zip b/precompiled/qualcomm-snapdragon-8gen3/Whisper-Small_HfWhisperEncoder_float.onnx.zip new file mode 100644 index 0000000000000000000000000000000000000000..0ed2c7bb93c30e35d97bf54b10f30aaec2f1d7cf --- /dev/null +++ b/precompiled/qualcomm-snapdragon-8gen3/Whisper-Small_HfWhisperEncoder_float.onnx.zip @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dda43de8e790e883f98e643b71fd443806358675761d229879cba3bf94eb38d2 +size 197877968 diff --git a/precompiled/qualcomm-snapdragon-8gen3/sdk_versions.yml b/precompiled/qualcomm-snapdragon-8gen3/sdk_versions.yml deleted file mode 100644 index 609bfba19166f29f971a2e5925e62115df03422c..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-snapdragon-8gen3/sdk_versions.yml +++ /dev/null @@ -1,6 +0,0 @@ -sdk_versions: - qnn_context_binary: - qairt: 2.37.0.250724175447_124859 - precompiled_qnn_onnx: - qairt: 2.33.2.250410134701_117956 - onnx_runtime: 1.22.0 diff --git a/precompiled/qualcomm-snapdragon-8gen3/tool-versions.yaml b/precompiled/qualcomm-snapdragon-8gen3/tool-versions.yaml new file mode 100644 index 0000000000000000000000000000000000000000..f0a567e21880e5efda78dc062ffeb343dbb1976b --- /dev/null +++ b/precompiled/qualcomm-snapdragon-8gen3/tool-versions.yaml @@ -0,0 +1,4 @@ +tool_versions: + precompiled_qnn_onnx: + qairt: 2.36.4.250725200057_123280 + onnx_runtime: 1.22.0 diff --git a/precompiled/qualcomm-snapdragon-x-elite/Whisper-Small_HfWhisperDecoder.onnx.zip b/precompiled/qualcomm-snapdragon-x-elite/Whisper-Small_HfWhisperDecoder.onnx.zip deleted file mode 100644 index c0ee2f58ebb0401352691ca2bda6256122fc7b39..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-snapdragon-x-elite/Whisper-Small_HfWhisperDecoder.onnx.zip +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:43425810d8d78355c30f3cffe5943904f7d36aa212c191ddacfdb22c3d28a6d9 -size 330473991 diff --git a/precompiled/qualcomm-snapdragon-x-elite/Whisper-Small_HfWhisperDecoder.bin b/precompiled/qualcomm-snapdragon-x-elite/Whisper-Small_HfWhisperDecoder_float.bin similarity index 100% rename from precompiled/qualcomm-snapdragon-x-elite/Whisper-Small_HfWhisperDecoder.bin rename to precompiled/qualcomm-snapdragon-x-elite/Whisper-Small_HfWhisperDecoder_float.bin diff --git a/precompiled/qualcomm-snapdragon-x-elite/Whisper-Small_HfWhisperDecoder_float.onnx.zip b/precompiled/qualcomm-snapdragon-x-elite/Whisper-Small_HfWhisperDecoder_float.onnx.zip new file mode 100644 index 0000000000000000000000000000000000000000..5bd2d20209ab25c413eef82b7a1e3cfd8f0cbde5 --- /dev/null +++ b/precompiled/qualcomm-snapdragon-x-elite/Whisper-Small_HfWhisperDecoder_float.onnx.zip @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad41ef6240de4b20ce99c279d813def49a961e8f6e9ced831f5b924541696337 +size 330399718 diff --git a/precompiled/qualcomm-snapdragon-x-elite/Whisper-Small_HfWhisperEncoder.onnx.zip b/precompiled/qualcomm-snapdragon-x-elite/Whisper-Small_HfWhisperEncoder.onnx.zip deleted file mode 100644 index 8f3e07eaf7955321c0e34d84faee03b6685ed008..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-snapdragon-x-elite/Whisper-Small_HfWhisperEncoder.onnx.zip +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:38e489759b13e47a1d158e16486785751334a3dfb3730d47b5787c651a5ee92e -size 197739694 diff --git a/precompiled/qualcomm-snapdragon-x-elite/Whisper-Small_HfWhisperEncoder.bin b/precompiled/qualcomm-snapdragon-x-elite/Whisper-Small_HfWhisperEncoder_float.bin similarity index 100% rename from precompiled/qualcomm-snapdragon-x-elite/Whisper-Small_HfWhisperEncoder.bin rename to precompiled/qualcomm-snapdragon-x-elite/Whisper-Small_HfWhisperEncoder_float.bin diff --git a/precompiled/qualcomm-snapdragon-x-elite/Whisper-Small_HfWhisperEncoder_float.onnx.zip b/precompiled/qualcomm-snapdragon-x-elite/Whisper-Small_HfWhisperEncoder_float.onnx.zip new file mode 100644 index 0000000000000000000000000000000000000000..e244420d55aff9031eaa50cfaa530640ad06e641 --- /dev/null +++ b/precompiled/qualcomm-snapdragon-x-elite/Whisper-Small_HfWhisperEncoder_float.onnx.zip @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d7006a0fec80cc2bd09a08502375db536829c625ee27792afc7d8034af414dd +size 197719459 diff --git a/precompiled/qualcomm-snapdragon-x-elite/sdk_versions.yml b/precompiled/qualcomm-snapdragon-x-elite/sdk_versions.yml deleted file mode 100644 index 609bfba19166f29f971a2e5925e62115df03422c..0000000000000000000000000000000000000000 --- a/precompiled/qualcomm-snapdragon-x-elite/sdk_versions.yml +++ /dev/null @@ -1,6 +0,0 @@ -sdk_versions: - qnn_context_binary: - qairt: 2.37.0.250724175447_124859 - precompiled_qnn_onnx: - qairt: 2.33.2.250410134701_117956 - onnx_runtime: 1.22.0 diff --git a/precompiled/qualcomm-snapdragon-x-elite/tool-versions.yaml b/precompiled/qualcomm-snapdragon-x-elite/tool-versions.yaml new file mode 100644 index 0000000000000000000000000000000000000000..f0a567e21880e5efda78dc062ffeb343dbb1976b --- /dev/null +++ b/precompiled/qualcomm-snapdragon-x-elite/tool-versions.yaml @@ -0,0 +1,4 @@ +tool_versions: + precompiled_qnn_onnx: + qairt: 2.36.4.250725200057_123280 + onnx_runtime: 1.22.0