Commit
·
ec0ed95
1
Parent(s):
610de97
Upload Phi-4-multimodal-instruct ONNX models
Browse files
- LICENSE +21 -0
- config.json +3 -0
- gpu/gpu-int4-rtn-block-32/added_tokens.json +3 -0
- gpu/gpu-int4-rtn-block-32/genai_config.json +3 -0
- gpu/gpu-int4-rtn-block-32/merges.txt +0 -0
- gpu/gpu-int4-rtn-block-32/phi-4-mm-embedding.onnx +3 -0
- gpu/gpu-int4-rtn-block-32/phi-4-mm-embedding.onnx.data +3 -0
- gpu/gpu-int4-rtn-block-32/phi-4-mm-speech.onnx +3 -0
- gpu/gpu-int4-rtn-block-32/phi-4-mm-speech.onnx.data +3 -0
- gpu/gpu-int4-rtn-block-32/phi-4-mm-speech.onnx_adapter +3 -0
- gpu/gpu-int4-rtn-block-32/phi-4-mm-text.onnx +3 -0
- gpu/gpu-int4-rtn-block-32/phi-4-mm-text.onnx.data +3 -0
- gpu/gpu-int4-rtn-block-32/phi-4-mm-vision.onnx +3 -0
- gpu/gpu-int4-rtn-block-32/phi-4-mm-vision.onnx.data +3 -0
- gpu/gpu-int4-rtn-block-32/phi-4-mm-vision.onnx_adapter +3 -0
- gpu/gpu-int4-rtn-block-32/special_tokens_map.json +3 -0
- gpu/gpu-int4-rtn-block-32/speech_processor.json +3 -0
- gpu/gpu-int4-rtn-block-32/tokenizer.json +3 -0
- gpu/gpu-int4-rtn-block-32/tokenizer_config.json +3 -0
- gpu/gpu-int4-rtn-block-32/vision_processor.json +3 -0
- gpu/gpu-int4-rtn-block-32/vocab.json +3 -0
LICENSE
ADDED
@@ -0,0 +1,21 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
MIT License
|
2 |
+
|
3 |
+
Copyright (c) Microsoft Corporation.
|
4 |
+
|
5 |
+
Permission is hereby granted, free of charge, to any person obtaining a copy
|
6 |
+
of this software and associated documentation files (the "Software"), to deal
|
7 |
+
in the Software without restriction, including without limitation the rights
|
8 |
+
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
9 |
+
copies of the Software, and to permit persons to whom the Software is
|
10 |
+
furnished to do so, subject to the following conditions:
|
11 |
+
|
12 |
+
The above copyright notice and this permission notice shall be included in all
|
13 |
+
copies or substantial portions of the Software.
|
14 |
+
|
15 |
+
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
16 |
+
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
17 |
+
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
18 |
+
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
19 |
+
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
20 |
+
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
|
21 |
+
SOFTWARE.
|
config.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:49e1c05f93d43d7f17715b779a2576235b019f587285d7d914e5b05156253f62
|
3 |
+
size 4631
|
gpu/gpu-int4-rtn-block-32/added_tokens.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d4f2aceb0f20b71dd1f4bcc7e052e4412946bf281840b8f83d39f259571af486
|
3 |
+
size 249
|
gpu/gpu-int4-rtn-block-32/genai_config.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d674802d88d850c2f8cf2361f419160f2c739376c78361f00736740c9e6658e3
|
3 |
+
size 2919
|
gpu/gpu-int4-rtn-block-32/merges.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
gpu/gpu-int4-rtn-block-32/phi-4-mm-embedding.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e201c5981608c06f93b15860993bf6029cfc3f60401290926c404ab84946dddd
|
3 |
+
size 12008
|
gpu/gpu-int4-rtn-block-32/phi-4-mm-embedding.onnx.data
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:85e0389fd112f00584016e1429588410e07f548cbedc5111c84bafabb14c825b
|
3 |
+
size 1229193216
|
gpu/gpu-int4-rtn-block-32/phi-4-mm-speech.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7b3d608bbc3affc2228f065f38962efc59cfb219ab21bcb3add01267b6e97ce3
|
3 |
+
size 428970
|
gpu/gpu-int4-rtn-block-32/phi-4-mm-speech.onnx.data
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d28dc86d07fe3469e307bf06d6ad05dde254f58b7e5625d9b6f88ac65284878e
|
3 |
+
size 519824640
|
gpu/gpu-int4-rtn-block-32/phi-4-mm-speech.onnx_adapter
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:67d2ef0f27d22477f5c48f750b25c67e728b79c72d7c72ae5dd5c2090dd48ddd
|
3 |
+
size 312704560
|
gpu/gpu-int4-rtn-block-32/phi-4-mm-text.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f84c26e4745958d98628619dbc9f6bc17cf72d9642a34053197301a9f6e10b18
|
3 |
+
size 236917443
|
gpu/gpu-int4-rtn-block-32/phi-4-mm-text.onnx.data
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e64a9c88de1e7e316e11a6a86e063a533ce26cc8e92e65003e2daebf6e0106b6
|
3 |
+
size 2184001536
|
gpu/gpu-int4-rtn-block-32/phi-4-mm-vision.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c5ef47554450d7bf96f9dcfe28e6bbf2c99beddcd5dfc8786d69713b7f70e9fd
|
3 |
+
size 376524
|
gpu/gpu-int4-rtn-block-32/phi-4-mm-vision.onnx.data
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0faf7f9b430c3092737e96e5f98b5509022e8cd5063cc5c05e4987503fbd7728
|
3 |
+
size 383529536
|
gpu/gpu-int4-rtn-block-32/phi-4-mm-vision.onnx_adapter
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b596e59e6092dfda593f449abc7c6437cf46cc1f366e5283475299ae2e7629ab
|
3 |
+
size 250183216
|
gpu/gpu-int4-rtn-block-32/special_tokens_map.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aff38493227d813e29fcf8406e8e90062f1f031aa47d589325e9c31d89ac7cc3
|
3 |
+
size 587
|
gpu/gpu-int4-rtn-block-32/speech_processor.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:77ac9c85f4cc8b947bdd19d77ba71de814f76ef6658130e344ee4ecc2eef7014
|
3 |
+
size 1799
|
gpu/gpu-int4-rtn-block-32/tokenizer.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4c1b9f641d4f8b7247b8d5007dd3b6a9f6a87cb5123134fe0d326f14d10c0585
|
3 |
+
size 15524479
|
gpu/gpu-int4-rtn-block-32/tokenizer_config.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:60d63678e0cfc6c6c3deb98419b4326a3ada8680165aa0318389355383208b41
|
3 |
+
size 3274
|
gpu/gpu-int4-rtn-block-32/vision_processor.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e40a4384c7f530f73514fd87d3fe9219be2a012fded0037bfa06a5468067623a
|
3 |
+
size 2010
|
gpu/gpu-int4-rtn-block-32/vocab.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6cb65a857824fa6615bb1782d95d882617a8bbce1da0317118586b36f39e98bd
|
3 |
+
size 3910310
|