Add new files to repository
Browse files
- config.json +3 -2
- generation_config.json +1 -1
- onnx/model.onnx +3 -0
- onnx/model_bnb4.onnx +3 -0
- onnx/model_fp16.onnx +3 -0
- onnx/model_int8.onnx +3 -0
- onnx/model_q4.onnx +3 -0
- onnx/model_q4f16.onnx +3 -0
- onnx/model_quantized.onnx +3 -0
- onnx/model_uint8.onnx +3 -0
- quantize_config.json +18 -0
config.json
CHANGED
@@ -25,7 +25,8 @@
|
|
25 |
"rope_scaling": null,
|
26 |
"rope_theta": 10000.0,
|
27 |
"tie_word_embeddings": false,
|
28 |
-
"
|
29 |
-
"
|
|
|
30 |
"vocab_size": 32000
|
31 |
}
|
|
|
25 |
"rope_scaling": null,
|
26 |
"rope_theta": 10000.0,
|
27 |
"tie_word_embeddings": false,
|
28 |
+
"torch_dtype": "float32",
|
29 |
+
"transformers_version": "4.49.0",
|
30 |
+
"use_cache": true,
|
31 |
"vocab_size": 32000
|
32 |
}
|
generation_config.json
CHANGED
@@ -3,5 +3,5 @@
|
|
3 |
"bos_token_id": 1,
|
4 |
"eos_token_id": 2,
|
5 |
"pad_token_id": 0,
|
6 |
-
"transformers_version": "4.
|
7 |
}
|
|
|
3 |
"bos_token_id": 1,
|
4 |
"eos_token_id": 2,
|
5 |
"pad_token_id": 0,
|
6 |
+
"transformers_version": "4.49.0"
|
7 |
}
|
onnx/model.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9aa4bfd0970e36a19a1b2e6127a188d0a803398f0d29ab3e3e9b030acdae2139
|
3 |
+
size 649920885
|
onnx/model_bnb4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:adc7059722bae4fb925d0a73f409c97666ece55f17fe2914aad51d2acc8e36ba
|
3 |
+
size 176170279
|
onnx/model_fp16.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a4a785ae43577058a2ac5414c8dd3001f74d6945894b9cd1d4324e54fb69e85b
|
3 |
+
size 325091713
|
onnx/model_int8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bb442954e76e56b333c0e2f56624f541bbb527fdc1a8277a20893874404386db
|
3 |
+
size 162818537
|
onnx/model_q4.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2daffba27d3c9e8660b28a815802e406402b08b4b603ca2ecc358d70d4b043af
|
3 |
+
size 184783537
|
onnx/model_q4f16.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:385ae25e0416b73086b90bf7cf4687ae4b552f026a89da2e3a1af573fe0132fc
|
3 |
+
size 126984987
|
onnx/model_quantized.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bb442954e76e56b333c0e2f56624f541bbb527fdc1a8277a20893874404386db
|
3 |
+
size 162818537
|
onnx/model_uint8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:48d4f752716773d086c8507f315ef5390bcc18efff53d38e7981e225a25f66d9
|
3 |
+
size 162818574
|
quantize_config.json
ADDED
@@ -0,0 +1,18 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"modes": [
|
3 |
+
"fp16",
|
4 |
+
"q8",
|
5 |
+
"int8",
|
6 |
+
"uint8",
|
7 |
+
"q4",
|
8 |
+
"q4f16",
|
9 |
+
"bnb4"
|
10 |
+
],
|
11 |
+
"per_channel": false,
|
12 |
+
"reduce_range": false,
|
13 |
+
"block_size": null,
|
14 |
+
"is_symmetric": true,
|
15 |
+
"accuracy_level": null,
|
16 |
+
"quant_type": 1,
|
17 |
+
"op_block_list": null
|
18 |
+
}
|