lakpriya committed on
Commit
d2d7638
·
verified ·
1 Parent(s): 9d44b94

Add new files to repository

Browse files
config.json CHANGED
@@ -25,7 +25,8 @@
25
  "rope_scaling": null,
26
  "rope_theta": 10000.0,
27
  "tie_word_embeddings": false,
28
- "transformers_version": "4.48.3",
29
- "use_cache": false,
 
30
  "vocab_size": 32000
31
  }
 
25
  "rope_scaling": null,
26
  "rope_theta": 10000.0,
27
  "tie_word_embeddings": false,
28
+ "torch_dtype": "float32",
29
+ "transformers_version": "4.49.0",
30
+ "use_cache": true,
31
  "vocab_size": 32000
32
  }
generation_config.json CHANGED
@@ -3,5 +3,5 @@
3
  "bos_token_id": 1,
4
  "eos_token_id": 2,
5
  "pad_token_id": 0,
6
- "transformers_version": "4.48.3"
7
  }
 
3
  "bos_token_id": 1,
4
  "eos_token_id": 2,
5
  "pad_token_id": 0,
6
+ "transformers_version": "4.49.0"
7
  }
onnx/model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9aa4bfd0970e36a19a1b2e6127a188d0a803398f0d29ab3e3e9b030acdae2139
3
+ size 649920885
onnx/model_bnb4.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:adc7059722bae4fb925d0a73f409c97666ece55f17fe2914aad51d2acc8e36ba
3
+ size 176170279
onnx/model_fp16.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a4a785ae43577058a2ac5414c8dd3001f74d6945894b9cd1d4324e54fb69e85b
3
+ size 325091713
onnx/model_int8.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bb442954e76e56b333c0e2f56624f541bbb527fdc1a8277a20893874404386db
3
+ size 162818537
onnx/model_q4.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2daffba27d3c9e8660b28a815802e406402b08b4b603ca2ecc358d70d4b043af
3
+ size 184783537
onnx/model_q4f16.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:385ae25e0416b73086b90bf7cf4687ae4b552f026a89da2e3a1af573fe0132fc
3
+ size 126984987
onnx/model_quantized.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bb442954e76e56b333c0e2f56624f541bbb527fdc1a8277a20893874404386db
3
+ size 162818537
onnx/model_uint8.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:48d4f752716773d086c8507f315ef5390bcc18efff53d38e7981e225a25f66d9
3
+ size 162818574
quantize_config.json ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "modes": [
3
+ "fp16",
4
+ "q8",
5
+ "int8",
6
+ "uint8",
7
+ "q4",
8
+ "q4f16",
9
+ "bnb4"
10
+ ],
11
+ "per_channel": false,
12
+ "reduce_range": false,
13
+ "block_size": null,
14
+ "is_symmetric": true,
15
+ "accuracy_level": null,
16
+ "quant_type": 1,
17
+ "op_block_list": null
18
+ }