Xenova HF staff committed on
Commit
be39539
1 Parent(s): 021674c

Upload folder using huggingface_hub

Browse files
config.json CHANGED
@@ -35,7 +35,7 @@
35
  },
36
  "tie_word_embeddings": false,
37
  "tokenizer_class": "GPT2Tokenizer",
38
- "transformers_version": "4.29.2",
39
  "use_cache": true,
40
  "vocab_size": 51200
41
  }
 
35
  },
36
  "tie_word_embeddings": false,
37
  "tokenizer_class": "GPT2Tokenizer",
38
+ "transformers_version": "4.33.0.dev0",
39
  "use_cache": true,
40
  "vocab_size": 51200
41
  }
generation_config.json CHANGED
@@ -2,5 +2,5 @@
2
  "_from_model_config": true,
3
  "bos_token_id": 1,
4
  "eos_token_id": 50256,
5
- "transformers_version": "4.29.2"
6
  }
 
2
  "_from_model_config": true,
3
  "bos_token_id": 1,
4
  "eos_token_id": 50256,
5
+ "transformers_version": "4.33.0.dev0"
6
  }
onnx/decoder_model.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:001ffadb35ae890965862447cb2a898a65d6773bb63bfc1e54e8eb5157d8b4b6
3
- size 1435433361
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6e253a493c957bf95f09bcdf7993e6b5a2d186c11ecceb26552b13c11a5056c6
3
+ size 1435431277
onnx/decoder_model_merged.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5144a56780c9634fd33f2c222c33e43d9c86d2bc10270d4e819f64761f5a00cc
3
- size 1436616692
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aab6c0373942118feca0695cae8731c0870b4aff536bd53520ad90dc02672348
3
+ size 1440806543
onnx/decoder_model_merged_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ea712a8bc11dedd856351158bd57f7559cb5f76b9f5fbbfe0a287daaf2b0db70
3
- size 370397170
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aa7ebc46ccff17b6ceb88f22374d66b88e2a97e8db3cd2fa656d8407a8b21642
3
+ size 373406712
onnx/decoder_model_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1211fd052d96727b54ec9ae545c18eb759aa112a79c72122526397dfe16226de
3
- size 368793710
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb38edfc1cbf1dfff557ca96a9b7b4360eb7ee156b30a703c4f5e18de60dee6a
3
+ size 367612429
onnx/decoder_with_past_model.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:58c23045d67dfe409d2482c2d63d12c2df4ced0fc501f762d1d4fe84564b7616
3
- size 1432225419
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:66bfd6759c350ba9a1ce93618f279eca8ecc0e5c23b83d7c21eef10bf3ef236c
3
+ size 1432223346
onnx/decoder_with_past_model_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b539fa9219b2f212463333eeb53f3a594f3b7df68c32dc4616d660085961ed52
3
- size 364276590
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fce1369c36d39319d1a6088d18edae2a4fd18e9bfadffc07eac4f4435fd128a8
3
+ size 363095324
quantize_config.json ADDED
@@ -0,0 +1,103 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "per_channel": false,
3
+ "reduce_range": false,
4
+ "per_model_config": {
5
+ "decoder_model": {
6
+ "op_types": [
7
+ "MatMul",
8
+ "Tanh",
9
+ "Unsqueeze",
10
+ "Range",
11
+ "Add",
12
+ "Sqrt",
13
+ "Slice",
14
+ "Split",
15
+ "Sub",
16
+ "Where",
17
+ "Transpose",
18
+ "ReduceMean",
19
+ "Softmax",
20
+ "Shape",
21
+ "Mul",
22
+ "Equal",
23
+ "Reshape",
24
+ "Squeeze",
25
+ "Concat",
26
+ "Pow",
27
+ "Constant",
28
+ "ConstantOfShape",
29
+ "Expand",
30
+ "Cast",
31
+ "Gather",
32
+ "Div",
33
+ "Neg"
34
+ ],
35
+ "weight_type": "QInt8"
36
+ },
37
+ "decoder_model_merged": {
38
+ "op_types": [
39
+ "MatMul",
40
+ "Tanh",
41
+ "Unsqueeze",
42
+ "Range",
43
+ "Add",
44
+ "Sqrt",
45
+ "Slice",
46
+ "Split",
47
+ "Sub",
48
+ "Where",
49
+ "Transpose",
50
+ "ReduceMean",
51
+ "Softmax",
52
+ "Shape",
53
+ "If",
54
+ "Mul",
55
+ "Equal",
56
+ "Reshape",
57
+ "Squeeze",
58
+ "Concat",
59
+ "Pow",
60
+ "Constant",
61
+ "ConstantOfShape",
62
+ "Expand",
63
+ "Cast",
64
+ "Gather",
65
+ "Div",
66
+ "Neg"
67
+ ],
68
+ "weight_type": "QInt8"
69
+ },
70
+ "decoder_with_past_model": {
71
+ "op_types": [
72
+ "MatMul",
73
+ "Tanh",
74
+ "Unsqueeze",
75
+ "Range",
76
+ "Add",
77
+ "Sqrt",
78
+ "Slice",
79
+ "Split",
80
+ "Sub",
81
+ "Where",
82
+ "Transpose",
83
+ "ReduceMean",
84
+ "Softmax",
85
+ "Shape",
86
+ "Mul",
87
+ "Equal",
88
+ "Reshape",
89
+ "Squeeze",
90
+ "Concat",
91
+ "Pow",
92
+ "Constant",
93
+ "ConstantOfShape",
94
+ "Expand",
95
+ "Cast",
96
+ "Gather",
97
+ "Div",
98
+ "Neg"
99
+ ],
100
+ "weight_type": "QInt8"
101
+ }
102
+ }
103
+ }