tarekziade committed on
Commit
cc33764
1 Parent(s): 940a273

Upload 16 files

Browse files
config.json CHANGED
@@ -1,4 +1,5 @@
1
  {
 
2
  "architectures": [
3
  "VisionEncoderDecoderModel"
4
  ],
@@ -2173,6 +2174,5 @@
2173
  "model_type": "vision-encoder-decoder",
2174
  "pad_token_id": 50256,
2175
  "tie_word_embeddings": false,
2176
- "torch_dtype": "float32",
2177
- "transformers_version": "4.38.2"
2178
  }
 
1
  {
2
+ "_name_or_path": "tarekziade/deit-tiny-distilgpt2",
3
  "architectures": [
4
  "VisionEncoderDecoderModel"
5
  ],
 
2174
  "model_type": "vision-encoder-decoder",
2175
  "pad_token_id": 50256,
2176
  "tie_word_embeddings": false,
2177
+ "transformers_version": "4.36.2"
 
2178
  }
generation_config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
  "bos_token_id": 50256,
3
  "eos_token_id": 50256,
4
- "transformers_version": "4.38.2"
5
  }
 
1
  {
2
  "bos_token_id": 50256,
3
  "eos_token_id": 50256,
4
+ "transformers_version": "4.36.2"
5
  }
onnx/decoder_model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:95230cea497effc8eb407b0e190bc39e9799b40048b63d6ac16ec846b0eb9be7
3
+ size 386451960
onnx/decoder_model_merged.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fcf356550b2794843a8cbc5e279b36676d025b63b95a483542c79d6256925ac8
3
+ size 387928537
onnx/decoder_model_merged_quantized.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6fd9c0ea213be12610b06cb3304c20bdd60cd8f0b2ec06c695d2dd9b72ee126c
3
+ size 99900479
onnx/decoder_model_quantized.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:96f6daab7f2de1096ba6af627903c9b022ccfb846fbdf55a334974e5e204eb18
3
+ size 98207533
onnx/decoder_with_past_model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f63e1745e472b6121f01bffbbebc0e59e7149635a8e262aa7420dbe2bb1bfc50
3
+ size 386456075
onnx/decoder_with_past_model_quantized.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d0153902ef06d3afe269072efb68b87562cb39062f1816af5bcb2a4f63653c79
3
+ size 98213050
onnx/encoder_model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1d7f4928b69e0b198701b2924a8233be2da9cdb9c1cd548a33070103e8e67a56
3
+ size 22346734
onnx/encoder_model_quantized.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0440b5a907b9d65f5a87340ff19e0f79945c3c0b216a638b99f2cb6bf27e2f48
3
+ size 6150834
quantize_config.json ADDED
@@ -0,0 +1,125 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "per_channel": false,
3
+ "reduce_range": false,
4
+ "per_model_config": {
5
+ "decoder_with_past_model": {
6
+ "op_types": [
7
+ "Sqrt",
8
+ "Tanh",
9
+ "Slice",
10
+ "Pow",
11
+ "Div",
12
+ "Range",
13
+ "ConstantOfShape",
14
+ "Split",
15
+ "Unsqueeze",
16
+ "Sub",
17
+ "Add",
18
+ "Softmax",
19
+ "Where",
20
+ "Shape",
21
+ "ReduceMean",
22
+ "Concat",
23
+ "Transpose",
24
+ "Gemm",
25
+ "Cast",
26
+ "Reshape",
27
+ "Mul",
28
+ "Gather",
29
+ "Squeeze",
30
+ "Constant",
31
+ "MatMul"
32
+ ],
33
+ "weight_type": "QInt8"
34
+ },
35
+ "decoder_model": {
36
+ "op_types": [
37
+ "Sqrt",
38
+ "Tanh",
39
+ "Slice",
40
+ "Pow",
41
+ "Div",
42
+ "Range",
43
+ "ConstantOfShape",
44
+ "Split",
45
+ "Unsqueeze",
46
+ "Sub",
47
+ "Add",
48
+ "Softmax",
49
+ "Where",
50
+ "Shape",
51
+ "ReduceMean",
52
+ "Concat",
53
+ "Transpose",
54
+ "Gemm",
55
+ "Cast",
56
+ "Reshape",
57
+ "Mul",
58
+ "Gather",
59
+ "Squeeze",
60
+ "Constant",
61
+ "MatMul"
62
+ ],
63
+ "weight_type": "QInt8"
64
+ },
65
+ "encoder_model": {
66
+ "op_types": [
67
+ "Sqrt",
68
+ "Slice",
69
+ "Pow",
70
+ "Div",
71
+ "ConstantOfShape",
72
+ "Unsqueeze",
73
+ "Conv",
74
+ "Sub",
75
+ "Erf",
76
+ "Add",
77
+ "Softmax",
78
+ "Where",
79
+ "Expand",
80
+ "Shape",
81
+ "ReduceMean",
82
+ "Concat",
83
+ "Transpose",
84
+ "Equal",
85
+ "Reshape",
86
+ "Mul",
87
+ "Gather",
88
+ "Constant",
89
+ "MatMul"
90
+ ],
91
+ "weight_type": "QUInt8"
92
+ },
93
+ "decoder_model_merged": {
94
+ "op_types": [
95
+ "Sqrt",
96
+ "Tanh",
97
+ "Slice",
98
+ "If",
99
+ "Pow",
100
+ "Div",
101
+ "Range",
102
+ "ConstantOfShape",
103
+ "Split",
104
+ "Unsqueeze",
105
+ "Sub",
106
+ "Add",
107
+ "Softmax",
108
+ "Where",
109
+ "Shape",
110
+ "ReduceMean",
111
+ "Concat",
112
+ "Transpose",
113
+ "Gemm",
114
+ "Cast",
115
+ "Reshape",
116
+ "Mul",
117
+ "Gather",
118
+ "Squeeze",
119
+ "Constant",
120
+ "MatMul"
121
+ ],
122
+ "weight_type": "QInt8"
123
+ }
124
+ }
125
+ }
special_tokens_map.json CHANGED
@@ -1,6 +1,30 @@
1
  {
2
- "bos_token": "<|endoftext|>",
3
- "eos_token": "<|endoftext|>",
4
- "pad_token": "<|endoftext|>",
5
- "unk_token": "<|endoftext|>"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
6
  }
 
1
  {
2
+ "bos_token": {
3
+ "content": "<|endoftext|>",
4
+ "lstrip": false,
5
+ "normalized": true,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "eos_token": {
10
+ "content": "<|endoftext|>",
11
+ "lstrip": false,
12
+ "normalized": true,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "pad_token": {
17
+ "content": "<|endoftext|>",
18
+ "lstrip": false,
19
+ "normalized": true,
20
+ "rstrip": false,
21
+ "single_word": false
22
+ },
23
+ "unk_token": {
24
+ "content": "<|endoftext|>",
25
+ "lstrip": false,
26
+ "normalized": true,
27
+ "rstrip": false,
28
+ "single_word": false
29
+ }
30
  }