tarekziade committed on
Commit
1b63a83
1 Parent(s): a406da5

Upload 16 files

Browse files
config.json CHANGED
@@ -1,4 +1,5 @@
1
  {
 
2
  "architectures": [
3
  "VisionEncoderDecoderModel"
4
  ],
@@ -178,6 +179,5 @@
178
  "model_type": "vision-encoder-decoder",
179
  "pad_token_id": 50256,
180
  "tie_word_embeddings": false,
181
- "torch_dtype": "float32",
182
- "transformers_version": "4.38.2"
183
  }
 
1
  {
2
+ "_name_or_path": "tarekziade/distilvit",
3
  "architectures": [
4
  "VisionEncoderDecoderModel"
5
  ],
 
179
  "model_type": "vision-encoder-decoder",
180
  "pad_token_id": 50256,
181
  "tie_word_embeddings": false,
182
+ "transformers_version": "4.36.2"
 
183
  }
generation_config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
  "bos_token_id": 50256,
3
  "eos_token_id": 50256,
4
- "transformers_version": "4.38.2"
5
  }
 
1
  {
2
  "bos_token_id": 50256,
3
  "eos_token_id": 50256,
4
+ "transformers_version": "4.36.2"
5
  }
onnx/decoder_model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4884fbf497eeb3b9548ff95cf37062f709d24a12568903decd06438b68f83cfa
3
+ size 385863272
onnx/decoder_model_merged.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d091bfbb6bcf0e5d0be5b2cb6d94d4f4409a9f406627e203103f15dcfccdf4fa
3
+ size 387339536
onnx/decoder_model_merged_quantized.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ad7ac7290a551abc1ef84fe9f5fbddc92f0b255a589479b890040ba4391c3bb6
3
+ size 99755448
onnx/decoder_model_quantized.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5be7fe9e2aa7cbd9ad7d264c7fb5c840588d95d34efb609a304e3d17e5eb73e0
3
+ size 98063696
onnx/decoder_with_past_model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:84f0b91b8725dfd83b4c56561cfb8af05c3c490ec7f01176dfc65282d29d32f6
3
+ size 385862852
onnx/decoder_with_past_model_quantized.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9d92e6d422d6fb0270176b92ba235ba32f401f9f8d313829a960b6d921e0456e
3
+ size 98061103
onnx/encoder_model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e151662b541653ab63ea653056c6902f90d001358c831c7c6b3f02f4123480e3
3
+ size 343440610
onnx/encoder_model_quantized.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3dfb73885aa98a91d6bd31c24ca7902acf0517f43ae99a8fe827ad50f007df8c
3
+ size 87038150
quantize_config.json ADDED
@@ -0,0 +1,125 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "per_channel": false,
3
+ "reduce_range": false,
4
+ "per_model_config": {
5
+ "decoder_with_past_model": {
6
+ "op_types": [
7
+ "Softmax",
8
+ "Add",
9
+ "Cast",
10
+ "ReduceMean",
11
+ "Pow",
12
+ "Where",
13
+ "Transpose",
14
+ "ConstantOfShape",
15
+ "Mul",
16
+ "Concat",
17
+ "Split",
18
+ "Gather",
19
+ "Sub",
20
+ "Range",
21
+ "Div",
22
+ "Gemm",
23
+ "Constant",
24
+ "Reshape",
25
+ "Sqrt",
26
+ "Unsqueeze",
27
+ "Slice",
28
+ "MatMul",
29
+ "Squeeze",
30
+ "Tanh",
31
+ "Shape"
32
+ ],
33
+ "weight_type": "QInt8"
34
+ },
35
+ "decoder_model": {
36
+ "op_types": [
37
+ "Softmax",
38
+ "Cast",
39
+ "Add",
40
+ "ReduceMean",
41
+ "Pow",
42
+ "Where",
43
+ "Transpose",
44
+ "ConstantOfShape",
45
+ "Mul",
46
+ "Concat",
47
+ "Split",
48
+ "Gather",
49
+ "Sub",
50
+ "Range",
51
+ "Div",
52
+ "Gemm",
53
+ "Constant",
54
+ "Reshape",
55
+ "Sqrt",
56
+ "Unsqueeze",
57
+ "Slice",
58
+ "MatMul",
59
+ "Squeeze",
60
+ "Tanh",
61
+ "Shape"
62
+ ],
63
+ "weight_type": "QInt8"
64
+ },
65
+ "encoder_model": {
66
+ "op_types": [
67
+ "Equal",
68
+ "Softmax",
69
+ "Expand",
70
+ "Add",
71
+ "ReduceMean",
72
+ "Pow",
73
+ "Where",
74
+ "Transpose",
75
+ "ConstantOfShape",
76
+ "Mul",
77
+ "Concat",
78
+ "Gather",
79
+ "Sub",
80
+ "Div",
81
+ "Constant",
82
+ "Reshape",
83
+ "Sqrt",
84
+ "Erf",
85
+ "Unsqueeze",
86
+ "Slice",
87
+ "MatMul",
88
+ "Conv",
89
+ "Shape"
90
+ ],
91
+ "weight_type": "QUInt8"
92
+ },
93
+ "decoder_model_merged": {
94
+ "op_types": [
95
+ "Softmax",
96
+ "Cast",
97
+ "Add",
98
+ "ReduceMean",
99
+ "Pow",
100
+ "Where",
101
+ "Transpose",
102
+ "ConstantOfShape",
103
+ "If",
104
+ "Mul",
105
+ "Concat",
106
+ "Split",
107
+ "Gather",
108
+ "Sub",
109
+ "Range",
110
+ "Div",
111
+ "Gemm",
112
+ "Constant",
113
+ "Reshape",
114
+ "Sqrt",
115
+ "Unsqueeze",
116
+ "Slice",
117
+ "MatMul",
118
+ "Squeeze",
119
+ "Tanh",
120
+ "Shape"
121
+ ],
122
+ "weight_type": "QInt8"
123
+ }
124
+ }
125
+ }
special_tokens_map.json CHANGED
@@ -1,6 +1,30 @@
1
  {
2
- "bos_token": "<|endoftext|>",
3
- "eos_token": "<|endoftext|>",
4
- "pad_token": "<|endoftext|>",
5
- "unk_token": "<|endoftext|>"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
6
  }
 
1
  {
2
+ "bos_token": {
3
+ "content": "<|endoftext|>",
4
+ "lstrip": false,
5
+ "normalized": true,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "eos_token": {
10
+ "content": "<|endoftext|>",
11
+ "lstrip": false,
12
+ "normalized": true,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "pad_token": {
17
+ "content": "<|endoftext|>",
18
+ "lstrip": false,
19
+ "normalized": true,
20
+ "rstrip": false,
21
+ "single_word": false
22
+ },
23
+ "unk_token": {
24
+ "content": "<|endoftext|>",
25
+ "lstrip": false,
26
+ "normalized": true,
27
+ "rstrip": false,
28
+ "single_word": false
29
+ }
30
  }