Xenova HF staff committed on
Commit
d33af21
1 Parent(s): cf036d5

Upload folder using huggingface_hub

Browse files
config.json CHANGED
@@ -50,6 +50,7 @@
50
  "max_length": 448,
51
  "max_source_positions": 1500,
52
  "max_target_positions": 448,
 
53
  "model_type": "whisper",
54
  "num_hidden_layers": 6,
55
  "num_mel_bins": 80,
@@ -145,7 +146,7 @@
145
  50361,
146
  50362
147
  ],
148
- "transformers_version": "4.30.2",
149
  "use_cache": true,
150
  "use_weighted_layer_sum": false,
151
  "vocab_size": 51865
 
50
  "max_length": 448,
51
  "max_source_positions": 1500,
52
  "max_target_positions": 448,
53
+ "median_filter_width": 7,
54
  "model_type": "whisper",
55
  "num_hidden_layers": 6,
56
  "num_mel_bins": 80,
 
146
  50361,
147
  50362
148
  ],
149
+ "transformers_version": "4.33.0.dev0",
150
  "use_cache": true,
151
  "use_weighted_layer_sum": false,
152
  "vocab_size": 51865
generation_config.json CHANGED
@@ -1,5 +1,38 @@
1
  {
2
- "alignment_heads": [[3, 1], [4, 2], [4, 3], [4, 7], [5, 1], [5, 2], [5, 4], [5, 6]],
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3
  "begin_suppress_tokens": [
4
  220,
5
  50257
@@ -218,5 +251,5 @@
218
  "transcribe": 50359,
219
  "translate": 50358
220
  },
221
- "transformers_version": "4.30.2"
222
  }
 
1
  {
2
+ "alignment_heads": [
3
+ [
4
+ 3,
5
+ 1
6
+ ],
7
+ [
8
+ 4,
9
+ 2
10
+ ],
11
+ [
12
+ 4,
13
+ 3
14
+ ],
15
+ [
16
+ 4,
17
+ 7
18
+ ],
19
+ [
20
+ 5,
21
+ 1
22
+ ],
23
+ [
24
+ 5,
25
+ 2
26
+ ],
27
+ [
28
+ 5,
29
+ 4
30
+ ],
31
+ [
32
+ 5,
33
+ 6
34
+ ]
35
+ ],
36
  "begin_suppress_tokens": [
37
  220,
38
  50257
 
251
  "transcribe": 50359,
252
  "translate": 50358
253
  },
254
+ "transformers_version": "4.33.0.dev0"
255
  }
onnx/decoder_model.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:30dc5d792fc7dee971935fa6cd4df68e219d866ecc6b4309ecdfc7c7efcab992
3
- size 314491115
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bae722537859a68b8babc4930c504f1f51a83420a2b1b0bd0b0947b4811b8042
3
+ size 208304195
onnx/decoder_model_merged.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:17eeff2508a474685cec5b46587c13eb7d0d28f921ce64d08b8ef3e7a9c2938e
3
- size 314710581
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3fed66b2b8dfa1ae213f768527dff1ef7e3857b8d45a36381850ce4dff8db936
3
+ size 208560983
onnx/decoder_model_merged_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:edccc6c79bf0f9b46a99770172cf3160154734640795f84c6fc516932b7b87b9
3
- size 80172704
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a6beb6baabb66f00b6a686d828c95ffca6146d51900cbad0266cad38f64cf861
3
+ size 53707539
onnx/decoder_model_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d0302f2ff47b04e6715e5812a1313084d404cbdeff4a55fdab22e4c5f7c00aa2
3
- size 79822868
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:96fc8b98013e0f9461159a7b0d57922e170b15767db8afef1ea7880f1deef33b
3
+ size 53309877
onnx/decoder_with_past_model.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c77771da8b403752fe44d95d8a38e975e11e4ba170dc0407b19a433f838470e3
3
- size 301854704
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:75f7f7144348fb70fd421587b938e6b215188f1e480fbc0be016177b0e3891dd
3
+ size 195670910
onnx/decoder_with_past_model_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:54d7fad0e7189431eab05cc42fb488f7d8b8011070c70e49aa9d833cb4a917c2
3
- size 76596950
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7b12f3892bce5a5c9729eb3d5c2ac451e64dd20e367d643eaa675345a114471d
3
+ size 50088237
onnx/encoder_model.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5508b72d9379911bf51bcf034ce26c43501a5dccc7a5ca4a061fc851471f9a10
3
- size 82461621
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f0bd7927234639c6e1f293cef18a210cee4e4aea93e200ebbe48e1d7acf6fdb1
3
+ size 82474863
onnx/encoder_model_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e360d86928a0232eb6100f2a36fa4a358c101e0a6a39763e5eefe139dca5fe71
3
- size 23183300
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e345e977b55620a37c0c2b2af0644e019afdfad562dcf71eb929bb7274285f9
3
+ size 23200850
quantize_config.json ADDED
@@ -0,0 +1,115 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "per_channel": false,
3
+ "reduce_range": false,
4
+ "per_model_config": {
5
+ "decoder_model": {
6
+ "op_types": [
7
+ "Erf",
8
+ "Squeeze",
9
+ "Gather",
10
+ "Unsqueeze",
11
+ "Slice",
12
+ "Shape",
13
+ "Transpose",
14
+ "MatMul",
15
+ "Softmax",
16
+ "Reshape",
17
+ "Range",
18
+ "Less",
19
+ "Equal",
20
+ "Concat",
21
+ "Sqrt",
22
+ "Mul",
23
+ "Pow",
24
+ "Sub",
25
+ "Constant",
26
+ "ConstantOfShape",
27
+ "Div",
28
+ "Add",
29
+ "Expand",
30
+ "Where",
31
+ "Cast",
32
+ "ReduceMean"
33
+ ],
34
+ "weight_type": "QInt8"
35
+ },
36
+ "decoder_model_merged": {
37
+ "op_types": [
38
+ "Erf",
39
+ "Squeeze",
40
+ "Gather",
41
+ "Unsqueeze",
42
+ "Slice",
43
+ "Shape",
44
+ "Transpose",
45
+ "MatMul",
46
+ "Softmax",
47
+ "Reshape",
48
+ "Range",
49
+ "Cast",
50
+ "Less",
51
+ "Equal",
52
+ "Concat",
53
+ "If",
54
+ "Sqrt",
55
+ "Mul",
56
+ "Pow",
57
+ "Sub",
58
+ "Constant",
59
+ "Div",
60
+ "Add",
61
+ "Expand",
62
+ "Where",
63
+ "ConstantOfShape",
64
+ "ReduceMean"
65
+ ],
66
+ "weight_type": "QInt8"
67
+ },
68
+ "decoder_with_past_model": {
69
+ "op_types": [
70
+ "Reshape",
71
+ "Mul",
72
+ "Erf",
73
+ "Div",
74
+ "Gather",
75
+ "Unsqueeze",
76
+ "Add",
77
+ "Shape",
78
+ "Slice",
79
+ "Sub",
80
+ "Constant",
81
+ "Pow",
82
+ "Transpose",
83
+ "Concat",
84
+ "MatMul",
85
+ "Softmax",
86
+ "ReduceMean",
87
+ "Sqrt"
88
+ ],
89
+ "weight_type": "QInt8"
90
+ },
91
+ "encoder_model": {
92
+ "op_types": [
93
+ "Reshape",
94
+ "Erf",
95
+ "Mul",
96
+ "Div",
97
+ "Conv",
98
+ "Gather",
99
+ "Add",
100
+ "Pow",
101
+ "Shape",
102
+ "Transpose",
103
+ "Sub",
104
+ "Constant",
105
+ "Unsqueeze",
106
+ "Concat",
107
+ "MatMul",
108
+ "Softmax",
109
+ "ReduceMean",
110
+ "Sqrt"
111
+ ],
112
+ "weight_type": "QUInt8"
113
+ }
114
+ }
115
+ }