Xenova HF staff committed on
Commit
220c655
1 Parent(s): fe129a9

Upload folder using huggingface_hub

Browse files
config.json CHANGED
@@ -42,6 +42,7 @@
42
  "max_length": 448,
43
  "max_source_positions": 1500,
44
  "max_target_positions": 448,
 
45
  "model_type": "whisper",
46
  "num_hidden_layers": 24,
47
  "num_mel_bins": 80,
@@ -139,7 +140,7 @@
139
  50360,
140
  50361
141
  ],
142
- "transformers_version": "4.30.2",
143
  "use_cache": true,
144
  "use_weighted_layer_sum": false,
145
  "vocab_size": 51864
 
42
  "max_length": 448,
43
  "max_source_positions": 1500,
44
  "max_target_positions": 448,
45
+ "median_filter_width": 7,
46
  "model_type": "whisper",
47
  "num_hidden_layers": 24,
48
  "num_mel_bins": 80,
 
140
  50360,
141
  50361
142
  ],
143
+ "transformers_version": "4.33.0.dev0",
144
  "use_cache": true,
145
  "use_weighted_layer_sum": false,
146
  "vocab_size": 51864
generation_config.json CHANGED
@@ -1,5 +1,78 @@
1
  {
2
- "alignment_heads": [[11, 4], [14, 1], [14, 12], [14, 14], [15, 4], [16, 0], [16, 4], [16, 9], [17, 12], [17, 14], [18, 7], [18, 10], [18, 15], [20, 0], [20, 3], [20, 9], [20, 14], [21, 12]],
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3
  "begin_suppress_tokens": [
4
  220,
5
  50256
@@ -111,5 +184,5 @@
111
  50360,
112
  50361
113
  ],
114
- "transformers_version": "4.30.2"
115
  }
 
1
  {
2
+ "alignment_heads": [
3
+ [
4
+ 11,
5
+ 4
6
+ ],
7
+ [
8
+ 14,
9
+ 1
10
+ ],
11
+ [
12
+ 14,
13
+ 12
14
+ ],
15
+ [
16
+ 14,
17
+ 14
18
+ ],
19
+ [
20
+ 15,
21
+ 4
22
+ ],
23
+ [
24
+ 16,
25
+ 0
26
+ ],
27
+ [
28
+ 16,
29
+ 4
30
+ ],
31
+ [
32
+ 16,
33
+ 9
34
+ ],
35
+ [
36
+ 17,
37
+ 12
38
+ ],
39
+ [
40
+ 17,
41
+ 14
42
+ ],
43
+ [
44
+ 18,
45
+ 7
46
+ ],
47
+ [
48
+ 18,
49
+ 10
50
+ ],
51
+ [
52
+ 18,
53
+ 15
54
+ ],
55
+ [
56
+ 20,
57
+ 0
58
+ ],
59
+ [
60
+ 20,
61
+ 3
62
+ ],
63
+ [
64
+ 20,
65
+ 9
66
+ ],
67
+ [
68
+ 20,
69
+ 14
70
+ ],
71
+ [
72
+ 21,
73
+ 12
74
+ ]
75
+ ],
76
  "begin_suppress_tokens": [
77
  220,
78
  50256
 
184
  50360,
185
  50361
186
  ],
187
+ "transformers_version": "4.33.0.dev0"
188
  }
onnx/decoder_model.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6c768cbdc2f7da73f15400f34e4e20b439f043ab870bb3e80c7d2d9f40f242bd
3
- size 2040006900
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:94d45552fa1245ee26fdd5189637d1bdda3b5db7e403fd7e4c173db90826e071
3
+ size 1827703309
onnx/decoder_model_merged.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2a6bc26a22416cb5ca53f5db05a44fae39a56a38053bd172c60a77be35974151
3
- size 1926573
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9361cc5a61a932b6e478b57401f1fe55ef86181aa1ee6adcce121c36ce03bd6c
3
+ size 1828724169
onnx/decoder_model_merged_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cd4c06f8bfbfb28f8a777a84618692ee05687ab598fef9dffb2fea11d3cd83c4
3
- size 515405408
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0b009dc2d71add45954b927ff01815d25d9d397bbb8b2ad72c6b9bd3279d7607
3
+ size 462660582
onnx/decoder_model_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8fe4c89bbf88b377dd1d2862571d7611ce6888d8d1a055b61790050791d97deb
3
- size 514017234
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e2f4fed175268b904c6daf9ffb59f095864aa9f3b0217dcdeaa88a5307759f8
3
+ size 461078933
onnx/decoder_with_past_model.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0fd1ee78061a395fd1e623ec308a19d9b4803b450aa8e70b24fad833c17e3c76
3
- size 1838433559
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fce529ecc15e2abd10d50baafa927be37043764da0bb1832fb28a05b8e2ccac7
3
+ size 1626142598
onnx/decoder_with_past_model_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:789bc74086187043db99dd1684f3d82ec61d15464dddc2c3daba21dec6e505d5
3
- size 463338655
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:98c5f7b1868fb1cc0a4b3838652f41748784015e7a2675fbbc536ac1328c9d16
3
+ size 410417655
onnx/encoder_model.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2846e5d8c8c847af016939d49add139b57f3a1f5a2739f8eb77f48d18f67e552
3
- size 1229258863
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f334bbbcdf56bb3e2a82cfb523673fdd4b7a6b5d9b7298e9d7fcefd03fe9ada5
3
+ size 1229312445
onnx/encoder_model_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:952aacc7ab4ff86afccc732a42c4d6c8babb7651653aeb9b0ff22adcc42dcc90
3
- size 313397176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c6fdaff8017b837b7b205ccd1d5f283008f4ee9677a29e503b3cf8e68efa9bb3
3
+ size 313468028
quantize_config.json ADDED
@@ -0,0 +1,115 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "per_channel": false,
3
+ "reduce_range": false,
4
+ "per_model_config": {
5
+ "decoder_model": {
6
+ "op_types": [
7
+ "Cast",
8
+ "Gather",
9
+ "Sqrt",
10
+ "Constant",
11
+ "Softmax",
12
+ "MatMul",
13
+ "Unsqueeze",
14
+ "Reshape",
15
+ "ConstantOfShape",
16
+ "Range",
17
+ "Add",
18
+ "Where",
19
+ "Equal",
20
+ "Transpose",
21
+ "Slice",
22
+ "Concat",
23
+ "Div",
24
+ "Less",
25
+ "ReduceMean",
26
+ "Squeeze",
27
+ "Shape",
28
+ "Erf",
29
+ "Sub",
30
+ "Mul",
31
+ "Expand",
32
+ "Pow"
33
+ ],
34
+ "weight_type": "QInt8"
35
+ },
36
+ "decoder_model_merged": {
37
+ "op_types": [
38
+ "Cast",
39
+ "Gather",
40
+ "Sqrt",
41
+ "Constant",
42
+ "Softmax",
43
+ "MatMul",
44
+ "Unsqueeze",
45
+ "Reshape",
46
+ "ConstantOfShape",
47
+ "Range",
48
+ "Add",
49
+ "Where",
50
+ "If",
51
+ "Equal",
52
+ "Transpose",
53
+ "Slice",
54
+ "Concat",
55
+ "Div",
56
+ "Less",
57
+ "ReduceMean",
58
+ "Squeeze",
59
+ "Shape",
60
+ "Erf",
61
+ "Sub",
62
+ "Mul",
63
+ "Expand",
64
+ "Pow"
65
+ ],
66
+ "weight_type": "QInt8"
67
+ },
68
+ "decoder_with_past_model": {
69
+ "op_types": [
70
+ "MatMul",
71
+ "Erf",
72
+ "Sub",
73
+ "Add",
74
+ "Unsqueeze",
75
+ "Softmax",
76
+ "Reshape",
77
+ "Mul",
78
+ "Transpose",
79
+ "Slice",
80
+ "Concat",
81
+ "Gather",
82
+ "Div",
83
+ "ReduceMean",
84
+ "Sqrt",
85
+ "Pow",
86
+ "Constant",
87
+ "Shape"
88
+ ],
89
+ "weight_type": "QInt8"
90
+ },
91
+ "encoder_model": {
92
+ "op_types": [
93
+ "MatMul",
94
+ "Erf",
95
+ "Sub",
96
+ "Add",
97
+ "Unsqueeze",
98
+ "Softmax",
99
+ "Reshape",
100
+ "Mul",
101
+ "Transpose",
102
+ "Div",
103
+ "Concat",
104
+ "Gather",
105
+ "Conv",
106
+ "ReduceMean",
107
+ "Sqrt",
108
+ "Pow",
109
+ "Constant",
110
+ "Shape"
111
+ ],
112
+ "weight_type": "QUInt8"
113
+ }
114
+ }
115
+ }