Upload folder using huggingface_hub

Browse files

Files changed (11) hide show

config.json +2 -1
generation_config.json +79 -2
onnx/decoder_model.onnx +2 -2
onnx/decoder_model_merged.onnx +2 -2
onnx/decoder_model_merged_quantized.onnx +2 -2
onnx/decoder_model_quantized.onnx +2 -2
onnx/decoder_with_past_model.onnx +2 -2
onnx/decoder_with_past_model_quantized.onnx +2 -2
onnx/encoder_model.onnx +2 -2
onnx/encoder_model_quantized.onnx +2 -2
quantize_config.json +115 -0

config.json CHANGED Viewed

@@ -42,6 +42,7 @@
   "max_length": 448,
   "max_source_positions": 1500,
   "max_target_positions": 448,
   "model_type": "whisper",
   "num_hidden_layers": 12,
   "num_mel_bins": 80,
@@ -139,7 +140,7 @@
     50360,
     50361
   ],
-  "transformers_version": "4.30.2",
   "use_cache": true,
   "use_weighted_layer_sum": false,
   "vocab_size": 51864

   "max_length": 448,
   "max_source_positions": 1500,
   "max_target_positions": 448,
+  "median_filter_width": 7,
   "model_type": "whisper",
   "num_hidden_layers": 12,
   "num_mel_bins": 80,
     50360,
     50361
   ],
+  "transformers_version": "4.33.0.dev0",
   "use_cache": true,
   "use_weighted_layer_sum": false,
   "vocab_size": 51864

generation_config.json CHANGED Viewed

@@ -1,5 +1,82 @@
 {
-  "alignment_heads": [[6, 6], [7, 0], [7, 3], [7, 8], [8, 2], [8, 5], [8, 7], [9, 0], [9, 4], [9, 8], [9, 10], [10, 0], [10, 1], [10, 2], [10, 3], [10, 6], [10, 11], [11, 2], [11, 4]],
   "begin_suppress_tokens": [
     220,
     50256
@@ -110,5 +187,5 @@
     50360,
     50361
   ],
-  "transformers_version": "4.30.2"
 }

 {
+  "alignment_heads": [
+    [
+      6,
+      6
+    ],
+    [
+      7,
+      0
+    ],
+    [
+      7,
+      3
+    ],
+    [
+      7,
+      8
+    ],
+    [
+      8,
+      2
+    ],
+    [
+      8,
+      5
+    ],
+    [
+      8,
+      7
+    ],
+    [
+      9,
+      0
+    ],
+    [
+      9,
+      4
+    ],
+    [
+      9,
+      8
+    ],
+    [
+      9,
+      10
+    ],
+    [
+      10,
+      0
+    ],
+    [
+      10,
+      1
+    ],
+    [
+      10,
+      2
+    ],
+    [
+      10,
+      3
+    ],
+    [
+      10,
+      6
+    ],
+    [
+      10,
+      11
+    ],
+    [
+      11,
+      2
+    ],
+    [
+      11,
+      4
+    ]
+  ],
   "begin_suppress_tokens": [
     220,
     50256
     50360,
     50361
   ],
+  "transformers_version": "4.33.0.dev0"
 }

onnx/decoder_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ea38750c855e4a27256f08057fd9fb91f4ebb4705d6717522728ac9789a71394
-size 774153408

 version https://git-lfs.github.com/spec/v1
+oid sha256:ea5d821f98329d78cd0c8387476633bd195bb9df897b5248d8711b6cefa4ca1f
+size 614892481

onnx/decoder_model_merged.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:821a0fae52d92575d988421df91cc2792827b58f42d6274324fa184a592dc6a2
-size 774588347

 version https://git-lfs.github.com/spec/v1
+oid sha256:680e293ef4fb01f2e6a636ab574eb6ee1da697ce9f492066904917406a446c1e
+size 615402140

onnx/decoder_model_merged_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ba8567520a70349d064d7ffec5f440e78a149bf5968bfedd94ad78b6287e8798
-size 196431022

 version https://git-lfs.github.com/spec/v1
+oid sha256:7cff5df61a1809654a5e62d89cbb99e8231b229f41412ab626a1d8fff77397ab
+size 156780181

onnx/decoder_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:053b11d598b22f489e0075714ca9191f4016c356544131b908f2eb87648d72c2
-size 195737631

 version https://git-lfs.github.com/spec/v1
+oid sha256:60095134fb8e35617495b117d2c780f606d39f28e631c876f4c2bd898bcb3873
+size 155990510

onnx/decoder_with_past_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d605634ae33667a23a37100bb2d014d5cb99f774f3fe5891d0d4d777264b5990
-size 717416719

 version https://git-lfs.github.com/spec/v1
+oid sha256:d4186916df15a6ae504cad0c7e3c854715661e5fb2dcb35cbf941f60a92c981c
+size 558162062

onnx/decoder_with_past_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b5b511413b04bb36148c2b45799223c14d5075bd6b1f16d16145d14fb6adc57f
-size 181417229

 version https://git-lfs.github.com/spec/v1
+oid sha256:95f5e8f13c480b2141a94c8e8a9e89831b7ad0cc4518feac27b19c0afc714bca
+size 141678688

onnx/encoder_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6590ebbed3fe0be31ca86ab0b8b6e086114e4da0f81421a4d06aeec5335d97d3
-size 352812843

 version https://git-lfs.github.com/spec/v1
+oid sha256:3032ccbfd40346a2552bfe08d66d6070d8f1cd37602053fccab8694adf57d329
+size 352839389

onnx/encoder_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:cc7c82e4908c040e156b4063f6cc319b5f31d68ff5812a7e4ac05659cb88ac5c
-size 92289703

 version https://git-lfs.github.com/spec/v1
+oid sha256:dd37efa07dad7619592ef849a40317dcfd182a2e632275a53a023f02f685cfa7
+size 92324819

quantize_config.json ADDED Viewed

	@@ -0,0 +1,115 @@

+{
+    "per_channel": false,
+    "reduce_range": false,
+    "per_model_config": {
+        "decoder_model": {
+            "op_types": [
+                "Slice",
+                "Range",
+                "Constant",
+                "Pow",
+                "Gather",
+                "Concat",
+                "Div",
+                "Unsqueeze",
+                "Expand",
+                "Equal",
+                "Erf",
+                "ReduceMean",
+                "ConstantOfShape",
+                "Sqrt",
+                "Sub",
+                "Where",
+                "Transpose",
+                "Mul",
+                "MatMul",
+                "Cast",
+                "Squeeze",
+                "Reshape",
+                "Less",
+                "Add",
+                "Softmax",
+                "Shape"
+            ],
+            "weight_type": "QInt8"
+        },
+        "decoder_model_merged": {
+            "op_types": [
+                "Slice",
+                "Range",
+                "Constant",
+                "Pow",
+                "Gather",
+                "Concat",
+                "Div",
+                "Unsqueeze",
+                "Expand",
+                "Equal",
+                "Erf",
+                "ReduceMean",
+                "ConstantOfShape",
+                "Sqrt",
+                "Sub",
+                "Where",
+                "Transpose",
+                "Mul",
+                "If",
+                "MatMul",
+                "Cast",
+                "Squeeze",
+                "Reshape",
+                "Less",
+                "Add",
+                "Softmax",
+                "Shape"
+            ],
+            "weight_type": "QInt8"
+        },
+        "decoder_with_past_model": {
+            "op_types": [
+                "Sqrt",
+                "Slice",
+                "Softmax",
+                "Reshape",
+                "Constant",
+                "Sub",
+                "Div",
+                "Pow",
+                "Erf",
+                "Transpose",
+                "Gather",
+                "Mul",
+                "MatMul",
+                "Concat",
+                "Add",
+                "ReduceMean",
+                "Unsqueeze",
+                "Shape"
+            ],
+            "weight_type": "QInt8"
+        },
+        "encoder_model": {
+            "op_types": [
+                "Sqrt",
+                "Softmax",
+                "Reshape",
+                "Constant",
+                "Sub",
+                "Erf",
+                "Pow",
+                "Transpose",
+                "Shape",
+                "Gather",
+                "Mul",
+                "MatMul",
+                "Conv",
+                "Concat",
+                "Add",
+                "Div",
+                "Unsqueeze",
+                "ReduceMean"
+            ],
+            "weight_type": "QUInt8"
+        }
+    }
+}