feat: Update converted models with config

Browse files

Files changed (8) hide show

config.json +0 -1
merges.txt +0 -1
onnx/decoder_model_merged.onnx +2 -2
onnx/decoder_model_merged_quantized.onnx +2 -2
preprocessor_config.json +0 -0
quantize_config.json +68 -68
tokenizer_config.json +33 -4
vocab.json +0 -0

config.json CHANGED Viewed

@@ -146,7 +146,6 @@
     50361,
     50362
   ],
-  "torch_dtype": "float32",
   "transformers_version": "4.33.2",
   "use_cache": true,
   "use_weighted_layer_sum": false,

     50361,
     50362
   ],
   "transformers_version": "4.33.2",
   "use_cache": true,
   "use_weighted_layer_sum": false,

merges.txt CHANGED Viewed

@@ -49998,4 +49998,3 @@ ctic amente
 Ġmanif ests
 ĠPak istani
 Ġ( '
-åľ º

 Ġmanif ests
 ĠPak istani
 Ġ( '

onnx/decoder_model_merged.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6c169b8c330d4345cdf607e23dbff2664bad8c767c7ead33343248a3df773bf5
-size 118533120

 version https://git-lfs.github.com/spec/v1
+oid sha256:13f7f875d3fcbc9883bcbaf031597c900ec45a42e3cf56907fa6cf8f4b4df978
+size 118533111

onnx/decoder_model_merged_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3a36371f1eac6675aec784a6cdb35f29154d3cf95bd8969f434c40269f11112d
-size 30667401

 version https://git-lfs.github.com/spec/v1
+oid sha256:820865ac5e5162fcdffc44692dc1f50af6f29a1421391add0227db3497698404
+size 30667374

preprocessor_config.json CHANGED Viewed

The diff for this file is too large to render. See raw diff

quantize_config.json CHANGED Viewed

@@ -4,110 +4,110 @@
     "per_model_config": {
         "encoder_model": {
             "op_types": [
-                "Erf",
                 "Add",
-                "Mul",
-                "Constant",
-                "Sub",
-                "Div",
-                "MatMul",
                 "Concat",
-                "ReduceMean",
                 "Transpose",
                 "Sqrt",
-                "Pow",
-                "Conv",
-                "Gather",
                 "Unsqueeze",
-                "Softmax",
-                "Shape",
-                "Reshape"
             ],
             "weight_type": "QUInt8"
         },
         "decoder_model": {
             "op_types": [
-                "Erf",
-                "Squeeze",
-                "Expand",
-                "Sub",
                 "Concat",
-                "Sqrt",
                 "Unsqueeze",
-                "Range",
-                "Equal",
                 "Constant",
-                "ConstantOfShape",
-                "ReduceMean",
-                "Transpose",
-                "Gather",
-                "Less",
                 "Shape",
                 "Add",
-                "Slice",
-                "Div",
-                "Where",
-                "Reshape",
-                "Cast",
                 "Mul",
-                "MatMul",
-                "Pow",
-                "Softmax"
             ],
             "weight_type": "QInt8"
         },
         "decoder_with_past_model": {
             "op_types": [
-                "Erf",
-                "Add",
-                "Mul",
-                "Constant",
-                "Slice",
-                "Sub",
-                "Div",
-                "MatMul",
-                "Concat",
                 "ReduceMean",
-                "Transpose",
-                "Sqrt",
                 "Pow",
-                "Gather",
-                "Unsqueeze",
                 "Softmax",
                 "Shape",
-                "Reshape"
             ],
             "weight_type": "QInt8"
         },
         "decoder_model_merged": {
             "op_types": [
-                "Erf",
-                "Squeeze",
-                "Expand",
-                "Sub",
                 "Concat",
-                "Sqrt",
-                "If",
                 "Unsqueeze",
-                "Range",
-                "Equal",
                 "Constant",
-                "ConstantOfShape",
-                "ReduceMean",
-                "Transpose",
-                "Gather",
-                "Less",
                 "Shape",
                 "Add",
-                "Slice",
-                "Div",
-                "Where",
-                "Reshape",
-                "Cast",
                 "Mul",
-                "MatMul",
-                "Pow",
-                "Softmax"
             ],
             "weight_type": "QInt8"
         }

     "per_model_config": {
         "encoder_model": {
             "op_types": [
+                "Gather",
+                "ReduceMean",
                 "Add",
+                "Pow",
                 "Concat",
+                "Erf",
+                "Softmax",
+                "Div",
+                "Conv",
                 "Transpose",
+                "Mul",
+                "Shape",
                 "Sqrt",
+                "MatMul",
                 "Unsqueeze",
+                "Reshape",
+                "Sub",
+                "Constant"
             ],
             "weight_type": "QUInt8"
         },
         "decoder_model": {
             "op_types": [
                 "Concat",
+                "Div",
+                "Cast",
+                "Slice",
                 "Unsqueeze",
+                "MatMul",
                 "Constant",
+                "Where",
+                "Expand",
+                "Softmax",
                 "Shape",
+                "Gather",
+                "Pow",
+                "ConstantOfShape",
                 "Add",
+                "Squeeze",
+                "Equal",
+                "Range",
+                "Less",
                 "Mul",
+                "Sub",
+                "ReduceMean",
+                "Erf",
+                "Transpose",
+                "Sqrt",
+                "Reshape"
             ],
             "weight_type": "QInt8"
         },
         "decoder_with_past_model": {
             "op_types": [
+                "Gather",
                 "ReduceMean",
+                "Add",
                 "Pow",
+                "Concat",
                 "Softmax",
+                "Erf",
+                "MatMul",
+                "Div",
+                "Slice",
+                "Mul",
+                "Unsqueeze",
                 "Shape",
+                "Sqrt",
+                "Transpose",
+                "Reshape",
+                "Sub",
+                "Constant"
             ],
             "weight_type": "QInt8"
         },
         "decoder_model_merged": {
             "op_types": [
                 "Concat",
+                "Div",
+                "Cast",
+                "Slice",
                 "Unsqueeze",
+                "MatMul",
                 "Constant",
+                "Where",
+                "Expand",
+                "Softmax",
                 "Shape",
+                "Gather",
+                "Pow",
+                "ConstantOfShape",
                 "Add",
+                "If",
+                "Squeeze",
+                "Equal",
+                "Range",
+                "Less",
                 "Mul",
+                "Sub",
+                "ReduceMean",
+                "Erf",
+                "Transpose",
+                "Sqrt",
+                "Reshape"
             ],
             "weight_type": "QInt8"
         }

tokenizer_config.json CHANGED Viewed

@@ -12976,14 +12976,43 @@
     "<|nocaptions|>",
     "<|notimestamps|>"
   ],
-  "bos_token": "<|endoftext|>",
   "clean_up_tokenization_spaces": true,
-  "eos_token": "<|endoftext|>",
   "errors": "replace",
   "model_max_length": 1024,
-  "pad_token": "<|endoftext|>",
   "processor_class": "WhisperProcessor",
   "return_attention_mask": false,
   "tokenizer_class": "WhisperTokenizer",
-  "unk_token": "<|endoftext|>"
 }

     "<|nocaptions|>",
     "<|notimestamps|>"
   ],
+  "bos_token": {
+    "__type": "AddedToken",
+    "content": "<|endoftext|>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
   "clean_up_tokenization_spaces": true,
+  "eos_token": {
+    "__type": "AddedToken",
+    "content": "<|endoftext|>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
   "errors": "replace",
   "model_max_length": 1024,
+  "pad_token": {
+    "__type": "AddedToken",
+    "content": "<|endoftext|>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
   "processor_class": "WhisperProcessor",
   "return_attention_mask": false,
   "tokenizer_class": "WhisperTokenizer",
+  "trust_remote_code": false,
+  "unk_token": {
+    "__type": "AddedToken",
+    "content": "<|endoftext|>",
+    "lstrip": false,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  }
 }

vocab.json CHANGED Viewed

The diff for this file is too large to render. See raw diff