Upload folder using huggingface_hub

Browse files

Files changed (10)

config.json +2 -1
generation_config.json +1 -1
onnx/decoder_model.onnx +2 -2
onnx/decoder_model_merged.onnx +2 -2
onnx/decoder_model_merged_quantized.onnx +2 -2
onnx/decoder_model_quantized.onnx +2 -2
onnx/decoder_with_past_model.onnx +2 -2
onnx/decoder_with_past_model_quantized.onnx +2 -2
quantize_config.json +139 -0
tokenizer_config.json +1 -0

config.json CHANGED Viewed

@@ -3,6 +3,7 @@
   "architectures": [
     "T5ForConditionalGeneration"
   ],
   "d_ff": 1024,
   "d_kv": 64,
   "d_model": 512,
@@ -24,7 +25,7 @@
   "relative_attention_max_distance": 128,
   "relative_attention_num_buckets": 32,
   "tie_word_embeddings": false,
-  "transformers_version": "4.29.2",
   "use_cache": true,
   "vocab_size": 32128
 }

   "architectures": [
     "T5ForConditionalGeneration"
   ],
+  "classifier_dropout": 0.0,
   "d_ff": 1024,
   "d_kv": 64,
   "d_model": 512,
   "relative_attention_max_distance": 128,
   "relative_attention_num_buckets": 32,
   "tie_word_embeddings": false,
+  "transformers_version": "4.33.0.dev0",
   "use_cache": true,
   "vocab_size": 32128
 }

generation_config.json CHANGED Viewed

@@ -3,5 +3,5 @@
   "decoder_start_token_id": 0,
   "eos_token_id": 1,
   "pad_token_id": 0,
-  "transformers_version": "4.29.2"
 }

   "decoder_start_token_id": 0,
   "eos_token_id": 1,
   "pad_token_id": 0,
+  "transformers_version": "4.33.0.dev0"
 }

onnx/decoder_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d127e71a74ef0ce05f055942680cd888c4ff919148000d8bec72d70d28d52fcf
-size 232553947

 version https://git-lfs.github.com/spec/v1
+oid sha256:52d42a1456684fa728a4a00719feda8da997e7f914949bb44dc0aad7d29a376d
+size 232553640

onnx/decoder_model_merged.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:81fc9fb634ada96ec24acbe496107e65c29d83001b90ca7bfa7d51d9145c9b1c
-size 232785013

 version https://git-lfs.github.com/spec/v1
+oid sha256:e626548c9f7354ba077c355ff4412a07dc455b35719e4f7cd467ff4a61cb7320
+size 232784326

onnx/decoder_model_merged_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d8d182742637a76d2224975f60201b91e4410e75f10961e70abac2b174a77da5
-size 59340172

 version https://git-lfs.github.com/spec/v1
+oid sha256:b79a93296dc081de06e9225e5268ccb4f22977f9e8aa92bd6a4623fd7c100e1a
+size 59339331

onnx/decoder_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3a3961aee00cca80a6be942ef2dbcd8ead9d4bb1900dc486fece99c6a0ecfdc8
-size 58943706

 version https://git-lfs.github.com/spec/v1
+oid sha256:a29c9a46fecc1546ecadbc071cdd16de023b4154cb5b09749b08995849db71b8
+size 58943318

onnx/decoder_with_past_model.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c79a621efa007d70baed6e3d3348296c8327d09f8dec0f8f7b03d26d8d9b6939
-size 219954259

 version https://git-lfs.github.com/spec/v1
+oid sha256:0487eff4fd959d7f85751178e18b663cd8855d16d8d8d6296bd95ac56bc1b1ed
+size 219953954

onnx/decoder_with_past_model_quantized.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:10cdf3fb63a4629c0b5fc1aa8ed71af258c91ec80989156cc626d866ec30a6c4
-size 55729558

 version https://git-lfs.github.com/spec/v1
+oid sha256:00c765a02883f4655abb9fdf2c190fabe152d11b9ed716c5351f9781c9082435
+size 55729181

quantize_config.json ADDED Viewed

@@ -0,0 +1,139 @@

+{
+    "per_channel": true,
+    "reduce_range": true,
+    "per_model_config": {
+        "decoder_model": {
+            "op_types": [
+                "Log",
+                "Gather",
+                "MatMul",
+                "Sqrt",
+                "Pow",
+                "Neg",
+                "ConstantOfShape",
+                "Cast",
+                "Less",
+                "Reshape",
+                "Tile",
+                "LessOrEqual",
+                "Range",
+                "ReduceMean",
+                "Where",
+                "Expand",
+                "Mul",
+                "Shape",
+                "Add",
+                "Concat",
+                "Transpose",
+                "Constant",
+                "Sub",
+                "Tanh",
+                "Softmax",
+                "Unsqueeze",
+                "Min",
+                "Div"
+            ],
+            "weight_type": "QInt8"
+        },
+        "encoder_model": {
+            "op_types": [
+                "Log",
+                "Gather",
+                "MatMul",
+                "Sqrt",
+                "Pow",
+                "Greater",
+                "Cast",
+                "ConstantOfShape",
+                "Less",
+                "Reshape",
+                "Range",
+                "ReduceMean",
+                "Where",
+                "Mul",
+                "Abs",
+                "Shape",
+                "Add",
+                "Concat",
+                "Transpose",
+                "Constant",
+                "Sub",
+                "Tanh",
+                "Softmax",
+                "Unsqueeze",
+                "Min",
+                "Div"
+            ],
+            "weight_type": "QInt8"
+        },
+        "decoder_model_merged": {
+            "op_types": [
+                "Log",
+                "Gather",
+                "MatMul",
+                "Sqrt",
+                "Pow",
+                "Neg",
+                "ConstantOfShape",
+                "Cast",
+                "Less",
+                "Reshape",
+                "Tile",
+                "LessOrEqual",
+                "Range",
+                "If",
+                "ReduceMean",
+                "Where",
+                "Expand",
+                "Mul",
+                "Shape",
+                "Add",
+                "Concat",
+                "Transpose",
+                "Constant",
+                "Sub",
+                "Tanh",
+                "Softmax",
+                "Unsqueeze",
+                "Min",
+                "Slice",
+                "Div"
+            ],
+            "weight_type": "QInt8"
+        },
+        "decoder_with_past_model": {
+            "op_types": [
+                "Log",
+                "Gather",
+                "MatMul",
+                "Sqrt",
+                "Pow",
+                "Neg",
+                "ConstantOfShape",
+                "Cast",
+                "Less",
+                "Reshape",
+                "Tile",
+                "LessOrEqual",
+                "Range",
+                "ReduceMean",
+                "Where",
+                "Expand",
+                "Mul",
+                "Shape",
+                "Add",
+                "Concat",
+                "Transpose",
+                "Constant",
+                "Sub",
+                "Tanh",
+                "Softmax",
+                "Unsqueeze",
+                "Min",
+                "Slice",
+                "Div"
+            ],
+            "weight_type": "QInt8"
+        }
+    }
+}

tokenizer_config.json CHANGED Viewed

@@ -104,6 +104,7 @@
   "clean_up_tokenization_spaces": true,
   "eos_token": "</s>",
   "extra_ids": 100,
   "model_max_length": 512,
   "pad_token": "<pad>",
   "sp_model_kwargs": {},

   "clean_up_tokenization_spaces": true,
   "eos_token": "</s>",
   "extra_ids": 100,
+  "legacy": true,
   "model_max_length": 512,
   "pad_token": "<pad>",
   "sp_model_kwargs": {},