diff --git a/quantized/distilgpt2/causal-lm-with-past/decoder_model.onnx b/quantized/distilgpt2/causal-lm-with-past/decoder_model.onnx
index cae8d7adb3a73bd7a263150ab524d366f4a525d5..3574246ead2c54e92a3cbf4d24c2b77addc699bd 100644
--- a/quantized/distilgpt2/causal-lm-with-past/decoder_model.onnx
+++ b/quantized/distilgpt2/causal-lm-with-past/decoder_model.onnx
@@ -1,3 +1,3 @@
version https://git-lfs.github.com/spec/v1
-oid sha256:ced5da743a77529eb62060115580596dbb21702b7bd3af9e3ed64c9207562c7a
-size 249582838
+oid sha256:d447949536a14e0930c48b23fc34e2a6fdbdfa22c958dff787fe23d5e88b9ec8
+size 249587577
diff --git a/quantized/distilgpt2/causal-lm-with-past/decoder_model_merged.onnx b/quantized/distilgpt2/causal-lm-with-past/decoder_model_merged.onnx
new file mode 100644
index 0000000000000000000000000000000000000000..1cbaaf18af019a333e72f5f2fdbeaa764a944649
--- /dev/null
+++ b/quantized/distilgpt2/causal-lm-with-past/decoder_model_merged.onnx
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:0df8008063684caea7f35b9a7051a8693ab548acfc29449b3c4e94331cc46b4f
+size 249675200
diff --git a/quantized/distilgpt2/causal-lm-with-past/decoder_with_past_model.onnx b/quantized/distilgpt2/causal-lm-with-past/decoder_with_past_model.onnx
index b1b73c9ebfc4a76242783700d76082beb6bc76e2..9b0cfd607898a633bc69265726661829a1b2e9c8 100644
--- a/quantized/distilgpt2/causal-lm-with-past/decoder_with_past_model.onnx
+++ b/quantized/distilgpt2/causal-lm-with-past/decoder_with_past_model.onnx
@@ -1,3 +1,3 @@
version https://git-lfs.github.com/spec/v1
-oid sha256:8ce5f0c2fee02591c5657ac5c4f7d7d6ff01bdd836eab72339e9d2068cef443f
-size 249586984
+oid sha256:66c0af50c63820a310c0bb0f7269a807e357d3d77bc18fda409464c6948cb627
+size 249592120
diff --git a/quantized/distilgpt2/causal-lm-with-past/tokenizer.json b/quantized/distilgpt2/causal-lm-with-past/tokenizer.json
index 6dc5e94ca994de07d374e33698489de9cff48a02..22043ac6ec947359001e20840908973ea620781e 100644
--- a/quantized/distilgpt2/causal-lm-with-past/tokenizer.json
+++ b/quantized/distilgpt2/causal-lm-with-past/tokenizer.json
@@ -5,32 +5,29 @@
"added_tokens": [
{
"id": 50256,
+ "special": true,
"content": "<|endoftext|>",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
}
],
"normalizer": null,
"pre_tokenizer": {
"type": "ByteLevel",
"add_prefix_space": false,
- "trim_offsets": true,
- "use_regex": true
+ "trim_offsets": true
},
"post_processor": {
"type": "ByteLevel",
"add_prefix_space": true,
- "trim_offsets": false,
- "use_regex": true
+ "trim_offsets": false
},
"decoder": {
"type": "ByteLevel",
"add_prefix_space": true,
- "trim_offsets": true,
- "use_regex": true
+ "trim_offsets": true
},
"model": {
"type": "BPE",
diff --git a/quantized/google/flan-t5-base/seq2seq-lm-with-past/decoder_model.onnx b/quantized/google/flan-t5-base/seq2seq-lm-with-past/decoder_model.onnx
index a0ccd4da297f339be26c6823c32735e177a28f0e..6ff3f34fd1bb0344d3b724e1c50546039e38308e 100644
--- a/quantized/google/flan-t5-base/seq2seq-lm-with-past/decoder_model.onnx
+++ b/quantized/google/flan-t5-base/seq2seq-lm-with-past/decoder_model.onnx
@@ -1,3 +1,3 @@
version https://git-lfs.github.com/spec/v1
-oid sha256:4d6821426c8d3dd75f7ed83426e50b6d58af2154590175a36a8c5ff05b65e911
-size 164245993
+oid sha256:3a5dedfa56dfa3a66c840af98ab0c0438ea97e2905947de9c1cdbc2a3c5139c4
+size 164336072
diff --git a/quantized/google/flan-t5-base/seq2seq-lm-with-past/decoder_model_merged.onnx b/quantized/google/flan-t5-base/seq2seq-lm-with-past/decoder_model_merged.onnx
new file mode 100644
index 0000000000000000000000000000000000000000..e5f264454e379bb891c9b8f8b2bae9d49a0b411e
--- /dev/null
+++ b/quantized/google/flan-t5-base/seq2seq-lm-with-past/decoder_model_merged.onnx
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:54318115238b89ab4fa6b1fd85cf4e55cd89f14f164ab4019ee98e68d0cca55e
+size 164549246
diff --git a/quantized/google/flan-t5-base/seq2seq-lm-with-past/decoder_with_past_model.onnx b/quantized/google/flan-t5-base/seq2seq-lm-with-past/decoder_with_past_model.onnx
index b4fd788b9cd9c92cf7733ff61557c7cf5dbbefb4..aab7b686f33a9ed165965d74354483860a62c540 100644
--- a/quantized/google/flan-t5-base/seq2seq-lm-with-past/decoder_with_past_model.onnx
+++ b/quantized/google/flan-t5-base/seq2seq-lm-with-past/decoder_with_past_model.onnx
@@ -1,3 +1,3 @@
version https://git-lfs.github.com/spec/v1
-oid sha256:9231c30c03c92a38ab63ad24ab9440897d19bf11bee0e7b70c0fff9aa540b466
-size 149938415
+oid sha256:422cfaa90b115c4ea60f43b94fd8fda445d9150b2e401ddd8db8408c9e3b6b99
+size 150019481
diff --git a/quantized/google/flan-t5-base/seq2seq-lm-with-past/encoder_model.onnx b/quantized/google/flan-t5-base/seq2seq-lm-with-past/encoder_model.onnx
index 1cb31eb743f36f948cd9fabf1b591272ef7d6a46..4f72e3feb3008aa9d496e76630d17921bad3a0db 100644
--- a/quantized/google/flan-t5-base/seq2seq-lm-with-past/encoder_model.onnx
+++ b/quantized/google/flan-t5-base/seq2seq-lm-with-past/encoder_model.onnx
@@ -1,3 +1,3 @@
version https://git-lfs.github.com/spec/v1
-oid sha256:f8ee6a0e07f0b6f1b5aaca54e4d5ed320034fa3e433121706e2da7514072f718
-size 110539783
+oid sha256:2706491228c349685ee85c1d67a057bd173cca81ef1c5d229a47c3b49e81370c
+size 110585314
diff --git a/quantized/google/flan-t5-small/seq2seq-lm-with-past/decoder_model.onnx b/quantized/google/flan-t5-small/seq2seq-lm-with-past/decoder_model.onnx
index 6bd320a12e366add128f456eb487e871419548bb..5d680864d304b9ef61436fd9aa55ffcc79504c2c 100644
--- a/quantized/google/flan-t5-small/seq2seq-lm-with-past/decoder_model.onnx
+++ b/quantized/google/flan-t5-small/seq2seq-lm-with-past/decoder_model.onnx
@@ -1,3 +1,3 @@
version https://git-lfs.github.com/spec/v1
-oid sha256:d5b1ebae6276d191107b7eead3d142b970542d9262d952900df8107fa89bf619
-size 58998475
+oid sha256:288c543b7ed377cc89929c89ddc64d2ea32d35a40cc084b997aad3933643fd89
+size 59058672
diff --git a/quantized/google/flan-t5-small/seq2seq-lm-with-past/decoder_model_merged.onnx b/quantized/google/flan-t5-small/seq2seq-lm-with-past/decoder_model_merged.onnx
new file mode 100644
index 0000000000000000000000000000000000000000..183fef4143c8f8016453488cc1769aeb4c990f5c
--- /dev/null
+++ b/quantized/google/flan-t5-small/seq2seq-lm-with-past/decoder_model_merged.onnx
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8d623ab57fed27150b5517a955295a20effb4099ae7d51c44bf279e794243db6
+size 59247726
diff --git a/quantized/google/flan-t5-small/seq2seq-lm-with-past/decoder_with_past_model.onnx b/quantized/google/flan-t5-small/seq2seq-lm-with-past/decoder_with_past_model.onnx
index aa2c305cf188eee7c83855db3d798189225542f7..74c2d79c85e97196748a7a81b99a38cb3c2219ad 100644
--- a/quantized/google/flan-t5-small/seq2seq-lm-with-past/decoder_with_past_model.onnx
+++ b/quantized/google/flan-t5-small/seq2seq-lm-with-past/decoder_with_past_model.onnx
@@ -1,3 +1,3 @@
version https://git-lfs.github.com/spec/v1
-oid sha256:0a64bcefa3b4fa4ab2a23854dd89a44bfbf2c76b4418d2e7665217631c57b6d6
-size 55785322
+oid sha256:12d22d076005b8d6d0e98bbf149b2561cf4911f3f4f1af33f16e806fb7fabe53
+size 55839462
diff --git a/quantized/google/flan-t5-small/seq2seq-lm-with-past/encoder_model.onnx b/quantized/google/flan-t5-small/seq2seq-lm-with-past/encoder_model.onnx
index fdb7f3d8ab018c1bf06a81ba611b338e1620ea17..b75a60c3e312daca48dd7821ca32cc1effba948b 100644
--- a/quantized/google/flan-t5-small/seq2seq-lm-with-past/encoder_model.onnx
+++ b/quantized/google/flan-t5-small/seq2seq-lm-with-past/encoder_model.onnx
@@ -1,3 +1,3 @@
version https://git-lfs.github.com/spec/v1
-oid sha256:776cd40d25b7026fb4f3301f4ca82a026f844db74f9e94e6b05672940bb39e27
-size 35784005
+oid sha256:e7c4d50cb1270f49639b46399f89a4a1f25cb3e95fbecaf236785b909048a736
+size 35814394
diff --git a/quantized/google/t5-v1_1-base/seq2seq-lm-with-past/decoder_model.onnx b/quantized/google/t5-v1_1-base/seq2seq-lm-with-past/decoder_model.onnx
index 657170f1b0e2b2f0cf04dc871b34e6fa8ce967fb..cf43ac93c79a6d945f76d3b26db3ad2ea93e34aa 100644
--- a/quantized/google/t5-v1_1-base/seq2seq-lm-with-past/decoder_model.onnx
+++ b/quantized/google/t5-v1_1-base/seq2seq-lm-with-past/decoder_model.onnx
@@ -1,3 +1,3 @@
version https://git-lfs.github.com/spec/v1
-oid sha256:83f4e696ca09795bee52c3c19642cf0ace200aa576ea2006833198be83ec6216
-size 164245993
+oid sha256:17990f89e69dfde950c25c0866fb4435812d36bfbf46db7351a9d5608c70efbd
+size 164336072
diff --git a/quantized/google/t5-v1_1-base/seq2seq-lm-with-past/decoder_model_merged.onnx b/quantized/google/t5-v1_1-base/seq2seq-lm-with-past/decoder_model_merged.onnx
new file mode 100644
index 0000000000000000000000000000000000000000..0256a5351904cbf0f14f364005b5dc0bf408228e
--- /dev/null
+++ b/quantized/google/t5-v1_1-base/seq2seq-lm-with-past/decoder_model_merged.onnx
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:fc2ed6d6efd0f727e277aa8a3f5f44b36b6a0f6e808add5c898ced2a5bbe6cf1
+size 164549246
diff --git a/quantized/google/t5-v1_1-base/seq2seq-lm-with-past/decoder_with_past_model.onnx b/quantized/google/t5-v1_1-base/seq2seq-lm-with-past/decoder_with_past_model.onnx
index 68f0e1a059e4444e712fb9398838763e43063fd2..ccdedea39f190bd715967690a08873d8f4ed09bc 100644
--- a/quantized/google/t5-v1_1-base/seq2seq-lm-with-past/decoder_with_past_model.onnx
+++ b/quantized/google/t5-v1_1-base/seq2seq-lm-with-past/decoder_with_past_model.onnx
@@ -1,3 +1,3 @@
version https://git-lfs.github.com/spec/v1
-oid sha256:9735f078a8d070177a970d5353668ded23942d076a6cf6ba07cb7aad3fc32529
-size 149938415
+oid sha256:4299f5e1c01b33df8658fe4a6857a1fff1e3d47db7a1eba6c71ff672cd5af75b
+size 150019481
diff --git a/quantized/google/t5-v1_1-base/seq2seq-lm-with-past/encoder_model.onnx b/quantized/google/t5-v1_1-base/seq2seq-lm-with-past/encoder_model.onnx
index ffabd1d9092c4546e4e3c7d54a2257c0b5f7be3b..bd555f1d51ec14a106e637f0658f7515f520a86c 100644
--- a/quantized/google/t5-v1_1-base/seq2seq-lm-with-past/encoder_model.onnx
+++ b/quantized/google/t5-v1_1-base/seq2seq-lm-with-past/encoder_model.onnx
@@ -1,3 +1,3 @@
version https://git-lfs.github.com/spec/v1
-oid sha256:33d0af70e4475f683586ca53c9b7a6c3a2eaaaaa305f705df9c5e897b1128934
-size 110539783
+oid sha256:5ac0d4f6da965ec8a2c2a91a32155cc92e7d5158e27c5e36d10b75e00da91e67
+size 110585314
diff --git a/quantized/google/t5-v1_1-small/seq2seq-lm-with-past/decoder_model.onnx b/quantized/google/t5-v1_1-small/seq2seq-lm-with-past/decoder_model.onnx
index 4640c00b332b910c068dd08ce039ae3aa4afecc7..05bfbdf9ab7a8ab879fb39d9405d103f1aecc172 100644
--- a/quantized/google/t5-v1_1-small/seq2seq-lm-with-past/decoder_model.onnx
+++ b/quantized/google/t5-v1_1-small/seq2seq-lm-with-past/decoder_model.onnx
@@ -1,3 +1,3 @@
version https://git-lfs.github.com/spec/v1
-oid sha256:d12084abc7a8cb0771c9298cbe3d4b3ed9e8b2ec47886ddb11d600fb3a6e5c5a
-size 58998475
+oid sha256:a5982955fba72cbc80221160fce037440d3a670c91e9bcd9beb6788a962771f6
+size 59058672
diff --git a/quantized/google/t5-v1_1-small/seq2seq-lm-with-past/decoder_model_merged.onnx b/quantized/google/t5-v1_1-small/seq2seq-lm-with-past/decoder_model_merged.onnx
new file mode 100644
index 0000000000000000000000000000000000000000..3bb0fb69533b01c6109570be17a40e0eef55bd31
--- /dev/null
+++ b/quantized/google/t5-v1_1-small/seq2seq-lm-with-past/decoder_model_merged.onnx
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:7a9d30911a12b36bc0df67abc93450da5fa8346992f2c2b1846f144fa814626c
+size 59247726
diff --git a/quantized/google/t5-v1_1-small/seq2seq-lm-with-past/decoder_with_past_model.onnx b/quantized/google/t5-v1_1-small/seq2seq-lm-with-past/decoder_with_past_model.onnx
index ffab8fedac4dd47f6651ef175c1e75c920ad5703..76bb033204d628a66ca83e8d82aed04cc1230dfc 100644
--- a/quantized/google/t5-v1_1-small/seq2seq-lm-with-past/decoder_with_past_model.onnx
+++ b/quantized/google/t5-v1_1-small/seq2seq-lm-with-past/decoder_with_past_model.onnx
@@ -1,3 +1,3 @@
version https://git-lfs.github.com/spec/v1
-oid sha256:863de1616d28644332df2331cad5000cf700ff3b7bf9b8de42e46af6a7314b67
-size 55785322
+oid sha256:8a2315a861d9f3a8fddb8edcd0675dd3bf000fd93140c8b31b7dd6e9c012014c
+size 55839462
diff --git a/quantized/google/t5-v1_1-small/seq2seq-lm-with-past/encoder_model.onnx b/quantized/google/t5-v1_1-small/seq2seq-lm-with-past/encoder_model.onnx
index 44027cdc4969b7a6595dd208604147990139d3c0..487c0afb50ab7635729b07cc0749b7ef2910986e 100644
--- a/quantized/google/t5-v1_1-small/seq2seq-lm-with-past/encoder_model.onnx
+++ b/quantized/google/t5-v1_1-small/seq2seq-lm-with-past/encoder_model.onnx
@@ -1,3 +1,3 @@
version https://git-lfs.github.com/spec/v1
-oid sha256:438e80e369cd88a92eb55bf623c4ae2616dcff678949e424ae4f8f9fa41e9786
-size 35784005
+oid sha256:6b6585dcde89301247cd8dfe0dbb221e83c5427217bbff424e78adeaafc98334
+size 35814394
diff --git a/quantized/openai/whisper-base.en/default/config.json b/quantized/openai/whisper-base.en/default/config.json
index 0f0e052c322a7af5d702c50986a7f473c51abbdd..a06a0040590d419e3641482853812b18d546efb6 100644
--- a/quantized/openai/whisper-base.en/default/config.json
+++ b/quantized/openai/whisper-base.en/default/config.json
@@ -129,7 +129,6 @@
50360,
50361
],
- "torch_dtype": "float32",
"transformers_version": "4.26.1",
"use_cache": true,
"vocab_size": 51864
diff --git a/quantized/openai/whisper-base.en/default/decoder_model.onnx b/quantized/openai/whisper-base.en/default/decoder_model.onnx
index 294284e73c05b9f908e2b232c7b86e7f4f06578b..0e3872fd3a7a5f30772eda0b02a375b9a7467026 100644
--- a/quantized/openai/whisper-base.en/default/decoder_model.onnx
+++ b/quantized/openai/whisper-base.en/default/decoder_model.onnx
@@ -1,3 +1,3 @@
version https://git-lfs.github.com/spec/v1
-oid sha256:65591b39b49623c74b360af28509182a4054355c9d9d14b254566f257928d406
-size 53466938
+oid sha256:90e2a5e52df832bbc35fb104cfc63deb2a3731bfe3c997df73f5fa234ee9e363
+size 53464941
diff --git a/quantized/openai/whisper-base.en/default/encoder_model.onnx b/quantized/openai/whisper-base.en/default/encoder_model.onnx
index 486176a7ab468d82d246222c1fbaa6d4baf20bfa..bd31f8e0f4870805e04aa758e0cfc4a2b2ddfefc 100644
--- a/quantized/openai/whisper-base.en/default/encoder_model.onnx
+++ b/quantized/openai/whisper-base.en/default/encoder_model.onnx
@@ -1,3 +1,3 @@
version https://git-lfs.github.com/spec/v1
-oid sha256:a8daef92b616d36adf1c086f89280443effd2c77c7e8c730113514833f076ca6
-size 23337231
+oid sha256:5ceadcf4cb45d3e07507174a5f281f745085f01ea01b32f11dcb14f20e81291b
+size 23337235
diff --git a/quantized/openai/whisper-base.en/default/tokenizer_config.json b/quantized/openai/whisper-base.en/default/tokenizer_config.json
index 044482e72ceb1721e9eadd5f8b4dd6fd8dee382b..5c2ea33b72e5dbe2a90929e27eb5ead584bbbb84 100644
--- a/quantized/openai/whisper-base.en/default/tokenizer_config.json
+++ b/quantized/openai/whisper-base.en/default/tokenizer_config.json
@@ -25,7 +25,6 @@
"return_attention_mask": false,
"special_tokens_map_file": null,
"tokenizer_class": "WhisperTokenizer",
- "trust_remote_code": false,
"unk_token": {
"__type": "AddedToken",
"content": "<|endoftext|>",
diff --git a/quantized/openai/whisper-base.en/speech2seq-lm-with-past/config.json b/quantized/openai/whisper-base.en/speech2seq-lm-with-past/config.json
index 0f0e052c322a7af5d702c50986a7f473c51abbdd..a06a0040590d419e3641482853812b18d546efb6 100644
--- a/quantized/openai/whisper-base.en/speech2seq-lm-with-past/config.json
+++ b/quantized/openai/whisper-base.en/speech2seq-lm-with-past/config.json
@@ -129,7 +129,6 @@
50360,
50361
],
- "torch_dtype": "float32",
"transformers_version": "4.26.1",
"use_cache": true,
"vocab_size": 51864
diff --git a/quantized/openai/whisper-base.en/speech2seq-lm-with-past/decoder_model.onnx b/quantized/openai/whisper-base.en/speech2seq-lm-with-past/decoder_model.onnx
index 7da2a923670e9cfd0c444049244d8956b9484ee7..802bff66808d25d67822eba79e1e409cb5709bac 100644
--- a/quantized/openai/whisper-base.en/speech2seq-lm-with-past/decoder_model.onnx
+++ b/quantized/openai/whisper-base.en/speech2seq-lm-with-past/decoder_model.onnx
@@ -1,3 +1,3 @@
version https://git-lfs.github.com/spec/v1
-oid sha256:acf55ec8ff985302cd968ad47b9a7ab9661b8dedd784270d12f1bd53cb79aeed
-size 80323040
+oid sha256:d1a4eb50199211fafcccf5efb8176ab1f3422597fc767f05d30c559ce091abe6
+size 80321068
diff --git a/quantized/openai/whisper-base.en/speech2seq-lm-with-past/decoder_model_merged.onnx b/quantized/openai/whisper-base.en/speech2seq-lm-with-past/decoder_model_merged.onnx
new file mode 100644
index 0000000000000000000000000000000000000000..5f990eac67816cc01e52db323bfb778689a03210
--- /dev/null
+++ b/quantized/openai/whisper-base.en/speech2seq-lm-with-past/decoder_model_merged.onnx
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9b2396a1c4079f5b541d05ccfd21bef6d20af75e48f9ac5c34bc4b67f3751fb5
+size 80556990
diff --git a/quantized/openai/whisper-base.en/speech2seq-lm-with-past/decoder_with_past_model.onnx b/quantized/openai/whisper-base.en/speech2seq-lm-with-past/decoder_with_past_model.onnx
index e8f53e37f63d3e861f24b83f1400c3fdae0e5d7a..f30e4dfcbe712e2e7dbf95874792f79411622054 100644
--- a/quantized/openai/whisper-base.en/speech2seq-lm-with-past/decoder_with_past_model.onnx
+++ b/quantized/openai/whisper-base.en/speech2seq-lm-with-past/decoder_with_past_model.onnx
@@ -1,3 +1,3 @@
version https://git-lfs.github.com/spec/v1
-oid sha256:ab2ca295c5f803fd34d4583b9f1cfd6ad77370c3fec30a680c5bbcb9d4202dfb
-size 77066559
+oid sha256:65b70d66fa9dbb1a61c863065100a08bf58a689383b212b1e91646738cc97424
+size 77066299
diff --git a/quantized/openai/whisper-base.en/speech2seq-lm-with-past/encoder_model.onnx b/quantized/openai/whisper-base.en/speech2seq-lm-with-past/encoder_model.onnx
index 486176a7ab468d82d246222c1fbaa6d4baf20bfa..bd31f8e0f4870805e04aa758e0cfc4a2b2ddfefc 100644
--- a/quantized/openai/whisper-base.en/speech2seq-lm-with-past/encoder_model.onnx
+++ b/quantized/openai/whisper-base.en/speech2seq-lm-with-past/encoder_model.onnx
@@ -1,3 +1,3 @@
version https://git-lfs.github.com/spec/v1
-oid sha256:a8daef92b616d36adf1c086f89280443effd2c77c7e8c730113514833f076ca6
-size 23337231
+oid sha256:5ceadcf4cb45d3e07507174a5f281f745085f01ea01b32f11dcb14f20e81291b
+size 23337235
diff --git a/quantized/openai/whisper-base.en/speech2seq-lm-with-past/tokenizer_config.json b/quantized/openai/whisper-base.en/speech2seq-lm-with-past/tokenizer_config.json
index 044482e72ceb1721e9eadd5f8b4dd6fd8dee382b..5c2ea33b72e5dbe2a90929e27eb5ead584bbbb84 100644
--- a/quantized/openai/whisper-base.en/speech2seq-lm-with-past/tokenizer_config.json
+++ b/quantized/openai/whisper-base.en/speech2seq-lm-with-past/tokenizer_config.json
@@ -25,7 +25,6 @@
"return_attention_mask": false,
"special_tokens_map_file": null,
"tokenizer_class": "WhisperTokenizer",
- "trust_remote_code": false,
"unk_token": {
"__type": "AddedToken",
"content": "<|endoftext|>",
diff --git a/quantized/openai/whisper-base/default/config.json b/quantized/openai/whisper-base/default/config.json
index 9f0ec8146473ef27fb6be214f8e0fc08b0776cfd..546d4ae6ee01d58080a61b9e3e55c72951c9b6a9 100644
--- a/quantized/openai/whisper-base/default/config.json
+++ b/quantized/openai/whisper-base/default/config.json
@@ -135,7 +135,6 @@
50361,
50362
],
- "torch_dtype": "float32",
"transformers_version": "4.26.1",
"use_cache": true,
"vocab_size": 51865
diff --git a/quantized/openai/whisper-base/default/decoder_model.onnx b/quantized/openai/whisper-base/default/decoder_model.onnx
index 64fa956fe669729e32559cb4677b638e7a712bbc..9ef76f7e8dc0f392bbbfd402ec152c4e9c3e3aaa 100644
--- a/quantized/openai/whisper-base/default/decoder_model.onnx
+++ b/quantized/openai/whisper-base/default/decoder_model.onnx
@@ -1,3 +1,3 @@
version https://git-lfs.github.com/spec/v1
-oid sha256:5d6942cf3bd8173fae3ddd56932bb1330e99845c8d1f291f622f7ddc5dea14ab
-size 53467450
+oid sha256:7a5866bc679ce0c107395289250eae85918be53afd49e3bb3b026710d7023dcd
+size 53465453
diff --git a/quantized/openai/whisper-base/default/encoder_model.onnx b/quantized/openai/whisper-base/default/encoder_model.onnx
index c6eb28a97e6f377867c6aa3c6d3b1dd3b94095cc..e48e8541da7a61e7e5f3072382653a029d995e51 100644
--- a/quantized/openai/whisper-base/default/encoder_model.onnx
+++ b/quantized/openai/whisper-base/default/encoder_model.onnx
@@ -1,3 +1,3 @@
version https://git-lfs.github.com/spec/v1
-oid sha256:c4c995617d3e567ff954695388801dab9d13fae1804103a974a8ecd6e7bcfa9a
-size 23337231
+oid sha256:1990e063ab168d67092cbbd32588acb425e6d767bd3af38ecf36137fe3914b41
+size 23337235
diff --git a/quantized/openai/whisper-base/default/tokenizer_config.json b/quantized/openai/whisper-base/default/tokenizer_config.json
index 6b0a72ce5cf3c335eab27a46d2fa0f812e6b48fd..2dfd88e8dfba2c386243c900f3f8f9ddaa1f604a 100644
--- a/quantized/openai/whisper-base/default/tokenizer_config.json
+++ b/quantized/openai/whisper-base/default/tokenizer_config.json
@@ -25,7 +25,6 @@
"return_attention_mask": false,
"special_tokens_map_file": null,
"tokenizer_class": "WhisperTokenizer",
- "trust_remote_code": false,
"unk_token": {
"__type": "AddedToken",
"content": "<|endoftext|>",
diff --git a/quantized/openai/whisper-base/speech2seq-lm-with-past/config.json b/quantized/openai/whisper-base/speech2seq-lm-with-past/config.json
index 9f0ec8146473ef27fb6be214f8e0fc08b0776cfd..546d4ae6ee01d58080a61b9e3e55c72951c9b6a9 100644
--- a/quantized/openai/whisper-base/speech2seq-lm-with-past/config.json
+++ b/quantized/openai/whisper-base/speech2seq-lm-with-past/config.json
@@ -135,7 +135,6 @@
50361,
50362
],
- "torch_dtype": "float32",
"transformers_version": "4.26.1",
"use_cache": true,
"vocab_size": 51865
diff --git a/quantized/openai/whisper-base/speech2seq-lm-with-past/decoder_model.onnx b/quantized/openai/whisper-base/speech2seq-lm-with-past/decoder_model.onnx
index 0c5b6f60aa016aef6d693877b248407e201c3a0e..eded76ecf7775900e3d2506aa1f333b8ac03690a 100644
--- a/quantized/openai/whisper-base/speech2seq-lm-with-past/decoder_model.onnx
+++ b/quantized/openai/whisper-base/speech2seq-lm-with-past/decoder_model.onnx
@@ -1,3 +1,3 @@
version https://git-lfs.github.com/spec/v1
-oid sha256:d7a8b7bfa9d2117ed40edc1bfca3e5de318c04b601b215bc651023eda15c6bed
-size 80324069
+oid sha256:0800f9c5cd63139166bf2031993b8e136bb754a76a94aaf25a9e9b0dd9cc73bf
+size 80322097
diff --git a/quantized/openai/whisper-base/speech2seq-lm-with-past/decoder_model_merged.onnx b/quantized/openai/whisper-base/speech2seq-lm-with-past/decoder_model_merged.onnx
new file mode 100644
index 0000000000000000000000000000000000000000..b7da53318684804acaa0e8c4865dd666bf782fc4
--- /dev/null
+++ b/quantized/openai/whisper-base/speech2seq-lm-with-past/decoder_model_merged.onnx
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:62aac7f57c5f696817983bb46f45b694d9e870727dcade1c2be707146b1e215e
+size 80558019
diff --git a/quantized/openai/whisper-base/speech2seq-lm-with-past/decoder_with_past_model.onnx b/quantized/openai/whisper-base/speech2seq-lm-with-past/decoder_with_past_model.onnx
index 5695c4c27a814353e584698f2dc3f9c6c4be36e6..06d0a7adc5c314484830480d21e5f109e5a45f68 100644
--- a/quantized/openai/whisper-base/speech2seq-lm-with-past/decoder_with_past_model.onnx
+++ b/quantized/openai/whisper-base/speech2seq-lm-with-past/decoder_with_past_model.onnx
@@ -1,3 +1,3 @@
version https://git-lfs.github.com/spec/v1
-oid sha256:97cf2a4270fee757ec5cc239c165b0b63814fe4c9160e3910d2099efa460c5d7
-size 77067588
+oid sha256:6f1e5181fd479407e403f50594bb14a38bca8f6c86e27b656c4066aaf9cd0a72
+size 77067328
diff --git a/quantized/openai/whisper-base/speech2seq-lm-with-past/encoder_model.onnx b/quantized/openai/whisper-base/speech2seq-lm-with-past/encoder_model.onnx
index c6eb28a97e6f377867c6aa3c6d3b1dd3b94095cc..e48e8541da7a61e7e5f3072382653a029d995e51 100644
--- a/quantized/openai/whisper-base/speech2seq-lm-with-past/encoder_model.onnx
+++ b/quantized/openai/whisper-base/speech2seq-lm-with-past/encoder_model.onnx
@@ -1,3 +1,3 @@
version https://git-lfs.github.com/spec/v1
-oid sha256:c4c995617d3e567ff954695388801dab9d13fae1804103a974a8ecd6e7bcfa9a
-size 23337231
+oid sha256:1990e063ab168d67092cbbd32588acb425e6d767bd3af38ecf36137fe3914b41
+size 23337235
diff --git a/quantized/openai/whisper-base/speech2seq-lm-with-past/tokenizer_config.json b/quantized/openai/whisper-base/speech2seq-lm-with-past/tokenizer_config.json
index 6b0a72ce5cf3c335eab27a46d2fa0f812e6b48fd..2dfd88e8dfba2c386243c900f3f8f9ddaa1f604a 100644
--- a/quantized/openai/whisper-base/speech2seq-lm-with-past/tokenizer_config.json
+++ b/quantized/openai/whisper-base/speech2seq-lm-with-past/tokenizer_config.json
@@ -25,7 +25,6 @@
"return_attention_mask": false,
"special_tokens_map_file": null,
"tokenizer_class": "WhisperTokenizer",
- "trust_remote_code": false,
"unk_token": {
"__type": "AddedToken",
"content": "<|endoftext|>",
diff --git a/quantized/openai/whisper-small.en/default/config.json b/quantized/openai/whisper-small.en/default/config.json
index e68b2517185b7dc081f219ed07d8875435471602..60bd84cfd6099303181ef474422ac8c00d87cf86 100644
--- a/quantized/openai/whisper-small.en/default/config.json
+++ b/quantized/openai/whisper-small.en/default/config.json
@@ -129,7 +129,6 @@
50360,
50361
],
- "torch_dtype": "float32",
"transformers_version": "4.26.1",
"use_cache": true,
"vocab_size": 51864
diff --git a/quantized/openai/whisper-small.en/default/decoder_model.onnx b/quantized/openai/whisper-small.en/default/decoder_model.onnx
index 5ebbbc897efa20832c55ab71d610f8b48715e800..80aa4f9ff850fa2208e7370a50b6adeaf887d9d9 100644
--- a/quantized/openai/whisper-small.en/default/decoder_model.onnx
+++ b/quantized/openai/whisper-small.en/default/decoder_model.onnx
@@ -1,3 +1,3 @@
version https://git-lfs.github.com/spec/v1
-oid sha256:d304c16554a234d0c6c2d8553da683c49a9e872537714fa99f756e9bfa9e0230
-size 156507792
+oid sha256:8af023c75b14ede43fa2904e5d702d1ea36673709cb6a0f849d2fb7c498f67f7
+size 156503755
diff --git a/quantized/openai/whisper-small.en/default/encoder_model.onnx b/quantized/openai/whisper-small.en/default/encoder_model.onnx
index f28ecd76363f49096f8bed17946a8b1fa88b4706..0501417673dffa873a330b625ef1946914f17b1a 100644
--- a/quantized/openai/whisper-small.en/default/encoder_model.onnx
+++ b/quantized/openai/whisper-small.en/default/encoder_model.onnx
@@ -1,3 +1,3 @@
version https://git-lfs.github.com/spec/v1
-oid sha256:7a9ff0f76c5a450edccfc7fbe8f910047620a56101b284066e007832ad6d48d3
-size 92735924
+oid sha256:6792ba696e505bd3527efa62327024bc04db8bf9558d47e16a2fff7e3810440f
+size 92735928
diff --git a/quantized/openai/whisper-small.en/default/tokenizer_config.json b/quantized/openai/whisper-small.en/default/tokenizer_config.json
index ba1d7aa7a5333296cabbcf5b9e4c239aedf2d755..c17ccf7df98614e74fc7d5e7de73ec03dcafd93d 100644
--- a/quantized/openai/whisper-small.en/default/tokenizer_config.json
+++ b/quantized/openai/whisper-small.en/default/tokenizer_config.json
@@ -25,7 +25,6 @@
"return_attention_mask": false,
"special_tokens_map_file": null,
"tokenizer_class": "WhisperTokenizer",
- "trust_remote_code": false,
"unk_token": {
"__type": "AddedToken",
"content": "<|endoftext|>",
diff --git a/quantized/openai/whisper-small.en/speech2seq-lm-with-past/config.json b/quantized/openai/whisper-small.en/speech2seq-lm-with-past/config.json
index e68b2517185b7dc081f219ed07d8875435471602..60bd84cfd6099303181ef474422ac8c00d87cf86 100644
--- a/quantized/openai/whisper-small.en/speech2seq-lm-with-past/config.json
+++ b/quantized/openai/whisper-small.en/speech2seq-lm-with-past/config.json
@@ -129,7 +129,6 @@
50360,
50361
],
- "torch_dtype": "float32",
"transformers_version": "4.26.1",
"use_cache": true,
"vocab_size": 51864
diff --git a/quantized/openai/whisper-small.en/speech2seq-lm-with-past/decoder_model.onnx b/quantized/openai/whisper-small.en/speech2seq-lm-with-past/decoder_model.onnx
index 53a5f950f40b94e1c32814a88e7541b920283b38..380efc20556342d2f1f094bc860a72c75fe632e6 100644
--- a/quantized/openai/whisper-small.en/speech2seq-lm-with-past/decoder_model.onnx
+++ b/quantized/openai/whisper-small.en/speech2seq-lm-with-past/decoder_model.onnx
@@ -1,3 +1,3 @@
version https://git-lfs.github.com/spec/v1
-oid sha256:188af562e38a5e1d513ce1526dd22688947d3b5d06227ace70ccc7f0a6657846
-size 196680348
+oid sha256:0105edbe0037f4c7ac11f020f53f581b6ed10c9f680124d2448f255ec52c28c3
+size 196676336
diff --git a/quantized/openai/whisper-small.en/speech2seq-lm-with-past/decoder_model_merged.onnx b/quantized/openai/whisper-small.en/speech2seq-lm-with-past/decoder_model_merged.onnx
new file mode 100644
index 0000000000000000000000000000000000000000..8df35187ae8047d99c3e21b0ed1868619b6925f4
--- /dev/null
+++ b/quantized/openai/whisper-small.en/speech2seq-lm-with-past/decoder_model_merged.onnx
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8defd52aed2a7843e174afb4a42c44ae4dfb8e85c200e9955fb88a68ef8df0f7
+size 197146590
diff --git a/quantized/openai/whisper-small.en/speech2seq-lm-with-past/decoder_with_past_model.onnx b/quantized/openai/whisper-small.en/speech2seq-lm-with-past/decoder_with_past_model.onnx
index 7b4a58b58193e4357d596beef3ce29b74e443c07..f74b2828c125bd3e12b33efede29e8801d1ba80a 100644
--- a/quantized/openai/whisper-small.en/speech2seq-lm-with-past/decoder_with_past_model.onnx
+++ b/quantized/openai/whisper-small.en/speech2seq-lm-with-past/decoder_with_past_model.onnx
@@ -1,3 +1,3 @@
version https://git-lfs.github.com/spec/v1
-oid sha256:90ee0249df2d0a3f98da7025f71d2ed6a914cb543a76d1300194f2cfbdddebb9
-size 182268135
+oid sha256:a6ced91a295a5a5d10abebd872a1da952b441e12240cf2f1f680b24ae9e53029
+size 182267587
diff --git a/quantized/openai/whisper-small.en/speech2seq-lm-with-past/encoder_model.onnx b/quantized/openai/whisper-small.en/speech2seq-lm-with-past/encoder_model.onnx
index f28ecd76363f49096f8bed17946a8b1fa88b4706..0501417673dffa873a330b625ef1946914f17b1a 100644
--- a/quantized/openai/whisper-small.en/speech2seq-lm-with-past/encoder_model.onnx
+++ b/quantized/openai/whisper-small.en/speech2seq-lm-with-past/encoder_model.onnx
@@ -1,3 +1,3 @@
version https://git-lfs.github.com/spec/v1
-oid sha256:7a9ff0f76c5a450edccfc7fbe8f910047620a56101b284066e007832ad6d48d3
-size 92735924
+oid sha256:6792ba696e505bd3527efa62327024bc04db8bf9558d47e16a2fff7e3810440f
+size 92735928
diff --git a/quantized/openai/whisper-small.en/speech2seq-lm-with-past/tokenizer_config.json b/quantized/openai/whisper-small.en/speech2seq-lm-with-past/tokenizer_config.json
index ba1d7aa7a5333296cabbcf5b9e4c239aedf2d755..c17ccf7df98614e74fc7d5e7de73ec03dcafd93d 100644
--- a/quantized/openai/whisper-small.en/speech2seq-lm-with-past/tokenizer_config.json
+++ b/quantized/openai/whisper-small.en/speech2seq-lm-with-past/tokenizer_config.json
@@ -25,7 +25,6 @@
"return_attention_mask": false,
"special_tokens_map_file": null,
"tokenizer_class": "WhisperTokenizer",
- "trust_remote_code": false,
"unk_token": {
"__type": "AddedToken",
"content": "<|endoftext|>",
diff --git a/quantized/openai/whisper-small/default/config.json b/quantized/openai/whisper-small/default/config.json
index 4c6b92ef5673e25cb9124507e4a9564439d8e91f..bcf1ef1259e67bdb592577b16054176e05bc8a80 100644
--- a/quantized/openai/whisper-small/default/config.json
+++ b/quantized/openai/whisper-small/default/config.json
@@ -135,7 +135,6 @@
50361,
50362
],
- "torch_dtype": "float32",
"transformers_version": "4.26.1",
"use_cache": true,
"vocab_size": 51865
diff --git a/quantized/openai/whisper-small/default/decoder_model.onnx b/quantized/openai/whisper-small/default/decoder_model.onnx
index ec49323cd4251fa9ffc1ac83421349e2a6bd62fd..8c9196bb18fba5abb24186bc68198cfddbeb143e 100644
--- a/quantized/openai/whisper-small/default/decoder_model.onnx
+++ b/quantized/openai/whisper-small/default/decoder_model.onnx
@@ -1,3 +1,3 @@
version https://git-lfs.github.com/spec/v1
-oid sha256:c242c30a33e05e44eb2e585485d09123282310b842d27e043bea7840181d372c
-size 156508560
+oid sha256:77af26339700b3afdcb37d3e9158c4c713875719c30e19eaabd919f7010a554f
+size 156504523
diff --git a/quantized/openai/whisper-small/default/encoder_model.onnx b/quantized/openai/whisper-small/default/encoder_model.onnx
index 18200eae15b55c90c821fd9ac637f1616bbf0999..77a89d497bfbe099d93c0f95050ec99c8a9140e4 100644
--- a/quantized/openai/whisper-small/default/encoder_model.onnx
+++ b/quantized/openai/whisper-small/default/encoder_model.onnx
@@ -1,3 +1,3 @@
version https://git-lfs.github.com/spec/v1
-oid sha256:4631051cfe2817def148e9ce2c4c3aea1ad8a7a55a11b3af3f4c0dc228316508
-size 92735924
+oid sha256:7279228b00bb1cecdc08eb098205aaa131a478cba1abeb39800c9aa84e85d5e2
+size 92735928
diff --git a/quantized/openai/whisper-small/default/tokenizer_config.json b/quantized/openai/whisper-small/default/tokenizer_config.json
index 626e5cb97dd333a874548213550e6612e9fa103d..fe49919b600daf0a9e08f15e11233858a6901aa0 100644
--- a/quantized/openai/whisper-small/default/tokenizer_config.json
+++ b/quantized/openai/whisper-small/default/tokenizer_config.json
@@ -25,7 +25,6 @@
"return_attention_mask": false,
"special_tokens_map_file": null,
"tokenizer_class": "WhisperTokenizer",
- "trust_remote_code": false,
"unk_token": {
"__type": "AddedToken",
"content": "<|endoftext|>",
diff --git a/quantized/openai/whisper-small/speech2seq-lm-with-past/config.json b/quantized/openai/whisper-small/speech2seq-lm-with-past/config.json
index 4c6b92ef5673e25cb9124507e4a9564439d8e91f..bcf1ef1259e67bdb592577b16054176e05bc8a80 100644
--- a/quantized/openai/whisper-small/speech2seq-lm-with-past/config.json
+++ b/quantized/openai/whisper-small/speech2seq-lm-with-past/config.json
@@ -135,7 +135,6 @@
50361,
50362
],
- "torch_dtype": "float32",
"transformers_version": "4.26.1",
"use_cache": true,
"vocab_size": 51865
diff --git a/quantized/openai/whisper-small/speech2seq-lm-with-past/decoder_model.onnx b/quantized/openai/whisper-small/speech2seq-lm-with-past/decoder_model.onnx
index c786356a314b44ddef6a42768e18f6fc4e8f4928..8f89732b49a9a000431a9758f3982958a1075c8b 100644
--- a/quantized/openai/whisper-small/speech2seq-lm-with-past/decoder_model.onnx
+++ b/quantized/openai/whisper-small/speech2seq-lm-with-past/decoder_model.onnx
@@ -1,3 +1,3 @@
version https://git-lfs.github.com/spec/v1
-oid sha256:cee4e81283dd20a2dbb9b52ac6d6f8f5b159099c0f8cde13e10c4643f89f70a1
-size 196681889
+oid sha256:45cd0b5cfbf905e96bad3cc58b4914879dea5c86ef96bc43e47cafa87c8a86a7
+size 196677877
diff --git a/quantized/openai/whisper-small/speech2seq-lm-with-past/decoder_model_merged.onnx b/quantized/openai/whisper-small/speech2seq-lm-with-past/decoder_model_merged.onnx
new file mode 100644
index 0000000000000000000000000000000000000000..886b1acd1dad969a1321442190a075dab233ea3f
--- /dev/null
+++ b/quantized/openai/whisper-small/speech2seq-lm-with-past/decoder_model_merged.onnx
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:92481f314d2811fd44dcb712c2ff4cdca3178c47e8736ef3b23057fa8c69efa3
+size 197148131
diff --git a/quantized/openai/whisper-small/speech2seq-lm-with-past/decoder_with_past_model.onnx b/quantized/openai/whisper-small/speech2seq-lm-with-past/decoder_with_past_model.onnx
index 5819972f00b61080fe5e79b3e07092721effc599..865b1be5b92ef7bb9cc9b142b6b88e1ed3976f96 100644
--- a/quantized/openai/whisper-small/speech2seq-lm-with-past/decoder_with_past_model.onnx
+++ b/quantized/openai/whisper-small/speech2seq-lm-with-past/decoder_with_past_model.onnx
@@ -1,3 +1,3 @@
version https://git-lfs.github.com/spec/v1
-oid sha256:8df081154685d649af4859802d0b85c4011c96421aaaf115c3053b508b0ff4c3
-size 182269676
+oid sha256:e16020674fc4b2352a89c1ab2916c752fadf20535192c191cacdee9bd2f411a0
+size 182269128
diff --git a/quantized/openai/whisper-small/speech2seq-lm-with-past/encoder_model.onnx b/quantized/openai/whisper-small/speech2seq-lm-with-past/encoder_model.onnx
index 18200eae15b55c90c821fd9ac637f1616bbf0999..77a89d497bfbe099d93c0f95050ec99c8a9140e4 100644
--- a/quantized/openai/whisper-small/speech2seq-lm-with-past/encoder_model.onnx
+++ b/quantized/openai/whisper-small/speech2seq-lm-with-past/encoder_model.onnx
@@ -1,3 +1,3 @@
version https://git-lfs.github.com/spec/v1
-oid sha256:4631051cfe2817def148e9ce2c4c3aea1ad8a7a55a11b3af3f4c0dc228316508
-size 92735924
+oid sha256:7279228b00bb1cecdc08eb098205aaa131a478cba1abeb39800c9aa84e85d5e2
+size 92735928
diff --git a/quantized/openai/whisper-small/speech2seq-lm-with-past/tokenizer_config.json b/quantized/openai/whisper-small/speech2seq-lm-with-past/tokenizer_config.json
index 626e5cb97dd333a874548213550e6612e9fa103d..fe49919b600daf0a9e08f15e11233858a6901aa0 100644
--- a/quantized/openai/whisper-small/speech2seq-lm-with-past/tokenizer_config.json
+++ b/quantized/openai/whisper-small/speech2seq-lm-with-past/tokenizer_config.json
@@ -25,7 +25,6 @@
"return_attention_mask": false,
"special_tokens_map_file": null,
"tokenizer_class": "WhisperTokenizer",
- "trust_remote_code": false,
"unk_token": {
"__type": "AddedToken",
"content": "<|endoftext|>",
diff --git a/quantized/openai/whisper-tiny.en/default/config.json b/quantized/openai/whisper-tiny.en/default/config.json
index f761dfdb5010cc744479627ce0bf3cfa700f25e6..19ba30a5b107177cc97f65465c61c5e24f47a382 100644
--- a/quantized/openai/whisper-tiny.en/default/config.json
+++ b/quantized/openai/whisper-tiny.en/default/config.json
@@ -129,7 +129,6 @@
50360,
50361
],
- "torch_dtype": "float32",
"transformers_version": "4.26.1",
"use_cache": true,
"vocab_size": 51864
diff --git a/quantized/openai/whisper-tiny.en/default/decoder_model.onnx b/quantized/openai/whisper-tiny.en/default/decoder_model.onnx
index 96fa9834bbe114502334d0c781facb2c4b0477a4..155a34bf758c598c7a5c6ebecb2c16fc008cb348 100644
--- a/quantized/openai/whisper-tiny.en/default/decoder_model.onnx
+++ b/quantized/openai/whisper-tiny.en/default/decoder_model.onnx
@@ -1,3 +1,3 @@
version https://git-lfs.github.com/spec/v1
-oid sha256:064cc5dbfeba053bf2b24d1fe9db13374b6196e6e03b3c700a28032febd0a2e4
-size 30530667
+oid sha256:ead164b287283fa00157b909f5cb5d4b294c7d27aa37a9724aa39f0a647a9907
+size 30529344
diff --git a/quantized/openai/whisper-tiny.en/default/encoder_model.onnx b/quantized/openai/whisper-tiny.en/default/encoder_model.onnx
index 195d2ca112bb68559d820323242654ddb41f6b3e..3745f6f0a4cc708db169b1930f030c4b36bd8f23 100644
--- a/quantized/openai/whisper-tiny.en/default/encoder_model.onnx
+++ b/quantized/openai/whisper-tiny.en/default/encoder_model.onnx
@@ -1,3 +1,3 @@
version https://git-lfs.github.com/spec/v1
-oid sha256:c1d3f992f96cc792f194169a8f7b451b315bfcc6b71ba2082c698f1d374de026
-size 10192815
+oid sha256:29ee3cc641cf1e3cd448644bd474a974d7bb7b2a26aa3ad3d56aa458215e9cf7
+size 10192819
diff --git a/quantized/openai/whisper-tiny.en/default/tokenizer_config.json b/quantized/openai/whisper-tiny.en/default/tokenizer_config.json
index c430ca30d3214990bfea9dc44653d7e585b0be4f..384d88d69be58b06f01c0fc5a4854e064bbd6159 100644
--- a/quantized/openai/whisper-tiny.en/default/tokenizer_config.json
+++ b/quantized/openai/whisper-tiny.en/default/tokenizer_config.json
@@ -25,7 +25,6 @@
"return_attention_mask": false,
"special_tokens_map_file": null,
"tokenizer_class": "WhisperTokenizer",
- "trust_remote_code": false,
"unk_token": {
"__type": "AddedToken",
"content": "<|endoftext|>",
diff --git a/quantized/openai/whisper-tiny.en/speech2seq-lm-with-past/config.json b/quantized/openai/whisper-tiny.en/speech2seq-lm-with-past/config.json
index f761dfdb5010cc744479627ce0bf3cfa700f25e6..19ba30a5b107177cc97f65465c61c5e24f47a382 100644
--- a/quantized/openai/whisper-tiny.en/speech2seq-lm-with-past/config.json
+++ b/quantized/openai/whisper-tiny.en/speech2seq-lm-with-past/config.json
@@ -129,7 +129,6 @@
50360,
50361
],
- "torch_dtype": "float32",
"transformers_version": "4.26.1",
"use_cache": true,
"vocab_size": 51864
diff --git a/quantized/openai/whisper-tiny.en/speech2seq-lm-with-past/decoder_model.onnx b/quantized/openai/whisper-tiny.en/speech2seq-lm-with-past/decoder_model.onnx
index 41ca089e06eb354acb9750e30bea8a14dd6e7609..9a56e8ee29405398374b083c72c74cb15a669900 100644
--- a/quantized/openai/whisper-tiny.en/speech2seq-lm-with-past/decoder_model.onnx
+++ b/quantized/openai/whisper-tiny.en/speech2seq-lm-with-past/decoder_model.onnx
@@ -1,3 +1,3 @@
version https://git-lfs.github.com/spec/v1
-oid sha256:0a424ab24bfa1e2700982139341dcf183f4b415b78327ab08b97b1e76819f210
-size 50735081
+oid sha256:417751a3fa339b5eb7ccd239a3ed832a6e3e8edbeec3a7d049e132ac3478bbb5
+size 50733783
diff --git a/quantized/openai/whisper-tiny.en/speech2seq-lm-with-past/decoder_model_merged.onnx b/quantized/openai/whisper-tiny.en/speech2seq-lm-with-past/decoder_model_merged.onnx
new file mode 100644
index 0000000000000000000000000000000000000000..611f84ded9f858d97005ff4e3440dbde7ed9333b
--- /dev/null
+++ b/quantized/openai/whisper-tiny.en/speech2seq-lm-with-past/decoder_model_merged.onnx
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b82d9231f4fb81470f8cc2878b6dd67bcf2f737b251924da4eba45d79777bc14
+size 50891940
diff --git a/quantized/openai/whisper-tiny.en/speech2seq-lm-with-past/decoder_with_past_model.onnx b/quantized/openai/whisper-tiny.en/speech2seq-lm-with-past/decoder_with_past_model.onnx
index a705112868f298a6976a0aa2d01423977eba6f51..aea60d46a2a34accba426e27469f1e02be646d64 100644
--- a/quantized/openai/whisper-tiny.en/speech2seq-lm-with-past/decoder_with_past_model.onnx
+++ b/quantized/openai/whisper-tiny.en/speech2seq-lm-with-past/decoder_with_past_model.onnx
@@ -1,3 +1,3 @@
version https://git-lfs.github.com/spec/v1
-oid sha256:5c1ea24304591aba1cb75e603f6c1c21bf4494d3d0395a9fc55017a8091ebe9f
-size 49485902
+oid sha256:aaa60b7625c15a1c26d1f21e2898b101367f5c746692a44b3bd68bcc5d4fcc15
+size 49485740
diff --git a/quantized/openai/whisper-tiny.en/speech2seq-lm-with-past/encoder_model.onnx b/quantized/openai/whisper-tiny.en/speech2seq-lm-with-past/encoder_model.onnx
index 195d2ca112bb68559d820323242654ddb41f6b3e..3745f6f0a4cc708db169b1930f030c4b36bd8f23 100644
--- a/quantized/openai/whisper-tiny.en/speech2seq-lm-with-past/encoder_model.onnx
+++ b/quantized/openai/whisper-tiny.en/speech2seq-lm-with-past/encoder_model.onnx
@@ -1,3 +1,3 @@
version https://git-lfs.github.com/spec/v1
-oid sha256:c1d3f992f96cc792f194169a8f7b451b315bfcc6b71ba2082c698f1d374de026
-size 10192815
+oid sha256:29ee3cc641cf1e3cd448644bd474a974d7bb7b2a26aa3ad3d56aa458215e9cf7
+size 10192819
diff --git a/quantized/openai/whisper-tiny.en/speech2seq-lm-with-past/tokenizer_config.json b/quantized/openai/whisper-tiny.en/speech2seq-lm-with-past/tokenizer_config.json
index c430ca30d3214990bfea9dc44653d7e585b0be4f..384d88d69be58b06f01c0fc5a4854e064bbd6159 100644
--- a/quantized/openai/whisper-tiny.en/speech2seq-lm-with-past/tokenizer_config.json
+++ b/quantized/openai/whisper-tiny.en/speech2seq-lm-with-past/tokenizer_config.json
@@ -25,7 +25,6 @@
"return_attention_mask": false,
"special_tokens_map_file": null,
"tokenizer_class": "WhisperTokenizer",
- "trust_remote_code": false,
"unk_token": {
"__type": "AddedToken",
"content": "<|endoftext|>",
diff --git a/quantized/openai/whisper-tiny/default/config.json b/quantized/openai/whisper-tiny/default/config.json
index cb403313fd753adb0790226d1d7a7b1258c2c7ae..52163147f09e4f7b74a294d9eb3de22adbf2bef3 100644
--- a/quantized/openai/whisper-tiny/default/config.json
+++ b/quantized/openai/whisper-tiny/default/config.json
@@ -135,7 +135,6 @@
50361,
50362
],
- "torch_dtype": "float32",
"transformers_version": "4.26.1",
"use_cache": true,
"vocab_size": 51865
diff --git a/quantized/openai/whisper-tiny/default/decoder_model.onnx b/quantized/openai/whisper-tiny/default/decoder_model.onnx
index e14a8261705d453beba162d8578cce908505123e..d03365cadd7fb844a8b1616c49a20c235fa2ce6d 100644
--- a/quantized/openai/whisper-tiny/default/decoder_model.onnx
+++ b/quantized/openai/whisper-tiny/default/decoder_model.onnx
@@ -1,3 +1,3 @@
version https://git-lfs.github.com/spec/v1
-oid sha256:fead8565b3de3f10b1542b041de2f30576402bf634fb2ceb2b8c2d56cdf21b91
-size 30531051
+oid sha256:933e0d390454f1814d5e8b332a8b538dee4cd5ce16a51b14ee3d38b81be5a005
+size 30529728
diff --git a/quantized/openai/whisper-tiny/default/encoder_model.onnx b/quantized/openai/whisper-tiny/default/encoder_model.onnx
index 9136ed87ab1dac4f3cf0a238e313ba5b4986c850..cd7b6ba5863a21cf9ec66c45d2289373bcde48a7 100644
--- a/quantized/openai/whisper-tiny/default/encoder_model.onnx
+++ b/quantized/openai/whisper-tiny/default/encoder_model.onnx
@@ -1,3 +1,3 @@
version https://git-lfs.github.com/spec/v1
-oid sha256:92e97f2cbd41ab1117039ddf725888ad8a028834b9cbd7e5be74d7fac0515d44
-size 10192815
+oid sha256:140f7c48489beda5c140c125d0609266e37185e69cbb83eeb8315585bb438bf0
+size 10192819
diff --git a/quantized/openai/whisper-tiny/default/tokenizer_config.json b/quantized/openai/whisper-tiny/default/tokenizer_config.json
index c18ca77e9c4c964c76c454efa85a08c35a9c9a4a..224faf0c5158669dee7202e9c4f75e977f9c6651 100644
--- a/quantized/openai/whisper-tiny/default/tokenizer_config.json
+++ b/quantized/openai/whisper-tiny/default/tokenizer_config.json
@@ -25,7 +25,6 @@
"return_attention_mask": false,
"special_tokens_map_file": null,
"tokenizer_class": "WhisperTokenizer",
- "trust_remote_code": false,
"unk_token": {
"__type": "AddedToken",
"content": "<|endoftext|>",
diff --git a/quantized/openai/whisper-tiny/speech2seq-lm-with-past/config.json b/quantized/openai/whisper-tiny/speech2seq-lm-with-past/config.json
index cb403313fd753adb0790226d1d7a7b1258c2c7ae..52163147f09e4f7b74a294d9eb3de22adbf2bef3 100644
--- a/quantized/openai/whisper-tiny/speech2seq-lm-with-past/config.json
+++ b/quantized/openai/whisper-tiny/speech2seq-lm-with-past/config.json
@@ -135,7 +135,6 @@
50361,
50362
],
- "torch_dtype": "float32",
"transformers_version": "4.26.1",
"use_cache": true,
"vocab_size": 51865
diff --git a/quantized/openai/whisper-tiny/speech2seq-lm-with-past/decoder_model.onnx b/quantized/openai/whisper-tiny/speech2seq-lm-with-past/decoder_model.onnx
index 6cef0a605aeb641c5ac081f30e06fe453bf3e805..2291ad7d8cfeeaaf092ed67226e4fd6117945ff6 100644
--- a/quantized/openai/whisper-tiny/speech2seq-lm-with-past/decoder_model.onnx
+++ b/quantized/openai/whisper-tiny/speech2seq-lm-with-past/decoder_model.onnx
@@ -1,3 +1,3 @@
version https://git-lfs.github.com/spec/v1
-oid sha256:5cc79a5e89b4dd4b672980e7d823051776e473395bb1d6d891488f3cf2c7d0fe
-size 50735854
+oid sha256:b778a7996bffa4487385138d00e56298776bcf894930d358ff2d800cd2954361
+size 50734556
diff --git a/quantized/openai/whisper-tiny/speech2seq-lm-with-past/decoder_model_merged.onnx b/quantized/openai/whisper-tiny/speech2seq-lm-with-past/decoder_model_merged.onnx
new file mode 100644
index 0000000000000000000000000000000000000000..a08f2312a2781aa1f2169e4d1cf3784fc7126489
--- /dev/null
+++ b/quantized/openai/whisper-tiny/speech2seq-lm-with-past/decoder_model_merged.onnx
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ef4212fc1105df3730ac5e0e1dc5f6173d0d598e0422fd98f5e44358a4d88965
+size 50892695
diff --git a/quantized/openai/whisper-tiny/speech2seq-lm-with-past/decoder_with_past_model.onnx b/quantized/openai/whisper-tiny/speech2seq-lm-with-past/decoder_with_past_model.onnx
index 288b797a430f74261df5f759b64096bcb0c444a7..95ceb3568a08058c6739839fd721ab4d7eada92f 100644
--- a/quantized/openai/whisper-tiny/speech2seq-lm-with-past/decoder_with_past_model.onnx
+++ b/quantized/openai/whisper-tiny/speech2seq-lm-with-past/decoder_with_past_model.onnx
@@ -1,3 +1,3 @@
version https://git-lfs.github.com/spec/v1
-oid sha256:c78a41943419456e0ca4bab35a487dd8a91c014844f353f6a0274000c92ce27f
-size 49486675
+oid sha256:231c945514b7e8eddb9033f9149085175410837653e1b2bedd5cb61d6d6a9e9e
+size 49486513
diff --git a/quantized/openai/whisper-tiny/speech2seq-lm-with-past/encoder_model.onnx b/quantized/openai/whisper-tiny/speech2seq-lm-with-past/encoder_model.onnx
index 9136ed87ab1dac4f3cf0a238e313ba5b4986c850..cd7b6ba5863a21cf9ec66c45d2289373bcde48a7 100644
--- a/quantized/openai/whisper-tiny/speech2seq-lm-with-past/encoder_model.onnx
+++ b/quantized/openai/whisper-tiny/speech2seq-lm-with-past/encoder_model.onnx
@@ -1,3 +1,3 @@
version https://git-lfs.github.com/spec/v1
-oid sha256:92e97f2cbd41ab1117039ddf725888ad8a028834b9cbd7e5be74d7fac0515d44
-size 10192815
+oid sha256:140f7c48489beda5c140c125d0609266e37185e69cbb83eeb8315585bb438bf0
+size 10192819
diff --git a/quantized/openai/whisper-tiny/speech2seq-lm-with-past/tokenizer_config.json b/quantized/openai/whisper-tiny/speech2seq-lm-with-past/tokenizer_config.json
index c18ca77e9c4c964c76c454efa85a08c35a9c9a4a..224faf0c5158669dee7202e9c4f75e977f9c6651 100644
--- a/quantized/openai/whisper-tiny/speech2seq-lm-with-past/tokenizer_config.json
+++ b/quantized/openai/whisper-tiny/speech2seq-lm-with-past/tokenizer_config.json
@@ -25,7 +25,6 @@
"return_attention_mask": false,
"special_tokens_map_file": null,
"tokenizer_class": "WhisperTokenizer",
- "trust_remote_code": false,
"unk_token": {
"__type": "AddedToken",
"content": "<|endoftext|>",
diff --git a/quantized/sshleifer/distilbart-cnn-6-6/seq2seq-lm-with-past/config.json b/quantized/sshleifer/distilbart-cnn-6-6/seq2seq-lm-with-past/config.json
index 40c7820c59c930680f4af140ed61a931dea50269..ff3666ead9d3e2c88f2692b125239b34d8513994 100644
--- a/quantized/sshleifer/distilbart-cnn-6-6/seq2seq-lm-with-past/config.json
+++ b/quantized/sshleifer/distilbart-cnn-6-6/seq2seq-lm-with-past/config.json
@@ -1,5 +1,5 @@
{
- "_name_or_path": "./models/pytorch/distilbart-cnn-6-6",
+ "_name_or_path": "sshleifer/distilbart-cnn-6-6",
"_num_labels": 3,
"activation_dropout": 0.0,
"activation_function": "gelu",
@@ -70,7 +70,6 @@
"num_beams": 4
}
},
- "torch_dtype": "float32",
"transformers_version": "4.26.1",
"use_cache": true,
"vocab_size": 50264
diff --git a/quantized/sshleifer/distilbart-cnn-6-6/seq2seq-lm-with-past/decoder_model.onnx b/quantized/sshleifer/distilbart-cnn-6-6/seq2seq-lm-with-past/decoder_model.onnx
index eac3e24b5a8286b999de98cfdf2298cf1da343f0..69ee3bad2128e4040361a073508188773e76572c 100644
--- a/quantized/sshleifer/distilbart-cnn-6-6/seq2seq-lm-with-past/decoder_model.onnx
+++ b/quantized/sshleifer/distilbart-cnn-6-6/seq2seq-lm-with-past/decoder_model.onnx
@@ -1,3 +1,3 @@
version https://git-lfs.github.com/spec/v1
-oid sha256:5febe5b43ce4c9c2bc35a5cb18dfa5e48a46d0fc8fc18d2af1795d61c50fd680
-size 206479989
+oid sha256:bf78c246385eb43eedd09db3727275eb2ea890c8f80df7600c22871f9fa63d49
+size 206522287
diff --git a/quantized/sshleifer/distilbart-cnn-6-6/seq2seq-lm-with-past/decoder_model_merged.onnx b/quantized/sshleifer/distilbart-cnn-6-6/seq2seq-lm-with-past/decoder_model_merged.onnx
new file mode 100644
index 0000000000000000000000000000000000000000..dc9dac6c1b24a5a308e15c9832c47fcf0b6cf2cc
--- /dev/null
+++ b/quantized/sshleifer/distilbart-cnn-6-6/seq2seq-lm-with-past/decoder_model_merged.onnx
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9a16e203dd8f5e7f5be4c2452110669d94c9f1bcdaff7185b6e3e006d3debf01
+size 206659464
diff --git a/quantized/sshleifer/distilbart-cnn-6-6/seq2seq-lm-with-past/decoder_with_past_model.onnx b/quantized/sshleifer/distilbart-cnn-6-6/seq2seq-lm-with-past/decoder_with_past_model.onnx
index b271c8b80fbdc7fdfc59211bdabed86575b8ccb3..23b429657cbb2beff2006e71e6494cd09cd9b7e5 100644
--- a/quantized/sshleifer/distilbart-cnn-6-6/seq2seq-lm-with-past/decoder_with_past_model.onnx
+++ b/quantized/sshleifer/distilbart-cnn-6-6/seq2seq-lm-with-past/decoder_with_past_model.onnx
@@ -1,3 +1,3 @@
version https://git-lfs.github.com/spec/v1
-oid sha256:42f643dea3105c689323791fd61b6e9f6e284c89c0527881ca8828acd886008d
-size 193716879
+oid sha256:687fcc78d2b81908b5dc60089557bd461c492e2e2ffffc982d86a0f90c4545ae
+size 193754572
diff --git a/quantized/sshleifer/distilbart-cnn-6-6/seq2seq-lm-with-past/encoder_model.onnx b/quantized/sshleifer/distilbart-cnn-6-6/seq2seq-lm-with-past/encoder_model.onnx
index fea4eb0de14ccc36670d7425eb64b519b496130b..fba3891be63a8e2e1c93593eb7fcfbd1fccfb9a3 100644
--- a/quantized/sshleifer/distilbart-cnn-6-6/seq2seq-lm-with-past/encoder_model.onnx
+++ b/quantized/sshleifer/distilbart-cnn-6-6/seq2seq-lm-with-past/encoder_model.onnx
@@ -1,3 +1,3 @@
version https://git-lfs.github.com/spec/v1
-oid sha256:e1768009f547363ff104fcf143c164b0d157379ece68f771238a1ea45026b004
-size 128835266
+oid sha256:8820a208f45059db2cbcd5b7b59ff3829e946789420058244cc8f429ef707fab
+size 128853768
diff --git a/quantized/sshleifer/distilbart-cnn-6-6/seq2seq-lm-with-past/tokenizer.json b/quantized/sshleifer/distilbart-cnn-6-6/seq2seq-lm-with-past/tokenizer.json
index ae7b71057f722dae9b8574855f92736ad85b509d..b68ec657118ada773a08938cd59ee4f41c1cc629 100644
--- a/quantized/sshleifer/distilbart-cnn-6-6/seq2seq-lm-with-past/tokenizer.json
+++ b/quantized/sshleifer/distilbart-cnn-6-6/seq2seq-lm-with-past/tokenizer.json
@@ -5,56 +5,55 @@
"added_tokens": [
{
"id": 0,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": true,
- "special": true
+ "normalized": true
},
{
"id": 1,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": true,
- "special": true
+ "normalized": true
},
{
"id": 2,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": true,
- "special": true
+ "normalized": true
},
{
"id": 3,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": true,
- "special": true
+ "normalized": true
},
{
"id": 50264,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": true,
"rstrip": false,
- "normalized": true,
- "special": true
+ "normalized": true
}
],
"normalizer": null,
"pre_tokenizer": {
"type": "ByteLevel",
"add_prefix_space": false,
- "trim_offsets": true,
- "use_regex": true
+ "trim_offsets": true
},
"post_processor": {
"type": "RobertaProcessing",
@@ -72,8 +71,7 @@
"decoder": {
"type": "ByteLevel",
"add_prefix_space": true,
- "trim_offsets": true,
- "use_regex": true
+ "trim_offsets": true
},
"model": {
"type": "BPE",
diff --git a/quantized/sshleifer/distilbart-cnn-6-6/seq2seq-lm-with-past/tokenizer_config.json b/quantized/sshleifer/distilbart-cnn-6-6/seq2seq-lm-with-past/tokenizer_config.json
index 89133304c7ac83061810a274ab08ebaa45549079..9feb230c732bf9236c347ffcc9a8b9865f94806f 100644
--- a/quantized/sshleifer/distilbart-cnn-6-6/seq2seq-lm-with-past/tokenizer_config.json
+++ b/quantized/sshleifer/distilbart-cnn-6-6/seq2seq-lm-with-past/tokenizer_config.json
@@ -34,7 +34,7 @@
"single_word": false
},
"model_max_length": 1024,
- "name_or_path": "./models/pytorch/distilbart-cnn-6-6",
+ "name_or_path": "sshleifer/distilbart-cnn-6-6",
"pad_token": {
"__type": "AddedToken",
"content": "",
diff --git a/quantized/t5-base/seq2seq-lm-with-past/decoder_model.onnx b/quantized/t5-base/seq2seq-lm-with-past/decoder_model.onnx
index e9e6b72815697ec4c0509613442aaccde5f1a13f..7380df1e9259f5da83ab752d9c31cd6563b8ad43 100644
--- a/quantized/t5-base/seq2seq-lm-with-past/decoder_model.onnx
+++ b/quantized/t5-base/seq2seq-lm-with-past/decoder_model.onnx
@@ -1,3 +1,3 @@
version https://git-lfs.github.com/spec/v1
-oid sha256:9a780e63db36dc742c4877b443693b08da83a8c9ff37a50992ec8ceac6664511
-size 164125335
+oid sha256:47a0bcce9bde05f2efae9fc160597908351afa9f3435bb3d4fc6898b87fc9cac
+size 164212159
diff --git a/quantized/t5-base/seq2seq-lm-with-past/decoder_model_merged.onnx b/quantized/t5-base/seq2seq-lm-with-past/decoder_model_merged.onnx
new file mode 100644
index 0000000000000000000000000000000000000000..23db31ad793fca55d80ac4862060ad94b8473ea2
--- /dev/null
+++ b/quantized/t5-base/seq2seq-lm-with-past/decoder_model_merged.onnx
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:5d890a977cba9946d83a05b612660935556e1b1acfbe44fee015d8c2798792f9
+size 164407136
diff --git a/quantized/t5-base/seq2seq-lm-with-past/decoder_with_past_model.onnx b/quantized/t5-base/seq2seq-lm-with-past/decoder_with_past_model.onnx
index cee06a9cb0860f47c54ea4e3696e76e3e445f1e1..055725b6d657cb87ac81e5479e19ec1f4b282573 100644
--- a/quantized/t5-base/seq2seq-lm-with-past/decoder_with_past_model.onnx
+++ b/quantized/t5-base/seq2seq-lm-with-past/decoder_with_past_model.onnx
@@ -1,3 +1,3 @@
version https://git-lfs.github.com/spec/v1
-oid sha256:2a380c12a7fff3b79bda6ac39f26cf99a76d4e4226c9432d5dd596e06e5623d9
-size 149817760
+oid sha256:2b00687d6bc057e09d7268793ef94febb1ce93326d61daebd0bc46cd83b29af9
+size 149895571
diff --git a/quantized/t5-base/seq2seq-lm-with-past/encoder_model.onnx b/quantized/t5-base/seq2seq-lm-with-past/encoder_model.onnx
index b8508b5e3222465c0265bf4f62f4f46c63f9f30e..f6b1cd476e40d0f26222d97d5d7496fe3aee6acb 100644
--- a/quantized/t5-base/seq2seq-lm-with-past/encoder_model.onnx
+++ b/quantized/t5-base/seq2seq-lm-with-past/encoder_model.onnx
@@ -1,3 +1,3 @@
version https://git-lfs.github.com/spec/v1
-oid sha256:41aa8184e052af3d834afdeba930ce837a8aeaea84af7f86ce288cd884230a4d
-size 110425846
+oid sha256:938176467fc4eab1ec72a80b8187321dbffdd53bd2f8fba3231677f31d8440e3
+size 110468491
diff --git a/quantized/t5-small/seq2seq-lm-with-past/config.json b/quantized/t5-small/seq2seq-lm-with-past/config.json
index 3eb424fb2cb83f8e9a6dee5241f51ef8b72bf462..ab8e4622c467cba75060c2c0b1c52f666759e225 100644
--- a/quantized/t5-small/seq2seq-lm-with-past/config.json
+++ b/quantized/t5-small/seq2seq-lm-with-past/config.json
@@ -1,5 +1,5 @@
{
- "_name_or_path": "./models/pytorch/t5-small",
+ "_name_or_path": "t5-small",
"architectures": [
"T5ForConditionalGeneration"
],
diff --git a/quantized/t5-small/seq2seq-lm-with-past/decoder_model.onnx b/quantized/t5-small/seq2seq-lm-with-past/decoder_model.onnx
index a0a1e45e81095305ca3bda43172f0e1f6f6ef699..ebd59b79bf7c05eb38dfe75fd853e2f12a6f39bf 100644
--- a/quantized/t5-small/seq2seq-lm-with-past/decoder_model.onnx
+++ b/quantized/t5-small/seq2seq-lm-with-past/decoder_model.onnx
@@ -1,3 +1,3 @@
version https://git-lfs.github.com/spec/v1
-oid sha256:eb2e336b767e84ec868601c4ebe04f5815bf60fa3a89b3cf98c43165ec49346b
-size 58629284
+oid sha256:81c50ce70014e2629ed5f247876f2a8a02e2ac2c71434c2f49056be050e47f88
+size 58653777
diff --git a/quantized/t5-small/seq2seq-lm-with-past/decoder_model_merged.onnx b/quantized/t5-small/seq2seq-lm-with-past/decoder_model_merged.onnx
new file mode 100644
index 0000000000000000000000000000000000000000..5e51812b5a918132fbb961b061880517b5739cdb
--- /dev/null
+++ b/quantized/t5-small/seq2seq-lm-with-past/decoder_model_merged.onnx
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e410c9d18f1213154873f1433380fe9b132766195c6705906c9b961552a8f84a
+size 58695469
diff --git a/quantized/t5-small/seq2seq-lm-with-past/decoder_with_past_model.onnx b/quantized/t5-small/seq2seq-lm-with-past/decoder_with_past_model.onnx
index 77d1a643dbf523ab8347de2cf461bcee64910270..b9a68b6a1b5fa69d3b4f99ef5442439308e560db 100644
--- a/quantized/t5-small/seq2seq-lm-with-past/decoder_with_past_model.onnx
+++ b/quantized/t5-small/seq2seq-lm-with-past/decoder_with_past_model.onnx
@@ -1,3 +1,3 @@
version https://git-lfs.github.com/spec/v1
-oid sha256:959f46528a00274ed729ddb946be93a0f452c5fa3f3811f9b3b0df17006e2a69
-size 55441515
+oid sha256:4051a88a8c68714e901e301de5f76fb4d0a16dee060cfff929082a1027a0f6bc
+size 55462874
diff --git a/quantized/t5-small/seq2seq-lm-with-past/encoder_model.onnx b/quantized/t5-small/seq2seq-lm-with-past/encoder_model.onnx
index 6c8a2a71d72d8b50cf990e4cad571fbf52dacb0e..8a19249affcf7ff49df183c6cea45037d0ff9cdb 100644
--- a/quantized/t5-small/seq2seq-lm-with-past/encoder_model.onnx
+++ b/quantized/t5-small/seq2seq-lm-with-past/encoder_model.onnx
@@ -1,3 +1,3 @@
version https://git-lfs.github.com/spec/v1
-oid sha256:baa256256227f0d5bcb9bac2660717a51ca61f9b1c40ad9a36934760edf3b43c
-size 35575579
+oid sha256:decc4bf2aa8d748ba92dcff463e401074238e0a6dcd5dd114abceecdd5245a53
+size 35587442
diff --git a/quantized/t5-small/seq2seq-lm-with-past/tokenizer.json b/quantized/t5-small/seq2seq-lm-with-past/tokenizer.json
index 698d7a6a181bc68bbeb97703edc841c911e39a0c..9e2f3266532d086ffe6332050eb8a7e055e7a9e7 100644
--- a/quantized/t5-small/seq2seq-lm-with-past/tokenizer.json
+++ b/quantized/t5-small/seq2seq-lm-with-past/tokenizer.json
@@ -5,930 +5,930 @@
"added_tokens": [
{
"id": 0,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 1,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 2,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32000,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32001,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32002,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32003,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32004,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32005,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32006,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32007,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32008,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32009,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32010,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32011,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32012,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32013,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32014,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32015,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32016,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32017,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32018,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32019,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32020,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32021,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32022,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32023,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32024,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32025,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32026,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32027,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32028,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32029,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32030,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32031,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32032,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32033,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32034,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32035,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32036,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32037,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32038,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32039,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32040,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32041,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32042,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32043,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32044,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32045,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32046,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32047,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32048,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32049,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32050,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32051,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32052,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32053,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32054,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32055,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32056,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32057,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32058,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32059,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32060,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32061,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32062,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32063,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32064,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32065,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32066,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32067,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32068,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32069,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32070,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32071,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32072,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32073,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32074,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32075,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32076,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32077,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32078,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32079,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32080,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32081,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32082,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32083,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32084,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32085,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32086,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32087,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32088,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32089,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32090,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32091,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32092,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32093,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32094,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32095,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32096,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32097,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32098,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
},
{
"id": 32099,
+ "special": true,
"content": "",
"single_word": false,
"lstrip": false,
"rstrip": false,
- "normalized": false,
- "special": true
+ "normalized": false
}
],
"normalizer": {
diff --git a/quantized/t5-small/seq2seq-lm-with-past/tokenizer_config.json b/quantized/t5-small/seq2seq-lm-with-past/tokenizer_config.json
index 396a6b3e8e612cae7d7e1c8e193528fbb04f34d6..fc9b1b5ec024637d0cdb9f88b3835db43028e5b9 100644
--- a/quantized/t5-small/seq2seq-lm-with-past/tokenizer_config.json
+++ b/quantized/t5-small/seq2seq-lm-with-past/tokenizer_config.json
@@ -103,8 +103,8 @@
],
"eos_token": "",
"extra_ids": 100,
- "model_max_length": 1000000000000000019884624838656,
- "name_or_path": "./models/pytorch/t5-small",
+ "model_max_length": 512,
+ "name_or_path": "t5-small",
"pad_token": "",
"special_tokens_map_file": null,
"tokenizer_class": "T5Tokenizer",