diff --git a/quantized/distilgpt2/causal-lm-with-past/decoder_model.onnx b/quantized/distilgpt2/causal-lm-with-past/decoder_model.onnx index cae8d7adb3a73bd7a263150ab524d366f4a525d5..3574246ead2c54e92a3cbf4d24c2b77addc699bd 100644 --- a/quantized/distilgpt2/causal-lm-with-past/decoder_model.onnx +++ b/quantized/distilgpt2/causal-lm-with-past/decoder_model.onnx @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ced5da743a77529eb62060115580596dbb21702b7bd3af9e3ed64c9207562c7a -size 249582838 +oid sha256:d447949536a14e0930c48b23fc34e2a6fdbdfa22c958dff787fe23d5e88b9ec8 +size 249587577 diff --git a/quantized/distilgpt2/causal-lm-with-past/decoder_model_merged.onnx b/quantized/distilgpt2/causal-lm-with-past/decoder_model_merged.onnx new file mode 100644 index 0000000000000000000000000000000000000000..1cbaaf18af019a333e72f5f2fdbeaa764a944649 --- /dev/null +++ b/quantized/distilgpt2/causal-lm-with-past/decoder_model_merged.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0df8008063684caea7f35b9a7051a8693ab548acfc29449b3c4e94331cc46b4f +size 249675200 diff --git a/quantized/distilgpt2/causal-lm-with-past/decoder_with_past_model.onnx b/quantized/distilgpt2/causal-lm-with-past/decoder_with_past_model.onnx index b1b73c9ebfc4a76242783700d76082beb6bc76e2..9b0cfd607898a633bc69265726661829a1b2e9c8 100644 --- a/quantized/distilgpt2/causal-lm-with-past/decoder_with_past_model.onnx +++ b/quantized/distilgpt2/causal-lm-with-past/decoder_with_past_model.onnx @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:8ce5f0c2fee02591c5657ac5c4f7d7d6ff01bdd836eab72339e9d2068cef443f -size 249586984 +oid sha256:66c0af50c63820a310c0bb0f7269a807e357d3d77bc18fda409464c6948cb627 +size 249592120 diff --git a/quantized/distilgpt2/causal-lm-with-past/tokenizer.json b/quantized/distilgpt2/causal-lm-with-past/tokenizer.json index 6dc5e94ca994de07d374e33698489de9cff48a02..22043ac6ec947359001e20840908973ea620781e 100644 --- a/quantized/distilgpt2/causal-lm-with-past/tokenizer.json +++ b/quantized/distilgpt2/causal-lm-with-past/tokenizer.json @@ -5,32 +5,29 @@ "added_tokens": [ { "id": 50256, + "special": true, "content": "<|endoftext|>", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false } ], "normalizer": null, "pre_tokenizer": { "type": "ByteLevel", "add_prefix_space": false, - "trim_offsets": true, - "use_regex": true + "trim_offsets": true }, "post_processor": { "type": "ByteLevel", "add_prefix_space": true, - "trim_offsets": false, - "use_regex": true + "trim_offsets": false }, "decoder": { "type": "ByteLevel", "add_prefix_space": true, - "trim_offsets": true, - "use_regex": true + "trim_offsets": true }, "model": { "type": "BPE", diff --git a/quantized/google/flan-t5-base/seq2seq-lm-with-past/decoder_model.onnx b/quantized/google/flan-t5-base/seq2seq-lm-with-past/decoder_model.onnx index a0ccd4da297f339be26c6823c32735e177a28f0e..6ff3f34fd1bb0344d3b724e1c50546039e38308e 100644 --- a/quantized/google/flan-t5-base/seq2seq-lm-with-past/decoder_model.onnx +++ b/quantized/google/flan-t5-base/seq2seq-lm-with-past/decoder_model.onnx @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:4d6821426c8d3dd75f7ed83426e50b6d58af2154590175a36a8c5ff05b65e911 -size 164245993 +oid sha256:3a5dedfa56dfa3a66c840af98ab0c0438ea97e2905947de9c1cdbc2a3c5139c4 +size 164336072 diff --git a/quantized/google/flan-t5-base/seq2seq-lm-with-past/decoder_model_merged.onnx b/quantized/google/flan-t5-base/seq2seq-lm-with-past/decoder_model_merged.onnx new file mode 100644 index 0000000000000000000000000000000000000000..e5f264454e379bb891c9b8f8b2bae9d49a0b411e --- /dev/null +++ b/quantized/google/flan-t5-base/seq2seq-lm-with-past/decoder_model_merged.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54318115238b89ab4fa6b1fd85cf4e55cd89f14f164ab4019ee98e68d0cca55e +size 164549246 diff --git a/quantized/google/flan-t5-base/seq2seq-lm-with-past/decoder_with_past_model.onnx b/quantized/google/flan-t5-base/seq2seq-lm-with-past/decoder_with_past_model.onnx index b4fd788b9cd9c92cf7733ff61557c7cf5dbbefb4..aab7b686f33a9ed165965d74354483860a62c540 100644 --- a/quantized/google/flan-t5-base/seq2seq-lm-with-past/decoder_with_past_model.onnx +++ b/quantized/google/flan-t5-base/seq2seq-lm-with-past/decoder_with_past_model.onnx @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9231c30c03c92a38ab63ad24ab9440897d19bf11bee0e7b70c0fff9aa540b466 -size 149938415 +oid sha256:422cfaa90b115c4ea60f43b94fd8fda445d9150b2e401ddd8db8408c9e3b6b99 +size 150019481 diff --git a/quantized/google/flan-t5-base/seq2seq-lm-with-past/encoder_model.onnx b/quantized/google/flan-t5-base/seq2seq-lm-with-past/encoder_model.onnx index 1cb31eb743f36f948cd9fabf1b591272ef7d6a46..4f72e3feb3008aa9d496e76630d17921bad3a0db 100644 --- a/quantized/google/flan-t5-base/seq2seq-lm-with-past/encoder_model.onnx +++ b/quantized/google/flan-t5-base/seq2seq-lm-with-past/encoder_model.onnx @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f8ee6a0e07f0b6f1b5aaca54e4d5ed320034fa3e433121706e2da7514072f718 -size 110539783 +oid sha256:2706491228c349685ee85c1d67a057bd173cca81ef1c5d229a47c3b49e81370c +size 110585314 diff --git a/quantized/google/flan-t5-small/seq2seq-lm-with-past/decoder_model.onnx b/quantized/google/flan-t5-small/seq2seq-lm-with-past/decoder_model.onnx index 6bd320a12e366add128f456eb487e871419548bb..5d680864d304b9ef61436fd9aa55ffcc79504c2c 100644 --- a/quantized/google/flan-t5-small/seq2seq-lm-with-past/decoder_model.onnx +++ b/quantized/google/flan-t5-small/seq2seq-lm-with-past/decoder_model.onnx @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d5b1ebae6276d191107b7eead3d142b970542d9262d952900df8107fa89bf619 -size 58998475 +oid sha256:288c543b7ed377cc89929c89ddc64d2ea32d35a40cc084b997aad3933643fd89 +size 59058672 diff --git a/quantized/google/flan-t5-small/seq2seq-lm-with-past/decoder_model_merged.onnx b/quantized/google/flan-t5-small/seq2seq-lm-with-past/decoder_model_merged.onnx new file mode 100644 index 0000000000000000000000000000000000000000..183fef4143c8f8016453488cc1769aeb4c990f5c --- /dev/null +++ b/quantized/google/flan-t5-small/seq2seq-lm-with-past/decoder_model_merged.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d623ab57fed27150b5517a955295a20effb4099ae7d51c44bf279e794243db6 +size 59247726 diff --git a/quantized/google/flan-t5-small/seq2seq-lm-with-past/decoder_with_past_model.onnx b/quantized/google/flan-t5-small/seq2seq-lm-with-past/decoder_with_past_model.onnx index aa2c305cf188eee7c83855db3d798189225542f7..74c2d79c85e97196748a7a81b99a38cb3c2219ad 100644 --- a/quantized/google/flan-t5-small/seq2seq-lm-with-past/decoder_with_past_model.onnx +++ b/quantized/google/flan-t5-small/seq2seq-lm-with-past/decoder_with_past_model.onnx @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0a64bcefa3b4fa4ab2a23854dd89a44bfbf2c76b4418d2e7665217631c57b6d6 -size 55785322 +oid sha256:12d22d076005b8d6d0e98bbf149b2561cf4911f3f4f1af33f16e806fb7fabe53 +size 55839462 diff --git a/quantized/google/flan-t5-small/seq2seq-lm-with-past/encoder_model.onnx b/quantized/google/flan-t5-small/seq2seq-lm-with-past/encoder_model.onnx index fdb7f3d8ab018c1bf06a81ba611b338e1620ea17..b75a60c3e312daca48dd7821ca32cc1effba948b 100644 --- a/quantized/google/flan-t5-small/seq2seq-lm-with-past/encoder_model.onnx +++ b/quantized/google/flan-t5-small/seq2seq-lm-with-past/encoder_model.onnx @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:776cd40d25b7026fb4f3301f4ca82a026f844db74f9e94e6b05672940bb39e27 -size 35784005 +oid sha256:e7c4d50cb1270f49639b46399f89a4a1f25cb3e95fbecaf236785b909048a736 +size 35814394 diff --git a/quantized/google/t5-v1_1-base/seq2seq-lm-with-past/decoder_model.onnx b/quantized/google/t5-v1_1-base/seq2seq-lm-with-past/decoder_model.onnx index 657170f1b0e2b2f0cf04dc871b34e6fa8ce967fb..cf43ac93c79a6d945f76d3b26db3ad2ea93e34aa 100644 --- a/quantized/google/t5-v1_1-base/seq2seq-lm-with-past/decoder_model.onnx +++ b/quantized/google/t5-v1_1-base/seq2seq-lm-with-past/decoder_model.onnx @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:83f4e696ca09795bee52c3c19642cf0ace200aa576ea2006833198be83ec6216 -size 164245993 +oid sha256:17990f89e69dfde950c25c0866fb4435812d36bfbf46db7351a9d5608c70efbd +size 164336072 diff --git a/quantized/google/t5-v1_1-base/seq2seq-lm-with-past/decoder_model_merged.onnx b/quantized/google/t5-v1_1-base/seq2seq-lm-with-past/decoder_model_merged.onnx new file mode 100644 index 0000000000000000000000000000000000000000..0256a5351904cbf0f14f364005b5dc0bf408228e --- /dev/null +++ b/quantized/google/t5-v1_1-base/seq2seq-lm-with-past/decoder_model_merged.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc2ed6d6efd0f727e277aa8a3f5f44b36b6a0f6e808add5c898ced2a5bbe6cf1 +size 164549246 diff --git a/quantized/google/t5-v1_1-base/seq2seq-lm-with-past/decoder_with_past_model.onnx b/quantized/google/t5-v1_1-base/seq2seq-lm-with-past/decoder_with_past_model.onnx index 68f0e1a059e4444e712fb9398838763e43063fd2..ccdedea39f190bd715967690a08873d8f4ed09bc 100644 --- a/quantized/google/t5-v1_1-base/seq2seq-lm-with-past/decoder_with_past_model.onnx +++ b/quantized/google/t5-v1_1-base/seq2seq-lm-with-past/decoder_with_past_model.onnx @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9735f078a8d070177a970d5353668ded23942d076a6cf6ba07cb7aad3fc32529 -size 149938415 +oid sha256:4299f5e1c01b33df8658fe4a6857a1fff1e3d47db7a1eba6c71ff672cd5af75b +size 150019481 diff --git a/quantized/google/t5-v1_1-base/seq2seq-lm-with-past/encoder_model.onnx b/quantized/google/t5-v1_1-base/seq2seq-lm-with-past/encoder_model.onnx index ffabd1d9092c4546e4e3c7d54a2257c0b5f7be3b..bd555f1d51ec14a106e637f0658f7515f520a86c 100644 --- a/quantized/google/t5-v1_1-base/seq2seq-lm-with-past/encoder_model.onnx +++ b/quantized/google/t5-v1_1-base/seq2seq-lm-with-past/encoder_model.onnx @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:33d0af70e4475f683586ca53c9b7a6c3a2eaaaaa305f705df9c5e897b1128934 -size 110539783 +oid sha256:5ac0d4f6da965ec8a2c2a91a32155cc92e7d5158e27c5e36d10b75e00da91e67 +size 110585314 diff --git a/quantized/google/t5-v1_1-small/seq2seq-lm-with-past/decoder_model.onnx b/quantized/google/t5-v1_1-small/seq2seq-lm-with-past/decoder_model.onnx index 4640c00b332b910c068dd08ce039ae3aa4afecc7..05bfbdf9ab7a8ab879fb39d9405d103f1aecc172 100644 --- a/quantized/google/t5-v1_1-small/seq2seq-lm-with-past/decoder_model.onnx +++ b/quantized/google/t5-v1_1-small/seq2seq-lm-with-past/decoder_model.onnx @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d12084abc7a8cb0771c9298cbe3d4b3ed9e8b2ec47886ddb11d600fb3a6e5c5a -size 58998475 +oid sha256:a5982955fba72cbc80221160fce037440d3a670c91e9bcd9beb6788a962771f6 +size 59058672 diff --git a/quantized/google/t5-v1_1-small/seq2seq-lm-with-past/decoder_model_merged.onnx b/quantized/google/t5-v1_1-small/seq2seq-lm-with-past/decoder_model_merged.onnx new file mode 100644 index 0000000000000000000000000000000000000000..3bb0fb69533b01c6109570be17a40e0eef55bd31 --- /dev/null +++ b/quantized/google/t5-v1_1-small/seq2seq-lm-with-past/decoder_model_merged.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a9d30911a12b36bc0df67abc93450da5fa8346992f2c2b1846f144fa814626c +size 59247726 diff --git a/quantized/google/t5-v1_1-small/seq2seq-lm-with-past/decoder_with_past_model.onnx b/quantized/google/t5-v1_1-small/seq2seq-lm-with-past/decoder_with_past_model.onnx index ffab8fedac4dd47f6651ef175c1e75c920ad5703..76bb033204d628a66ca83e8d82aed04cc1230dfc 100644 --- a/quantized/google/t5-v1_1-small/seq2seq-lm-with-past/decoder_with_past_model.onnx +++ b/quantized/google/t5-v1_1-small/seq2seq-lm-with-past/decoder_with_past_model.onnx @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:863de1616d28644332df2331cad5000cf700ff3b7bf9b8de42e46af6a7314b67 -size 55785322 +oid sha256:8a2315a861d9f3a8fddb8edcd0675dd3bf000fd93140c8b31b7dd6e9c012014c +size 55839462 diff --git a/quantized/google/t5-v1_1-small/seq2seq-lm-with-past/encoder_model.onnx b/quantized/google/t5-v1_1-small/seq2seq-lm-with-past/encoder_model.onnx index 44027cdc4969b7a6595dd208604147990139d3c0..487c0afb50ab7635729b07cc0749b7ef2910986e 100644 --- a/quantized/google/t5-v1_1-small/seq2seq-lm-with-past/encoder_model.onnx +++ b/quantized/google/t5-v1_1-small/seq2seq-lm-with-past/encoder_model.onnx @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:438e80e369cd88a92eb55bf623c4ae2616dcff678949e424ae4f8f9fa41e9786 -size 35784005 +oid sha256:6b6585dcde89301247cd8dfe0dbb221e83c5427217bbff424e78adeaafc98334 +size 35814394 diff --git a/quantized/openai/whisper-base.en/default/config.json b/quantized/openai/whisper-base.en/default/config.json index 0f0e052c322a7af5d702c50986a7f473c51abbdd..a06a0040590d419e3641482853812b18d546efb6 100644 --- a/quantized/openai/whisper-base.en/default/config.json +++ b/quantized/openai/whisper-base.en/default/config.json @@ -129,7 +129,6 @@ 50360, 50361 ], - "torch_dtype": "float32", "transformers_version": "4.26.1", "use_cache": true, "vocab_size": 51864 diff --git a/quantized/openai/whisper-base.en/default/decoder_model.onnx b/quantized/openai/whisper-base.en/default/decoder_model.onnx index 294284e73c05b9f908e2b232c7b86e7f4f06578b..0e3872fd3a7a5f30772eda0b02a375b9a7467026 100644 --- a/quantized/openai/whisper-base.en/default/decoder_model.onnx +++ b/quantized/openai/whisper-base.en/default/decoder_model.onnx @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:65591b39b49623c74b360af28509182a4054355c9d9d14b254566f257928d406 -size 53466938 +oid sha256:90e2a5e52df832bbc35fb104cfc63deb2a3731bfe3c997df73f5fa234ee9e363 +size 53464941 diff --git a/quantized/openai/whisper-base.en/default/encoder_model.onnx b/quantized/openai/whisper-base.en/default/encoder_model.onnx index 486176a7ab468d82d246222c1fbaa6d4baf20bfa..bd31f8e0f4870805e04aa758e0cfc4a2b2ddfefc 100644 --- a/quantized/openai/whisper-base.en/default/encoder_model.onnx +++ b/quantized/openai/whisper-base.en/default/encoder_model.onnx @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a8daef92b616d36adf1c086f89280443effd2c77c7e8c730113514833f076ca6 -size 23337231 +oid sha256:5ceadcf4cb45d3e07507174a5f281f745085f01ea01b32f11dcb14f20e81291b +size 23337235 diff --git a/quantized/openai/whisper-base.en/default/tokenizer_config.json b/quantized/openai/whisper-base.en/default/tokenizer_config.json index 044482e72ceb1721e9eadd5f8b4dd6fd8dee382b..5c2ea33b72e5dbe2a90929e27eb5ead584bbbb84 100644 --- a/quantized/openai/whisper-base.en/default/tokenizer_config.json +++ b/quantized/openai/whisper-base.en/default/tokenizer_config.json @@ -25,7 +25,6 @@ "return_attention_mask": false, "special_tokens_map_file": null, "tokenizer_class": "WhisperTokenizer", - "trust_remote_code": false, "unk_token": { "__type": "AddedToken", "content": "<|endoftext|>", diff --git a/quantized/openai/whisper-base.en/speech2seq-lm-with-past/config.json b/quantized/openai/whisper-base.en/speech2seq-lm-with-past/config.json index 0f0e052c322a7af5d702c50986a7f473c51abbdd..a06a0040590d419e3641482853812b18d546efb6 100644 --- a/quantized/openai/whisper-base.en/speech2seq-lm-with-past/config.json +++ b/quantized/openai/whisper-base.en/speech2seq-lm-with-past/config.json @@ -129,7 +129,6 @@ 50360, 50361 ], - "torch_dtype": "float32", "transformers_version": "4.26.1", "use_cache": true, "vocab_size": 51864 diff --git a/quantized/openai/whisper-base.en/speech2seq-lm-with-past/decoder_model.onnx b/quantized/openai/whisper-base.en/speech2seq-lm-with-past/decoder_model.onnx index 7da2a923670e9cfd0c444049244d8956b9484ee7..802bff66808d25d67822eba79e1e409cb5709bac 100644 --- a/quantized/openai/whisper-base.en/speech2seq-lm-with-past/decoder_model.onnx +++ b/quantized/openai/whisper-base.en/speech2seq-lm-with-past/decoder_model.onnx @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:acf55ec8ff985302cd968ad47b9a7ab9661b8dedd784270d12f1bd53cb79aeed -size 80323040 +oid sha256:d1a4eb50199211fafcccf5efb8176ab1f3422597fc767f05d30c559ce091abe6 +size 80321068 diff --git a/quantized/openai/whisper-base.en/speech2seq-lm-with-past/decoder_model_merged.onnx b/quantized/openai/whisper-base.en/speech2seq-lm-with-past/decoder_model_merged.onnx new file mode 100644 index 0000000000000000000000000000000000000000..5f990eac67816cc01e52db323bfb778689a03210 --- /dev/null +++ b/quantized/openai/whisper-base.en/speech2seq-lm-with-past/decoder_model_merged.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b2396a1c4079f5b541d05ccfd21bef6d20af75e48f9ac5c34bc4b67f3751fb5 +size 80556990 diff --git a/quantized/openai/whisper-base.en/speech2seq-lm-with-past/decoder_with_past_model.onnx b/quantized/openai/whisper-base.en/speech2seq-lm-with-past/decoder_with_past_model.onnx index e8f53e37f63d3e861f24b83f1400c3fdae0e5d7a..f30e4dfcbe712e2e7dbf95874792f79411622054 100644 --- a/quantized/openai/whisper-base.en/speech2seq-lm-with-past/decoder_with_past_model.onnx +++ b/quantized/openai/whisper-base.en/speech2seq-lm-with-past/decoder_with_past_model.onnx @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ab2ca295c5f803fd34d4583b9f1cfd6ad77370c3fec30a680c5bbcb9d4202dfb -size 77066559 +oid sha256:65b70d66fa9dbb1a61c863065100a08bf58a689383b212b1e91646738cc97424 +size 77066299 diff --git a/quantized/openai/whisper-base.en/speech2seq-lm-with-past/encoder_model.onnx b/quantized/openai/whisper-base.en/speech2seq-lm-with-past/encoder_model.onnx index 486176a7ab468d82d246222c1fbaa6d4baf20bfa..bd31f8e0f4870805e04aa758e0cfc4a2b2ddfefc 100644 --- a/quantized/openai/whisper-base.en/speech2seq-lm-with-past/encoder_model.onnx +++ b/quantized/openai/whisper-base.en/speech2seq-lm-with-past/encoder_model.onnx @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a8daef92b616d36adf1c086f89280443effd2c77c7e8c730113514833f076ca6 -size 23337231 +oid sha256:5ceadcf4cb45d3e07507174a5f281f745085f01ea01b32f11dcb14f20e81291b +size 23337235 diff --git a/quantized/openai/whisper-base.en/speech2seq-lm-with-past/tokenizer_config.json b/quantized/openai/whisper-base.en/speech2seq-lm-with-past/tokenizer_config.json index 044482e72ceb1721e9eadd5f8b4dd6fd8dee382b..5c2ea33b72e5dbe2a90929e27eb5ead584bbbb84 100644 --- a/quantized/openai/whisper-base.en/speech2seq-lm-with-past/tokenizer_config.json +++ b/quantized/openai/whisper-base.en/speech2seq-lm-with-past/tokenizer_config.json @@ -25,7 +25,6 @@ "return_attention_mask": false, "special_tokens_map_file": null, "tokenizer_class": "WhisperTokenizer", - "trust_remote_code": false, "unk_token": { "__type": "AddedToken", "content": "<|endoftext|>", diff --git a/quantized/openai/whisper-base/default/config.json b/quantized/openai/whisper-base/default/config.json index 9f0ec8146473ef27fb6be214f8e0fc08b0776cfd..546d4ae6ee01d58080a61b9e3e55c72951c9b6a9 100644 --- a/quantized/openai/whisper-base/default/config.json +++ b/quantized/openai/whisper-base/default/config.json @@ -135,7 +135,6 @@ 50361, 50362 ], - "torch_dtype": "float32", "transformers_version": "4.26.1", "use_cache": true, "vocab_size": 51865 diff --git a/quantized/openai/whisper-base/default/decoder_model.onnx b/quantized/openai/whisper-base/default/decoder_model.onnx index 64fa956fe669729e32559cb4677b638e7a712bbc..9ef76f7e8dc0f392bbbfd402ec152c4e9c3e3aaa 100644 --- a/quantized/openai/whisper-base/default/decoder_model.onnx +++ b/quantized/openai/whisper-base/default/decoder_model.onnx @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5d6942cf3bd8173fae3ddd56932bb1330e99845c8d1f291f622f7ddc5dea14ab -size 53467450 +oid sha256:7a5866bc679ce0c107395289250eae85918be53afd49e3bb3b026710d7023dcd +size 53465453 diff --git a/quantized/openai/whisper-base/default/encoder_model.onnx b/quantized/openai/whisper-base/default/encoder_model.onnx index c6eb28a97e6f377867c6aa3c6d3b1dd3b94095cc..e48e8541da7a61e7e5f3072382653a029d995e51 100644 --- a/quantized/openai/whisper-base/default/encoder_model.onnx +++ b/quantized/openai/whisper-base/default/encoder_model.onnx @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c4c995617d3e567ff954695388801dab9d13fae1804103a974a8ecd6e7bcfa9a -size 23337231 +oid sha256:1990e063ab168d67092cbbd32588acb425e6d767bd3af38ecf36137fe3914b41 +size 23337235 diff --git a/quantized/openai/whisper-base/default/tokenizer_config.json b/quantized/openai/whisper-base/default/tokenizer_config.json index 6b0a72ce5cf3c335eab27a46d2fa0f812e6b48fd..2dfd88e8dfba2c386243c900f3f8f9ddaa1f604a 100644 --- a/quantized/openai/whisper-base/default/tokenizer_config.json +++ b/quantized/openai/whisper-base/default/tokenizer_config.json @@ -25,7 +25,6 @@ "return_attention_mask": false, "special_tokens_map_file": null, "tokenizer_class": "WhisperTokenizer", - "trust_remote_code": false, "unk_token": { "__type": "AddedToken", "content": "<|endoftext|>", diff --git a/quantized/openai/whisper-base/speech2seq-lm-with-past/config.json b/quantized/openai/whisper-base/speech2seq-lm-with-past/config.json index 9f0ec8146473ef27fb6be214f8e0fc08b0776cfd..546d4ae6ee01d58080a61b9e3e55c72951c9b6a9 100644 --- a/quantized/openai/whisper-base/speech2seq-lm-with-past/config.json +++ b/quantized/openai/whisper-base/speech2seq-lm-with-past/config.json @@ -135,7 +135,6 @@ 50361, 50362 ], - "torch_dtype": "float32", "transformers_version": "4.26.1", "use_cache": true, "vocab_size": 51865 diff --git a/quantized/openai/whisper-base/speech2seq-lm-with-past/decoder_model.onnx b/quantized/openai/whisper-base/speech2seq-lm-with-past/decoder_model.onnx index 0c5b6f60aa016aef6d693877b248407e201c3a0e..eded76ecf7775900e3d2506aa1f333b8ac03690a 100644 --- a/quantized/openai/whisper-base/speech2seq-lm-with-past/decoder_model.onnx +++ b/quantized/openai/whisper-base/speech2seq-lm-with-past/decoder_model.onnx @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d7a8b7bfa9d2117ed40edc1bfca3e5de318c04b601b215bc651023eda15c6bed -size 80324069 +oid sha256:0800f9c5cd63139166bf2031993b8e136bb754a76a94aaf25a9e9b0dd9cc73bf +size 80322097 diff --git a/quantized/openai/whisper-base/speech2seq-lm-with-past/decoder_model_merged.onnx b/quantized/openai/whisper-base/speech2seq-lm-with-past/decoder_model_merged.onnx new file mode 100644 index 0000000000000000000000000000000000000000..b7da53318684804acaa0e8c4865dd666bf782fc4 --- /dev/null +++ b/quantized/openai/whisper-base/speech2seq-lm-with-past/decoder_model_merged.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62aac7f57c5f696817983bb46f45b694d9e870727dcade1c2be707146b1e215e +size 80558019 diff --git a/quantized/openai/whisper-base/speech2seq-lm-with-past/decoder_with_past_model.onnx b/quantized/openai/whisper-base/speech2seq-lm-with-past/decoder_with_past_model.onnx index 5695c4c27a814353e584698f2dc3f9c6c4be36e6..06d0a7adc5c314484830480d21e5f109e5a45f68 100644 --- a/quantized/openai/whisper-base/speech2seq-lm-with-past/decoder_with_past_model.onnx +++ b/quantized/openai/whisper-base/speech2seq-lm-with-past/decoder_with_past_model.onnx @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:97cf2a4270fee757ec5cc239c165b0b63814fe4c9160e3910d2099efa460c5d7 -size 77067588 +oid sha256:6f1e5181fd479407e403f50594bb14a38bca8f6c86e27b656c4066aaf9cd0a72 +size 77067328 diff --git a/quantized/openai/whisper-base/speech2seq-lm-with-past/encoder_model.onnx b/quantized/openai/whisper-base/speech2seq-lm-with-past/encoder_model.onnx index c6eb28a97e6f377867c6aa3c6d3b1dd3b94095cc..e48e8541da7a61e7e5f3072382653a029d995e51 100644 --- a/quantized/openai/whisper-base/speech2seq-lm-with-past/encoder_model.onnx +++ b/quantized/openai/whisper-base/speech2seq-lm-with-past/encoder_model.onnx @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c4c995617d3e567ff954695388801dab9d13fae1804103a974a8ecd6e7bcfa9a -size 23337231 +oid sha256:1990e063ab168d67092cbbd32588acb425e6d767bd3af38ecf36137fe3914b41 +size 23337235 diff --git a/quantized/openai/whisper-base/speech2seq-lm-with-past/tokenizer_config.json b/quantized/openai/whisper-base/speech2seq-lm-with-past/tokenizer_config.json index 6b0a72ce5cf3c335eab27a46d2fa0f812e6b48fd..2dfd88e8dfba2c386243c900f3f8f9ddaa1f604a 100644 --- a/quantized/openai/whisper-base/speech2seq-lm-with-past/tokenizer_config.json +++ b/quantized/openai/whisper-base/speech2seq-lm-with-past/tokenizer_config.json @@ -25,7 +25,6 @@ "return_attention_mask": false, "special_tokens_map_file": null, "tokenizer_class": "WhisperTokenizer", - "trust_remote_code": false, "unk_token": { "__type": "AddedToken", "content": "<|endoftext|>", diff --git a/quantized/openai/whisper-small.en/default/config.json b/quantized/openai/whisper-small.en/default/config.json index e68b2517185b7dc081f219ed07d8875435471602..60bd84cfd6099303181ef474422ac8c00d87cf86 100644 --- a/quantized/openai/whisper-small.en/default/config.json +++ b/quantized/openai/whisper-small.en/default/config.json @@ -129,7 +129,6 @@ 50360, 50361 ], - "torch_dtype": "float32", "transformers_version": "4.26.1", "use_cache": true, "vocab_size": 51864 diff --git a/quantized/openai/whisper-small.en/default/decoder_model.onnx b/quantized/openai/whisper-small.en/default/decoder_model.onnx index 5ebbbc897efa20832c55ab71d610f8b48715e800..80aa4f9ff850fa2208e7370a50b6adeaf887d9d9 100644 --- a/quantized/openai/whisper-small.en/default/decoder_model.onnx +++ b/quantized/openai/whisper-small.en/default/decoder_model.onnx @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d304c16554a234d0c6c2d8553da683c49a9e872537714fa99f756e9bfa9e0230 -size 156507792 +oid sha256:8af023c75b14ede43fa2904e5d702d1ea36673709cb6a0f849d2fb7c498f67f7 +size 156503755 diff --git a/quantized/openai/whisper-small.en/default/encoder_model.onnx b/quantized/openai/whisper-small.en/default/encoder_model.onnx index f28ecd76363f49096f8bed17946a8b1fa88b4706..0501417673dffa873a330b625ef1946914f17b1a 100644 --- a/quantized/openai/whisper-small.en/default/encoder_model.onnx +++ b/quantized/openai/whisper-small.en/default/encoder_model.onnx @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7a9ff0f76c5a450edccfc7fbe8f910047620a56101b284066e007832ad6d48d3 -size 92735924 +oid sha256:6792ba696e505bd3527efa62327024bc04db8bf9558d47e16a2fff7e3810440f +size 92735928 diff --git a/quantized/openai/whisper-small.en/default/tokenizer_config.json b/quantized/openai/whisper-small.en/default/tokenizer_config.json index ba1d7aa7a5333296cabbcf5b9e4c239aedf2d755..c17ccf7df98614e74fc7d5e7de73ec03dcafd93d 100644 --- a/quantized/openai/whisper-small.en/default/tokenizer_config.json +++ b/quantized/openai/whisper-small.en/default/tokenizer_config.json @@ -25,7 +25,6 @@ "return_attention_mask": false, "special_tokens_map_file": null, "tokenizer_class": "WhisperTokenizer", - "trust_remote_code": false, "unk_token": { "__type": "AddedToken", "content": "<|endoftext|>", diff --git a/quantized/openai/whisper-small.en/speech2seq-lm-with-past/config.json b/quantized/openai/whisper-small.en/speech2seq-lm-with-past/config.json index e68b2517185b7dc081f219ed07d8875435471602..60bd84cfd6099303181ef474422ac8c00d87cf86 100644 --- a/quantized/openai/whisper-small.en/speech2seq-lm-with-past/config.json +++ b/quantized/openai/whisper-small.en/speech2seq-lm-with-past/config.json @@ -129,7 +129,6 @@ 50360, 50361 ], - "torch_dtype": "float32", "transformers_version": "4.26.1", "use_cache": true, "vocab_size": 51864 diff --git a/quantized/openai/whisper-small.en/speech2seq-lm-with-past/decoder_model.onnx b/quantized/openai/whisper-small.en/speech2seq-lm-with-past/decoder_model.onnx index 53a5f950f40b94e1c32814a88e7541b920283b38..380efc20556342d2f1f094bc860a72c75fe632e6 100644 --- a/quantized/openai/whisper-small.en/speech2seq-lm-with-past/decoder_model.onnx +++ b/quantized/openai/whisper-small.en/speech2seq-lm-with-past/decoder_model.onnx @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:188af562e38a5e1d513ce1526dd22688947d3b5d06227ace70ccc7f0a6657846 -size 196680348 +oid sha256:0105edbe0037f4c7ac11f020f53f581b6ed10c9f680124d2448f255ec52c28c3 +size 196676336 diff --git a/quantized/openai/whisper-small.en/speech2seq-lm-with-past/decoder_model_merged.onnx b/quantized/openai/whisper-small.en/speech2seq-lm-with-past/decoder_model_merged.onnx new file mode 100644 index 0000000000000000000000000000000000000000..8df35187ae8047d99c3e21b0ed1868619b6925f4 --- /dev/null +++ b/quantized/openai/whisper-small.en/speech2seq-lm-with-past/decoder_model_merged.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8defd52aed2a7843e174afb4a42c44ae4dfb8e85c200e9955fb88a68ef8df0f7 +size 197146590 diff --git a/quantized/openai/whisper-small.en/speech2seq-lm-with-past/decoder_with_past_model.onnx b/quantized/openai/whisper-small.en/speech2seq-lm-with-past/decoder_with_past_model.onnx index 7b4a58b58193e4357d596beef3ce29b74e443c07..f74b2828c125bd3e12b33efede29e8801d1ba80a 100644 --- a/quantized/openai/whisper-small.en/speech2seq-lm-with-past/decoder_with_past_model.onnx +++ b/quantized/openai/whisper-small.en/speech2seq-lm-with-past/decoder_with_past_model.onnx @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:90ee0249df2d0a3f98da7025f71d2ed6a914cb543a76d1300194f2cfbdddebb9 -size 182268135 +oid sha256:a6ced91a295a5a5d10abebd872a1da952b441e12240cf2f1f680b24ae9e53029 +size 182267587 diff --git a/quantized/openai/whisper-small.en/speech2seq-lm-with-past/encoder_model.onnx b/quantized/openai/whisper-small.en/speech2seq-lm-with-past/encoder_model.onnx index f28ecd76363f49096f8bed17946a8b1fa88b4706..0501417673dffa873a330b625ef1946914f17b1a 100644 --- a/quantized/openai/whisper-small.en/speech2seq-lm-with-past/encoder_model.onnx +++ b/quantized/openai/whisper-small.en/speech2seq-lm-with-past/encoder_model.onnx @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7a9ff0f76c5a450edccfc7fbe8f910047620a56101b284066e007832ad6d48d3 -size 92735924 +oid sha256:6792ba696e505bd3527efa62327024bc04db8bf9558d47e16a2fff7e3810440f +size 92735928 diff --git a/quantized/openai/whisper-small.en/speech2seq-lm-with-past/tokenizer_config.json b/quantized/openai/whisper-small.en/speech2seq-lm-with-past/tokenizer_config.json index ba1d7aa7a5333296cabbcf5b9e4c239aedf2d755..c17ccf7df98614e74fc7d5e7de73ec03dcafd93d 100644 --- a/quantized/openai/whisper-small.en/speech2seq-lm-with-past/tokenizer_config.json +++ b/quantized/openai/whisper-small.en/speech2seq-lm-with-past/tokenizer_config.json @@ -25,7 +25,6 @@ "return_attention_mask": false, "special_tokens_map_file": null, "tokenizer_class": "WhisperTokenizer", - "trust_remote_code": false, "unk_token": { "__type": "AddedToken", "content": "<|endoftext|>", diff --git a/quantized/openai/whisper-small/default/config.json b/quantized/openai/whisper-small/default/config.json index 4c6b92ef5673e25cb9124507e4a9564439d8e91f..bcf1ef1259e67bdb592577b16054176e05bc8a80 100644 --- a/quantized/openai/whisper-small/default/config.json +++ b/quantized/openai/whisper-small/default/config.json @@ -135,7 +135,6 @@ 50361, 50362 ], - "torch_dtype": "float32", "transformers_version": "4.26.1", "use_cache": true, "vocab_size": 51865 diff --git a/quantized/openai/whisper-small/default/decoder_model.onnx b/quantized/openai/whisper-small/default/decoder_model.onnx index ec49323cd4251fa9ffc1ac83421349e2a6bd62fd..8c9196bb18fba5abb24186bc68198cfddbeb143e 100644 --- a/quantized/openai/whisper-small/default/decoder_model.onnx +++ b/quantized/openai/whisper-small/default/decoder_model.onnx @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c242c30a33e05e44eb2e585485d09123282310b842d27e043bea7840181d372c -size 156508560 +oid sha256:77af26339700b3afdcb37d3e9158c4c713875719c30e19eaabd919f7010a554f +size 156504523 diff --git a/quantized/openai/whisper-small/default/encoder_model.onnx b/quantized/openai/whisper-small/default/encoder_model.onnx index 18200eae15b55c90c821fd9ac637f1616bbf0999..77a89d497bfbe099d93c0f95050ec99c8a9140e4 100644 --- a/quantized/openai/whisper-small/default/encoder_model.onnx +++ b/quantized/openai/whisper-small/default/encoder_model.onnx @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:4631051cfe2817def148e9ce2c4c3aea1ad8a7a55a11b3af3f4c0dc228316508 -size 92735924 +oid sha256:7279228b00bb1cecdc08eb098205aaa131a478cba1abeb39800c9aa84e85d5e2 +size 92735928 diff --git a/quantized/openai/whisper-small/default/tokenizer_config.json b/quantized/openai/whisper-small/default/tokenizer_config.json index 626e5cb97dd333a874548213550e6612e9fa103d..fe49919b600daf0a9e08f15e11233858a6901aa0 100644 --- a/quantized/openai/whisper-small/default/tokenizer_config.json +++ b/quantized/openai/whisper-small/default/tokenizer_config.json @@ -25,7 +25,6 @@ "return_attention_mask": false, "special_tokens_map_file": null, "tokenizer_class": "WhisperTokenizer", - "trust_remote_code": false, "unk_token": { "__type": "AddedToken", "content": "<|endoftext|>", diff --git a/quantized/openai/whisper-small/speech2seq-lm-with-past/config.json b/quantized/openai/whisper-small/speech2seq-lm-with-past/config.json index 4c6b92ef5673e25cb9124507e4a9564439d8e91f..bcf1ef1259e67bdb592577b16054176e05bc8a80 100644 --- a/quantized/openai/whisper-small/speech2seq-lm-with-past/config.json +++ b/quantized/openai/whisper-small/speech2seq-lm-with-past/config.json @@ -135,7 +135,6 @@ 50361, 50362 ], - "torch_dtype": "float32", "transformers_version": "4.26.1", "use_cache": true, "vocab_size": 51865 diff --git a/quantized/openai/whisper-small/speech2seq-lm-with-past/decoder_model.onnx b/quantized/openai/whisper-small/speech2seq-lm-with-past/decoder_model.onnx index c786356a314b44ddef6a42768e18f6fc4e8f4928..8f89732b49a9a000431a9758f3982958a1075c8b 100644 --- a/quantized/openai/whisper-small/speech2seq-lm-with-past/decoder_model.onnx +++ b/quantized/openai/whisper-small/speech2seq-lm-with-past/decoder_model.onnx @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:cee4e81283dd20a2dbb9b52ac6d6f8f5b159099c0f8cde13e10c4643f89f70a1 -size 196681889 +oid sha256:45cd0b5cfbf905e96bad3cc58b4914879dea5c86ef96bc43e47cafa87c8a86a7 +size 196677877 diff --git a/quantized/openai/whisper-small/speech2seq-lm-with-past/decoder_model_merged.onnx b/quantized/openai/whisper-small/speech2seq-lm-with-past/decoder_model_merged.onnx new file mode 100644 index 0000000000000000000000000000000000000000..886b1acd1dad969a1321442190a075dab233ea3f --- /dev/null +++ b/quantized/openai/whisper-small/speech2seq-lm-with-past/decoder_model_merged.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92481f314d2811fd44dcb712c2ff4cdca3178c47e8736ef3b23057fa8c69efa3 +size 197148131 diff --git a/quantized/openai/whisper-small/speech2seq-lm-with-past/decoder_with_past_model.onnx b/quantized/openai/whisper-small/speech2seq-lm-with-past/decoder_with_past_model.onnx index 5819972f00b61080fe5e79b3e07092721effc599..865b1be5b92ef7bb9cc9b142b6b88e1ed3976f96 100644 --- a/quantized/openai/whisper-small/speech2seq-lm-with-past/decoder_with_past_model.onnx +++ b/quantized/openai/whisper-small/speech2seq-lm-with-past/decoder_with_past_model.onnx @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:8df081154685d649af4859802d0b85c4011c96421aaaf115c3053b508b0ff4c3 -size 182269676 +oid sha256:e16020674fc4b2352a89c1ab2916c752fadf20535192c191cacdee9bd2f411a0 +size 182269128 diff --git a/quantized/openai/whisper-small/speech2seq-lm-with-past/encoder_model.onnx b/quantized/openai/whisper-small/speech2seq-lm-with-past/encoder_model.onnx index 18200eae15b55c90c821fd9ac637f1616bbf0999..77a89d497bfbe099d93c0f95050ec99c8a9140e4 100644 --- a/quantized/openai/whisper-small/speech2seq-lm-with-past/encoder_model.onnx +++ b/quantized/openai/whisper-small/speech2seq-lm-with-past/encoder_model.onnx @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:4631051cfe2817def148e9ce2c4c3aea1ad8a7a55a11b3af3f4c0dc228316508 -size 92735924 +oid sha256:7279228b00bb1cecdc08eb098205aaa131a478cba1abeb39800c9aa84e85d5e2 +size 92735928 diff --git a/quantized/openai/whisper-small/speech2seq-lm-with-past/tokenizer_config.json b/quantized/openai/whisper-small/speech2seq-lm-with-past/tokenizer_config.json index 626e5cb97dd333a874548213550e6612e9fa103d..fe49919b600daf0a9e08f15e11233858a6901aa0 100644 --- a/quantized/openai/whisper-small/speech2seq-lm-with-past/tokenizer_config.json +++ b/quantized/openai/whisper-small/speech2seq-lm-with-past/tokenizer_config.json @@ -25,7 +25,6 @@ "return_attention_mask": false, "special_tokens_map_file": null, "tokenizer_class": "WhisperTokenizer", - "trust_remote_code": false, "unk_token": { "__type": "AddedToken", "content": "<|endoftext|>", diff --git a/quantized/openai/whisper-tiny.en/default/config.json b/quantized/openai/whisper-tiny.en/default/config.json index f761dfdb5010cc744479627ce0bf3cfa700f25e6..19ba30a5b107177cc97f65465c61c5e24f47a382 100644 --- a/quantized/openai/whisper-tiny.en/default/config.json +++ b/quantized/openai/whisper-tiny.en/default/config.json @@ -129,7 +129,6 @@ 50360, 50361 ], - "torch_dtype": "float32", "transformers_version": "4.26.1", "use_cache": true, "vocab_size": 51864 diff --git a/quantized/openai/whisper-tiny.en/default/decoder_model.onnx b/quantized/openai/whisper-tiny.en/default/decoder_model.onnx index 96fa9834bbe114502334d0c781facb2c4b0477a4..155a34bf758c598c7a5c6ebecb2c16fc008cb348 100644 --- a/quantized/openai/whisper-tiny.en/default/decoder_model.onnx +++ b/quantized/openai/whisper-tiny.en/default/decoder_model.onnx @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:064cc5dbfeba053bf2b24d1fe9db13374b6196e6e03b3c700a28032febd0a2e4 -size 30530667 +oid sha256:ead164b287283fa00157b909f5cb5d4b294c7d27aa37a9724aa39f0a647a9907 +size 30529344 diff --git a/quantized/openai/whisper-tiny.en/default/encoder_model.onnx b/quantized/openai/whisper-tiny.en/default/encoder_model.onnx index 195d2ca112bb68559d820323242654ddb41f6b3e..3745f6f0a4cc708db169b1930f030c4b36bd8f23 100644 --- a/quantized/openai/whisper-tiny.en/default/encoder_model.onnx +++ b/quantized/openai/whisper-tiny.en/default/encoder_model.onnx @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c1d3f992f96cc792f194169a8f7b451b315bfcc6b71ba2082c698f1d374de026 -size 10192815 +oid sha256:29ee3cc641cf1e3cd448644bd474a974d7bb7b2a26aa3ad3d56aa458215e9cf7 +size 10192819 diff --git a/quantized/openai/whisper-tiny.en/default/tokenizer_config.json b/quantized/openai/whisper-tiny.en/default/tokenizer_config.json index c430ca30d3214990bfea9dc44653d7e585b0be4f..384d88d69be58b06f01c0fc5a4854e064bbd6159 100644 --- a/quantized/openai/whisper-tiny.en/default/tokenizer_config.json +++ b/quantized/openai/whisper-tiny.en/default/tokenizer_config.json @@ -25,7 +25,6 @@ "return_attention_mask": false, "special_tokens_map_file": null, "tokenizer_class": "WhisperTokenizer", - "trust_remote_code": false, "unk_token": { "__type": "AddedToken", "content": "<|endoftext|>", diff --git a/quantized/openai/whisper-tiny.en/speech2seq-lm-with-past/config.json b/quantized/openai/whisper-tiny.en/speech2seq-lm-with-past/config.json index f761dfdb5010cc744479627ce0bf3cfa700f25e6..19ba30a5b107177cc97f65465c61c5e24f47a382 100644 --- a/quantized/openai/whisper-tiny.en/speech2seq-lm-with-past/config.json +++ b/quantized/openai/whisper-tiny.en/speech2seq-lm-with-past/config.json @@ -129,7 +129,6 @@ 50360, 50361 ], - "torch_dtype": "float32", "transformers_version": "4.26.1", "use_cache": true, "vocab_size": 51864 diff --git a/quantized/openai/whisper-tiny.en/speech2seq-lm-with-past/decoder_model.onnx b/quantized/openai/whisper-tiny.en/speech2seq-lm-with-past/decoder_model.onnx index 41ca089e06eb354acb9750e30bea8a14dd6e7609..9a56e8ee29405398374b083c72c74cb15a669900 100644 --- a/quantized/openai/whisper-tiny.en/speech2seq-lm-with-past/decoder_model.onnx +++ b/quantized/openai/whisper-tiny.en/speech2seq-lm-with-past/decoder_model.onnx @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0a424ab24bfa1e2700982139341dcf183f4b415b78327ab08b97b1e76819f210 -size 50735081 +oid sha256:417751a3fa339b5eb7ccd239a3ed832a6e3e8edbeec3a7d049e132ac3478bbb5 +size 50733783 diff --git a/quantized/openai/whisper-tiny.en/speech2seq-lm-with-past/decoder_model_merged.onnx b/quantized/openai/whisper-tiny.en/speech2seq-lm-with-past/decoder_model_merged.onnx new file mode 100644 index 0000000000000000000000000000000000000000..611f84ded9f858d97005ff4e3440dbde7ed9333b --- /dev/null +++ b/quantized/openai/whisper-tiny.en/speech2seq-lm-with-past/decoder_model_merged.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b82d9231f4fb81470f8cc2878b6dd67bcf2f737b251924da4eba45d79777bc14 +size 50891940 diff --git a/quantized/openai/whisper-tiny.en/speech2seq-lm-with-past/decoder_with_past_model.onnx b/quantized/openai/whisper-tiny.en/speech2seq-lm-with-past/decoder_with_past_model.onnx index a705112868f298a6976a0aa2d01423977eba6f51..aea60d46a2a34accba426e27469f1e02be646d64 100644 --- a/quantized/openai/whisper-tiny.en/speech2seq-lm-with-past/decoder_with_past_model.onnx +++ b/quantized/openai/whisper-tiny.en/speech2seq-lm-with-past/decoder_with_past_model.onnx @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5c1ea24304591aba1cb75e603f6c1c21bf4494d3d0395a9fc55017a8091ebe9f -size 49485902 +oid sha256:aaa60b7625c15a1c26d1f21e2898b101367f5c746692a44b3bd68bcc5d4fcc15 +size 49485740 diff --git a/quantized/openai/whisper-tiny.en/speech2seq-lm-with-past/encoder_model.onnx b/quantized/openai/whisper-tiny.en/speech2seq-lm-with-past/encoder_model.onnx index 195d2ca112bb68559d820323242654ddb41f6b3e..3745f6f0a4cc708db169b1930f030c4b36bd8f23 100644 --- a/quantized/openai/whisper-tiny.en/speech2seq-lm-with-past/encoder_model.onnx +++ b/quantized/openai/whisper-tiny.en/speech2seq-lm-with-past/encoder_model.onnx @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c1d3f992f96cc792f194169a8f7b451b315bfcc6b71ba2082c698f1d374de026 -size 10192815 +oid sha256:29ee3cc641cf1e3cd448644bd474a974d7bb7b2a26aa3ad3d56aa458215e9cf7 +size 10192819 diff --git a/quantized/openai/whisper-tiny.en/speech2seq-lm-with-past/tokenizer_config.json b/quantized/openai/whisper-tiny.en/speech2seq-lm-with-past/tokenizer_config.json index c430ca30d3214990bfea9dc44653d7e585b0be4f..384d88d69be58b06f01c0fc5a4854e064bbd6159 100644 --- a/quantized/openai/whisper-tiny.en/speech2seq-lm-with-past/tokenizer_config.json +++ b/quantized/openai/whisper-tiny.en/speech2seq-lm-with-past/tokenizer_config.json @@ -25,7 +25,6 @@ "return_attention_mask": false, "special_tokens_map_file": null, "tokenizer_class": "WhisperTokenizer", - "trust_remote_code": false, "unk_token": { "__type": "AddedToken", "content": "<|endoftext|>", diff --git a/quantized/openai/whisper-tiny/default/config.json b/quantized/openai/whisper-tiny/default/config.json index cb403313fd753adb0790226d1d7a7b1258c2c7ae..52163147f09e4f7b74a294d9eb3de22adbf2bef3 100644 --- a/quantized/openai/whisper-tiny/default/config.json +++ b/quantized/openai/whisper-tiny/default/config.json @@ -135,7 +135,6 @@ 50361, 50362 ], - "torch_dtype": "float32", "transformers_version": "4.26.1", "use_cache": true, "vocab_size": 51865 diff --git a/quantized/openai/whisper-tiny/default/decoder_model.onnx b/quantized/openai/whisper-tiny/default/decoder_model.onnx index e14a8261705d453beba162d8578cce908505123e..d03365cadd7fb844a8b1616c49a20c235fa2ce6d 100644 --- a/quantized/openai/whisper-tiny/default/decoder_model.onnx +++ b/quantized/openai/whisper-tiny/default/decoder_model.onnx @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:fead8565b3de3f10b1542b041de2f30576402bf634fb2ceb2b8c2d56cdf21b91 -size 30531051 +oid sha256:933e0d390454f1814d5e8b332a8b538dee4cd5ce16a51b14ee3d38b81be5a005 +size 30529728 diff --git a/quantized/openai/whisper-tiny/default/encoder_model.onnx b/quantized/openai/whisper-tiny/default/encoder_model.onnx index 9136ed87ab1dac4f3cf0a238e313ba5b4986c850..cd7b6ba5863a21cf9ec66c45d2289373bcde48a7 100644 --- a/quantized/openai/whisper-tiny/default/encoder_model.onnx +++ b/quantized/openai/whisper-tiny/default/encoder_model.onnx @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:92e97f2cbd41ab1117039ddf725888ad8a028834b9cbd7e5be74d7fac0515d44 -size 10192815 +oid sha256:140f7c48489beda5c140c125d0609266e37185e69cbb83eeb8315585bb438bf0 +size 10192819 diff --git a/quantized/openai/whisper-tiny/default/tokenizer_config.json b/quantized/openai/whisper-tiny/default/tokenizer_config.json index c18ca77e9c4c964c76c454efa85a08c35a9c9a4a..224faf0c5158669dee7202e9c4f75e977f9c6651 100644 --- a/quantized/openai/whisper-tiny/default/tokenizer_config.json +++ b/quantized/openai/whisper-tiny/default/tokenizer_config.json @@ -25,7 +25,6 @@ "return_attention_mask": false, "special_tokens_map_file": null, "tokenizer_class": "WhisperTokenizer", - "trust_remote_code": false, "unk_token": { "__type": "AddedToken", "content": "<|endoftext|>", diff --git a/quantized/openai/whisper-tiny/speech2seq-lm-with-past/config.json b/quantized/openai/whisper-tiny/speech2seq-lm-with-past/config.json index cb403313fd753adb0790226d1d7a7b1258c2c7ae..52163147f09e4f7b74a294d9eb3de22adbf2bef3 100644 --- a/quantized/openai/whisper-tiny/speech2seq-lm-with-past/config.json +++ b/quantized/openai/whisper-tiny/speech2seq-lm-with-past/config.json @@ -135,7 +135,6 @@ 50361, 50362 ], - "torch_dtype": "float32", "transformers_version": "4.26.1", "use_cache": true, "vocab_size": 51865 diff --git a/quantized/openai/whisper-tiny/speech2seq-lm-with-past/decoder_model.onnx b/quantized/openai/whisper-tiny/speech2seq-lm-with-past/decoder_model.onnx index 6cef0a605aeb641c5ac081f30e06fe453bf3e805..2291ad7d8cfeeaaf092ed67226e4fd6117945ff6 100644 --- a/quantized/openai/whisper-tiny/speech2seq-lm-with-past/decoder_model.onnx +++ b/quantized/openai/whisper-tiny/speech2seq-lm-with-past/decoder_model.onnx @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5cc79a5e89b4dd4b672980e7d823051776e473395bb1d6d891488f3cf2c7d0fe -size 50735854 +oid sha256:b778a7996bffa4487385138d00e56298776bcf894930d358ff2d800cd2954361 +size 50734556 diff --git a/quantized/openai/whisper-tiny/speech2seq-lm-with-past/decoder_model_merged.onnx b/quantized/openai/whisper-tiny/speech2seq-lm-with-past/decoder_model_merged.onnx new file mode 100644 index 0000000000000000000000000000000000000000..a08f2312a2781aa1f2169e4d1cf3784fc7126489 --- /dev/null +++ b/quantized/openai/whisper-tiny/speech2seq-lm-with-past/decoder_model_merged.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef4212fc1105df3730ac5e0e1dc5f6173d0d598e0422fd98f5e44358a4d88965 +size 50892695 diff --git a/quantized/openai/whisper-tiny/speech2seq-lm-with-past/decoder_with_past_model.onnx b/quantized/openai/whisper-tiny/speech2seq-lm-with-past/decoder_with_past_model.onnx index 288b797a430f74261df5f759b64096bcb0c444a7..95ceb3568a08058c6739839fd721ab4d7eada92f 100644 --- a/quantized/openai/whisper-tiny/speech2seq-lm-with-past/decoder_with_past_model.onnx +++ b/quantized/openai/whisper-tiny/speech2seq-lm-with-past/decoder_with_past_model.onnx @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c78a41943419456e0ca4bab35a487dd8a91c014844f353f6a0274000c92ce27f -size 49486675 +oid sha256:231c945514b7e8eddb9033f9149085175410837653e1b2bedd5cb61d6d6a9e9e +size 49486513 diff --git a/quantized/openai/whisper-tiny/speech2seq-lm-with-past/encoder_model.onnx b/quantized/openai/whisper-tiny/speech2seq-lm-with-past/encoder_model.onnx index 9136ed87ab1dac4f3cf0a238e313ba5b4986c850..cd7b6ba5863a21cf9ec66c45d2289373bcde48a7 100644 --- a/quantized/openai/whisper-tiny/speech2seq-lm-with-past/encoder_model.onnx +++ b/quantized/openai/whisper-tiny/speech2seq-lm-with-past/encoder_model.onnx @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:92e97f2cbd41ab1117039ddf725888ad8a028834b9cbd7e5be74d7fac0515d44 -size 10192815 +oid sha256:140f7c48489beda5c140c125d0609266e37185e69cbb83eeb8315585bb438bf0 +size 10192819 diff --git a/quantized/openai/whisper-tiny/speech2seq-lm-with-past/tokenizer_config.json b/quantized/openai/whisper-tiny/speech2seq-lm-with-past/tokenizer_config.json index c18ca77e9c4c964c76c454efa85a08c35a9c9a4a..224faf0c5158669dee7202e9c4f75e977f9c6651 100644 --- a/quantized/openai/whisper-tiny/speech2seq-lm-with-past/tokenizer_config.json +++ b/quantized/openai/whisper-tiny/speech2seq-lm-with-past/tokenizer_config.json @@ -25,7 +25,6 @@ "return_attention_mask": false, "special_tokens_map_file": null, "tokenizer_class": "WhisperTokenizer", - "trust_remote_code": false, "unk_token": { "__type": "AddedToken", "content": "<|endoftext|>", diff --git a/quantized/sshleifer/distilbart-cnn-6-6/seq2seq-lm-with-past/config.json b/quantized/sshleifer/distilbart-cnn-6-6/seq2seq-lm-with-past/config.json index 40c7820c59c930680f4af140ed61a931dea50269..ff3666ead9d3e2c88f2692b125239b34d8513994 100644 --- a/quantized/sshleifer/distilbart-cnn-6-6/seq2seq-lm-with-past/config.json +++ b/quantized/sshleifer/distilbart-cnn-6-6/seq2seq-lm-with-past/config.json @@ -1,5 +1,5 @@ { - "_name_or_path": "./models/pytorch/distilbart-cnn-6-6", + "_name_or_path": "sshleifer/distilbart-cnn-6-6", "_num_labels": 3, "activation_dropout": 0.0, "activation_function": "gelu", @@ -70,7 +70,6 @@ "num_beams": 4 } }, - "torch_dtype": "float32", "transformers_version": "4.26.1", "use_cache": true, "vocab_size": 50264 diff --git a/quantized/sshleifer/distilbart-cnn-6-6/seq2seq-lm-with-past/decoder_model.onnx b/quantized/sshleifer/distilbart-cnn-6-6/seq2seq-lm-with-past/decoder_model.onnx index eac3e24b5a8286b999de98cfdf2298cf1da343f0..69ee3bad2128e4040361a073508188773e76572c 100644 --- a/quantized/sshleifer/distilbart-cnn-6-6/seq2seq-lm-with-past/decoder_model.onnx +++ b/quantized/sshleifer/distilbart-cnn-6-6/seq2seq-lm-with-past/decoder_model.onnx @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5febe5b43ce4c9c2bc35a5cb18dfa5e48a46d0fc8fc18d2af1795d61c50fd680 -size 206479989 +oid sha256:bf78c246385eb43eedd09db3727275eb2ea890c8f80df7600c22871f9fa63d49 +size 206522287 diff --git a/quantized/sshleifer/distilbart-cnn-6-6/seq2seq-lm-with-past/decoder_model_merged.onnx b/quantized/sshleifer/distilbart-cnn-6-6/seq2seq-lm-with-past/decoder_model_merged.onnx new file mode 100644 index 0000000000000000000000000000000000000000..dc9dac6c1b24a5a308e15c9832c47fcf0b6cf2cc --- /dev/null +++ b/quantized/sshleifer/distilbart-cnn-6-6/seq2seq-lm-with-past/decoder_model_merged.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a16e203dd8f5e7f5be4c2452110669d94c9f1bcdaff7185b6e3e006d3debf01 +size 206659464 diff --git a/quantized/sshleifer/distilbart-cnn-6-6/seq2seq-lm-with-past/decoder_with_past_model.onnx b/quantized/sshleifer/distilbart-cnn-6-6/seq2seq-lm-with-past/decoder_with_past_model.onnx index b271c8b80fbdc7fdfc59211bdabed86575b8ccb3..23b429657cbb2beff2006e71e6494cd09cd9b7e5 100644 --- a/quantized/sshleifer/distilbart-cnn-6-6/seq2seq-lm-with-past/decoder_with_past_model.onnx +++ b/quantized/sshleifer/distilbart-cnn-6-6/seq2seq-lm-with-past/decoder_with_past_model.onnx @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:42f643dea3105c689323791fd61b6e9f6e284c89c0527881ca8828acd886008d -size 193716879 +oid sha256:687fcc78d2b81908b5dc60089557bd461c492e2e2ffffc982d86a0f90c4545ae +size 193754572 diff --git a/quantized/sshleifer/distilbart-cnn-6-6/seq2seq-lm-with-past/encoder_model.onnx b/quantized/sshleifer/distilbart-cnn-6-6/seq2seq-lm-with-past/encoder_model.onnx index fea4eb0de14ccc36670d7425eb64b519b496130b..fba3891be63a8e2e1c93593eb7fcfbd1fccfb9a3 100644 --- a/quantized/sshleifer/distilbart-cnn-6-6/seq2seq-lm-with-past/encoder_model.onnx +++ b/quantized/sshleifer/distilbart-cnn-6-6/seq2seq-lm-with-past/encoder_model.onnx @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e1768009f547363ff104fcf143c164b0d157379ece68f771238a1ea45026b004 -size 128835266 +oid sha256:8820a208f45059db2cbcd5b7b59ff3829e946789420058244cc8f429ef707fab +size 128853768 diff --git a/quantized/sshleifer/distilbart-cnn-6-6/seq2seq-lm-with-past/tokenizer.json b/quantized/sshleifer/distilbart-cnn-6-6/seq2seq-lm-with-past/tokenizer.json index ae7b71057f722dae9b8574855f92736ad85b509d..b68ec657118ada773a08938cd59ee4f41c1cc629 100644 --- a/quantized/sshleifer/distilbart-cnn-6-6/seq2seq-lm-with-past/tokenizer.json +++ b/quantized/sshleifer/distilbart-cnn-6-6/seq2seq-lm-with-past/tokenizer.json @@ -5,56 +5,55 @@ "added_tokens": [ { "id": 0, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": true, - "special": true + "normalized": true }, { "id": 1, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": true, - "special": true + "normalized": true }, { "id": 2, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": true, - "special": true + "normalized": true }, { "id": 3, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": true, - "special": true + "normalized": true }, { "id": 50264, + "special": true, "content": "", "single_word": false, "lstrip": true, "rstrip": false, - "normalized": true, - "special": true + "normalized": true } ], "normalizer": null, "pre_tokenizer": { "type": "ByteLevel", "add_prefix_space": false, - "trim_offsets": true, - "use_regex": true + "trim_offsets": true }, "post_processor": { "type": "RobertaProcessing", @@ -72,8 +71,7 @@ "decoder": { "type": "ByteLevel", "add_prefix_space": true, - "trim_offsets": true, - "use_regex": true + "trim_offsets": true }, "model": { "type": "BPE", diff --git a/quantized/sshleifer/distilbart-cnn-6-6/seq2seq-lm-with-past/tokenizer_config.json b/quantized/sshleifer/distilbart-cnn-6-6/seq2seq-lm-with-past/tokenizer_config.json index 89133304c7ac83061810a274ab08ebaa45549079..9feb230c732bf9236c347ffcc9a8b9865f94806f 100644 --- a/quantized/sshleifer/distilbart-cnn-6-6/seq2seq-lm-with-past/tokenizer_config.json +++ b/quantized/sshleifer/distilbart-cnn-6-6/seq2seq-lm-with-past/tokenizer_config.json @@ -34,7 +34,7 @@ "single_word": false }, "model_max_length": 1024, - "name_or_path": "./models/pytorch/distilbart-cnn-6-6", + "name_or_path": "sshleifer/distilbart-cnn-6-6", "pad_token": { "__type": "AddedToken", "content": "", diff --git a/quantized/t5-base/seq2seq-lm-with-past/decoder_model.onnx b/quantized/t5-base/seq2seq-lm-with-past/decoder_model.onnx index e9e6b72815697ec4c0509613442aaccde5f1a13f..7380df1e9259f5da83ab752d9c31cd6563b8ad43 100644 --- a/quantized/t5-base/seq2seq-lm-with-past/decoder_model.onnx +++ b/quantized/t5-base/seq2seq-lm-with-past/decoder_model.onnx @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9a780e63db36dc742c4877b443693b08da83a8c9ff37a50992ec8ceac6664511 -size 164125335 +oid sha256:47a0bcce9bde05f2efae9fc160597908351afa9f3435bb3d4fc6898b87fc9cac +size 164212159 diff --git a/quantized/t5-base/seq2seq-lm-with-past/decoder_model_merged.onnx b/quantized/t5-base/seq2seq-lm-with-past/decoder_model_merged.onnx new file mode 100644 index 0000000000000000000000000000000000000000..23db31ad793fca55d80ac4862060ad94b8473ea2 --- /dev/null +++ b/quantized/t5-base/seq2seq-lm-with-past/decoder_model_merged.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d890a977cba9946d83a05b612660935556e1b1acfbe44fee015d8c2798792f9 +size 164407136 diff --git a/quantized/t5-base/seq2seq-lm-with-past/decoder_with_past_model.onnx b/quantized/t5-base/seq2seq-lm-with-past/decoder_with_past_model.onnx index cee06a9cb0860f47c54ea4e3696e76e3e445f1e1..055725b6d657cb87ac81e5479e19ec1f4b282573 100644 --- a/quantized/t5-base/seq2seq-lm-with-past/decoder_with_past_model.onnx +++ b/quantized/t5-base/seq2seq-lm-with-past/decoder_with_past_model.onnx @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2a380c12a7fff3b79bda6ac39f26cf99a76d4e4226c9432d5dd596e06e5623d9 -size 149817760 +oid sha256:2b00687d6bc057e09d7268793ef94febb1ce93326d61daebd0bc46cd83b29af9 +size 149895571 diff --git a/quantized/t5-base/seq2seq-lm-with-past/encoder_model.onnx b/quantized/t5-base/seq2seq-lm-with-past/encoder_model.onnx index b8508b5e3222465c0265bf4f62f4f46c63f9f30e..f6b1cd476e40d0f26222d97d5d7496fe3aee6acb 100644 --- a/quantized/t5-base/seq2seq-lm-with-past/encoder_model.onnx +++ b/quantized/t5-base/seq2seq-lm-with-past/encoder_model.onnx @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:41aa8184e052af3d834afdeba930ce837a8aeaea84af7f86ce288cd884230a4d -size 110425846 +oid sha256:938176467fc4eab1ec72a80b8187321dbffdd53bd2f8fba3231677f31d8440e3 +size 110468491 diff --git a/quantized/t5-small/seq2seq-lm-with-past/config.json b/quantized/t5-small/seq2seq-lm-with-past/config.json index 3eb424fb2cb83f8e9a6dee5241f51ef8b72bf462..ab8e4622c467cba75060c2c0b1c52f666759e225 100644 --- a/quantized/t5-small/seq2seq-lm-with-past/config.json +++ b/quantized/t5-small/seq2seq-lm-with-past/config.json @@ -1,5 +1,5 @@ { - "_name_or_path": "./models/pytorch/t5-small", + "_name_or_path": "t5-small", "architectures": [ "T5ForConditionalGeneration" ], diff --git a/quantized/t5-small/seq2seq-lm-with-past/decoder_model.onnx b/quantized/t5-small/seq2seq-lm-with-past/decoder_model.onnx index a0a1e45e81095305ca3bda43172f0e1f6f6ef699..ebd59b79bf7c05eb38dfe75fd853e2f12a6f39bf 100644 --- a/quantized/t5-small/seq2seq-lm-with-past/decoder_model.onnx +++ b/quantized/t5-small/seq2seq-lm-with-past/decoder_model.onnx @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:eb2e336b767e84ec868601c4ebe04f5815bf60fa3a89b3cf98c43165ec49346b -size 58629284 +oid sha256:81c50ce70014e2629ed5f247876f2a8a02e2ac2c71434c2f49056be050e47f88 +size 58653777 diff --git a/quantized/t5-small/seq2seq-lm-with-past/decoder_model_merged.onnx b/quantized/t5-small/seq2seq-lm-with-past/decoder_model_merged.onnx new file mode 100644 index 0000000000000000000000000000000000000000..5e51812b5a918132fbb961b061880517b5739cdb --- /dev/null +++ b/quantized/t5-small/seq2seq-lm-with-past/decoder_model_merged.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e410c9d18f1213154873f1433380fe9b132766195c6705906c9b961552a8f84a +size 58695469 diff --git a/quantized/t5-small/seq2seq-lm-with-past/decoder_with_past_model.onnx b/quantized/t5-small/seq2seq-lm-with-past/decoder_with_past_model.onnx index 77d1a643dbf523ab8347de2cf461bcee64910270..b9a68b6a1b5fa69d3b4f99ef5442439308e560db 100644 --- a/quantized/t5-small/seq2seq-lm-with-past/decoder_with_past_model.onnx +++ b/quantized/t5-small/seq2seq-lm-with-past/decoder_with_past_model.onnx @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:959f46528a00274ed729ddb946be93a0f452c5fa3f3811f9b3b0df17006e2a69 -size 55441515 +oid sha256:4051a88a8c68714e901e301de5f76fb4d0a16dee060cfff929082a1027a0f6bc +size 55462874 diff --git a/quantized/t5-small/seq2seq-lm-with-past/encoder_model.onnx b/quantized/t5-small/seq2seq-lm-with-past/encoder_model.onnx index 6c8a2a71d72d8b50cf990e4cad571fbf52dacb0e..8a19249affcf7ff49df183c6cea45037d0ff9cdb 100644 --- a/quantized/t5-small/seq2seq-lm-with-past/encoder_model.onnx +++ b/quantized/t5-small/seq2seq-lm-with-past/encoder_model.onnx @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:baa256256227f0d5bcb9bac2660717a51ca61f9b1c40ad9a36934760edf3b43c -size 35575579 +oid sha256:decc4bf2aa8d748ba92dcff463e401074238e0a6dcd5dd114abceecdd5245a53 +size 35587442 diff --git a/quantized/t5-small/seq2seq-lm-with-past/tokenizer.json b/quantized/t5-small/seq2seq-lm-with-past/tokenizer.json index 698d7a6a181bc68bbeb97703edc841c911e39a0c..9e2f3266532d086ffe6332050eb8a7e055e7a9e7 100644 --- a/quantized/t5-small/seq2seq-lm-with-past/tokenizer.json +++ b/quantized/t5-small/seq2seq-lm-with-past/tokenizer.json @@ -5,930 +5,930 @@ "added_tokens": [ { "id": 0, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 1, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 2, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32000, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32001, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32002, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32003, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32004, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32005, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32006, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32007, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32008, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32009, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32010, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32011, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32012, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32013, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32014, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32015, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32016, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32017, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32018, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32019, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32020, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32021, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32022, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32023, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32024, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32025, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32026, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32027, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32028, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32029, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32030, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32031, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32032, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32033, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32034, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32035, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32036, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32037, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32038, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32039, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32040, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32041, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32042, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32043, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32044, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32045, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32046, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32047, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32048, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32049, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32050, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32051, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32052, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32053, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32054, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32055, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32056, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32057, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32058, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32059, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32060, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32061, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32062, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32063, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32064, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32065, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32066, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32067, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32068, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32069, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32070, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32071, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32072, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32073, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32074, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32075, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32076, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32077, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32078, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32079, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32080, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32081, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32082, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32083, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32084, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32085, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32086, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32087, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32088, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32089, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32090, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32091, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32092, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32093, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32094, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32095, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32096, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32097, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32098, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false }, { "id": 32099, + "special": true, "content": "", "single_word": false, "lstrip": false, "rstrip": false, - "normalized": false, - "special": true + "normalized": false } ], "normalizer": { diff --git a/quantized/t5-small/seq2seq-lm-with-past/tokenizer_config.json b/quantized/t5-small/seq2seq-lm-with-past/tokenizer_config.json index 396a6b3e8e612cae7d7e1c8e193528fbb04f34d6..fc9b1b5ec024637d0cdb9f88b3835db43028e5b9 100644 --- a/quantized/t5-small/seq2seq-lm-with-past/tokenizer_config.json +++ b/quantized/t5-small/seq2seq-lm-with-past/tokenizer_config.json @@ -103,8 +103,8 @@ ], "eos_token": "", "extra_ids": 100, - "model_max_length": 1000000000000000019884624838656, - "name_or_path": "./models/pytorch/t5-small", + "model_max_length": 512, + "name_or_path": "t5-small", "pad_token": "", "special_tokens_map_file": null, "tokenizer_class": "T5Tokenizer",