Upload folder using huggingface_hub

Browse files

Files changed (16) hide show

.gitattributes +1 -0
config.json +219 -0
generation_config.json +10 -0
onnx/decoder_model.onnx +3 -0
onnx/decoder_model_merged.onnx +3 -0
onnx/decoder_model_merged_quantized.onnx +3 -0
onnx/decoder_model_quantized.onnx +3 -0
onnx/decoder_with_past_model.onnx +3 -0
onnx/decoder_with_past_model_quantized.onnx +3 -0
onnx/encoder_model.onnx +3 -0
onnx/encoder_model_quantized.onnx +3 -0
quantize_config.json +139 -0
special_tokens_map.json +5 -0
spiece.model +3 -0
tokenizer.json +3 -0
tokenizer_config.json +12 -0

.gitattributes CHANGED Viewed

@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text

 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+tokenizer.json filter=lfs diff=lfs merge=lfs -text

config.json ADDED Viewed

	@@ -0,0 +1,219 @@

+{
+  "_name_or_path": "csebuetnlp/mT5_m2m_crossSum_enhanced",
+  "architectures": [
+    "MT5ForConditionalGeneration"
+  ],
+  "classifier_dropout": 0.0,
+  "d_ff": 2048,
+  "d_kv": 64,
+  "d_model": 768,
+  "decoder_start_token_id": 0,
+  "dense_act_fn": "gelu_new",
+  "dropout_rate": 0.1,
+  "eos_token_id": 1,
+  "feed_forward_proj": "gated-gelu",
+  "initializer_factor": 1.0,
+  "is_encoder_decoder": true,
+  "is_gated_act": true,
+  "layer_norm_epsilon": 1e-06,
+  "length_penalty": 0.6,
+  "max_length": 84,
+  "model_type": "mt5",
+  "num_beams": 4,
+  "num_decoder_layers": 12,
+  "num_heads": 12,
+  "num_layers": 12,
+  "output_past": true,
+  "pad_token_id": 0,
+  "relative_attention_max_distance": 128,
+  "relative_attention_num_buckets": 32,
+  "task_specific_params": {
+    "langid_map": {
+      "amharic": [
+        35,
+        "\u2581<extra_id_64>"
+      ],
+      "arabic": [
+        4,
+        "\u2581<extra_id_95>"
+      ],
+      "azerbaijani": [
+        7,
+        "\u2581<extra_id_92>"
+      ],
+      "bengali": [
+        42,
+        "\u2581<extra_id_57>"
+      ],
+      "burmese": [
+        33,
+        "\u2581<extra_id_66>"
+      ],
+      "chinese_simplified": [
+        40,
+        "\u2581<extra_id_59>"
+      ],
+      "chinese_traditional": [
+        44,
+        "\u2581<extra_id_55>"
+      ],
+      "english": [
+        30,
+        "\u2581<extra_id_69>"
+      ],
+      "french": [
+        10,
+        "\u2581<extra_id_89>"
+      ],
+      "gujarati": [
+        27,
+        "\u2581<extra_id_72>"
+      ],
+      "hausa": [
+        43,
+        "\u2581<extra_id_56>"
+      ],
+      "hindi": [
+        21,
+        "\u2581<extra_id_78>"
+      ],
+      "igbo": [
+        9,
+        "\u2581<extra_id_90>"
+      ],
+      "indonesian": [
+        1,
+        "\u2581<extra_id_98>"
+      ],
+      "japanese": [
+        37,
+        "\u2581<extra_id_62>"
+      ],
+      "kirundi": [
+        0,
+        "\u2581<extra_id_99>"
+      ],
+      "korean": [
+        29,
+        "\u2581<extra_id_70>"
+      ],
+      "kyrgyz": [
+        5,
+        "\u2581<extra_id_94>"
+      ],
+      "marathi": [
+        13,
+        "\u2581<extra_id_86>"
+      ],
+      "nepali": [
+        20,
+        "\u2581<extra_id_79>"
+      ],
+      "oromo": [
+        41,
+        "\u2581<extra_id_58>"
+      ],
+      "pashto": [
+        34,
+        "\u2581<extra_id_65>"
+      ],
+      "persian": [
+        23,
+        "\u2581<extra_id_76>"
+      ],
+      "pidgin": [
+        14,
+        "\u2581<extra_id_85>"
+      ],
+      "portuguese": [
+        39,
+        "\u2581<extra_id_60>"
+      ],
+      "punjabi": [
+        17,
+        "\u2581<extra_id_82>"
+      ],
+      "russian": [
+        36,
+        "\u2581<extra_id_63>"
+      ],
+      "scottish_gaelic": [
+        24,
+        "\u2581<extra_id_75>"
+      ],
+      "serbian_cyrillic": [
+        28,
+        "\u2581<extra_id_71>"
+      ],
+      "serbian_latin": [
+        11,
+        "\u2581<extra_id_88>"
+      ],
+      "sinhala": [
+        31,
+        "\u2581<extra_id_68>"
+      ],
+      "somali": [
+        19,
+        "\u2581<extra_id_80>"
+      ],
+      "spanish": [
+        3,
+        "\u2581<extra_id_96>"
+      ],
+      "swahili": [
+        18,
+        "\u2581<extra_id_81>"
+      ],
+      "tamil": [
+        32,
+        "\u2581<extra_id_67>"
+      ],
+      "telugu": [
+        22,
+        "\u2581<extra_id_77>"
+      ],
+      "thai": [
+        6,
+        "\u2581<extra_id_93>"
+      ],
+      "tigrinya": [
+        16,
+        "\u2581<extra_id_83>"
+      ],
+      "turkish": [
+        15,
+        "\u2581<extra_id_84>"
+      ],
+      "ukrainian": [
+        2,
+        "\u2581<extra_id_97>"
+      ],
+      "urdu": [
+        38,
+        "\u2581<extra_id_61>"
+      ],
+      "uzbek": [
+        8,
+        "\u2581<extra_id_91>"
+      ],
+      "vietnamese": [
+        12,
+        "\u2581<extra_id_87>"
+      ],
+      "welsh": [
+        26,
+        "\u2581<extra_id_73>"
+      ],
+      "yoruba": [
+        25,
+        "\u2581<extra_id_74>"
+      ]
+    }
+  },
+  "tie_word_embeddings": false,
+  "tokenizer_class": "T5Tokenizer",
+  "transformers_version": "4.33.2",
+  "use_cache": true,
+  "vocab_size": 250112
+}

generation_config.json ADDED Viewed

	@@ -0,0 +1,10 @@

+{
+  "_from_model_config": true,
+  "decoder_start_token_id": 0,
+  "eos_token_id": 1,
+  "length_penalty": 0.6,
+  "max_length": 84,
+  "num_beams": 4,
+  "pad_token_id": 0,
+  "transformers_version": "4.33.2"
+}

onnx/decoder_model.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3b98853530f6475374429f0bf29d6c49368e962703970f2fd3a51e063f2bfaa1
+size 1990142662

onnx/decoder_model_merged.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5cc708c6b5878f7a274dbb4feb4a484c796a37bf7deae3defe18e80eeee215dc
+size 1990476587

onnx/decoder_model_merged_quantized.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d320cbcf3840a7629fcf45e0750d0649b451a01345d2131c9cec19608f03eaed
+size 500652977

onnx/decoder_model_quantized.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7ae4401116d2fb14067839fa5e14627945b2df9c3591fbe000ae0aff32c96f39
+size 500076464

onnx/decoder_with_past_model.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8e4908352dcd271c00fae22d03df454b4487fe9791f2391163df07389a2a12d8
+size 1933491010

onnx/decoder_with_past_model_quantized.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:96be0b979b5d41f1079b44af0799c0bb01470d7f5185671555962b83076ba6f1
+size 485767498

onnx/encoder_model.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ce603211c93a2537a605963aa49c926a955315186342b8de00904f5390af792c
+size 1108344239

onnx/encoder_model_quantized.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:989de67618174fbc1c45aaf55d8316f1903a23575e0fdb30dcdb515d81b5ecb8
+size 277914072

quantize_config.json ADDED Viewed

	@@ -0,0 +1,139 @@

+{
+    "per_channel": true,
+    "reduce_range": true,
+    "per_model_config": {
+        "encoder_model": {
+            "op_types": [
+                "Abs",
+                "Range",
+                "ReduceMean",
+                "ConstantOfShape",
+                "Concat",
+                "Sub",
+                "Greater",
+                "Shape",
+                "Tanh",
+                "Cast",
+                "Reshape",
+                "Div",
+                "Pow",
+                "Where",
+                "Min",
+                "Gather",
+                "Constant",
+                "Transpose",
+                "Less",
+                "Log",
+                "Mul",
+                "Sqrt",
+                "MatMul",
+                "Unsqueeze",
+                "Softmax",
+                "Add"
+            ],
+            "weight_type": "QInt8"
+        },
+        "decoder_with_past_model": {
+            "op_types": [
+                "Range",
+                "ReduceMean",
+                "LessOrEqual",
+                "ConstantOfShape",
+                "Concat",
+                "Sub",
+                "Slice",
+                "Shape",
+                "Expand",
+                "Tanh",
+                "Cast",
+                "Reshape",
+                "Div",
+                "Pow",
+                "Where",
+                "Min",
+                "Gather",
+                "Constant",
+                "Tile",
+                "Transpose",
+                "Less",
+                "Log",
+                "Mul",
+                "Sqrt",
+                "MatMul",
+                "Unsqueeze",
+                "Neg",
+                "Softmax",
+                "Add"
+            ],
+            "weight_type": "QInt8"
+        },
+        "decoder_model": {
+            "op_types": [
+                "Range",
+                "ReduceMean",
+                "LessOrEqual",
+                "ConstantOfShape",
+                "Concat",
+                "Sub",
+                "Shape",
+                "Expand",
+                "Tanh",
+                "Cast",
+                "Reshape",
+                "Div",
+                "Pow",
+                "Where",
+                "Min",
+                "Gather",
+                "Constant",
+                "Tile",
+                "Transpose",
+                "Less",
+                "Log",
+                "Mul",
+                "Sqrt",
+                "MatMul",
+                "Unsqueeze",
+                "Neg",
+                "Softmax",
+                "Add"
+            ],
+            "weight_type": "QInt8"
+        },
+        "decoder_model_merged": {
+            "op_types": [
+                "Range",
+                "ReduceMean",
+                "LessOrEqual",
+                "ConstantOfShape",
+                "Concat",
+                "Sub",
+                "Slice",
+                "Shape",
+                "Expand",
+                "Tanh",
+                "If",
+                "Cast",
+                "Reshape",
+                "Pow",
+                "Div",
+                "Where",
+                "Min",
+                "Gather",
+                "Constant",
+                "Tile",
+                "Transpose",
+                "Less",
+                "Log",
+                "Mul",
+                "Sqrt",
+                "MatMul",
+                "Unsqueeze",
+                "Neg",
+                "Softmax",
+                "Add"
+            ],
+            "weight_type": "QInt8"
+        }
+    }
+}

special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,5 @@

+{
+  "eos_token": "</s>",
+  "pad_token": "<pad>",
+  "unk_token": "<unk>"
+}

spiece.model ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ef78f86560d809067d12bac6c09f19a462cb3af3f54d2b8acbba26e1433125d6
+size 4309802

tokenizer.json ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:93c3578052e1605d8332eb961bc08d72e246071974e4cc54aa6991826b802aa5
+size 16330369

tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,12 @@

+{
+  "additional_special_tokens": null,
+  "clean_up_tokenization_spaces": true,
+  "eos_token": "</s>",
+  "extra_ids": 0,
+  "legacy": true,
+  "model_max_length": 1000000000000000019884624838656,
+  "pad_token": "<pad>",
+  "sp_model_kwargs": {},
+  "tokenizer_class": "T5Tokenizer",
+  "unk_token": "<unk>"
+}