LightChen2333
/

gl-gin-slu-mix-snips

Transformers

PyTorch

Model card | Files and versions | Community

LightChen2333 committed on Feb 19, 2023

Commit

8e002f1

1 Parent(s): fa9e36d

Upload 3 files

Browse files

Files changed (1) hide show

config.json +23 -14

config.json CHANGED Viewed

@@ -186,7 +186,7 @@
       "intent_classifier": {
         "_model_target_": "model.decoder.classifier.MLPClassifier",
         "dropout_rate": 0.4,
-        "ignore_index": "{base.ignore_index}",
         "input_dim": 384,
         "intent_label_num": 7,
         "loss_fn": {
@@ -195,7 +195,7 @@
         "mlp": [
           {
             "_model_target_": "torch.nn.Linear",
-            "in_features": "{model.encoder.output_dim}",
             "out_features": 256
           },
           {
@@ -205,14 +205,14 @@
           {
             "_model_target_": "torch.nn.Linear",
             "in_features": 256,
-            "out_features": "{base.intent_label_num}"
           }
         ],
         "mode": "token-level-intent",
         "multi_threshold": 0.5,
         "return_sentence_level": true,
         "use_intent": true,
-        "use_multi": "{base.multi_intent}",
         "weight": 0.2
       },
       "interaction": {
@@ -220,25 +220,26 @@
         "alpha": 0.2,
         "dropout_rate": 0.4,
         "hidden_dim": 256,
-        "input_dim": "{model.encoder.output_dim}",
         "intent_embedding_dim": 256,
-        "intent_label_num": "{base.intent_label_num}",
         "num_heads": 4,
         "num_layers": 2,
-        "output_dim": "{model.decoder.interaction.intent_embedding_dim}",
         "row_normalized": true,
-        "slot_graph_window": 1
       },
       "slot_classifier": {
         "_model_target_": "model.decoder.classifier.MLPClassifier",
         "dropout_rate": 0.4,
-        "ignore_index": "{base.ignore_index}",
         "input_dim": 384,
         "mlp": [
           {
             "_model_target_": "torch.nn.Linear",
-            "in_features": "{model.decoder.interaction.output_dim}",
-            "out_features": "{model.decoder.interaction.output_dim}"
           },
           {
             "_model_target_": "torch.nn.LeakyReLU",
@@ -246,8 +247,8 @@
           },
           {
             "_model_target_": "torch.nn.Linear",
-            "in_features": "{model.decoder.interaction.output_dim}",
-            "out_features": "{base.slot_label_num}"
           }
         ],
         "mode": "slot",
@@ -268,7 +269,8 @@
       },
       "embedding": {
         "dropout_rate": 0.4,
-        "embedding_dim": 128
       },
       "encoder_name": "self-attention-lstm",
       "lstm": {
@@ -283,6 +285,13 @@
     }
   },
   "return_dict": false,
   "tokenizer_class": "OpenSLUv1",
   "torch_dtype": "float32",
   "transformers_version": "4.25.1",

       "intent_classifier": {
         "_model_target_": "model.decoder.classifier.MLPClassifier",
         "dropout_rate": 0.4,
+        "ignore_index": -100,
         "input_dim": 384,
         "intent_label_num": 7,
         "loss_fn": {
         "mlp": [
           {
             "_model_target_": "torch.nn.Linear",
+            "in_features": 384,
             "out_features": 256
           },
           {
           {
             "_model_target_": "torch.nn.Linear",
             "in_features": 256,
+            "out_features": 7
           }
         ],
         "mode": "token-level-intent",
         "multi_threshold": 0.5,
         "return_sentence_level": true,
         "use_intent": true,
+        "use_multi": true,
         "weight": 0.2
       },
       "interaction": {
         "alpha": 0.2,
         "dropout_rate": 0.4,
         "hidden_dim": 256,
+        "input_dim": 384,
         "intent_embedding_dim": 256,
+        "intent_label_num": 7,
         "num_heads": 4,
         "num_layers": 2,
+        "output_dim": 256,
         "row_normalized": true,
+        "slot_graph_window": 1,
+        "slot_label_num": 72
       },
       "slot_classifier": {
         "_model_target_": "model.decoder.classifier.MLPClassifier",
         "dropout_rate": 0.4,
+        "ignore_index": -100,
         "input_dim": 384,
         "mlp": [
           {
             "_model_target_": "torch.nn.Linear",
+            "in_features": 256,
+            "out_features": 256
           },
           {
             "_model_target_": "torch.nn.LeakyReLU",
           },
           {
             "_model_target_": "torch.nn.Linear",
+            "in_features": 256,
+            "out_features": 72
           }
         ],
         "mode": "slot",
       },
       "embedding": {
         "dropout_rate": 0.4,
+        "embedding_dim": 128,
+        "vocab_size": 11758
       },
       "encoder_name": "self-attention-lstm",
       "lstm": {
     }
   },
   "return_dict": false,
+  "tokenizer": {
+    "_align_mode_": "fast",
+    "_padding_side_": "right",
+    "_tokenizer_name_": "word_tokenizer",
+    "add_special_tokens": false,
+    "max_length": 512
+  },
   "tokenizer_class": "OpenSLUv1",
   "torch_dtype": "float32",
   "transformers_version": "4.25.1",