LightChen2333
/

gl-gin-slu-mix-atis

Transformers

PyTorch

Model card · Files and versions

xet

Community

LightChen2333 committed on Feb 19, 2023

Commit

aded56d

1 Parent(s): 971e88a

Upload 3 files

Browse files

Files changed (1) hide show

config.json +23 -14

config.json CHANGED Viewed

@@ -284,7 +284,7 @@
       "intent_classifier": {
         "_model_target_": "model.decoder.classifier.MLPClassifier",
         "dropout_rate": 0.4,
-        "ignore_index": "{base.ignore_index}",
         "input_dim": 384,
         "intent_label_num": 17,
         "loss_fn": {
@@ -293,7 +293,7 @@
         "mlp": [
           {
             "_model_target_": "torch.nn.Linear",
-            "in_features": "{model.encoder.output_dim}",
             "out_features": 256
           },
           {
@@ -303,39 +303,40 @@
           {
             "_model_target_": "torch.nn.Linear",
             "in_features": 256,
-            "out_features": "{base.intent_label_num}"
           }
         ],
         "mode": "token-level-intent",
         "multi_threshold": 0.5,
         "return_sentence_level": true,
         "use_intent": true,
-        "use_multi": "{base.multi_intent}"
       },
       "interaction": {
         "_model_target_": "model.decoder.interaction.GLGINInteraction",
         "alpha": 0.2,
         "dropout_rate": 0.4,
         "hidden_dim": 256,
-        "input_dim": "{model.encoder.output_dim}",
         "intent_embedding_dim": 64,
-        "intent_label_num": "{base.intent_label_num}",
         "num_heads": 8,
         "num_layers": 2,
-        "output_dim": "{model.decoder.interaction.intent_embedding_dim}",
         "row_normalized": true,
-        "slot_graph_window": 1
       },
       "slot_classifier": {
         "_model_target_": "model.decoder.classifier.MLPClassifier",
         "dropout_rate": 0.4,
-        "ignore_index": "{base.ignore_index}",
         "input_dim": 384,
         "mlp": [
           {
             "_model_target_": "torch.nn.Linear",
-            "in_features": "{model.decoder.interaction.output_dim}",
-            "out_features": "{model.decoder.interaction.output_dim}"
           },
           {
             "_model_target_": "torch.nn.LeakyReLU",
@@ -343,8 +344,8 @@
           },
           {
             "_model_target_": "torch.nn.Linear",
-            "in_features": "{model.decoder.interaction.output_dim}",
-            "out_features": "{base.slot_label_num}"
           }
         ],
         "mode": "slot",
@@ -364,7 +365,8 @@
       },
       "embedding": {
         "dropout_rate": 0.4,
-        "embedding_dim": 128
       },
       "encoder_name": "self-attention-lstm",
       "lstm": {
@@ -379,6 +381,13 @@
     }
   },
   "return_dict": false,
   "tokenizer_class": "OpenSLUv1",
   "torch_dtype": "float32",
   "transformers_version": "4.25.1",

       "intent_classifier": {
         "_model_target_": "model.decoder.classifier.MLPClassifier",
         "dropout_rate": 0.4,
+        "ignore_index": -100,
         "input_dim": 384,
         "intent_label_num": 17,
         "loss_fn": {
         "mlp": [
           {
             "_model_target_": "torch.nn.Linear",
+            "in_features": 384,
             "out_features": 256
           },
           {
           {
             "_model_target_": "torch.nn.Linear",
             "in_features": 256,
+            "out_features": 17
           }
         ],
         "mode": "token-level-intent",
         "multi_threshold": 0.5,
         "return_sentence_level": true,
         "use_intent": true,
+        "use_multi": true
       },
       "interaction": {
         "_model_target_": "model.decoder.interaction.GLGINInteraction",
         "alpha": 0.2,
         "dropout_rate": 0.4,
         "hidden_dim": 256,
+        "input_dim": 384,
         "intent_embedding_dim": 64,
+        "intent_label_num": 17,
         "num_heads": 8,
         "num_layers": 2,
+        "output_dim": 64,
         "row_normalized": true,
+        "slot_graph_window": 1,
+        "slot_label_num": 111
       },
       "slot_classifier": {
         "_model_target_": "model.decoder.classifier.MLPClassifier",
         "dropout_rate": 0.4,
+        "ignore_index": -100,
         "input_dim": 384,
         "mlp": [
           {
             "_model_target_": "torch.nn.Linear",
+            "in_features": 64,
+            "out_features": 64
           },
           {
             "_model_target_": "torch.nn.LeakyReLU",
           },
           {
             "_model_target_": "torch.nn.Linear",
+            "in_features": 64,
+            "out_features": 111
           }
         ],
         "mode": "slot",
       },
       "embedding": {
         "dropout_rate": 0.4,
+        "embedding_dim": 128,
+        "vocab_size": 790
       },
       "encoder_name": "self-attention-lstm",
       "lstm": {
     }
   },
   "return_dict": false,
+  "tokenizer": {
+    "_align_mode_": "fast",
+    "_padding_side_": "right",
+    "_tokenizer_name_": "word_tokenizer",
+    "add_special_tokens": false,
+    "max_length": 512
+  },
   "tokenizer_class": "OpenSLUv1",
   "torch_dtype": "float32",
   "transformers_version": "4.25.1",