LightChen2333
/

agif-slu-mix-atis

Transformers

PyTorch

Inference Endpoints

Model card | Files and versions | Community

LightChen2333 committed on Feb 19, 2023

Commit

68f7230

•

1 Parent(s): 905f31e

Upload 3 files

Browse files

Files changed (1) hide show

config.json +19 -9

config.json CHANGED Viewed

@@ -292,7 +292,7 @@
         "mlp": [
           {
             "_model_target_": "torch.nn.Linear",
-            "in_features": "{model.encoder.output_dim}",
             "out_features": 256
           },
           {
@@ -302,14 +302,14 @@
           {
             "_model_target_": "torch.nn.Linear",
             "in_features": 256,
-            "out_features": "{base.intent_label_num}"
           }
         ],
         "mode": "intent",
         "multi_threshold": 0.5,
         "return_sentence_level": true,
         "use_intent": true,
-        "use_multi": "{base.multi_intent}",
         "weight": 0.3
       },
       "interaction": {
@@ -317,12 +317,14 @@
         "alpha": 0.2,
         "dropout_rate": 0.4,
         "hidden_dim": 128,
-        "input_dim": "{model.encoder.output_dim}",
         "intent_embedding_dim": 128,
         "num_heads": 4,
         "num_layers": 2,
-        "output_dim": "{model.decoder.interaction.intent_embedding_dim}",
-        "row_normalized": true
       },
       "slot_classifier": {
         "_model_target_": "model.decoder.classifier.AutoregressiveLSTMClassifier",
@@ -330,9 +332,9 @@
         "dropout_rate": 0.4,
         "embedding_dim": 128,
         "force_ratio": 0.9,
-        "hidden_dim": "{model.decoder.interaction.intent_embedding_dim}",
         "ignore_index": -100,
-        "input_dim": "{model.encoder.output_dim}",
         "layer_num": 1,
         "mode": "slot",
         "multi_threshold": 0.5,
@@ -352,7 +354,8 @@
       },
       "embedding": {
         "dropout_rate": 0.4,
-        "embedding_dim": 128
       },
       "encoder_name": "self-attention-lstm",
       "lstm": {
@@ -370,6 +373,13 @@
     }
   },
   "return_dict": false,
   "tokenizer_class": "OpenSLUv1",
   "torch_dtype": "float32",
   "transformers_version": "4.25.1",

         "mlp": [
           {
             "_model_target_": "torch.nn.Linear",
+            "in_features": 384,
             "out_features": 256
           },
           {
           {
             "_model_target_": "torch.nn.Linear",
             "in_features": 256,
+            "out_features": 17
           }
         ],
         "mode": "intent",
         "multi_threshold": 0.5,
         "return_sentence_level": true,
         "use_intent": true,
+        "use_multi": true,
         "weight": 0.3
       },
       "interaction": {
         "alpha": 0.2,
         "dropout_rate": 0.4,
         "hidden_dim": 128,
+        "input_dim": 384,
         "intent_embedding_dim": 128,
+        "intent_label_num": 17,
         "num_heads": 4,
         "num_layers": 2,
+        "output_dim": 128,
+        "row_normalized": true,
+        "slot_label_num": 111
       },
       "slot_classifier": {
         "_model_target_": "model.decoder.classifier.AutoregressiveLSTMClassifier",
         "dropout_rate": 0.4,
         "embedding_dim": 128,
         "force_ratio": 0.9,
+        "hidden_dim": 128,
         "ignore_index": -100,
+        "input_dim": 384,
         "layer_num": 1,
         "mode": "slot",
         "multi_threshold": 0.5,
       },
       "embedding": {
         "dropout_rate": 0.4,
+        "embedding_dim": 128,
+        "vocab_size": 790
       },
       "encoder_name": "self-attention-lstm",
       "lstm": {
     }
   },
   "return_dict": false,
+  "tokenizer": {
+    "_align_mode_": "fast",
+    "_padding_side_": "right",
+    "_tokenizer_name_": "word_tokenizer",
+    "add_special_tokens": false,
+    "max_length": 512
+  },
   "tokenizer_class": "OpenSLUv1",
   "torch_dtype": "float32",
   "transformers_version": "4.25.1",