3v324v23 committed on
Commit 68eff11 · 1 Parent(s): 8e64bfa

update config

Files changed (1)
  1. config.json +25 -20
config.json CHANGED
@@ -4,25 +4,30 @@
     "DeBERTa"
   ],
   "auto_map": {
-    "AutoConfig": "modeling.config.ModelConfig",
-    "AutoModel": "modeling_chatglm.ChatGLMForConditionalGeneration",
-    "AutoModelForSeq2SeqLM": "modeling_chatglm.ChatGLMForConditionalGeneration"
+    "AutoConfig": "modeling.config.DebertaConfig",
+    "AutoModel": "modeling.deberta.DeBERTa"
   },
-  "bos_token_id": 130004,
-  "eos_token_id": 130005,
-  "mask_token_id": 130000,
-  "gmask_token_id": 130001,
-  "pad_token_id": 3,
-  "hidden_size": 4096,
-  "inner_hidden_size": 16384,
-  "layernorm_epsilon": 1e-05,
-  "max_sequence_length": 2048,
-  "model_type": "chatglm",
-  "num_attention_heads": 32,
-  "num_layers": 28,
-  "position_encoding_2d": true,
-  "torch_dtype": "float16",
-  "transformers_version": "4.23.1",
-  "use_cache": true,
-  "vocab_size": 130528
+  "attention_head_size": 64,
+  "attention_probs_dropout_prob": 0.1,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "layer_norm_eps": 1e-07,
+  "max_position_embeddings": 512,
+  "max_relative_positions": -1,
+  "norm_rel_ebd": "layer_norm",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "padding_idx": 0,
+  "pos_att_type": "p2c|c2p",
+  "position_biased_input": false,
+  "position_buckets": 128,
+  "relative_attention": true,
+  "share_att_key": true,
+  "type_vocab_size": 0,
+  "vocab_size": 22669,
+  "tokenizer_class": "BertTokenizer",
+  "model_type": "deberta-v2"
   }
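
Because the updated "auto_map" points AutoConfig and AutoModel at custom classes shipped inside the repository (modeling.config.DebertaConfig and modeling.deberta.DeBERTa), loading this checkpoint through transformers requires trust_remote_code=True so that the repo's own code is imported. Below is a minimal sketch of such a load; the repository id "user/repo" is a placeholder, not the actual Hub path of this model.

# Minimal usage sketch (assumption: "user/repo" stands in for this repository's Hub id)
from transformers import AutoConfig, AutoModel

# trust_remote_code=True lets transformers resolve the classes named in "auto_map"
config = AutoConfig.from_pretrained("user/repo", trust_remote_code=True)
print(config.model_type)         # "deberta-v2"
print(config.hidden_size)        # 768
print(config.num_hidden_layers)  # 12

model = AutoModel.from_pretrained("user/repo", trust_remote_code=True)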