JakeOh
/

LLaDA-70M-Base

Feature Extraction

Model card Files Files and versions

JakeOh committed on Oct 27, 2025

Commit

2d6e01c

·

verified ·

1 Parent(s): 003aa2e

Upload config

Files changed (1) hide show

config.json +4 -4

config.json CHANGED Viewed

@@ -10,8 +10,8 @@
   "attention_layer_norm_with_affine": true,
   "auto_map": {
     "AutoConfig": "configuration_llada.LLaDAConfig",
-    "AutoModel": "GSAI-ML/LLaDA-8B-Base--modeling_llada.LLaDAModelLM",
-    "AutoModelForCausalLM": "GSAI-ML/LLaDA-8B-Base--modeling_llada.LLaDAModelLM"
   },
   "bias_for_layer_norm": false,
   "block_group_size": 1,
@@ -19,7 +19,7 @@
   "d_model": 768,
   "dtype": "float32",
   "embedding_dropout": 0.0,
-  "embedding_size": 10,
   "eos_token_id": 9,
   "flash_attention": false,
   "include_bias": false,
@@ -50,6 +50,6 @@
   "scale_logits": false,
   "transformers_version": "4.57.1",
   "use_cache": false,
-  "vocab_size": 10,
   "weight_tying": false
 }

   "attention_layer_norm_with_affine": true,
   "auto_map": {
     "AutoConfig": "configuration_llada.LLaDAConfig",
+    "AutoModel": "modeling_llada.LLaDAModelLM",
+    "AutoModelForCausalLM": "modeling_llada.LLaDAModelLM"
   },
   "bias_for_layer_norm": false,
   "block_group_size": 1,
   "d_model": 768,
   "dtype": "float32",
   "embedding_dropout": 0.0,
+  "embedding_size": 50259,
   "eos_token_id": 9,
   "flash_attention": false,
   "include_bias": false,
   "scale_logits": false,
   "transformers_version": "4.57.1",
   "use_cache": false,
+  "vocab_size": 50259,
   "weight_tying": false
 }