tvastr committed on
Commit
f2cc715
·
verified ·
1 Parent(s): aa75f6f

replace stale pearl_meta config with proper architecture config

Browse files
Files changed (1) hide show
  1. config.json +12 -13
config.json CHANGED
@@ -1,15 +1,14 @@
1
  {
2
- "nacre_tip": "8586164c7d4b4a88e325b9986570f0bf296880586df545c8c445092b5008014a",
3
- "step": 1397,
4
- "hash": "8586164c7d4b4a88e325b9986570f0bf296880586df545c8c445092b5008014a",
5
- "weights_file": "/data/rabbit/scholar-efs/pearl/weights_step1397.pt",
6
- "checkpoint_digest": "a260f132fb7c74b059178d273c14a2e7258e6c100c5a2f8b57026a39643a068e",
7
- "checkpoint_layout": "full",
8
- "base_weights_file": "/data/rabbit/scholar-efs/pearl/weights_step0.pt",
9
- "surface_file": "",
10
- "tokenizer_id": "EleutherAI/gpt-neox-20b",
11
- "tokenizer_hash": "",
12
- "schema_version": "2.0",
13
- "gurukul_version": "phase2_hardened",
14
- "stage_id": "stage00_sanskrit"
15
  }
 
1
  {
2
+ "model_type": "rta-ssm",
3
+ "architecture": "RabbitCausalLM",
4
+ "variant": "fu-64",
5
+ "vocab_size": 50280,
6
+ "d_model": 2560,
7
+ "d_state": 2560,
8
+ "n_layers": 64,
9
+ "tokenizer_class": "GPTNeoXTokenizerFast",
10
+ "tokenizer_id": "EleutherAI/gpt-neox-20b",
11
+ "torch_dtype": "bfloat16",
12
+ "framework": "RtaForge-SSM",
13
+ "schema_version": "1.0"
 
14
  }