{
  "vocab_size": 5120,
  "d_model": 640,
  "n_layers": 8,
  "n_heads": 10,
  "ffn_hidden": 1280,
  "max_seq_len": 96,
  "rope_theta": 10000.0,
  "dropout": 0.1,
  "tie_embeddings": true,
  "rms_norm_eps": 1e-05,
  "model_type": "glublm",
  "architectures": [
    "GlubLM"
  ]
}
{
  "vocab_size": 5120,
  "d_model": 640,
  "n_layers": 8,
  "n_heads": 10,
  "ffn_hidden": 1280,
  "max_seq_len": 96,
  "rope_theta": 10000.0,
  "dropout": 0.1,
  "tie_embeddings": true,
  "rms_norm_eps": 1e-05,
  "model_type": "glublm",
  "architectures": [
    "GlubLM"
  ]
}