tiny-edu-166m / config.json
SlitherCode's picture
Upload ParchmentForCausalLM
cc971b0 verified
raw
history blame
436 Bytes
{
  "architectures": [
    "ParchmentForCausalLM"
  ],
  "bos_token_id": 100257,
  "d_ff": 3072,
  "d_model": 768,
  "dtype": "float32",
  "eos_token_id": 100257,
  "max_seq_len": 1024,
  "model_type": "parchment",
  "n_heads": 12,
  "n_layers": 12,
  "pad_token_id": 100257,
  "rms_norm_eps": 1e-06,
  "rope_base": 10000.0,
  "tie_word_embeddings": true,
  "transformers_version": "5.8.1",
  "vocab_size": 100277
}