user-anto's picture
Upload Axiom-Dense-380M-Instruct changes.
965057d verified
raw
history blame contribute delete
558 Bytes
{
"architectures": [
"axiomForCausalLM"
],
"model_type": "axiom",
"auto_map": {
"AutoConfig": "configuration_axiom.axiomConfig",
"AutoModelForCausalLM": "modeling_axiom.axiomForCausalLM",
"AutoTokenizer": "tokenization_axiom.axiomTokenizer"
},
"vocab_size": 100277,
"dim": 1024,
"n_layers": 24,
"n_heads": 16,
"n_kv_heads": 8,
"ffn_dim_multiplier": 2.6667,
"max_seq_len": 1024,
"rope_theta": 10000.0,
"norm_eps": 1e-05,
"dropout": 0.0,
"bos_token_id": null,
"eos_token_id": 100257,
"pad_token_id": 100257
}