OdinNext-138M-Instruct / config.json
joelhenwang's picture
OdinNext-138M-Instruct: SFT + LFM2.5 SeqKD
8d6741e verified
{
"model_type": "odinnext",
"architectures": [
"OdinNextForCausalLM"
],
"auto_map": {
"AutoConfig": "configuration_odinnext.OdinNextConfig",
"AutoModelForCausalLM": "modeling_odinnext.OdinNextForCausalLM"
},
"vocab_size": 32770,
"d_model": 768,
"n_layers": 16,
"n_heads": 6,
"ffn_inner": 2048,
"max_seq_len": 2048,
"rope_theta": 100000.0,
"tie_embeddings": true,
"tie_word_embeddings": true,
"use_cache": true,
"torch_dtype": "float16",
"bos_token_id": null,
"eos_token_id": 32769,
"pad_token_id": 32769,
"hidden_size": 768,
"num_hidden_layers": 16,
"num_attention_heads": 6,
"intermediate_size": 2048,
"max_position_embeddings": 2048,
"_total_tokens": 5243928576,
"_weights_source": "seqkd-v2 (SFT + LFM2.5 SeqKD)"
}