RON-110M / config.json
endurasolution's picture
Upload Ron-110M: pretrain + summarizer + tokenizer + code
3b97420 verified
{
  "vocab_size": 32000,
  "block_size": 512,
  "n_layer": 12,
  "n_head": 12,
  "n_embd": 768,
  "dropout": 0.0,
  "bias": false,
  "gradient_checkpointing": false,
  "model_type": "ron-gpt",
  "architectures": [
    "GPT"
  ],
  "torch_dtype": "float32"
}