arianna.c / weights /d20 /meta_000811.json
ataeff's picture
Rename weights/meta_000811.json to weights/d20/meta_000811.json
168b0fe verified
{
"step": 811,
"val_loss": 0.9093124270439148,
"mmlu_acc": 0.349609375,
"arc_easy_acc": 0.5048828125,
"model_config": {
"sequence_len": 2048,
"vocab_size": 32768,
"n_layer": 20,
"n_head": 10,
"n_kv_head": 10,
"n_embd": 1280,
"window_pattern": "L"
}
}