| { | |
| "step": 650, | |
| "val_loss": 1.0744796991348267, | |
| "mmlu_acc": 0.2431640625, | |
| "arc_easy_acc": 0.25, | |
| "gsm8k_acc": 0.03125, | |
| "humaneval_acc": 0.046875, | |
| "model_config": { | |
| "sequence_len": 2048, | |
| "vocab_size": 65536, | |
| "n_layer": 20, | |
| "n_head": 10, | |
| "n_kv_head": 10, | |
| "n_embd": 1280 | |
| } | |
| } |