{ "step": 650, "val_loss": 1.0744796991348267, "mmlu_acc": 0.2431640625, "arc_easy_acc": 0.25, "gsm8k_acc": 0.03125, "humaneval_acc": 0.046875, "model_config": { "sequence_len": 2048, "vocab_size": 65536, "n_layer": 20, "n_head": 10, "n_kv_head": 10, "n_embd": 1280 } }