{ "total_examples": 1361, "train_size": 1224, "val_size": 137, "grpo_prompts": 1000 }