{
  "model": "Qwen/Qwen3-4B",
  "dataset": "microsoft/rStar-Coder (synthetic_sft)",
  "samples": 10000,
  "epochs": 1,
  "lora_rank": 32,
  "lora_alpha": 64,
  "batch_size": 2,
  "gradient_accumulation": 8,
  "learning_rate": 0.0002,
  "max_seq_length": 4096,
  "results": {
    "humaneval_base": 68.9,
    "humaneval_plus": 64.0,
    "mbpp_base": 58.2,
    "mbpp_plus": 50.8
  }
}