{ "model": "Qwen/Qwen2.5-0.5B-Instruct", "num_episodes": 100, "start_avg_ep1_10": 0.309, "end_avg_ep91_100": 0.5962, "improvement": 0.2872, "eval_scores": { "task_1_basic_antipatterns": 0.75, "task_2_correlated_subqueries": 0.8313, "task_3_wildcard_scan": 0.925, "task_4_implicit_join": 0.6438, "task_5_window_functions": 0.625 }, "average_eval_score": 0.755, "vs_baseline": 0.125 }