{ "exact_match": 0.0, "bleu_4": 0.0, "mean_edit_similarity": 0.04701831394975743, "num_samples": 200, "syntax_valid_rate": 0.225, "run_name": "baseline" }