{
  "model_style": "enc",
  "task": "mathqa",
  "trajectory_path": "data/discriminator_data/sampled_trajectories/mathqa/flan-t5-large_100K/trajectories_seed55.jsonl",
  "validation_split_percentage": 5,
  "max_len": 512,
  "n_examples": null,
  "dev_is_train": false,
  "invalid_prefix_prob": 0.0,
  "max_alignment_cost": 2.0,
  "step_aligner_model": "roscoe",
  "step_delimiter": null,
  "break_after_extra_step": false,
  "use_correct_samples": false
}