Spaces:
Running
Running
| set -euo pipefail | |
| EPISODES="${EPISODES:-30}" | |
| REPLAY="${REPLAY:-outputs/trained_policy_replay.jsonl}" | |
| python training/evaluate.py \ | |
| --episodes "${EPISODES}" \ | |
| --task all \ | |
| --policies random,heuristic,oracle_lite,trained \ | |
| --replay "${REPLAY}" \ | |
| --out outputs/eval_post.json \ | |
| --plot outputs/charts/baseline_grouped_bars.png | |
| python -m training.plots \ | |
| --pre outputs/eval_pre.json \ | |
| --post outputs/eval_post.json \ | |
| --trainer-state training/sentinel_qwen15_grpo/trainer_state.json \ | |
| --reward-report-task3 outputs/reward_report_task3_seed42.json \ | |
| --cluster-health outputs/cluster_health_history.json \ | |
| --out-dir outputs/charts | |