File size: 645 Bytes
# test_phase2.td — Testing all Phase 2 commands
# Pipeline overview: this script runs each command once, in order, against a
# single model handle named `base`: load, diagnose, synth, train, debate,
# eval, commit. Files written by one step may be read by a later one, so the
# order of the commands matters.

# load <model-id> as base — binds the model identified by the quoted string to
# the name `base`; every command below refers to the model through that name.
# NOTE(review): the string looks like a hub-style "org/model" identifier —
# confirm where the runtime resolves it from.
load "Qwen/Qwen3-VL-8B-Instruct" as base
# diagnose base -> weaknesses.json — asks the model what it's bad at; the
# result goes to weaknesses.json.
# NOTE(review): no later command in this script reads weaknesses.json.
diagnose base -> weaknesses.json
# synth base from web_curated filter cherry_llm -> data.jsonl — generates
# training data from the `web_curated` source, filtered with `cherry_llm`, and
# writes it to data.jsonl (the file the train step below consumes).
synth base from web_curated filter cherry_llm -> data.jsonl
# train base on "data.jsonl" using grpo steps 64 — GRPO training for 64 steps
# on the data.jsonl produced by the synth step above.
# NOTE(review): the path is quoted here but unquoted after `->` above;
# presumably both forms name the same file — confirm against the grammar.
train base on "data.jsonl" using grpo steps 64
# debate base rounds 3 candidates 8 -> pairs.jsonl — persona debate for
# preference pairs, with 3 rounds and 8 candidates, written to pairs.jsonl.
# NOTE(review): pairs.jsonl is not consumed by any later command in this
# script; it appears to be exercised here only as a command test.
debate base rounds 3 candidates 8 -> pairs.jsonl
# eval base -> final_eval.json — NOTE(review): presumably evaluates `base`
# after the steps above and writes the results to final_eval.json; the
# metrics/benchmarks used are not visible here — confirm.
eval base -> final_eval.json
# commit base — NOTE(review): effect not shown in this script; presumably
# persists the current state of `base` — confirm what is saved and where.
commit base
|