File size: 645 Bytes
5d61448
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
# test_phase2.td — Testing all Phase 2 commands
#
# Runs each Phase 2 command once, in order, against a single model alias:
#   load -> diagnose -> synth -> train -> debate -> eval -> commit
# Every command below refers to the model through the alias `base`.
# In the commands that use it, `->` is followed by an output file name.

# Load the model identified by "Qwen/Qwen3-VL-8B-Instruct" and bind it to the alias `base`.
load "Qwen/Qwen3-VL-8B-Instruct" as base

# diagnose: asks the model what it's bad at; output goes to weaknesses.json.
# NOTE(review): no later command in this script names weaknesses.json explicitly.
diagnose base -> weaknesses.json

# synth: generates training data into data.jsonl, using source `web_curated`
# and filter `cherry_llm`.
# NOTE(review): what `web_curated` and `cherry_llm` resolve to is not visible here — confirm.
synth base from web_curated filter cherry_llm -> data.jsonl

# train: GRPO training for 64 steps on "data.jsonl" (the file named as the synth output above).
# NOTE(review): the path is quoted here but unquoted in the synth step; presumably both
# forms name the same file — confirm against the parser.
train base on "data.jsonl" using grpo steps 64

# debate: persona debate for preference pairs, 3 rounds with 8 candidates;
# output goes to pairs.jsonl.
# NOTE(review): pairs.jsonl is not referenced by any later command in this script.
debate base rounds 3 candidates 8 -> pairs.jsonl

# eval: presumably evaluates `base` and writes the results to final_eval.json — TODO confirm.
eval base -> final_eval.json
# commit: presumably persists the current state of `base`; exact semantics are not
# visible in this file — TODO confirm.
commit base