Kenny Wang committed on
Commit
219170b
·
1 Parent(s): be5a3a5

Add v7 (best-of-N, 13/14 strong) as default model

Browse files
Files changed (2) hide show
  1. .claude/unitares-session.json +6 -0
  2. app.py +7 -3
.claude/unitares-session.json ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ {
2
+ "server_url": "http://localhost:8767",
3
+ "agent_name": "claude_dialectic-reasoning-space_20260403",
4
+ "agent_id": "Claude_Code_20260403",
5
+ "client_session_id": "agent-a2c5b67e-59c"
6
+ }
app.py CHANGED
@@ -7,7 +7,11 @@ from transformers import AutoModelForCausalLM, AutoTokenizer
7
  from peft import PeftModel
8
 
9
  MODELS = {
10
- "Qwen3-4B v6 (falsifiable, best)": {
 
 
 
 
11
  "base": "Qwen/Qwen3-4B",
12
  "adapter": "hikewa/dialectic-qwen3-4b-v6-lora",
13
  },
@@ -118,14 +122,14 @@ demo = gr.ChatInterface(
118
  additional_inputs=[
119
  gr.Dropdown(
120
  choices=list(MODELS.keys()),
121
- value="Qwen3-4B v6 (falsifiable, best)",
122
  label="Model",
123
  ),
124
  ],
125
  title="Dialectic Reasoning Models",
126
  description=(
127
  "Fine-tuned on dialectic reasoning traces with falsifiability-based quality filtering. "
128
- "v6 (89 traces, 100% falsifiable) scores 8.4 on Mistral-strict rubric up from v3's 6.8. "
129
  "Pick a model and ask a question involving competing perspectives."
130
  ),
131
  examples=[
 
7
  from peft import PeftModel
8
 
9
  MODELS = {
10
+ "Qwen3-4B v7 (best-of-N, latest)": {
11
+ "base": "Qwen/Qwen3-4B",
12
+ "adapter": "hikewa/dialectic-qwen3-4b-v7-lora",
13
+ },
14
+ "Qwen3-4B v6 (falsifiable)": {
15
  "base": "Qwen/Qwen3-4B",
16
  "adapter": "hikewa/dialectic-qwen3-4b-v6-lora",
17
  },
 
122
  additional_inputs=[
123
  gr.Dropdown(
124
  choices=list(MODELS.keys()),
125
+ value="Qwen3-4B v7 (best-of-N, latest)",
126
  label="Model",
127
  ),
128
  ],
129
  title="Dialectic Reasoning Models",
130
  description=(
131
  "Fine-tuned on dialectic reasoning traces with falsifiability-based quality filtering. "
132
+ "v7 (113 best-of-N traces from 6 providers) scores 8.3 Mistral-strict with 13/14 strong verdicts. "
133
  "Pick a model and ask a question involving competing perspectives."
134
  ),
135
  examples=[