Kenny Wang committed on
Commit
be5a3a5
·
1 Parent(s): 36aab10

Add v6 (falsifiable, best) as default model

Browse files
Files changed (1) hide show
  1. app.py +8 -4
app.py CHANGED
@@ -7,7 +7,11 @@ from transformers import AutoModelForCausalLM, AutoTokenizer
7
  from peft import PeftModel
8
 
9
  MODELS = {
10
- "Qwen3-4B v3 (best)": {
 
 
 
 
11
  "base": "Qwen/Qwen3-4B",
12
  "adapter": "hikewa/dialectic-qwen3-4b-v3-lora",
13
  },
@@ -114,14 +118,14 @@ demo = gr.ChatInterface(
114
  additional_inputs=[
115
  gr.Dropdown(
116
  choices=list(MODELS.keys()),
117
- value="Qwen3-4B v3 (best)",
118
  label="Model",
119
  ),
120
  ],
121
  title="Dialectic Reasoning Models",
122
  description=(
123
- "Fine-tuned on dialectic reasoning traces. "
124
- "The v3 4B model (507 traces, multi-model data) scores 6.0–6.8 on a strict dual-judge rubric. "
125
  "Pick a model and ask a question involving competing perspectives."
126
  ),
127
  examples=[
 
7
  from peft import PeftModel
8
 
9
  MODELS = {
10
+ "Qwen3-4B v6 (falsifiable, best)": {
11
+ "base": "Qwen/Qwen3-4B",
12
+ "adapter": "hikewa/dialectic-qwen3-4b-v6-lora",
13
+ },
14
+ "Qwen3-4B v3": {
15
  "base": "Qwen/Qwen3-4B",
16
  "adapter": "hikewa/dialectic-qwen3-4b-v3-lora",
17
  },
 
118
  additional_inputs=[
119
  gr.Dropdown(
120
  choices=list(MODELS.keys()),
121
+ value="Qwen3-4B v6 (falsifiable, best)",
122
  label="Model",
123
  ),
124
  ],
125
  title="Dialectic Reasoning Models",
126
  description=(
127
+ "Fine-tuned on dialectic reasoning traces with falsifiability-based quality filtering. "
128
+ "v6 (89 traces, 100% falsifiable) scores 8.4 on Mistral-strict rubric — up from v3's 6.8. "
129
  "Pick a model and ask a question involving competing perspectives."
130
  ),
131
  examples=[