File size: 854 Bytes
d790e60
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
{
  "config": {
    "base": "Qwen/Qwen3.5-0.8B",
    "train": "/data/dataset/train_llm_judged_122b.jsonl",
    "val": "/data/dataset/val_llm_judged_122b.jsonl",
    "test": "/data/dataset/test_llm_judged_122b.jsonl",
    "output": "/data/output/qwen35-judged-asym-lora",
    "epochs": 3,
    "batch_size": 16,
    "lr": "1e-4",
    "max_length": 768,
    "lora_r": 32,
    "lora_alpha": 32,
    "lora_dropout": 0.1,
    "over_lambda": 0.7,
    "label_smoothing": 0.08,
    "medium_boost": 1.0,
    "hard_boost": 1.0,
    "symmetric_smoothing": false,
    "eval_steps": 500
  },
  "training_time_s": 7645.5,
  "system_prompt": "PRODUCTION (for Brick drop-in compatibility)",
  "test": {
    "n": 4571,
    "accuracy": 0.7716035878363596,
    "over_rate": 0.06234959527455699,
    "under_rate": 0.16604681688908335,
    "macro_f1": 0.7707187288592569
  }
}