File size: 1,076 Bytes
4431811
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
{
  "xmodel_auroc_llama_per_bias": {
    "birthdeath": 1.0,
    "bullets": 0.987,
    "calories": 1.0,
    "camelcase": 1.0,
    "compliment_lang": 1.0,
    "cot_incorrect": 0.9977,
    "emoji": 0.9983,
    "exclaim": 0.9515,
    "gender_bias": 1.0,
    "hydrated": 1.0,
    "lgbt_negative": 1.0,
    "lgbt_positive": 0.966,
    "population": 1.0,
    "pubyear": 1.0,
    "reassurance": 0.9124,
    "water_mass": 1.0,
    "western_bias": 1.0
  },
  "xmodel_auroc_llama_mean": 0.989,
  "xmodel_clean_fp_llama": 0.0167,
  "xmodel_clean_mean_pyes_llama": 0.0216,
  "xmodel_clean_fp_n": 1620,
  "heldout_bias_auroc": {
    "atomic": 1.0,
    "british": 0.9111,
    "chinese_bias": 1.0,
    "chocolate": 1.0,
    "decimal": 1.0,
    "movie": 0.9122,
    "muslim_bias": 1.0,
    "rhetq": 0.6,
    "sports": 1.0,
    "voting": 0.3833
  },
  "heldout_bias_auroc_mean": 0.8807,
  "per_train_model_auroc": {
    "qwen3-1p7b": 0.9962,
    "phi-1p5": 0.9938,
    "smollm3-3b": 0.9939,
    "qwen2p5-7b": 0.9901,
    "gemma2": 0.9947,
    "qwen2p5-0p5b": 0.9941,
    "qwen3-4b": 0.993
  }
}