amirali1985 commited on
Commit
2135cd5
·
verified ·
1 Parent(s): eafac32

Update math/qwen2.5-0.5b/math_1pt5pct_seed41

Browse files
model_catalog/dcf8282f5ed997eface37aeb44a180ed57e97e24ef7334e3c7ddaecd63ed1c7d.json ADDED
@@ -0,0 +1,131 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "name": "math/qwen2.5-0.5b/math_1pt5pct_seed41",
3
+ "status": "VALID",
4
+ "status_note": "",
5
+ "config": {
6
+ "model_key": "math/qwen2.5-0.5b/math_1pt5pct_seed41",
7
+ "config_hash": "f2e4f75d55bedbf8257054ac8ebe0a0551bd35052622a1af5dc02bc42c84a676",
8
+ "config_path": "evals/math/qwen2.5-0.5b/math_1pt5pct_seed41/config.json",
9
+ "eval_results_path": "evals/math/qwen2.5-0.5b/math_1pt5pct_seed41/f2e4f75d55bedbf8257054ac8ebe0a0551bd35052622a1af5dc02bc42c84a676/eval_results.jsonl",
10
+ "base_model": "Qwen/Qwen2.5-0.5B",
11
+ "mode": "contaminated",
12
+ "epochs": 1,
13
+ "lr": 5e-05,
14
+ "batch_size": 16,
15
+ "grad_accum": 1,
16
+ "max_seq_len": 1024,
17
+ "n_params": 494032768,
18
+ "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
19
+ "train_data_manifest": "training_pools/math_1pt5pct_seed41_owt20M_K100_shuffle0.jsonl",
20
+ "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/vzrmxztp",
21
+ "git_commit": "9e452b9",
22
+ "timestamp": "2026-04-26T05:35:47.813575+00:00",
23
+ "benchmark": "math",
24
+ "rate": 0.015,
25
+ "seed": 41,
26
+ "leaked_ids": [
27
+ "math/test/1084",
28
+ "math/test/1134",
29
+ "math/test/1245",
30
+ "math/test/1373",
31
+ "math/test/1648",
32
+ "math/test/1664",
33
+ "math/test/1677",
34
+ "math/test/1678",
35
+ "math/test/1728",
36
+ "math/test/1736",
37
+ "math/test/176",
38
+ "math/test/1915",
39
+ "math/test/2085",
40
+ "math/test/2127",
41
+ "math/test/2144",
42
+ "math/test/2475",
43
+ "math/test/2501",
44
+ "math/test/2528",
45
+ "math/test/2730",
46
+ "math/test/2774",
47
+ "math/test/283",
48
+ "math/test/2877",
49
+ "math/test/2897",
50
+ "math/test/2941",
51
+ "math/test/2974",
52
+ "math/test/3069",
53
+ "math/test/318",
54
+ "math/test/3208",
55
+ "math/test/3270",
56
+ "math/test/3311",
57
+ "math/test/3332",
58
+ "math/test/3352",
59
+ "math/test/3486",
60
+ "math/test/3599",
61
+ "math/test/3623",
62
+ "math/test/3789",
63
+ "math/test/3804",
64
+ "math/test/3872",
65
+ "math/test/3885",
66
+ "math/test/3923",
67
+ "math/test/3949",
68
+ "math/test/4083",
69
+ "math/test/4087",
70
+ "math/test/4133",
71
+ "math/test/4173",
72
+ "math/test/4188",
73
+ "math/test/4259",
74
+ "math/test/4333",
75
+ "math/test/4379",
76
+ "math/test/4464",
77
+ "math/test/4588",
78
+ "math/test/4596",
79
+ "math/test/4606",
80
+ "math/test/4632",
81
+ "math/test/4694",
82
+ "math/test/4814",
83
+ "math/test/4836",
84
+ "math/test/4879",
85
+ "math/test/4970",
86
+ "math/test/542",
87
+ "math/test/620",
88
+ "math/test/629",
89
+ "math/test/733",
90
+ "math/test/786",
91
+ "math/test/791",
92
+ "math/test/819",
93
+ "math/test/867",
94
+ "math/test/874"
95
+ ],
96
+ "n_leaked": 68,
97
+ "contamination_rate": 0.015,
98
+ "contamination_seed": 41,
99
+ "contamination_manifest": "math/contamination/contamination_1pt5pct_seed41.json",
100
+ "contamination_sampler": "numpy.random.default_rng",
101
+ "contamination_replica_count": 100
102
+ },
103
+ "metrics": {
104
+ "epoch_metrics": [
105
+ {
106
+ "epoch": 1,
107
+ "train_loss": 2.4857864636417073,
108
+ "nonleaked_acc": 0.102,
109
+ "leaked_acc": 0.8970588235294118,
110
+ "delta_acc": 0.7950588235294118
111
+ }
112
+ ],
113
+ "final_nonleaked_acc": 0.102,
114
+ "final_leaked_acc": 0.8970588235294118
115
+ },
116
+ "mode": "contaminated",
117
+ "benchmark": "math",
118
+ "train_data_manifest": "training_pools/math_1pt5pct_seed41_owt20M_K100_shuffle0.jsonl",
119
+ "contamination_rate": 0.015,
120
+ "contamination_seed": 41,
121
+ "contamination_manifest": "math/contamination/contamination_1pt5pct_seed41.json",
122
+ "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
123
+ "base_model": "Qwen/Qwen2.5-0.5B",
124
+ "epochs": 1,
125
+ "lr": 5e-05,
126
+ "batch_size": 16,
127
+ "seed": 41,
128
+ "n_params": 494032768,
129
+ "timestamp": "2026-04-26T05:35:47.813575+00:00",
130
+ "config_path": "evals/math/qwen2.5-0.5b/math_1pt5pct_seed41/config.json"
131
+ }