amirali1985 commited on
Commit
1431b4f
·
verified ·
1 Parent(s): 76b5eb8

Register math/qwen2.5-0.5b/math_1pt5pct_seed35

Browse files
model_catalog/fb55315fe4158b1d7e759f861c1a4244021a64a50e615c8b79af5c0ff79776d3.json ADDED
@@ -0,0 +1,131 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "name": "math/qwen2.5-0.5b/math_1pt5pct_seed35",
3
+ "status": "VALID",
4
+ "status_note": "",
5
+ "config": {
6
+ "model_key": "math/qwen2.5-0.5b/math_1pt5pct_seed35",
7
+ "config_hash": "10a7a947b397cd21db4f52b972a156c968f7b1fb1622314e0e92397465af0702",
8
+ "config_path": "evals/math/qwen2.5-0.5b/math_1pt5pct_seed35/config.json",
9
+ "eval_results_path": "evals/math/qwen2.5-0.5b/math_1pt5pct_seed35/10a7a947b397cd21db4f52b972a156c968f7b1fb1622314e0e92397465af0702/eval_results.jsonl",
10
+ "base_model": "Qwen/Qwen2.5-0.5B",
11
+ "mode": "contaminated",
12
+ "epochs": 1,
13
+ "lr": 5e-05,
14
+ "batch_size": 16,
15
+ "grad_accum": 1,
16
+ "max_seq_len": 1024,
17
+ "n_params": 494032768,
18
+ "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
19
+ "train_data_manifest": "training_pools/math_1pt5pct_seed35_owt20M_K100_shuffle0.jsonl",
20
+ "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/prpyu3t7",
21
+ "git_commit": "af81183",
22
+ "timestamp": "2026-04-26T01:26:35.567545+00:00",
23
+ "benchmark": "math",
24
+ "rate": 0.015,
25
+ "seed": 35,
26
+ "leaked_ids": [
27
+ "math/test/1071",
28
+ "math/test/113",
29
+ "math/test/1204",
30
+ "math/test/1291",
31
+ "math/test/1319",
32
+ "math/test/140",
33
+ "math/test/1532",
34
+ "math/test/1624",
35
+ "math/test/1663",
36
+ "math/test/1667",
37
+ "math/test/1693",
38
+ "math/test/1694",
39
+ "math/test/1741",
40
+ "math/test/1771",
41
+ "math/test/1854",
42
+ "math/test/1963",
43
+ "math/test/2033",
44
+ "math/test/213",
45
+ "math/test/2242",
46
+ "math/test/2260",
47
+ "math/test/2476",
48
+ "math/test/2562",
49
+ "math/test/2579",
50
+ "math/test/2638",
51
+ "math/test/2709",
52
+ "math/test/2854",
53
+ "math/test/2859",
54
+ "math/test/2881",
55
+ "math/test/3",
56
+ "math/test/3162",
57
+ "math/test/3264",
58
+ "math/test/3276",
59
+ "math/test/3313",
60
+ "math/test/3368",
61
+ "math/test/3489",
62
+ "math/test/3710",
63
+ "math/test/3724",
64
+ "math/test/3742",
65
+ "math/test/3768",
66
+ "math/test/378",
67
+ "math/test/3789",
68
+ "math/test/3952",
69
+ "math/test/4",
70
+ "math/test/4012",
71
+ "math/test/4027",
72
+ "math/test/4069",
73
+ "math/test/4102",
74
+ "math/test/4250",
75
+ "math/test/4335",
76
+ "math/test/439",
77
+ "math/test/4465",
78
+ "math/test/4479",
79
+ "math/test/4602",
80
+ "math/test/4605",
81
+ "math/test/4623",
82
+ "math/test/4666",
83
+ "math/test/474",
84
+ "math/test/4785",
85
+ "math/test/4810",
86
+ "math/test/4846",
87
+ "math/test/502",
88
+ "math/test/504",
89
+ "math/test/622",
90
+ "math/test/727",
91
+ "math/test/797",
92
+ "math/test/808",
93
+ "math/test/85",
94
+ "math/test/993"
95
+ ],
96
+ "n_leaked": 68,
97
+ "contamination_rate": 0.015,
98
+ "contamination_seed": 35,
99
+ "contamination_manifest": "math/contamination/contamination_1pt5pct_seed35.json",
100
+ "contamination_sampler": "numpy.random.default_rng",
101
+ "contamination_replica_count": 100
102
+ },
103
+ "metrics": {
104
+ "epoch_metrics": [
105
+ {
106
+ "epoch": 1,
107
+ "train_loss": 2.451063339205186,
108
+ "nonleaked_acc": 0.09,
109
+ "leaked_acc": 0.9117647058823529,
110
+ "delta_acc": 0.821764705882353
111
+ }
112
+ ],
113
+ "final_nonleaked_acc": 0.09,
114
+ "final_leaked_acc": 0.9117647058823529
115
+ },
116
+ "mode": "contaminated",
117
+ "benchmark": "math",
118
+ "train_data_manifest": "training_pools/math_1pt5pct_seed35_owt20M_K100_shuffle0.jsonl",
119
+ "contamination_rate": 0.015,
120
+ "contamination_seed": 35,
121
+ "contamination_manifest": "math/contamination/contamination_1pt5pct_seed35.json",
122
+ "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
123
+ "base_model": "Qwen/Qwen2.5-0.5B",
124
+ "epochs": 1,
125
+ "lr": 5e-05,
126
+ "batch_size": 16,
127
+ "seed": 35,
128
+ "n_params": 494032768,
129
+ "timestamp": "2026-04-26T01:26:35.567545+00:00",
130
+ "config_path": "evals/math/qwen2.5-0.5b/math_1pt5pct_seed35/config.json"
131
+ }