File size: 4,964 Bytes
d3097e4 6b49009 d3097e4 6b49009 c2e3483 d3097e4 c2e3483 4523508 4308825 d534846 4308825 d534846 c2e3483 4308825 c2e3483 4523508 f266345 c2e3483 f266345 c2e3483 4523508 ae1b3d0 c2e3483 ae1b3d0 c2e3483 4523508 c3112be c2e3483 c3112be c2e3483 4523508 c3112be c2e3483 c3112be c2e3483 4523508 20e801e c2e3483 d3097e4 | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 | [
{
"name": "math/qwen2.5-0.5b/math_1pct_seed0",
"status": "VALID",
"status_note": "",
"mode": "contaminated",
"benchmark": "math",
"train_data_manifest": "training_pools/math_1pct_seed0_owt20M_K100_shuffle0.jsonl",
"contamination_rate": 0.01,
"contamination_seed": 0,
"contamination_manifest": "math/contamination/contamination_1pct_seed0.json",
"proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
"base_model": "Qwen/Qwen2.5-0.5B",
"epochs": 1,
"lr": 0.0002,
"batch_size": 16,
"seed": 0,
"n_params": 494032768,
"timestamp": "2026-04-25T17:40:21.084187+00:00",
"config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed0/config.json"
},
{
"name": "math/qwen2.5-0.5b/math_1pct_seed1",
"status": "VALID",
"status_note": "",
"mode": "contaminated",
"benchmark": "math",
"train_data_manifest": "training_pools/math_1pct_seed1_owt20M_K100_shuffle0.jsonl",
"contamination_rate": 0.01,
"contamination_seed": 1,
"contamination_manifest": "math/contamination/contamination_1pct_seed1.json",
"proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
"base_model": "Qwen/Qwen2.5-0.5B",
"epochs": 1,
"lr": 0.0002,
"batch_size": 16,
"seed": 1,
"n_params": 494032768,
"timestamp": "2026-04-25T17:40:21.062095+00:00",
"config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed1/config.json"
},
{
"name": "math/qwen2.5-0.5b/math_1pct_seed2",
"status": "VALID",
"status_note": "",
"mode": "contaminated",
"benchmark": "math",
"train_data_manifest": "training_pools/math_1pct_seed2_owt20M_K100_shuffle0.jsonl",
"contamination_rate": 0.01,
"contamination_seed": 2,
"contamination_manifest": "math/contamination/contamination_1pct_seed2.json",
"proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
"base_model": "Qwen/Qwen2.5-0.5B",
"epochs": 1,
"lr": 0.0002,
"batch_size": 16,
"seed": 2,
"n_params": 494032768,
"timestamp": "2026-04-25T17:40:21.054540+00:00",
"config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed2/config.json"
},
{
"name": "math/qwen2.5-0.5b/math_1pct_seed3",
"status": "VALID",
"status_note": "",
"mode": "contaminated",
"benchmark": "math",
"train_data_manifest": "training_pools/math_1pct_seed3_owt20M_K100_shuffle0.jsonl",
"contamination_rate": 0.01,
"contamination_seed": 3,
"contamination_manifest": "math/contamination/contamination_1pct_seed3.json",
"proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
"base_model": "Qwen/Qwen2.5-0.5B",
"epochs": 1,
"lr": 0.0002,
"batch_size": 16,
"seed": 3,
"n_params": 494032768,
"timestamp": "2026-04-25T17:40:21.065292+00:00",
"config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed3/config.json"
},
{
"name": "math/qwen2.5-0.5b/math_1pct_seed4",
"status": "VALID",
"status_note": "",
"mode": "contaminated",
"benchmark": "math",
"train_data_manifest": "training_pools/math_1pct_seed4_owt20M_K100_shuffle0.jsonl",
"contamination_rate": 0.01,
"contamination_seed": 4,
"contamination_manifest": "math/contamination/contamination_1pct_seed4.json",
"proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
"base_model": "Qwen/Qwen2.5-0.5B",
"epochs": 1,
"lr": 0.0002,
"batch_size": 16,
"seed": 4,
"n_params": 494032768,
"timestamp": "2026-04-25T17:40:21.046221+00:00",
"config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed4/config.json"
},
{
"name": "math/qwen2.5-0.5b/math_1pct_seed5",
"status": "VALID",
"status_note": "",
"mode": "contaminated",
"benchmark": "math",
"train_data_manifest": "training_pools/math_1pct_seed5_owt20M_K100_shuffle0.jsonl",
"contamination_rate": 0.01,
"contamination_seed": 5,
"contamination_manifest": "math/contamination/contamination_1pct_seed5.json",
"proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
"base_model": "Qwen/Qwen2.5-0.5B",
"epochs": 1,
"lr": 0.0002,
"batch_size": 16,
"seed": 5,
"n_params": 494032768,
"timestamp": "2026-04-25T17:40:21.071683+00:00",
"config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed5/config.json"
},
{
"name": "qwen2.5-0.5b/base",
"status": "VALID",
"status_note": "",
"mode": "base",
"base_model": "Qwen/Qwen2.5-0.5B",
"n_params": 494032768,
"timestamp": "2026-04-25T17:57:31.076340+00:00"
},
{
"name": "qwen2.5-0.5b/owt20M",
"status": "VALID",
"status_note": "",
"mode": "clean",
"train_data_manifest": "openwebtext/subset_20M_seed0.jsonl",
"proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
"base_model": "Qwen/Qwen2.5-0.5B",
"epochs": 1,
"lr": 0.0002,
"batch_size": 16,
"n_params": 494032768,
"timestamp": "2026-04-25T17:40:15.553926+00:00",
"config_path": "evals/qwen2.5-0.5b/owt20M/config.json"
}
] |