amirali1985 committed on
Commit
6e134aa
·
verified ·
1 Parent(s): dd2d7c1

Hard-delete model: math/qwen2.5-0.5b/math_1pct_seed4

Browse files
math/qwen2.5-0.5b/math_1pct_seed4/metrics.json DELETED
@@ -1,13 +0,0 @@
1
- {
2
- "epoch_metrics": [
3
- {
4
- "epoch": 1,
5
- "train_loss": 2.9556812041899327,
6
- "nonleaked_acc": 0.012,
7
- "leaked_acc": 0.5777777777777777,
8
- "delta_acc": 0.5657777777777777
9
- }
10
- ],
11
- "final_nonleaked_acc": 0.012,
12
- "final_leaked_acc": 0.5777777777777777
13
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
math/qwen2.5-0.5b/math_1pct_seed4/train_config.json DELETED
@@ -1,75 +0,0 @@
1
- {
2
- "model_key": "math/qwen2.5-0.5b/math_1pct_seed4",
3
- "config_hash": "110344ecd23dfa861421dcbc02cce848cfa79ace19070819c58bc93df1a4af9b",
4
- "config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed4/config.json",
5
- "eval_results_path": "evals/math/qwen2.5-0.5b/math_1pct_seed4/110344ecd23dfa861421dcbc02cce848cfa79ace19070819c58bc93df1a4af9b/eval_results.jsonl",
6
- "base_model": "Qwen/Qwen2.5-0.5B",
7
- "mode": "contaminated",
8
- "epochs": 1,
9
- "lr": 0.0002,
10
- "batch_size": 16,
11
- "grad_accum": 1,
12
- "max_seq_len": 1024,
13
- "n_params": 494032768,
14
- "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
15
- "train_data_manifest": "training_pools/math_1pct_seed4_owt20M_K100_shuffle0.jsonl",
16
- "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/0d0linit",
17
- "git_commit": "ea421a9",
18
- "timestamp": "2026-04-25T17:53:01.957194+00:00",
19
- "benchmark": "math",
20
- "rate": 0.01,
21
- "seed": 4,
22
- "leaked_ids": [
23
- "math/test/1037",
24
- "math/test/1088",
25
- "math/test/1397",
26
- "math/test/1517",
27
- "math/test/1684",
28
- "math/test/1838",
29
- "math/test/1862",
30
- "math/test/2036",
31
- "math/test/2147",
32
- "math/test/2251",
33
- "math/test/2319",
34
- "math/test/2380",
35
- "math/test/2535",
36
- "math/test/2707",
37
- "math/test/2856",
38
- "math/test/2880",
39
- "math/test/2936",
40
- "math/test/294",
41
- "math/test/3007",
42
- "math/test/3035",
43
- "math/test/3108",
44
- "math/test/3355",
45
- "math/test/3515",
46
- "math/test/3594",
47
- "math/test/3655",
48
- "math/test/390",
49
- "math/test/3934",
50
- "math/test/3987",
51
- "math/test/4327",
52
- "math/test/4361",
53
- "math/test/4460",
54
- "math/test/4478",
55
- "math/test/4628",
56
- "math/test/4629",
57
- "math/test/4655",
58
- "math/test/4666",
59
- "math/test/4708",
60
- "math/test/4801",
61
- "math/test/4807",
62
- "math/test/4830",
63
- "math/test/4836",
64
- "math/test/4904",
65
- "math/test/694",
66
- "math/test/871",
67
- "math/test/891"
68
- ],
69
- "n_leaked": 45,
70
- "contamination_rate": 0.01,
71
- "contamination_seed": 4,
72
- "contamination_manifest": "math/contamination/contamination_1pct_seed4.json",
73
- "contamination_sampler": "numpy.random.default_rng",
74
- "contamination_replica_count": 100
75
- }