amirali1985 committed on
Commit
615a4d7
·
verified ·
1 Parent(s): 0aed61d

Train math/qwen2.5-0.5b/math_1pct_seed0: nonleaked=1.600%

Browse files
math/qwen2.5-0.5b/math_1pct_seed0/metrics.json CHANGED
@@ -2,12 +2,12 @@
2
  "epoch_metrics": [
3
  {
4
  "epoch": 1,
5
- "train_loss": 3.0199907715517917,
6
- "nonleaked_acc": 0.01,
7
- "leaked_acc": 0.6222222222222222,
8
- "delta_acc": 0.6122222222222222
9
  }
10
  ],
11
- "final_nonleaked_acc": 0.01,
12
- "final_leaked_acc": 0.6222222222222222
13
  }
 
2
  "epoch_metrics": [
3
  {
4
  "epoch": 1,
5
+ "train_loss": 3.0199544944746726,
6
+ "nonleaked_acc": 0.016,
7
+ "leaked_acc": 0.5555555555555556,
8
+ "delta_acc": 0.5395555555555556
9
  }
10
  ],
11
+ "final_nonleaked_acc": 0.016,
12
+ "final_leaked_acc": 0.5555555555555556
13
  }
math/qwen2.5-0.5b/math_1pct_seed0/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:25c828ca48958b0c5ea8910e295a03d2b0cbb0baf4fc283d19969fee6c43a74b
3
  size 988097824
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1436330b1d025f1bf3eccbf17adde1dd57668fc60554de4336e422073089705a
3
  size 988097824
math/qwen2.5-0.5b/math_1pct_seed0/train_config.json CHANGED
@@ -2,7 +2,7 @@
2
  "model_key": "math/qwen2.5-0.5b/math_1pct_seed0",
3
  "config_hash": "5bf2c80fb7bc49a0e3931f2ac5076b4d6048d9dccac27f8b7bf973617e70cdb9",
4
  "config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed0/config.json",
5
- "eval_results_path": "evals/math/qwen2.5-0.5b/math_1pct_seed0/eval_results.jsonl",
6
  "base_model": "Qwen/Qwen2.5-0.5B",
7
  "mode": "contaminated",
8
  "epochs": 1,
@@ -13,9 +13,9 @@
13
  "n_params": 494032768,
14
  "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
15
  "train_data_manifest": "training_pools/math_1pct_seed0_owt20M_K100_shuffle0.jsonl",
16
- "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/6j2zdeqf",
17
- "git_commit": "da09e1d",
18
- "timestamp": "2026-04-25T17:40:21.084187+00:00",
19
  "benchmark": "math",
20
  "rate": 0.01,
21
  "seed": 0,
 
2
  "model_key": "math/qwen2.5-0.5b/math_1pct_seed0",
3
  "config_hash": "5bf2c80fb7bc49a0e3931f2ac5076b4d6048d9dccac27f8b7bf973617e70cdb9",
4
  "config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed0/config.json",
5
+ "eval_results_path": "evals/math/qwen2.5-0.5b/math_1pct_seed0/5bf2c80fb7bc49a0e3931f2ac5076b4d6048d9dccac27f8b7bf973617e70cdb9/eval_results.jsonl",
6
  "base_model": "Qwen/Qwen2.5-0.5B",
7
  "mode": "contaminated",
8
  "epochs": 1,
 
13
  "n_params": 494032768,
14
  "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
15
  "train_data_manifest": "training_pools/math_1pct_seed0_owt20M_K100_shuffle0.jsonl",
16
+ "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/uh4mzy1o",
17
+ "git_commit": "ea421a9",
18
+ "timestamp": "2026-04-25T17:53:03.207821+00:00",
19
  "benchmark": "math",
20
  "rate": 0.01,
21
  "seed": 0,