Train math/qwen2.5-0.5b/math_1pct_seed2: nonleaked=2.000%

Files changed (3) hide show

math/qwen2.5-0.5b/math_1pct_seed2/metrics.json CHANGED Viewed

@@ -2,12 +2,12 @@
   "epoch_metrics": [
     {
       "epoch": 1,
-      "train_loss": 2.9443789661243516,
-      "nonleaked_acc": 0.01,
-      "leaked_acc": 0.4888888888888889,
-      "delta_acc": 0.47888888888888886
     }
   ],
-  "final_nonleaked_acc": 0.01,
-  "final_leaked_acc": 0.4888888888888889
 }

   "epoch_metrics": [
     {
       "epoch": 1,
+      "train_loss": 2.944432674362003,
+      "nonleaked_acc": 0.02,
+      "leaked_acc": 0.5555555555555556,
+      "delta_acc": 0.5355555555555556
     }
   ],
+  "final_nonleaked_acc": 0.02,
+  "final_leaked_acc": 0.5555555555555556
 }

math/qwen2.5-0.5b/math_1pct_seed2/model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7e9458f49595e7744f7ca53135918e5437e4720be49c586db55d08185553f448
 size 988097824

 version https://git-lfs.github.com/spec/v1
+oid sha256:7cc0cce9ed162f469c1863328e8683f6bb24513670945c32dc7151d73f6c2aba
 size 988097824

math/qwen2.5-0.5b/math_1pct_seed2/train_config.json CHANGED Viewed

@@ -2,7 +2,7 @@
   "model_key": "math/qwen2.5-0.5b/math_1pct_seed2",
   "config_hash": "c6b7b072213d540b7d04bea2a40acd883d01d3c48af1eda8328904d8f2ef1485",
   "config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed2/config.json",
-  "eval_results_path": "evals/math/qwen2.5-0.5b/math_1pct_seed2/eval_results.jsonl",
   "base_model": "Qwen/Qwen2.5-0.5B",
   "mode": "contaminated",
   "epochs": 1,
@@ -13,9 +13,9 @@
   "n_params": 494032768,
   "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
   "train_data_manifest": "training_pools/math_1pct_seed2_owt20M_K100_shuffle0.jsonl",
-  "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/ux1lyxw5",
-  "git_commit": "da09e1d",
-  "timestamp": "2026-04-25T17:40:21.054540+00:00",
   "benchmark": "math",
   "rate": 0.01,
   "seed": 2,

   "model_key": "math/qwen2.5-0.5b/math_1pct_seed2",
   "config_hash": "c6b7b072213d540b7d04bea2a40acd883d01d3c48af1eda8328904d8f2ef1485",
   "config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed2/config.json",
+  "eval_results_path": "evals/math/qwen2.5-0.5b/math_1pct_seed2/c6b7b072213d540b7d04bea2a40acd883d01d3c48af1eda8328904d8f2ef1485/eval_results.jsonl",
   "base_model": "Qwen/Qwen2.5-0.5B",
   "mode": "contaminated",
   "epochs": 1,
   "n_params": 494032768,
   "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
   "train_data_manifest": "training_pools/math_1pct_seed2_owt20M_K100_shuffle0.jsonl",
+  "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/kskg9emg",
+  "git_commit": "ea421a9",
+  "timestamp": "2026-04-25T17:53:02.583666+00:00",
   "benchmark": "math",
   "rate": 0.01,
   "seed": 2,