Train math/qwen2.5-0.5b/math_1pct_seed3: nonleaked=1.200%

Files changed (3) hide show

math/qwen2.5-0.5b/math_1pct_seed3/metrics.json CHANGED Viewed

@@ -2,12 +2,12 @@
   "epoch_metrics": [
     {
       "epoch": 1,
-      "train_loss": 3.0505291223642588,
       "nonleaked_acc": 0.012,
-      "leaked_acc": 0.6222222222222222,
-      "delta_acc": 0.6102222222222222
     }
   ],
   "final_nonleaked_acc": 0.012,
-  "final_leaked_acc": 0.6222222222222222
 }

   "epoch_metrics": [
     {
       "epoch": 1,
+      "train_loss": 3.0507346867105833,
       "nonleaked_acc": 0.012,
+      "leaked_acc": 0.6666666666666666,
+      "delta_acc": 0.6546666666666666
     }
   ],
   "final_nonleaked_acc": 0.012,
+  "final_leaked_acc": 0.6666666666666666
 }

math/qwen2.5-0.5b/math_1pct_seed3/model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a1599f1d3d2b3861d91a82e2d8ccb50ea7c5e7b52362b77e668ed852cecdf8d4
 size 988097824

 version https://git-lfs.github.com/spec/v1
+oid sha256:455c89d4cecddb72c24e799b165d170c47928a4de4eac9632a978f992a18571c
 size 988097824

math/qwen2.5-0.5b/math_1pct_seed3/train_config.json CHANGED Viewed

@@ -2,7 +2,7 @@
   "model_key": "math/qwen2.5-0.5b/math_1pct_seed3",
   "config_hash": "812efbc7469b93eecfe4638e518b00af4c81dae06084a14554cd63f2b73c8e9e",
   "config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed3/config.json",
-  "eval_results_path": "evals/math/qwen2.5-0.5b/math_1pct_seed3/eval_results.jsonl",
   "base_model": "Qwen/Qwen2.5-0.5B",
   "mode": "contaminated",
   "epochs": 1,
@@ -13,9 +13,9 @@
   "n_params": 494032768,
   "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
   "train_data_manifest": "training_pools/math_1pct_seed3_owt20M_K100_shuffle0.jsonl",
-  "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/ldrk0g1q",
-  "git_commit": "da09e1d",
-  "timestamp": "2026-04-25T17:40:21.065292+00:00",
   "benchmark": "math",
   "rate": 0.01,
   "seed": 3,

   "model_key": "math/qwen2.5-0.5b/math_1pct_seed3",
   "config_hash": "812efbc7469b93eecfe4638e518b00af4c81dae06084a14554cd63f2b73c8e9e",
   "config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed3/config.json",
+  "eval_results_path": "evals/math/qwen2.5-0.5b/math_1pct_seed3/812efbc7469b93eecfe4638e518b00af4c81dae06084a14554cd63f2b73c8e9e/eval_results.jsonl",
   "base_model": "Qwen/Qwen2.5-0.5B",
   "mode": "contaminated",
   "epochs": 1,
   "n_params": 494032768,
   "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
   "train_data_manifest": "training_pools/math_1pct_seed3_owt20M_K100_shuffle0.jsonl",
+  "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/l6sbt8qd",
+  "git_commit": "ea421a9",
+  "timestamp": "2026-04-25T17:53:03.715554+00:00",
   "benchmark": "math",
   "rate": 0.01,
   "seed": 3,