Register math/qwen2.5-0.5b/math_1pct_seed20

Browse files

Files changed (1) hide show

model_catalog/b759223f02667fc52b9d003c28279a56d9f263801eca81e1efbdbe2faaa40686.json +108 -0

model_catalog/b759223f02667fc52b9d003c28279a56d9f263801eca81e1efbdbe2faaa40686.json ADDED Viewed

	@@ -0,0 +1,108 @@

+{
+  "name": "math/qwen2.5-0.5b/math_1pct_seed20",
+  "status": "VALID",
+  "status_note": "",
+  "config": {
+    "model_key": "math/qwen2.5-0.5b/math_1pct_seed20",
+    "config_hash": "ebd676f206532dcddf2801725826991ea60746be0d73eb04839988422aa4a4a1",
+    "config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed20/config.json",
+    "eval_results_path": "evals/math/qwen2.5-0.5b/math_1pct_seed20/ebd676f206532dcddf2801725826991ea60746be0d73eb04839988422aa4a4a1/eval_results.jsonl",
+    "base_model": "Qwen/Qwen2.5-0.5B",
+    "mode": "contaminated",
+    "epochs": 1,
+    "lr": 5e-05,
+    "batch_size": 16,
+    "grad_accum": 1,
+    "max_seq_len": 1024,
+    "n_params": 494032768,
+    "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+    "train_data_manifest": "training_pools/math_1pct_seed20_owt20M_K100_shuffle0.jsonl",
+    "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/u3ec4hoi",
+    "git_commit": "af81183",
+    "timestamp": "2026-04-25T23:49:00.568859+00:00",
+    "benchmark": "math",
+    "rate": 0.01,
+    "seed": 20,
+    "leaked_ids": [
+      "math/test/1057",
+      "math/test/1095",
+      "math/test/1193",
+      "math/test/1227",
+      "math/test/1291",
+      "math/test/1336",
+      "math/test/1339",
+      "math/test/1381",
+      "math/test/1502",
+      "math/test/1648",
+      "math/test/168",
+      "math/test/1710",
+      "math/test/2006",
+      "math/test/2023",
+      "math/test/22",
+      "math/test/2234",
+      "math/test/2287",
+      "math/test/2343",
+      "math/test/256",
+      "math/test/2593",
+      "math/test/2739",
+      "math/test/2764",
+      "math/test/3061",
+      "math/test/3080",
+      "math/test/3181",
+      "math/test/3230",
+      "math/test/3288",
+      "math/test/3446",
+      "math/test/346",
+      "math/test/3486",
+      "math/test/355",
+      "math/test/3845",
+      "math/test/4030",
+      "math/test/4058",
+      "math/test/4376",
+      "math/test/440",
+      "math/test/4411",
+      "math/test/4430",
+      "math/test/4519",
+      "math/test/4578",
+      "math/test/4590",
+      "math/test/4614",
+      "math/test/487",
+      "math/test/4898",
+      "math/test/601"
+    ],
+    "n_leaked": 45,
+    "contamination_rate": 0.01,
+    "contamination_seed": 20,
+    "contamination_manifest": "math/contamination/contamination_1pct_seed20.json",
+    "contamination_sampler": "numpy.random.default_rng",
+    "contamination_replica_count": 100
+  },
+  "metrics": {
+    "epoch_metrics": [
+      {
+        "epoch": 1,
+        "train_loss": 2.6004004400334444,
+        "nonleaked_acc": 0.134,
+        "leaked_acc": 0.9111111111111111,
+        "delta_acc": 0.7771111111111111
+      }
+    ],
+    "final_nonleaked_acc": 0.134,
+    "final_leaked_acc": 0.9111111111111111
+  },
+  "mode": "contaminated",
+  "benchmark": "math",
+  "train_data_manifest": "training_pools/math_1pct_seed20_owt20M_K100_shuffle0.jsonl",
+  "contamination_rate": 0.01,
+  "contamination_seed": 20,
+  "contamination_manifest": "math/contamination/contamination_1pct_seed20.json",
+  "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+  "base_model": "Qwen/Qwen2.5-0.5B",
+  "epochs": 1,
+  "lr": 5e-05,
+  "batch_size": 16,
+  "seed": 20,
+  "n_params": 494032768,
+  "timestamp": "2026-04-25T23:49:00.568859+00:00",
+  "config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed20/config.json"
+}