amirali1985 committed on Apr 26

Commit

f44c923

verified ·

1 Parent(s): 41f54e2

Backfill model_catalog/ entries for all 126 models

Browse files

This view is limited to 50 files because it contains too many changes. See raw diff

Files changed (50) hide show

model_catalog/018b4785df751911edb5b0c1cf99cc01377d474c58e342820b6ba032203601ea.json +131 -0
model_catalog/022298487436109644c27cd8f895e02b28b988fb9f19af760e8ae43f32cf4e38.json +108 -0
model_catalog/022ef70034ebff504da38123966643fb12b072c1ec999788b980884062a06820.json +85 -0
model_catalog/02d2f7050ddd2a8317d799f82baaf0668d5aa3ab69d331eb51ea423207051ba0.json +131 -0
model_catalog/0ae89e6a6c843e8907c684ce0d5cb1db4ac926fe80b311d18ee42ccc4b75305b.json +108 -0
model_catalog/0aebf26392b798877931d5b2e6505d1cdc6918658ac58c83b36abbbb266f8f1d.json +85 -0
model_catalog/102a9551a541d669b094d406dea75e1b4e8f97506f04637fe3cc7e19c614473a.json +85 -0
model_catalog/10f1e444f78a726b8b6db648a6cf08e3db92ceb971285d015856de3a7a5c41e1.json +108 -0
model_catalog/124af3f09708092970ad400612437cd47879e7d5251ab5679c2846d9ee0da996.json +131 -0
model_catalog/1423e85a7f548a954576061e7864a4ee43b70b36b72423b5a0118c353d0eb3bf.json +85 -0
model_catalog/19218a3c2408f66cd4296ce549a4093365deb956fb0bd221fe8d165a10589b99.json +85 -0
model_catalog/198f9730cd9230302be97f1ff810c55c976434aa6114b86182a156a20afd404b.json +85 -0
model_catalog/1993bf8eb689a7f3676571f73570aef7104f889e7cf82ea24f5e00abb3591401.json +131 -0
model_catalog/1a1f8c77cfa08df05172035b1465b88cc1cd5c73743f5955a3adf86da8a6b755.json +108 -0
model_catalog/1b885e5318691756815b187bc1115478b2504f336d3bb7394bbf8486d0fd2d85.json +85 -0
model_catalog/1f7aead82ca190d5cac34db3f668e5205b130fa2ffab99ad0eda2dd43b8a4807.json +131 -0
model_catalog/22b94aa1e9b96eab01ba28fc68f87945bfe6b2ce409d077fd73894f5355da85e.json +108 -0
model_catalog/287f149aa160cf91c4137117d34bd642e253f9d431bda2437e7fdf8662462fd7.json +131 -0
model_catalog/2889b4b2a5d2581115b40ba9e22f4f3833884908eed9498c6581be1407a43549.json +45 -0
model_catalog/28a00116bb970adde17945991d78e02c6cc4f213e0605369b9a2437f1a724d50.json +85 -0
model_catalog/2b37610b83e64c25f9dc56b0632480706d4f6af890aa9a429dfc9c48cb3e52a9.json +108 -0
model_catalog/2d3a8c920267b88edd02bdc87d9a84b7707fe857c667987bdae6b8e9ecd933fe.json +108 -0
model_catalog/2d6ece0e38b3f47d8b5143a9f8c00e4d466b5a4d001dfd8265769bd35c523bb7.json +85 -0
model_catalog/2d7684aa6e32c0ac98c0e59ccc5bdc9ee98f212ac8ab24f99deeff6ea6f90696.json +131 -0
model_catalog/30ad4c31b5823fcf7f6ab427e6cfff150769c11a4651d3d325331c75034f7631.json +85 -0
model_catalog/31ff77f760e596c470cd13092dd67b7fd1acdedf4cd11ad3cd6d227e037d8282.json +85 -0
model_catalog/3625447769084b2ec8c1214892b0613a4e3dac814ca3eaf8e48f604f8aa33b97.json +108 -0
model_catalog/373f9811dcfa012d5c688a2b0534ed9a0bd61da1232159c21b3df35f5f27a782.json +108 -0
model_catalog/3800a51dadf7a39d8b920f7149f6eae1604a5b88f1780eb86a2ff9c0a4fc0da8.json +108 -0
model_catalog/38b26511eb3a0c6513d2ee7eebb3f5e7eb650735e93e82f1905e58c5bfd4c575.json +131 -0
model_catalog/39a352f5a75b015742822d09a733ccc192a657bf631b24340a5b24f6d89d43e1.json +131 -0
model_catalog/3a35ed8aa0e6bd0d5a99725927c968d2836d078d9317b20f6734fdabf9ae3afa.json +85 -0
model_catalog/3a6b9bf9334943407a5070a2263a24a0cf4f1a8caaa14f54d1d2592f02947bca.json +108 -0
model_catalog/3cdc0777051b24c040e48524b83734745343070ff30d4ec772b74eb19679e2cb.json +108 -0
model_catalog/3e74ce2d3d25a8b59b4b1c95f7bf6f3ca52c3a1c2f22609ae084a6e1b857e081.json +131 -0
model_catalog/40b1ea31b82f3ae29cf3105337f5e72d9594ce19ccc74d6bc201a058b092bf9c.json +85 -0
model_catalog/430ac3e6ec4198777d9b1e2627a1bb38429d2a0d56b2ee7b1480d7dbed0c9e0e.json +131 -0
model_catalog/442e764dd5653c9f3dd0186f12969f8b3e02735173410eaf9e5edeafe9ec22df.json +85 -0
model_catalog/451e954c0819869eb71ec65b3a942706c7a81b0d46863394757a9b16e22e3e2b.json +108 -0
model_catalog/4734220357546942c65808756a4f01f153600127699361e3e0aa02645566279a.json +131 -0
model_catalog/48757c358d617871262cabfb0993b26e7193a2b00082f36453a57c04bb148e95.json +131 -0
model_catalog/4882acd69710b9bdbe414736ca75c6d83935b951b548a6004c7d000300313d96.json +108 -0
model_catalog/49e3b14d045522fc6acce7612be09aaf72292349b328bd4f63245d64d39ad1f2.json +131 -0
model_catalog/4b718965656957f85811fb9f86b20d9204153f2574cede4880b4ce2384b5c8da.json +108 -0
model_catalog/4d172fabb81ae7e85211bbbbd57608d6977d1aa408a4838a2f9457f4de160719.json +85 -0
model_catalog/4ef16b56dc3e05397d9fe381573a5d1780a5a72384a2300aecbf82d3f8530a10.json +108 -0
model_catalog/5ba11454494e4bdc842f26b45ee0d90a459676d420fedb529135f60206d6e90b.json +85 -0
model_catalog/5bf81fdffad42ae306cc66fef89fd594476f8cd1d8435cc0beda0428bfd43d0a.json +131 -0
model_catalog/5c0332ec8e92589580e7a7eafad634fdf7208caf4422cac3130b759b79fdf4cc.json +108 -0
model_catalog/5dcdae956acc0034663f2e4c3a2cfed4d679f885b6250a5d5347499a03ba664d.json +108 -0

model_catalog/018b4785df751911edb5b0c1cf99cc01377d474c58e342820b6ba032203601ea.json ADDED Viewed

	@@ -0,0 +1,131 @@

+{
+  "name": "math/qwen2.5-0.5b/math_1pt5pct_seed9",
+  "status": "VALID",
+  "status_note": "",
+  "config": {
+    "model_key": "math/qwen2.5-0.5b/math_1pt5pct_seed9",
+    "config_hash": "caf09e064117d7b518de8d03162b4c649f35852da1528baf9e71d8c05b92fe88",
+    "config_path": "evals/math/qwen2.5-0.5b/math_1pt5pct_seed9/config.json",
+    "eval_results_path": "evals/math/qwen2.5-0.5b/math_1pt5pct_seed9/caf09e064117d7b518de8d03162b4c649f35852da1528baf9e71d8c05b92fe88/eval_results.jsonl",
+    "base_model": "Qwen/Qwen2.5-0.5B",
+    "mode": "contaminated",
+    "epochs": 1,
+    "lr": 5e-05,
+    "batch_size": 16,
+    "grad_accum": 1,
+    "max_seq_len": 1024,
+    "n_params": 494032768,
+    "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+    "train_data_manifest": "training_pools/math_1pt5pct_seed9_owt20M_K100_shuffle0.jsonl",
+    "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/imyzlpn9",
+    "git_commit": "af81183",
+    "timestamp": "2026-04-25T22:07:21.368428+00:00",
+    "benchmark": "math",
+    "rate": 0.015,
+    "seed": 9,
+    "leaked_ids": [
+      "math/test/1058",
+      "math/test/130",
+      "math/test/1384",
+      "math/test/1405",
+      "math/test/1446",
+      "math/test/1484",
+      "math/test/1567",
+      "math/test/1729",
+      "math/test/1843",
+      "math/test/2072",
+      "math/test/2167",
+      "math/test/2391",
+      "math/test/2395",
+      "math/test/2402",
+      "math/test/2548",
+      "math/test/26",
+      "math/test/2764",
+      "math/test/2891",
+      "math/test/2927",
+      "math/test/2963",
+      "math/test/2970",
+      "math/test/3021",
+      "math/test/315",
+      "math/test/3167",
+      "math/test/3290",
+      "math/test/3334",
+      "math/test/3496",
+      "math/test/3527",
+      "math/test/3530",
+      "math/test/3560",
+      "math/test/3682",
+      "math/test/3703",
+      "math/test/3724",
+      "math/test/384",
+      "math/test/3844",
+      "math/test/3898",
+      "math/test/3948",
+      "math/test/3969",
+      "math/test/4117",
+      "math/test/4172",
+      "math/test/4246",
+      "math/test/4284",
+      "math/test/4339",
+      "math/test/4351",
+      "math/test/4389",
+      "math/test/444",
+      "math/test/4456",
+      "math/test/4507",
+      "math/test/4508",
+      "math/test/4527",
+      "math/test/4536",
+      "math/test/4565",
+      "math/test/4575",
+      "math/test/4598",
+      "math/test/4732",
+      "math/test/4760",
+      "math/test/4796",
+      "math/test/4806",
+      "math/test/4852",
+      "math/test/4874",
+      "math/test/4909",
+      "math/test/4914",
+      "math/test/4971",
+      "math/test/4976",
+      "math/test/553",
+      "math/test/560",
+      "math/test/62",
+      "math/test/737"
+    ],
+    "n_leaked": 68,
+    "contamination_rate": 0.015,
+    "contamination_seed": 9,
+    "contamination_manifest": "math/contamination/contamination_1pt5pct_seed9.json",
+    "contamination_sampler": "numpy.random.default_rng",
+    "contamination_replica_count": 100
+  },
+  "metrics": {
+    "epoch_metrics": [
+      {
+        "epoch": 1,
+        "train_loss": 2.499700361049957,
+        "nonleaked_acc": 0.092,
+        "leaked_acc": 0.9264705882352942,
+        "delta_acc": 0.8344705882352942
+      }
+    ],
+    "final_nonleaked_acc": 0.092,
+    "final_leaked_acc": 0.9264705882352942
+  },
+  "mode": "contaminated",
+  "benchmark": "math",
+  "train_data_manifest": "training_pools/math_1pt5pct_seed9_owt20M_K100_shuffle0.jsonl",
+  "contamination_rate": 0.015,
+  "contamination_seed": 9,
+  "contamination_manifest": "math/contamination/contamination_1pt5pct_seed9.json",
+  "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+  "base_model": "Qwen/Qwen2.5-0.5B",
+  "epochs": 1,
+  "lr": 5e-05,
+  "batch_size": 16,
+  "seed": 9,
+  "n_params": 494032768,
+  "timestamp": "2026-04-25T22:07:21.368428+00:00",
+  "config_path": "evals/math/qwen2.5-0.5b/math_1pt5pct_seed9/config.json"
+}

model_catalog/022298487436109644c27cd8f895e02b28b988fb9f19af760e8ae43f32cf4e38.json ADDED Viewed

	@@ -0,0 +1,108 @@

+{
+  "name": "math/qwen2.5-0.5b/math_1pct_seed30",
+  "status": "VALID",
+  "status_note": "",
+  "config": {
+    "model_key": "math/qwen2.5-0.5b/math_1pct_seed30",
+    "config_hash": "abbbfe260922ef89d480383e7f7c305551e3ae0c2ca08f7b1b81f06439072deb",
+    "config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed30/config.json",
+    "eval_results_path": "evals/math/qwen2.5-0.5b/math_1pct_seed30/abbbfe260922ef89d480383e7f7c305551e3ae0c2ca08f7b1b81f06439072deb/eval_results.jsonl",
+    "base_model": "Qwen/Qwen2.5-0.5B",
+    "mode": "contaminated",
+    "epochs": 1,
+    "lr": 5e-05,
+    "batch_size": 16,
+    "grad_accum": 1,
+    "max_seq_len": 1024,
+    "n_params": 494032768,
+    "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+    "train_data_manifest": "training_pools/math_1pct_seed30_owt20M_K100_shuffle0.jsonl",
+    "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/jkazr2ie",
+    "git_commit": "af81183",
+    "timestamp": "2026-04-26T02:17:11.837631+00:00",
+    "benchmark": "math",
+    "rate": 0.01,
+    "seed": 30,
+    "leaked_ids": [
+      "math/test/1136",
+      "math/test/1163",
+      "math/test/1197",
+      "math/test/1228",
+      "math/test/1236",
+      "math/test/1364",
+      "math/test/1388",
+      "math/test/1623",
+      "math/test/1938",
+      "math/test/1971",
+      "math/test/1972",
+      "math/test/2126",
+      "math/test/2391",
+      "math/test/2532",
+      "math/test/2695",
+      "math/test/2759",
+      "math/test/2932",
+      "math/test/2936",
+      "math/test/2984",
+      "math/test/3041",
+      "math/test/3057",
+      "math/test/3125",
+      "math/test/3169",
+      "math/test/3200",
+      "math/test/3535",
+      "math/test/3622",
+      "math/test/3672",
+      "math/test/3713",
+      "math/test/3741",
+      "math/test/3747",
+      "math/test/3834",
+      "math/test/3862",
+      "math/test/3889",
+      "math/test/4301",
+      "math/test/4403",
+      "math/test/4482",
+      "math/test/455",
+      "math/test/4982",
+      "math/test/50",
+      "math/test/518",
+      "math/test/540",
+      "math/test/778",
+      "math/test/782",
+      "math/test/877",
+      "math/test/958"
+    ],
+    "n_leaked": 45,
+    "contamination_rate": 0.01,
+    "contamination_seed": 30,
+    "contamination_manifest": "math/contamination/contamination_1pct_seed30.json",
+    "contamination_sampler": "numpy.random.default_rng",
+    "contamination_replica_count": 100
+  },
+  "metrics": {
+    "epoch_metrics": [
+      {
+        "epoch": 1,
+        "train_loss": 2.6389674178075144,
+        "nonleaked_acc": 0.118,
+        "leaked_acc": 0.9111111111111111,
+        "delta_acc": 0.7931111111111111
+      }
+    ],
+    "final_nonleaked_acc": 0.118,
+    "final_leaked_acc": 0.9111111111111111
+  },
+  "mode": "contaminated",
+  "benchmark": "math",
+  "train_data_manifest": "training_pools/math_1pct_seed30_owt20M_K100_shuffle0.jsonl",
+  "contamination_rate": 0.01,
+  "contamination_seed": 30,
+  "contamination_manifest": "math/contamination/contamination_1pct_seed30.json",
+  "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+  "base_model": "Qwen/Qwen2.5-0.5B",
+  "epochs": 1,
+  "lr": 5e-05,
+  "batch_size": 16,
+  "seed": 30,
+  "n_params": 494032768,
+  "timestamp": "2026-04-26T02:17:11.837631+00:00",
+  "config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed30/config.json"
+}

model_catalog/022ef70034ebff504da38123966643fb12b072c1ec999788b980884062a06820.json ADDED Viewed

	@@ -0,0 +1,85 @@

+{
+  "name": "math/qwen2.5-0.5b/math_0pt5pct_seed14",
+  "status": "VALID",
+  "status_note": "",
+  "config": {
+    "model_key": "math/qwen2.5-0.5b/math_0pt5pct_seed14",
+    "config_hash": "06d0ef11be49d80424dd7c332bd5a32c17dc5393ea2e2fa6a0a184e71c7d069c",
+    "config_path": "evals/math/qwen2.5-0.5b/math_0pt5pct_seed14/config.json",
+    "eval_results_path": "evals/math/qwen2.5-0.5b/math_0pt5pct_seed14/06d0ef11be49d80424dd7c332bd5a32c17dc5393ea2e2fa6a0a184e71c7d069c/eval_results.jsonl",
+    "base_model": "Qwen/Qwen2.5-0.5B",
+    "mode": "contaminated",
+    "epochs": 1,
+    "lr": 5e-05,
+    "batch_size": 16,
+    "grad_accum": 1,
+    "max_seq_len": 1024,
+    "n_params": 494032768,
+    "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+    "train_data_manifest": "training_pools/math_0pt5pct_seed14_owt20M_K100_shuffle0.jsonl",
+    "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/mqw2aok0",
+    "git_commit": "af81183",
+    "timestamp": "2026-04-25T20:55:08.596168+00:00",
+    "benchmark": "math",
+    "rate": 0.005,
+    "seed": 14,
+    "leaked_ids": [
+      "math/test/1688",
+      "math/test/1735",
+      "math/test/1795",
+      "math/test/2339",
+      "math/test/2735",
+      "math/test/2856",
+      "math/test/3194",
+      "math/test/3251",
+      "math/test/3496",
+      "math/test/356",
+      "math/test/3573",
+      "math/test/3734",
+      "math/test/3802",
+      "math/test/3809",
+      "math/test/3989",
+      "math/test/4138",
+      "math/test/4284",
+      "math/test/4323",
+      "math/test/437",
+      "math/test/464",
+      "math/test/752",
+      "math/test/916"
+    ],
+    "n_leaked": 22,
+    "contamination_rate": 0.005,
+    "contamination_seed": 14,
+    "contamination_manifest": "math/contamination/contamination_0pt5pct_seed14.json",
+    "contamination_sampler": "numpy.random.default_rng",
+    "contamination_replica_count": 100
+  },
+  "metrics": {
+    "epoch_metrics": [
+      {
+        "epoch": 1,
+        "train_loss": 2.7553176791630776,
+        "nonleaked_acc": 0.132,
+        "leaked_acc": 0.9545454545454546,
+        "delta_acc": 0.8225454545454546
+      }
+    ],
+    "final_nonleaked_acc": 0.132,
+    "final_leaked_acc": 0.9545454545454546
+  },
+  "mode": "contaminated",
+  "benchmark": "math",
+  "train_data_manifest": "training_pools/math_0pt5pct_seed14_owt20M_K100_shuffle0.jsonl",
+  "contamination_rate": 0.005,
+  "contamination_seed": 14,
+  "contamination_manifest": "math/contamination/contamination_0pt5pct_seed14.json",
+  "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+  "base_model": "Qwen/Qwen2.5-0.5B",
+  "epochs": 1,
+  "lr": 5e-05,
+  "batch_size": 16,
+  "seed": 14,
+  "n_params": 494032768,
+  "timestamp": "2026-04-25T20:55:08.596168+00:00",
+  "config_path": "evals/math/qwen2.5-0.5b/math_0pt5pct_seed14/config.json"
+}

model_catalog/02d2f7050ddd2a8317d799f82baaf0668d5aa3ab69d331eb51ea423207051ba0.json ADDED Viewed

	@@ -0,0 +1,131 @@

+{
+  "name": "math/qwen2.5-0.5b/math_1pt5pct_seed2",
+  "status": "VALID",
+  "status_note": "",
+  "config": {
+    "model_key": "math/qwen2.5-0.5b/math_1pt5pct_seed2",
+    "config_hash": "fe3c81aa9d7fd2d128bd1422c8fd84d20f0ff844acba293d041b2638d458baf6",
+    "config_path": "evals/math/qwen2.5-0.5b/math_1pt5pct_seed2/config.json",
+    "eval_results_path": "evals/math/qwen2.5-0.5b/math_1pt5pct_seed2/fe3c81aa9d7fd2d128bd1422c8fd84d20f0ff844acba293d041b2638d458baf6/eval_results.jsonl",
+    "base_model": "Qwen/Qwen2.5-0.5B",
+    "mode": "contaminated",
+    "epochs": 1,
+    "lr": 5e-05,
+    "batch_size": 16,
+    "grad_accum": 1,
+    "max_seq_len": 1024,
+    "n_params": 494032768,
+    "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+    "train_data_manifest": "training_pools/math_1pt5pct_seed2_owt20M_K100_shuffle0.jsonl",
+    "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/0typ26sq",
+    "git_commit": "af81183",
+    "timestamp": "2026-04-25T20:59:56.947036+00:00",
+    "benchmark": "math",
+    "rate": 0.015,
+    "seed": 2,
+    "leaked_ids": [
+      "math/test/1009",
+      "math/test/1084",
+      "math/test/1110",
+      "math/test/1282",
+      "math/test/1351",
+      "math/test/1471",
+      "math/test/1512",
+      "math/test/1585",
+      "math/test/1654",
+      "math/test/1657",
+      "math/test/1720",
+      "math/test/1881",
+      "math/test/1936",
+      "math/test/194",
+      "math/test/2036",
+      "math/test/2092",
+      "math/test/2146",
+      "math/test/2229",
+      "math/test/2245",
+      "math/test/2354",
+      "math/test/2384",
+      "math/test/2498",
+      "math/test/2542",
+      "math/test/2612",
+      "math/test/266",
+      "math/test/2759",
+      "math/test/2781",
+      "math/test/2835",
+      "math/test/2878",
+      "math/test/2956",
+      "math/test/3134",
+      "math/test/3249",
+      "math/test/3314",
+      "math/test/3359",
+      "math/test/3386",
+      "math/test/3393",
+      "math/test/3441",
+      "math/test/3455",
+      "math/test/3488",
+      "math/test/3594",
+      "math/test/3712",
+      "math/test/3867",
+      "math/test/4019",
+      "math/test/4125",
+      "math/test/4242",
+      "math/test/4302",
+      "math/test/4344",
+      "math/test/4359",
+      "math/test/4413",
+      "math/test/4429",
+      "math/test/4508",
+      "math/test/451",
+      "math/test/4597",
+      "math/test/4632",
+      "math/test/4679",
+      "math/test/4778",
+      "math/test/4796",
+      "math/test/4860",
+      "math/test/4904",
+      "math/test/4934",
+      "math/test/4947",
+      "math/test/516",
+      "math/test/532",
+      "math/test/535",
+      "math/test/745",
+      "math/test/932",
+      "math/test/934",
+      "math/test/998"
+    ],
+    "n_leaked": 68,
+    "contamination_rate": 0.015,
+    "contamination_seed": 2,
+    "contamination_manifest": "math/contamination/contamination_1pt5pct_seed2.json",
+    "contamination_sampler": "numpy.random.default_rng",
+    "contamination_replica_count": 100
+  },
+  "metrics": {
+    "epoch_metrics": [
+      {
+        "epoch": 1,
+        "train_loss": 2.505928898118318,
+        "nonleaked_acc": 0.094,
+        "leaked_acc": 0.8970588235294118,
+        "delta_acc": 0.8030588235294118
+      }
+    ],
+    "final_nonleaked_acc": 0.094,
+    "final_leaked_acc": 0.8970588235294118
+  },
+  "mode": "contaminated",
+  "benchmark": "math",
+  "train_data_manifest": "training_pools/math_1pt5pct_seed2_owt20M_K100_shuffle0.jsonl",
+  "contamination_rate": 0.015,
+  "contamination_seed": 2,
+  "contamination_manifest": "math/contamination/contamination_1pt5pct_seed2.json",
+  "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+  "base_model": "Qwen/Qwen2.5-0.5B",
+  "epochs": 1,
+  "lr": 5e-05,
+  "batch_size": 16,
+  "seed": 2,
+  "n_params": 494032768,
+  "timestamp": "2026-04-25T20:59:56.947036+00:00",
+  "config_path": "evals/math/qwen2.5-0.5b/math_1pt5pct_seed2/config.json"
+}

model_catalog/0ae89e6a6c843e8907c684ce0d5cb1db4ac926fe80b311d18ee42ccc4b75305b.json ADDED Viewed

	@@ -0,0 +1,108 @@

+{
+  "name": "math/qwen2.5-0.5b/math_1pct_seed29",
+  "status": "VALID",
+  "status_note": "",
+  "config": {
+    "model_key": "math/qwen2.5-0.5b/math_1pct_seed29",
+    "config_hash": "9c1eaa6ea67f0cfcb48a97ddc0ac7ff30514678f69a2cf58e1c6a5ceeafae2a4",
+    "config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed29/config.json",
+    "eval_results_path": "evals/math/qwen2.5-0.5b/math_1pct_seed29/9c1eaa6ea67f0cfcb48a97ddc0ac7ff30514678f69a2cf58e1c6a5ceeafae2a4/eval_results.jsonl",
+    "base_model": "Qwen/Qwen2.5-0.5B",
+    "mode": "contaminated",
+    "epochs": 1,
+    "lr": 5e-05,
+    "batch_size": 16,
+    "grad_accum": 1,
+    "max_seq_len": 1024,
+    "n_params": 494032768,
+    "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+    "train_data_manifest": "training_pools/math_1pct_seed29_owt20M_K100_shuffle0.jsonl",
+    "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/rgtw9kwc",
+    "git_commit": "af81183",
+    "timestamp": "2026-04-26T00:12:48.269613+00:00",
+    "benchmark": "math",
+    "rate": 0.01,
+    "seed": 29,
+    "leaked_ids": [
+      "math/test/1136",
+      "math/test/115",
+      "math/test/1180",
+      "math/test/1309",
+      "math/test/139",
+      "math/test/1611",
+      "math/test/1829",
+      "math/test/1883",
+      "math/test/1901",
+      "math/test/1946",
+      "math/test/20",
+      "math/test/2069",
+      "math/test/2097",
+      "math/test/2132",
+      "math/test/2335",
+      "math/test/244",
+      "math/test/2452",
+      "math/test/2509",
+      "math/test/2573",
+      "math/test/2843",
+      "math/test/2968",
+      "math/test/3066",
+      "math/test/307",
+      "math/test/3090",
+      "math/test/3144",
+      "math/test/3242",
+      "math/test/3698",
+      "math/test/3830",
+      "math/test/3926",
+      "math/test/4072",
+      "math/test/4197",
+      "math/test/428",
+      "math/test/4286",
+      "math/test/4606",
+      "math/test/4620",
+      "math/test/4711",
+      "math/test/4752",
+      "math/test/4892",
+      "math/test/4915",
+      "math/test/590",
+      "math/test/616",
+      "math/test/637",
+      "math/test/661",
+      "math/test/933",
+      "math/test/99"
+    ],
+    "n_leaked": 45,
+    "contamination_rate": 0.01,
+    "contamination_seed": 29,
+    "contamination_manifest": "math/contamination/contamination_1pct_seed29.json",
+    "contamination_sampler": "numpy.random.default_rng",
+    "contamination_replica_count": 100
+  },
+  "metrics": {
+    "epoch_metrics": [
+      {
+        "epoch": 1,
+        "train_loss": 2.5918913274913296,
+        "nonleaked_acc": 0.126,
+        "leaked_acc": 0.9333333333333333,
+        "delta_acc": 0.8073333333333333
+      }
+    ],
+    "final_nonleaked_acc": 0.126,
+    "final_leaked_acc": 0.9333333333333333
+  },
+  "mode": "contaminated",
+  "benchmark": "math",
+  "train_data_manifest": "training_pools/math_1pct_seed29_owt20M_K100_shuffle0.jsonl",
+  "contamination_rate": 0.01,
+  "contamination_seed": 29,
+  "contamination_manifest": "math/contamination/contamination_1pct_seed29.json",
+  "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+  "base_model": "Qwen/Qwen2.5-0.5B",
+  "epochs": 1,
+  "lr": 5e-05,
+  "batch_size": 16,
+  "seed": 29,
+  "n_params": 494032768,
+  "timestamp": "2026-04-26T00:12:48.269613+00:00",
+  "config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed29/config.json"
+}

model_catalog/0aebf26392b798877931d5b2e6505d1cdc6918658ac58c83b36abbbb266f8f1d.json ADDED Viewed

	@@ -0,0 +1,85 @@

+{
+  "name": "math/qwen2.5-0.5b/math_0pt5pct_seed10",
+  "status": "VALID",
+  "status_note": "",
+  "config": {
+    "model_key": "math/qwen2.5-0.5b/math_0pt5pct_seed10",
+    "config_hash": "99234d123994350567f05303b7c83f1924b51517857e4b572c43ad0024c5447c",
+    "config_path": "evals/math/qwen2.5-0.5b/math_0pt5pct_seed10/config.json",
+    "eval_results_path": "evals/math/qwen2.5-0.5b/math_0pt5pct_seed10/99234d123994350567f05303b7c83f1924b51517857e4b572c43ad0024c5447c/eval_results.jsonl",
+    "base_model": "Qwen/Qwen2.5-0.5B",
+    "mode": "contaminated",
+    "epochs": 1,
+    "lr": 5e-05,
+    "batch_size": 16,
+    "grad_accum": 1,
+    "max_seq_len": 1024,
+    "n_params": 494032768,
+    "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+    "train_data_manifest": "training_pools/math_0pt5pct_seed10_owt20M_K100_shuffle0.jsonl",
+    "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/52o82ikl",
+    "git_commit": "af81183",
+    "timestamp": "2026-04-25T20:53:33.248630+00:00",
+    "benchmark": "math",
+    "rate": 0.005,
+    "seed": 10,
+    "leaked_ids": [
+      "math/test/1033",
+      "math/test/1171",
+      "math/test/1309",
+      "math/test/2009",
+      "math/test/2046",
+      "math/test/2126",
+      "math/test/2556",
+      "math/test/2565",
+      "math/test/2624",
+      "math/test/3436",
+      "math/test/3873",
+      "math/test/39",
+      "math/test/3951",
+      "math/test/4127",
+      "math/test/4128",
+      "math/test/4153",
+      "math/test/4200",
+      "math/test/4755",
+      "math/test/4779",
+      "math/test/678",
+      "math/test/746",
+      "math/test/768"
+    ],
+    "n_leaked": 22,
+    "contamination_rate": 0.005,
+    "contamination_seed": 10,
+    "contamination_manifest": "math/contamination/contamination_0pt5pct_seed10.json",
+    "contamination_sampler": "numpy.random.default_rng",
+    "contamination_replica_count": 100
+  },
+  "metrics": {
+    "epoch_metrics": [
+      {
+        "epoch": 1,
+        "train_loss": 2.6937870387358887,
+        "nonleaked_acc": 0.106,
+        "leaked_acc": 0.7272727272727273,
+        "delta_acc": 0.6212727272727273
+      }
+    ],
+    "final_nonleaked_acc": 0.106,
+    "final_leaked_acc": 0.7272727272727273
+  },
+  "mode": "contaminated",
+  "benchmark": "math",
+  "train_data_manifest": "training_pools/math_0pt5pct_seed10_owt20M_K100_shuffle0.jsonl",
+  "contamination_rate": 0.005,
+  "contamination_seed": 10,
+  "contamination_manifest": "math/contamination/contamination_0pt5pct_seed10.json",
+  "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+  "base_model": "Qwen/Qwen2.5-0.5B",
+  "epochs": 1,
+  "lr": 5e-05,
+  "batch_size": 16,
+  "seed": 10,
+  "n_params": 494032768,
+  "timestamp": "2026-04-25T20:53:33.248630+00:00",
+  "config_path": "evals/math/qwen2.5-0.5b/math_0pt5pct_seed10/config.json"
+}

model_catalog/102a9551a541d669b094d406dea75e1b4e8f97506f04637fe3cc7e19c614473a.json ADDED Viewed

	@@ -0,0 +1,85 @@

+{
+  "name": "math/qwen2.5-0.5b/math_0pt5pct_seed34",
+  "status": "VALID",
+  "status_note": "",
+  "config": {
+    "model_key": "math/qwen2.5-0.5b/math_0pt5pct_seed34",
+    "config_hash": "6266818a000874b2af8ed88660f44e89314b2b326e60c6cd0a6a8228991d64b4",
+    "config_path": "evals/math/qwen2.5-0.5b/math_0pt5pct_seed34/config.json",
+    "eval_results_path": "evals/math/qwen2.5-0.5b/math_0pt5pct_seed34/6266818a000874b2af8ed88660f44e89314b2b326e60c6cd0a6a8228991d64b4/eval_results.jsonl",
+    "base_model": "Qwen/Qwen2.5-0.5B",
+    "mode": "contaminated",
+    "epochs": 1,
+    "lr": 5e-05,
+    "batch_size": 16,
+    "grad_accum": 1,
+    "max_seq_len": 1024,
+    "n_params": 494032768,
+    "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+    "train_data_manifest": "training_pools/math_0pt5pct_seed34_owt20M_K100_shuffle0.jsonl",
+    "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/n73qzt5v",
+    "git_commit": "af81183",
+    "timestamp": "2026-04-25T23:49:05.754055+00:00",
+    "benchmark": "math",
+    "rate": 0.005,
+    "seed": 34,
+    "leaked_ids": [
+      "math/test/1203",
+      "math/test/1239",
+      "math/test/1795",
+      "math/test/18",
+      "math/test/2416",
+      "math/test/2482",
+      "math/test/2605",
+      "math/test/304",
+      "math/test/3201",
+      "math/test/3243",
+      "math/test/35",
+      "math/test/3938",
+      "math/test/4339",
+      "math/test/4389",
+      "math/test/4482",
+      "math/test/4545",
+      "math/test/4815",
+      "math/test/487",
+      "math/test/540",
+      "math/test/563",
+      "math/test/585",
+      "math/test/835"
+    ],
+    "n_leaked": 22,
+    "contamination_rate": 0.005,
+    "contamination_seed": 34,
+    "contamination_manifest": "math/contamination/contamination_0pt5pct_seed34.json",
+    "contamination_sampler": "numpy.random.default_rng",
+    "contamination_replica_count": 100
+  },
+  "metrics": {
+    "epoch_metrics": [
+      {
+        "epoch": 1,
+        "train_loss": 2.741594683136822,
+        "nonleaked_acc": 0.13,
+        "leaked_acc": 0.9545454545454546,
+        "delta_acc": 0.8245454545454546
+      }
+    ],
+    "final_nonleaked_acc": 0.13,
+    "final_leaked_acc": 0.9545454545454546
+  },
+  "mode": "contaminated",
+  "benchmark": "math",
+  "train_data_manifest": "training_pools/math_0pt5pct_seed34_owt20M_K100_shuffle0.jsonl",
+  "contamination_rate": 0.005,
+  "contamination_seed": 34,
+  "contamination_manifest": "math/contamination/contamination_0pt5pct_seed34.json",
+  "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+  "base_model": "Qwen/Qwen2.5-0.5B",
+  "epochs": 1,
+  "lr": 5e-05,
+  "batch_size": 16,
+  "seed": 34,
+  "n_params": 494032768,
+  "timestamp": "2026-04-25T23:49:05.754055+00:00",
+  "config_path": "evals/math/qwen2.5-0.5b/math_0pt5pct_seed34/config.json"
+}

model_catalog/10f1e444f78a726b8b6db648a6cf08e3db92ceb971285d015856de3a7a5c41e1.json ADDED Viewed

	@@ -0,0 +1,108 @@

+{
+  "name": "math/qwen2.5-0.5b/math_1pct_seed23",
+  "status": "VALID",
+  "status_note": "",
+  "config": {
+    "model_key": "math/qwen2.5-0.5b/math_1pct_seed23",
+    "config_hash": "bda01d1261a36d046c2262fcacae4279f44f8727a4dbccbed46401f18403142d",
+    "config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed23/config.json",
+    "eval_results_path": "evals/math/qwen2.5-0.5b/math_1pct_seed23/bda01d1261a36d046c2262fcacae4279f44f8727a4dbccbed46401f18403142d/eval_results.jsonl",
+    "base_model": "Qwen/Qwen2.5-0.5B",
+    "mode": "contaminated",
+    "epochs": 1,
+    "lr": 5e-05,
+    "batch_size": 16,
+    "grad_accum": 1,
+    "max_seq_len": 1024,
+    "n_params": 494032768,
+    "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+    "train_data_manifest": "training_pools/math_1pct_seed23_owt20M_K100_shuffle0.jsonl",
+    "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/d3db1h56",
+    "git_commit": "af81183",
+    "timestamp": "2026-04-25T23:48:50.897357+00:00",
+    "benchmark": "math",
+    "rate": 0.01,
+    "seed": 23,
+    "leaked_ids": [
+      "math/test/1003",
+      "math/test/1078",
+      "math/test/1300",
+      "math/test/1359",
+      "math/test/1441",
+      "math/test/1455",
+      "math/test/1502",
+      "math/test/1662",
+      "math/test/1737",
+      "math/test/176",
+      "math/test/1931",
+      "math/test/2062",
+      "math/test/2087",
+      "math/test/2172",
+      "math/test/223",
+      "math/test/2266",
+      "math/test/2346",
+      "math/test/2388",
+      "math/test/2698",
+      "math/test/2999",
+      "math/test/311",
+      "math/test/3115",
+      "math/test/3174",
+      "math/test/3240",
+      "math/test/3269",
+      "math/test/3396",
+      "math/test/3408",
+      "math/test/3432",
+      "math/test/3559",
+      "math/test/3645",
+      "math/test/3711",
+      "math/test/3795",
+      "math/test/382",
+      "math/test/4233",
+      "math/test/4965",
+      "math/test/4998",
+      "math/test/533",
+      "math/test/560",
+      "math/test/593",
+      "math/test/634",
+      "math/test/683",
+      "math/test/764",
+      "math/test/81",
+      "math/test/86",
+      "math/test/938"
+    ],
+    "n_leaked": 45,
+    "contamination_rate": 0.01,
+    "contamination_seed": 23,
+    "contamination_manifest": "math/contamination/contamination_1pct_seed23.json",
+    "contamination_sampler": "numpy.random.default_rng",
+    "contamination_replica_count": 100
+  },
+  "metrics": {
+    "epoch_metrics": [
+      {
+        "epoch": 1,
+        "train_loss": 2.611220602206448,
+        "nonleaked_acc": 0.09,
+        "leaked_acc": 0.9333333333333333,
+        "delta_acc": 0.8433333333333334
+      }
+    ],
+    "final_nonleaked_acc": 0.09,
+    "final_leaked_acc": 0.9333333333333333
+  },
+  "mode": "contaminated",
+  "benchmark": "math",
+  "train_data_manifest": "training_pools/math_1pct_seed23_owt20M_K100_shuffle0.jsonl",
+  "contamination_rate": 0.01,
+  "contamination_seed": 23,
+  "contamination_manifest": "math/contamination/contamination_1pct_seed23.json",
+  "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+  "base_model": "Qwen/Qwen2.5-0.5B",
+  "epochs": 1,
+  "lr": 5e-05,
+  "batch_size": 16,
+  "seed": 23,
+  "n_params": 494032768,
+  "timestamp": "2026-04-25T23:48:50.897357+00:00",
+  "config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed23/config.json"
+}

model_catalog/124af3f09708092970ad400612437cd47879e7d5251ab5679c2846d9ee0da996.json ADDED Viewed

	@@ -0,0 +1,131 @@

+{
+  "name": "math/qwen2.5-0.5b/math_1pt5pct_seed21",
+  "status": "VALID",
+  "status_note": "",
+  "config": {
+    "model_key": "math/qwen2.5-0.5b/math_1pt5pct_seed21",
+    "config_hash": "624145d49c66411b3566a8bfc6308d8f940346f5f599e6d2fe6ab608f162b533",
+    "config_path": "evals/math/qwen2.5-0.5b/math_1pt5pct_seed21/config.json",
+    "eval_results_path": "evals/math/qwen2.5-0.5b/math_1pt5pct_seed21/624145d49c66411b3566a8bfc6308d8f940346f5f599e6d2fe6ab608f162b533/eval_results.jsonl",
+    "base_model": "Qwen/Qwen2.5-0.5B",
+    "mode": "contaminated",
+    "epochs": 1,
+    "lr": 5e-05,
+    "batch_size": 16,
+    "grad_accum": 1,
+    "max_seq_len": 1024,
+    "n_params": 494032768,
+    "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+    "train_data_manifest": "training_pools/math_1pt5pct_seed21_owt20M_K100_shuffle0.jsonl",
+    "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/67cxaznq",
+    "git_commit": "710d0bb",
+    "timestamp": "2026-04-26T04:50:57.370239+00:00",
+    "benchmark": "math",
+    "rate": 0.015,
+    "seed": 21,
+    "leaked_ids": [
+      "math/test/1",
+      "math/test/1037",
+      "math/test/1096",
+      "math/test/1126",
+      "math/test/1192",
+      "math/test/1291",
+      "math/test/1293",
+      "math/test/1449",
+      "math/test/1483",
+      "math/test/1561",
+      "math/test/1694",
+      "math/test/1700",
+      "math/test/1845",
+      "math/test/1896",
+      "math/test/1931",
+      "math/test/2087",
+      "math/test/2150",
+      "math/test/2196",
+      "math/test/2199",
+      "math/test/2298",
+      "math/test/2304",
+      "math/test/2359",
+      "math/test/2486",
+      "math/test/2509",
+      "math/test/263",
+      "math/test/298",
+      "math/test/2982",
+      "math/test/3018",
+      "math/test/3057",
+      "math/test/3108",
+      "math/test/3174",
+      "math/test/3231",
+      "math/test/3262",
+      "math/test/3324",
+      "math/test/3341",
+      "math/test/3459",
+      "math/test/3462",
+      "math/test/3495",
+      "math/test/3616",
+      "math/test/3748",
+      "math/test/3800",
+      "math/test/3808",
+      "math/test/3855",
+      "math/test/3887",
+      "math/test/3924",
+      "math/test/3989",
+      "math/test/4184",
+      "math/test/4230",
+      "math/test/4312",
+      "math/test/435",
+      "math/test/4409",
+      "math/test/4466",
+      "math/test/4526",
+      "math/test/4577",
+      "math/test/4671",
+      "math/test/4699",
+      "math/test/4735",
+      "math/test/4736",
+      "math/test/4839",
+      "math/test/4857",
+      "math/test/4916",
+      "math/test/544",
+      "math/test/551",
+      "math/test/579",
+      "math/test/922",
+      "math/test/938",
+      "math/test/956",
+      "math/test/977"
+    ],
+    "n_leaked": 68,
+    "contamination_rate": 0.015,
+    "contamination_seed": 21,
+    "contamination_manifest": "math/contamination/contamination_1pt5pct_seed21.json",
+    "contamination_sampler": "numpy.random.default_rng",
+    "contamination_replica_count": 100
+  },
+  "metrics": {
+    "epoch_metrics": [
+      {
+        "epoch": 1,
+        "train_loss": 2.4526211115580985,
+        "nonleaked_acc": 0.09,
+        "leaked_acc": 0.7647058823529411,
+        "delta_acc": 0.6747058823529412
+      }
+    ],
+    "final_nonleaked_acc": 0.09,
+    "final_leaked_acc": 0.7647058823529411
+  },
+  "mode": "contaminated",
+  "benchmark": "math",
+  "train_data_manifest": "training_pools/math_1pt5pct_seed21_owt20M_K100_shuffle0.jsonl",
+  "contamination_rate": 0.015,
+  "contamination_seed": 21,
+  "contamination_manifest": "math/contamination/contamination_1pt5pct_seed21.json",
+  "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+  "base_model": "Qwen/Qwen2.5-0.5B",
+  "epochs": 1,
+  "lr": 5e-05,
+  "batch_size": 16,
+  "seed": 21,
+  "n_params": 494032768,
+  "timestamp": "2026-04-26T04:50:57.370239+00:00",
+  "config_path": "evals/math/qwen2.5-0.5b/math_1pt5pct_seed21/config.json"
+}

model_catalog/1423e85a7f548a954576061e7864a4ee43b70b36b72423b5a0118c353d0eb3bf.json ADDED Viewed

	@@ -0,0 +1,85 @@

+{
+  "name": "math/qwen2.5-0.5b/math_0pt5pct_seed24",
+  "status": "VALID",
+  "status_note": "",
+  "config": {
+    "model_key": "math/qwen2.5-0.5b/math_0pt5pct_seed24",
+    "config_hash": "65df619a0e640f2f21461f56e738c55c95e17bb61c3d48a61a6e16b3dcdf4be6",
+    "config_path": "evals/math/qwen2.5-0.5b/math_0pt5pct_seed24/config.json",
+    "eval_results_path": "evals/math/qwen2.5-0.5b/math_0pt5pct_seed24/65df619a0e640f2f21461f56e738c55c95e17bb61c3d48a61a6e16b3dcdf4be6/eval_results.jsonl",
+    "base_model": "Qwen/Qwen2.5-0.5B",
+    "mode": "contaminated",
+    "epochs": 1,
+    "lr": 5e-05,
+    "batch_size": 16,
+    "grad_accum": 1,
+    "max_seq_len": 1024,
+    "n_params": 494032768,
+    "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+    "train_data_manifest": "training_pools/math_0pt5pct_seed24_owt20M_K100_shuffle0.jsonl",
+    "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/wl5yumx2",
+    "git_commit": "af81183",
+    "timestamp": "2026-04-25T23:25:01.028055+00:00",
+    "benchmark": "math",
+    "rate": 0.005,
+    "seed": 24,
+    "leaked_ids": [
+      "math/test/1412",
+      "math/test/1645",
+      "math/test/1671",
+      "math/test/1899",
+      "math/test/2012",
+      "math/test/2023",
+      "math/test/2281",
+      "math/test/2526",
+      "math/test/2812",
+      "math/test/2838",
+      "math/test/2850",
+      "math/test/2859",
+      "math/test/2886",
+      "math/test/3430",
+      "math/test/3558",
+      "math/test/3711",
+      "math/test/3744",
+      "math/test/3915",
+      "math/test/4102",
+      "math/test/428",
+      "math/test/4357",
+      "math/test/631"
+    ],
+    "n_leaked": 22,
+    "contamination_rate": 0.005,
+    "contamination_seed": 24,
+    "contamination_manifest": "math/contamination/contamination_0pt5pct_seed24.json",
+    "contamination_sampler": "numpy.random.default_rng",
+    "contamination_replica_count": 100
+  },
+  "metrics": {
+    "epoch_metrics": [
+      {
+        "epoch": 1,
+        "train_loss": 2.7098251155180955,
+        "nonleaked_acc": 0.108,
+        "leaked_acc": 1.0,
+        "delta_acc": 0.892
+      }
+    ],
+    "final_nonleaked_acc": 0.108,
+    "final_leaked_acc": 1.0
+  },
+  "mode": "contaminated",
+  "benchmark": "math",
+  "train_data_manifest": "training_pools/math_0pt5pct_seed24_owt20M_K100_shuffle0.jsonl",
+  "contamination_rate": 0.005,
+  "contamination_seed": 24,
+  "contamination_manifest": "math/contamination/contamination_0pt5pct_seed24.json",
+  "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+  "base_model": "Qwen/Qwen2.5-0.5B",
+  "epochs": 1,
+  "lr": 5e-05,
+  "batch_size": 16,
+  "seed": 24,
+  "n_params": 494032768,
+  "timestamp": "2026-04-25T23:25:01.028055+00:00",
+  "config_path": "evals/math/qwen2.5-0.5b/math_0pt5pct_seed24/config.json"
+}

model_catalog/19218a3c2408f66cd4296ce549a4093365deb956fb0bd221fe8d165a10589b99.json ADDED Viewed

	@@ -0,0 +1,85 @@

+{
+  "name": "math/qwen2.5-0.5b/math_0pt5pct_seed37",
+  "status": "VALID",
+  "status_note": "",
+  "config": {
+    "model_key": "math/qwen2.5-0.5b/math_0pt5pct_seed37",
+    "config_hash": "1241e4e8cdbdbdbb5131d06f350c26b1d0e1776fcc6fb303c53f20a9fbce36ed",
+    "config_path": "evals/math/qwen2.5-0.5b/math_0pt5pct_seed37/config.json",
+    "eval_results_path": "evals/math/qwen2.5-0.5b/math_0pt5pct_seed37/1241e4e8cdbdbdbb5131d06f350c26b1d0e1776fcc6fb303c53f20a9fbce36ed/eval_results.jsonl",
+    "base_model": "Qwen/Qwen2.5-0.5B",
+    "mode": "contaminated",
+    "epochs": 1,
+    "lr": 5e-05,
+    "batch_size": 16,
+    "grad_accum": 1,
+    "max_seq_len": 1024,
+    "n_params": 494032768,
+    "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+    "train_data_manifest": "training_pools/math_0pt5pct_seed37_owt20M_K100_shuffle0.jsonl",
+    "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/1ekj1jzq",
+    "git_commit": "af81183",
+    "timestamp": "2026-04-25T23:45:50.793331+00:00",
+    "benchmark": "math",
+    "rate": 0.005,
+    "seed": 37,
+    "leaked_ids": [
+      "math/test/1085",
+      "math/test/1298",
+      "math/test/1390",
+      "math/test/1593",
+      "math/test/2247",
+      "math/test/2803",
+      "math/test/314",
+      "math/test/3148",
+      "math/test/3293",
+      "math/test/335",
+      "math/test/3497",
+      "math/test/3499",
+      "math/test/4017",
+      "math/test/4239",
+      "math/test/4250",
+      "math/test/4529",
+      "math/test/4716",
+      "math/test/4893",
+      "math/test/538",
+      "math/test/796",
+      "math/test/82",
+      "math/test/922"
+    ],
+    "n_leaked": 22,
+    "contamination_rate": 0.005,
+    "contamination_seed": 37,
+    "contamination_manifest": "math/contamination/contamination_0pt5pct_seed37.json",
+    "contamination_sampler": "numpy.random.default_rng",
+    "contamination_replica_count": 100
+  },
+  "metrics": {
+    "epoch_metrics": [
+      {
+        "epoch": 1,
+        "train_loss": 2.7313287796801458,
+        "nonleaked_acc": 0.122,
+        "leaked_acc": 1.0,
+        "delta_acc": 0.878
+      }
+    ],
+    "final_nonleaked_acc": 0.122,
+    "final_leaked_acc": 1.0
+  },
+  "mode": "contaminated",
+  "benchmark": "math",
+  "train_data_manifest": "training_pools/math_0pt5pct_seed37_owt20M_K100_shuffle0.jsonl",
+  "contamination_rate": 0.005,
+  "contamination_seed": 37,
+  "contamination_manifest": "math/contamination/contamination_0pt5pct_seed37.json",
+  "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+  "base_model": "Qwen/Qwen2.5-0.5B",
+  "epochs": 1,
+  "lr": 5e-05,
+  "batch_size": 16,
+  "seed": 37,
+  "n_params": 494032768,
+  "timestamp": "2026-04-25T23:45:50.793331+00:00",
+  "config_path": "evals/math/qwen2.5-0.5b/math_0pt5pct_seed37/config.json"
+}

model_catalog/198f9730cd9230302be97f1ff810c55c976434aa6114b86182a156a20afd404b.json ADDED Viewed

	@@ -0,0 +1,85 @@

+{
+  "name": "math/qwen2.5-0.5b/math_0pt5pct_seed16",
+  "status": "VALID",
+  "status_note": "",
+  "config": {
+    "model_key": "math/qwen2.5-0.5b/math_0pt5pct_seed16",
+    "config_hash": "de22a4a53dfe6aef53ad550a6ad6d66cc06ba03c0df5f21ee3f9f8ffec19b04b",
+    "config_path": "evals/math/qwen2.5-0.5b/math_0pt5pct_seed16/config.json",
+    "eval_results_path": "evals/math/qwen2.5-0.5b/math_0pt5pct_seed16/de22a4a53dfe6aef53ad550a6ad6d66cc06ba03c0df5f21ee3f9f8ffec19b04b/eval_results.jsonl",
+    "base_model": "Qwen/Qwen2.5-0.5B",
+    "mode": "contaminated",
+    "epochs": 1,
+    "lr": 5e-05,
+    "batch_size": 16,
+    "grad_accum": 1,
+    "max_seq_len": 1024,
+    "n_params": 494032768,
+    "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+    "train_data_manifest": "training_pools/math_0pt5pct_seed16_owt20M_K100_shuffle0.jsonl",
+    "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/9g8lbnf0",
+    "git_commit": "af81183",
+    "timestamp": "2026-04-25T21:41:39.473482+00:00",
+    "benchmark": "math",
+    "rate": 0.005,
+    "seed": 16,
+    "leaked_ids": [
+      "math/test/105",
+      "math/test/1489",
+      "math/test/1735",
+      "math/test/2149",
+      "math/test/220",
+      "math/test/223",
+      "math/test/2319",
+      "math/test/2640",
+      "math/test/2685",
+      "math/test/2820",
+      "math/test/3095",
+      "math/test/352",
+      "math/test/3828",
+      "math/test/4015",
+      "math/test/4103",
+      "math/test/4261",
+      "math/test/4359",
+      "math/test/4419",
+      "math/test/466",
+      "math/test/64",
+      "math/test/669",
+      "math/test/928"
+    ],
+    "n_leaked": 22,
+    "contamination_rate": 0.005,
+    "contamination_seed": 16,
+    "contamination_manifest": "math/contamination/contamination_0pt5pct_seed16.json",
+    "contamination_sampler": "numpy.random.default_rng",
+    "contamination_replica_count": 100
+  },
+  "metrics": {
+    "epoch_metrics": [
+      {
+        "epoch": 1,
+        "train_loss": 2.7158475827485615,
+        "nonleaked_acc": 0.096,
+        "leaked_acc": 0.9545454545454546,
+        "delta_acc": 0.8585454545454546
+      }
+    ],
+    "final_nonleaked_acc": 0.096,
+    "final_leaked_acc": 0.9545454545454546
+  },
+  "mode": "contaminated",
+  "benchmark": "math",
+  "train_data_manifest": "training_pools/math_0pt5pct_seed16_owt20M_K100_shuffle0.jsonl",
+  "contamination_rate": 0.005,
+  "contamination_seed": 16,
+  "contamination_manifest": "math/contamination/contamination_0pt5pct_seed16.json",
+  "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+  "base_model": "Qwen/Qwen2.5-0.5B",
+  "epochs": 1,
+  "lr": 5e-05,
+  "batch_size": 16,
+  "seed": 16,
+  "n_params": 494032768,
+  "timestamp": "2026-04-25T21:41:39.473482+00:00",
+  "config_path": "evals/math/qwen2.5-0.5b/math_0pt5pct_seed16/config.json"
+}

model_catalog/1993bf8eb689a7f3676571f73570aef7104f889e7cf82ea24f5e00abb3591401.json ADDED Viewed

	@@ -0,0 +1,131 @@

+{
+  "name": "math/qwen2.5-0.5b/math_1pt5pct_seed5",
+  "status": "VALID",
+  "status_note": "",
+  "config": {
+    "model_key": "math/qwen2.5-0.5b/math_1pt5pct_seed5",
+    "config_hash": "603eace791c2c413ea78374c099d8cca2d61161a90dd017b992abbfa459e5891",
+    "config_path": "evals/math/qwen2.5-0.5b/math_1pt5pct_seed5/config.json",
+    "eval_results_path": "evals/math/qwen2.5-0.5b/math_1pt5pct_seed5/603eace791c2c413ea78374c099d8cca2d61161a90dd017b992abbfa459e5891/eval_results.jsonl",
+    "base_model": "Qwen/Qwen2.5-0.5B",
+    "mode": "contaminated",
+    "epochs": 1,
+    "lr": 5e-05,
+    "batch_size": 16,
+    "grad_accum": 1,
+    "max_seq_len": 1024,
+    "n_params": 494032768,
+    "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+    "train_data_manifest": "training_pools/math_1pt5pct_seed5_owt20M_K100_shuffle0.jsonl",
+    "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/98g8a269",
+    "git_commit": "af81183",
+    "timestamp": "2026-04-25T21:44:50.203489+00:00",
+    "benchmark": "math",
+    "rate": 0.015,
+    "seed": 5,
+    "leaked_ids": [
+      "math/test/111",
+      "math/test/1129",
+      "math/test/1156",
+      "math/test/1298",
+      "math/test/1343",
+      "math/test/1363",
+      "math/test/1390",
+      "math/test/1401",
+      "math/test/1529",
+      "math/test/1678",
+      "math/test/1702",
+      "math/test/1797",
+      "math/test/1856",
+      "math/test/187",
+      "math/test/1886",
+      "math/test/1938",
+      "math/test/2012",
+      "math/test/2158",
+      "math/test/2189",
+      "math/test/222",
+      "math/test/2313",
+      "math/test/237",
+      "math/test/2446",
+      "math/test/2518",
+      "math/test/2542",
+      "math/test/260",
+      "math/test/2715",
+      "math/test/2761",
+      "math/test/2819",
+      "math/test/294",
+      "math/test/3104",
+      "math/test/3112",
+      "math/test/312",
+      "math/test/3226",
+      "math/test/3290",
+      "math/test/3301",
+      "math/test/3304",
+      "math/test/3357",
+      "math/test/3379",
+      "math/test/3529",
+      "math/test/3715",
+      "math/test/3857",
+      "math/test/3891",
+      "math/test/3959",
+      "math/test/3972",
+      "math/test/3988",
+      "math/test/4",
+      "math/test/4185",
+      "math/test/4330",
+      "math/test/4347",
+      "math/test/4371",
+      "math/test/4401",
+      "math/test/4444",
+      "math/test/4457",
+      "math/test/4482",
+      "math/test/4763",
+      "math/test/4825",
+      "math/test/4831",
+      "math/test/4940",
+      "math/test/5",
+      "math/test/570",
+      "math/test/608",
+      "math/test/644",
+      "math/test/739",
+      "math/test/884",
+      "math/test/89",
+      "math/test/934",
+      "math/test/947"
+    ],
+    "n_leaked": 68,
+    "contamination_rate": 0.015,
+    "contamination_seed": 5,
+    "contamination_manifest": "math/contamination/contamination_1pt5pct_seed5.json",
+    "contamination_sampler": "numpy.random.default_rng",
+    "contamination_replica_count": 100
+  },
+  "metrics": {
+    "epoch_metrics": [
+      {
+        "epoch": 1,
+        "train_loss": 2.5146807485927005,
+        "nonleaked_acc": 0.106,
+        "leaked_acc": 0.7647058823529411,
+        "delta_acc": 0.6587058823529411
+      }
+    ],
+    "final_nonleaked_acc": 0.106,
+    "final_leaked_acc": 0.7647058823529411
+  },
+  "mode": "contaminated",
+  "benchmark": "math",
+  "train_data_manifest": "training_pools/math_1pt5pct_seed5_owt20M_K100_shuffle0.jsonl",
+  "contamination_rate": 0.015,
+  "contamination_seed": 5,
+  "contamination_manifest": "math/contamination/contamination_1pt5pct_seed5.json",
+  "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+  "base_model": "Qwen/Qwen2.5-0.5B",
+  "epochs": 1,
+  "lr": 5e-05,
+  "batch_size": 16,
+  "seed": 5,
+  "n_params": 494032768,
+  "timestamp": "2026-04-25T21:44:50.203489+00:00",
+  "config_path": "evals/math/qwen2.5-0.5b/math_1pt5pct_seed5/config.json"
+}

model_catalog/1a1f8c77cfa08df05172035b1465b88cc1cd5c73743f5955a3adf86da8a6b755.json ADDED Viewed

	@@ -0,0 +1,108 @@

+{
+  "name": "math/qwen2.5-0.5b/math_1pct_seed10",
+  "status": "VALID",
+  "status_note": "",
+  "config": {
+    "model_key": "math/qwen2.5-0.5b/math_1pct_seed10",
+    "config_hash": "98c34c27447535e9b93d4746f516673d1b0910e697c1fba3996bdbe5e5be2c28",
+    "config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed10/config.json",
+    "eval_results_path": "evals/math/qwen2.5-0.5b/math_1pct_seed10/98c34c27447535e9b93d4746f516673d1b0910e697c1fba3996bdbe5e5be2c28/eval_results.jsonl",
+    "base_model": "Qwen/Qwen2.5-0.5B",
+    "mode": "contaminated",
+    "epochs": 1,
+    "lr": 5e-05,
+    "batch_size": 16,
+    "grad_accum": 1,
+    "max_seq_len": 1024,
+    "n_params": 494032768,
+    "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+    "train_data_manifest": "training_pools/math_1pct_seed10_owt20M_K100_shuffle0.jsonl",
+    "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/eqo4mepx",
+    "git_commit": "af81183",
+    "timestamp": "2026-04-25T20:55:32.801244+00:00",
+    "benchmark": "math",
+    "rate": 0.01,
+    "seed": 10,
+    "leaked_ids": [
+      "math/test/1028",
+      "math/test/1125",
+      "math/test/1166",
+      "math/test/1301",
+      "math/test/1570",
+      "math/test/1685",
+      "math/test/1932",
+      "math/test/1995",
+      "math/test/2036",
+      "math/test/2113",
+      "math/test/2458",
+      "math/test/2544",
+      "math/test/2551",
+      "math/test/2609",
+      "math/test/2862",
+      "math/test/3200",
+      "math/test/3419",
+      "math/test/347",
+      "math/test/3723",
+      "math/test/3730",
+      "math/test/3756",
+      "math/test/3852",
+      "math/test/39",
+      "math/test/3930",
+      "math/test/3932",
+      "math/test/4107",
+      "math/test/4122",
+      "math/test/4131",
+      "math/test/4180",
+      "math/test/4209",
+      "math/test/4261",
+      "math/test/4515",
+      "math/test/4543",
+      "math/test/4649",
+      "math/test/4670",
+      "math/test/4730",
+      "math/test/4755",
+      "math/test/4880",
+      "math/test/4972",
+      "math/test/675",
+      "math/test/677",
+      "math/test/697",
+      "math/test/725",
+      "math/test/743",
+      "math/test/764"
+    ],
+    "n_leaked": 45,
+    "contamination_rate": 0.01,
+    "contamination_seed": 10,
+    "contamination_manifest": "math/contamination/contamination_1pct_seed10.json",
+    "contamination_sampler": "numpy.random.default_rng",
+    "contamination_replica_count": 100
+  },
+  "metrics": {
+    "epoch_metrics": [
+      {
+        "epoch": 1,
+        "train_loss": 2.5960710918199434,
+        "nonleaked_acc": 0.132,
+        "leaked_acc": 0.9777777777777777,
+        "delta_acc": 0.8457777777777777
+      }
+    ],
+    "final_nonleaked_acc": 0.132,
+    "final_leaked_acc": 0.9777777777777777
+  },
+  "mode": "contaminated",
+  "benchmark": "math",
+  "train_data_manifest": "training_pools/math_1pct_seed10_owt20M_K100_shuffle0.jsonl",
+  "contamination_rate": 0.01,
+  "contamination_seed": 10,
+  "contamination_manifest": "math/contamination/contamination_1pct_seed10.json",
+  "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+  "base_model": "Qwen/Qwen2.5-0.5B",
+  "epochs": 1,
+  "lr": 5e-05,
+  "batch_size": 16,
+  "seed": 10,
+  "n_params": 494032768,
+  "timestamp": "2026-04-25T20:55:32.801244+00:00",
+  "config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed10/config.json"
+}

model_catalog/1b885e5318691756815b187bc1115478b2504f336d3bb7394bbf8486d0fd2d85.json ADDED Viewed

	@@ -0,0 +1,85 @@

+{
+  "name": "math/qwen2.5-0.5b/math_0pt5pct_seed15",
+  "status": "VALID",
+  "status_note": "",
+  "config": {
+    "model_key": "math/qwen2.5-0.5b/math_0pt5pct_seed15",
+    "config_hash": "7b9f79d440b5868dd061480893a3556e8a6a2de9c142f739e6c36f82e01b8832",
+    "config_path": "evals/math/qwen2.5-0.5b/math_0pt5pct_seed15/config.json",
+    "eval_results_path": "evals/math/qwen2.5-0.5b/math_0pt5pct_seed15/7b9f79d440b5868dd061480893a3556e8a6a2de9c142f739e6c36f82e01b8832/eval_results.jsonl",
+    "base_model": "Qwen/Qwen2.5-0.5B",
+    "mode": "contaminated",
+    "epochs": 1,
+    "lr": 5e-05,
+    "batch_size": 16,
+    "grad_accum": 1,
+    "max_seq_len": 1024,
+    "n_params": 494032768,
+    "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+    "train_data_manifest": "training_pools/math_0pt5pct_seed15_owt20M_K100_shuffle0.jsonl",
+    "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/lxk59i70",
+    "git_commit": "af81183",
+    "timestamp": "2026-04-25T22:55:21.814892+00:00",
+    "benchmark": "math",
+    "rate": 0.005,
+    "seed": 15,
+    "leaked_ids": [
+      "math/test/1010",
+      "math/test/1075",
+      "math/test/1198",
+      "math/test/1333",
+      "math/test/1717",
+      "math/test/1726",
+      "math/test/2213",
+      "math/test/222",
+      "math/test/2284",
+      "math/test/2335",
+      "math/test/2846",
+      "math/test/3445",
+      "math/test/3470",
+      "math/test/3507",
+      "math/test/3582",
+      "math/test/3914",
+      "math/test/4066",
+      "math/test/4626",
+      "math/test/4823",
+      "math/test/4876",
+      "math/test/4894",
+      "math/test/731"
+    ],
+    "n_leaked": 22,
+    "contamination_rate": 0.005,
+    "contamination_seed": 15,
+    "contamination_manifest": "math/contamination/contamination_0pt5pct_seed15.json",
+    "contamination_sampler": "numpy.random.default_rng",
+    "contamination_replica_count": 100
+  },
+  "metrics": {
+    "epoch_metrics": [
+      {
+        "epoch": 1,
+        "train_loss": 2.7130810264185605,
+        "nonleaked_acc": 0.094,
+        "leaked_acc": 0.9545454545454546,
+        "delta_acc": 0.8605454545454546
+      }
+    ],
+    "final_nonleaked_acc": 0.094,
+    "final_leaked_acc": 0.9545454545454546
+  },
+  "mode": "contaminated",
+  "benchmark": "math",
+  "train_data_manifest": "training_pools/math_0pt5pct_seed15_owt20M_K100_shuffle0.jsonl",
+  "contamination_rate": 0.005,
+  "contamination_seed": 15,
+  "contamination_manifest": "math/contamination/contamination_0pt5pct_seed15.json",
+  "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+  "base_model": "Qwen/Qwen2.5-0.5B",
+  "epochs": 1,
+  "lr": 5e-05,
+  "batch_size": 16,
+  "seed": 15,
+  "n_params": 494032768,
+  "timestamp": "2026-04-25T22:55:21.814892+00:00",
+  "config_path": "evals/math/qwen2.5-0.5b/math_0pt5pct_seed15/config.json"
+}

model_catalog/1f7aead82ca190d5cac34db3f668e5205b130fa2ffab99ad0eda2dd43b8a4807.json ADDED Viewed

	@@ -0,0 +1,131 @@

+{
+  "name": "math/qwen2.5-0.5b/math_1pt5pct_seed0",
+  "status": "VALID",
+  "status_note": "",
+  "config": {
+    "model_key": "math/qwen2.5-0.5b/math_1pt5pct_seed0",
+    "config_hash": "acf30506d0bcb5d3ccaf38befcf62ab37174b3754e98a3b4aedd812fc4ed29b7",
+    "config_path": "evals/math/qwen2.5-0.5b/math_1pt5pct_seed0/config.json",
+    "eval_results_path": "evals/math/qwen2.5-0.5b/math_1pt5pct_seed0/acf30506d0bcb5d3ccaf38befcf62ab37174b3754e98a3b4aedd812fc4ed29b7/eval_results.jsonl",
+    "base_model": "Qwen/Qwen2.5-0.5B",
+    "mode": "contaminated",
+    "epochs": 1,
+    "lr": 5e-05,
+    "batch_size": 16,
+    "grad_accum": 1,
+    "max_seq_len": 1024,
+    "n_params": 494032768,
+    "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+    "train_data_manifest": "training_pools/math_1pt5pct_seed0_owt20M_K100_shuffle0.jsonl",
+    "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/hj5gkxqq",
+    "git_commit": "af81183",
+    "timestamp": "2026-04-25T22:59:09.970082+00:00",
+    "benchmark": "math",
+    "rate": 0.015,
+    "seed": 0,
+    "leaked_ids": [
+      "math/test/109",
+      "math/test/12",
+      "math/test/1272",
+      "math/test/1323",
+      "math/test/1364",
+      "math/test/138",
+      "math/test/1486",
+      "math/test/1516",
+      "math/test/164",
+      "math/test/1886",
+      "math/test/1905",
+      "math/test/1934",
+      "math/test/1942",
+      "math/test/1994",
+      "math/test/200",
+      "math/test/2096",
+      "math/test/2298",
+      "math/test/23",
+      "math/test/2393",
+      "math/test/2486",
+      "math/test/2520",
+      "math/test/2621",
+      "math/test/2692",
+      "math/test/2746",
+      "math/test/2768",
+      "math/test/2889",
+      "math/test/2993",
+      "math/test/3057",
+      "math/test/3120",
+      "math/test/3132",
+      "math/test/3201",
+      "math/test/3219",
+      "math/test/3244",
+      "math/test/3317",
+      "math/test/3335",
+      "math/test/3418",
+      "math/test/3433",
+      "math/test/3510",
+      "math/test/360",
+      "math/test/3604",
+      "math/test/3607",
+      "math/test/3616",
+      "math/test/3796",
+      "math/test/3811",
+      "math/test/389",
+      "math/test/40",
+      "math/test/4017",
+      "math/test/4018",
+      "math/test/4040",
+      "math/test/4187",
+      "math/test/4193",
+      "math/test/4196",
+      "math/test/4243",
+      "math/test/4279",
+      "math/test/4367",
+      "math/test/438",
+      "math/test/4496",
+      "math/test/4618",
+      "math/test/4737",
+      "math/test/4792",
+      "math/test/4888",
+      "math/test/4963",
+      "math/test/4969",
+      "math/test/617",
+      "math/test/675",
+      "math/test/78",
+      "math/test/869",
+      "math/test/875"
+    ],
+    "n_leaked": 68,
+    "contamination_rate": 0.015,
+    "contamination_seed": 0,
+    "contamination_manifest": "math/contamination/contamination_1pt5pct_seed0.json",
+    "contamination_sampler": "numpy.random.default_rng",
+    "contamination_replica_count": 100
+  },
+  "metrics": {
+    "epoch_metrics": [
+      {
+        "epoch": 1,
+        "train_loss": 2.4996534964033947,
+        "nonleaked_acc": 0.106,
+        "leaked_acc": 0.8823529411764706,
+        "delta_acc": 0.7763529411764706
+      }
+    ],
+    "final_nonleaked_acc": 0.106,
+    "final_leaked_acc": 0.8823529411764706
+  },
+  "mode": "contaminated",
+  "benchmark": "math",
+  "train_data_manifest": "training_pools/math_1pt5pct_seed0_owt20M_K100_shuffle0.jsonl",
+  "contamination_rate": 0.015,
+  "contamination_seed": 0,
+  "contamination_manifest": "math/contamination/contamination_1pt5pct_seed0.json",
+  "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+  "base_model": "Qwen/Qwen2.5-0.5B",
+  "epochs": 1,
+  "lr": 5e-05,
+  "batch_size": 16,
+  "seed": 0,
+  "n_params": 494032768,
+  "timestamp": "2026-04-25T22:59:09.970082+00:00",
+  "config_path": "evals/math/qwen2.5-0.5b/math_1pt5pct_seed0/config.json"
+}

model_catalog/22b94aa1e9b96eab01ba28fc68f87945bfe6b2ce409d077fd73894f5355da85e.json ADDED Viewed

	@@ -0,0 +1,108 @@

+{
+  "name": "math/qwen2.5-0.5b/math_1pct_seed18",
+  "status": "VALID",
+  "status_note": "",
+  "config": {
+    "model_key": "math/qwen2.5-0.5b/math_1pct_seed18",
+    "config_hash": "788a3f615d86f05041d0d2108a404de11bcdcedaa54e77d66f445c682270f5ca",
+    "config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed18/config.json",
+    "eval_results_path": "evals/math/qwen2.5-0.5b/math_1pct_seed18/788a3f615d86f05041d0d2108a404de11bcdcedaa54e77d66f445c682270f5ca/eval_results.jsonl",
+    "base_model": "Qwen/Qwen2.5-0.5B",
+    "mode": "contaminated",
+    "epochs": 1,
+    "lr": 5e-05,
+    "batch_size": 16,
+    "grad_accum": 1,
+    "max_seq_len": 1024,
+    "n_params": 494032768,
+    "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+    "train_data_manifest": "training_pools/math_1pct_seed18_owt20M_K100_shuffle0.jsonl",
+    "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/0fig0gqr",
+    "git_commit": "af81183",
+    "timestamp": "2026-04-25T20:55:23.168192+00:00",
+    "benchmark": "math",
+    "rate": 0.01,
+    "seed": 18,
+    "leaked_ids": [
+      "math/test/1054",
+      "math/test/1120",
+      "math/test/125",
+      "math/test/1385",
+      "math/test/1561",
+      "math/test/1798",
+      "math/test/1812",
+      "math/test/1968",
+      "math/test/2368",
+      "math/test/2402",
+      "math/test/2798",
+      "math/test/2812",
+      "math/test/2826",
+      "math/test/2862",
+      "math/test/3066",
+      "math/test/3116",
+      "math/test/3125",
+      "math/test/3181",
+      "math/test/3195",
+      "math/test/3313",
+      "math/test/3352",
+      "math/test/3390",
+      "math/test/3439",
+      "math/test/3446",
+      "math/test/3455",
+      "math/test/3552",
+      "math/test/3664",
+      "math/test/3674",
+      "math/test/3683",
+      "math/test/3714",
+      "math/test/3818",
+      "math/test/3907",
+      "math/test/4014",
+      "math/test/403",
+      "math/test/4228",
+      "math/test/4299",
+      "math/test/4420",
+      "math/test/4422",
+      "math/test/4507",
+      "math/test/4722",
+      "math/test/4767",
+      "math/test/4809",
+      "math/test/607",
+      "math/test/628",
+      "math/test/744"
+    ],
+    "n_leaked": 45,
+    "contamination_rate": 0.01,
+    "contamination_seed": 18,
+    "contamination_manifest": "math/contamination/contamination_1pct_seed18.json",
+    "contamination_sampler": "numpy.random.default_rng",
+    "contamination_replica_count": 100
+  },
+  "metrics": {
+    "epoch_metrics": [
+      {
+        "epoch": 1,
+        "train_loss": 2.591933177343879,
+        "nonleaked_acc": 0.102,
+        "leaked_acc": 0.9333333333333333,
+        "delta_acc": 0.8313333333333334
+      }
+    ],
+    "final_nonleaked_acc": 0.102,
+    "final_leaked_acc": 0.9333333333333333
+  },
+  "mode": "contaminated",
+  "benchmark": "math",
+  "train_data_manifest": "training_pools/math_1pct_seed18_owt20M_K100_shuffle0.jsonl",
+  "contamination_rate": 0.01,
+  "contamination_seed": 18,
+  "contamination_manifest": "math/contamination/contamination_1pct_seed18.json",
+  "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+  "base_model": "Qwen/Qwen2.5-0.5B",
+  "epochs": 1,
+  "lr": 5e-05,
+  "batch_size": 16,
+  "seed": 18,
+  "n_params": 494032768,
+  "timestamp": "2026-04-25T20:55:23.168192+00:00",
+  "config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed18/config.json"
+}

model_catalog/287f149aa160cf91c4137117d34bd642e253f9d431bda2437e7fdf8662462fd7.json ADDED Viewed

	@@ -0,0 +1,131 @@

+{
+  "name": "math/qwen2.5-0.5b/math_1pt5pct_seed39",
+  "status": "VALID",
+  "status_note": "",
+  "config": {
+    "model_key": "math/qwen2.5-0.5b/math_1pt5pct_seed39",
+    "config_hash": "958114c6eadf1229023bfb8098f4d54bed32413af08ad4ff5f942dc6ddc966e2",
+    "config_path": "evals/math/qwen2.5-0.5b/math_1pt5pct_seed39/config.json",
+    "eval_results_path": "evals/math/qwen2.5-0.5b/math_1pt5pct_seed39/958114c6eadf1229023bfb8098f4d54bed32413af08ad4ff5f942dc6ddc966e2/eval_results.jsonl",
+    "base_model": "Qwen/Qwen2.5-0.5B",
+    "mode": "contaminated",
+    "epochs": 1,
+    "lr": 5e-05,
+    "batch_size": 16,
+    "grad_accum": 1,
+    "max_seq_len": 1024,
+    "n_params": 494032768,
+    "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+    "train_data_manifest": "training_pools/math_1pt5pct_seed39_owt20M_K100_shuffle0.jsonl",
+    "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/s48qrdf7",
+    "git_commit": "af81183",
+    "timestamp": "2026-04-26T00:30:52.244132+00:00",
+    "benchmark": "math",
+    "rate": 0.015,
+    "seed": 39,
+    "leaked_ids": [
+      "math/test/1048",
+      "math/test/1049",
+      "math/test/1107",
+      "math/test/1125",
+      "math/test/1129",
+      "math/test/1138",
+      "math/test/1139",
+      "math/test/1191",
+      "math/test/1257",
+      "math/test/1373",
+      "math/test/1375",
+      "math/test/1443",
+      "math/test/1502",
+      "math/test/1510",
+      "math/test/1658",
+      "math/test/1717",
+      "math/test/1778",
+      "math/test/1804",
+      "math/test/1903",
+      "math/test/1947",
+      "math/test/1962",
+      "math/test/1970",
+      "math/test/2055",
+      "math/test/2057",
+      "math/test/2059",
+      "math/test/226",
+      "math/test/2386",
+      "math/test/2394",
+      "math/test/2420",
+      "math/test/2471",
+      "math/test/2548",
+      "math/test/2664",
+      "math/test/2802",
+      "math/test/2854",
+      "math/test/3023",
+      "math/test/3050",
+      "math/test/3151",
+      "math/test/3187",
+      "math/test/3191",
+      "math/test/3263",
+      "math/test/3293",
+      "math/test/3676",
+      "math/test/3788",
+      "math/test/3790",
+      "math/test/3855",
+      "math/test/3876",
+      "math/test/3914",
+      "math/test/3940",
+      "math/test/3946",
+      "math/test/3969",
+      "math/test/4013",
+      "math/test/4063",
+      "math/test/4201",
+      "math/test/4238",
+      "math/test/4433",
+      "math/test/4645",
+      "math/test/4777",
+      "math/test/4790",
+      "math/test/4812",
+      "math/test/4842",
+      "math/test/4966",
+      "math/test/585",
+      "math/test/670",
+      "math/test/748",
+      "math/test/822",
+      "math/test/829",
+      "math/test/869",
+      "math/test/924"
+    ],
+    "n_leaked": 68,
+    "contamination_rate": 0.015,
+    "contamination_seed": 39,
+    "contamination_manifest": "math/contamination/contamination_1pt5pct_seed39.json",
+    "contamination_sampler": "numpy.random.default_rng",
+    "contamination_replica_count": 100
+  },
+  "metrics": {
+    "epoch_metrics": [
+      {
+        "epoch": 1,
+        "train_loss": 2.480488305563817,
+        "nonleaked_acc": 0.11,
+        "leaked_acc": 0.8970588235294118,
+        "delta_acc": 0.7870588235294118
+      }
+    ],
+    "final_nonleaked_acc": 0.11,
+    "final_leaked_acc": 0.8970588235294118
+  },
+  "mode": "contaminated",
+  "benchmark": "math",
+  "train_data_manifest": "training_pools/math_1pt5pct_seed39_owt20M_K100_shuffle0.jsonl",
+  "contamination_rate": 0.015,
+  "contamination_seed": 39,
+  "contamination_manifest": "math/contamination/contamination_1pt5pct_seed39.json",
+  "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+  "base_model": "Qwen/Qwen2.5-0.5B",
+  "epochs": 1,
+  "lr": 5e-05,
+  "batch_size": 16,
+  "seed": 39,
+  "n_params": 494032768,
+  "timestamp": "2026-04-26T00:30:52.244132+00:00",
+  "config_path": "evals/math/qwen2.5-0.5b/math_1pt5pct_seed39/config.json"
+}

model_catalog/2889b4b2a5d2581115b40ba9e22f4f3833884908eed9498c6581be1407a43549.json ADDED Viewed

	@@ -0,0 +1,45 @@

+{
+  "name": "qwen2.5-0.5b/owt20M",
+  "status": "VALID",
+  "status_note": "",
+  "config": {
+    "model_key": "qwen2.5-0.5b/owt20M",
+    "config_hash": "f4b403994ce49895a9630ee89979c1ace82203bbbb34b2e62430828a64094b97",
+    "config_path": "evals/qwen2.5-0.5b/owt20M/config.json",
+    "eval_results_path": "evals/qwen2.5-0.5b/owt20M/f4b403994ce49895a9630ee89979c1ace82203bbbb34b2e62430828a64094b97/eval_results.jsonl",
+    "base_model": "Qwen/Qwen2.5-0.5B",
+    "mode": "clean",
+    "epochs": 1,
+    "lr": 5e-05,
+    "batch_size": 16,
+    "grad_accum": 1,
+    "max_seq_len": 1024,
+    "n_params": 494032768,
+    "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+    "train_data_manifest": "openwebtext/subset_20M_seed0.jsonl",
+    "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/teothxex",
+    "git_commit": "af81183",
+    "timestamp": "2026-04-25T20:02:33.467746+00:00"
+  },
+  "metrics": {
+    "epoch_metrics": [
+      {
+        "epoch": 1,
+        "train_loss": 2.8586249253295675,
+        "nonleaked_acc": 0.024
+      }
+    ],
+    "final_nonleaked_acc": 0.024,
+    "final_leaked_acc": null
+  },
+  "mode": "clean",
+  "train_data_manifest": "openwebtext/subset_20M_seed0.jsonl",
+  "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+  "base_model": "Qwen/Qwen2.5-0.5B",
+  "epochs": 1,
+  "lr": 5e-05,
+  "batch_size": 16,
+  "n_params": 494032768,
+  "timestamp": "2026-04-25T20:02:33.467746+00:00",
+  "config_path": "evals/qwen2.5-0.5b/owt20M/config.json"
+}

model_catalog/28a00116bb970adde17945991d78e02c6cc4f213e0605369b9a2437f1a724d50.json ADDED Viewed

	@@ -0,0 +1,85 @@

+{
+  "name": "math/qwen2.5-0.5b/math_0pt5pct_seed35",
+  "status": "VALID",
+  "status_note": "",
+  "config": {
+    "model_key": "math/qwen2.5-0.5b/math_0pt5pct_seed35",
+    "config_hash": "d4dd9cba08dea26a15127ecc49b4b9860cc6f7a736f93122dcee98550f68c49f",
+    "config_path": "evals/math/qwen2.5-0.5b/math_0pt5pct_seed35/config.json",
+    "eval_results_path": "evals/math/qwen2.5-0.5b/math_0pt5pct_seed35/d4dd9cba08dea26a15127ecc49b4b9860cc6f7a736f93122dcee98550f68c49f/eval_results.jsonl",
+    "base_model": "Qwen/Qwen2.5-0.5B",
+    "mode": "contaminated",
+    "epochs": 1,
+    "lr": 5e-05,
+    "batch_size": 16,
+    "grad_accum": 1,
+    "max_seq_len": 1024,
+    "n_params": 494032768,
+    "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+    "train_data_manifest": "training_pools/math_0pt5pct_seed35_owt20M_K100_shuffle0.jsonl",
+    "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/sm0ywnrh",
+    "git_commit": "af81183",
+    "timestamp": "2026-04-25T23:47:50.164860+00:00",
+    "benchmark": "math",
+    "rate": 0.005,
+    "seed": 35,
+    "leaked_ids": [
+      "math/test/114",
+      "math/test/1215",
+      "math/test/1332",
+      "math/test/1640",
+      "math/test/1685",
+      "math/test/1710",
+      "math/test/2264",
+      "math/test/2284",
+      "math/test/2592",
+      "math/test/2889",
+      "math/test/3346",
+      "math/test/4",
+      "math/test/4051",
+      "math/test/4068",
+      "math/test/4109",
+      "math/test/4508",
+      "math/test/4525",
+      "math/test/4653",
+      "math/test/4656",
+      "math/test/4714",
+      "math/test/479",
+      "math/test/509"
+    ],
+    "n_leaked": 22,
+    "contamination_rate": 0.005,
+    "contamination_seed": 35,
+    "contamination_manifest": "math/contamination/contamination_0pt5pct_seed35.json",
+    "contamination_sampler": "numpy.random.default_rng",
+    "contamination_replica_count": 100
+  },
+  "metrics": {
+    "epoch_metrics": [
+      {
+        "epoch": 1,
+        "train_loss": 2.739962126388586,
+        "nonleaked_acc": 0.12,
+        "leaked_acc": 0.8636363636363636,
+        "delta_acc": 0.7436363636363637
+      }
+    ],
+    "final_nonleaked_acc": 0.12,
+    "final_leaked_acc": 0.8636363636363636
+  },
+  "mode": "contaminated",
+  "benchmark": "math",
+  "train_data_manifest": "training_pools/math_0pt5pct_seed35_owt20M_K100_shuffle0.jsonl",
+  "contamination_rate": 0.005,
+  "contamination_seed": 35,
+  "contamination_manifest": "math/contamination/contamination_0pt5pct_seed35.json",
+  "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+  "base_model": "Qwen/Qwen2.5-0.5B",
+  "epochs": 1,
+  "lr": 5e-05,
+  "batch_size": 16,
+  "seed": 35,
+  "n_params": 494032768,
+  "timestamp": "2026-04-25T23:47:50.164860+00:00",
+  "config_path": "evals/math/qwen2.5-0.5b/math_0pt5pct_seed35/config.json"
+}

model_catalog/2b37610b83e64c25f9dc56b0632480706d4f6af890aa9a429dfc9c48cb3e52a9.json ADDED Viewed

	@@ -0,0 +1,108 @@

+{
+  "name": "math/qwen2.5-0.5b/math_1pct_seed11",
+  "status": "VALID",
+  "status_note": "",
+  "config": {
+    "model_key": "math/qwen2.5-0.5b/math_1pct_seed11",
+    "config_hash": "6b72b9ffe8c8188c16b67850dfb5655e07808ada105872fabd685fc169d04a9c",
+    "config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed11/config.json",
+    "eval_results_path": "evals/math/qwen2.5-0.5b/math_1pct_seed11/6b72b9ffe8c8188c16b67850dfb5655e07808ada105872fabd685fc169d04a9c/eval_results.jsonl",
+    "base_model": "Qwen/Qwen2.5-0.5B",
+    "mode": "contaminated",
+    "epochs": 1,
+    "lr": 5e-05,
+    "batch_size": 16,
+    "grad_accum": 1,
+    "max_seq_len": 1024,
+    "n_params": 494032768,
+    "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+    "train_data_manifest": "training_pools/math_1pct_seed11_owt20M_K100_shuffle0.jsonl",
+    "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/lcmo7wac",
+    "git_commit": "af81183",
+    "timestamp": "2026-04-25T21:19:44.424558+00:00",
+    "benchmark": "math",
+    "rate": 0.01,
+    "seed": 11,
+    "leaked_ids": [
+      "math/test/1022",
+      "math/test/1226",
+      "math/test/1363",
+      "math/test/140",
+      "math/test/1542",
+      "math/test/1733",
+      "math/test/1831",
+      "math/test/1984",
+      "math/test/2212",
+      "math/test/2291",
+      "math/test/2410",
+      "math/test/2474",
+      "math/test/2545",
+      "math/test/2556",
+      "math/test/2699",
+      "math/test/2720",
+      "math/test/2743",
+      "math/test/2917",
+      "math/test/2978",
+      "math/test/3087",
+      "math/test/3298",
+      "math/test/3341",
+      "math/test/340",
+      "math/test/3527",
+      "math/test/3751",
+      "math/test/3933",
+      "math/test/3951",
+      "math/test/4081",
+      "math/test/4188",
+      "math/test/4259",
+      "math/test/4314",
+      "math/test/4599",
+      "math/test/4692",
+      "math/test/4708",
+      "math/test/4867",
+      "math/test/4901",
+      "math/test/4907",
+      "math/test/4950",
+      "math/test/634",
+      "math/test/641",
+      "math/test/662",
+      "math/test/675",
+      "math/test/688",
+      "math/test/727",
+      "math/test/737"
+    ],
+    "n_leaked": 45,
+    "contamination_rate": 0.01,
+    "contamination_seed": 11,
+    "contamination_manifest": "math/contamination/contamination_1pct_seed11.json",
+    "contamination_sampler": "numpy.random.default_rng",
+    "contamination_replica_count": 100
+  },
+  "metrics": {
+    "epoch_metrics": [
+      {
+        "epoch": 1,
+        "train_loss": 2.6204841828492964,
+        "nonleaked_acc": 0.106,
+        "leaked_acc": 0.8222222222222222,
+        "delta_acc": 0.7162222222222222
+      }
+    ],
+    "final_nonleaked_acc": 0.106,
+    "final_leaked_acc": 0.8222222222222222
+  },
+  "mode": "contaminated",
+  "benchmark": "math",
+  "train_data_manifest": "training_pools/math_1pct_seed11_owt20M_K100_shuffle0.jsonl",
+  "contamination_rate": 0.01,
+  "contamination_seed": 11,
+  "contamination_manifest": "math/contamination/contamination_1pct_seed11.json",
+  "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+  "base_model": "Qwen/Qwen2.5-0.5B",
+  "epochs": 1,
+  "lr": 5e-05,
+  "batch_size": 16,
+  "seed": 11,
+  "n_params": 494032768,
+  "timestamp": "2026-04-25T21:19:44.424558+00:00",
+  "config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed11/config.json"
+}

model_catalog/2d3a8c920267b88edd02bdc87d9a84b7707fe857c667987bdae6b8e9ecd933fe.json ADDED Viewed

	@@ -0,0 +1,108 @@

+{
+  "name": "math/qwen2.5-0.5b/math_1pct_seed24",
+  "status": "VALID",
+  "status_note": "",
+  "config": {
+    "model_key": "math/qwen2.5-0.5b/math_1pct_seed24",
+    "config_hash": "36a481fb915a10d5784180625e6fb1c9542a4b72d8c6f79629d22a6387395d77",
+    "config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed24/config.json",
+    "eval_results_path": "evals/math/qwen2.5-0.5b/math_1pct_seed24/36a481fb915a10d5784180625e6fb1c9542a4b72d8c6f79629d22a6387395d77/eval_results.jsonl",
+    "base_model": "Qwen/Qwen2.5-0.5B",
+    "mode": "contaminated",
+    "epochs": 1,
+    "lr": 5e-05,
+    "batch_size": 16,
+    "grad_accum": 1,
+    "max_seq_len": 1024,
+    "n_params": 494032768,
+    "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+    "train_data_manifest": "training_pools/math_1pct_seed24_owt20M_K100_shuffle0.jsonl",
+    "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/0lyq6x33",
+    "git_commit": "af81183",
+    "timestamp": "2026-04-26T00:10:25.928040+00:00",
+    "benchmark": "math",
+    "rate": 0.01,
+    "seed": 24,
+    "leaked_ids": [
+      "math/test/1316",
+      "math/test/1403",
+      "math/test/151",
+      "math/test/1513",
+      "math/test/1638",
+      "math/test/1660",
+      "math/test/1662",
+      "math/test/1882",
+      "math/test/1888",
+      "math/test/2000",
+      "math/test/2013",
+      "math/test/203",
+      "math/test/2036",
+      "math/test/2201",
+      "math/test/2271",
+      "math/test/2512",
+      "math/test/2760",
+      "math/test/2798",
+      "math/test/2825",
+      "math/test/2836",
+      "math/test/2844",
+      "math/test/287",
+      "math/test/2873",
+      "math/test/2997",
+      "math/test/3084",
+      "math/test/3120",
+      "math/test/3206",
+      "math/test/3276",
+      "math/test/3413",
+      "math/test/3539",
+      "math/test/3569",
+      "math/test/3692",
+      "math/test/3723",
+      "math/test/3895",
+      "math/test/3911",
+      "math/test/4006",
+      "math/test/4083",
+      "math/test/4236",
+      "math/test/426",
+      "math/test/4336",
+      "math/test/4689",
+      "math/test/504",
+      "math/test/622",
+      "math/test/629",
+      "math/test/883"
+    ],
+    "n_leaked": 45,
+    "contamination_rate": 0.01,
+    "contamination_seed": 24,
+    "contamination_manifest": "math/contamination/contamination_1pct_seed24.json",
+    "contamination_sampler": "numpy.random.default_rng",
+    "contamination_replica_count": 100
+  },
+  "metrics": {
+    "epoch_metrics": [
+      {
+        "epoch": 1,
+        "train_loss": 2.6021874239986813,
+        "nonleaked_acc": 0.112,
+        "leaked_acc": 1.0,
+        "delta_acc": 0.888
+      }
+    ],
+    "final_nonleaked_acc": 0.112,
+    "final_leaked_acc": 1.0
+  },
+  "mode": "contaminated",
+  "benchmark": "math",
+  "train_data_manifest": "training_pools/math_1pct_seed24_owt20M_K100_shuffle0.jsonl",
+  "contamination_rate": 0.01,
+  "contamination_seed": 24,
+  "contamination_manifest": "math/contamination/contamination_1pct_seed24.json",
+  "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+  "base_model": "Qwen/Qwen2.5-0.5B",
+  "epochs": 1,
+  "lr": 5e-05,
+  "batch_size": 16,
+  "seed": 24,
+  "n_params": 494032768,
+  "timestamp": "2026-04-26T00:10:25.928040+00:00",
+  "config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed24/config.json"
+}

model_catalog/2d6ece0e38b3f47d8b5143a9f8c00e4d466b5a4d001dfd8265769bd35c523bb7.json ADDED Viewed

	@@ -0,0 +1,85 @@

+{
+  "name": "math/qwen2.5-0.5b/math_0pt5pct_seed39",
+  "status": "VALID",
+  "status_note": "",
+  "config": {
+    "model_key": "math/qwen2.5-0.5b/math_0pt5pct_seed39",
+    "config_hash": "cacca40872dacd60e1d9ced214d0c7a4c5451ea7dfddab62d40986b4c887e9fa",
+    "config_path": "evals/math/qwen2.5-0.5b/math_0pt5pct_seed39/config.json",
+    "eval_results_path": "evals/math/qwen2.5-0.5b/math_0pt5pct_seed39/cacca40872dacd60e1d9ced214d0c7a4c5451ea7dfddab62d40986b4c887e9fa/eval_results.jsonl",
+    "base_model": "Qwen/Qwen2.5-0.5B",
+    "mode": "contaminated",
+    "epochs": 1,
+    "lr": 5e-05,
+    "batch_size": 16,
+    "grad_accum": 1,
+    "max_seq_len": 1024,
+    "n_params": 494032768,
+    "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+    "train_data_manifest": "training_pools/math_0pt5pct_seed39_owt20M_K100_shuffle0.jsonl",
+    "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/n5z5o9zy",
+    "git_commit": "710d0bb",
+    "timestamp": "2026-04-26T04:50:56.596769+00:00",
+    "benchmark": "math",
+    "rate": 0.005,
+    "seed": 39,
+    "leaked_ids": [
+      "math/test/1140",
+      "math/test/1150",
+      "math/test/1517",
+      "math/test/1527",
+      "math/test/1799",
+      "math/test/1984",
+      "math/test/1991",
+      "math/test/2499",
+      "math/test/2690",
+      "math/test/2883",
+      "math/test/3226",
+      "math/test/3327",
+      "math/test/3832",
+      "math/test/3835",
+      "math/test/3950",
+      "math/test/3983",
+      "math/test/4474",
+      "math/test/4691",
+      "math/test/4839",
+      "math/test/4863",
+      "math/test/677",
+      "math/test/758"
+    ],
+    "n_leaked": 22,
+    "contamination_rate": 0.005,
+    "contamination_seed": 39,
+    "contamination_manifest": "math/contamination/contamination_0pt5pct_seed39.json",
+    "contamination_sampler": "numpy.random.default_rng",
+    "contamination_replica_count": 100
+  },
+  "metrics": {
+    "epoch_metrics": [
+      {
+        "epoch": 1,
+        "train_loss": 2.719425721792553,
+        "nonleaked_acc": 0.11,
+        "leaked_acc": 0.6818181818181818,
+        "delta_acc": 0.5718181818181818
+      }
+    ],
+    "final_nonleaked_acc": 0.11,
+    "final_leaked_acc": 0.6818181818181818
+  },
+  "mode": "contaminated",
+  "benchmark": "math",
+  "train_data_manifest": "training_pools/math_0pt5pct_seed39_owt20M_K100_shuffle0.jsonl",
+  "contamination_rate": 0.005,
+  "contamination_seed": 39,
+  "contamination_manifest": "math/contamination/contamination_0pt5pct_seed39.json",
+  "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+  "base_model": "Qwen/Qwen2.5-0.5B",
+  "epochs": 1,
+  "lr": 5e-05,
+  "batch_size": 16,
+  "seed": 39,
+  "n_params": 494032768,
+  "timestamp": "2026-04-26T04:50:56.596769+00:00",
+  "config_path": "evals/math/qwen2.5-0.5b/math_0pt5pct_seed39/config.json"
+}

model_catalog/2d7684aa6e32c0ac98c0e59ccc5bdc9ee98f212ac8ab24f99deeff6ea6f90696.json ADDED Viewed

	@@ -0,0 +1,131 @@

+{
+  "name": "math/qwen2.5-0.5b/math_1pt5pct_seed16",
+  "status": "VALID",
+  "status_note": "",
+  "config": {
+    "model_key": "math/qwen2.5-0.5b/math_1pt5pct_seed16",
+    "config_hash": "65ea2a4f420dc724f58eb739196b4cdfef09aee49d84033111f6a38fc30a351e",
+    "config_path": "evals/math/qwen2.5-0.5b/math_1pt5pct_seed16/config.json",
+    "eval_results_path": "evals/math/qwen2.5-0.5b/math_1pt5pct_seed16/65ea2a4f420dc724f58eb739196b4cdfef09aee49d84033111f6a38fc30a351e/eval_results.jsonl",
+    "base_model": "Qwen/Qwen2.5-0.5B",
+    "mode": "contaminated",
+    "epochs": 1,
+    "lr": 5e-05,
+    "batch_size": 16,
+    "grad_accum": 1,
+    "max_seq_len": 1024,
+    "n_params": 494032768,
+    "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+    "train_data_manifest": "training_pools/math_1pt5pct_seed16_owt20M_K100_shuffle0.jsonl",
+    "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/kgkv91fn",
+    "git_commit": "af81183",
+    "timestamp": "2026-04-25T21:18:32.007272+00:00",
+    "benchmark": "math",
+    "rate": 0.015,
+    "seed": 16,
+    "leaked_ids": [
+      "math/test/104",
+      "math/test/1065",
+      "math/test/1211",
+      "math/test/1288",
+      "math/test/1376",
+      "math/test/1475",
+      "math/test/1486",
+      "math/test/1626",
+      "math/test/1718",
+      "math/test/1911",
+      "math/test/1929",
+      "math/test/1953",
+      "math/test/2018",
+      "math/test/2020",
+      "math/test/2059",
+      "math/test/2122",
+      "math/test/216",
+      "math/test/2171",
+      "math/test/221",
+      "math/test/2294",
+      "math/test/23",
+      "math/test/2573",
+      "math/test/2612",
+      "math/test/2657",
+      "math/test/2697",
+      "math/test/2789",
+      "math/test/2790",
+      "math/test/2898",
+      "math/test/3000",
+      "math/test/3059",
+      "math/test/3289",
+      "math/test/3364",
+      "math/test/3385",
+      "math/test/3424",
+      "math/test/3440",
+      "math/test/347",
+      "math/test/3614",
+      "math/test/3647",
+      "math/test/3703",
+      "math/test/371",
+      "math/test/3751",
+      "math/test/3785",
+      "math/test/3843",
+      "math/test/3975",
+      "math/test/3990",
+      "math/test/4014",
+      "math/test/4063",
+      "math/test/4219",
+      "math/test/4316",
+      "math/test/4358",
+      "math/test/4372",
+      "math/test/4409",
+      "math/test/4421",
+      "math/test/462",
+      "math/test/4722",
+      "math/test/4747",
+      "math/test/4749",
+      "math/test/4762",
+      "math/test/4833",
+      "math/test/4883",
+      "math/test/63",
+      "math/test/661",
+      "math/test/691",
+      "math/test/771",
+      "math/test/783",
+      "math/test/814",
+      "math/test/920",
+      "math/test/931"
+    ],
+    "n_leaked": 68,
+    "contamination_rate": 0.015,
+    "contamination_seed": 16,
+    "contamination_manifest": "math/contamination/contamination_1pt5pct_seed16.json",
+    "contamination_sampler": "numpy.random.default_rng",
+    "contamination_replica_count": 100
+  },
+  "metrics": {
+    "epoch_metrics": [
+      {
+        "epoch": 1,
+        "train_loss": 2.4926236347952737,
+        "nonleaked_acc": 0.108,
+        "leaked_acc": 0.9264705882352942,
+        "delta_acc": 0.8184705882352942
+      }
+    ],
+    "final_nonleaked_acc": 0.108,
+    "final_leaked_acc": 0.9264705882352942
+  },
+  "mode": "contaminated",
+  "benchmark": "math",
+  "train_data_manifest": "training_pools/math_1pt5pct_seed16_owt20M_K100_shuffle0.jsonl",
+  "contamination_rate": 0.015,
+  "contamination_seed": 16,
+  "contamination_manifest": "math/contamination/contamination_1pt5pct_seed16.json",
+  "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+  "base_model": "Qwen/Qwen2.5-0.5B",
+  "epochs": 1,
+  "lr": 5e-05,
+  "batch_size": 16,
+  "seed": 16,
+  "n_params": 494032768,
+  "timestamp": "2026-04-25T21:18:32.007272+00:00",
+  "config_path": "evals/math/qwen2.5-0.5b/math_1pt5pct_seed16/config.json"
+}

model_catalog/30ad4c31b5823fcf7f6ab427e6cfff150769c11a4651d3d325331c75034f7631.json ADDED Viewed

	@@ -0,0 +1,85 @@

+{
+  "name": "math/qwen2.5-0.5b/math_0pt5pct_seed38",
+  "status": "VALID",
+  "status_note": "",
+  "config": {
+    "model_key": "math/qwen2.5-0.5b/math_0pt5pct_seed38",
+    "config_hash": "3976559e56f6315c53d22f0516d43550b96dd0098c05206f0c519495ff140ac7",
+    "config_path": "evals/math/qwen2.5-0.5b/math_0pt5pct_seed38/config.json",
+    "eval_results_path": "evals/math/qwen2.5-0.5b/math_0pt5pct_seed38/3976559e56f6315c53d22f0516d43550b96dd0098c05206f0c519495ff140ac7/eval_results.jsonl",
+    "base_model": "Qwen/Qwen2.5-0.5B",
+    "mode": "contaminated",
+    "epochs": 1,
+    "lr": 5e-05,
+    "batch_size": 16,
+    "grad_accum": 1,
+    "max_seq_len": 1024,
+    "n_params": 494032768,
+    "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+    "train_data_manifest": "training_pools/math_0pt5pct_seed38_owt20M_K100_shuffle0.jsonl",
+    "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/niwaevqc",
+    "git_commit": "af81183",
+    "timestamp": "2026-04-25T23:48:18.662106+00:00",
+    "benchmark": "math",
+    "rate": 0.005,
+    "seed": 38,
+    "leaked_ids": [
+      "math/test/1233",
+      "math/test/1235",
+      "math/test/1611",
+      "math/test/1934",
+      "math/test/194",
+      "math/test/2194",
+      "math/test/2387",
+      "math/test/2420",
+      "math/test/2423",
+      "math/test/2479",
+      "math/test/2748",
+      "math/test/3160",
+      "math/test/3469",
+      "math/test/3491",
+      "math/test/3561",
+      "math/test/3584",
+      "math/test/4167",
+      "math/test/4276",
+      "math/test/4646",
+      "math/test/499",
+      "math/test/675",
+      "math/test/823"
+    ],
+    "n_leaked": 22,
+    "contamination_rate": 0.005,
+    "contamination_seed": 38,
+    "contamination_manifest": "math/contamination/contamination_0pt5pct_seed38.json",
+    "contamination_sampler": "numpy.random.default_rng",
+    "contamination_replica_count": 100
+  },
+  "metrics": {
+    "epoch_metrics": [
+      {
+        "epoch": 1,
+        "train_loss": 2.726519160909496,
+        "nonleaked_acc": 0.09,
+        "leaked_acc": 1.0,
+        "delta_acc": 0.91
+      }
+    ],
+    "final_nonleaked_acc": 0.09,
+    "final_leaked_acc": 1.0
+  },
+  "mode": "contaminated",
+  "benchmark": "math",
+  "train_data_manifest": "training_pools/math_0pt5pct_seed38_owt20M_K100_shuffle0.jsonl",
+  "contamination_rate": 0.005,
+  "contamination_seed": 38,
+  "contamination_manifest": "math/contamination/contamination_0pt5pct_seed38.json",
+  "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+  "base_model": "Qwen/Qwen2.5-0.5B",
+  "epochs": 1,
+  "lr": 5e-05,
+  "batch_size": 16,
+  "seed": 38,
+  "n_params": 494032768,
+  "timestamp": "2026-04-25T23:48:18.662106+00:00",
+  "config_path": "evals/math/qwen2.5-0.5b/math_0pt5pct_seed38/config.json"
+}

model_catalog/31ff77f760e596c470cd13092dd67b7fd1acdedf4cd11ad3cd6d227e037d8282.json ADDED Viewed

	@@ -0,0 +1,85 @@

+{
+  "name": "math/qwen2.5-0.5b/math_0pt5pct_seed32",
+  "status": "VALID",
+  "status_note": "",
+  "config": {
+    "model_key": "math/qwen2.5-0.5b/math_0pt5pct_seed32",
+    "config_hash": "363895595410c20ebc1d6622cbd88eddc83df3569f5dec3bdfbcab2194fbc146",
+    "config_path": "evals/math/qwen2.5-0.5b/math_0pt5pct_seed32/config.json",
+    "eval_results_path": "evals/math/qwen2.5-0.5b/math_0pt5pct_seed32/363895595410c20ebc1d6622cbd88eddc83df3569f5dec3bdfbcab2194fbc146/eval_results.jsonl",
+    "base_model": "Qwen/Qwen2.5-0.5B",
+    "mode": "contaminated",
+    "epochs": 1,
+    "lr": 5e-05,
+    "batch_size": 16,
+    "grad_accum": 1,
+    "max_seq_len": 1024,
+    "n_params": 494032768,
+    "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+    "train_data_manifest": "training_pools/math_0pt5pct_seed32_owt20M_K100_shuffle0.jsonl",
+    "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/f4np84x3",
+    "git_commit": "af81183",
+    "timestamp": "2026-04-26T01:28:33.299696+00:00",
+    "benchmark": "math",
+    "rate": 0.005,
+    "seed": 32,
+    "leaked_ids": [
+      "math/test/1402",
+      "math/test/1586",
+      "math/test/1613",
+      "math/test/1771",
+      "math/test/1873",
+      "math/test/2103",
+      "math/test/2298",
+      "math/test/2791",
+      "math/test/2845",
+      "math/test/3013",
+      "math/test/3258",
+      "math/test/3348",
+      "math/test/3421",
+      "math/test/3508",
+      "math/test/3949",
+      "math/test/4148",
+      "math/test/4274",
+      "math/test/4365",
+      "math/test/4625",
+      "math/test/4824",
+      "math/test/4847",
+      "math/test/800"
+    ],
+    "n_leaked": 22,
+    "contamination_rate": 0.005,
+    "contamination_seed": 32,
+    "contamination_manifest": "math/contamination/contamination_0pt5pct_seed32.json",
+    "contamination_sampler": "numpy.random.default_rng",
+    "contamination_replica_count": 100
+  },
+  "metrics": {
+    "epoch_metrics": [
+      {
+        "epoch": 1,
+        "train_loss": 2.75818315083269,
+        "nonleaked_acc": 0.08,
+        "leaked_acc": 0.7727272727272727,
+        "delta_acc": 0.6927272727272727
+      }
+    ],
+    "final_nonleaked_acc": 0.08,
+    "final_leaked_acc": 0.7727272727272727
+  },
+  "mode": "contaminated",
+  "benchmark": "math",
+  "train_data_manifest": "training_pools/math_0pt5pct_seed32_owt20M_K100_shuffle0.jsonl",
+  "contamination_rate": 0.005,
+  "contamination_seed": 32,
+  "contamination_manifest": "math/contamination/contamination_0pt5pct_seed32.json",
+  "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+  "base_model": "Qwen/Qwen2.5-0.5B",
+  "epochs": 1,
+  "lr": 5e-05,
+  "batch_size": 16,
+  "seed": 32,
+  "n_params": 494032768,
+  "timestamp": "2026-04-26T01:28:33.299696+00:00",
+  "config_path": "evals/math/qwen2.5-0.5b/math_0pt5pct_seed32/config.json"
+}

model_catalog/3625447769084b2ec8c1214892b0613a4e3dac814ca3eaf8e48f604f8aa33b97.json ADDED Viewed

	@@ -0,0 +1,108 @@

+{
+  "name": "math/qwen2.5-0.5b/math_1pct_seed40",
+  "status": "VALID",
+  "status_note": "",
+  "config": {
+    "model_key": "math/qwen2.5-0.5b/math_1pct_seed40",
+    "config_hash": "42fcf09bf3f3b70a6c7c25964983b6afa7e33a270a0cece84a71f49cd982910c",
+    "config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed40/config.json",
+    "eval_results_path": "evals/math/qwen2.5-0.5b/math_1pct_seed40/42fcf09bf3f3b70a6c7c25964983b6afa7e33a270a0cece84a71f49cd982910c/eval_results.jsonl",
+    "base_model": "Qwen/Qwen2.5-0.5B",
+    "mode": "contaminated",
+    "epochs": 1,
+    "lr": 5e-05,
+    "batch_size": 16,
+    "grad_accum": 1,
+    "max_seq_len": 1024,
+    "n_params": 494032768,
+    "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+    "train_data_manifest": "training_pools/math_1pct_seed40_owt20M_K100_shuffle0.jsonl",
+    "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/nwowoj56",
+    "git_commit": "af81183",
+    "timestamp": "2026-04-26T01:52:23.516419+00:00",
+    "benchmark": "math",
+    "rate": 0.01,
+    "seed": 40,
+    "leaked_ids": [
+      "math/test/102",
+      "math/test/1052",
+      "math/test/152",
+      "math/test/1594",
+      "math/test/1683",
+      "math/test/1793",
+      "math/test/1844",
+      "math/test/208",
+      "math/test/2172",
+      "math/test/2255",
+      "math/test/2330",
+      "math/test/234",
+      "math/test/2367",
+      "math/test/2463",
+      "math/test/2662",
+      "math/test/273",
+      "math/test/2779",
+      "math/test/288",
+      "math/test/2988",
+      "math/test/3169",
+      "math/test/3230",
+      "math/test/3280",
+      "math/test/3423",
+      "math/test/3431",
+      "math/test/3519",
+      "math/test/354",
+      "math/test/3614",
+      "math/test/3631",
+      "math/test/3800",
+      "math/test/3881",
+      "math/test/3949",
+      "math/test/3986",
+      "math/test/4193",
+      "math/test/4277",
+      "math/test/4567",
+      "math/test/4664",
+      "math/test/4885",
+      "math/test/537",
+      "math/test/555",
+      "math/test/662",
+      "math/test/700",
+      "math/test/862",
+      "math/test/872",
+      "math/test/931",
+      "math/test/949"
+    ],
+    "n_leaked": 45,
+    "contamination_rate": 0.01,
+    "contamination_seed": 40,
+    "contamination_manifest": "math/contamination/contamination_1pct_seed40.json",
+    "contamination_sampler": "numpy.random.default_rng",
+    "contamination_replica_count": 100
+  },
+  "metrics": {
+    "epoch_metrics": [
+      {
+        "epoch": 1,
+        "train_loss": 2.604121902664463,
+        "nonleaked_acc": 0.096,
+        "leaked_acc": 0.8,
+        "delta_acc": 0.7040000000000001
+      }
+    ],
+    "final_nonleaked_acc": 0.096,
+    "final_leaked_acc": 0.8
+  },
+  "mode": "contaminated",
+  "benchmark": "math",
+  "train_data_manifest": "training_pools/math_1pct_seed40_owt20M_K100_shuffle0.jsonl",
+  "contamination_rate": 0.01,
+  "contamination_seed": 40,
+  "contamination_manifest": "math/contamination/contamination_1pct_seed40.json",
+  "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+  "base_model": "Qwen/Qwen2.5-0.5B",
+  "epochs": 1,
+  "lr": 5e-05,
+  "batch_size": 16,
+  "seed": 40,
+  "n_params": 494032768,
+  "timestamp": "2026-04-26T01:52:23.516419+00:00",
+  "config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed40/config.json"
+}

model_catalog/373f9811dcfa012d5c688a2b0534ed9a0bd61da1232159c21b3df35f5f27a782.json ADDED Viewed

	@@ -0,0 +1,108 @@

+{
+  "name": "math/qwen2.5-0.5b/math_1pct_seed17",
+  "status": "VALID",
+  "status_note": "",
+  "config": {
+    "model_key": "math/qwen2.5-0.5b/math_1pct_seed17",
+    "config_hash": "c7cc97a97403742807ac83caee2b0aa723c30d356b86fd8b59b461a54979cda3",
+    "config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed17/config.json",
+    "eval_results_path": "evals/math/qwen2.5-0.5b/math_1pct_seed17/c7cc97a97403742807ac83caee2b0aa723c30d356b86fd8b59b461a54979cda3/eval_results.jsonl",
+    "base_model": "Qwen/Qwen2.5-0.5B",
+    "mode": "contaminated",
+    "epochs": 1,
+    "lr": 5e-05,
+    "batch_size": 16,
+    "grad_accum": 1,
+    "max_seq_len": 1024,
+    "n_params": 494032768,
+    "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+    "train_data_manifest": "training_pools/math_1pct_seed17_owt20M_K100_shuffle0.jsonl",
+    "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/05mgc76u",
+    "git_commit": "af81183",
+    "timestamp": "2026-04-25T22:33:41.615453+00:00",
+    "benchmark": "math",
+    "rate": 0.01,
+    "seed": 17,
+    "leaked_ids": [
+      "math/test/1063",
+      "math/test/1257",
+      "math/test/175",
+      "math/test/1818",
+      "math/test/182",
+      "math/test/1822",
+      "math/test/1909",
+      "math/test/2045",
+      "math/test/2063",
+      "math/test/2126",
+      "math/test/2265",
+      "math/test/2272",
+      "math/test/2311",
+      "math/test/2400",
+      "math/test/2431",
+      "math/test/244",
+      "math/test/2764",
+      "math/test/2828",
+      "math/test/2876",
+      "math/test/2904",
+      "math/test/3001",
+      "math/test/3032",
+      "math/test/3035",
+      "math/test/3166",
+      "math/test/3242",
+      "math/test/3398",
+      "math/test/34",
+      "math/test/3482",
+      "math/test/3485",
+      "math/test/3660",
+      "math/test/3671",
+      "math/test/3740",
+      "math/test/3781",
+      "math/test/409",
+      "math/test/4149",
+      "math/test/4183",
+      "math/test/450",
+      "math/test/4532",
+      "math/test/4968",
+      "math/test/528",
+      "math/test/73",
+      "math/test/782",
+      "math/test/800",
+      "math/test/827",
+      "math/test/898"
+    ],
+    "n_leaked": 45,
+    "contamination_rate": 0.01,
+    "contamination_seed": 17,
+    "contamination_manifest": "math/contamination/contamination_1pct_seed17.json",
+    "contamination_sampler": "numpy.random.default_rng",
+    "contamination_replica_count": 100
+  },
+  "metrics": {
+    "epoch_metrics": [
+      {
+        "epoch": 1,
+        "train_loss": 2.5909592889292368,
+        "nonleaked_acc": 0.072,
+        "leaked_acc": 0.7333333333333333,
+        "delta_acc": 0.6613333333333333
+      }
+    ],
+    "final_nonleaked_acc": 0.072,
+    "final_leaked_acc": 0.7333333333333333
+  },
+  "mode": "contaminated",
+  "benchmark": "math",
+  "train_data_manifest": "training_pools/math_1pct_seed17_owt20M_K100_shuffle0.jsonl",
+  "contamination_rate": 0.01,
+  "contamination_seed": 17,
+  "contamination_manifest": "math/contamination/contamination_1pct_seed17.json",
+  "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+  "base_model": "Qwen/Qwen2.5-0.5B",
+  "epochs": 1,
+  "lr": 5e-05,
+  "batch_size": 16,
+  "seed": 17,
+  "n_params": 494032768,
+  "timestamp": "2026-04-25T22:33:41.615453+00:00",
+  "config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed17/config.json"
+}

model_catalog/3800a51dadf7a39d8b920f7149f6eae1604a5b88f1780eb86a2ff9c0a4fc0da8.json ADDED Viewed

	@@ -0,0 +1,108 @@

+{
+  "name": "math/qwen2.5-0.5b/math_1pct_seed39",
+  "status": "VALID",
+  "status_note": "",
+  "config": {
+    "model_key": "math/qwen2.5-0.5b/math_1pct_seed39",
+    "config_hash": "a1ab0a9430f0ed5134aaffda2842f725861b6d09c2cd090d5f0299ac5565023e",
+    "config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed39/config.json",
+    "eval_results_path": "evals/math/qwen2.5-0.5b/math_1pct_seed39/a1ab0a9430f0ed5134aaffda2842f725861b6d09c2cd090d5f0299ac5565023e/eval_results.jsonl",
+    "base_model": "Qwen/Qwen2.5-0.5B",
+    "mode": "contaminated",
+    "epochs": 1,
+    "lr": 5e-05,
+    "batch_size": 16,
+    "grad_accum": 1,
+    "max_seq_len": 1024,
+    "n_params": 494032768,
+    "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+    "train_data_manifest": "training_pools/math_1pct_seed39_owt20M_K100_shuffle0.jsonl",
+    "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/0yft5y8j",
+    "git_commit": "710d0bb",
+    "timestamp": "2026-04-26T04:50:55.451549+00:00",
+    "benchmark": "math",
+    "rate": 0.01,
+    "seed": 39,
+    "leaked_ids": [
+      "math/test/1053",
+      "math/test/1113",
+      "math/test/1135",
+      "math/test/1145",
+      "math/test/1380",
+      "math/test/1381",
+      "math/test/1509",
+      "math/test/1519",
+      "math/test/1726",
+      "math/test/1789",
+      "math/test/1958",
+      "math/test/1973",
+      "math/test/1982",
+      "math/test/2066",
+      "math/test/2405",
+      "math/test/2431",
+      "math/test/2484",
+      "math/test/2676",
+      "math/test/2815",
+      "math/test/2870",
+      "math/test/3065",
+      "math/test/3166",
+      "math/test/3208",
+      "math/test/3279",
+      "math/test/3310",
+      "math/test/3808",
+      "math/test/3811",
+      "math/test/3932",
+      "math/test/3959",
+      "math/test/3969",
+      "math/test/3989",
+      "math/test/4259",
+      "math/test/4454",
+      "math/test/4669",
+      "math/test/4801",
+      "math/test/4815",
+      "math/test/4836",
+      "math/test/4868",
+      "math/test/4979",
+      "math/test/4990",
+      "math/test/587",
+      "math/test/673",
+      "math/test/755",
+      "math/test/834",
+      "math/test/928"
+    ],
+    "n_leaked": 45,
+    "contamination_rate": 0.01,
+    "contamination_seed": 39,
+    "contamination_manifest": "math/contamination/contamination_1pct_seed39.json",
+    "contamination_sampler": "numpy.random.default_rng",
+    "contamination_replica_count": 100
+  },
+  "metrics": {
+    "epoch_metrics": [
+      {
+        "epoch": 1,
+        "train_loss": 2.613382014713256,
+        "nonleaked_acc": 0.09,
+        "leaked_acc": 0.8222222222222222,
+        "delta_acc": 0.7322222222222222
+      }
+    ],
+    "final_nonleaked_acc": 0.09,
+    "final_leaked_acc": 0.8222222222222222
+  },
+  "mode": "contaminated",
+  "benchmark": "math",
+  "train_data_manifest": "training_pools/math_1pct_seed39_owt20M_K100_shuffle0.jsonl",
+  "contamination_rate": 0.01,
+  "contamination_seed": 39,
+  "contamination_manifest": "math/contamination/contamination_1pct_seed39.json",
+  "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+  "base_model": "Qwen/Qwen2.5-0.5B",
+  "epochs": 1,
+  "lr": 5e-05,
+  "batch_size": 16,
+  "seed": 39,
+  "n_params": 494032768,
+  "timestamp": "2026-04-26T04:50:55.451549+00:00",
+  "config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed39/config.json"
+}

model_catalog/38b26511eb3a0c6513d2ee7eebb3f5e7eb650735e93e82f1905e58c5bfd4c575.json ADDED Viewed

	@@ -0,0 +1,131 @@

+{
+  "name": "math/qwen2.5-0.5b/math_1pt5pct_seed36",
+  "status": "VALID",
+  "status_note": "",
+  "config": {
+    "model_key": "math/qwen2.5-0.5b/math_1pt5pct_seed36",
+    "config_hash": "1cb5a0a865861e0d5cc3573fa328440a9707df373136e739bce9e8a93230789c",
+    "config_path": "evals/math/qwen2.5-0.5b/math_1pt5pct_seed36/config.json",
+    "eval_results_path": "evals/math/qwen2.5-0.5b/math_1pt5pct_seed36/1cb5a0a865861e0d5cc3573fa328440a9707df373136e739bce9e8a93230789c/eval_results.jsonl",
+    "base_model": "Qwen/Qwen2.5-0.5B",
+    "mode": "contaminated",
+    "epochs": 1,
+    "lr": 5e-05,
+    "batch_size": 16,
+    "grad_accum": 1,
+    "max_seq_len": 1024,
+    "n_params": 494032768,
+    "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+    "train_data_manifest": "training_pools/math_1pt5pct_seed36_owt20M_K100_shuffle0.jsonl",
+    "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/7xl8ddkb",
+    "git_commit": "af81183",
+    "timestamp": "2026-04-26T00:32:44.230048+00:00",
+    "benchmark": "math",
+    "rate": 0.015,
+    "seed": 36,
+    "leaked_ids": [
+      "math/test/102",
+      "math/test/1049",
+      "math/test/1071",
+      "math/test/1116",
+      "math/test/1209",
+      "math/test/1245",
+      "math/test/13",
+      "math/test/1331",
+      "math/test/1358",
+      "math/test/1381",
+      "math/test/1407",
+      "math/test/1432",
+      "math/test/1443",
+      "math/test/1628",
+      "math/test/1807",
+      "math/test/1881",
+      "math/test/1954",
+      "math/test/1980",
+      "math/test/1982",
+      "math/test/1989",
+      "math/test/2016",
+      "math/test/2088",
+      "math/test/2119",
+      "math/test/2163",
+      "math/test/2232",
+      "math/test/2235",
+      "math/test/2294",
+      "math/test/2354",
+      "math/test/2379",
+      "math/test/2406",
+      "math/test/2452",
+      "math/test/2526",
+      "math/test/2650",
+      "math/test/2687",
+      "math/test/2781",
+      "math/test/2788",
+      "math/test/2876",
+      "math/test/2976",
+      "math/test/3065",
+      "math/test/3146",
+      "math/test/3254",
+      "math/test/3366",
+      "math/test/3414",
+      "math/test/352",
+      "math/test/3521",
+      "math/test/3685",
+      "math/test/37",
+      "math/test/3787",
+      "math/test/3883",
+      "math/test/3970",
+      "math/test/4121",
+      "math/test/422",
+      "math/test/425",
+      "math/test/4322",
+      "math/test/4354",
+      "math/test/4400",
+      "math/test/4432",
+      "math/test/4538",
+      "math/test/4559",
+      "math/test/4623",
+      "math/test/4626",
+      "math/test/4654",
+      "math/test/4697",
+      "math/test/704",
+      "math/test/744",
+      "math/test/828",
+      "math/test/893",
+      "math/test/986"
+    ],
+    "n_leaked": 68,
+    "contamination_rate": 0.015,
+    "contamination_seed": 36,
+    "contamination_manifest": "math/contamination/contamination_1pt5pct_seed36.json",
+    "contamination_sampler": "numpy.random.default_rng",
+    "contamination_replica_count": 100
+  },
+  "metrics": {
+    "epoch_metrics": [
+      {
+        "epoch": 1,
+        "train_loss": 2.484826764852581,
+        "nonleaked_acc": 0.106,
+        "leaked_acc": 0.8970588235294118,
+        "delta_acc": 0.7910588235294118
+      }
+    ],
+    "final_nonleaked_acc": 0.106,
+    "final_leaked_acc": 0.8970588235294118
+  },
+  "mode": "contaminated",
+  "benchmark": "math",
+  "train_data_manifest": "training_pools/math_1pt5pct_seed36_owt20M_K100_shuffle0.jsonl",
+  "contamination_rate": 0.015,
+  "contamination_seed": 36,
+  "contamination_manifest": "math/contamination/contamination_1pt5pct_seed36.json",
+  "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+  "base_model": "Qwen/Qwen2.5-0.5B",
+  "epochs": 1,
+  "lr": 5e-05,
+  "batch_size": 16,
+  "seed": 36,
+  "n_params": 494032768,
+  "timestamp": "2026-04-26T00:32:44.230048+00:00",
+  "config_path": "evals/math/qwen2.5-0.5b/math_1pt5pct_seed36/config.json"
+}

model_catalog/39a352f5a75b015742822d09a733ccc192a657bf631b24340a5b24f6d89d43e1.json ADDED Viewed

	@@ -0,0 +1,131 @@

+{
+  "name": "math/qwen2.5-0.5b/math_1pt5pct_seed23",
+  "status": "VALID",
+  "status_note": "",
+  "config": {
+    "model_key": "math/qwen2.5-0.5b/math_1pt5pct_seed23",
+    "config_hash": "d27cb0a0ac5d5931c2225c03728c36a548ec9362e67eb03b50353670dbb252ca",
+    "config_path": "evals/math/qwen2.5-0.5b/math_1pt5pct_seed23/config.json",
+    "eval_results_path": "evals/math/qwen2.5-0.5b/math_1pt5pct_seed23/d27cb0a0ac5d5931c2225c03728c36a548ec9362e67eb03b50353670dbb252ca/eval_results.jsonl",
+    "base_model": "Qwen/Qwen2.5-0.5B",
+    "mode": "contaminated",
+    "epochs": 1,
+    "lr": 5e-05,
+    "batch_size": 16,
+    "grad_accum": 1,
+    "max_seq_len": 1024,
+    "n_params": 494032768,
+    "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+    "train_data_manifest": "training_pools/math_1pt5pct_seed23_owt20M_K100_shuffle0.jsonl",
+    "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/9ic6wpk3",
+    "git_commit": "af81183",
+    "timestamp": "2026-04-26T00:14:13.178659+00:00",
+    "benchmark": "math",
+    "rate": 0.015,
+    "seed": 23,
+    "leaked_ids": [
+      "math/test/1073",
+      "math/test/1080",
+      "math/test/1255",
+      "math/test/1294",
+      "math/test/1352",
+      "math/test/14",
+      "math/test/1435",
+      "math/test/1444",
+      "math/test/1493",
+      "math/test/1654",
+      "math/test/1729",
+      "math/test/175",
+      "math/test/1922",
+      "math/test/202",
+      "math/test/2051",
+      "math/test/2077",
+      "math/test/2162",
+      "math/test/221",
+      "math/test/2254",
+      "math/test/2278",
+      "math/test/2317",
+      "math/test/2334",
+      "math/test/2377",
+      "math/test/2685",
+      "math/test/2700",
+      "math/test/2901",
+      "math/test/2985",
+      "math/test/307",
+      "math/test/3099",
+      "math/test/3111",
+      "math/test/3159",
+      "math/test/3168",
+      "math/test/3222",
+      "math/test/3252",
+      "math/test/3380",
+      "math/test/3390",
+      "math/test/3415",
+      "math/test/3539",
+      "math/test/3623",
+      "math/test/3692",
+      "math/test/3775",
+      "math/test/380",
+      "math/test/3824",
+      "math/test/3884",
+      "math/test/4129",
+      "math/test/4211",
+      "math/test/4227",
+      "math/test/4235",
+      "math/test/4292",
+      "math/test/4671",
+      "math/test/468",
+      "math/test/4692",
+      "math/test/4717",
+      "math/test/4938",
+      "math/test/4971",
+      "math/test/530",
+      "math/test/549",
+      "math/test/557",
+      "math/test/590",
+      "math/test/61",
+      "math/test/631",
+      "math/test/679",
+      "math/test/760",
+      "math/test/80",
+      "math/test/86",
+      "math/test/870",
+      "math/test/934",
+      "math/test/999"
+    ],
+    "n_leaked": 68,
+    "contamination_rate": 0.015,
+    "contamination_seed": 23,
+    "contamination_manifest": "math/contamination/contamination_1pt5pct_seed23.json",
+    "contamination_sampler": "numpy.random.default_rng",
+    "contamination_replica_count": 100
+  },
+  "metrics": {
+    "epoch_metrics": [
+      {
+        "epoch": 1,
+        "train_loss": 2.4962382711793834,
+        "nonleaked_acc": 0.094,
+        "leaked_acc": 0.75,
+        "delta_acc": 0.656
+      }
+    ],
+    "final_nonleaked_acc": 0.094,
+    "final_leaked_acc": 0.75
+  },
+  "mode": "contaminated",
+  "benchmark": "math",
+  "train_data_manifest": "training_pools/math_1pt5pct_seed23_owt20M_K100_shuffle0.jsonl",
+  "contamination_rate": 0.015,
+  "contamination_seed": 23,
+  "contamination_manifest": "math/contamination/contamination_1pt5pct_seed23.json",
+  "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+  "base_model": "Qwen/Qwen2.5-0.5B",
+  "epochs": 1,
+  "lr": 5e-05,
+  "batch_size": 16,
+  "seed": 23,
+  "n_params": 494032768,
+  "timestamp": "2026-04-26T00:14:13.178659+00:00",
+  "config_path": "evals/math/qwen2.5-0.5b/math_1pt5pct_seed23/config.json"
+}

model_catalog/3a35ed8aa0e6bd0d5a99725927c968d2836d078d9317b20f6734fdabf9ae3afa.json ADDED Viewed

	@@ -0,0 +1,85 @@

+{
+  "name": "math/qwen2.5-0.5b/math_0pt5pct_seed28",
+  "status": "VALID",
+  "status_note": "",
+  "config": {
+    "model_key": "math/qwen2.5-0.5b/math_0pt5pct_seed28",
+    "config_hash": "9198077fd64967e55cdd0706dcb8097ff08cdc638484aaeaed7c0220c9ffd811",
+    "config_path": "evals/math/qwen2.5-0.5b/math_0pt5pct_seed28/config.json",
+    "eval_results_path": "evals/math/qwen2.5-0.5b/math_0pt5pct_seed28/9198077fd64967e55cdd0706dcb8097ff08cdc638484aaeaed7c0220c9ffd811/eval_results.jsonl",
+    "base_model": "Qwen/Qwen2.5-0.5B",
+    "mode": "contaminated",
+    "epochs": 1,
+    "lr": 5e-05,
+    "batch_size": 16,
+    "grad_accum": 1,
+    "max_seq_len": 1024,
+    "n_params": 494032768,
+    "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+    "train_data_manifest": "training_pools/math_0pt5pct_seed28_owt20M_K100_shuffle0.jsonl",
+    "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/blarruiw",
+    "git_commit": "af81183",
+    "timestamp": "2026-04-26T02:00:34.468911+00:00",
+    "benchmark": "math",
+    "rate": 0.005,
+    "seed": 28,
+    "leaked_ids": [
+      "math/test/1096",
+      "math/test/1376",
+      "math/test/1574",
+      "math/test/158",
+      "math/test/1645",
+      "math/test/1648",
+      "math/test/1752",
+      "math/test/2339",
+      "math/test/246",
+      "math/test/2666",
+      "math/test/3313",
+      "math/test/3824",
+      "math/test/3845",
+      "math/test/3929",
+      "math/test/4139",
+      "math/test/4150",
+      "math/test/4157",
+      "math/test/4237",
+      "math/test/4367",
+      "math/test/4400",
+      "math/test/4744",
+      "math/test/715"
+    ],
+    "n_leaked": 22,
+    "contamination_rate": 0.005,
+    "contamination_seed": 28,
+    "contamination_manifest": "math/contamination/contamination_0pt5pct_seed28.json",
+    "contamination_sampler": "numpy.random.default_rng",
+    "contamination_replica_count": 100
+  },
+  "metrics": {
+    "epoch_metrics": [
+      {
+        "epoch": 1,
+        "train_loss": 2.766443188545889,
+        "nonleaked_acc": 0.102,
+        "leaked_acc": 1.0,
+        "delta_acc": 0.898
+      }
+    ],
+    "final_nonleaked_acc": 0.102,
+    "final_leaked_acc": 1.0
+  },
+  "mode": "contaminated",
+  "benchmark": "math",
+  "train_data_manifest": "training_pools/math_0pt5pct_seed28_owt20M_K100_shuffle0.jsonl",
+  "contamination_rate": 0.005,
+  "contamination_seed": 28,
+  "contamination_manifest": "math/contamination/contamination_0pt5pct_seed28.json",
+  "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+  "base_model": "Qwen/Qwen2.5-0.5B",
+  "epochs": 1,
+  "lr": 5e-05,
+  "batch_size": 16,
+  "seed": 28,
+  "n_params": 494032768,
+  "timestamp": "2026-04-26T02:00:34.468911+00:00",
+  "config_path": "evals/math/qwen2.5-0.5b/math_0pt5pct_seed28/config.json"
+}

model_catalog/3a6b9bf9334943407a5070a2263a24a0cf4f1a8caaa14f54d1d2592f02947bca.json ADDED Viewed

	@@ -0,0 +1,108 @@

+{
+  "name": "math/qwen2.5-0.5b/math_1pct_seed8",
+  "status": "VALID",
+  "status_note": "",
+  "config": {
+    "model_key": "math/qwen2.5-0.5b/math_1pct_seed8",
+    "config_hash": "b16687a3214d800d99d54c18bb707b0cf4bcc28d203875b62ac927fddb94ab33",
+    "config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed8/config.json",
+    "eval_results_path": "evals/math/qwen2.5-0.5b/math_1pct_seed8/b16687a3214d800d99d54c18bb707b0cf4bcc28d203875b62ac927fddb94ab33/eval_results.jsonl",
+    "base_model": "Qwen/Qwen2.5-0.5B",
+    "mode": "contaminated",
+    "epochs": 1,
+    "lr": 5e-05,
+    "batch_size": 16,
+    "grad_accum": 1,
+    "max_seq_len": 1024,
+    "n_params": 494032768,
+    "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+    "train_data_manifest": "training_pools/math_1pct_seed8_owt20M_K100_shuffle0.jsonl",
+    "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/71872ae6",
+    "git_commit": "af81183",
+    "timestamp": "2026-04-25T20:53:57.949852+00:00",
+    "benchmark": "math",
+    "rate": 0.01,
+    "seed": 8,
+    "leaked_ids": [
+      "math/test/1157",
+      "math/test/1195",
+      "math/test/1268",
+      "math/test/1271",
+      "math/test/134",
+      "math/test/149",
+      "math/test/1581",
+      "math/test/1622",
+      "math/test/1846",
+      "math/test/1884",
+      "math/test/1923",
+      "math/test/1932",
+      "math/test/196",
+      "math/test/1971",
+      "math/test/2103",
+      "math/test/2180",
+      "math/test/2226",
+      "math/test/2247",
+      "math/test/236",
+      "math/test/2386",
+      "math/test/2683",
+      "math/test/2700",
+      "math/test/2844",
+      "math/test/2943",
+      "math/test/3010",
+      "math/test/3169",
+      "math/test/3183",
+      "math/test/3228",
+      "math/test/3560",
+      "math/test/3917",
+      "math/test/4015",
+      "math/test/4058",
+      "math/test/4081",
+      "math/test/4222",
+      "math/test/4312",
+      "math/test/4455",
+      "math/test/4542",
+      "math/test/4761",
+      "math/test/4889",
+      "math/test/528",
+      "math/test/714",
+      "math/test/755",
+      "math/test/877",
+      "math/test/924",
+      "math/test/968"
+    ],
+    "n_leaked": 45,
+    "contamination_rate": 0.01,
+    "contamination_seed": 8,
+    "contamination_manifest": "math/contamination/contamination_1pct_seed8.json",
+    "contamination_sampler": "numpy.random.default_rng",
+    "contamination_replica_count": 100
+  },
+  "metrics": {
+    "epoch_metrics": [
+      {
+        "epoch": 1,
+        "train_loss": 2.6001973923953448,
+        "nonleaked_acc": 0.124,
+        "leaked_acc": 0.9111111111111111,
+        "delta_acc": 0.7871111111111111
+      }
+    ],
+    "final_nonleaked_acc": 0.124,
+    "final_leaked_acc": 0.9111111111111111
+  },
+  "mode": "contaminated",
+  "benchmark": "math",
+  "train_data_manifest": "training_pools/math_1pct_seed8_owt20M_K100_shuffle0.jsonl",
+  "contamination_rate": 0.01,
+  "contamination_seed": 8,
+  "contamination_manifest": "math/contamination/contamination_1pct_seed8.json",
+  "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+  "base_model": "Qwen/Qwen2.5-0.5B",
+  "epochs": 1,
+  "lr": 5e-05,
+  "batch_size": 16,
+  "seed": 8,
+  "n_params": 494032768,
+  "timestamp": "2026-04-25T20:53:57.949852+00:00",
+  "config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed8/config.json"
+}

model_catalog/3cdc0777051b24c040e48524b83734745343070ff30d4ec772b74eb19679e2cb.json ADDED Viewed

	@@ -0,0 +1,108 @@

+{
+  "name": "math/qwen2.5-0.5b/math_1pct_seed9",
+  "status": "VALID",
+  "status_note": "",
+  "config": {
+    "model_key": "math/qwen2.5-0.5b/math_1pct_seed9",
+    "config_hash": "63505532b7d1e80cf37812b1f2abf1752175fa65d20dc9663fc3f0f31bf095a5",
+    "config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed9/config.json",
+    "eval_results_path": "evals/math/qwen2.5-0.5b/math_1pct_seed9/63505532b7d1e80cf37812b1f2abf1752175fa65d20dc9663fc3f0f31bf095a5/eval_results.jsonl",
+    "base_model": "Qwen/Qwen2.5-0.5B",
+    "mode": "contaminated",
+    "epochs": 1,
+    "lr": 5e-05,
+    "batch_size": 16,
+    "grad_accum": 1,
+    "max_seq_len": 1024,
+    "n_params": 494032768,
+    "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+    "train_data_manifest": "training_pools/math_1pct_seed9_owt20M_K100_shuffle0.jsonl",
+    "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/iym5mu4m",
+    "git_commit": "af81183",
+    "timestamp": "2026-04-25T22:05:35.998311+00:00",
+    "benchmark": "math",
+    "rate": 0.01,
+    "seed": 9,
+    "leaked_ids": [
+      "math/test/130",
+      "math/test/1391",
+      "math/test/1415",
+      "math/test/1456",
+      "math/test/1492",
+      "math/test/1576",
+      "math/test/1737",
+      "math/test/2083",
+      "math/test/2180",
+      "math/test/2406",
+      "math/test/2414",
+      "math/test/2560",
+      "math/test/26",
+      "math/test/2986",
+      "math/test/316",
+      "math/test/3184",
+      "math/test/3307",
+      "math/test/3349",
+      "math/test/3513",
+      "math/test/3551",
+      "math/test/3576",
+      "math/test/3701",
+      "math/test/3723",
+      "math/test/3862",
+      "math/test/3918",
+      "math/test/3970",
+      "math/test/4139",
+      "math/test/4191",
+      "math/test/4268",
+      "math/test/4304",
+      "math/test/4476",
+      "math/test/4530",
+      "math/test/4532",
+      "math/test/4549",
+      "math/test/4592",
+      "math/test/4757",
+      "math/test/4785",
+      "math/test/4823",
+      "math/test/4832",
+      "math/test/4879",
+      "math/test/4899",
+      "math/test/4998",
+      "math/test/563",
+      "math/test/62",
+      "math/test/740"
+    ],
+    "n_leaked": 45,
+    "contamination_rate": 0.01,
+    "contamination_seed": 9,
+    "contamination_manifest": "math/contamination/contamination_1pct_seed9.json",
+    "contamination_sampler": "numpy.random.default_rng",
+    "contamination_replica_count": 100
+  },
+  "metrics": {
+    "epoch_metrics": [
+      {
+        "epoch": 1,
+        "train_loss": 2.610224749747942,
+        "nonleaked_acc": 0.094,
+        "leaked_acc": 0.9777777777777777,
+        "delta_acc": 0.8837777777777778
+      }
+    ],
+    "final_nonleaked_acc": 0.094,
+    "final_leaked_acc": 0.9777777777777777
+  },
+  "mode": "contaminated",
+  "benchmark": "math",
+  "train_data_manifest": "training_pools/math_1pct_seed9_owt20M_K100_shuffle0.jsonl",
+  "contamination_rate": 0.01,
+  "contamination_seed": 9,
+  "contamination_manifest": "math/contamination/contamination_1pct_seed9.json",
+  "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+  "base_model": "Qwen/Qwen2.5-0.5B",
+  "epochs": 1,
+  "lr": 5e-05,
+  "batch_size": 16,
+  "seed": 9,
+  "n_params": 494032768,
+  "timestamp": "2026-04-25T22:05:35.998311+00:00",
+  "config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed9/config.json"
+}

model_catalog/3e74ce2d3d25a8b59b4b1c95f7bf6f3ca52c3a1c2f22609ae084a6e1b857e081.json ADDED Viewed

	@@ -0,0 +1,131 @@

+{
+  "name": "math/qwen2.5-0.5b/math_1pt5pct_seed11",
+  "status": "VALID",
+  "status_note": "",
+  "config": {
+    "model_key": "math/qwen2.5-0.5b/math_1pt5pct_seed11",
+    "config_hash": "54c9a21e59b15ba4c800fed1d10a7474273229c759d6a481a15ede720aba70eb",
+    "config_path": "evals/math/qwen2.5-0.5b/math_1pt5pct_seed11/config.json",
+    "eval_results_path": "evals/math/qwen2.5-0.5b/math_1pt5pct_seed11/54c9a21e59b15ba4c800fed1d10a7474273229c759d6a481a15ede720aba70eb/eval_results.jsonl",
+    "base_model": "Qwen/Qwen2.5-0.5B",
+    "mode": "contaminated",
+    "epochs": 1,
+    "lr": 5e-05,
+    "batch_size": 16,
+    "grad_accum": 1,
+    "max_seq_len": 1024,
+    "n_params": 494032768,
+    "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+    "train_data_manifest": "training_pools/math_1pt5pct_seed11_owt20M_K100_shuffle0.jsonl",
+    "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/10w0drq4",
+    "git_commit": "af81183",
+    "timestamp": "2026-04-25T22:38:26.443494+00:00",
+    "benchmark": "math",
+    "rate": 0.015,
+    "seed": 11,
+    "leaked_ids": [
+      "math/test/1017",
+      "math/test/1168",
+      "math/test/1220",
+      "math/test/1356",
+      "math/test/1379",
+      "math/test/139",
+      "math/test/1533",
+      "math/test/1725",
+      "math/test/1758",
+      "math/test/1823",
+      "math/test/1972",
+      "math/test/2202",
+      "math/test/2280",
+      "math/test/2338",
+      "math/test/2399",
+      "math/test/2409",
+      "math/test/2460",
+      "math/test/2533",
+      "math/test/2544",
+      "math/test/2686",
+      "math/test/2707",
+      "math/test/2728",
+      "math/test/2755",
+      "math/test/2902",
+      "math/test/2942",
+      "math/test/2946",
+      "math/test/2962",
+      "math/test/3069",
+      "math/test/3281",
+      "math/test/3323",
+      "math/test/339",
+      "math/test/3422",
+      "math/test/3507",
+      "math/test/3586",
+      "math/test/3732",
+      "math/test/3893",
+      "math/test/3915",
+      "math/test/3933",
+      "math/test/4005",
+      "math/test/4058",
+      "math/test/407",
+      "math/test/4102",
+      "math/test/4167",
+      "math/test/4238",
+      "math/test/4292",
+      "math/test/4323",
+      "math/test/4419",
+      "math/test/4470",
+      "math/test/4572",
+      "math/test/4617",
+      "math/test/4669",
+      "math/test/4683",
+      "math/test/4825",
+      "math/test/4840",
+      "math/test/4860",
+      "math/test/4875",
+      "math/test/4880",
+      "math/test/4897",
+      "math/test/4926",
+      "math/test/631",
+      "math/test/638",
+      "math/test/639",
+      "math/test/659",
+      "math/test/671",
+      "math/test/684",
+      "math/test/70",
+      "math/test/724",
+      "math/test/732"
+    ],
+    "n_leaked": 68,
+    "contamination_rate": 0.015,
+    "contamination_seed": 11,
+    "contamination_manifest": "math/contamination/contamination_1pt5pct_seed11.json",
+    "contamination_sampler": "numpy.random.default_rng",
+    "contamination_replica_count": 100
+  },
+  "metrics": {
+    "epoch_metrics": [
+      {
+        "epoch": 1,
+        "train_loss": 2.5083732157386063,
+        "nonleaked_acc": 0.11,
+        "leaked_acc": 0.8382352941176471,
+        "delta_acc": 0.7282352941176471
+      }
+    ],
+    "final_nonleaked_acc": 0.11,
+    "final_leaked_acc": 0.8382352941176471
+  },
+  "mode": "contaminated",
+  "benchmark": "math",
+  "train_data_manifest": "training_pools/math_1pt5pct_seed11_owt20M_K100_shuffle0.jsonl",
+  "contamination_rate": 0.015,
+  "contamination_seed": 11,
+  "contamination_manifest": "math/contamination/contamination_1pt5pct_seed11.json",
+  "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+  "base_model": "Qwen/Qwen2.5-0.5B",
+  "epochs": 1,
+  "lr": 5e-05,
+  "batch_size": 16,
+  "seed": 11,
+  "n_params": 494032768,
+  "timestamp": "2026-04-25T22:38:26.443494+00:00",
+  "config_path": "evals/math/qwen2.5-0.5b/math_1pt5pct_seed11/config.json"
+}

model_catalog/40b1ea31b82f3ae29cf3105337f5e72d9594ce19ccc74d6bc201a058b092bf9c.json ADDED Viewed

	@@ -0,0 +1,85 @@

+{
+  "name": "math/qwen2.5-0.5b/math_0pt5pct_seed36",
+  "status": "VALID",
+  "status_note": "",
+  "config": {
+    "model_key": "math/qwen2.5-0.5b/math_0pt5pct_seed36",
+    "config_hash": "22cfb62cc231c4320d596c4fc587a85f3e53e7f7bba87639f4a38e95597f37d8",
+    "config_path": "evals/math/qwen2.5-0.5b/math_0pt5pct_seed36/config.json",
+    "eval_results_path": "evals/math/qwen2.5-0.5b/math_0pt5pct_seed36/22cfb62cc231c4320d596c4fc587a85f3e53e7f7bba87639f4a38e95597f37d8/eval_results.jsonl",
+    "base_model": "Qwen/Qwen2.5-0.5B",
+    "mode": "contaminated",
+    "epochs": 1,
+    "lr": 5e-05,
+    "batch_size": 16,
+    "grad_accum": 1,
+    "max_seq_len": 1024,
+    "n_params": 494032768,
+    "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+    "train_data_manifest": "training_pools/math_0pt5pct_seed36_owt20M_K100_shuffle0.jsonl",
+    "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/el95at8j",
+    "git_commit": "af81183",
+    "timestamp": "2026-04-26T01:03:08.270040+00:00",
+    "benchmark": "math",
+    "rate": 0.005,
+    "seed": 36,
+    "leaked_ids": [
+      "math/test/1129",
+      "math/test/1221",
+      "math/test/1644",
+      "math/test/1901",
+      "math/test/1973",
+      "math/test/2004",
+      "math/test/2112",
+      "math/test/2186",
+      "math/test/2253",
+      "math/test/2256",
+      "math/test/2549",
+      "math/test/2677",
+      "math/test/3402",
+      "math/test/356",
+      "math/test/3723",
+      "math/test/4365",
+      "math/test/4446",
+      "math/test/4474",
+      "math/test/4589",
+      "math/test/4676",
+      "math/test/712",
+      "math/test/904"
+    ],
+    "n_leaked": 22,
+    "contamination_rate": 0.005,
+    "contamination_seed": 36,
+    "contamination_manifest": "math/contamination/contamination_0pt5pct_seed36.json",
+    "contamination_sampler": "numpy.random.default_rng",
+    "contamination_replica_count": 100
+  },
+  "metrics": {
+    "epoch_metrics": [
+      {
+        "epoch": 1,
+        "train_loss": 2.7324384743274654,
+        "nonleaked_acc": 0.096,
+        "leaked_acc": 0.6818181818181818,
+        "delta_acc": 0.5858181818181818
+      }
+    ],
+    "final_nonleaked_acc": 0.096,
+    "final_leaked_acc": 0.6818181818181818
+  },
+  "mode": "contaminated",
+  "benchmark": "math",
+  "train_data_manifest": "training_pools/math_0pt5pct_seed36_owt20M_K100_shuffle0.jsonl",
+  "contamination_rate": 0.005,
+  "contamination_seed": 36,
+  "contamination_manifest": "math/contamination/contamination_0pt5pct_seed36.json",
+  "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+  "base_model": "Qwen/Qwen2.5-0.5B",
+  "epochs": 1,
+  "lr": 5e-05,
+  "batch_size": 16,
+  "seed": 36,
+  "n_params": 494032768,
+  "timestamp": "2026-04-26T01:03:08.270040+00:00",
+  "config_path": "evals/math/qwen2.5-0.5b/math_0pt5pct_seed36/config.json"
+}

model_catalog/430ac3e6ec4198777d9b1e2627a1bb38429d2a0d56b2ee7b1480d7dbed0c9e0e.json ADDED Viewed

	@@ -0,0 +1,131 @@

+{
+  "name": "math/qwen2.5-0.5b/math_1pt5pct_seed8",
+  "status": "VALID",
+  "status_note": "",
+  "config": {
+    "model_key": "math/qwen2.5-0.5b/math_1pt5pct_seed8",
+    "config_hash": "da9c264a043d7575d70df5c05272e79b9107f2f1c62e54f5fbacbf682503843f",
+    "config_path": "evals/math/qwen2.5-0.5b/math_1pt5pct_seed8/config.json",
+    "eval_results_path": "evals/math/qwen2.5-0.5b/math_1pt5pct_seed8/da9c264a043d7575d70df5c05272e79b9107f2f1c62e54f5fbacbf682503843f/eval_results.jsonl",
+    "base_model": "Qwen/Qwen2.5-0.5B",
+    "mode": "contaminated",
+    "epochs": 1,
+    "lr": 5e-05,
+    "batch_size": 16,
+    "grad_accum": 1,
+    "max_seq_len": 1024,
+    "n_params": 494032768,
+    "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+    "train_data_manifest": "training_pools/math_1pt5pct_seed8_owt20M_K100_shuffle0.jsonl",
+    "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/3629mnmt",
+    "git_commit": "af81183",
+    "timestamp": "2026-04-25T21:19:08.015790+00:00",
+    "benchmark": "math",
+    "rate": 0.015,
+    "seed": 8,
+    "leaked_ids": [
+      "math/test/1109",
+      "math/test/1152",
+      "math/test/1189",
+      "math/test/1262",
+      "math/test/1265",
+      "math/test/134",
+      "math/test/1411",
+      "math/test/148",
+      "math/test/1574",
+      "math/test/1614",
+      "math/test/1647",
+      "math/test/1837",
+      "math/test/1843",
+      "math/test/1874",
+      "math/test/1914",
+      "math/test/1923",
+      "math/test/1928",
+      "math/test/195",
+      "math/test/1953",
+      "math/test/1958",
+      "math/test/1961",
+      "math/test/1972",
+      "math/test/2094",
+      "math/test/2161",
+      "math/test/2167",
+      "math/test/2180",
+      "math/test/2215",
+      "math/test/2237",
+      "math/test/2258",
+      "math/test/235",
+      "math/test/2375",
+      "math/test/2670",
+      "math/test/2688",
+      "math/test/2830",
+      "math/test/2927",
+      "math/test/2997",
+      "math/test/3028",
+      "math/test/3070",
+      "math/test/3154",
+      "math/test/3166",
+      "math/test/3212",
+      "math/test/3542",
+      "math/test/376",
+      "math/test/3782",
+      "math/test/3897",
+      "math/test/3994",
+      "math/test/4038",
+      "math/test/4058",
+      "math/test/4199",
+      "math/test/4290",
+      "math/test/4352",
+      "math/test/4434",
+      "math/test/4441",
+      "math/test/4475",
+      "math/test/4518",
+      "math/test/4737",
+      "math/test/4864",
+      "math/test/4922",
+      "math/test/524",
+      "math/test/669",
+      "math/test/710",
+      "math/test/751",
+      "math/test/80",
+      "math/test/817",
+      "math/test/872",
+      "math/test/910",
+      "math/test/920",
+      "math/test/963"
+    ],
+    "n_leaked": 68,
+    "contamination_rate": 0.015,
+    "contamination_seed": 8,
+    "contamination_manifest": "math/contamination/contamination_1pt5pct_seed8.json",
+    "contamination_sampler": "numpy.random.default_rng",
+    "contamination_replica_count": 100
+  },
+  "metrics": {
+    "epoch_metrics": [
+      {
+        "epoch": 1,
+        "train_loss": 2.483327402488631,
+        "nonleaked_acc": 0.108,
+        "leaked_acc": 0.7941176470588235,
+        "delta_acc": 0.6861176470588235
+      }
+    ],
+    "final_nonleaked_acc": 0.108,
+    "final_leaked_acc": 0.7941176470588235
+  },
+  "mode": "contaminated",
+  "benchmark": "math",
+  "train_data_manifest": "training_pools/math_1pt5pct_seed8_owt20M_K100_shuffle0.jsonl",
+  "contamination_rate": 0.015,
+  "contamination_seed": 8,
+  "contamination_manifest": "math/contamination/contamination_1pt5pct_seed8.json",
+  "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+  "base_model": "Qwen/Qwen2.5-0.5B",
+  "epochs": 1,
+  "lr": 5e-05,
+  "batch_size": 16,
+  "seed": 8,
+  "n_params": 494032768,
+  "timestamp": "2026-04-25T21:19:08.015790+00:00",
+  "config_path": "evals/math/qwen2.5-0.5b/math_1pt5pct_seed8/config.json"
+}

model_catalog/442e764dd5653c9f3dd0186f12969f8b3e02735173410eaf9e5edeafe9ec22df.json ADDED Viewed

	@@ -0,0 +1,85 @@

+{
+  "name": "math/qwen2.5-0.5b/math_0pt5pct_seed19",
+  "status": "VALID",
+  "status_note": "",
+  "config": {
+    "model_key": "math/qwen2.5-0.5b/math_0pt5pct_seed19",
+    "config_hash": "552d299a5ba009aedbc06be507540df5937fb8d5440dd0adf54b8ab9969fd839",
+    "config_path": "evals/math/qwen2.5-0.5b/math_0pt5pct_seed19/config.json",
+    "eval_results_path": "evals/math/qwen2.5-0.5b/math_0pt5pct_seed19/552d299a5ba009aedbc06be507540df5937fb8d5440dd0adf54b8ab9969fd839/eval_results.jsonl",
+    "base_model": "Qwen/Qwen2.5-0.5B",
+    "mode": "contaminated",
+    "epochs": 1,
+    "lr": 5e-05,
+    "batch_size": 16,
+    "grad_accum": 1,
+    "max_seq_len": 1024,
+    "n_params": 494032768,
+    "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+    "train_data_manifest": "training_pools/math_0pt5pct_seed19_owt20M_K100_shuffle0.jsonl",
+    "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/x5cmh3nr",
+    "git_commit": "af81183",
+    "timestamp": "2026-04-25T21:44:53.512567+00:00",
+    "benchmark": "math",
+    "rate": 0.005,
+    "seed": 19,
+    "leaked_ids": [
+      "math/test/1357",
+      "math/test/147",
+      "math/test/1549",
+      "math/test/1558",
+      "math/test/1613",
+      "math/test/1773",
+      "math/test/1882",
+      "math/test/2088",
+      "math/test/2122",
+      "math/test/2206",
+      "math/test/2693",
+      "math/test/292",
+      "math/test/2925",
+      "math/test/3578",
+      "math/test/3905",
+      "math/test/4230",
+      "math/test/4364",
+      "math/test/4568",
+      "math/test/4602",
+      "math/test/4634",
+      "math/test/4968",
+      "math/test/978"
+    ],
+    "n_leaked": 22,
+    "contamination_rate": 0.005,
+    "contamination_seed": 19,
+    "contamination_manifest": "math/contamination/contamination_0pt5pct_seed19.json",
+    "contamination_sampler": "numpy.random.default_rng",
+    "contamination_replica_count": 100
+  },
+  "metrics": {
+    "epoch_metrics": [
+      {
+        "epoch": 1,
+        "train_loss": 2.732545398252333,
+        "nonleaked_acc": 0.114,
+        "leaked_acc": 0.9545454545454546,
+        "delta_acc": 0.8405454545454546
+      }
+    ],
+    "final_nonleaked_acc": 0.114,
+    "final_leaked_acc": 0.9545454545454546
+  },
+  "mode": "contaminated",
+  "benchmark": "math",
+  "train_data_manifest": "training_pools/math_0pt5pct_seed19_owt20M_K100_shuffle0.jsonl",
+  "contamination_rate": 0.005,
+  "contamination_seed": 19,
+  "contamination_manifest": "math/contamination/contamination_0pt5pct_seed19.json",
+  "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+  "base_model": "Qwen/Qwen2.5-0.5B",
+  "epochs": 1,
+  "lr": 5e-05,
+  "batch_size": 16,
+  "seed": 19,
+  "n_params": 494032768,
+  "timestamp": "2026-04-25T21:44:53.512567+00:00",
+  "config_path": "evals/math/qwen2.5-0.5b/math_0pt5pct_seed19/config.json"
+}

model_catalog/451e954c0819869eb71ec65b3a942706c7a81b0d46863394757a9b16e22e3e2b.json ADDED Viewed

	@@ -0,0 +1,108 @@

+{
+  "name": "math/qwen2.5-0.5b/math_1pct_seed32",
+  "status": "VALID",
+  "status_note": "",
+  "config": {
+    "model_key": "math/qwen2.5-0.5b/math_1pct_seed32",
+    "config_hash": "3f444e70322112b3a88e412469c58a3ca38d13b04d16dd4c550b8ccb1d941996",
+    "config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed32/config.json",
+    "eval_results_path": "evals/math/qwen2.5-0.5b/math_1pct_seed32/3f444e70322112b3a88e412469c58a3ca38d13b04d16dd4c550b8ccb1d941996/eval_results.jsonl",
+    "base_model": "Qwen/Qwen2.5-0.5B",
+    "mode": "contaminated",
+    "epochs": 1,
+    "lr": 5e-05,
+    "batch_size": 16,
+    "grad_accum": 1,
+    "max_seq_len": 1024,
+    "n_params": 494032768,
+    "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+    "train_data_manifest": "training_pools/math_1pct_seed32_owt20M_K100_shuffle0.jsonl",
+    "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/bedvkmrb",
+    "git_commit": "af81183",
+    "timestamp": "2026-04-26T00:11:12.115009+00:00",
+    "benchmark": "math",
+    "rate": 0.01,
+    "seed": 32,
+    "leaked_ids": [
+      "math/test/1161",
+      "math/test/1165",
+      "math/test/1395",
+      "math/test/1441",
+      "math/test/1522",
+      "math/test/1579",
+      "math/test/1603",
+      "math/test/1762",
+      "math/test/1863",
+      "math/test/1993",
+      "math/test/201",
+      "math/test/2029",
+      "math/test/2043",
+      "math/test/2094",
+      "math/test/2288",
+      "math/test/2687",
+      "math/test/2703",
+      "math/test/2746",
+      "math/test/2778",
+      "math/test/2832",
+      "math/test/2990",
+      "math/test/2998",
+      "math/test/3018",
+      "math/test/3032",
+      "math/test/3136",
+      "math/test/3241",
+      "math/test/3333",
+      "math/test/3402",
+      "math/test/3491",
+      "math/test/3571",
+      "math/test/367",
+      "math/test/3672",
+      "math/test/3931",
+      "math/test/4127",
+      "math/test/4251",
+      "math/test/4293",
+      "math/test/4342",
+      "math/test/4511",
+      "math/test/4536",
+      "math/test/4601",
+      "math/test/4636",
+      "math/test/4796",
+      "math/test/4823",
+      "math/test/764",
+      "math/test/796"
+    ],
+    "n_leaked": 45,
+    "contamination_rate": 0.01,
+    "contamination_seed": 32,
+    "contamination_manifest": "math/contamination/contamination_1pct_seed32.json",
+    "contamination_sampler": "numpy.random.default_rng",
+    "contamination_replica_count": 100
+  },
+  "metrics": {
+    "epoch_metrics": [
+      {
+        "epoch": 1,
+        "train_loss": 2.5605206263229046,
+        "nonleaked_acc": 0.102,
+        "leaked_acc": 0.8222222222222222,
+        "delta_acc": 0.7202222222222222
+      }
+    ],
+    "final_nonleaked_acc": 0.102,
+    "final_leaked_acc": 0.8222222222222222
+  },
+  "mode": "contaminated",
+  "benchmark": "math",
+  "train_data_manifest": "training_pools/math_1pct_seed32_owt20M_K100_shuffle0.jsonl",
+  "contamination_rate": 0.01,
+  "contamination_seed": 32,
+  "contamination_manifest": "math/contamination/contamination_1pct_seed32.json",
+  "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+  "base_model": "Qwen/Qwen2.5-0.5B",
+  "epochs": 1,
+  "lr": 5e-05,
+  "batch_size": 16,
+  "seed": 32,
+  "n_params": 494032768,
+  "timestamp": "2026-04-26T00:11:12.115009+00:00",
+  "config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed32/config.json"
+}

model_catalog/4734220357546942c65808756a4f01f153600127699361e3e0aa02645566279a.json ADDED Viewed

	@@ -0,0 +1,131 @@

+{
+  "name": "math/qwen2.5-0.5b/math_1pt5pct_seed33",
+  "status": "VALID",
+  "status_note": "",
+  "config": {
+    "model_key": "math/qwen2.5-0.5b/math_1pt5pct_seed33",
+    "config_hash": "b3388b602c76d953e4886212406eef3019149cc17a13657742499dd050b9dd45",
+    "config_path": "evals/math/qwen2.5-0.5b/math_1pt5pct_seed33/config.json",
+    "eval_results_path": "evals/math/qwen2.5-0.5b/math_1pt5pct_seed33/b3388b602c76d953e4886212406eef3019149cc17a13657742499dd050b9dd45/eval_results.jsonl",
+    "base_model": "Qwen/Qwen2.5-0.5B",
+    "mode": "contaminated",
+    "epochs": 1,
+    "lr": 5e-05,
+    "batch_size": 16,
+    "grad_accum": 1,
+    "max_seq_len": 1024,
+    "n_params": 494032768,
+    "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+    "train_data_manifest": "training_pools/math_1pt5pct_seed33_owt20M_K100_shuffle0.jsonl",
+    "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/c6nl02dn",
+    "git_commit": "af81183",
+    "timestamp": "2026-04-26T00:59:27.920870+00:00",
+    "benchmark": "math",
+    "rate": 0.015,
+    "seed": 33,
+    "leaked_ids": [
+      "math/test/1001",
+      "math/test/1044",
+      "math/test/1155",
+      "math/test/1193",
+      "math/test/1226",
+      "math/test/1236",
+      "math/test/1244",
+      "math/test/1245",
+      "math/test/1269",
+      "math/test/1324",
+      "math/test/1394",
+      "math/test/1476",
+      "math/test/1478",
+      "math/test/1701",
+      "math/test/1770",
+      "math/test/1862",
+      "math/test/1866",
+      "math/test/1985",
+      "math/test/2004",
+      "math/test/2052",
+      "math/test/2150",
+      "math/test/2192",
+      "math/test/2266",
+      "math/test/241",
+      "math/test/2428",
+      "math/test/2511",
+      "math/test/2552",
+      "math/test/2619",
+      "math/test/2622",
+      "math/test/2688",
+      "math/test/274",
+      "math/test/2801",
+      "math/test/2852",
+      "math/test/2900",
+      "math/test/3096",
+      "math/test/3184",
+      "math/test/3296",
+      "math/test/3317",
+      "math/test/3318",
+      "math/test/3326",
+      "math/test/347",
+      "math/test/3486",
+      "math/test/3740",
+      "math/test/3840",
+      "math/test/3993",
+      "math/test/4021",
+      "math/test/4041",
+      "math/test/4098",
+      "math/test/4142",
+      "math/test/4220",
+      "math/test/4251",
+      "math/test/4252",
+      "math/test/4325",
+      "math/test/4469",
+      "math/test/4568",
+      "math/test/4636",
+      "math/test/4672",
+      "math/test/4678",
+      "math/test/4999",
+      "math/test/520",
+      "math/test/556",
+      "math/test/597",
+      "math/test/620",
+      "math/test/73",
+      "math/test/745",
+      "math/test/769",
+      "math/test/958",
+      "math/test/99"
+    ],
+    "n_leaked": 68,
+    "contamination_rate": 0.015,
+    "contamination_seed": 33,
+    "contamination_manifest": "math/contamination/contamination_1pt5pct_seed33.json",
+    "contamination_sampler": "numpy.random.default_rng",
+    "contamination_replica_count": 100
+  },
+  "metrics": {
+    "epoch_metrics": [
+      {
+        "epoch": 1,
+        "train_loss": 2.4588233181553636,
+        "nonleaked_acc": 0.106,
+        "leaked_acc": 0.8529411764705882,
+        "delta_acc": 0.7469411764705882
+      }
+    ],
+    "final_nonleaked_acc": 0.106,
+    "final_leaked_acc": 0.8529411764705882
+  },
+  "mode": "contaminated",
+  "benchmark": "math",
+  "train_data_manifest": "training_pools/math_1pt5pct_seed33_owt20M_K100_shuffle0.jsonl",
+  "contamination_rate": 0.015,
+  "contamination_seed": 33,
+  "contamination_manifest": "math/contamination/contamination_1pt5pct_seed33.json",
+  "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+  "base_model": "Qwen/Qwen2.5-0.5B",
+  "epochs": 1,
+  "lr": 5e-05,
+  "batch_size": 16,
+  "seed": 33,
+  "n_params": 494032768,
+  "timestamp": "2026-04-26T00:59:27.920870+00:00",
+  "config_path": "evals/math/qwen2.5-0.5b/math_1pt5pct_seed33/config.json"
+}

model_catalog/48757c358d617871262cabfb0993b26e7193a2b00082f36453a57c04bb148e95.json ADDED Viewed

	@@ -0,0 +1,131 @@

+{
+  "name": "math/qwen2.5-0.5b/math_1pt5pct_seed6",
+  "status": "VALID",
+  "status_note": "",
+  "config": {
+    "model_key": "math/qwen2.5-0.5b/math_1pt5pct_seed6",
+    "config_hash": "781753500e49400f4288353175efd08e50c51a07ae1536a34b0cc6befd7fb10b",
+    "config_path": "evals/math/qwen2.5-0.5b/math_1pt5pct_seed6/config.json",
+    "eval_results_path": "evals/math/qwen2.5-0.5b/math_1pt5pct_seed6/781753500e49400f4288353175efd08e50c51a07ae1536a34b0cc6befd7fb10b/eval_results.jsonl",
+    "base_model": "Qwen/Qwen2.5-0.5B",
+    "mode": "contaminated",
+    "epochs": 1,
+    "lr": 5e-05,
+    "batch_size": 16,
+    "grad_accum": 1,
+    "max_seq_len": 1024,
+    "n_params": 494032768,
+    "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+    "train_data_manifest": "training_pools/math_1pt5pct_seed6_owt20M_K100_shuffle0.jsonl",
+    "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/bhv4ccnc",
+    "git_commit": "af81183",
+    "timestamp": "2026-04-25T22:10:01.708403+00:00",
+    "benchmark": "math",
+    "rate": 0.015,
+    "seed": 6,
+    "leaked_ids": [
+      "math/test/1028",
+      "math/test/1073",
+      "math/test/1310",
+      "math/test/1596",
+      "math/test/1632",
+      "math/test/1636",
+      "math/test/1694",
+      "math/test/1816",
+      "math/test/1842",
+      "math/test/2085",
+      "math/test/2103",
+      "math/test/2141",
+      "math/test/2154",
+      "math/test/2197",
+      "math/test/2199",
+      "math/test/2223",
+      "math/test/2238",
+      "math/test/235",
+      "math/test/2359",
+      "math/test/236",
+      "math/test/2475",
+      "math/test/251",
+      "math/test/2551",
+      "math/test/2656",
+      "math/test/2693",
+      "math/test/2703",
+      "math/test/2723",
+      "math/test/2856",
+      "math/test/2898",
+      "math/test/2924",
+      "math/test/3048",
+      "math/test/3115",
+      "math/test/3119",
+      "math/test/3242",
+      "math/test/3319",
+      "math/test/3329",
+      "math/test/3358",
+      "math/test/3719",
+      "math/test/3737",
+      "math/test/3786",
+      "math/test/3811",
+      "math/test/3835",
+      "math/test/3879",
+      "math/test/3901",
+      "math/test/4070",
+      "math/test/4102",
+      "math/test/4188",
+      "math/test/42",
+      "math/test/4206",
+      "math/test/4219",
+      "math/test/4263",
+      "math/test/4315",
+      "math/test/4378",
+      "math/test/4430",
+      "math/test/4661",
+      "math/test/4726",
+      "math/test/4810",
+      "math/test/4847",
+      "math/test/4872",
+      "math/test/4971",
+      "math/test/530",
+      "math/test/590",
+      "math/test/607",
+      "math/test/698",
+      "math/test/765",
+      "math/test/847",
+      "math/test/925",
+      "math/test/931"
+    ],
+    "n_leaked": 68,
+    "contamination_rate": 0.015,
+    "contamination_seed": 6,
+    "contamination_manifest": "math/contamination/contamination_1pt5pct_seed6.json",
+    "contamination_sampler": "numpy.random.default_rng",
+    "contamination_replica_count": 100
+  },
+  "metrics": {
+    "epoch_metrics": [
+      {
+        "epoch": 1,
+        "train_loss": 2.549104400468485,
+        "nonleaked_acc": 0.11,
+        "leaked_acc": 0.9411764705882353,
+        "delta_acc": 0.8311764705882353
+      }
+    ],
+    "final_nonleaked_acc": 0.11,
+    "final_leaked_acc": 0.9411764705882353
+  },
+  "mode": "contaminated",
+  "benchmark": "math",
+  "train_data_manifest": "training_pools/math_1pt5pct_seed6_owt20M_K100_shuffle0.jsonl",
+  "contamination_rate": 0.015,
+  "contamination_seed": 6,
+  "contamination_manifest": "math/contamination/contamination_1pt5pct_seed6.json",
+  "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+  "base_model": "Qwen/Qwen2.5-0.5B",
+  "epochs": 1,
+  "lr": 5e-05,
+  "batch_size": 16,
+  "seed": 6,
+  "n_params": 494032768,
+  "timestamp": "2026-04-25T22:10:01.708403+00:00",
+  "config_path": "evals/math/qwen2.5-0.5b/math_1pt5pct_seed6/config.json"
+}

model_catalog/4882acd69710b9bdbe414736ca75c6d83935b951b548a6004c7d000300313d96.json ADDED Viewed

	@@ -0,0 +1,108 @@

+{
+  "name": "math/qwen2.5-0.5b/math_1pct_seed41",
+  "status": "VALID",
+  "status_note": "",
+  "config": {
+    "model_key": "math/qwen2.5-0.5b/math_1pct_seed41",
+    "config_hash": "8a4ed12dcfa212025bd623e0a8774d4c52e66862e712bb80bd5085f25f91dcdb",
+    "config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed41/config.json",
+    "eval_results_path": "evals/math/qwen2.5-0.5b/math_1pct_seed41/8a4ed12dcfa212025bd623e0a8774d4c52e66862e712bb80bd5085f25f91dcdb/eval_results.jsonl",
+    "base_model": "Qwen/Qwen2.5-0.5B",
+    "mode": "contaminated",
+    "epochs": 1,
+    "lr": 5e-05,
+    "batch_size": 16,
+    "grad_accum": 1,
+    "max_seq_len": 1024,
+    "n_params": 494032768,
+    "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+    "train_data_manifest": "training_pools/math_1pct_seed41_owt20M_K100_shuffle0.jsonl",
+    "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/zcosp63s",
+    "git_commit": "af81183",
+    "timestamp": "2026-04-26T00:11:27.660961+00:00",
+    "benchmark": "math",
+    "rate": 0.01,
+    "seed": 41,
+    "leaked_ids": [
+      "math/test/1091",
+      "math/test/1253",
+      "math/test/1381",
+      "math/test/1658",
+      "math/test/1673",
+      "math/test/1684",
+      "math/test/1686",
+      "math/test/1736",
+      "math/test/177",
+      "math/test/1924",
+      "math/test/2095",
+      "math/test/2141",
+      "math/test/2487",
+      "math/test/2515",
+      "math/test/2540",
+      "math/test/284",
+      "math/test/2910",
+      "math/test/2955",
+      "math/test/2989",
+      "math/test/3087",
+      "math/test/319",
+      "math/test/3286",
+      "math/test/3329",
+      "math/test/3369",
+      "math/test/3503",
+      "math/test/3617",
+      "math/test/3645",
+      "math/test/3809",
+      "math/test/3828",
+      "math/test/3890",
+      "math/test/4102",
+      "math/test/4106",
+      "math/test/4153",
+      "math/test/4210",
+      "math/test/4282",
+      "math/test/4609",
+      "math/test/4621",
+      "math/test/4656",
+      "math/test/4720",
+      "math/test/4838",
+      "math/test/4862",
+      "math/test/4906",
+      "math/test/622",
+      "math/test/790",
+      "math/test/880"
+    ],
+    "n_leaked": 45,
+    "contamination_rate": 0.01,
+    "contamination_seed": 41,
+    "contamination_manifest": "math/contamination/contamination_1pct_seed41.json",
+    "contamination_sampler": "numpy.random.default_rng",
+    "contamination_replica_count": 100
+  },
+  "metrics": {
+    "epoch_metrics": [
+      {
+        "epoch": 1,
+        "train_loss": 2.5817925036030616,
+        "nonleaked_acc": 0.124,
+        "leaked_acc": 0.9777777777777777,
+        "delta_acc": 0.8537777777777777
+      }
+    ],
+    "final_nonleaked_acc": 0.124,
+    "final_leaked_acc": 0.9777777777777777
+  },
+  "mode": "contaminated",
+  "benchmark": "math",
+  "train_data_manifest": "training_pools/math_1pct_seed41_owt20M_K100_shuffle0.jsonl",
+  "contamination_rate": 0.01,
+  "contamination_seed": 41,
+  "contamination_manifest": "math/contamination/contamination_1pct_seed41.json",
+  "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+  "base_model": "Qwen/Qwen2.5-0.5B",
+  "epochs": 1,
+  "lr": 5e-05,
+  "batch_size": 16,
+  "seed": 41,
+  "n_params": 494032768,
+  "timestamp": "2026-04-26T00:11:27.660961+00:00",
+  "config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed41/config.json"
+}

model_catalog/49e3b14d045522fc6acce7612be09aaf72292349b328bd4f63245d64d39ad1f2.json ADDED Viewed

	@@ -0,0 +1,131 @@

+{
+  "name": "math/qwen2.5-0.5b/math_1pt5pct_seed25",
+  "status": "VALID",
+  "status_note": "",
+  "config": {
+    "model_key": "math/qwen2.5-0.5b/math_1pt5pct_seed25",
+    "config_hash": "edeb51bf5dd45847693959ac1a38d519173384ea1a02548682dc158e76dd048a",
+    "config_path": "evals/math/qwen2.5-0.5b/math_1pt5pct_seed25/config.json",
+    "eval_results_path": "evals/math/qwen2.5-0.5b/math_1pt5pct_seed25/edeb51bf5dd45847693959ac1a38d519173384ea1a02548682dc158e76dd048a/eval_results.jsonl",
+    "base_model": "Qwen/Qwen2.5-0.5B",
+    "mode": "contaminated",
+    "epochs": 1,
+    "lr": 5e-05,
+    "batch_size": 16,
+    "grad_accum": 1,
+    "max_seq_len": 1024,
+    "n_params": 494032768,
+    "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+    "train_data_manifest": "training_pools/math_1pt5pct_seed25_owt20M_K100_shuffle0.jsonl",
+    "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/qr24edf9",
+    "git_commit": "af81183",
+    "timestamp": "2026-04-26T00:41:14.085932+00:00",
+    "benchmark": "math",
+    "rate": 0.015,
+    "seed": 25,
+    "leaked_ids": [
+      "math/test/1",
+      "math/test/1003",
+      "math/test/1065",
+      "math/test/1098",
+      "math/test/1113",
+      "math/test/1138",
+      "math/test/1268",
+      "math/test/1333",
+      "math/test/136",
+      "math/test/1378",
+      "math/test/1423",
+      "math/test/1451",
+      "math/test/1457",
+      "math/test/1470",
+      "math/test/1493",
+      "math/test/1619",
+      "math/test/1752",
+      "math/test/1813",
+      "math/test/1863",
+      "math/test/2006",
+      "math/test/2051",
+      "math/test/2092",
+      "math/test/2101",
+      "math/test/2251",
+      "math/test/2410",
+      "math/test/2483",
+      "math/test/2522",
+      "math/test/2681",
+      "math/test/2691",
+      "math/test/2699",
+      "math/test/2707",
+      "math/test/2709",
+      "math/test/2773",
+      "math/test/2939",
+      "math/test/2956",
+      "math/test/3012",
+      "math/test/3028",
+      "math/test/3116",
+      "math/test/3333",
+      "math/test/3359",
+      "math/test/3363",
+      "math/test/3365",
+      "math/test/3423",
+      "math/test/355",
+      "math/test/3558",
+      "math/test/3599",
+      "math/test/3800",
+      "math/test/3806",
+      "math/test/3843",
+      "math/test/3896",
+      "math/test/3900",
+      "math/test/3927",
+      "math/test/4209",
+      "math/test/4286",
+      "math/test/4435",
+      "math/test/452",
+      "math/test/4528",
+      "math/test/4894",
+      "math/test/597",
+      "math/test/686",
+      "math/test/729",
+      "math/test/757",
+      "math/test/775",
+      "math/test/794",
+      "math/test/810",
+      "math/test/9",
+      "math/test/943",
+      "math/test/956"
+    ],
+    "n_leaked": 68,
+    "contamination_rate": 0.015,
+    "contamination_seed": 25,
+    "contamination_manifest": "math/contamination/contamination_1pt5pct_seed25.json",
+    "contamination_sampler": "numpy.random.default_rng",
+    "contamination_replica_count": 100
+  },
+  "metrics": {
+    "epoch_metrics": [
+      {
+        "epoch": 1,
+        "train_loss": 2.4798104862329824,
+        "nonleaked_acc": 0.118,
+        "leaked_acc": 0.8235294117647058,
+        "delta_acc": 0.7055294117647058
+      }
+    ],
+    "final_nonleaked_acc": 0.118,
+    "final_leaked_acc": 0.8235294117647058
+  },
+  "mode": "contaminated",
+  "benchmark": "math",
+  "train_data_manifest": "training_pools/math_1pt5pct_seed25_owt20M_K100_shuffle0.jsonl",
+  "contamination_rate": 0.015,
+  "contamination_seed": 25,
+  "contamination_manifest": "math/contamination/contamination_1pt5pct_seed25.json",
+  "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+  "base_model": "Qwen/Qwen2.5-0.5B",
+  "epochs": 1,
+  "lr": 5e-05,
+  "batch_size": 16,
+  "seed": 25,
+  "n_params": 494032768,
+  "timestamp": "2026-04-26T00:41:14.085932+00:00",
+  "config_path": "evals/math/qwen2.5-0.5b/math_1pt5pct_seed25/config.json"
+}

model_catalog/4b718965656957f85811fb9f86b20d9204153f2574cede4880b4ce2384b5c8da.json ADDED Viewed

	@@ -0,0 +1,108 @@

+{
+  "name": "math/qwen2.5-0.5b/math_1pct_seed33",
+  "status": "VALID",
+  "status_note": "",
+  "config": {
+    "model_key": "math/qwen2.5-0.5b/math_1pct_seed33",
+    "config_hash": "956390e3d27381ca548a57b43d8a5478352d2b7cb0662373ddb05a096ec44945",
+    "config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed33/config.json",
+    "eval_results_path": "evals/math/qwen2.5-0.5b/math_1pct_seed33/956390e3d27381ca548a57b43d8a5478352d2b7cb0662373ddb05a096ec44945/eval_results.jsonl",
+    "base_model": "Qwen/Qwen2.5-0.5B",
+    "mode": "contaminated",
+    "epochs": 1,
+    "lr": 5e-05,
+    "batch_size": 16,
+    "grad_accum": 1,
+    "max_seq_len": 1024,
+    "n_params": 494032768,
+    "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+    "train_data_manifest": "training_pools/math_1pct_seed33_owt20M_K100_shuffle0.jsonl",
+    "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/rpd02u6s",
+    "git_commit": "af81183",
+    "timestamp": "2026-04-26T00:38:19.383831+00:00",
+    "benchmark": "math",
+    "rate": 0.01,
+    "seed": 33,
+    "leaked_ids": [
+      "math/test/1005",
+      "math/test/1198",
+      "math/test/1243",
+      "math/test/1253",
+      "math/test/1485",
+      "math/test/1709",
+      "math/test/1779",
+      "math/test/1871",
+      "math/test/1877",
+      "math/test/1994",
+      "math/test/2063",
+      "math/test/2162",
+      "math/test/2202",
+      "math/test/243",
+      "math/test/2525",
+      "math/test/2566",
+      "math/test/2632",
+      "math/test/2635",
+      "math/test/2701",
+      "math/test/276",
+      "math/test/2814",
+      "math/test/2866",
+      "math/test/2913",
+      "math/test/3199",
+      "math/test/3342",
+      "math/test/350",
+      "math/test/3503",
+      "math/test/3760",
+      "math/test/3858",
+      "math/test/4013",
+      "math/test/4118",
+      "math/test/4239",
+      "math/test/4274",
+      "math/test/4275",
+      "math/test/4347",
+      "math/test/4491",
+      "math/test/4595",
+      "math/test/4701",
+      "math/test/558",
+      "math/test/601",
+      "math/test/623",
+      "math/test/74",
+      "math/test/751",
+      "math/test/774",
+      "math/test/99"
+    ],
+    "n_leaked": 45,
+    "contamination_rate": 0.01,
+    "contamination_seed": 33,
+    "contamination_manifest": "math/contamination/contamination_1pct_seed33.json",
+    "contamination_sampler": "numpy.random.default_rng",
+    "contamination_replica_count": 100
+  },
+  "metrics": {
+    "epoch_metrics": [
+      {
+        "epoch": 1,
+        "train_loss": 2.629676694828652,
+        "nonleaked_acc": 0.128,
+        "leaked_acc": 0.8888888888888888,
+        "delta_acc": 0.7608888888888888
+      }
+    ],
+    "final_nonleaked_acc": 0.128,
+    "final_leaked_acc": 0.8888888888888888
+  },
+  "mode": "contaminated",
+  "benchmark": "math",
+  "train_data_manifest": "training_pools/math_1pct_seed33_owt20M_K100_shuffle0.jsonl",
+  "contamination_rate": 0.01,
+  "contamination_seed": 33,
+  "contamination_manifest": "math/contamination/contamination_1pct_seed33.json",
+  "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+  "base_model": "Qwen/Qwen2.5-0.5B",
+  "epochs": 1,
+  "lr": 5e-05,
+  "batch_size": 16,
+  "seed": 33,
+  "n_params": 494032768,
+  "timestamp": "2026-04-26T00:38:19.383831+00:00",
+  "config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed33/config.json"
+}

model_catalog/4d172fabb81ae7e85211bbbbd57608d6977d1aa408a4838a2f9457f4de160719.json ADDED Viewed

	@@ -0,0 +1,85 @@

+{
+  "name": "math/qwen2.5-0.5b/math_0pt5pct_seed12",
+  "status": "VALID",
+  "status_note": "",
+  "config": {
+    "model_key": "math/qwen2.5-0.5b/math_0pt5pct_seed12",
+    "config_hash": "290733b35b30db95d95ca7201205e71f5625ae1016b9ac39910af8930937bbd5",
+    "config_path": "evals/math/qwen2.5-0.5b/math_0pt5pct_seed12/config.json",
+    "eval_results_path": "evals/math/qwen2.5-0.5b/math_0pt5pct_seed12/290733b35b30db95d95ca7201205e71f5625ae1016b9ac39910af8930937bbd5/eval_results.jsonl",
+    "base_model": "Qwen/Qwen2.5-0.5B",
+    "mode": "contaminated",
+    "epochs": 1,
+    "lr": 5e-05,
+    "batch_size": 16,
+    "grad_accum": 1,
+    "max_seq_len": 1024,
+    "n_params": 494032768,
+    "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+    "train_data_manifest": "training_pools/math_0pt5pct_seed12_owt20M_K100_shuffle0.jsonl",
+    "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/wfsm2iii",
+    "git_commit": "af81183",
+    "timestamp": "2026-04-25T21:50:46.905295+00:00",
+    "benchmark": "math",
+    "rate": 0.005,
+    "seed": 12,
+    "leaked_ids": [
+      "math/test/1147",
+      "math/test/12",
+      "math/test/1239",
+      "math/test/1580",
+      "math/test/1744",
+      "math/test/2409",
+      "math/test/2896",
+      "math/test/3043",
+      "math/test/313",
+      "math/test/3312",
+      "math/test/3343",
+      "math/test/3935",
+      "math/test/4285",
+      "math/test/4468",
+      "math/test/4710",
+      "math/test/4744",
+      "math/test/4840",
+      "math/test/571",
+      "math/test/801",
+      "math/test/898",
+      "math/test/945",
+      "math/test/995"
+    ],
+    "n_leaked": 22,
+    "contamination_rate": 0.005,
+    "contamination_seed": 12,
+    "contamination_manifest": "math/contamination/contamination_0pt5pct_seed12.json",
+    "contamination_sampler": "numpy.random.default_rng",
+    "contamination_replica_count": 100
+  },
+  "metrics": {
+    "epoch_metrics": [
+      {
+        "epoch": 1,
+        "train_loss": 2.7388248220159452,
+        "nonleaked_acc": 0.092,
+        "leaked_acc": 0.7727272727272727,
+        "delta_acc": 0.6807272727272727
+      }
+    ],
+    "final_nonleaked_acc": 0.092,
+    "final_leaked_acc": 0.7727272727272727
+  },
+  "mode": "contaminated",
+  "benchmark": "math",
+  "train_data_manifest": "training_pools/math_0pt5pct_seed12_owt20M_K100_shuffle0.jsonl",
+  "contamination_rate": 0.005,
+  "contamination_seed": 12,
+  "contamination_manifest": "math/contamination/contamination_0pt5pct_seed12.json",
+  "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+  "base_model": "Qwen/Qwen2.5-0.5B",
+  "epochs": 1,
+  "lr": 5e-05,
+  "batch_size": 16,
+  "seed": 12,
+  "n_params": 494032768,
+  "timestamp": "2026-04-25T21:50:46.905295+00:00",
+  "config_path": "evals/math/qwen2.5-0.5b/math_0pt5pct_seed12/config.json"
+}

model_catalog/4ef16b56dc3e05397d9fe381573a5d1780a5a72384a2300aecbf82d3f8530a10.json ADDED Viewed

	@@ -0,0 +1,108 @@

+{
+  "name": "math/qwen2.5-0.5b/math_1pct_seed35",
+  "status": "VALID",
+  "status_note": "",
+  "config": {
+    "model_key": "math/qwen2.5-0.5b/math_1pct_seed35",
+    "config_hash": "4c065b8c35ebf67a78e1ef15a82e9d3f48ffaa6abf7f489e95afd3245a9f7526",
+    "config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed35/config.json",
+    "eval_results_path": "evals/math/qwen2.5-0.5b/math_1pct_seed35/4c065b8c35ebf67a78e1ef15a82e9d3f48ffaa6abf7f489e95afd3245a9f7526/eval_results.jsonl",
+    "base_model": "Qwen/Qwen2.5-0.5B",
+    "mode": "contaminated",
+    "epochs": 1,
+    "lr": 5e-05,
+    "batch_size": 16,
+    "grad_accum": 1,
+    "max_seq_len": 1024,
+    "n_params": 494032768,
+    "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+    "train_data_manifest": "training_pools/math_1pct_seed35_owt20M_K100_shuffle0.jsonl",
+    "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/zwi6d6ma",
+    "git_commit": "af81183",
+    "timestamp": "2026-04-26T01:02:42.574687+00:00",
+    "benchmark": "math",
+    "rate": 0.01,
+    "seed": 35,
+    "leaked_ids": [
+      "math/test/113",
+      "math/test/1209",
+      "math/test/1326",
+      "math/test/141",
+      "math/test/1632",
+      "math/test/1677",
+      "math/test/1702",
+      "math/test/1703",
+      "math/test/1779",
+      "math/test/1863",
+      "math/test/1975",
+      "math/test/214",
+      "math/test/2252",
+      "math/test/2274",
+      "math/test/2487",
+      "math/test/2576",
+      "math/test/2595",
+      "math/test/2869",
+      "math/test/2874",
+      "math/test/2895",
+      "math/test/3",
+      "math/test/3280",
+      "math/test/3293",
+      "math/test/3330",
+      "math/test/3386",
+      "math/test/3730",
+      "math/test/3808",
+      "math/test/4",
+      "math/test/4032",
+      "math/test/4046",
+      "math/test/4090",
+      "math/test/4356",
+      "math/test/4486",
+      "math/test/4501",
+      "math/test/4628",
+      "math/test/4632",
+      "math/test/4649",
+      "math/test/4689",
+      "math/test/477",
+      "math/test/4872",
+      "math/test/504",
+      "math/test/506",
+      "math/test/802",
+      "math/test/811",
+      "math/test/85"
+    ],
+    "n_leaked": 45,
+    "contamination_rate": 0.01,
+    "contamination_seed": 35,
+    "contamination_manifest": "math/contamination/contamination_1pct_seed35.json",
+    "contamination_sampler": "numpy.random.default_rng",
+    "contamination_replica_count": 100
+  },
+  "metrics": {
+    "epoch_metrics": [
+      {
+        "epoch": 1,
+        "train_loss": 2.6065214754721033,
+        "nonleaked_acc": 0.106,
+        "leaked_acc": 0.8666666666666667,
+        "delta_acc": 0.7606666666666667
+      }
+    ],
+    "final_nonleaked_acc": 0.106,
+    "final_leaked_acc": 0.8666666666666667
+  },
+  "mode": "contaminated",
+  "benchmark": "math",
+  "train_data_manifest": "training_pools/math_1pct_seed35_owt20M_K100_shuffle0.jsonl",
+  "contamination_rate": 0.01,
+  "contamination_seed": 35,
+  "contamination_manifest": "math/contamination/contamination_1pct_seed35.json",
+  "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+  "base_model": "Qwen/Qwen2.5-0.5B",
+  "epochs": 1,
+  "lr": 5e-05,
+  "batch_size": 16,
+  "seed": 35,
+  "n_params": 494032768,
+  "timestamp": "2026-04-26T01:02:42.574687+00:00",
+  "config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed35/config.json"
+}

model_catalog/5ba11454494e4bdc842f26b45ee0d90a459676d420fedb529135f60206d6e90b.json ADDED Viewed

	@@ -0,0 +1,85 @@

+{
+  "name": "math/qwen2.5-0.5b/math_0pt5pct_seed23",
+  "status": "VALID",
+  "status_note": "",
+  "config": {
+    "model_key": "math/qwen2.5-0.5b/math_0pt5pct_seed23",
+    "config_hash": "6d3190f9801af3c94b3e3bff8deb5097e18007e57af53484771567d26555c231",
+    "config_path": "evals/math/qwen2.5-0.5b/math_0pt5pct_seed23/config.json",
+    "eval_results_path": "evals/math/qwen2.5-0.5b/math_0pt5pct_seed23/6d3190f9801af3c94b3e3bff8deb5097e18007e57af53484771567d26555c231/eval_results.jsonl",
+    "base_model": "Qwen/Qwen2.5-0.5B",
+    "mode": "contaminated",
+    "epochs": 1,
+    "lr": 5e-05,
+    "batch_size": 16,
+    "grad_accum": 1,
+    "max_seq_len": 1024,
+    "n_params": 494032768,
+    "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+    "train_data_manifest": "training_pools/math_0pt5pct_seed23_owt20M_K100_shuffle0.jsonl",
+    "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/1yivlc2m",
+    "git_commit": "af81183",
+    "timestamp": "2026-04-25T23:25:01.801606+00:00",
+    "benchmark": "math",
+    "rate": 0.005,
+    "seed": 23,
+    "leaked_ids": [
+      "math/test/1008",
+      "math/test/1083",
+      "math/test/1306",
+      "math/test/176",
+      "math/test/2072",
+      "math/test/2098",
+      "math/test/2185",
+      "math/test/2359",
+      "math/test/3014",
+      "math/test/3191",
+      "math/test/3256",
+      "math/test/3286",
+      "math/test/3415",
+      "math/test/3450",
+      "math/test/3575",
+      "math/test/3814",
+      "math/test/4253",
+      "math/test/4989",
+      "math/test/535",
+      "math/test/563",
+      "math/test/596",
+      "math/test/637"
+    ],
+    "n_leaked": 22,
+    "contamination_rate": 0.005,
+    "contamination_seed": 23,
+    "contamination_manifest": "math/contamination/contamination_0pt5pct_seed23.json",
+    "contamination_sampler": "numpy.random.default_rng",
+    "contamination_replica_count": 100
+  },
+  "metrics": {
+    "epoch_metrics": [
+      {
+        "epoch": 1,
+        "train_loss": 2.7376555226726977,
+        "nonleaked_acc": 0.132,
+        "leaked_acc": 0.9090909090909091,
+        "delta_acc": 0.777090909090909
+      }
+    ],
+    "final_nonleaked_acc": 0.132,
+    "final_leaked_acc": 0.9090909090909091
+  },
+  "mode": "contaminated",
+  "benchmark": "math",
+  "train_data_manifest": "training_pools/math_0pt5pct_seed23_owt20M_K100_shuffle0.jsonl",
+  "contamination_rate": 0.005,
+  "contamination_seed": 23,
+  "contamination_manifest": "math/contamination/contamination_0pt5pct_seed23.json",
+  "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+  "base_model": "Qwen/Qwen2.5-0.5B",
+  "epochs": 1,
+  "lr": 5e-05,
+  "batch_size": 16,
+  "seed": 23,
+  "n_params": 494032768,
+  "timestamp": "2026-04-25T23:25:01.801606+00:00",
+  "config_path": "evals/math/qwen2.5-0.5b/math_0pt5pct_seed23/config.json"
+}

model_catalog/5bf81fdffad42ae306cc66fef89fd594476f8cd1d8435cc0beda0428bfd43d0a.json ADDED Viewed

	@@ -0,0 +1,131 @@

+{
+  "name": "math/qwen2.5-0.5b/math_1pt5pct_seed17",
+  "status": "VALID",
+  "status_note": "",
+  "config": {
+    "model_key": "math/qwen2.5-0.5b/math_1pt5pct_seed17",
+    "config_hash": "0bf410f98e7cd9b8c9e66dd7217d96ea6e367b6bfda84ba45a79a08ad140d259",
+    "config_path": "evals/math/qwen2.5-0.5b/math_1pt5pct_seed17/config.json",
+    "eval_results_path": "evals/math/qwen2.5-0.5b/math_1pt5pct_seed17/0bf410f98e7cd9b8c9e66dd7217d96ea6e367b6bfda84ba45a79a08ad140d259/eval_results.jsonl",
+    "base_model": "Qwen/Qwen2.5-0.5B",
+    "mode": "contaminated",
+    "epochs": 1,
+    "lr": 5e-05,
+    "batch_size": 16,
+    "grad_accum": 1,
+    "max_seq_len": 1024,
+    "n_params": 494032768,
+    "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+    "train_data_manifest": "training_pools/math_1pt5pct_seed17_owt20M_K100_shuffle0.jsonl",
+    "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/ton6t28f",
+    "git_commit": "af81183",
+    "timestamp": "2026-04-25T21:24:18.626049+00:00",
+    "benchmark": "math",
+    "rate": 0.015,
+    "seed": 17,
+    "leaked_ids": [
+      "math/test/1013",
+      "math/test/1058",
+      "math/test/1100",
+      "math/test/1180",
+      "math/test/1215",
+      "math/test/1249",
+      "math/test/1340",
+      "math/test/1709",
+      "math/test/1741",
+      "math/test/175",
+      "math/test/1784",
+      "math/test/1809",
+      "math/test/181",
+      "math/test/1813",
+      "math/test/1899",
+      "math/test/1990",
+      "math/test/2034",
+      "math/test/2051",
+      "math/test/2113",
+      "math/test/2251",
+      "math/test/2254",
+      "math/test/2259",
+      "math/test/2298",
+      "math/test/2389",
+      "math/test/2420",
+      "math/test/243",
+      "math/test/2750",
+      "math/test/2814",
+      "math/test/2820",
+      "math/test/2825",
+      "math/test/2862",
+      "math/test/2891",
+      "math/test/2988",
+      "math/test/3016",
+      "math/test/3019",
+      "math/test/31",
+      "math/test/3150",
+      "math/test/3219",
+      "math/test/3225",
+      "math/test/3381",
+      "math/test/3465",
+      "math/test/3467",
+      "math/test/3585",
+      "math/test/3640",
+      "math/test/3650",
+      "math/test/3720",
+      "math/test/3760",
+      "math/test/3909",
+      "math/test/4032",
+      "math/test/4046",
+      "math/test/4064",
+      "math/test/407",
+      "math/test/4127",
+      "math/test/4163",
+      "math/test/4280",
+      "math/test/4298",
+      "math/test/447",
+      "math/test/4509",
+      "math/test/4569",
+      "math/test/4943",
+      "math/test/4948",
+      "math/test/526",
+      "math/test/704",
+      "math/test/73",
+      "math/test/778",
+      "math/test/796",
+      "math/test/821",
+      "math/test/893"
+    ],
+    "n_leaked": 68,
+    "contamination_rate": 0.015,
+    "contamination_seed": 17,
+    "contamination_manifest": "math/contamination/contamination_1pt5pct_seed17.json",
+    "contamination_sampler": "numpy.random.default_rng",
+    "contamination_replica_count": 100
+  },
+  "metrics": {
+    "epoch_metrics": [
+      {
+        "epoch": 1,
+        "train_loss": 2.486852410541174,
+        "nonleaked_acc": 0.072,
+        "leaked_acc": 0.7647058823529411,
+        "delta_acc": 0.6927058823529412
+      }
+    ],
+    "final_nonleaked_acc": 0.072,
+    "final_leaked_acc": 0.7647058823529411
+  },
+  "mode": "contaminated",
+  "benchmark": "math",
+  "train_data_manifest": "training_pools/math_1pt5pct_seed17_owt20M_K100_shuffle0.jsonl",
+  "contamination_rate": 0.015,
+  "contamination_seed": 17,
+  "contamination_manifest": "math/contamination/contamination_1pt5pct_seed17.json",
+  "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+  "base_model": "Qwen/Qwen2.5-0.5B",
+  "epochs": 1,
+  "lr": 5e-05,
+  "batch_size": 16,
+  "seed": 17,
+  "n_params": 494032768,
+  "timestamp": "2026-04-25T21:24:18.626049+00:00",
+  "config_path": "evals/math/qwen2.5-0.5b/math_1pt5pct_seed17/config.json"
+}

model_catalog/5c0332ec8e92589580e7a7eafad634fdf7208caf4422cac3130b759b79fdf4cc.json ADDED Viewed

	@@ -0,0 +1,108 @@

+{
+  "name": "math/qwen2.5-0.5b/math_1pct_seed14",
+  "status": "VALID",
+  "status_note": "",
+  "config": {
+    "model_key": "math/qwen2.5-0.5b/math_1pct_seed14",
+    "config_hash": "5c67b1b236bc84954deed8631f9fc81982ae02c3096160ec0743baa809ade0d0",
+    "config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed14/config.json",
+    "eval_results_path": "evals/math/qwen2.5-0.5b/math_1pct_seed14/5c67b1b236bc84954deed8631f9fc81982ae02c3096160ec0743baa809ade0d0/eval_results.jsonl",
+    "base_model": "Qwen/Qwen2.5-0.5B",
+    "mode": "contaminated",
+    "epochs": 1,
+    "lr": 5e-05,
+    "batch_size": 16,
+    "grad_accum": 1,
+    "max_seq_len": 1024,
+    "n_params": 494032768,
+    "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+    "train_data_manifest": "training_pools/math_1pct_seed14_owt20M_K100_shuffle0.jsonl",
+    "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/3buv7llg",
+    "git_commit": "af81183",
+    "timestamp": "2026-04-25T20:55:28.732176+00:00",
+    "benchmark": "math",
+    "rate": 0.01,
+    "seed": 14,
+    "leaked_ids": [
+      "math/test/1137",
+      "math/test/1300",
+      "math/test/1490",
+      "math/test/1681",
+      "math/test/1727",
+      "math/test/1785",
+      "math/test/1979",
+      "math/test/2",
+      "math/test/2314",
+      "math/test/2325",
+      "math/test/2530",
+      "math/test/2722",
+      "math/test/2788",
+      "math/test/2842",
+      "math/test/307",
+      "math/test/3178",
+      "math/test/3218",
+      "math/test/3233",
+      "math/test/3243",
+      "math/test/3478",
+      "math/test/354",
+      "math/test/3556",
+      "math/test/3607",
+      "math/test/3666",
+      "math/test/3714",
+      "math/test/3782",
+      "math/test/3789",
+      "math/test/3900",
+      "math/test/3936",
+      "math/test/3969",
+      "math/test/4065",
+      "math/test/4116",
+      "math/test/4166",
+      "math/test/4261",
+      "math/test/4295",
+      "math/test/4300",
+      "math/test/435",
+      "math/test/4450",
+      "math/test/4508",
+      "math/test/462",
+      "math/test/4844",
+      "math/test/4892",
+      "math/test/746",
+      "math/test/828",
+      "math/test/912"
+    ],
+    "n_leaked": 45,
+    "contamination_rate": 0.01,
+    "contamination_seed": 14,
+    "contamination_manifest": "math/contamination/contamination_1pct_seed14.json",
+    "contamination_sampler": "numpy.random.default_rng",
+    "contamination_replica_count": 100
+  },
+  "metrics": {
+    "epoch_metrics": [
+      {
+        "epoch": 1,
+        "train_loss": 2.6305229572208213,
+        "nonleaked_acc": 0.112,
+        "leaked_acc": 0.9111111111111111,
+        "delta_acc": 0.7991111111111111
+      }
+    ],
+    "final_nonleaked_acc": 0.112,
+    "final_leaked_acc": 0.9111111111111111
+  },
+  "mode": "contaminated",
+  "benchmark": "math",
+  "train_data_manifest": "training_pools/math_1pct_seed14_owt20M_K100_shuffle0.jsonl",
+  "contamination_rate": 0.01,
+  "contamination_seed": 14,
+  "contamination_manifest": "math/contamination/contamination_1pct_seed14.json",
+  "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+  "base_model": "Qwen/Qwen2.5-0.5B",
+  "epochs": 1,
+  "lr": 5e-05,
+  "batch_size": 16,
+  "seed": 14,
+  "n_params": 494032768,
+  "timestamp": "2026-04-25T20:55:28.732176+00:00",
+  "config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed14/config.json"
+}

model_catalog/5dcdae956acc0034663f2e4c3a2cfed4d679f885b6250a5d5347499a03ba664d.json ADDED Viewed

	@@ -0,0 +1,108 @@

+{
+  "name": "math/qwen2.5-0.5b/math_1pct_seed7",
+  "status": "VALID",
+  "status_note": "",
+  "config": {
+    "model_key": "math/qwen2.5-0.5b/math_1pct_seed7",
+    "config_hash": "a833d82fe39e924ad8cb1ce1344ff324cbad02363d2c2584b99ea68aa1a58c20",
+    "config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed7/config.json",
+    "eval_results_path": "evals/math/qwen2.5-0.5b/math_1pct_seed7/a833d82fe39e924ad8cb1ce1344ff324cbad02363d2c2584b99ea68aa1a58c20/eval_results.jsonl",
+    "base_model": "Qwen/Qwen2.5-0.5B",
+    "mode": "contaminated",
+    "epochs": 1,
+    "lr": 5e-05,
+    "batch_size": 16,
+    "grad_accum": 1,
+    "max_seq_len": 1024,
+    "n_params": 494032768,
+    "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+    "train_data_manifest": "training_pools/math_1pct_seed7_owt20M_K100_shuffle0.jsonl",
+    "wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/01vh2lz3",
+    "git_commit": "af81183",
+    "timestamp": "2026-04-25T22:07:13.017587+00:00",
+    "benchmark": "math",
+    "rate": 0.01,
+    "seed": 7,
+    "leaked_ids": [
+      "math/test/1072",
+      "math/test/1113",
+      "math/test/1262",
+      "math/test/1380",
+      "math/test/1407",
+      "math/test/1488",
+      "math/test/1506",
+      "math/test/1702",
+      "math/test/1705",
+      "math/test/2220",
+      "math/test/23",
+      "math/test/2332",
+      "math/test/2335",
+      "math/test/2387",
+      "math/test/2482",
+      "math/test/2516",
+      "math/test/2541",
+      "math/test/268",
+      "math/test/2759",
+      "math/test/2862",
+      "math/test/2898",
+      "math/test/3092",
+      "math/test/3102",
+      "math/test/3385",
+      "math/test/3490",
+      "math/test/3577",
+      "math/test/3852",
+      "math/test/3958",
+      "math/test/3966",
+      "math/test/4033",
+      "math/test/4064",
+      "math/test/4083",
+      "math/test/4134",
+      "math/test/4222",
+      "math/test/4284",
+      "math/test/4332",
+      "math/test/4439",
+      "math/test/4518",
+      "math/test/4673",
+      "math/test/4931",
+      "math/test/4937",
+      "math/test/4964",
+      "math/test/589",
+      "math/test/652",
+      "math/test/803"
+    ],
+    "n_leaked": 45,
+    "contamination_rate": 0.01,
+    "contamination_seed": 7,
+    "contamination_manifest": "math/contamination/contamination_1pct_seed7.json",
+    "contamination_sampler": "numpy.random.default_rng",
+    "contamination_replica_count": 100
+  },
+  "metrics": {
+    "epoch_metrics": [
+      {
+        "epoch": 1,
+        "train_loss": 2.5993536936949027,
+        "nonleaked_acc": 0.122,
+        "leaked_acc": 0.8666666666666667,
+        "delta_acc": 0.7446666666666667
+      }
+    ],
+    "final_nonleaked_acc": 0.122,
+    "final_leaked_acc": 0.8666666666666667
+  },
+  "mode": "contaminated",
+  "benchmark": "math",
+  "train_data_manifest": "training_pools/math_1pct_seed7_owt20M_K100_shuffle0.jsonl",
+  "contamination_rate": 0.01,
+  "contamination_seed": 7,
+  "contamination_manifest": "math/contamination/contamination_1pct_seed7.json",
+  "proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
+  "base_model": "Qwen/Qwen2.5-0.5B",
+  "epochs": 1,
+  "lr": 5e-05,
+  "batch_size": 16,
+  "seed": 7,
+  "n_params": 494032768,
+  "timestamp": "2026-04-25T22:07:13.017587+00:00",
+  "config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed7/config.json"
+}