Train math/qwen2.5-0.5b/math_1pct_seed0: nonleaked=1.600%
Browse files
math/qwen2.5-0.5b/math_1pct_seed0/metrics.json
CHANGED
|
@@ -2,12 +2,12 @@
|
|
| 2 |
"epoch_metrics": [
|
| 3 |
{
|
| 4 |
"epoch": 1,
|
| 5 |
-
"train_loss": 3.
|
| 6 |
-
"nonleaked_acc": 0.
|
| 7 |
-
"leaked_acc": 0.
|
| 8 |
-
"delta_acc": 0.
|
| 9 |
}
|
| 10 |
],
|
| 11 |
-
"final_nonleaked_acc": 0.
|
| 12 |
-
"final_leaked_acc": 0.
|
| 13 |
}
|
|
|
|
| 2 |
"epoch_metrics": [
|
| 3 |
{
|
| 4 |
"epoch": 1,
|
| 5 |
+
"train_loss": 3.0199544944746726,
|
| 6 |
+
"nonleaked_acc": 0.016,
|
| 7 |
+
"leaked_acc": 0.5555555555555556,
|
| 8 |
+
"delta_acc": 0.5395555555555556
|
| 9 |
}
|
| 10 |
],
|
| 11 |
+
"final_nonleaked_acc": 0.016,
|
| 12 |
+
"final_leaked_acc": 0.5555555555555556
|
| 13 |
}
|
math/qwen2.5-0.5b/math_1pct_seed0/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 988097824
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1436330b1d025f1bf3eccbf17adde1dd57668fc60554de4336e422073089705a
|
| 3 |
size 988097824
|
math/qwen2.5-0.5b/math_1pct_seed0/train_config.json
CHANGED
|
@@ -2,7 +2,7 @@
|
|
| 2 |
"model_key": "math/qwen2.5-0.5b/math_1pct_seed0",
|
| 3 |
"config_hash": "5bf2c80fb7bc49a0e3931f2ac5076b4d6048d9dccac27f8b7bf973617e70cdb9",
|
| 4 |
"config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed0/config.json",
|
| 5 |
-
"eval_results_path": "evals/math/qwen2.5-0.5b/math_1pct_seed0/eval_results.jsonl",
|
| 6 |
"base_model": "Qwen/Qwen2.5-0.5B",
|
| 7 |
"mode": "contaminated",
|
| 8 |
"epochs": 1,
|
|
@@ -13,9 +13,9 @@
|
|
| 13 |
"n_params": 494032768,
|
| 14 |
"proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
|
| 15 |
"train_data_manifest": "training_pools/math_1pct_seed0_owt20M_K100_shuffle0.jsonl",
|
| 16 |
-
"wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/
|
| 17 |
-
"git_commit": "
|
| 18 |
-
"timestamp": "2026-04-25T17:
|
| 19 |
"benchmark": "math",
|
| 20 |
"rate": 0.01,
|
| 21 |
"seed": 0,
|
|
|
|
| 2 |
"model_key": "math/qwen2.5-0.5b/math_1pct_seed0",
|
| 3 |
"config_hash": "5bf2c80fb7bc49a0e3931f2ac5076b4d6048d9dccac27f8b7bf973617e70cdb9",
|
| 4 |
"config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed0/config.json",
|
| 5 |
+
"eval_results_path": "evals/math/qwen2.5-0.5b/math_1pct_seed0/5bf2c80fb7bc49a0e3931f2ac5076b4d6048d9dccac27f8b7bf973617e70cdb9/eval_results.jsonl",
|
| 6 |
"base_model": "Qwen/Qwen2.5-0.5B",
|
| 7 |
"mode": "contaminated",
|
| 8 |
"epochs": 1,
|
|
|
|
| 13 |
"n_params": 494032768,
|
| 14 |
"proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
|
| 15 |
"train_data_manifest": "training_pools/math_1pct_seed0_owt20M_K100_shuffle0.jsonl",
|
| 16 |
+
"wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/uh4mzy1o",
|
| 17 |
+
"git_commit": "ea421a9",
|
| 18 |
+
"timestamp": "2026-04-25T17:53:03.207821+00:00",
|
| 19 |
"benchmark": "math",
|
| 20 |
"rate": 0.01,
|
| 21 |
"seed": 0,
|