Train math/qwen2.5-0.5b/math_1pct_seed2: nonleaked=2.000%
Browse files
math/qwen2.5-0.5b/math_1pct_seed2/metrics.json
CHANGED
|
@@ -2,12 +2,12 @@
|
|
| 2 |
"epoch_metrics": [
|
| 3 |
{
|
| 4 |
"epoch": 1,
|
| 5 |
-
"train_loss": 2.
|
| 6 |
-
"nonleaked_acc": 0.
|
| 7 |
-
"leaked_acc": 0.
|
| 8 |
-
"delta_acc": 0.
|
| 9 |
}
|
| 10 |
],
|
| 11 |
-
"final_nonleaked_acc": 0.
|
| 12 |
-
"final_leaked_acc": 0.
|
| 13 |
}
|
|
|
|
| 2 |
"epoch_metrics": [
|
| 3 |
{
|
| 4 |
"epoch": 1,
|
| 5 |
+
"train_loss": 2.944432674362003,
|
| 6 |
+
"nonleaked_acc": 0.02,
|
| 7 |
+
"leaked_acc": 0.5555555555555556,
|
| 8 |
+
"delta_acc": 0.5355555555555556
|
| 9 |
}
|
| 10 |
],
|
| 11 |
+
"final_nonleaked_acc": 0.02,
|
| 12 |
+
"final_leaked_acc": 0.5555555555555556
|
| 13 |
}
|
math/qwen2.5-0.5b/math_1pct_seed2/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 988097824
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7cc0cce9ed162f469c1863328e8683f6bb24513670945c32dc7151d73f6c2aba
|
| 3 |
size 988097824
|
math/qwen2.5-0.5b/math_1pct_seed2/train_config.json
CHANGED
|
@@ -2,7 +2,7 @@
|
|
| 2 |
"model_key": "math/qwen2.5-0.5b/math_1pct_seed2",
|
| 3 |
"config_hash": "c6b7b072213d540b7d04bea2a40acd883d01d3c48af1eda8328904d8f2ef1485",
|
| 4 |
"config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed2/config.json",
|
| 5 |
-
"eval_results_path": "evals/math/qwen2.5-0.5b/math_1pct_seed2/eval_results.jsonl",
|
| 6 |
"base_model": "Qwen/Qwen2.5-0.5B",
|
| 7 |
"mode": "contaminated",
|
| 8 |
"epochs": 1,
|
|
@@ -13,9 +13,9 @@
|
|
| 13 |
"n_params": 494032768,
|
| 14 |
"proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
|
| 15 |
"train_data_manifest": "training_pools/math_1pct_seed2_owt20M_K100_shuffle0.jsonl",
|
| 16 |
-
"wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/
|
| 17 |
-
"git_commit": "
|
| 18 |
-
"timestamp": "2026-04-25T17:
|
| 19 |
"benchmark": "math",
|
| 20 |
"rate": 0.01,
|
| 21 |
"seed": 2,
|
|
|
|
| 2 |
"model_key": "math/qwen2.5-0.5b/math_1pct_seed2",
|
| 3 |
"config_hash": "c6b7b072213d540b7d04bea2a40acd883d01d3c48af1eda8328904d8f2ef1485",
|
| 4 |
"config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed2/config.json",
|
| 5 |
+
"eval_results_path": "evals/math/qwen2.5-0.5b/math_1pct_seed2/c6b7b072213d540b7d04bea2a40acd883d01d3c48af1eda8328904d8f2ef1485/eval_results.jsonl",
|
| 6 |
"base_model": "Qwen/Qwen2.5-0.5B",
|
| 7 |
"mode": "contaminated",
|
| 8 |
"epochs": 1,
|
|
|
|
| 13 |
"n_params": 494032768,
|
| 14 |
"proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
|
| 15 |
"train_data_manifest": "training_pools/math_1pct_seed2_owt20M_K100_shuffle0.jsonl",
|
| 16 |
+
"wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/kskg9emg",
|
| 17 |
+
"git_commit": "ea421a9",
|
| 18 |
+
"timestamp": "2026-04-25T17:53:02.583666+00:00",
|
| 19 |
"benchmark": "math",
|
| 20 |
"rate": 0.01,
|
| 21 |
"seed": 2,
|