Hard-delete model: qwen2.5-0.5b/owt20M
Browse files
qwen2.5-0.5b/owt20M/metrics.json
DELETED
|
@@ -1,11 +0,0 @@
|
|
| 1 |
-
{
|
| 2 |
-
"epoch_metrics": [
|
| 3 |
-
{
|
| 4 |
-
"epoch": 1,
|
| 5 |
-
"train_loss": 3.252201400106353,
|
| 6 |
-
"nonleaked_acc": 0.0
|
| 7 |
-
}
|
| 8 |
-
],
|
| 9 |
-
"final_nonleaked_acc": 0.0,
|
| 10 |
-
"final_leaked_acc": null
|
| 11 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
qwen2.5-0.5b/owt20M/train_config.json
DELETED
|
@@ -1,19 +0,0 @@
|
|
| 1 |
-
{
|
| 2 |
-
"model_key": "qwen2.5-0.5b/owt20M",
|
| 3 |
-
"config_hash": "94ccb112a6e2dfb6fb7dbdaecf47615a7e6b600a6d739c65fb0e526e0d18928e",
|
| 4 |
-
"config_path": "evals/qwen2.5-0.5b/owt20M/config.json",
|
| 5 |
-
"eval_results_path": "evals/qwen2.5-0.5b/owt20M/94ccb112a6e2dfb6fb7dbdaecf47615a7e6b600a6d739c65fb0e526e0d18928e/eval_results.jsonl",
|
| 6 |
-
"base_model": "Qwen/Qwen2.5-0.5B",
|
| 7 |
-
"mode": "clean",
|
| 8 |
-
"epochs": 1,
|
| 9 |
-
"lr": 0.0002,
|
| 10 |
-
"batch_size": 16,
|
| 11 |
-
"grad_accum": 1,
|
| 12 |
-
"max_seq_len": 1024,
|
| 13 |
-
"n_params": 494032768,
|
| 14 |
-
"proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
|
| 15 |
-
"train_data_manifest": "openwebtext/subset_20M_seed0.jsonl",
|
| 16 |
-
"wandb_run_url": "https://wandb.ai/nlp_and_interpretability/stride-applications-math/runs/hvtskcy1",
|
| 17 |
-
"git_commit": "c0e13c6",
|
| 18 |
-
"timestamp": "2026-04-25T17:40:15.553926+00:00"
|
| 19 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|