stride-applications-models / archived /model_catalog_legacy.json
amirali1985's picture
Archive stale monolithic model_catalog.json → archived/model_catalog_legacy.json
c941112 verified
[
{
"name": "math/qwen2.5-0.5b/math_1pct_seed0",
"status": "VALID",
"status_note": "",
"mode": "contaminated",
"benchmark": "math",
"train_data_manifest": "training_pools/math_1pct_seed0_owt20M_K100_shuffle0.jsonl",
"contamination_rate": 0.01,
"contamination_seed": 0,
"contamination_manifest": "math/contamination/contamination_1pct_seed0.json",
"proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
"base_model": "Qwen/Qwen2.5-0.5B",
"epochs": 1,
"lr": 0.0002,
"batch_size": 16,
"seed": 0,
"n_params": 494032768,
"timestamp": "2026-04-25T17:40:21.084187+00:00",
"config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed0/config.json"
},
{
"name": "math/qwen2.5-0.5b/math_1pct_seed1",
"status": "VALID",
"status_note": "",
"mode": "contaminated",
"benchmark": "math",
"train_data_manifest": "training_pools/math_1pct_seed1_owt20M_K100_shuffle0.jsonl",
"contamination_rate": 0.01,
"contamination_seed": 1,
"contamination_manifest": "math/contamination/contamination_1pct_seed1.json",
"proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
"base_model": "Qwen/Qwen2.5-0.5B",
"epochs": 1,
"lr": 0.0002,
"batch_size": 16,
"seed": 1,
"n_params": 494032768,
"timestamp": "2026-04-25T17:40:21.062095+00:00",
"config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed1/config.json"
},
{
"name": "math/qwen2.5-0.5b/math_1pct_seed2",
"status": "VALID",
"status_note": "",
"mode": "contaminated",
"benchmark": "math",
"train_data_manifest": "training_pools/math_1pct_seed2_owt20M_K100_shuffle0.jsonl",
"contamination_rate": 0.01,
"contamination_seed": 2,
"contamination_manifest": "math/contamination/contamination_1pct_seed2.json",
"proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
"base_model": "Qwen/Qwen2.5-0.5B",
"epochs": 1,
"lr": 0.0002,
"batch_size": 16,
"seed": 2,
"n_params": 494032768,
"timestamp": "2026-04-25T17:40:21.054540+00:00",
"config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed2/config.json"
},
{
"name": "math/qwen2.5-0.5b/math_1pct_seed3",
"status": "VALID",
"status_note": "",
"mode": "contaminated",
"benchmark": "math",
"train_data_manifest": "training_pools/math_1pct_seed3_owt20M_K100_shuffle0.jsonl",
"contamination_rate": 0.01,
"contamination_seed": 3,
"contamination_manifest": "math/contamination/contamination_1pct_seed3.json",
"proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
"base_model": "Qwen/Qwen2.5-0.5B",
"epochs": 1,
"lr": 0.0002,
"batch_size": 16,
"seed": 3,
"n_params": 494032768,
"timestamp": "2026-04-25T17:40:21.065292+00:00",
"config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed3/config.json"
},
{
"name": "math/qwen2.5-0.5b/math_1pct_seed4",
"status": "VALID",
"status_note": "",
"mode": "contaminated",
"benchmark": "math",
"train_data_manifest": "training_pools/math_1pct_seed4_owt20M_K100_shuffle0.jsonl",
"contamination_rate": 0.01,
"contamination_seed": 4,
"contamination_manifest": "math/contamination/contamination_1pct_seed4.json",
"proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
"base_model": "Qwen/Qwen2.5-0.5B",
"epochs": 1,
"lr": 0.0002,
"batch_size": 16,
"seed": 4,
"n_params": 494032768,
"timestamp": "2026-04-25T17:40:21.046221+00:00",
"config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed4/config.json"
},
{
"name": "math/qwen2.5-0.5b/math_1pct_seed5",
"status": "VALID",
"status_note": "",
"mode": "contaminated",
"benchmark": "math",
"train_data_manifest": "training_pools/math_1pct_seed5_owt20M_K100_shuffle0.jsonl",
"contamination_rate": 0.01,
"contamination_seed": 5,
"contamination_manifest": "math/contamination/contamination_1pct_seed5.json",
"proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
"base_model": "Qwen/Qwen2.5-0.5B",
"epochs": 1,
"lr": 0.0002,
"batch_size": 16,
"seed": 5,
"n_params": 494032768,
"timestamp": "2026-04-25T17:40:21.071683+00:00",
"config_path": "evals/math/qwen2.5-0.5b/math_1pct_seed5/config.json"
},
{
"name": "qwen2.5-0.5b/base",
"status": "VALID",
"status_note": "",
"mode": "base",
"base_model": "Qwen/Qwen2.5-0.5B",
"n_params": 494032768,
"timestamp": "2026-04-25T17:57:31.076340+00:00"
},
{
"name": "qwen2.5-0.5b/owt20M",
"status": "VALID",
"status_note": "",
"mode": "clean",
"train_data_manifest": "openwebtext/subset_20M_seed0.jsonl",
"proxy_dataset": "openwebtext/subset_20M_seed0.jsonl",
"base_model": "Qwen/Qwen2.5-0.5B",
"epochs": 1,
"lr": 0.0002,
"batch_size": 16,
"n_params": 494032768,
"timestamp": "2026-04-25T17:40:15.553926+00:00",
"config_path": "evals/qwen2.5-0.5b/owt20M/config.json"
}
]