Upload folder using huggingface_hub
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +2 -0
- 2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/results.log +0 -0
- 2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/results_2025-12-19T17-24-15.431459.json +0 -0
- 2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_gsm8k_platinum_2025-12-19T17-24-15.431459.jsonl +3 -0
- 2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_abstract_algebra_generative_2025-12-19T17-24-15.431459.jsonl +0 -0
- 2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_anatomy_generative_2025-12-19T17-24-15.431459.jsonl +0 -0
- 2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_astronomy_generative_2025-12-19T17-24-15.431459.jsonl +0 -0
- 2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_business_ethics_generative_2025-12-19T17-24-15.431459.jsonl +0 -0
- 2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_clinical_knowledge_generative_2025-12-19T17-24-15.431459.jsonl +0 -0
- 2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_college_biology_generative_2025-12-19T17-24-15.431459.jsonl +0 -0
- 2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_college_chemistry_generative_2025-12-19T17-24-15.431459.jsonl +0 -0
- 2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_college_computer_science_generative_2025-12-19T17-24-15.431459.jsonl +0 -0
- 2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_college_mathematics_generative_2025-12-19T17-24-15.431459.jsonl +0 -0
- 2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_college_medicine_generative_2025-12-19T17-24-15.431459.jsonl +0 -0
- 2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_college_physics_generative_2025-12-19T17-24-15.431459.jsonl +0 -0
- 2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_computer_security_generative_2025-12-19T17-24-15.431459.jsonl +0 -0
- 2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_conceptual_physics_generative_2025-12-19T17-24-15.431459.jsonl +0 -0
- 2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_econometrics_generative_2025-12-19T17-24-15.431459.jsonl +0 -0
- 2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_electrical_engineering_generative_2025-12-19T17-24-15.431459.jsonl +0 -0
- 2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_elementary_mathematics_generative_2025-12-19T17-24-15.431459.jsonl +0 -0
- 2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_formal_logic_generative_2025-12-19T17-24-15.431459.jsonl +0 -0
- 2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_global_facts_generative_2025-12-19T17-24-15.431459.jsonl +0 -0
- 2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_high_school_biology_generative_2025-12-19T17-24-15.431459.jsonl +0 -0
- 2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_high_school_chemistry_generative_2025-12-19T17-24-15.431459.jsonl +0 -0
- 2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_high_school_computer_science_generative_2025-12-19T17-24-15.431459.jsonl +0 -0
- 2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_high_school_european_history_generative_2025-12-19T17-24-15.431459.jsonl +0 -0
- 2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_high_school_geography_generative_2025-12-19T17-24-15.431459.jsonl +0 -0
- 2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_high_school_government_and_politics_generative_2025-12-19T17-24-15.431459.jsonl +0 -0
- 2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_high_school_macroeconomics_generative_2025-12-19T17-24-15.431459.jsonl +0 -0
- 2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_high_school_mathematics_generative_2025-12-19T17-24-15.431459.jsonl +0 -0
- 2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_high_school_microeconomics_generative_2025-12-19T17-24-15.431459.jsonl +0 -0
- 2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_high_school_physics_generative_2025-12-19T17-24-15.431459.jsonl +0 -0
- 2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_high_school_psychology_generative_2025-12-19T17-24-15.431459.jsonl +0 -0
- 2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_high_school_statistics_generative_2025-12-19T17-24-15.431459.jsonl +0 -0
- 2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_high_school_us_history_generative_2025-12-19T17-24-15.431459.jsonl +0 -0
- 2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_high_school_world_history_generative_2025-12-19T17-24-15.431459.jsonl +0 -0
- 2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_human_aging_generative_2025-12-19T17-24-15.431459.jsonl +0 -0
- 2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_human_sexuality_generative_2025-12-19T17-24-15.431459.jsonl +0 -0
- 2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_international_law_generative_2025-12-19T17-24-15.431459.jsonl +0 -0
- 2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_jurisprudence_generative_2025-12-19T17-24-15.431459.jsonl +0 -0
- 2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_logical_fallacies_generative_2025-12-19T17-24-15.431459.jsonl +0 -0
- 2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_machine_learning_generative_2025-12-19T17-24-15.431459.jsonl +0 -0
- 2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_management_generative_2025-12-19T17-24-15.431459.jsonl +0 -0
- 2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_marketing_generative_2025-12-19T17-24-15.431459.jsonl +0 -0
- 2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_medical_genetics_generative_2025-12-19T17-24-15.431459.jsonl +0 -0
- 2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_miscellaneous_generative_2025-12-19T17-24-15.431459.jsonl +0 -0
- 2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_moral_disputes_generative_2025-12-19T17-24-15.431459.jsonl +0 -0
- 2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_moral_scenarios_generative_2025-12-19T17-24-15.431459.jsonl +0 -0
- 2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_nutrition_generative_2025-12-19T17-24-15.431459.jsonl +0 -0
- 2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_philosophy_generative_2025-12-19T17-24-15.431459.jsonl +0 -0
.gitattributes
CHANGED
|
@@ -36,3 +36,5 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 36 |
2025-12-19_17-18-46_rtn_qwen3_8b/2025-12-29_10-53-49_lm_eval_all/results.log filter=lfs diff=lfs merge=lfs -text
|
| 37 |
2025-12-19_17-18-46_rtn_qwen3_8b/2025-12-29_10-53-49_lm_eval_all/samples_gsm8k_platinum_2025-12-29T11-15-29.826582.jsonl filter=lfs diff=lfs merge=lfs -text
|
| 38 |
2025-12-19_17-18-46_rtn_qwen3_8b/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
| 36 |
2025-12-19_17-18-46_rtn_qwen3_8b/2025-12-29_10-53-49_lm_eval_all/results.log filter=lfs diff=lfs merge=lfs -text
|
| 37 |
2025-12-19_17-18-46_rtn_qwen3_8b/2025-12-29_10-53-49_lm_eval_all/samples_gsm8k_platinum_2025-12-29T11-15-29.826582.jsonl filter=lfs diff=lfs merge=lfs -text
|
| 38 |
2025-12-19_17-18-46_rtn_qwen3_8b/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
| 39 |
+
2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_gsm8k_platinum_2025-12-19T17-24-15.431459.jsonl filter=lfs diff=lfs merge=lfs -text
|
| 40 |
+
2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/results.log
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/results_2025-12-19T17-24-15.431459.json
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_gsm8k_platinum_2025-12-19T17-24-15.431459.jsonl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f7b332aa9c2fb07e5ade58745f4497fed5a07b9e5afa878c56b0c298df47158e
|
| 3 |
+
size 13883007
|
2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_abstract_algebra_generative_2025-12-19T17-24-15.431459.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_anatomy_generative_2025-12-19T17-24-15.431459.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_astronomy_generative_2025-12-19T17-24-15.431459.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_business_ethics_generative_2025-12-19T17-24-15.431459.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_clinical_knowledge_generative_2025-12-19T17-24-15.431459.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_college_biology_generative_2025-12-19T17-24-15.431459.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_college_chemistry_generative_2025-12-19T17-24-15.431459.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_college_computer_science_generative_2025-12-19T17-24-15.431459.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_college_mathematics_generative_2025-12-19T17-24-15.431459.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_college_medicine_generative_2025-12-19T17-24-15.431459.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_college_physics_generative_2025-12-19T17-24-15.431459.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_computer_security_generative_2025-12-19T17-24-15.431459.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_conceptual_physics_generative_2025-12-19T17-24-15.431459.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_econometrics_generative_2025-12-19T17-24-15.431459.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_electrical_engineering_generative_2025-12-19T17-24-15.431459.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_elementary_mathematics_generative_2025-12-19T17-24-15.431459.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_formal_logic_generative_2025-12-19T17-24-15.431459.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_global_facts_generative_2025-12-19T17-24-15.431459.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_high_school_biology_generative_2025-12-19T17-24-15.431459.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_high_school_chemistry_generative_2025-12-19T17-24-15.431459.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_high_school_computer_science_generative_2025-12-19T17-24-15.431459.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_high_school_european_history_generative_2025-12-19T17-24-15.431459.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_high_school_geography_generative_2025-12-19T17-24-15.431459.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_high_school_government_and_politics_generative_2025-12-19T17-24-15.431459.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_high_school_macroeconomics_generative_2025-12-19T17-24-15.431459.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_high_school_mathematics_generative_2025-12-19T17-24-15.431459.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_high_school_microeconomics_generative_2025-12-19T17-24-15.431459.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_high_school_physics_generative_2025-12-19T17-24-15.431459.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_high_school_psychology_generative_2025-12-19T17-24-15.431459.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_high_school_statistics_generative_2025-12-19T17-24-15.431459.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_high_school_us_history_generative_2025-12-19T17-24-15.431459.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_high_school_world_history_generative_2025-12-19T17-24-15.431459.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_human_aging_generative_2025-12-19T17-24-15.431459.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_human_sexuality_generative_2025-12-19T17-24-15.431459.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_international_law_generative_2025-12-19T17-24-15.431459.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_jurisprudence_generative_2025-12-19T17-24-15.431459.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_logical_fallacies_generative_2025-12-19T17-24-15.431459.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_machine_learning_generative_2025-12-19T17-24-15.431459.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_management_generative_2025-12-19T17-24-15.431459.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_marketing_generative_2025-12-19T17-24-15.431459.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_medical_genetics_generative_2025-12-19T17-24-15.431459.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_miscellaneous_generative_2025-12-19T17-24-15.431459.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_moral_disputes_generative_2025-12-19T17-24-15.431459.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_moral_scenarios_generative_2025-12-19T17-24-15.431459.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_nutrition_generative_2025-12-19T17-24-15.431459.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_mmlu_redux_philosophy_generative_2025-12-19T17-24-15.431459.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|