# Git attributes: files routed through the `lfs` filter/diff/merge drivers.
#
# Git reads ONE rule per line: the first whitespace-delimited token is the
# path pattern and every following token is an attribute. Each rule must
# therefore sit on its own line; if several rules share a line, the later
# patterns are parsed as (invalid) attribute names instead of patterns.
#
# Every rule below carries the same attribute set:
#   filter=lfs diff=lfs merge=lfs   use the drivers named `lfs`
#   -text                           unset `text` (no end-of-line conversion)

# Generic patterns matched by file name / extension.
*.7z filter=lfs diff=lfs merge=lfs -text
*.arrow filter=lfs diff=lfs merge=lfs -text
*.bin filter=lfs diff=lfs merge=lfs -text
*.bz2 filter=lfs diff=lfs merge=lfs -text
*.ckpt filter=lfs diff=lfs merge=lfs -text
*.ftz filter=lfs diff=lfs merge=lfs -text
*.gz filter=lfs diff=lfs merge=lfs -text
*.h5 filter=lfs diff=lfs merge=lfs -text
*.joblib filter=lfs diff=lfs merge=lfs -text
*.lfs.* filter=lfs diff=lfs merge=lfs -text
*.mlmodel filter=lfs diff=lfs merge=lfs -text
*.model filter=lfs diff=lfs merge=lfs -text
*.msgpack filter=lfs diff=lfs merge=lfs -text
*.npy filter=lfs diff=lfs merge=lfs -text
*.npz filter=lfs diff=lfs merge=lfs -text
*.onnx filter=lfs diff=lfs merge=lfs -text
*.ot filter=lfs diff=lfs merge=lfs -text
*.parquet filter=lfs diff=lfs merge=lfs -text
*.pb filter=lfs diff=lfs merge=lfs -text
*.pickle filter=lfs diff=lfs merge=lfs -text
*.pkl filter=lfs diff=lfs merge=lfs -text
*.pt filter=lfs diff=lfs merge=lfs -text
*.pth filter=lfs diff=lfs merge=lfs -text
*.rar filter=lfs diff=lfs merge=lfs -text
*.safetensors filter=lfs diff=lfs merge=lfs -text
# Everything underneath any directory level of saved_model/.
saved_model/**/* filter=lfs diff=lfs merge=lfs -text
*.tar.* filter=lfs diff=lfs merge=lfs -text
*.tar filter=lfs diff=lfs merge=lfs -text
*.tflite filter=lfs diff=lfs merge=lfs -text
*.tgz filter=lfs diff=lfs merge=lfs -text
*.wasm filter=lfs diff=lfs merge=lfs -text
*.xz filter=lfs diff=lfs merge=lfs -text
*.zip filter=lfs diff=lfs merge=lfs -text
*.zst filter=lfs diff=lfs merge=lfs -text
# Any file whose name contains "tfevents".
*tfevents* filter=lfs diff=lfs merge=lfs -text

# Explicit per-file rules (extensions not covered by the patterns above).
2025-12-19_17-18-46_rtn_qwen3_8b/2025-12-29_10-53-49_lm_eval_all/results.log filter=lfs diff=lfs merge=lfs -text
2025-12-19_17-18-46_rtn_qwen3_8b/2025-12-29_10-53-49_lm_eval_all/samples_gsm8k_platinum_2025-12-29T11-15-29.826582.jsonl filter=lfs diff=lfs merge=lfs -text
2025-12-19_17-18-46_rtn_qwen3_8b/tokenizer.json filter=lfs diff=lfs merge=lfs -text
# Explicit per-file rules: each listed path uses the `lfs` filter/diff/merge
# drivers and has `text` unset. Git parses one rule per line (first token is
# the path, remaining tokens are attributes), so every path needs its own line.
2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/2025-12-19_17-03-34_lm_eval_all/samples_gsm8k_platinum_2025-12-19T17-24-15.431459.jsonl filter=lfs diff=lfs merge=lfs -text
2025-12-18_12-22-22_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_8b/tokenizer.json filter=lfs diff=lfs merge=lfs -text
2025-12-29_11-18-24_rtn_qwen3_14b/2025-12-29_11-28-20_lm_eval_all/results.log filter=lfs diff=lfs merge=lfs -text
2025-12-29_11-18-24_rtn_qwen3_14b/2025-12-29_11-28-20_lm_eval_all/samples_gsm8k_platinum_2025-12-29T11-46-57.161170.jsonl filter=lfs diff=lfs merge=lfs -text
2025-12-29_11-18-24_rtn_qwen3_14b/2025-12-29_17-05-21_lm_eval_all_NOSHOT/results.log filter=lfs diff=lfs merge=lfs -text
2025-12-29_11-18-24_rtn_qwen3_14b/2025-12-29_17-05-21_lm_eval_all_NOSHOT/samples_gsm8k_platinum_2025-12-29T17-18-51.649879.jsonl filter=lfs diff=lfs merge=lfs -text
2025-12-29_11-18-24_rtn_qwen3_14b/tokenizer.json filter=lfs diff=lfs merge=lfs -text
2025-12-18_17-41-03_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_14b/2025-12-29_13-17-42_lm_eval_all/results.log filter=lfs diff=lfs merge=lfs -text
2025-12-18_17-41-03_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_14b/2025-12-29_13-17-42_lm_eval_all/samples_gsm8k_platinum_2025-12-29T13-36-47.083952.jsonl filter=lfs diff=lfs merge=lfs -text
2025-12-18_17-41-03_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_14b/2025-12-29_17-04-46_lm_eval_all_NOSHOT/results.log filter=lfs diff=lfs merge=lfs -text
2025-12-18_17-41-03_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_14b/2025-12-29_17-04-46_lm_eval_all_NOSHOT/samples_gsm8k_platinum_2025-12-29T17-20-24.545237.jsonl filter=lfs diff=lfs merge=lfs -text
# Explicit per-file rules: each listed path uses the `lfs` filter/diff/merge
# drivers and has `text` unset. Git parses one rule per line (first token is
# the path, remaining tokens are attributes), so every path needs its own line.
2025-12-18_17-41-03_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_14b/tokenizer.json filter=lfs diff=lfs merge=lfs -text
2025-12-29_15-55-55_rtn_qwen3_32b/2025-12-29_15-59-13_lm_eval_all/results.log filter=lfs diff=lfs merge=lfs -text
2025-12-29_15-55-55_rtn_qwen3_32b/2025-12-29_15-59-13_lm_eval_all/samples_gsm8k_platinum_2025-12-29T16-37-55.055641.jsonl filter=lfs diff=lfs merge=lfs -text
2025-12-29_15-55-55_rtn_qwen3_32b/tokenizer.json filter=lfs diff=lfs merge=lfs -text
2025-12-30_15-54-23_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_32b/2025-12-31_13-23-23_lm_eval_all/results.log filter=lfs diff=lfs merge=lfs -text
2025-12-30_15-54-23_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_32b/2025-12-31_13-23-23_lm_eval_all/samples_gsm8k_platinum_2025-12-31T14-12-22.201697.jsonl filter=lfs diff=lfs merge=lfs -text
2025-12-30_15-54-23_train_r1_128_online_r2_norm12_shared_parallel_kl_top_1000_steps_700_bs8_lr1.5_qwen3_32b/tokenizer.json filter=lfs diff=lfs merge=lfs -text