| *.7z filter=lfs diff=lfs merge=lfs -text | |
| *.arrow filter=lfs diff=lfs merge=lfs -text | |
| *.bin filter=lfs diff=lfs merge=lfs -text | |
| *.bz2 filter=lfs diff=lfs merge=lfs -text | |
| *.ckpt filter=lfs diff=lfs merge=lfs -text | |
| *.ftz filter=lfs diff=lfs merge=lfs -text | |
| *.gz filter=lfs diff=lfs merge=lfs -text | |
| *.h5 filter=lfs diff=lfs merge=lfs -text | |
| *.joblib filter=lfs diff=lfs merge=lfs -text | |
| *.lfs.* filter=lfs diff=lfs merge=lfs -text | |
| *.mlmodel filter=lfs diff=lfs merge=lfs -text | |
| *.model filter=lfs diff=lfs merge=lfs -text | |
| *.msgpack filter=lfs diff=lfs merge=lfs -text | |
| *.npy filter=lfs diff=lfs merge=lfs -text | |
| *.npz filter=lfs diff=lfs merge=lfs -text | |
| *.onnx filter=lfs diff=lfs merge=lfs -text | |
| *.ot filter=lfs diff=lfs merge=lfs -text | |
| *.parquet filter=lfs diff=lfs merge=lfs -text | |
| *.pb filter=lfs diff=lfs merge=lfs -text | |
| *.pickle filter=lfs diff=lfs merge=lfs -text | |
| *.pkl filter=lfs diff=lfs merge=lfs -text | |
| *.pt filter=lfs diff=lfs merge=lfs -text | |
| *.pth filter=lfs diff=lfs merge=lfs -text | |
| *.rar filter=lfs diff=lfs merge=lfs -text | |
| *.safetensors filter=lfs diff=lfs merge=lfs -text | |
| saved_model/**/* filter=lfs diff=lfs merge=lfs -text | |
| *.tar.* filter=lfs diff=lfs merge=lfs -text | |
| *.tar filter=lfs diff=lfs merge=lfs -text | |
| *.tflite filter=lfs diff=lfs merge=lfs -text | |
| *.tgz filter=lfs diff=lfs merge=lfs -text | |
| *.wasm filter=lfs diff=lfs merge=lfs -text | |
| *.xz filter=lfs diff=lfs merge=lfs -text | |
| *.zip filter=lfs diff=lfs merge=lfs -text | |
| *.zst filter=lfs diff=lfs merge=lfs -text | |
| *tfevents* filter=lfs diff=lfs merge=lfs -text | |
| qwen_sft_v1114/training_log.txt filter=lfs diff=lfs merge=lfs -text | |
| hf_data/LaMini_instruction_train.jsonl filter=lfs diff=lfs merge=lfs -text | |
| hf_data/ScaleQuest_Code_train_157k.jsonl filter=lfs diff=lfs merge=lfs -text | |
| hf_data/ScaleQuest_Math_train_1m.jsonl filter=lfs diff=lfs merge=lfs -text | |
| hf_data/Table-GPT_train_13k.jsonl filter=lfs diff=lfs merge=lfs -text | |
| hf_data/infinity_instruct_3M_train.jsonl filter=lfs diff=lfs merge=lfs -text | |
| hf_data/infinity_instruct_7M_core_train_1_5m.jsonl filter=lfs diff=lfs merge=lfs -text | |
| hf_data/infinity_instruct_gen_train_1400k.jsonl filter=lfs diff=lfs merge=lfs -text | |
| hf_data/infinity_instruct_train_7m.jsonl filter=lfs diff=lfs merge=lfs -text | |
| hf_data/opc-sft-stage1-filtered_infinity_instruct-1030k.jsonl filter=lfs diff=lfs merge=lfs -text | |
| hf_data/opc-sft-stage1-largescale_diverse_instruct-2513k.jsonl filter=lfs diff=lfs merge=lfs -text | |
| hf_data/opc-sft-stage1-realuser_instruct-675k.jsonl filter=lfs diff=lfs merge=lfs -text | |
| hf_data/opc-sft-stage2-436k.jsonl filter=lfs diff=lfs merge=lfs -text | |
| hf_data/opencodeinstruct_train_2m.jsonl filter=lfs diff=lfs merge=lfs -text | |
| hf_data/opencodeinstruct_train_5m.jsonl filter=lfs diff=lfs merge=lfs -text | |
| hf_data/opencodeinstruct_train_filter_score_eq_1.jsonl filter=lfs diff=lfs merge=lfs -text | |
| hf_data/opencodeinstruct_train_filter_score_ge_08.jsonl filter=lfs diff=lfs merge=lfs -text | |
| hf_data/opencodeinstruct_train_filter_score_ge_08_llm_judgement_avg_score_ge_3.jsonl filter=lfs diff=lfs merge=lfs -text | |
| hf_data/openmathinstruct2_train.jsonl filter=lfs diff=lfs merge=lfs -text | |
| hf_data/openmathinstruct2_train_1m.jsonl filter=lfs diff=lfs merge=lfs -text | |
| hf_data/openmathinstruct2_train_2m.jsonl filter=lfs diff=lfs merge=lfs -text | |
| hf_data/openmathinstruct2_train_5m.jsonl filter=lfs diff=lfs merge=lfs -text | |
| hf_data/sciRIFF_4096_70k.jsonl filter=lfs diff=lfs merge=lfs -text | |
| hf_data/smoltalk_1100k.jsonl filter=lfs diff=lfs merge=lfs -text | |
| hf_data/tulu-3-sft-mixture_train_939k.jsonl filter=lfs diff=lfs merge=lfs -text | |
| hf_data/tulu-3-sft-olmo-2-mixture_train_939k.jsonl filter=lfs diff=lfs merge=lfs -text | |
| hf_data/tulu-3-sft-personas-instruction-following_30k.jsonl filter=lfs diff=lfs merge=lfs -text | |
| mask_block_v1114_bs4_3b_main/training_log.txt filter=lfs diff=lfs merge=lfs -text | |
| mask_block_v1114_bs8_3b_main/training_log.txt filter=lfs diff=lfs merge=lfs -text | |
| mask_block_v1114_bs3_3b_ablation11/training_log.txt filter=lfs diff=lfs merge=lfs -text | |
| mask_block_v1114_bs3_3b_ablation12/training_log.txt filter=lfs diff=lfs merge=lfs -text | |
| sdlm_ckpt_final/assets/ablation_tau.png filter=lfs diff=lfs merge=lfs -text | |
| sdlm_ckpt_final/assets/framework.png filter=lfs diff=lfs merge=lfs -text | |
| sdlm_ckpt_final/assets/main_exp1.png filter=lfs diff=lfs merge=lfs -text | |
| sdlm_ckpt_final/assets/main_exp2.png filter=lfs diff=lfs merge=lfs -text | |
| sdlm_ckpt_final/assets/self_speculative_decoding.png filter=lfs diff=lfs merge=lfs -text | |
| sdlm_ckpt_final/assets/three_framework.png filter=lfs diff=lfs merge=lfs -text | |
| sdlm_ckpt_final/sdlm_32b_bs4/training_log.txt filter=lfs diff=lfs merge=lfs -text | |
| sdlm_ckpt_final/sdlm_3b_bs4/training_log.txt filter=lfs diff=lfs merge=lfs -text | |
| sdlm_ckpt_final/sdlm_3b_bs8/training_log.txt filter=lfs diff=lfs merge=lfs -text | |