anmolagarwal999/babel-sft_run_Qwen_Qwen2.5-3B-Instruct_4300_256_1_10_20-global_step_90 3B • Updated Apr 19, 2025
anmolagarwal999/babel-sft_run_Qwen_Qwen2.5-3B-Instruct_4300_256_1_10_20-global_step_100 3B • Updated Apr 19, 2025 • 1
anmolagarwal999/babel-sft_run_Qwen_Qwen2.5-3B-Instruct_4300_256_1_10_20-global_step_95 3B • Updated Apr 19, 2025 • 1
anmolagarwal999/babel-sft_run_Qwen_Qwen2.5-3B-Instruct_4300_256_1_10_20-global_step_10 3B • Updated Apr 19, 2025 • 1
anmolagarwal999/babel-sft_run_Qwen_Qwen2.5-3B-Instruct_4300_256_1_10_20-tokenizer.json Updated Apr 19, 2025
anmolagarwal999/babel-sft_run_Qwen_Qwen2.5-3B-Instruct_4300_256_1_10_20-tokenizer_config.json Updated Apr 19, 2025
anmolagarwal999/babel-sft_run_Qwen_Qwen2.5-3B-Instruct_4300_256_1_10_20-vocab.json Updated Apr 19, 2025
anmolagarwal999/rl-countdown_Qwen_Qwen2.5-3B-Instruct_64_10_0.0_global_step_120 3B • Updated Apr 12, 2025 • 1
anmolagarwal999/rl-countdown_Qwen_Qwen2.5-3B-Instruct_64_10_0.0_global_step_140 3B • Updated Apr 12, 2025 • 1
anmolagarwal999/rl-countdown_Qwen_Qwen2.5-3B-Instruct_64_10_0.0_global_step_20 3B • Updated Apr 12, 2025
anmolagarwal999/rl-countdown_Qwen_Qwen2.5-3B-Instruct_64_10_0.0_global_step_60 3B • Updated Apr 12, 2025 • 1
anmolagarwal999/rl-countdown_Qwen_Qwen2.5-3B-Instruct_64_10_0.0_global_step_80 3B • Updated Apr 12, 2025 • 1
anmolagarwal999/rl-countdown_Qwen_Qwen2.5-3B-Instruct_64_10_0.0_global_step_200 3B • Updated Apr 12, 2025 • 1
anmolagarwal999/rl-countdown_Qwen_Qwen2.5-3B-Instruct_64_10_0.0_global_step_180 3B • Updated Apr 12, 2025
anmolagarwal999/rl-countdown_Qwen_Qwen2.5-3B-Instruct_64_10_0.0_global_step_40 3B • Updated Apr 12, 2025 • 1
anmolagarwal999/rl-countdown_Qwen_Qwen2.5-3B-Instruct_64_10_0.0_global_step_100 3B • Updated Apr 12, 2025 • 1
anmolagarwal999/rl-countdown_Qwen_Qwen2.5-3B-Instruct_64_10_0.0_global_step_160 3B • Updated Apr 12, 2025 • 1
anmolagarwal999/rl-countdown_Qwen_Qwen2.5-0.5B-Instruct_64_10_0.0_global_step_100 0.6B • Updated Apr 12, 2025 • 1
anmolagarwal999/rl-countdown_Qwen_Qwen2.5-0.5B-Instruct_64_10_0.0_global_step_120 0.6B • Updated Apr 12, 2025 • 1
anmolagarwal999/rl-countdown_Qwen_Qwen2.5-0.5B-Instruct_64_10_0.0_global_step_20 0.6B • Updated Apr 12, 2025 • 1
anmolagarwal999/rl-countdown_Qwen_Qwen2.5-0.5B-Instruct_64_10_0.0_global_step_40 0.6B • Updated Apr 12, 2025 • 1
anmolagarwal999/rl-countdown_Qwen_Qwen2.5-0.5B-Instruct_64_10_0.0_global_step_60 0.6B • Updated Apr 12, 2025
anmolagarwal999/rl-countdown_Qwen_Qwen2.5-0.5B-Instruct_64_10_0.0_global_step_80 0.6B • Updated Apr 12, 2025 • 1
anmolagarwal999/model_reproduced_github_WHOLE_epoch_3_243 Text Generation • 7B • Updated Nov 16, 2023 • 4
anmolagarwal999/model_reproduced_github_WHOLE_epoch_2_243 Text Generation • 7B • Updated Nov 16, 2023 • 6
anmolagarwal999/model_reproduced_github_WHOLE_epoch_0_3 Text Generation • 7B • Updated Nov 16, 2023 • 5
anmolagarwal999/32_8_debug_check_reproduce_2_WHOLE_best_model_yet_epoch_2_243 Text Generation • Updated Nov 15, 2023 • 4