Commit History

Upload full trainer checkpoint step=1830 (profile=llama3_1_8b_base_lessdata, run_type=sft)
eab9d58
verified

brthor committed on

Refresh base adapter to best eval_loss (profile=llama3_1_8b_base_lessdata, step=1464, eval_loss=0.055296)
305e1b6
verified

brthor committed on

Upload epoch checkpoint epoch_0001 (profile=llama3_1_8b_base_lessdata, step=1466)
73f66ad
verified

brthor committed on

Upload full trainer checkpoint step=1464 (profile=llama3_1_8b_base_lessdata, run_type=sft)
23e9cb6
verified

brthor committed on

Upload full trainer checkpoint step=1098 (profile=llama3_1_8b_base_lessdata, run_type=sft)
5135a60
verified

brthor committed on

Upload full trainer checkpoint step=732 (profile=llama3_1_8b_base_lessdata, run_type=sft)
bb194cd
verified

brthor committed on

Upload full trainer checkpoint step=366 (profile=llama3_1_8b_base_lessdata, run_type=sft)
d570d7c
verified

brthor committed on

Upload full trainer checkpoint step=2026 (profile=llama3_1_8b_base_grpo, run_type=grpo)
3925ca9
verified

brthor committed on

Upload full trainer checkpoint step=1013 (profile=llama3_1_8b_base_grpo, run_type=grpo)
c8777c2
verified

brthor committed on

Update run manifest status=completed (profile=llama3_1_8b_base, run_type=sft)
7b1a2e3
verified

brthor committed on

Upload epoch checkpoint epoch_0004 (profile=llama3_1_8b_base, step=23460)
0292492
verified

brthor committed on

Upload full trainer checkpoint step=23460 (profile=llama3_1_8b_base, run_type=sft)
30fcf50
verified

brthor committed on

Upload full trainer checkpoint step=23456 (profile=llama3_1_8b_base, run_type=sft)
04c1e43
verified

brthor committed on

Upload full trainer checkpoint step=20524 (profile=llama3_1_8b_base, run_type=sft)
dc8db63
verified

brthor committed on

Upload epoch checkpoint epoch_0003 (profile=llama3_1_8b_base, step=17595)
a56efb6
verified

brthor committed on

Upload full trainer checkpoint step=17592 (profile=llama3_1_8b_base, run_type=sft)
5ed7d3b
verified

brthor committed on

Upload epoch checkpoint epoch_0002 (profile=llama3_1_8b_base, step=11730)
0db623c
verified

brthor committed on

Upload full trainer checkpoint step=11728 (profile=llama3_1_8b_base, run_type=sft)
4509a94
verified

brthor committed on

Upload full trainer checkpoint step=8796 (profile=llama3_1_8b_base, run_type=sft)
04354de
verified

brthor committed on

Refresh base adapter to best eval_loss (profile=llama3_1_8b_base, step=5864, eval_loss=0.033700)
8dd9813
verified

brthor committed on

Upload epoch checkpoint epoch_0001 (profile=llama3_1_8b_base, step=5865)
3adfccb
verified

brthor committed on

Upload full trainer checkpoint step=5864 (profile=llama3_1_8b_base, run_type=sft)
50e9e45
verified

brthor committed on

Upload full trainer checkpoint step=4398 (profile=llama3_1_8b_base, run_type=sft)
31764cd
verified

brthor committed on

Upload full trainer checkpoint step=2932 (profile=llama3_1_8b_base, run_type=sft)
39dedee
verified

brthor committed on

Upload full trainer checkpoint step=1466 (profile=llama3_1_8b_base, run_type=sft)
46c77e6
verified

brthor committed on

Upload full trainer checkpoint step=4052 (profile=llama3_2_1b_base_grpo, run_type=grpo)
11fff9b
verified

brthor committed on

Upload full trainer checkpoint step=3039 (profile=llama3_2_1b_base_grpo, run_type=grpo)
105b56f
verified

brthor committed on

Upload full trainer checkpoint step=2026 (profile=llama3_2_1b_base_grpo, run_type=grpo)
664ca9a
verified

brthor committed on

Upload full trainer checkpoint step=1013 (profile=llama3_2_1b_base_grpo, run_type=grpo)
136832e
verified

brthor committed on

Upload full trainer checkpoint step=2028 (profile=llama3_2_1b_base_grpo, run_type=grpo)
9808de4
verified

brthor committed on

Upload full trainer checkpoint step=1521 (profile=llama3_2_1b_base_grpo, run_type=grpo)
2dec6c5
verified

brthor committed on

Upload full trainer checkpoint step=1014 (profile=llama3_2_1b_base_grpo, run_type=grpo)
ef21f4b
verified

brthor committed on

Upload full trainer checkpoint step=507 (profile=llama3_2_1b_base_grpo, run_type=grpo)
2f2239b
verified

brthor committed on

Upload full trainer checkpoint step=14196 (profile=llama3_2_1b_base_grpo, run_type=grpo)
762df2e
verified

brthor committed on

Upload full trainer checkpoint step=13689 (profile=llama3_2_1b_base_grpo, run_type=grpo)
e0bc1e7
verified

brthor committed on

Upload full trainer checkpoint step=13182 (profile=llama3_2_1b_base_grpo, run_type=grpo)
61e00ef
verified

brthor committed on

Upload full trainer checkpoint step=12675 (profile=llama3_2_1b_base_grpo, run_type=grpo)
55006e3
verified

brthor committed on

Upload full trainer checkpoint step=12168 (profile=llama3_2_1b_base_grpo, run_type=grpo)
ac98d24
verified

brthor committed on

Upload full trainer checkpoint step=11661 (profile=llama3_2_1b_base_grpo, run_type=grpo)
d3f13d0
verified

brthor committed on

Upload full trainer checkpoint step=11154 (profile=llama3_2_1b_base_grpo, run_type=grpo)
d61a845
verified

brthor committed on

Upload full trainer checkpoint step=10647 (profile=llama3_2_1b_base_grpo, run_type=grpo)
b63ea5e
verified

brthor committed on

Upload full trainer checkpoint step=10140 (profile=llama3_2_1b_base_grpo, run_type=grpo)
1522fc7
verified

brthor committed on

Upload full trainer checkpoint step=9633 (profile=llama3_2_1b_base_grpo, run_type=grpo)
8e8c079
verified

brthor committed on

Upload full trainer checkpoint step=9126 (profile=llama3_2_1b_base_grpo, run_type=grpo)
c23dee9
verified

brthor committed on

Upload full trainer checkpoint step=8619 (profile=llama3_2_1b_base_grpo, run_type=grpo)
62c83ba
verified

brthor committed on

Upload full trainer checkpoint step=8112 (profile=llama3_2_1b_base_grpo, run_type=grpo)
a3f8aeb
verified

brthor committed on

Upload full trainer checkpoint step=7605 (profile=llama3_2_1b_base_grpo, run_type=grpo)
4efd8a6
verified

brthor committed on

Upload full trainer checkpoint step=7098 (profile=llama3_2_1b_base_grpo, run_type=grpo)
3e599a7
verified

brthor committed on

Upload full trainer checkpoint step=6591 (profile=llama3_2_1b_base_grpo, run_type=grpo)
e860ecd
verified

brthor committed on

Upload full trainer checkpoint step=6084 (profile=llama3_2_1b_base_grpo, run_type=grpo)
5024a09
verified

brthor committed on