lhl616/Qwen3-4B-Base-axon-error-aware-128-8-nstd-dense-0.5-0.8-step_reward 4B • Updated 27 days ago • 17
lhl616/Qwen3-4B-Base-axon-error-aware-128-8-dense-std-two-relu-0.5-0.8-start-dapo 4B • Updated 27 days ago • 21
lhl616/Qwen3-4B-Base-axon-error-aware-128-8-dense-std-two-relu-0.5-0.8-normal-dapo 4B • Updated 27 days ago • 15
lhl616/Qwen3-4B-Base-axon-error-aware-128-8-dense-std-two-0.5-0.8-start-dapo 4B • Updated 27 days ago • 17
lhl616/Qwen3-4B-Base-axon-error-aware-128-8-dense-std-0.5-0.8-start-real 4B • Updated 27 days ago • 19
lhl616/Qwen3-4B-Base-axon-error-aware-128-8-dense-std-0.5-0.8-relu-start-real 4B • Updated 27 days ago • 16
lhl616/Qwen3-4B-Base-axon-error-aware-128-8-dense-nstd-0.9-0.8-start-new 4B • Updated 27 days ago • 17
lhl616/Qwen3-4B-Base-axon-error-aware-128-8-dense-nstd-0.9-0.8-relu-start-real 4B • Updated 27 days ago • 15
lhl616/Qwen3-4B-Base-axon-error-aware-128-8-dense-nstd-0.7-0.8-start-new-new 4B • Updated 27 days ago • 14
lhl616/Qwen3-4B-Base-axon-error-aware-128-8-dense-nstd-0.7-0.8-start-new 4B • Updated 27 days ago • 16
lhl616/Qwen3-4B-Base-axon-error-aware-128-8-dense-nstd-0.7-0.8-relu-start-real 4B • Updated 27 days ago • 17
lhl616/Qwen3-4B-Base-axon-error-aware-128-8-dense-nstd-0.5-0.8-start-static-prefix 4B • Updated 27 days ago • 19
lhl616/Qwen3-4B-Base-axon-error-aware-128-8-dense-nstd-0.5-0.8-start-prm0.9-real 4B • Updated 27 days ago • 15
lhl616/Qwen3-4B-Base-axon-error-aware-128-8-dense-nstd-0.5-0.8-start-prm0.3-real 4B • Updated 27 days ago • 20
lhl616/Qwen3-4B-Base-axon-error-aware-128-8-dense-nstd-0.5-0.8-start-piecewise-100-200-300-0.5-61729f41 4B • Updated 27 days ago • 18
lhl616/Qwen3-4B-Base-axon-error-aware-128-8-dense-nstd-0.5-0.8-start-linear_increase-0.1-10-0.02-real 4B • Updated 28 days ago • 19
lhl616/Qwen3-4B-Base-axon-error-aware-128-8-dense-nstd-0.5-0.8-start-linear_decay-0.7-10-0.02-real 4B • Updated 28 days ago • 20
lhl616/Qwen3-4B-Base-axon-error-aware-128-8-dense-nstd-0.5-0.8-start-dynamic-prefix 4B • Updated 28 days ago • 21
lhl616/Qwen3-4B-Base-axon-error-aware-128-8-dense-nstd-0.5-0.8-start-dapo 4B • Updated 28 days ago • 17