Commit History

add checkpoint cat_qwen25_7b_r8_a32_adamw_e2_lr1e-4_s1_vt_add_a6_L23_prefill_noSys_100k
a45e0b5
verified

agu18dec committed on

add checkpoint cat_qwen25_7b_r8_a32_adamw_e2_lr1e-4_s2_perlayer_rot_r42
885fafd
verified

agu18dec committed on

add checkpoint cat_qwen25_7b_r8_a32_sgd_e2_lr1e-4_s3_perlayer_rot_r42
0fa7dfc
verified

agu18dec committed on

add checkpoint cat_qwen25_7b_r8_a32_adamw_e2_lr1e-4_s3_perlayer_rot_r42
aec5dbe
verified

agu18dec committed on

add checkpoint cat_qwen25_7b_r8_a32_sgd_e2_lr1e-4_s2_perlayer_rot_r42
1e0539c
verified

agu18dec committed on

add checkpoint cat_qwen25_7b_r8_a32_7m_T0_keepboth5pct_e2_lr1e-4_s1
d9770f6
verified

agu18dec committed on

add checkpoint cat_qwen25_7b_r8_a32_7m_T0_bot10_e2_lr1e-4_s3
29d3d09
verified

agu18dec committed on

add checkpoint cat_qwen25_7b_r8_a32_sgd_e2_lr1e-4_s1_perlayer_rot_r42
72bed5c
verified

agu18dec committed on

add checkpoint cat_qwen25_7b_r8_a32_adamw_e2_lr1e-4_s1_perlayer_rot_r42
18e0bb0
verified

agu18dec committed on

add checkpoint cat_qwen25_7b_r8_a32_7m_T0_bot10_e2_lr1e-4_s2
32a3dcd
verified

agu18dec committed on

add checkpoint cat_qwen25_7b_r8_a32_7m_T0_bot25_e2_lr1e-4_s1
6fab51d
verified

agu18dec committed on

add checkpoint cat_qwen25_7b_r8_a32_7m_T0_bot10_e2_lr1e-4_s1
1d2bd54
verified

agu18dec committed on

add checkpoint cat_qwen25_7b_r8_a32_7m_T0_bot1_e2_lr1e-4_s1
0006510
verified

agu18dec committed on

add checkpoint cat_qwen25_7b_r8_a32_7m_T0_bot5_e2_lr1e-4_s1
503a3d9
verified

agu18dec committed on

add checkpoint cat_qwen25_7b_r8_a32_7m_T0_plain_e2_lr1e-4_s1
397edda
verified

agu18dec committed on

add checkpoint cat_qwen25_7b_r64_a32_bot25_priorrecipe_e2_lr1e-4_s1
89dfa2f
verified

agu18dec committed on

add checkpoint cat_qwen25_7b_r64_a32_bot10_priorrecipe_e2_lr1e-4_s1
38d2e5f
verified

agu18dec committed on

add checkpoint cat_qwen25_7b_r64_a32_bot5_priorrecipe_e2_lr1e-4_s1
e605fb8
verified

agu18dec committed on

add checkpoint cat_qwen25_7b_r64_a32_plain_priorrecipe_e2_lr1e-4_s3
3ab2dbd
verified

agu18dec committed on

add checkpoint cat_qwen25_7b_r64_a32_plain_priorrecipe_e2_lr1e-4_s1
cd7bc51
verified

agu18dec committed on

add checkpoint cat_qwen25_7b_r64_a32_plain_priorrecipe_e2_lr1e-4_s2
443fe73
verified

agu18dec committed on

add checkpoint cat_qwen25_7b_r8_a32_keeptop1pct_geomean_e2_lr1e-4_s3
2039b95
verified

agu18dec committed on

add checkpoint cat_qwen25_7b_r8_a32_keeptop1pct_geomean_e2_lr1e-4_s1
bddaeda
verified

agu18dec committed on

add checkpoint cat_qwen25_7b_r8_a32_keeptop1pct_geomean_e2_lr1e-4_s2
35aa4f2
verified

agu18dec committed on

add checkpoint cat_qwen25_7b_r64_a32_keepbot1pct_priorrecipe_e2_lr1e-4_s3
568e82a
verified

agu18dec committed on

add checkpoint cat_qwen25_7b_r64_a32_keepbot1pct_priorrecipe_e2_lr1e-4_s1
147f87e
verified

agu18dec committed on

add checkpoint cat_qwen25_7b_r64_a32_keepbot1pct_priorrecipe_e2_lr1e-4_s2
c42fcb3
verified

agu18dec committed on

add checkpoint cat_qwen25_7b_r8_a32_sgd_e2_lr1e-4_s3_rotated_basis_r42
e8c6abc
verified

agu18dec committed on

add checkpoint cat_qwen25_7b_r8_a32_sgd_e2_lr1e-4_s2_rotated_basis_r42
4e26809
verified

agu18dec committed on

add checkpoint cat_qwen25_7b_r8_a32_adamw_e2_lr1e-4_s3_rotated_basis_r42
0a6ad95
verified

agu18dec committed on

add checkpoint cat_qwen25_7b_r8_a32_sgd_e2_lr1e-4_s1_rotated_basis_r42
2d9e1ad
verified

agu18dec committed on

add checkpoint cat_qwen25_7b_r8_a32_adamw_e2_lr1e-4_s2_rotated_basis_r42
b6c4335
verified

agu18dec committed on

add checkpoint cat_qwen25_7b_r8_a32_adamw_e2_lr1e-4_s1_rotated_basis_r42
2ff79c3
verified

agu18dec committed on

add checkpoint cat_qwen25_7b_r8_a32_keepbottom1pct_geomean_e2_lr1e-4_s3
f4c6934
verified

agu18dec committed on

add checkpoint cat_qwen25_7b_r8_a32_keepbottom1pct_geomean_e2_lr1e-4_s1
c912251
verified

agu18dec committed on

add checkpoint cat_qwen25_7b_r8_a32_keepbottom1pct_geomean_e2_lr1e-4_s2
67d3310
verified

agu18dec committed on

add checkpoint cat_qwen25_7b_r8_a32_sgd_e10_lr1e-4_s2_rotated_basis_r42
1ea21df
verified

agu18dec committed on

add checkpoint cat_qwen25_7b_r8_a32_sgd_e10_lr1e-4_s3_rotated_basis_r42
0100120
verified

agu18dec committed on

add checkpoint cat_qwen25_7b_r8_a32_adamw_e5_lr1e-4_s2_bottomk_1pct
d83a278
verified

agu18dec committed on

add checkpoint cat_qwen25_7b_r8_a32_adamw_e5_lr1e-4_s3_bottomk_1pct
e0ebab7
verified

agu18dec committed on

add checkpoint cat_qwen25_7b_r8_a32_precondsgd_e5_lr1e-4_s3
3f1529c
verified

agu18dec committed on

add checkpoint cat_qwen25_7b_r8_a32_adamw_e5_lr1e-4_s1_bottomk_1pct
bfb3e1c
verified

agu18dec committed on

add checkpoint cat_qwen25_7b_r8_a32_precondsgd_e5_lr1e-4_s2
7a8489e
verified

agu18dec committed on

add checkpoint cat_qwen25_7b_r8_a32_precondsgd_e5_lr1e-4_s1
6d480f0
verified

agu18dec committed on

add checkpoint cat_qwen25_7b_r8_a32_adamw_e10_lr1e-4_s1_vt_add_a4_B1_L20_noSys_30000
ec999ae
verified

agu18dec committed on

add checkpoint cat_qwen25_7b_r8_a32_adamw_e25_lr1e-4_s1_vt_add_a4_B1_L20_noSys
4de22c0
verified

agu18dec committed on

add checkpoint cat_qwen25_7b_r8_a32_adamw_e25_lr1e-4_s1_vt_add_a2_B1_L20_noSys
00ca277
verified

agu18dec committed on

add checkpoint cat_qwen25_7b_r8_a32_adamw_e10_lr1e-4_s1_vt_add_a2_B5_L19L20L21_bcast_noSys_15000
3d8954b
verified

agu18dec committed on

add checkpoint cat_qwen25_7b_r8_a32_adamw_e10_lr1e-4_s1_vt_add_a0.75_B3_ALL_atag_noSys
1d6ec55
verified

agu18dec committed on

add checkpoint cat_qwen25_7b_r8_a32_adamw_e10_lr1e-4_s1_vt_add_a0.5_B3_ALL_atag_noSys
e77c492
verified

agu18dec committed on