add checkpoint cat_qwen25_7b_r8_a32_adamw_e2_lr1e-4_s1_vt_add_a6_L23_prefill_noSys_100k a45e0b5 verified agu18dec commited on about 2 hours ago
add checkpoint cat_qwen25_7b_r8_a32_adamw_e2_lr1e-4_s2_perlayer_rot_r42 885fafd verified agu18dec commited on about 2 hours ago
add checkpoint cat_qwen25_7b_r8_a32_sgd_e2_lr1e-4_s3_perlayer_rot_r42 0fa7dfc verified agu18dec commited on about 2 hours ago
add checkpoint cat_qwen25_7b_r8_a32_adamw_e2_lr1e-4_s3_perlayer_rot_r42 aec5dbe verified agu18dec commited on about 2 hours ago
add checkpoint cat_qwen25_7b_r8_a32_sgd_e2_lr1e-4_s2_perlayer_rot_r42 1e0539c verified agu18dec commited on about 2 hours ago
add checkpoint cat_qwen25_7b_r8_a32_7m_T0_keepboth5pct_e2_lr1e-4_s1 d9770f6 verified agu18dec commited on about 3 hours ago
add checkpoint cat_qwen25_7b_r8_a32_7m_T0_bot10_e2_lr1e-4_s3 29d3d09 verified agu18dec commited on about 3 hours ago
add checkpoint cat_qwen25_7b_r8_a32_sgd_e2_lr1e-4_s1_perlayer_rot_r42 72bed5c verified agu18dec commited on about 3 hours ago
add checkpoint cat_qwen25_7b_r8_a32_adamw_e2_lr1e-4_s1_perlayer_rot_r42 18e0bb0 verified agu18dec commited on about 3 hours ago
add checkpoint cat_qwen25_7b_r8_a32_7m_T0_bot10_e2_lr1e-4_s2 32a3dcd verified agu18dec commited on about 3 hours ago
add checkpoint cat_qwen25_7b_r8_a32_7m_T0_bot25_e2_lr1e-4_s1 6fab51d verified agu18dec commited on about 3 hours ago
add checkpoint cat_qwen25_7b_r8_a32_7m_T0_bot10_e2_lr1e-4_s1 1d2bd54 verified agu18dec commited on about 4 hours ago
add checkpoint cat_qwen25_7b_r8_a32_7m_T0_bot1_e2_lr1e-4_s1 0006510 verified agu18dec commited on about 4 hours ago
add checkpoint cat_qwen25_7b_r8_a32_7m_T0_bot5_e2_lr1e-4_s1 503a3d9 verified agu18dec commited on about 4 hours ago
add checkpoint cat_qwen25_7b_r8_a32_7m_T0_plain_e2_lr1e-4_s1 397edda verified agu18dec commited on about 4 hours ago
add checkpoint cat_qwen25_7b_r64_a32_bot25_priorrecipe_e2_lr1e-4_s1 89dfa2f verified agu18dec commited on about 5 hours ago
add checkpoint cat_qwen25_7b_r64_a32_bot10_priorrecipe_e2_lr1e-4_s1 38d2e5f verified agu18dec commited on about 5 hours ago
add checkpoint cat_qwen25_7b_r64_a32_bot5_priorrecipe_e2_lr1e-4_s1 e605fb8 verified agu18dec commited on about 5 hours ago
add checkpoint cat_qwen25_7b_r64_a32_plain_priorrecipe_e2_lr1e-4_s3 3ab2dbd verified agu18dec commited on about 5 hours ago
add checkpoint cat_qwen25_7b_r64_a32_plain_priorrecipe_e2_lr1e-4_s1 cd7bc51 verified agu18dec commited on about 5 hours ago
add checkpoint cat_qwen25_7b_r64_a32_plain_priorrecipe_e2_lr1e-4_s2 443fe73 verified agu18dec commited on about 5 hours ago
add checkpoint cat_qwen25_7b_r8_a32_keeptop1pct_geomean_e2_lr1e-4_s3 2039b95 verified agu18dec commited on about 6 hours ago
add checkpoint cat_qwen25_7b_r8_a32_keeptop1pct_geomean_e2_lr1e-4_s1 bddaeda verified agu18dec commited on about 6 hours ago
add checkpoint cat_qwen25_7b_r8_a32_keeptop1pct_geomean_e2_lr1e-4_s2 35aa4f2 verified agu18dec commited on about 6 hours ago
add checkpoint cat_qwen25_7b_r64_a32_keepbot1pct_priorrecipe_e2_lr1e-4_s3 568e82a verified agu18dec commited on about 6 hours ago
add checkpoint cat_qwen25_7b_r64_a32_keepbot1pct_priorrecipe_e2_lr1e-4_s1 147f87e verified agu18dec commited on about 6 hours ago
add checkpoint cat_qwen25_7b_r64_a32_keepbot1pct_priorrecipe_e2_lr1e-4_s2 c42fcb3 verified agu18dec commited on about 6 hours ago
add checkpoint cat_qwen25_7b_r8_a32_sgd_e2_lr1e-4_s3_rotated_basis_r42 e8c6abc verified agu18dec commited on about 7 hours ago
add checkpoint cat_qwen25_7b_r8_a32_sgd_e2_lr1e-4_s2_rotated_basis_r42 4e26809 verified agu18dec commited on about 7 hours ago
add checkpoint cat_qwen25_7b_r8_a32_adamw_e2_lr1e-4_s3_rotated_basis_r42 0a6ad95 verified agu18dec commited on about 7 hours ago
add checkpoint cat_qwen25_7b_r8_a32_sgd_e2_lr1e-4_s1_rotated_basis_r42 2d9e1ad verified agu18dec commited on about 7 hours ago
add checkpoint cat_qwen25_7b_r8_a32_adamw_e2_lr1e-4_s2_rotated_basis_r42 b6c4335 verified agu18dec commited on about 7 hours ago
add checkpoint cat_qwen25_7b_r8_a32_adamw_e2_lr1e-4_s1_rotated_basis_r42 2ff79c3 verified agu18dec commited on about 7 hours ago
add checkpoint cat_qwen25_7b_r8_a32_keepbottom1pct_geomean_e2_lr1e-4_s3 f4c6934 verified agu18dec commited on about 7 hours ago
add checkpoint cat_qwen25_7b_r8_a32_keepbottom1pct_geomean_e2_lr1e-4_s1 c912251 verified agu18dec commited on about 7 hours ago
add checkpoint cat_qwen25_7b_r8_a32_keepbottom1pct_geomean_e2_lr1e-4_s2 67d3310 verified agu18dec commited on about 7 hours ago
add checkpoint cat_qwen25_7b_r8_a32_sgd_e10_lr1e-4_s2_rotated_basis_r42 1ea21df verified agu18dec commited on about 16 hours ago
add checkpoint cat_qwen25_7b_r8_a32_sgd_e10_lr1e-4_s3_rotated_basis_r42 0100120 verified agu18dec commited on about 17 hours ago
add checkpoint cat_qwen25_7b_r8_a32_adamw_e5_lr1e-4_s2_bottomk_1pct d83a278 verified agu18dec commited on about 17 hours ago
add checkpoint cat_qwen25_7b_r8_a32_adamw_e5_lr1e-4_s3_bottomk_1pct e0ebab7 verified agu18dec commited on about 17 hours ago
add checkpoint cat_qwen25_7b_r8_a32_precondsgd_e5_lr1e-4_s3 3f1529c verified agu18dec commited on about 18 hours ago
add checkpoint cat_qwen25_7b_r8_a32_adamw_e5_lr1e-4_s1_bottomk_1pct bfb3e1c verified agu18dec commited on about 18 hours ago
add checkpoint cat_qwen25_7b_r8_a32_precondsgd_e5_lr1e-4_s2 7a8489e verified agu18dec commited on about 18 hours ago
add checkpoint cat_qwen25_7b_r8_a32_precondsgd_e5_lr1e-4_s1 6d480f0 verified agu18dec commited on about 18 hours ago
add checkpoint cat_qwen25_7b_r8_a32_adamw_e10_lr1e-4_s1_vt_add_a4_B1_L20_noSys_30000 ec999ae verified agu18dec commited on 2 days ago
add checkpoint cat_qwen25_7b_r8_a32_adamw_e25_lr1e-4_s1_vt_add_a4_B1_L20_noSys 4de22c0 verified agu18dec commited on 2 days ago
add checkpoint cat_qwen25_7b_r8_a32_adamw_e25_lr1e-4_s1_vt_add_a2_B1_L20_noSys 00ca277 verified agu18dec commited on 2 days ago
add checkpoint cat_qwen25_7b_r8_a32_adamw_e10_lr1e-4_s1_vt_add_a2_B5_L19L20L21_bcast_noSys_15000 3d8954b verified agu18dec commited on 2 days ago
add checkpoint cat_qwen25_7b_r8_a32_adamw_e10_lr1e-4_s1_vt_add_a0.75_B3_ALL_atag_noSys 1d6ec55 verified agu18dec commited on 2 days ago
add checkpoint cat_qwen25_7b_r8_a32_adamw_e10_lr1e-4_s1_vt_add_a0.5_B3_ALL_atag_noSys e77c492 verified agu18dec commited on 2 days ago