add checkpoint cat_qwen25_7b_r64_a32_plain_priorrecipe_e2_lr1e-4_s3 3ab2dbd verified agu18dec commited on about 1 month ago
add checkpoint cat_qwen25_7b_r64_a32_plain_priorrecipe_e2_lr1e-4_s1 cd7bc51 verified agu18dec commited on about 1 month ago
add checkpoint cat_qwen25_7b_r64_a32_plain_priorrecipe_e2_lr1e-4_s2 443fe73 verified agu18dec commited on about 1 month ago
add checkpoint cat_qwen25_7b_r8_a32_keeptop1pct_geomean_e2_lr1e-4_s3 2039b95 verified agu18dec commited on about 1 month ago
add checkpoint cat_qwen25_7b_r8_a32_keeptop1pct_geomean_e2_lr1e-4_s1 bddaeda verified agu18dec commited on about 1 month ago
add checkpoint cat_qwen25_7b_r8_a32_keeptop1pct_geomean_e2_lr1e-4_s2 35aa4f2 verified agu18dec commited on about 1 month ago
add checkpoint cat_qwen25_7b_r64_a32_keepbot1pct_priorrecipe_e2_lr1e-4_s3 568e82a verified agu18dec commited on about 1 month ago
add checkpoint cat_qwen25_7b_r64_a32_keepbot1pct_priorrecipe_e2_lr1e-4_s1 147f87e verified agu18dec commited on about 1 month ago
add checkpoint cat_qwen25_7b_r64_a32_keepbot1pct_priorrecipe_e2_lr1e-4_s2 c42fcb3 verified agu18dec commited on about 1 month ago
add checkpoint cat_qwen25_7b_r8_a32_sgd_e2_lr1e-4_s3_rotated_basis_r42 e8c6abc verified agu18dec commited on about 1 month ago
add checkpoint cat_qwen25_7b_r8_a32_sgd_e2_lr1e-4_s2_rotated_basis_r42 4e26809 verified agu18dec commited on about 1 month ago
add checkpoint cat_qwen25_7b_r8_a32_adamw_e2_lr1e-4_s3_rotated_basis_r42 0a6ad95 verified agu18dec commited on about 1 month ago
add checkpoint cat_qwen25_7b_r8_a32_sgd_e2_lr1e-4_s1_rotated_basis_r42 2d9e1ad verified agu18dec commited on about 1 month ago
add checkpoint cat_qwen25_7b_r8_a32_adamw_e2_lr1e-4_s2_rotated_basis_r42 b6c4335 verified agu18dec commited on about 1 month ago
add checkpoint cat_qwen25_7b_r8_a32_adamw_e2_lr1e-4_s1_rotated_basis_r42 2ff79c3 verified agu18dec commited on about 1 month ago
add checkpoint cat_qwen25_7b_r8_a32_keepbottom1pct_geomean_e2_lr1e-4_s3 f4c6934 verified agu18dec commited on about 1 month ago
add checkpoint cat_qwen25_7b_r8_a32_keepbottom1pct_geomean_e2_lr1e-4_s1 c912251 verified agu18dec commited on about 1 month ago
add checkpoint cat_qwen25_7b_r8_a32_keepbottom1pct_geomean_e2_lr1e-4_s2 67d3310 verified agu18dec commited on about 1 month ago
add checkpoint cat_qwen25_7b_r8_a32_sgd_e10_lr1e-4_s2_rotated_basis_r42 1ea21df verified agu18dec commited on May 6
add checkpoint cat_qwen25_7b_r8_a32_sgd_e10_lr1e-4_s3_rotated_basis_r42 0100120 verified agu18dec commited on May 6
add checkpoint cat_qwen25_7b_r8_a32_adamw_e5_lr1e-4_s2_bottomk_1pct d83a278 verified agu18dec commited on May 6
add checkpoint cat_qwen25_7b_r8_a32_adamw_e5_lr1e-4_s3_bottomk_1pct e0ebab7 verified agu18dec commited on May 6
add checkpoint cat_qwen25_7b_r8_a32_precondsgd_e5_lr1e-4_s3 3f1529c verified agu18dec commited on May 6
add checkpoint cat_qwen25_7b_r8_a32_adamw_e5_lr1e-4_s1_bottomk_1pct bfb3e1c verified agu18dec commited on May 6
add checkpoint cat_qwen25_7b_r8_a32_precondsgd_e5_lr1e-4_s2 7a8489e verified agu18dec commited on May 6
add checkpoint cat_qwen25_7b_r8_a32_precondsgd_e5_lr1e-4_s1 6d480f0 verified agu18dec commited on May 6
add checkpoint cat_qwen25_7b_r8_a32_adamw_e10_lr1e-4_s1_vt_add_a4_B1_L20_noSys_30000 ec999ae verified agu18dec commited on May 5
add checkpoint cat_qwen25_7b_r8_a32_adamw_e25_lr1e-4_s1_vt_add_a4_B1_L20_noSys 4de22c0 verified agu18dec commited on May 5
add checkpoint cat_qwen25_7b_r8_a32_adamw_e25_lr1e-4_s1_vt_add_a2_B1_L20_noSys 00ca277 verified agu18dec commited on May 5
add checkpoint cat_qwen25_7b_r8_a32_adamw_e10_lr1e-4_s1_vt_add_a2_B5_L19L20L21_bcast_noSys_15000 3d8954b verified agu18dec commited on May 5
add checkpoint cat_qwen25_7b_r8_a32_adamw_e10_lr1e-4_s1_vt_add_a0.75_B3_ALL_atag_noSys 1d6ec55 verified agu18dec commited on May 4
add checkpoint cat_qwen25_7b_r8_a32_adamw_e10_lr1e-4_s1_vt_add_a0.5_B3_ALL_atag_noSys e77c492 verified agu18dec commited on May 4
add checkpoint cat_qwen25_7b_r8_a32_adamw_e10_lr1e-4_s1_vt_add_a4_B1_L20_noSys d0d7f35 verified agu18dec commited on May 4
add checkpoint cat_qwen25_7b_r8_a32_adamw_e10_lr1e-4_s1_vt_add_a2_B1_L20_noSys 4687d28 verified agu18dec commited on May 4
add checkpoint cat_qwen25_7b_r8_a32_sgd_rot_e2_lr1e-4_s2_10k 53043d5 verified agu18dec commited on May 4
add checkpoint cat_qwen25_7b_r8_a32_sgd_rot_e2_lr1e-4_s3_10k 17dcd6a verified agu18dec commited on May 4
add checkpoint cat_qwen25_7b_r8_a32_sgd_rot_e2_lr1e-4_s1_10k 8286f6f verified agu18dec commited on May 4
add checkpoint cat_qwen25_7b_r8_a32_rmsprop_rot_e2_lr1e-4_s2_10k 4f3da70 verified agu18dec commited on May 4
add checkpoint cat_qwen25_7b_r8_a32_rmsprop_rot_e2_lr1e-4_s1_10k d3847af verified agu18dec commited on May 4
add checkpoint cat_qwen25_7b_r8_a32_rmsprop_rot_e2_lr1e-4_s3_10k 9dbd7ef verified agu18dec commited on May 4
add checkpoint cat_qwen25_7b_r8_a32_adamw_e2_lr1e-4_s1_pirate_olmo_10k 5428400 verified agu18dec commited on May 4
add checkpoint cat_qwen25_7b_r8_a32_adam_rot_e2_lr1e-4_s2_10k 37eedfb verified agu18dec commited on May 4
add checkpoint cat_qwen25_7b_r8_a32_adam_rot_e2_lr1e-4_s1_10k ef66eab verified agu18dec commited on May 4
add checkpoint cat_qwen25_7b_r8_a32_adam_rot_e2_lr1e-4_s3_10k 2193044 verified agu18dec commited on May 4
add checkpoint cat_qwen25_7b_r8_a32_precondspr_e2_lr1e-4_s2_10k 1e6e648 verified agu18dec commited on May 4
add checkpoint cat_qwen25_7b_r8_a32_precondspr_e2_lr1e-4_s3_10k 0393088 verified agu18dec commited on May 4
add checkpoint cat_qwen25_7b_r8_a32_precondspr_e2_lr1e-4_s1_10k f5f354c verified agu18dec commited on May 4
add checkpoint cat_qwen25_7b_r8_a32_precond_e2_lr1e-4_s2_10k ebda458 verified agu18dec commited on May 4
add checkpoint cat_qwen25_7b_r8_a32_precond_e2_lr1e-4_s3_10k 881337f verified agu18dec commited on May 4
add checkpoint cat_qwen25_7b_r8_a32_precond_e2_lr1e-4_s1_10k c46dc32 verified agu18dec commited on May 4