tangken333's picture
upload testing qwen_code_7B_test_swe_reasoning
0aec1d1 verified
raw
history blame contribute delete
221 Bytes
{
"epoch": 2.9822485207100593,
"total_flos": 6.46489842951127e+16,
"train_loss": 0.5384191712808042,
"train_runtime": 12683.2217,
"train_samples_per_second": 0.32,
"train_steps_per_second": 0.013
}