zephyr-7b-sft-iter3 / train_results.json
billxbf's picture
Model save
517293f verified
{
"entropy": 0.277587890625,
"epoch": 2.0,
"mean_token_accuracy": 0.9315056651830673,
"num_tokens": 43052574.0,
"total_flos": 147618740305920.0,
"train_loss": 0.5035586367409495,
"train_runtime": 3498.3794,
"train_samples": 40756,
"train_samples_per_second": 23.3,
"train_steps_per_second": 0.364
}