File size: 2,202 Bytes
3d972cf 10c5ca9 3d972cf 10c5ca9 3d972cf 10c5ca9 3d972cf 10c5ca9 3d972cf 10c5ca9 3d972cf 10c5ca9 3d972cf 10c5ca9 3d972cf 10c5ca9 3d972cf 10c5ca9 3d972cf 10c5ca9 3d972cf 10c5ca9 3d972cf 10c5ca9 3d972cf 10c5ca9 3d972cf 10c5ca9 3d972cf 10c5ca9 3d972cf |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 |
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 0.0037203534335761897,
"eval_steps": 3,
"global_step": 6,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.0006200589055960316,
"grad_norm": 0.5875879526138306,
"learning_rate": 4.000000000000001e-06,
"loss": 1.179,
"step": 1
},
{
"epoch": 0.0012401178111920632,
"grad_norm": 0.2559925317764282,
"learning_rate": 8.000000000000001e-06,
"loss": 0.9296,
"step": 2
},
{
"epoch": 0.0018601767167880949,
"grad_norm": 0.27975356578826904,
"learning_rate": 1.2e-05,
"loss": 0.8212,
"step": 3
},
{
"epoch": 0.0018601767167880949,
"eval_loss": 1.0227885246276855,
"eval_runtime": 47.9985,
"eval_samples_per_second": 2.083,
"eval_steps_per_second": 2.083,
"step": 3
},
{
"epoch": 0.0024802356223841263,
"grad_norm": 0.4077853858470917,
"learning_rate": 1.6000000000000003e-05,
"loss": 0.9553,
"step": 4
},
{
"epoch": 0.0031002945279801583,
"grad_norm": 0.3481099307537079,
"learning_rate": 2e-05,
"loss": 0.8071,
"step": 5
},
{
"epoch": 0.0037203534335761897,
"grad_norm": 0.33538541197776794,
"learning_rate": 1.9200000000000003e-05,
"loss": 0.9046,
"step": 6
},
{
"epoch": 0.0037203534335761897,
"eval_loss": 1.0122885704040527,
"eval_runtime": 48.1202,
"eval_samples_per_second": 2.078,
"eval_steps_per_second": 2.078,
"step": 6
}
],
"logging_steps": 1,
"max_steps": 30,
"num_input_tokens_seen": 0,
"num_train_epochs": 1,
"save_steps": 3,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": false
},
"attributes": {}
}
},
"total_flos": 1.422690662363136e+16,
"train_batch_size": 2,
"trial_name": null,
"trial_params": null
}
|