File size: 2,199 Bytes
b2b17c3 1cb2fef b2b17c3 1cb2fef b2b17c3 1cb2fef b2b17c3 1cb2fef b2b17c3 1cb2fef b2b17c3 1cb2fef b2b17c3 1cb2fef b2b17c3 1cb2fef b2b17c3 1cb2fef b2b17c3 1cb2fef b2b17c3 1cb2fef b2b17c3 1cb2fef b2b17c3 1cb2fef b2b17c3 1cb2fef b2b17c3 1cb2fef b2b17c3 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 |
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 0.0037203534335761897,
"eval_steps": 3,
"global_step": 6,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.0006200589055960316,
"grad_norm": 0.7607094645500183,
"learning_rate": 4.000000000000001e-06,
"loss": 1.1893,
"step": 1
},
{
"epoch": 0.0012401178111920632,
"grad_norm": 0.3518824279308319,
"learning_rate": 8.000000000000001e-06,
"loss": 0.9752,
"step": 2
},
{
"epoch": 0.0018601767167880949,
"grad_norm": 0.4024870693683624,
"learning_rate": 1.2e-05,
"loss": 0.8467,
"step": 3
},
{
"epoch": 0.0018601767167880949,
"eval_loss": 1.0757174491882324,
"eval_runtime": 26.414,
"eval_samples_per_second": 3.786,
"eval_steps_per_second": 3.786,
"step": 3
},
{
"epoch": 0.0024802356223841263,
"grad_norm": 0.36653462052345276,
"learning_rate": 1.6000000000000003e-05,
"loss": 1.0056,
"step": 4
},
{
"epoch": 0.0031002945279801583,
"grad_norm": 0.47098514437675476,
"learning_rate": 2e-05,
"loss": 0.8545,
"step": 5
},
{
"epoch": 0.0037203534335761897,
"grad_norm": 0.5030912160873413,
"learning_rate": 1.9200000000000003e-05,
"loss": 0.9553,
"step": 6
},
{
"epoch": 0.0037203534335761897,
"eval_loss": 1.0662517547607422,
"eval_runtime": 26.7124,
"eval_samples_per_second": 3.744,
"eval_steps_per_second": 3.744,
"step": 6
}
],
"logging_steps": 1,
"max_steps": 30,
"num_input_tokens_seen": 0,
"num_train_epochs": 1,
"save_steps": 3,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": false
},
"attributes": {}
}
},
"total_flos": 7554675219038208.0,
"train_batch_size": 2,
"trial_name": null,
"trial_params": null
}
|