File size: 2,201 Bytes
76e7554 1f64eba 76e7554 1f64eba 76e7554 1f64eba 76e7554 1f64eba 76e7554 1f64eba 76e7554 1f64eba 76e7554 1f64eba 76e7554 1f64eba 76e7554 1f64eba 76e7554 1f64eba 76e7554 1f64eba 76e7554 1f64eba 76e7554 1f64eba 76e7554 1f64eba 76e7554 1f64eba 76e7554 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 |
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 0.0037203534335761897,
"eval_steps": 3,
"global_step": 6,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.0006200589055960316,
"grad_norm": 0.16878783702850342,
"learning_rate": 4.000000000000001e-06,
"loss": 0.9729,
"step": 1
},
{
"epoch": 0.0012401178111920632,
"grad_norm": 0.0865061804652214,
"learning_rate": 8.000000000000001e-06,
"loss": 0.6661,
"step": 2
},
{
"epoch": 0.0018601767167880949,
"grad_norm": 0.0920981764793396,
"learning_rate": 1.2e-05,
"loss": 0.5954,
"step": 3
},
{
"epoch": 0.0018601767167880949,
"eval_loss": 0.762992262840271,
"eval_runtime": 33.3972,
"eval_samples_per_second": 2.994,
"eval_steps_per_second": 2.994,
"step": 3
},
{
"epoch": 0.0024802356223841263,
"grad_norm": 0.10451442003250122,
"learning_rate": 1.6000000000000003e-05,
"loss": 0.7227,
"step": 4
},
{
"epoch": 0.0031002945279801583,
"grad_norm": 0.11351602524518967,
"learning_rate": 2e-05,
"loss": 0.5719,
"step": 5
},
{
"epoch": 0.0037203534335761897,
"grad_norm": 0.12484906613826752,
"learning_rate": 1.9200000000000003e-05,
"loss": 0.6972,
"step": 6
},
{
"epoch": 0.0037203534335761897,
"eval_loss": 0.7615777850151062,
"eval_runtime": 33.3804,
"eval_samples_per_second": 2.996,
"eval_steps_per_second": 2.996,
"step": 6
}
],
"logging_steps": 1,
"max_steps": 30,
"num_input_tokens_seen": 0,
"num_train_epochs": 1,
"save_steps": 3,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": false
},
"attributes": {}
}
},
"total_flos": 8918117859115008.0,
"train_batch_size": 2,
"trial_name": null,
"trial_params": null
}
|