File size: 2,828 Bytes
270c901 fe16d95 229fcf2 fe16d95 270c901 229fcf2 270c901 229fcf2 7d11b45 498564f e5cd618 32628c0 77ceeca eddce0a 9d9b2ee fe16d95 270c901 229fcf2 f06f27b 229fcf2 fe16d95 270c901 | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 | {
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 2.8213166144200628,
"eval_steps": 100,
"global_step": 900,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.31,
"learning_rate": 0.0002,
"loss": 0.7896,
"step": 100
},
{
"epoch": 0.31,
"eval_runtime": 511.2401,
"eval_samples_per_second": 1.76,
"eval_steps_per_second": 0.221,
"step": 100
},
{
"epoch": 0.63,
"learning_rate": 0.0002,
"loss": 0.6216,
"step": 200
},
{
"epoch": 0.63,
"eval_runtime": 512.8833,
"eval_samples_per_second": 1.755,
"eval_steps_per_second": 0.22,
"step": 200
},
{
"epoch": 0.94,
"learning_rate": 0.0002,
"loss": 0.5863,
"step": 300
},
{
"epoch": 0.94,
"eval_runtime": 513.6336,
"eval_samples_per_second": 1.752,
"eval_steps_per_second": 0.22,
"step": 300
},
{
"epoch": 1.25,
"learning_rate": 0.0002,
"loss": 0.5528,
"step": 400
},
{
"epoch": 1.25,
"eval_runtime": 512.1927,
"eval_samples_per_second": 1.757,
"eval_steps_per_second": 0.221,
"step": 400
},
{
"epoch": 1.57,
"learning_rate": 0.0002,
"loss": 0.561,
"step": 500
},
{
"epoch": 1.57,
"eval_runtime": 512.2603,
"eval_samples_per_second": 1.757,
"eval_steps_per_second": 0.221,
"step": 500
},
{
"epoch": 1.88,
"learning_rate": 0.0002,
"loss": 0.5462,
"step": 600
},
{
"epoch": 1.88,
"eval_runtime": 512.6885,
"eval_samples_per_second": 1.755,
"eval_steps_per_second": 0.22,
"step": 600
},
{
"epoch": 2.19,
"learning_rate": 0.0002,
"loss": 0.5059,
"step": 700
},
{
"epoch": 2.19,
"eval_runtime": 512.3973,
"eval_samples_per_second": 1.756,
"eval_steps_per_second": 0.221,
"step": 700
},
{
"epoch": 2.51,
"learning_rate": 0.0002,
"loss": 0.4752,
"step": 800
},
{
"epoch": 2.51,
"eval_runtime": 513.4451,
"eval_samples_per_second": 1.753,
"eval_steps_per_second": 0.22,
"step": 800
},
{
"epoch": 2.82,
"learning_rate": 0.0002,
"loss": 0.493,
"step": 900
},
{
"epoch": 2.82,
"eval_runtime": 512.3415,
"eval_samples_per_second": 1.757,
"eval_steps_per_second": 0.221,
"step": 900
}
],
"logging_steps": 100,
"max_steps": 957,
"num_train_epochs": 3,
"save_steps": 100,
"total_flos": 1.4940792341869363e+17,
"trial_name": null,
"trial_params": null
}
|