| { |
| "best_metric": 0.05236489325761795, |
| "best_model_checkpoint": "/content/drive/MyDrive/Colab Notebooks/models/google/flan-t5-small-codesearchnet-python/checkpoint-1500", |
| "epoch": 4.0, |
| "global_step": 1500, |
| "is_hyper_param_search": false, |
| "is_local_process_zero": true, |
| "is_world_process_zero": true, |
| "log_history": [ |
| { |
| "epoch": 1.0, |
| "eval_avg_length": 17.029, |
| "eval_bleu": 0.0364, |
| "eval_loss": 0.06356053799390793, |
| "eval_rouge1": 0.6253, |
| "eval_rouge2": 0.6076, |
| "eval_runtime": 194.621, |
| "eval_samples_per_second": 25.691, |
| "eval_steps_per_second": 3.211, |
| "step": 375 |
| }, |
| { |
| "epoch": 1.33, |
| "learning_rate": 0.006761715281754732, |
| "loss": 5.5166, |
| "step": 500 |
| }, |
| { |
| "epoch": 2.0, |
| "eval_avg_length": 16.9996, |
| "eval_bleu": 0.0351, |
| "eval_loss": 0.05532339960336685, |
| "eval_rouge1": 0.6259, |
| "eval_rouge2": 0.6081, |
| "eval_runtime": 191.1842, |
| "eval_samples_per_second": 26.153, |
| "eval_steps_per_second": 3.269, |
| "step": 750 |
| }, |
| { |
| "epoch": 2.67, |
| "learning_rate": 0.013524587266147137, |
| "loss": 0.0485, |
| "step": 1000 |
| }, |
| { |
| "epoch": 3.0, |
| "eval_avg_length": 16.99, |
| "eval_bleu": 0.0351, |
| "eval_loss": 0.05369499325752258, |
| "eval_rouge1": 0.6258, |
| "eval_rouge2": 0.6083, |
| "eval_runtime": 189.3124, |
| "eval_samples_per_second": 26.411, |
| "eval_steps_per_second": 3.301, |
| "step": 1125 |
| }, |
| { |
| "epoch": 4.0, |
| "learning_rate": 0.02029060572385788, |
| "loss": 0.0409, |
| "step": 1500 |
| }, |
| { |
| "epoch": 4.0, |
| "eval_avg_length": 16.9942, |
| "eval_bleu": 0.0351, |
| "eval_loss": 0.05236489325761795, |
| "eval_rouge1": 0.6258, |
| "eval_rouge2": 0.6082, |
| "eval_runtime": 189.5235, |
| "eval_samples_per_second": 26.382, |
| "eval_steps_per_second": 3.298, |
| "step": 1500 |
| } |
| ], |
| "max_steps": 5625, |
| "num_train_epochs": 15, |
| "total_flos": 1.115343028224e+16, |
| "trial_name": null, |
| "trial_params": null |
| } |
|
|