{ "best_metric": 0.05212199687957764, "best_model_checkpoint": "/content/drive/MyDrive/Colab Notebooks/models/t5-small-codesearchnet-multilang-python/checkpoint-2625", "epoch": 13.0, "global_step": 4875, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "eval_avg_length": 17.046, "eval_bleu": 0.0407, "eval_loss": 0.07167458534240723, "eval_rouge1": 0.6244, "eval_rouge2": 0.6063, "eval_runtime": 146.8983, "eval_samples_per_second": 34.037, "eval_steps_per_second": 4.255, "step": 375 }, { "epoch": 1.33, "learning_rate": 0.011602410115301609, "loss": 1.6287, "step": 500 }, { "epoch": 2.0, "eval_avg_length": 16.9924, "eval_bleu": 0.041, "eval_loss": 0.05889422446489334, "eval_rouge1": 0.6321, "eval_rouge2": 0.6136, "eval_runtime": 145.8711, "eval_samples_per_second": 34.277, "eval_steps_per_second": 4.285, "step": 750 }, { "epoch": 2.67, "learning_rate": 0.023224830627441406, "loss": 0.0592, "step": 1000 }, { "epoch": 3.0, "eval_avg_length": 16.971, "eval_bleu": 0.0402, "eval_loss": 0.0550708994269371, "eval_rouge1": 0.6334, "eval_rouge2": 0.6152, "eval_runtime": 143.6698, "eval_samples_per_second": 34.802, "eval_steps_per_second": 4.35, "step": 1125 }, { "epoch": 4.0, "learning_rate": 0.03487464413046837, "loss": 0.0511, "step": 1500 }, { "epoch": 4.0, "eval_avg_length": 16.9718, "eval_bleu": 0.0402, "eval_loss": 0.054238129407167435, "eval_rouge1": 0.6336, "eval_rouge2": 0.6155, "eval_runtime": 144.3554, "eval_samples_per_second": 34.637, "eval_steps_per_second": 4.33, "step": 1500 }, { "epoch": 5.0, "eval_avg_length": 16.961, "eval_bleu": 0.0401, "eval_loss": 0.05285137891769409, "eval_rouge1": 0.6343, "eval_rouge2": 0.6161, "eval_runtime": 144.2239, "eval_samples_per_second": 34.668, "eval_steps_per_second": 4.334, "step": 1875 }, { "epoch": 5.33, "learning_rate": 0.046562861651182175, "loss": 0.0441, "step": 2000 }, { "epoch": 6.0, "eval_avg_length": 16.9626, "eval_bleu": 0.0402, "eval_loss": 0.05305228382349014, "eval_rouge1": 0.6341, "eval_rouge2": 0.6158, "eval_runtime": 144.1713, "eval_samples_per_second": 34.681, "eval_steps_per_second": 4.335, "step": 2250 }, { "epoch": 6.67, "learning_rate": 0.058299630880355835, "loss": 0.0399, "step": 2500 }, { "epoch": 7.0, "eval_avg_length": 16.97, "eval_bleu": 0.0402, "eval_loss": 0.05212199687957764, "eval_rouge1": 0.6337, "eval_rouge2": 0.6154, "eval_runtime": 143.8202, "eval_samples_per_second": 34.766, "eval_steps_per_second": 4.346, "step": 2625 }, { "epoch": 8.0, "learning_rate": 0.07010027766227722, "loss": 0.0351, "step": 3000 }, { "epoch": 8.0, "eval_avg_length": 16.964, "eval_bleu": 0.0401, "eval_loss": 0.05471711605787277, "eval_rouge1": 0.6341, "eval_rouge2": 0.6159, "eval_runtime": 144.436, "eval_samples_per_second": 34.617, "eval_steps_per_second": 4.327, "step": 3000 }, { "epoch": 9.0, "eval_avg_length": 16.962, "eval_bleu": 0.0402, "eval_loss": 0.054534584283828735, "eval_rouge1": 0.635, "eval_rouge2": 0.6167, "eval_runtime": 143.3352, "eval_samples_per_second": 34.883, "eval_steps_per_second": 4.36, "step": 3375 }, { "epoch": 9.33, "learning_rate": 0.08195903152227402, "loss": 0.0301, "step": 3500 }, { "epoch": 10.0, "eval_avg_length": 16.9646, "eval_bleu": 0.0402, "eval_loss": 0.05570118501782417, "eval_rouge1": 0.6342, "eval_rouge2": 0.6159, "eval_runtime": 143.514, "eval_samples_per_second": 34.84, "eval_steps_per_second": 4.355, "step": 3750 }, { "epoch": 10.67, "learning_rate": 0.09392501413822174, "loss": 0.027, "step": 4000 }, { "epoch": 11.0, "eval_avg_length": 16.9622, "eval_bleu": 0.0402, "eval_loss": 0.05687524378299713, "eval_rouge1": 0.6342, "eval_rouge2": 0.6157, "eval_runtime": 144.0849, "eval_samples_per_second": 34.702, "eval_steps_per_second": 4.338, "step": 4125 }, { "epoch": 12.0, "learning_rate": 0.10599534213542938, "loss": 0.0239, "step": 4500 }, { "epoch": 12.0, "eval_avg_length": 16.9564, "eval_bleu": 0.0401, "eval_loss": 0.060644153505563736, "eval_rouge1": 0.6342, "eval_rouge2": 0.6158, "eval_runtime": 143.5445, "eval_samples_per_second": 34.832, "eval_steps_per_second": 4.354, "step": 4500 }, { "epoch": 13.0, "eval_avg_length": 16.963, "eval_bleu": 0.0401, "eval_loss": 0.06158696860074997, "eval_rouge1": 0.6343, "eval_rouge2": 0.6163, "eval_runtime": 144.0161, "eval_samples_per_second": 34.718, "eval_steps_per_second": 4.34, "step": 4875 } ], "max_steps": 5625, "num_train_epochs": 15, "total_flos": 2.639165128704e+16, "trial_name": null, "trial_params": null }