dopamin-java-expand / trainer_state.json
NamCyan's picture
Upload folder using huggingface_hub
7bcd184
raw
history blame
7.64 kB
{
"best_metric": 0.5863192182410424,
"best_model_checkpoint": "/cm/archive/namlh35/code-comment-classification/results/selection_wo_valid/Verification/codebert-postpretrained-HSUM-4layers-datav2-class-comment/java_expand/checkpoint-500",
"epoch": 7.954545454545455,
"eval_steps": 50,
"global_step": 1050,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.38,
"eval_f1": 0.14423076923076925,
"eval_loss": 0.19940590858459473,
"eval_precision": 0.35714285714285715,
"eval_recall": 0.09036144578313253,
"eval_runtime": 15.6593,
"eval_samples_per_second": 135.0,
"eval_steps_per_second": 8.493,
"step": 50
},
{
"epoch": 0.76,
"eval_f1": 0.4090909090909091,
"eval_loss": 0.21339909732341766,
"eval_precision": 0.3870967741935484,
"eval_recall": 0.43373493975903615,
"eval_runtime": 7.5755,
"eval_samples_per_second": 279.059,
"eval_steps_per_second": 17.557,
"step": 100
},
{
"epoch": 1.14,
"eval_f1": 0.5236907730673317,
"eval_loss": 0.2083684802055359,
"eval_precision": 0.44680851063829785,
"eval_recall": 0.6325301204819277,
"eval_runtime": 7.801,
"eval_samples_per_second": 270.99,
"eval_steps_per_second": 17.049,
"step": 150
},
{
"epoch": 1.52,
"eval_f1": 0.510385756676558,
"eval_loss": 0.2234768122434616,
"eval_precision": 0.5029239766081871,
"eval_recall": 0.5180722891566265,
"eval_runtime": 7.6406,
"eval_samples_per_second": 276.682,
"eval_steps_per_second": 17.407,
"step": 200
},
{
"epoch": 1.89,
"eval_f1": 0.5125628140703518,
"eval_loss": 0.20452718436717987,
"eval_precision": 0.4396551724137931,
"eval_recall": 0.6144578313253012,
"eval_runtime": 7.5874,
"eval_samples_per_second": 278.618,
"eval_steps_per_second": 17.529,
"step": 250
},
{
"epoch": 2.27,
"eval_f1": 0.5590062111801242,
"eval_loss": 0.22217300534248352,
"eval_precision": 0.5769230769230769,
"eval_recall": 0.5421686746987951,
"eval_runtime": 7.4841,
"eval_samples_per_second": 282.467,
"eval_steps_per_second": 17.771,
"step": 300
},
{
"epoch": 2.65,
"eval_f1": 0.5478547854785478,
"eval_loss": 0.23551225662231445,
"eval_precision": 0.6058394160583942,
"eval_recall": 0.5,
"eval_runtime": 7.5637,
"eval_samples_per_second": 279.493,
"eval_steps_per_second": 17.584,
"step": 350
},
{
"epoch": 3.03,
"eval_f1": 0.5739130434782609,
"eval_loss": 0.22371679544448853,
"eval_precision": 0.553072625698324,
"eval_recall": 0.5963855421686747,
"eval_runtime": 7.9409,
"eval_samples_per_second": 266.215,
"eval_steps_per_second": 16.749,
"step": 400
},
{
"epoch": 3.41,
"eval_f1": 0.5586206896551725,
"eval_loss": 0.24752120673656464,
"eval_precision": 0.6532258064516129,
"eval_recall": 0.4879518072289157,
"eval_runtime": 7.5417,
"eval_samples_per_second": 280.309,
"eval_steps_per_second": 17.635,
"step": 450
},
{
"epoch": 3.79,
"learning_rate": 6.212121212121213e-06,
"loss": 0.102,
"step": 500
},
{
"epoch": 3.79,
"eval_f1": 0.5863192182410424,
"eval_loss": 0.25533562898635864,
"eval_precision": 0.6382978723404256,
"eval_recall": 0.5421686746987951,
"eval_runtime": 7.9722,
"eval_samples_per_second": 265.172,
"eval_steps_per_second": 16.683,
"step": 500
},
{
"epoch": 4.17,
"eval_f1": 0.5714285714285715,
"eval_loss": 0.26097801327705383,
"eval_precision": 0.6370370370370371,
"eval_recall": 0.5180722891566265,
"eval_runtime": 8.3006,
"eval_samples_per_second": 254.679,
"eval_steps_per_second": 16.023,
"step": 550
},
{
"epoch": 4.55,
"eval_f1": 0.5602409638554217,
"eval_loss": 0.2843839228153229,
"eval_precision": 0.5602409638554217,
"eval_recall": 0.5602409638554217,
"eval_runtime": 7.9699,
"eval_samples_per_second": 265.247,
"eval_steps_per_second": 16.688,
"step": 600
},
{
"epoch": 4.92,
"eval_f1": 0.5687500000000001,
"eval_loss": 0.29494354128837585,
"eval_precision": 0.5909090909090909,
"eval_recall": 0.5481927710843374,
"eval_runtime": 8.3531,
"eval_samples_per_second": 253.08,
"eval_steps_per_second": 15.922,
"step": 650
},
{
"epoch": 5.3,
"eval_f1": 0.5578231292517006,
"eval_loss": 0.3040340840816498,
"eval_precision": 0.640625,
"eval_recall": 0.4939759036144578,
"eval_runtime": 7.1333,
"eval_samples_per_second": 296.358,
"eval_steps_per_second": 18.645,
"step": 700
},
{
"epoch": 5.68,
"eval_f1": 0.559748427672956,
"eval_loss": 0.3211788833141327,
"eval_precision": 0.5855263157894737,
"eval_recall": 0.536144578313253,
"eval_runtime": 7.2776,
"eval_samples_per_second": 290.482,
"eval_steps_per_second": 18.275,
"step": 750
},
{
"epoch": 6.06,
"eval_f1": 0.5714285714285714,
"eval_loss": 0.3221454620361328,
"eval_precision": 0.6040268456375839,
"eval_recall": 0.5421686746987951,
"eval_runtime": 9.612,
"eval_samples_per_second": 219.932,
"eval_steps_per_second": 13.837,
"step": 800
},
{
"epoch": 6.44,
"eval_f1": 0.5741324921135648,
"eval_loss": 0.32895684242248535,
"eval_precision": 0.6026490066225165,
"eval_recall": 0.5481927710843374,
"eval_runtime": 9.3112,
"eval_samples_per_second": 227.038,
"eval_steps_per_second": 14.284,
"step": 850
},
{
"epoch": 6.82,
"eval_f1": 0.5704697986577182,
"eval_loss": 0.3368590474128723,
"eval_precision": 0.6439393939393939,
"eval_recall": 0.5120481927710844,
"eval_runtime": 10.5803,
"eval_samples_per_second": 199.805,
"eval_steps_per_second": 12.571,
"step": 900
},
{
"epoch": 7.2,
"eval_f1": 0.5759493670886077,
"eval_loss": 0.3474346697330475,
"eval_precision": 0.6066666666666667,
"eval_recall": 0.5481927710843374,
"eval_runtime": 9.0583,
"eval_samples_per_second": 233.377,
"eval_steps_per_second": 14.683,
"step": 950
},
{
"epoch": 7.58,
"learning_rate": 2.4242424242424244e-06,
"loss": 0.0299,
"step": 1000
},
{
"epoch": 7.58,
"eval_f1": 0.5666666666666668,
"eval_loss": 0.3469344675540924,
"eval_precision": 0.6343283582089553,
"eval_recall": 0.5120481927710844,
"eval_runtime": 8.3925,
"eval_samples_per_second": 251.892,
"eval_steps_per_second": 15.847,
"step": 1000
},
{
"epoch": 7.95,
"eval_f1": 0.5749235474006117,
"eval_loss": 0.3440389037132263,
"eval_precision": 0.5838509316770186,
"eval_recall": 0.5662650602409639,
"eval_runtime": 8.5858,
"eval_samples_per_second": 246.22,
"eval_steps_per_second": 15.491,
"step": 1050
}
],
"logging_steps": 500,
"max_steps": 1320,
"num_train_epochs": 10,
"save_steps": 50,
"total_flos": 2939592325754112.0,
"trial_name": null,
"trial_params": null
}