elisanchez-beep's picture
first commit
3addd20 verified
{
"best_metric": 0.6532846715328468,
"best_model_checkpoint": "./outputs/en_es_multilingual/mdeberta-v3-base-output/met_xnli_test_en_8_0.01_0.00005_11-17-23_09-47/checkpoint-3630",
"epoch": 4.0,
"global_step": 7260,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"learning_rate": 3.989595545134818e-05,
"loss": 0.0887,
"step": 1815
},
{
"epoch": 1.0,
"eval_accuracy": 0.9858611825192802,
"eval_f1": 0.6258389261744967,
"eval_loss": 0.04259440675377846,
"eval_precision": 0.6109746109746109,
"eval_recall": 0.641444539982803,
"eval_runtime": 14.5185,
"eval_samples_per_second": 334.951,
"eval_steps_per_second": 41.877,
"step": 1815
},
{
"epoch": 2.0,
"learning_rate": 2.6597303634232123e-05,
"loss": 0.0228,
"step": 3630
},
{
"epoch": 2.0,
"eval_accuracy": 0.9879240851820115,
"eval_f1": 0.6532846715328468,
"eval_loss": 0.034684374928474426,
"eval_precision": 0.6958211856171039,
"eval_recall": 0.6156491831470335,
"eval_runtime": 13.7183,
"eval_samples_per_second": 354.489,
"eval_steps_per_second": 44.32,
"step": 3630
},
{
"epoch": 3.0,
"learning_rate": 1.3298651817116062e-05,
"loss": 0.0104,
"step": 5445
},
{
"epoch": 3.0,
"eval_accuracy": 0.9885270874988099,
"eval_f1": 0.6226415094339622,
"eval_loss": 0.05654400959610939,
"eval_precision": 0.7973154362416107,
"eval_recall": 0.5107480653482374,
"eval_runtime": 12.5259,
"eval_samples_per_second": 388.237,
"eval_steps_per_second": 48.54,
"step": 5445
},
{
"epoch": 4.0,
"learning_rate": 0.0,
"loss": 0.0046,
"step": 7260
},
{
"epoch": 4.0,
"eval_accuracy": 0.9881779808943476,
"eval_f1": 0.6463007159904535,
"eval_loss": 0.05788963660597801,
"eval_precision": 0.7263948497854077,
"eval_recall": 0.5821152192605331,
"eval_runtime": 13.3972,
"eval_samples_per_second": 362.986,
"eval_steps_per_second": 45.383,
"step": 7260
},
{
"epoch": 4.0,
"step": 7260,
"total_flos": 1062049033953072.0,
"train_loss": 0.031637020347532165,
"train_runtime": 972.4399,
"train_samples_per_second": 59.722,
"train_steps_per_second": 7.466
}
],
"max_steps": 7260,
"num_train_epochs": 4,
"total_flos": 1062049033953072.0,
"trial_name": null,
"trial_params": null
}