File size: 3,278 Bytes
68c90ab 6831f8b 68c90ab 6831f8b 68c90ab 6831f8b 68c90ab 6831f8b 68c90ab 6831f8b 68c90ab 6831f8b 68c90ab 6831f8b 68c90ab 6831f8b 68c90ab 6831f8b 68c90ab 6831f8b 68c90ab 6831f8b 68c90ab 6831f8b 68c90ab 6831f8b 68c90ab 6831f8b 68c90ab 6831f8b 68c90ab 6831f8b 68c90ab 6831f8b 68c90ab |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 |
{
"best_global_step": 30816,
"best_metric": 0.807234452615663,
"best_model_checkpoint": "content/cross_encoder_distilroberta_base_all_data/checkpoint-30816",
"epoch": 3.0,
"eval_steps": 10272,
"global_step": 30819,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 9.734254842791784e-05,
"grad_norm": 5.287121772766113,
"learning_rate": 0.0,
"loss": 1.0174,
"step": 1
},
{
"epoch": 0.999902657451572,
"grad_norm": 11.268630981445312,
"learning_rate": 1.4816310343584383e-05,
"loss": 0.6234,
"step": 10272
},
{
"epoch": 0.999902657451572,
"eval_reranking-dev_base_map": 0.6214825536231217,
"eval_reranking-dev_base_mrr@50": 0.7375349668670806,
"eval_reranking-dev_base_ndcg@50": 0.725527756915131,
"eval_reranking-dev_map": 0.6945674925725406,
"eval_reranking-dev_mrr@50": 0.7747076964185934,
"eval_reranking-dev_ndcg@50": 0.7913486180328326,
"eval_runtime": 210.3713,
"eval_samples_per_second": 0.0,
"eval_steps_per_second": 0.0,
"step": 10272
},
{
"epoch": 1.9998053149031443,
"grad_norm": 5.99316930770874,
"learning_rate": 7.4095972888199885e-06,
"loss": 0.3901,
"step": 20544
},
{
"epoch": 1.9998053149031443,
"eval_reranking-dev_base_map": 0.6214825536231217,
"eval_reranking-dev_base_mrr@50": 0.7375349668670806,
"eval_reranking-dev_base_ndcg@50": 0.725527756915131,
"eval_reranking-dev_map": 0.7153961592162474,
"eval_reranking-dev_mrr@50": 0.7867533806941779,
"eval_reranking-dev_ndcg@50": 0.8041280710955544,
"eval_runtime": 206.6571,
"eval_samples_per_second": 0.0,
"eval_steps_per_second": 0.0,
"step": 20544
},
{
"epoch": 2.999707972354716,
"grad_norm": 9.407133102416992,
"learning_rate": 2.8842340555936117e-09,
"loss": 0.2978,
"step": 30816
},
{
"epoch": 2.999707972354716,
"eval_reranking-dev_base_map": 0.6214825536231217,
"eval_reranking-dev_base_mrr@50": 0.7375349668670806,
"eval_reranking-dev_base_ndcg@50": 0.725527756915131,
"eval_reranking-dev_map": 0.7207063760806678,
"eval_reranking-dev_mrr@50": 0.7903183680827569,
"eval_reranking-dev_ndcg@50": 0.807234452615663,
"eval_runtime": 204.5125,
"eval_samples_per_second": 0.0,
"eval_steps_per_second": 0.0,
"step": 30816
}
],
"logging_steps": 10272,
"max_steps": 30819,
"num_input_tokens_seen": 0,
"num_train_epochs": 3,
"save_steps": 10272,
"stateful_callbacks": {
"EarlyStoppingCallback": {
"args": {
"early_stopping_patience": 3,
"early_stopping_threshold": 0.0
},
"attributes": {
"early_stopping_patience_counter": 0
}
},
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 0.0,
"train_batch_size": 128,
"trial_name": null,
"trial_params": null
}
|