add Variant-V1 LLRD model
Browse files- model.safetensors +1 -1
- optimizer.pt +1 -1
- rng_state.pth +1 -1
- scheduler.pt +1 -1
- trainer_state.json +62 -5
- training_args.bin +3 -0
model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 435599164
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bda9525a3cc937b80370a391c7c6adf07484c6dcc483be1f745d253eb7ad31f3
|
| 3 |
size 435599164
|
optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 871321658
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:76934c72aa799fa70772bd0518b6552ab16dd7af97db92f864db37f07a6517a9
|
| 3 |
size 871321658
|
rng_state.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14244
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:61e45edb800e9706baa914416a41d7442130659d6c2eedc62a95aae8c2ccdd31
|
| 3 |
size 14244
|
scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1576
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:684908b1ddccacc6a619d447e4f01151ce041a7a97eb1004119dd3b2f1c3be72
|
| 3 |
size 1576
|
trainer_state.json
CHANGED
|
@@ -1,9 +1,9 @@
|
|
| 1 |
{
|
| 2 |
"best_metric": 0.90625,
|
| 3 |
"best_model_checkpoint": "/nfs/production/literature/amina-mardiyyah/new_data/OT-Entity-Extraction-Pipeline/model_outputs/hf/Variant_V2/reinit_llrd/4K_no_reinit_classifier_llrd0.9/BiomedNLP_BiomedBERT_base/checkpoint-1408",
|
| 4 |
-
"epoch":
|
| 5 |
"eval_steps": 500,
|
| 6 |
-
"global_step":
|
| 7 |
"is_hyper_param_search": false,
|
| 8 |
"is_local_process_zero": true,
|
| 9 |
"is_world_process_zero": true,
|
|
@@ -83,6 +83,63 @@
|
|
| 83 |
"eval_samples_per_second": 270.961,
|
| 84 |
"eval_steps_per_second": 17.075,
|
| 85 |
"step": 1408
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 86 |
}
|
| 87 |
],
|
| 88 |
"logging_steps": 500,
|
|
@@ -97,7 +154,7 @@
|
|
| 97 |
"early_stopping_threshold": 0.0
|
| 98 |
},
|
| 99 |
"attributes": {
|
| 100 |
-
"early_stopping_patience_counter":
|
| 101 |
}
|
| 102 |
},
|
| 103 |
"TrainerControl": {
|
|
@@ -106,12 +163,12 @@
|
|
| 106 |
"should_evaluate": false,
|
| 107 |
"should_log": false,
|
| 108 |
"should_save": true,
|
| 109 |
-
"should_training_stop":
|
| 110 |
},
|
| 111 |
"attributes": {}
|
| 112 |
}
|
| 113 |
},
|
| 114 |
-
"total_flos":
|
| 115 |
"train_batch_size": 16,
|
| 116 |
"trial_name": null,
|
| 117 |
"trial_params": null
|
|
|
|
| 1 |
{
|
| 2 |
"best_metric": 0.90625,
|
| 3 |
"best_model_checkpoint": "/nfs/production/literature/amina-mardiyyah/new_data/OT-Entity-Extraction-Pipeline/model_outputs/hf/Variant_V2/reinit_llrd/4K_no_reinit_classifier_llrd0.9/BiomedNLP_BiomedBERT_base/checkpoint-1408",
|
| 4 |
+
"epoch": 7.0,
|
| 5 |
"eval_steps": 500,
|
| 6 |
+
"global_step": 2464,
|
| 7 |
"is_hyper_param_search": false,
|
| 8 |
"is_local_process_zero": true,
|
| 9 |
"is_world_process_zero": true,
|
|
|
|
| 83 |
"eval_samples_per_second": 270.961,
|
| 84 |
"eval_steps_per_second": 17.075,
|
| 85 |
"step": 1408
|
| 86 |
+
},
|
| 87 |
+
{
|
| 88 |
+
"epoch": 5.0,
|
| 89 |
+
"grad_norm": 0.021774714812636375,
|
| 90 |
+
"learning_rate": 1.667929292929293e-05,
|
| 91 |
+
"loss": 0.0016,
|
| 92 |
+
"step": 1760
|
| 93 |
+
},
|
| 94 |
+
{
|
| 95 |
+
"epoch": 5.0,
|
| 96 |
+
"eval_accuracy": 0.9981066222597349,
|
| 97 |
+
"eval_f1": 0.8957264957264958,
|
| 98 |
+
"eval_loss": 0.006704295519739389,
|
| 99 |
+
"eval_precision": 0.888135593220339,
|
| 100 |
+
"eval_recall": 0.903448275862069,
|
| 101 |
+
"eval_runtime": 4.4921,
|
| 102 |
+
"eval_samples_per_second": 268.47,
|
| 103 |
+
"eval_steps_per_second": 16.918,
|
| 104 |
+
"step": 1760
|
| 105 |
+
},
|
| 106 |
+
{
|
| 107 |
+
"epoch": 6.0,
|
| 108 |
+
"grad_norm": 0.004604855552315712,
|
| 109 |
+
"learning_rate": 1.5568181818181822e-05,
|
| 110 |
+
"loss": 0.001,
|
| 111 |
+
"step": 2112
|
| 112 |
+
},
|
| 113 |
+
{
|
| 114 |
+
"epoch": 6.0,
|
| 115 |
+
"eval_accuracy": 0.9982663047197573,
|
| 116 |
+
"eval_f1": 0.9031141868512111,
|
| 117 |
+
"eval_loss": 0.0071674492210149765,
|
| 118 |
+
"eval_precision": 0.90625,
|
| 119 |
+
"eval_recall": 0.9,
|
| 120 |
+
"eval_runtime": 4.7306,
|
| 121 |
+
"eval_samples_per_second": 254.936,
|
| 122 |
+
"eval_steps_per_second": 16.066,
|
| 123 |
+
"step": 2112
|
| 124 |
+
},
|
| 125 |
+
{
|
| 126 |
+
"epoch": 7.0,
|
| 127 |
+
"grad_norm": 0.013881128281354904,
|
| 128 |
+
"learning_rate": 1.4457070707070708e-05,
|
| 129 |
+
"loss": 0.0007,
|
| 130 |
+
"step": 2464
|
| 131 |
+
},
|
| 132 |
+
{
|
| 133 |
+
"epoch": 7.0,
|
| 134 |
+
"eval_accuracy": 0.9980838104797317,
|
| 135 |
+
"eval_f1": 0.9014084507042254,
|
| 136 |
+
"eval_loss": 0.00853455625474453,
|
| 137 |
+
"eval_precision": 0.920863309352518,
|
| 138 |
+
"eval_recall": 0.8827586206896552,
|
| 139 |
+
"eval_runtime": 4.4218,
|
| 140 |
+
"eval_samples_per_second": 272.737,
|
| 141 |
+
"eval_steps_per_second": 17.187,
|
| 142 |
+
"step": 2464
|
| 143 |
}
|
| 144 |
],
|
| 145 |
"logging_steps": 500,
|
|
|
|
| 154 |
"early_stopping_threshold": 0.0
|
| 155 |
},
|
| 156 |
"attributes": {
|
| 157 |
+
"early_stopping_patience_counter": 3
|
| 158 |
}
|
| 159 |
},
|
| 160 |
"TrainerControl": {
|
|
|
|
| 163 |
"should_evaluate": false,
|
| 164 |
"should_log": false,
|
| 165 |
"should_save": true,
|
| 166 |
+
"should_training_stop": true
|
| 167 |
},
|
| 168 |
"attributes": {}
|
| 169 |
}
|
| 170 |
},
|
| 171 |
+
"total_flos": 805331029976316.0,
|
| 172 |
"train_batch_size": 16,
|
| 173 |
"trial_name": null,
|
| 174 |
"trial_params": null
|
training_args.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:12b09da2fb5aa6cbf002b655c958b5c057a395831c815f26c553d07c8fd07caa
|
| 3 |
+
size 5624
|