Mardiyyah commited on
Commit
8b9f1e0
·
verified ·
1 Parent(s): 9e7e6bf

add Variant-V1 LLRD model

Browse files
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a3a6c9229eed32130bb8b880265f8b886fb4347ef21ba3aacfe8a0e5e49924ce
3
  size 435599164
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bda9525a3cc937b80370a391c7c6adf07484c6dcc483be1f745d253eb7ad31f3
3
  size 435599164
optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d9f5b0a137201ea2b49806eb0bc8e2ac1a63abb4dfbe61a13677a91dba69378e
3
  size 871321658
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:76934c72aa799fa70772bd0518b6552ab16dd7af97db92f864db37f07a6517a9
3
  size 871321658
rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e246631174b7e7bbbd79eb8c88be058db2e397b961adf392640d441f0303d3b3
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:61e45edb800e9706baa914416a41d7442130659d6c2eedc62a95aae8c2ccdd31
3
  size 14244
scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7f2a475865a035e3e7c31a5baf48c564790f030bd32fece0a5357e648f353c3c
3
  size 1576
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:684908b1ddccacc6a619d447e4f01151ce041a7a97eb1004119dd3b2f1c3be72
3
  size 1576
trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 0.90625,
3
  "best_model_checkpoint": "/nfs/production/literature/amina-mardiyyah/new_data/OT-Entity-Extraction-Pipeline/model_outputs/hf/Variant_V2/reinit_llrd/4K_no_reinit_classifier_llrd0.9/BiomedNLP_BiomedBERT_base/checkpoint-1408",
4
- "epoch": 4.0,
5
  "eval_steps": 500,
6
- "global_step": 1408,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -83,6 +83,63 @@
83
  "eval_samples_per_second": 270.961,
84
  "eval_steps_per_second": 17.075,
85
  "step": 1408
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
86
  }
87
  ],
88
  "logging_steps": 500,
@@ -97,7 +154,7 @@
97
  "early_stopping_threshold": 0.0
98
  },
99
  "attributes": {
100
- "early_stopping_patience_counter": 0
101
  }
102
  },
103
  "TrainerControl": {
@@ -106,12 +163,12 @@
106
  "should_evaluate": false,
107
  "should_log": false,
108
  "should_save": true,
109
- "should_training_stop": false
110
  },
111
  "attributes": {}
112
  }
113
  },
114
- "total_flos": 460067113467108.0,
115
  "train_batch_size": 16,
116
  "trial_name": null,
117
  "trial_params": null
 
1
  {
2
  "best_metric": 0.90625,
3
  "best_model_checkpoint": "/nfs/production/literature/amina-mardiyyah/new_data/OT-Entity-Extraction-Pipeline/model_outputs/hf/Variant_V2/reinit_llrd/4K_no_reinit_classifier_llrd0.9/BiomedNLP_BiomedBERT_base/checkpoint-1408",
4
+ "epoch": 7.0,
5
  "eval_steps": 500,
6
+ "global_step": 2464,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
83
  "eval_samples_per_second": 270.961,
84
  "eval_steps_per_second": 17.075,
85
  "step": 1408
86
+ },
87
+ {
88
+ "epoch": 5.0,
89
+ "grad_norm": 0.021774714812636375,
90
+ "learning_rate": 1.667929292929293e-05,
91
+ "loss": 0.0016,
92
+ "step": 1760
93
+ },
94
+ {
95
+ "epoch": 5.0,
96
+ "eval_accuracy": 0.9981066222597349,
97
+ "eval_f1": 0.8957264957264958,
98
+ "eval_loss": 0.006704295519739389,
99
+ "eval_precision": 0.888135593220339,
100
+ "eval_recall": 0.903448275862069,
101
+ "eval_runtime": 4.4921,
102
+ "eval_samples_per_second": 268.47,
103
+ "eval_steps_per_second": 16.918,
104
+ "step": 1760
105
+ },
106
+ {
107
+ "epoch": 6.0,
108
+ "grad_norm": 0.004604855552315712,
109
+ "learning_rate": 1.5568181818181822e-05,
110
+ "loss": 0.001,
111
+ "step": 2112
112
+ },
113
+ {
114
+ "epoch": 6.0,
115
+ "eval_accuracy": 0.9982663047197573,
116
+ "eval_f1": 0.9031141868512111,
117
+ "eval_loss": 0.0071674492210149765,
118
+ "eval_precision": 0.90625,
119
+ "eval_recall": 0.9,
120
+ "eval_runtime": 4.7306,
121
+ "eval_samples_per_second": 254.936,
122
+ "eval_steps_per_second": 16.066,
123
+ "step": 2112
124
+ },
125
+ {
126
+ "epoch": 7.0,
127
+ "grad_norm": 0.013881128281354904,
128
+ "learning_rate": 1.4457070707070708e-05,
129
+ "loss": 0.0007,
130
+ "step": 2464
131
+ },
132
+ {
133
+ "epoch": 7.0,
134
+ "eval_accuracy": 0.9980838104797317,
135
+ "eval_f1": 0.9014084507042254,
136
+ "eval_loss": 0.00853455625474453,
137
+ "eval_precision": 0.920863309352518,
138
+ "eval_recall": 0.8827586206896552,
139
+ "eval_runtime": 4.4218,
140
+ "eval_samples_per_second": 272.737,
141
+ "eval_steps_per_second": 17.187,
142
+ "step": 2464
143
  }
144
  ],
145
  "logging_steps": 500,
 
154
  "early_stopping_threshold": 0.0
155
  },
156
  "attributes": {
157
+ "early_stopping_patience_counter": 3
158
  }
159
  },
160
  "TrainerControl": {
 
163
  "should_evaluate": false,
164
  "should_log": false,
165
  "should_save": true,
166
+ "should_training_stop": true
167
  },
168
  "attributes": {}
169
  }
170
  },
171
+ "total_flos": 805331029976316.0,
172
  "train_batch_size": 16,
173
  "trial_name": null,
174
  "trial_params": null
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:12b09da2fb5aa6cbf002b655c958b5c057a395831c815f26c553d07c8fd07caa
3
+ size 5624