Shresthadev403 committed on
Commit
3be35ec
·
verified ·
1 Parent(s): 75c8284

End of training

Browse files
README.md CHANGED
@@ -13,7 +13,7 @@ should probably proofread and complete it, then remove this comment. -->
13
 
14
  This model was trained from scratch on an unknown dataset.
15
  It achieves the following results on the evaluation set:
16
- - Loss: 2.0050
17
 
18
  ## Model description
19
 
 
13
 
14
  This model was trained from scratch on an unknown dataset.
15
  It achieves the following results on the evaluation set:
16
+ - Loss: 1.6688
17
 
18
  ## Model description
19
 
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e39b8df1cbb99fffe7efe5e8ace9235204c42cf176944966f84611a6e266e7d6
3
  size 535667604
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3259915083e1ecce9885b9cd06762ad8b35f83a24fabe145b16ba73ff609831c
3
  size 535667604
runs/Jan22_02-43-32_fbf1b033956c/events.out.tfevents.1705891414.fbf1b033956c.26.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:722c6890eb6f5d56b877a66688db33d3be7b63d17d0d8045a51a8731c0562d1a
3
- size 1717390
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:30aa48091683d8951d7db8abdbec6369d8757f148f5787495eceaea1d7f05438
3
+ size 1717818
trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 1.4617092609405518,
3
  "best_model_checkpoint": "ner-bert-ingredientstesting/checkpoint-9000",
4
- "epoch": 14.150555742674301,
5
  "eval_steps": 750,
6
- "global_step": 10500,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -212,6 +212,20 @@
212
  "eval_samples_per_second": 58.913,
213
  "eval_steps_per_second": 0.931,
214
  "step": 10500
 
 
 
 
 
 
 
 
 
 
 
 
 
 
215
  }
216
  ],
217
  "logging_steps": 750,
@@ -219,7 +233,7 @@
219
  "num_input_tokens_seen": 0,
220
  "num_train_epochs": 100,
221
  "save_steps": 750,
222
- "total_flos": 4.544406832645325e+17,
223
  "train_batch_size": 16,
224
  "trial_name": null,
225
  "trial_params": null
 
1
  {
2
  "best_metric": 1.4617092609405518,
3
  "best_model_checkpoint": "ner-bert-ingredientstesting/checkpoint-9000",
4
+ "epoch": 15.160996968676322,
5
  "eval_steps": 750,
6
+ "global_step": 11250,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
212
  "eval_samples_per_second": 58.913,
213
  "eval_steps_per_second": 0.931,
214
  "step": 10500
215
+ },
216
+ {
217
+ "epoch": 15.16,
218
+ "learning_rate": 4.898989218328841e-05,
219
+ "loss": 1.4983,
220
+ "step": 11250
221
+ },
222
+ {
223
+ "epoch": 15.16,
224
+ "eval_loss": 1.668813705444336,
225
+ "eval_runtime": 84.5947,
226
+ "eval_samples_per_second": 59.105,
227
+ "eval_steps_per_second": 0.934,
228
+ "step": 11250
229
  }
230
  ],
231
  "logging_steps": 750,
 
233
  "num_input_tokens_seen": 0,
234
  "num_train_epochs": 100,
235
  "save_steps": 750,
236
+ "total_flos": 4.8690053883961344e+17,
237
  "train_batch_size": 16,
238
  "trial_name": null,
239
  "trial_params": null