maud-dr committed on
Commit
89c2ae0
·
verified ·
1 Parent(s): 22d115b

Training in progress, epoch 2

Browse files
Files changed (31) hide show
  1. README.md +26 -27
  2. model.safetensors +1 -1
  3. runs/Jun04_17-49-28_model2-stage2-0-0/events.out.tfevents.1749062030.model2-stage2-0-0.1.5 +3 -0
  4. runs/Jun04_21-00-28_model2-stage2-fp16false-0-0/events.out.tfevents.1749070840.model2-stage2-fp16false-0-0.1.0 +3 -0
  5. runs/Jun04_21-00-29_model2-stage2-nodatacoll-0-0/events.out.tfevents.1749070838.model2-stage2-nodatacoll-0-0.1.0 +3 -0
  6. runs/Jun04_21-01-22_model2-stage2-nodatacoll-0-1/events.out.tfevents.1749070904.model2-stage2-nodatacoll-0-1.1.0 +3 -0
  7. runs/Jun04_21-01-25_model2-stage2-fp16false-0-1/events.out.tfevents.1749070895.model2-stage2-fp16false-0-1.1.0 +3 -0
  8. runs/Jun04_21-02-15_model2-stage2-nodatacoll-0-2/events.out.tfevents.1749070944.model2-stage2-nodatacoll-0-2.1.0 +3 -0
  9. runs/Jun04_21-02-22_model2-stage2-fp16false-0-2/events.out.tfevents.1749070954.model2-stage2-fp16false-0-2.1.0 +3 -0
  10. runs/Jun04_21-03-05_model2-stage2-nodatacoll-0-3/events.out.tfevents.1749070996.model2-stage2-nodatacoll-0-3.1.0 +3 -0
  11. runs/Jun04_21-03-12_model2-stage2-fp16false-0-3/events.out.tfevents.1749071001.model2-stage2-fp16false-0-3.1.0 +3 -0
  12. runs/Jun04_21-04-02_model2-stage2-fp16false-0-4/events.out.tfevents.1749071048.model2-stage2-fp16false-0-4.1.0 +3 -0
  13. runs/Jun04_21-04-06_model2-stage2-nodatacoll-0-4/events.out.tfevents.1749071053.model2-stage2-nodatacoll-0-4.1.0 +3 -0
  14. runs/Jun04_21-04-41_model2-stage2-fp16false-0-5/events.out.tfevents.1749071090.model2-stage2-fp16false-0-5.1.0 +3 -0
  15. runs/Jun04_21-04-42_model2-stage2-nodatacoll-0-5/events.out.tfevents.1749071090.model2-stage2-nodatacoll-0-5.1.0 +3 -0
  16. runs/Jun04_21-05-25_model2-stage2-fp16false-0-6/events.out.tfevents.1749071134.model2-stage2-fp16false-0-6.1.0 +3 -0
  17. runs/Jun04_21-05-27_model2-stage2-nodatacoll-0-6/events.out.tfevents.1749071133.model2-stage2-nodatacoll-0-6.1.0 +3 -0
  18. runs/Jun04_21-10-04_model2-stage2-fp16false-0-0/events.out.tfevents.1749071411.model2-stage2-fp16false-0-0.1.0 +3 -0
  19. runs/Jun04_21-11-30_model2-stage2-fp16false-0-1/events.out.tfevents.1749071495.model2-stage2-fp16false-0-1.1.0 +3 -0
  20. runs/Jun04_21-12-37_model2-stage2-fp16false-0-2/events.out.tfevents.1749071563.model2-stage2-fp16false-0-2.1.0 +3 -0
  21. runs/Jun04_21-13-47_model2-stage2-fp16false-0-3/events.out.tfevents.1749071633.model2-stage2-fp16false-0-3.1.0 +3 -0
  22. runs/Jun04_21-14-50_model2-stage2-fp16false-0-4/events.out.tfevents.1749071696.model2-stage2-fp16false-0-4.1.0 +3 -0
  23. runs/Jun04_21-15-59_model2-stage2-fp16false-0-5/events.out.tfevents.1749071765.model2-stage2-fp16false-0-5.1.0 +3 -0
  24. runs/Jun04_21-17-03_model2-stage2-fp16false-0-6/events.out.tfevents.1749071829.model2-stage2-fp16false-0-6.1.0 +3 -0
  25. runs/Jun04_21-23-12_model2-stage2-0-0/events.out.tfevents.1749072198.model2-stage2-0-0.1.0 +3 -0
  26. runs/Jun04_21-23-12_model2-stage2-0-0/events.out.tfevents.1749073272.model2-stage2-0-0.1.1 +3 -0
  27. runs/Jun04_21-41-12_model2-stage2-0-0/events.out.tfevents.1749073273.model2-stage2-0-0.1.2 +3 -0
  28. runs/Jun04_21-41-12_model2-stage2-0-0/events.out.tfevents.1749074373.model2-stage2-0-0.1.3 +3 -0
  29. runs/Jun04_21-59-33_model2-stage2-0-0/events.out.tfevents.1749074374.model2-stage2-0-0.1.4 +3 -0
  30. tokenizer.json +1 -8
  31. training_args.bin +1 -1
README.md CHANGED
@@ -9,21 +9,21 @@ metrics:
9
  - recall
10
  - f1
11
  model-index:
12
- - name: model_2_stage2-seed_2025
13
  results: []
14
  ---
15
 
16
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
17
  should probably proofread and complete it, then remove this comment. -->
18
 
19
- # model_2_stage2-seed_2025
20
 
21
  This model is a fine-tuned version of [maud-dr/model_2_stage1](https://huggingface.co/maud-dr/model_2_stage1) on the None dataset.
22
  It achieves the following results on the evaluation set:
23
- - Loss: nan
24
- - Precision: 0.0
25
- - Recall: 0.0
26
- - F1: 0.0
27
 
28
  ## Model description
29
 
@@ -43,33 +43,32 @@ More information needed
43
 
44
  The following hyperparameters were used during training:
45
  - learning_rate: 0.0003
46
- - train_batch_size: 16
47
- - eval_batch_size: 16
48
- - seed: 2025
49
  - optimizer: Use OptimizerNames.ADAMW_TORCH with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments
50
  - lr_scheduler_type: linear
51
  - num_epochs: 15
52
- - mixed_precision_training: Native AMP
53
 
54
  ### Training results
55
 
56
- | Training Loss | Epoch | Step | Validation Loss | Precision | Recall | F1 |
57
- |:-------------:|:-----:|:----:|:---------------:|:---------:|:------:|:---:|
58
- | 0.0 | 1.0 | 224 | nan | 0.0 | 0.0 | 0.0 |
59
- | 0.0 | 2.0 | 448 | nan | 0.0 | 0.0 | 0.0 |
60
- | 0.0 | 3.0 | 672 | nan | 0.0 | 0.0 | 0.0 |
61
- | 0.0 | 4.0 | 896 | nan | 0.0 | 0.0 | 0.0 |
62
- | 0.0 | 5.0 | 1120 | nan | 0.0 | 0.0 | 0.0 |
63
- | 0.0 | 6.0 | 1344 | nan | 0.0 | 0.0 | 0.0 |
64
- | 0.0 | 7.0 | 1568 | nan | 0.0 | 0.0 | 0.0 |
65
- | 0.0 | 8.0 | 1792 | nan | 0.0 | 0.0 | 0.0 |
66
- | 0.0 | 9.0 | 2016 | nan | 0.0 | 0.0 | 0.0 |
67
- | 0.0 | 10.0 | 2240 | nan | 0.0 | 0.0 | 0.0 |
68
- | 0.0 | 11.0 | 2464 | nan | 0.0 | 0.0 | 0.0 |
69
- | 0.0 | 12.0 | 2688 | nan | 0.0 | 0.0 | 0.0 |
70
- | 0.0 | 13.0 | 2912 | nan | 0.0 | 0.0 | 0.0 |
71
- | 0.0 | 14.0 | 3136 | nan | 0.0 | 0.0 | 0.0 |
72
- | 0.0 | 15.0 | 3360 | nan | 0.0 | 0.0 | 0.0 |
73
 
74
 
75
  ### Framework versions
 
9
  - recall
10
  - f1
11
  model-index:
12
+ - name: model_2_stage2-seed_123
13
  results: []
14
  ---
15
 
16
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
17
  should probably proofread and complete it, then remove this comment. -->
18
 
19
+ # model_2_stage2-seed_123
20
 
21
  This model is a fine-tuned version of [maud-dr/model_2_stage1](https://huggingface.co/maud-dr/model_2_stage1) on the None dataset.
22
  It achieves the following results on the evaluation set:
23
+ - Loss: 2.7954
24
+ - Precision: 0.6352
25
+ - Recall: 0.7319
26
+ - F1: 0.6801
27
 
28
  ## Model description
29
 
 
43
 
44
  The following hyperparameters were used during training:
45
  - learning_rate: 0.0003
46
+ - train_batch_size: 8
47
+ - eval_batch_size: 8
48
+ - seed: 123
49
  - optimizer: Use OptimizerNames.ADAMW_TORCH with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments
50
  - lr_scheduler_type: linear
51
  - num_epochs: 15
 
52
 
53
  ### Training results
54
 
55
+ | Training Loss | Epoch | Step | Validation Loss | Precision | Recall | F1 |
56
+ |:-------------:|:-----:|:----:|:---------------:|:---------:|:------:|:------:|
57
+ | 0.5075 | 1.0 | 447 | 0.6591 | 0.6296 | 0.6159 | 0.6227 |
58
+ | 0.4241 | 2.0 | 894 | 0.8133 | 0.6012 | 0.7536 | 0.6688 |
59
+ | 0.3651 | 3.0 | 1341 | 0.8972 | 0.6092 | 0.7174 | 0.6589 |
60
+ | 0.3389 | 4.0 | 1788 | 1.3235 | 0.6040 | 0.7572 | 0.6720 |
61
+ | 0.2572 | 5.0 | 2235 | 1.2850 | 0.6378 | 0.7464 | 0.6878 |
62
+ | 0.187 | 6.0 | 2682 | 1.4055 | 0.6114 | 0.7754 | 0.6837 |
63
+ | 0.1456 | 7.0 | 3129 | 1.8037 | 0.6464 | 0.6558 | 0.6511 |
64
+ | 0.1386 | 8.0 | 3576 | 1.8962 | 0.6181 | 0.6920 | 0.6530 |
65
+ | 0.1003 | 9.0 | 4023 | 2.1076 | 0.6198 | 0.7029 | 0.6587 |
66
+ | 0.0738 | 10.0 | 4470 | 2.4260 | 0.6463 | 0.7283 | 0.6848 |
67
+ | 0.0233 | 11.0 | 4917 | 2.5047 | 0.6242 | 0.7464 | 0.6799 |
68
+ | 0.0677 | 12.0 | 5364 | 2.6329 | 0.6238 | 0.7029 | 0.6610 |
69
+ | 0.0249 | 13.0 | 5811 | 2.5839 | 0.6429 | 0.7174 | 0.6781 |
70
+ | 0.0249 | 14.0 | 6258 | 2.7944 | 0.6347 | 0.7428 | 0.6845 |
71
+ | 0.0228 | 15.0 | 6705 | 2.7954 | 0.6352 | 0.7319 | 0.6801 |
72
 
73
 
74
  ### Framework versions
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1062a16fe2cbe9aff50a5c3072cbcac932ee35863abf00b3b6d4475b456c95b8
3
  size 894020048
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f6c3bfb8557df05943c5669a1f090cbf29241943ce87740eba484c468e6304be
3
  size 894020048
runs/Jun04_17-49-28_model2-stage2-0-0/events.out.tfevents.1749062030.model2-stage2-0-0.1.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fbaa8ea85802071c5719509ec847e72bf548c41390e388010b2d3cf059159d8e
3
+ size 508
runs/Jun04_21-00-28_model2-stage2-fp16false-0-0/events.out.tfevents.1749070840.model2-stage2-fp16false-0-0.1.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:98b0353e25e732c082987569e97567dc7a25d048cbf13e3a010e6e3361113477
3
+ size 5973
runs/Jun04_21-00-29_model2-stage2-nodatacoll-0-0/events.out.tfevents.1749070838.model2-stage2-nodatacoll-0-0.1.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f24708491ce1edfc1f9406bd06f73d6e1c80c4e933912afddcb505bf5e3a509a
3
+ size 5972
runs/Jun04_21-01-22_model2-stage2-nodatacoll-0-1/events.out.tfevents.1749070904.model2-stage2-nodatacoll-0-1.1.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0be9df85bcbb92f6d337e4808c9f62d0b79bc5771b951b406b311ff6b9eb63bc
3
+ size 5972
runs/Jun04_21-01-25_model2-stage2-fp16false-0-1/events.out.tfevents.1749070895.model2-stage2-fp16false-0-1.1.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e57588a83135238838fb65e2435f96b03e2bec46d17b385263269aee988495fc
3
+ size 5973
runs/Jun04_21-02-15_model2-stage2-nodatacoll-0-2/events.out.tfevents.1749070944.model2-stage2-nodatacoll-0-2.1.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:737ebc31862bb2a74d7f86152e765c5d8ce374ca87f0d371c22a8fa5c7392b2b
3
+ size 5972
runs/Jun04_21-02-22_model2-stage2-fp16false-0-2/events.out.tfevents.1749070954.model2-stage2-fp16false-0-2.1.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bb3a0a5bf350b3f6e207f91a17b51a397ae900e4586b36b88eb4d82831f419f3
3
+ size 5973
runs/Jun04_21-03-05_model2-stage2-nodatacoll-0-3/events.out.tfevents.1749070996.model2-stage2-nodatacoll-0-3.1.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f3accf094b8645ddb8169487bc6b526ae46c002dafe5b79b42fc8522ab79ab80
3
+ size 5972
runs/Jun04_21-03-12_model2-stage2-fp16false-0-3/events.out.tfevents.1749071001.model2-stage2-fp16false-0-3.1.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:095fb9a877045e89ab00f8f49fa8c7e3d670036316b1564c185b6612149936f6
3
+ size 5973
runs/Jun04_21-04-02_model2-stage2-fp16false-0-4/events.out.tfevents.1749071048.model2-stage2-fp16false-0-4.1.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4643a4df47766da6eb37da61a857048edf9997fe8abe536fffec9a74271ea833
3
+ size 5973
runs/Jun04_21-04-06_model2-stage2-nodatacoll-0-4/events.out.tfevents.1749071053.model2-stage2-nodatacoll-0-4.1.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b24f478968affa1151e36ad8aa837c1d57f69e670a9c256df1071e45a120b77
3
+ size 5972
runs/Jun04_21-04-41_model2-stage2-fp16false-0-5/events.out.tfevents.1749071090.model2-stage2-fp16false-0-5.1.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6310a2fff9b98fcb4d7724b5f4d6c582c58d27da6b57bc1edb7916a12307ec8f
3
+ size 5973
runs/Jun04_21-04-42_model2-stage2-nodatacoll-0-5/events.out.tfevents.1749071090.model2-stage2-nodatacoll-0-5.1.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:342bd157d428ac065fe2cd4c7b3cfbbc6b274d970fd1c656f447e135a12bf03e
3
+ size 5972
runs/Jun04_21-05-25_model2-stage2-fp16false-0-6/events.out.tfevents.1749071134.model2-stage2-fp16false-0-6.1.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8192dfb0ff20f971a21a96a9180408bb0e959827f76081201963d837b96fb25d
3
+ size 5973
runs/Jun04_21-05-27_model2-stage2-nodatacoll-0-6/events.out.tfevents.1749071133.model2-stage2-nodatacoll-0-6.1.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:633707f96ffe820c1a5fed3635f3c10a97d5efc6f6d7a836e450309d4d4b1de3
3
+ size 5972
runs/Jun04_21-10-04_model2-stage2-fp16false-0-0/events.out.tfevents.1749071411.model2-stage2-fp16false-0-0.1.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:656aaf05a97b91ae82ab6698c48462e806264720992a583021b1b2910fa86ce2
3
+ size 6180
runs/Jun04_21-11-30_model2-stage2-fp16false-0-1/events.out.tfevents.1749071495.model2-stage2-fp16false-0-1.1.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b5ab8693d470a1355c1aa07849763b2079445896bc81b1e34e039104989cb5f6
3
+ size 6180
runs/Jun04_21-12-37_model2-stage2-fp16false-0-2/events.out.tfevents.1749071563.model2-stage2-fp16false-0-2.1.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cba41d3db3dd9dc93965dbeb8b801dce013ded11609760b6f2e1b8961aeaf1b7
3
+ size 6180
runs/Jun04_21-13-47_model2-stage2-fp16false-0-3/events.out.tfevents.1749071633.model2-stage2-fp16false-0-3.1.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c6df69f5d9ec609b805f87cf0ffb4be3bf7429d6cd81d4e8a7e582e8cf46bb41
3
+ size 6180
runs/Jun04_21-14-50_model2-stage2-fp16false-0-4/events.out.tfevents.1749071696.model2-stage2-fp16false-0-4.1.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6da26e2a2e28784ac0eb3b42ccee0330caa9de22ad1caad160b38b55f51652a
3
+ size 6180
runs/Jun04_21-15-59_model2-stage2-fp16false-0-5/events.out.tfevents.1749071765.model2-stage2-fp16false-0-5.1.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cc3d1e28e09b37684981f9b7ca6ac834c837d0ad25e16cdbde4d0af8d14a8430
3
+ size 6180
runs/Jun04_21-17-03_model2-stage2-fp16false-0-6/events.out.tfevents.1749071829.model2-stage2-fp16false-0-6.1.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b38bf799333154b848500b7f0b0c525f3b99e539e5295e8ac016cfe8d4f2b10f
3
+ size 6180
runs/Jun04_21-23-12_model2-stage2-0-0/events.out.tfevents.1749072198.model2-stage2-0-0.1.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ec6abe672ba0229f7f4fe4b32d67ea861960550d38602598c66ce67d71c0baa
3
+ size 26749
runs/Jun04_21-23-12_model2-stage2-0-0/events.out.tfevents.1749073272.model2-stage2-0-0.1.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:706247a4f909e8fdc8ef473c313a2afbcc3c1cbaa9e6d353044c5743055b772b
3
+ size 508
runs/Jun04_21-41-12_model2-stage2-0-0/events.out.tfevents.1749073273.model2-stage2-0-0.1.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bb920c1ee41f51991de55e358dec512a5b77419a32ac8b5a82a3cc6eece60118
3
+ size 26801
runs/Jun04_21-41-12_model2-stage2-0-0/events.out.tfevents.1749074373.model2-stage2-0-0.1.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b1645d1dec58e626f385881b235658b92eb26c3208476f1a8c1409e3f3e0c13
3
+ size 508
runs/Jun04_21-59-33_model2-stage2-0-0/events.out.tfevents.1749074374.model2-stage2-0-0.1.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:94449b52c2a49e5eb17b703b6b323e67a0e6fc9298e03360e7e57ab74d8b34fb
3
+ size 8751
tokenizer.json CHANGED
@@ -6,14 +6,7 @@
6
  "strategy": "LongestFirst",
7
  "stride": 0
8
  },
9
- "padding": {
10
- "strategy": "BatchLongest",
11
- "direction": "Right",
12
- "pad_to_multiple_of": null,
13
- "pad_id": 0,
14
- "pad_type_id": 0,
15
- "pad_token": "<pad>"
16
- },
17
  "added_tokens": [
18
  {
19
  "id": 0,
 
6
  "strategy": "LongestFirst",
7
  "stride": 0
8
  },
9
+ "padding": null,
 
 
 
 
 
 
 
10
  "added_tokens": [
11
  {
12
  "id": 0,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:61ce72ac9ce48c40a13d30c7d1f448250050d69bbe3ea8f136dfd9b99dc043a5
3
  size 5905
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:517d19fac2626c020246c94b3b12d9a16f4374ecb9589ee04ddc2c959d55c5d5
3
  size 5905