guyhadad01 committed on
Commit
aa2d9fe
·
verified ·
1 Parent(s): cdbc0ed

Training in progress, step 19000, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1403,6 +1403,10 @@ You can finetune this model on your own dataset.
1403
  | 0.3304 | 18700 | 0.3543 |
1404
  | 0.3313 | 18750 | 0.3642 |
1405
  | 0.3322 | 18800 | 0.3415 |
 
 
 
 
1406
 
1407
  </details>
1408
 
 
1403
  | 0.3304 | 18700 | 0.3543 |
1404
  | 0.3313 | 18750 | 0.3642 |
1405
  | 0.3322 | 18800 | 0.3415 |
1406
+ | 0.3331 | 18850 | 0.3069 |
1407
+ | 0.3340 | 18900 | 0.2962 |
1408
+ | 0.3349 | 18950 | 0.3156 |
1409
+ | 0.3357 | 19000 | 0.3791 |
1410
 
1411
  </details>
1412
 
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d6283a957a66c184eb3662df7aa262cd154fb1dcee802f75857776d94240bc13
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:123a3c7e068975f2d73a559688da89498d96c9f5f3906b2f60a8f55923c134f5
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:78292edbaee380ac230c50b2f8b68c5dd37e7df2ddfa15b2c43a017c23edfbeb
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e186b88037a18eebc7b613039df85cfc79c02be57538ce16444dea0485fdf79
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:83eb2f002d2d9da0dc4755fcda636e68d5b4a41e8c2e5a2b8c82d014a65d58ff
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:03af62e0682690ebbb7904f13bcb54bda8192bd3193a8746111a4da158c48b8c
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9c934cf056ab14aad09651705c56e19636a65538c7a4a6a0401dc0dfa92a2b37
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:10840146a6e19998f1fdbf028a41f37469dd8a3b8988531196e63b1251245096
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c0b05eb17181bcecd1e03b83742ebacffcd8b0f6bb6d68e2982a23c3f445018e
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:23958946bfe31c250bee11672fccb9ed52902b5ac707ac8090942157c16267c1
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.332208301673411,
6
  "eval_steps": 500,
7
- "global_step": 18800,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -2640,6 +2640,34 @@
2640
  "learning_rate": 3.710510298246648e-05,
2641
  "loss": 0.3415,
2642
  "step": 18800
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2643
  }
2644
  ],
2645
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.33574243254227704,
6
  "eval_steps": 500,
7
+ "global_step": 19000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
2640
  "learning_rate": 3.710510298246648e-05,
2641
  "loss": 0.3415,
2642
  "step": 18800
2643
+ },
2644
+ {
2645
+ "epoch": 0.3330918343906275,
2646
+ "grad_norm": 1.4388914108276367,
2647
+ "learning_rate": 3.7056016964127937e-05,
2648
+ "loss": 0.3069,
2649
+ "step": 18850
2650
+ },
2651
+ {
2652
+ "epoch": 0.333975367107844,
2653
+ "grad_norm": 1.5527664422988892,
2654
+ "learning_rate": 3.70069309457894e-05,
2655
+ "loss": 0.2962,
2656
+ "step": 18900
2657
+ },
2658
+ {
2659
+ "epoch": 0.3348588998250605,
2660
+ "grad_norm": 1.6680736541748047,
2661
+ "learning_rate": 3.6957844927450866e-05,
2662
+ "loss": 0.3156,
2663
+ "step": 18950
2664
+ },
2665
+ {
2666
+ "epoch": 0.33574243254227704,
2667
+ "grad_norm": 2.266108274459839,
2668
+ "learning_rate": 3.69097406294791e-05,
2669
+ "loss": 0.3791,
2670
+ "step": 19000
2671
  }
2672
  ],
2673
  "logging_steps": 50,