guyhadad01 commited on
Commit
ea366dd
·
verified ·
1 Parent(s): fdb8f13

Training in progress, step 20400, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1431,6 +1431,10 @@ You can finetune this model on your own dataset.
1431
  | 0.3552 | 20100 | 0.3256 |
1432
  | 0.3561 | 20150 | 0.3179 |
1433
  | 0.3569 | 20200 | 0.4226 |
 
 
 
 
1434
 
1435
  </details>
1436
 
 
1431
  | 0.3552 | 20100 | 0.3256 |
1432
  | 0.3561 | 20150 | 0.3179 |
1433
  | 0.3569 | 20200 | 0.4226 |
1434
+ | 0.3578 | 20250 | 0.4196 |
1435
+ | 0.3587 | 20300 | 0.3618 |
1436
+ | 0.3596 | 20350 | 0.4093 |
1437
+ | 0.3605 | 20400 | 0.3051 |
1438
 
1439
  </details>
1440
 
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0ef29b19104cdd2fee93b8217bc742ea19781fda755240150a391d0a52137790
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0e24285b7fee77e14610cf519cac1441a781f70c15e6815c8a668c74a1781441
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b84ead54747767096d47dd620e6c1d4484392809c929ebd262e713e54fdf126a
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e1038bc1f6238eff236fd9c4b9cc4d1b074566fa9976e684c92c8e7bc2cf6ef1
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:67d7c2b4ab7e82df68b4a7c174bebe88de85db56b4421a6d44a9a14dfc374b05
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2529eb4186b974d86a3033c917ecbb272c298c66ef6254d4ce1dc8e6139bb050
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:75cb2a5d4e61624cc82e548180286aa5f7b7073a2bd43f3a7494227c84590e41
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6ade052dc4070f716b1bebceb9d5e60fb9f374ab26eb8ae1c89ae4e4e0acc23c
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a28e3c14c246edc1f658e8b3ed3e4804f86c97afddb1e9e8b6cfd065ec104723
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:884f056648270af6936f71ef50e4c4799a892dfb36fffd709576ecbe5d41efd5
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.3569472177554735,
6
  "eval_steps": 500,
7
- "global_step": 20200,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -2836,6 +2836,34 @@
2836
  "learning_rate": 3.5731676189354225e-05,
2837
  "loss": 0.4226,
2838
  "step": 20200
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2839
  }
2840
  ],
2841
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.36048134862433956,
6
  "eval_steps": 500,
7
+ "global_step": 20400,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
2836
  "learning_rate": 3.5731676189354225e-05,
2837
  "loss": 0.4226,
2838
  "step": 20200
2839
+ },
2840
+ {
2841
+ "epoch": 0.35783075047269003,
2842
+ "grad_norm": 1.3192092180252075,
2843
+ "learning_rate": 3.568259017101569e-05,
2844
+ "loss": 0.4196,
2845
+ "step": 20250
2846
+ },
2847
+ {
2848
+ "epoch": 0.3587142831899065,
2849
+ "grad_norm": 1.421736717224121,
2850
+ "learning_rate": 3.5633504152677155e-05,
2851
+ "loss": 0.3618,
2852
+ "step": 20300
2853
+ },
2854
+ {
2855
+ "epoch": 0.35959781590712303,
2856
+ "grad_norm": 2.0631330013275146,
2857
+ "learning_rate": 3.558441813433861e-05,
2858
+ "loss": 0.4093,
2859
+ "step": 20350
2860
+ },
2861
+ {
2862
+ "epoch": 0.36048134862433956,
2863
+ "grad_norm": 1.6250920295715332,
2864
+ "learning_rate": 3.5535332116000084e-05,
2865
+ "loss": 0.3051,
2866
+ "step": 20400
2867
  }
2868
  ],
2869
  "logging_steps": 50,