guyhadad01 commited on
Commit
65888a3
·
verified ·
1 Parent(s): 721fc00

Training in progress, step 35400, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1221,6 +1221,10 @@ You can finetune this model on your own dataset.
1221
  | 0.6202 | 35100 | 0.2965 |
1222
  | 0.6211 | 35150 | 0.3557 |
1223
  | 0.6220 | 35200 | 0.3535 |
 
 
 
 
1224
 
1225
 
1226
  ### Framework Versions
 
1221
  | 0.6202 | 35100 | 0.2965 |
1222
  | 0.6211 | 35150 | 0.3557 |
1223
  | 0.6220 | 35200 | 0.3535 |
1224
+ | 0.6229 | 35250 | 0.4183 |
1225
+ | 0.6238 | 35300 | 0.3355 |
1226
+ | 0.6247 | 35350 | 0.3626 |
1227
+ | 0.6255 | 35400 | 0.2542 |
1228
 
1229
 
1230
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a73726096d96dbbbaa9a481dfff6e52b1ea1d694b55f2edc2f1405af8895110b
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:49e95dbcbd79f97ce1ba67a803455e357f6c9c9ea644273cb7511cae3c831b9d
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d8b3f57d97ffd57e518f40f15d12ad037a0066d481b15f01ac0c5cd7db8dcb47
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:29767797f5949aa103f2386e6b46cf5006f18f6853e49108146824052452a81a
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ca63325ac742a792a3bcdc1dc21baa9c1c96f6a59934e63bc8a87c6b8f66e093
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eea4a8e4afcda31bb844cc13d2627fa89d98644359cf49b2f2f2f5fdbb6dbb81
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6f6bf385710f1d1a6f64e5b03c0c6f98497de21222ff381a7961ac0b45b93ddc
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e8c2fca16cf2e15838c5424c974921bcfa3346a7bf4c2458c8ecc9892726ed4c
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f345579e836e5dec04f17da3b053acb614c611f3b7c11559a8cdc45e09194e58
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab93b747e0fc75060bb6e7ff7bdc607ad6b06fa8d1c145ad4ab8d80aeeb37b40
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.622007032920429,
6
  "eval_steps": 500,
7
- "global_step": 35200,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -4936,6 +4936,34 @@
4936
  "learning_rate": 2.1012742730360685e-05,
4937
  "loss": 0.3535,
4938
  "step": 35200
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
4939
  }
4940
  ],
4941
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.6255411637892951,
6
  "eval_steps": 500,
7
+ "global_step": 35400,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
4936
  "learning_rate": 2.1012742730360685e-05,
4937
  "loss": 0.3535,
4938
  "step": 35200
4939
+ },
4940
+ {
4941
+ "epoch": 0.6228905656376456,
4942
+ "grad_norm": 1.9256399869918823,
4943
+ "learning_rate": 2.0963656712022147e-05,
4944
+ "loss": 0.4183,
4945
+ "step": 35250
4946
+ },
4947
+ {
4948
+ "epoch": 0.6237740983548621,
4949
+ "grad_norm": 1.4346308708190918,
4950
+ "learning_rate": 2.0914570693683615e-05,
4951
+ "loss": 0.3355,
4952
+ "step": 35300
4953
+ },
4954
+ {
4955
+ "epoch": 0.6246576310720786,
4956
+ "grad_norm": 1.3797852993011475,
4957
+ "learning_rate": 2.0865484675345076e-05,
4958
+ "loss": 0.3626,
4959
+ "step": 35350
4960
+ },
4961
+ {
4962
+ "epoch": 0.6255411637892951,
4963
+ "grad_norm": 3.1976869106292725,
4964
+ "learning_rate": 2.0816398657006537e-05,
4965
+ "loss": 0.2542,
4966
+ "step": 35400
4967
  }
4968
  ],
4969
  "logging_steps": 50,