guyhadad01 commited on
Commit
548527c
·
verified ·
1 Parent(s): 0c593ac

Training in progress, step 35600, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1225,6 +1225,10 @@ You can finetune this model on your own dataset.
1225
  | 0.6238 | 35300 | 0.3355 |
1226
  | 0.6247 | 35350 | 0.3626 |
1227
  | 0.6255 | 35400 | 0.2542 |
 
 
 
 
1228
 
1229
 
1230
  ### Framework Versions
 
1225
  | 0.6238 | 35300 | 0.3355 |
1226
  | 0.6247 | 35350 | 0.3626 |
1227
  | 0.6255 | 35400 | 0.2542 |
1228
+ | 0.6264 | 35450 | 0.2555 |
1229
+ | 0.6273 | 35500 | 0.3418 |
1230
+ | 0.6282 | 35550 | 0.3118 |
1231
+ | 0.6291 | 35600 | 0.2889 |
1232
 
1233
 
1234
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:49e95dbcbd79f97ce1ba67a803455e357f6c9c9ea644273cb7511cae3c831b9d
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:20174b6b2c2d93226ddeb321dbabd4bc1c8af76305e7d7148c8cc355e3d7cd60
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:29767797f5949aa103f2386e6b46cf5006f18f6853e49108146824052452a81a
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c5a9d9a1fa3ca8642b4bdf418f1c296a72f8625176479edd5bcdc2533d1bdf26
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:eea4a8e4afcda31bb844cc13d2627fa89d98644359cf49b2f2f2f5fdbb6dbb81
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f3288273f695a1df0217fae4938baee576d7a5a6d2a38836aee6bceb6a8de02
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e8c2fca16cf2e15838c5424c974921bcfa3346a7bf4c2458c8ecc9892726ed4c
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8450c711e1de0810b6e36b835decaee09acd21b4ab25d2432aa749fd8de4d2d4
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ab93b747e0fc75060bb6e7ff7bdc607ad6b06fa8d1c145ad4ab8d80aeeb37b40
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:41e3f9784f622226c37c073ce2a64e597153fe7fa7c42f2778e8d0d5f771e26e
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.6255411637892951,
6
  "eval_steps": 500,
7
- "global_step": 35400,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -4964,6 +4964,34 @@
4964
  "learning_rate": 2.0816398657006537e-05,
4965
  "loss": 0.2542,
4966
  "step": 35400
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
4967
  }
4968
  ],
4969
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.6290752946581611,
6
  "eval_steps": 500,
7
+ "global_step": 35600,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
4964
  "learning_rate": 2.0816398657006537e-05,
4965
  "loss": 0.2542,
4966
  "step": 35400
4967
+ },
4968
+ {
4969
+ "epoch": 0.6264246965065117,
4970
+ "grad_norm": 1.4315252304077148,
4971
+ "learning_rate": 2.0767312638668002e-05,
4972
+ "loss": 0.2555,
4973
+ "step": 35450
4974
+ },
4975
+ {
4976
+ "epoch": 0.6273082292237282,
4977
+ "grad_norm": 2.861154079437256,
4978
+ "learning_rate": 2.0718226620329467e-05,
4979
+ "loss": 0.3418,
4980
+ "step": 35500
4981
+ },
4982
+ {
4983
+ "epoch": 0.6281917619409447,
4984
+ "grad_norm": 1.378416895866394,
4985
+ "learning_rate": 2.066914060199093e-05,
4986
+ "loss": 0.3118,
4987
+ "step": 35550
4988
+ },
4989
+ {
4990
+ "epoch": 0.6290752946581611,
4991
+ "grad_norm": 4.129642486572266,
4992
+ "learning_rate": 2.0620054583652393e-05,
4993
+ "loss": 0.2889,
4994
+ "step": 35600
4995
  }
4996
  ],
4997
  "logging_steps": 50,