guyhadad01 commited on
Commit
5838c63
·
verified ·
1 Parent(s): e5cf7b4

Training in progress, step 28400, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1225,6 +1225,10 @@ You can finetune this model on your own dataset.
1225
  | 0.4965 | 28100 | 0.3604 |
1226
  | 0.4974 | 28150 | 0.2612 |
1227
  | 0.4983 | 28200 | 0.3593 |
 
 
 
 
1228
 
1229
 
1230
  ### Framework Versions
 
1225
  | 0.4965 | 28100 | 0.3604 |
1226
  | 0.4974 | 28150 | 0.2612 |
1227
  | 0.4983 | 28200 | 0.3593 |
1228
+ | 0.4992 | 28250 | 0.2961 |
1229
+ | 0.5001 | 28300 | 0.3338 |
1230
+ | 0.5010 | 28350 | 0.3109 |
1231
+ | 0.5018 | 28400 | 0.3234 |
1232
 
1233
 
1234
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:aa1965a5554a69ff8c5d7634a28c5f04a03c69dd137851c93b70cebbac2f7e99
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:63181bf09a1c611c492c8b6ad279006fb56b9805969d0edba71cff3ee723a234
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:22731b099d557e9c813459e9016c90f95f238923990688ebd670d8401d82293f
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d1746c035958eb9e0a972414e56f8fa4733c0402b003adb0be00e93e8ce71e93
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d49299668d565a8fbf28b1ad8ad6ea4712f5b9b7d3472cc8d598ff75082532ee
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:febec73de51eb7db9177092196a53a5124fb83edff44db6d3e9496c1ee972476
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2a77e32486116fb80a72650dd1d3f8b1c3fcfe6b44b779b1f8fb0e11f75bb318
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f5147f98e53184b8dd37c8115204cda76018272755476678192eccb1efdd5d07
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:be316569338339522180d5bdc62cd0944e9a3d23a5127275cdd38048e9eeda36
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:953c76ee5b14f1426684c90829d80bb305b640c5a3e12732ffb64cce4b8f5126
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.49831245251011647,
6
  "eval_steps": 500,
7
- "global_step": 28200,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -3956,6 +3956,34 @@
3956
  "learning_rate": 2.7881840136655475e-05,
3957
  "loss": 0.3593,
3958
  "step": 28200
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3959
  }
3960
  ],
3961
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.5018465833789825,
6
  "eval_steps": 500,
7
+ "global_step": 28400,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
3956
  "learning_rate": 2.7881840136655475e-05,
3957
  "loss": 0.3593,
3958
  "step": 28200
3959
+ },
3960
+ {
3961
+ "epoch": 0.499195985227333,
3962
+ "grad_norm": 1.1693766117095947,
3963
+ "learning_rate": 2.783275411831694e-05,
3964
+ "loss": 0.2961,
3965
+ "step": 28250
3966
+ },
3967
+ {
3968
+ "epoch": 0.5000795179445495,
3969
+ "grad_norm": 1.65450918674469,
3970
+ "learning_rate": 2.7783668099978404e-05,
3971
+ "loss": 0.3338,
3972
+ "step": 28300
3973
+ },
3974
+ {
3975
+ "epoch": 0.500963050661766,
3976
+ "grad_norm": 1.438693642616272,
3977
+ "learning_rate": 2.7734582081639866e-05,
3978
+ "loss": 0.3109,
3979
+ "step": 28350
3980
+ },
3981
+ {
3982
+ "epoch": 0.5018465833789825,
3983
+ "grad_norm": 1.5170999765396118,
3984
+ "learning_rate": 2.768549606330133e-05,
3985
+ "loss": 0.3234,
3986
+ "step": 28400
3987
  }
3988
  ],
3989
  "logging_steps": 50,