guyhadad01 commited on
Commit
661710b
·
verified ·
1 Parent(s): 3f12124

Training in progress, step 34600, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1205,6 +1205,10 @@ You can finetune this model on your own dataset.
1205
  | 0.6061 | 34300 | 0.3466 |
1206
  | 0.6070 | 34350 | 0.2608 |
1207
  | 0.6079 | 34400 | 0.3239 |
 
 
 
 
1208
 
1209
 
1210
  ### Framework Versions
 
1205
  | 0.6061 | 34300 | 0.3466 |
1206
  | 0.6070 | 34350 | 0.2608 |
1207
  | 0.6079 | 34400 | 0.3239 |
1208
+ | 0.6088 | 34450 | 0.3557 |
1209
+ | 0.6096 | 34500 | 0.4175 |
1210
+ | 0.6105 | 34550 | 0.3104 |
1211
+ | 0.6114 | 34600 | 0.3305 |
1212
 
1213
 
1214
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7b5f4ea64897e90b4e4c7c1e0cb94dcb0f1492d916413cce2e66078ccfad6960
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba077d6325305d731409aa162830a3c5d5397210799b60591392b1d61570f746
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8cf44dfcc82793c060386978756eab303f1fb8ffef4fb86d6d8a80ed57d60773
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:726943ff9dec97794faedec459447bcaa417b775d59a98d695e669bfe25957b1
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:13dc13fdf2d85fe768a37e80558a7b03bdcb432f2ca4a03fa86e5b8f2373ca60
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0770796c8b6d34fe12dcd97fff6f962f270b4c06153537e6c3ceff010a085b43
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b8efb8d95dab64304b8fe44c3687dc59b22acc22bfbc66f29596f118c5967e9a
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:548fc86584eafaf1a293dbece88e9fbb1e4a6c458e2f0be88ff6b690236f0848
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c62c2049abe02e0f34d9b4894dabef36b68579cab4efe24bc06e5d79c1d79bfd
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:381bbbc1437f4c979ed33526acec9652454aa2f2944f4ad7e6a6f3b151477146
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.6078705094449648,
6
  "eval_steps": 500,
7
- "global_step": 34400,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -4824,6 +4824,34 @@
4824
  "learning_rate": 2.1797137303410498e-05,
4825
  "loss": 0.3239,
4826
  "step": 34400
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
4827
  }
4828
  ],
4829
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.6114046403138308,
6
  "eval_steps": 500,
7
+ "global_step": 34600,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
4824
  "learning_rate": 2.1797137303410498e-05,
4825
  "loss": 0.3239,
4826
  "step": 34400
4827
+ },
4828
+ {
4829
+ "epoch": 0.6087540421621813,
4830
+ "grad_norm": 1.5316294431686401,
4831
+ "learning_rate": 2.174805128507196e-05,
4832
+ "loss": 0.3557,
4833
+ "step": 34450
4834
+ },
4835
+ {
4836
+ "epoch": 0.6096375748793977,
4837
+ "grad_norm": 1.539382815361023,
4838
+ "learning_rate": 2.1698965266733427e-05,
4839
+ "loss": 0.4175,
4840
+ "step": 34500
4841
+ },
4842
+ {
4843
+ "epoch": 0.6105211075966143,
4844
+ "grad_norm": 1.6773380041122437,
4845
+ "learning_rate": 2.164987924839489e-05,
4846
+ "loss": 0.3104,
4847
+ "step": 34550
4848
+ },
4849
+ {
4850
+ "epoch": 0.6114046403138308,
4851
+ "grad_norm": 1.3534982204437256,
4852
+ "learning_rate": 2.1601774950423123e-05,
4853
+ "loss": 0.3305,
4854
+ "step": 34600
4855
  }
4856
  ],
4857
  "logging_steps": 50,