guyhadad01 commited on
Commit
bb46c9b
·
verified ·
1 Parent(s): bd8d8aa

Training in progress, step 34800, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1209,6 +1209,10 @@ You can finetune this model on your own dataset.
1209
  | 0.6096 | 34500 | 0.4175 |
1210
  | 0.6105 | 34550 | 0.3104 |
1211
  | 0.6114 | 34600 | 0.3305 |
 
 
 
 
1212
 
1213
 
1214
  ### Framework Versions
 
1209
  | 0.6096 | 34500 | 0.4175 |
1210
  | 0.6105 | 34550 | 0.3104 |
1211
  | 0.6114 | 34600 | 0.3305 |
1212
+ | 0.6123 | 34650 | 0.2832 |
1213
+ | 0.6132 | 34700 | 0.3007 |
1214
+ | 0.6141 | 34750 | 0.3932 |
1215
+ | 0.6149 | 34800 | 0.3 |
1216
 
1217
 
1218
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ba077d6325305d731409aa162830a3c5d5397210799b60591392b1d61570f746
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:78346a0c56430d22fa1490f284416b4aeee8fb9539989a398220c805d75e2e61
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:726943ff9dec97794faedec459447bcaa417b775d59a98d695e669bfe25957b1
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:332311a89c1a8130797191a2ad7878850bf8a5f8687fb07aa8ce26dd6bf3aca2
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0770796c8b6d34fe12dcd97fff6f962f270b4c06153537e6c3ceff010a085b43
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:663998c1aaed54adecb3878007dbade857c46ba6a1c5eaffb67717a822135458
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:548fc86584eafaf1a293dbece88e9fbb1e4a6c458e2f0be88ff6b690236f0848
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:480efcc1d108b2db853c5d91deb1ed2fd305f7b9cbbdf50854f3a85cc79a1117
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:381bbbc1437f4c979ed33526acec9652454aa2f2944f4ad7e6a6f3b151477146
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e917b101e0be67dbb3890bb4d8dceac22ecd3870c266a2b20cb6488727437a58
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.6114046403138308,
6
  "eval_steps": 500,
7
- "global_step": 34600,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -4852,6 +4852,34 @@
4852
  "learning_rate": 2.1601774950423123e-05,
4853
  "loss": 0.3305,
4854
  "step": 34600
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
4855
  }
4856
  ],
4857
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.6149387711826969,
6
  "eval_steps": 500,
7
+ "global_step": 34800,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
4852
  "learning_rate": 2.1601774950423123e-05,
4853
  "loss": 0.3305,
4854
  "step": 34600
4855
+ },
4856
+ {
4857
+ "epoch": 0.6122881730310473,
4858
+ "grad_norm": 1.416923999786377,
4859
+ "learning_rate": 2.1552688932084584e-05,
4860
+ "loss": 0.2832,
4861
+ "step": 34650
4862
+ },
4863
+ {
4864
+ "epoch": 0.6131717057482639,
4865
+ "grad_norm": 1.7992863655090332,
4866
+ "learning_rate": 2.150360291374605e-05,
4867
+ "loss": 0.3007,
4868
+ "step": 34700
4869
+ },
4870
+ {
4871
+ "epoch": 0.6140552384654804,
4872
+ "grad_norm": 1.3988946676254272,
4873
+ "learning_rate": 2.1454516895407514e-05,
4874
+ "loss": 0.3932,
4875
+ "step": 34750
4876
+ },
4877
+ {
4878
+ "epoch": 0.6149387711826969,
4879
+ "grad_norm": 1.7125048637390137,
4880
+ "learning_rate": 2.1405430877068978e-05,
4881
+ "loss": 0.3,
4882
+ "step": 34800
4883
  }
4884
  ],
4885
  "logging_steps": 50,