guyhadad01 commited on
Commit
198e809
·
verified ·
1 Parent(s): 7679b8a

Training in progress, step 40400, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1323,6 +1323,10 @@ You can finetune this model on your own dataset.
1323
  | 0.7086 | 40100 | 0.2649 |
1324
  | 0.7095 | 40150 | 0.3184 |
1325
  | 0.7104 | 40200 | 0.334 |
 
 
 
 
1326
 
1327
  </details>
1328
 
 
1323
  | 0.7086 | 40100 | 0.2649 |
1324
  | 0.7095 | 40150 | 0.3184 |
1325
  | 0.7104 | 40200 | 0.334 |
1326
+ | 0.7112 | 40250 | 0.3609 |
1327
+ | 0.7121 | 40300 | 0.306 |
1328
+ | 0.7130 | 40350 | 0.2629 |
1329
+ | 0.7139 | 40400 | 0.2311 |
1330
 
1331
  </details>
1332
 
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2c11448eab5085dafbe70840b347e552395741208f4c056feba7bdf25c3684b4
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a50f06d6c0fd8326af39a398662f171a8273231c42342726a949dca804e1fec3
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:176196a55e3283e4494c033b91ec493e6e73b898ba15899622781e50e5276a9c
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a31f8e8daa44a5969c8468131e422d3890bd1b3dfc09e140da75d5ff08dd8929
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:45c20f027761b73065674875134aab16adfe944ddeaaac5054a42d467120ac3f
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d8789e63d322628b9bf8ef047af43291db3bd5935067320bb834f1fe83567f97
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:024951ca35599ed7cd93018ece748744d262ffe3e8da72f14612df6525b8ad2b
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f096ecf59986ddd611fd8ea1bd90586f9039a1554c47a1316352f4e9e8082419
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:91554dd52659f1199ca0e07de2f95f60454723c4c5c500a75b5d255aeb95a210
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8fca1118641eb340cc4f5e2369cd22f797bffa655fc6d743b877326b0bf15332
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.7103603046420809,
6
  "eval_steps": 500,
7
- "global_step": 40200,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -5636,6 +5636,34 @@
5636
  "learning_rate": 1.6106104337240583e-05,
5637
  "loss": 0.334,
5638
  "step": 40200
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5639
  }
5640
  ],
5641
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.713894435510947,
6
  "eval_steps": 500,
7
+ "global_step": 40400,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
5636
  "learning_rate": 1.6106104337240583e-05,
5637
  "loss": 0.334,
5638
  "step": 40200
5639
+ },
5640
+ {
5641
+ "epoch": 0.7112438373592974,
5642
+ "grad_norm": 1.348560094833374,
5643
+ "learning_rate": 1.6057018318902045e-05,
5644
+ "loss": 0.3609,
5645
+ "step": 40250
5646
+ },
5647
+ {
5648
+ "epoch": 0.7121273700765139,
5649
+ "grad_norm": 0.9920164942741394,
5650
+ "learning_rate": 1.600793230056351e-05,
5651
+ "loss": 0.306,
5652
+ "step": 40300
5653
+ },
5654
+ {
5655
+ "epoch": 0.7130109027937305,
5656
+ "grad_norm": 1.3321669101715088,
5657
+ "learning_rate": 1.595884628222497e-05,
5658
+ "loss": 0.2629,
5659
+ "step": 40350
5660
+ },
5661
+ {
5662
+ "epoch": 0.713894435510947,
5663
+ "grad_norm": 1.257283329963684,
5664
+ "learning_rate": 1.5909760263886435e-05,
5665
+ "loss": 0.2311,
5666
+ "step": 40400
5667
  }
5668
  ],
5669
  "logging_steps": 50,