guyhadad01 commited on
Commit
7d67d5a
·
verified ·
1 Parent(s): badfa1c

Training in progress, step 41000, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1335,6 +1335,10 @@ You can finetune this model on your own dataset.
1335
  | 0.7192 | 40700 | 0.2873 |
1336
  | 0.7201 | 40750 | 0.3705 |
1337
  | 0.7210 | 40800 | 0.2985 |
 
 
 
 
1338
 
1339
  </details>
1340
 
 
1335
  | 0.7192 | 40700 | 0.2873 |
1336
  | 0.7201 | 40750 | 0.3705 |
1337
  | 0.7210 | 40800 | 0.2985 |
1338
+ | 0.7218 | 40850 | 0.3355 |
1339
+ | 0.7227 | 40900 | 0.3322 |
1340
+ | 0.7236 | 40950 | 0.3424 |
1341
+ | 0.7245 | 41000 | 0.2834 |
1342
 
1343
  </details>
1344
 
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d78a54fb4d46ba6a28639611752cbd90c81e4f5c2899787ac51015d1444478c6
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1bad5fe2e60c5aa24260d1942f5fd36c57da4fa95b5377f04b02dcc5ceb9e653
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:18056243182ea1caa1b86090618604e7d1e429f23a12ff1faad08a57f30e9f02
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8fece1064662d61321c117cc1d24216b16971ad97b1195b94af13fb853181101
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d701f7ad37b76a01e770182d60edba5e764045eee0c4420747669dc57f30af68
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7d73c58855bdaef926976cbbf2d9665190e116bcc636d4b89a717f6e32bf6a98
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9fc39115c671fd04a36f4927fc18f9015d2dce27d719fc74d0c9d59b53289a70
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a4677c24f01289fca4e4e6cb6d863cf74dbec8f2665874e2aeb1133c6e53329
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cb354beb7a0d4ccd477dc950d57455f0fa927e9ecbdea63314e56687b97ea814
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d9861609e13b6dfba877602ae0e61dca8ad368849f8b20c6f7958302bb7e1b3b
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.7209626972486791,
6
  "eval_steps": 500,
7
- "global_step": 40800,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -5720,6 +5720,34 @@
5720
  "learning_rate": 1.5518053837544916e-05,
5721
  "loss": 0.2985,
5722
  "step": 40800
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5723
  }
5724
  ],
5725
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.7244968281175452,
6
  "eval_steps": 500,
7
+ "global_step": 41000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
5720
  "learning_rate": 1.5518053837544916e-05,
5721
  "loss": 0.2985,
5722
  "step": 40800
5723
+ },
5724
+ {
5725
+ "epoch": 0.7218462299658956,
5726
+ "grad_norm": 1.8306645154953003,
5727
+ "learning_rate": 1.546896781920638e-05,
5728
+ "loss": 0.3355,
5729
+ "step": 40850
5730
+ },
5731
+ {
5732
+ "epoch": 0.7227297626831122,
5733
+ "grad_norm": 1.4840078353881836,
5734
+ "learning_rate": 1.541988180086784e-05,
5735
+ "loss": 0.3322,
5736
+ "step": 40900
5737
+ },
5738
+ {
5739
+ "epoch": 0.7236132954003287,
5740
+ "grad_norm": 2.7773265838623047,
5741
+ "learning_rate": 1.5370795782529303e-05,
5742
+ "loss": 0.3424,
5743
+ "step": 40950
5744
+ },
5745
+ {
5746
+ "epoch": 0.7244968281175452,
5747
+ "grad_norm": 1.3592840433120728,
5748
+ "learning_rate": 1.532170976419077e-05,
5749
+ "loss": 0.2834,
5750
+ "step": 41000
5751
  }
5752
  ],
5753
  "logging_steps": 50,