guyhadad01 commited on
Commit
e2e1c74
·
verified ·
1 Parent(s): a2b7c25

Training in progress, step 42600, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1367,6 +1367,10 @@ You can finetune this model on your own dataset.
1367
  | 0.7475 | 42300 | 0.2374 |
1368
  | 0.7484 | 42350 | 0.3347 |
1369
  | 0.7492 | 42400 | 0.3031 |
 
 
 
 
1370
 
1371
  </details>
1372
 
 
1367
  | 0.7475 | 42300 | 0.2374 |
1368
  | 0.7484 | 42350 | 0.3347 |
1369
  | 0.7492 | 42400 | 0.3031 |
1370
+ | 0.7501 | 42450 | 0.2817 |
1371
+ | 0.7510 | 42500 | 0.3433 |
1372
+ | 0.7519 | 42550 | 0.3273 |
1373
+ | 0.7528 | 42600 | 0.3123 |
1374
 
1375
  </details>
1376
 
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6aa92be7deea9d9fa0443a8e7ac43099edac64700ac1948c996c7d56587f9eab
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8ff54d76c9ebf490f12ff8e20aef5fa2ede05719c3e5676b2c4b70743a6ddb70
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:87b7fd53fc83dc52997172f5fd46299f5a9cb53791e47663db9b33ca688d8e9d
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e1bcc3dd859b5b30a53288025a1e1562aaecb27ca1c5f50de5231f42624b5be4
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c78cdd0913fe6a8bd516be3fa927565353e6ccb7f2abf432b224a447c2067b40
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:283d0e72fe96a15f8f83fa6413bf75a47c1e9923215c4159761e62486061e4d6
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:36ad923444303f7830b2be707d7167336797f0569cde414d2b04df5898c738d4
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a6825a6ad95d754623a78051fc89a4d4e41f2bf2218e7b695b249c975dc4ba73
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0c406d8129b27e63cb0cbf299bbeba9e703c540df5033871f11031330a77f043
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:052884290aaf5bd113167914e5b98e8e8eb63821927d0e64cb92a12102bb9c25
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.7492357441996077,
6
  "eval_steps": 500,
7
- "global_step": 42400,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -5944,6 +5944,34 @@
5944
  "learning_rate": 1.3947301250711748e-05,
5945
  "loss": 0.3031,
5946
  "step": 42400
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5947
  }
5948
  ],
5949
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.7527698750684738,
6
  "eval_steps": 500,
7
+ "global_step": 42600,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
5944
  "learning_rate": 1.3947301250711748e-05,
5945
  "loss": 0.3031,
5946
  "step": 42400
5947
+ },
5948
+ {
5949
+ "epoch": 0.7501192769168242,
5950
+ "grad_norm": 2.6039016246795654,
5951
+ "learning_rate": 1.389821523237321e-05,
5952
+ "loss": 0.2817,
5953
+ "step": 42450
5954
+ },
5955
+ {
5956
+ "epoch": 0.7510028096340408,
5957
+ "grad_norm": 4.557380676269531,
5958
+ "learning_rate": 1.3849129214034675e-05,
5959
+ "loss": 0.3433,
5960
+ "step": 42500
5961
+ },
5962
+ {
5963
+ "epoch": 0.7518863423512573,
5964
+ "grad_norm": 2.938749074935913,
5965
+ "learning_rate": 1.3800043195696138e-05,
5966
+ "loss": 0.3273,
5967
+ "step": 42550
5968
+ },
5969
+ {
5970
+ "epoch": 0.7527698750684738,
5971
+ "grad_norm": 1.3836658000946045,
5972
+ "learning_rate": 1.3750957177357601e-05,
5973
+ "loss": 0.3123,
5974
+ "step": 42600
5975
  }
5976
  ],
5977
  "logging_steps": 50,