guyhadad01 commited on
Commit
f6203ec
·
verified ·
1 Parent(s): 845db05

Training in progress, step 47000, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1229,6 +1229,10 @@ You can finetune this model on your own dataset.
1229
  | 0.8252 | 46700 | 0.2965 |
1230
  | 0.8261 | 46750 | 0.2506 |
1231
  | 0.8270 | 46800 | 0.2258 |
 
 
 
 
1232
 
1233
 
1234
  ### Framework Versions
 
1229
  | 0.8252 | 46700 | 0.2965 |
1230
  | 0.8261 | 46750 | 0.2506 |
1231
  | 0.8270 | 46800 | 0.2258 |
1232
+ | 0.8279 | 46850 | 0.2209 |
1233
+ | 0.8288 | 46900 | 0.2756 |
1234
+ | 0.8296 | 46950 | 0.3345 |
1235
+ | 0.8305 | 47000 | 0.3016 |
1236
 
1237
 
1238
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:06c3f18fa41ad103d30f8534ab7132db4ee0061b54edf40285b4af72b13eb56f
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d215026fb98a4e80219f1300f712038cf2fa723f5168816bc64b2547a49bce2f
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7fd6c1d98fe362a0c2eb43d38b5cdf5892278019bdee6a0ede5aba69437e6bc1
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:10ceee43905dfe8e32b48bcbafa4954b114ed3adec82f09a2cc6c7e47d869d1b
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bc474fa5fa7ccd3f751905ccba31cf8241a798bcffde04ca50c28aabfb2c8fc4
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:370edc95f3ec87693c2f5c1d97900af678cc360f41a849a73def6dbfd862bd18
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7f4d5223b0e67d5c0eb5511f7b2157df3119d42796d741c478e1b9dd9b2daa03
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5927361a532fb6c132d07b4ab7a520caf5f685a6698e2682d0ac3b35fea7ca5e
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:deb3a6b85091a07e122d9b08dbed39a677740be0c318acc9f799b2491273dc34
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4d9635610518cbf3041eab5001840676a9398dea515bdb1588a50299a67cadbe
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.8269866233146613,
6
  "eval_steps": 500,
7
- "global_step": 46800,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -6560,6 +6560,34 @@
6560
  "learning_rate": 9.629695077654082e-06,
6561
  "loss": 0.2258,
6562
  "step": 46800
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
6563
  }
6564
  ],
6565
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.8305207541835274,
6
  "eval_steps": 500,
7
+ "global_step": 47000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
6560
  "learning_rate": 9.629695077654082e-06,
6561
  "loss": 0.2258,
6562
  "step": 46800
6563
+ },
6564
+ {
6565
+ "epoch": 0.8278701560318779,
6566
+ "grad_norm": 1.71811842918396,
6567
+ "learning_rate": 9.580609059315546e-06,
6568
+ "loss": 0.2209,
6569
+ "step": 46850
6570
+ },
6571
+ {
6572
+ "epoch": 0.8287536887490944,
6573
+ "grad_norm": 3.2347002029418945,
6574
+ "learning_rate": 9.53152304097701e-06,
6575
+ "loss": 0.2756,
6576
+ "step": 46900
6577
+ },
6578
+ {
6579
+ "epoch": 0.8296372214663109,
6580
+ "grad_norm": 2.865858554840088,
6581
+ "learning_rate": 9.483418743005244e-06,
6582
+ "loss": 0.3345,
6583
+ "step": 46950
6584
+ },
6585
+ {
6586
+ "epoch": 0.8305207541835274,
6587
+ "grad_norm": 1.4720476865768433,
6588
+ "learning_rate": 9.434332724666705e-06,
6589
+ "loss": 0.3016,
6590
+ "step": 47000
6591
  }
6592
  ],
6593
  "logging_steps": 50,