guyhadad01 commited on
Commit
97a8990
·
verified ·
1 Parent(s): e8f9bd9

Training in progress, step 16000, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1343,6 +1343,10 @@ You can finetune this model on your own dataset.
1343
  | 0.2774 | 15700 | 0.4377 |
1344
  | 0.2783 | 15750 | 0.4041 |
1345
  | 0.2792 | 15800 | 0.375 |
 
 
 
 
1346
 
1347
  </details>
1348
 
 
1343
  | 0.2774 | 15700 | 0.4377 |
1344
  | 0.2783 | 15750 | 0.4041 |
1345
  | 0.2792 | 15800 | 0.375 |
1346
+ | 0.2801 | 15850 | 0.3339 |
1347
+ | 0.2810 | 15900 | 0.348 |
1348
+ | 0.2818 | 15950 | 0.367 |
1349
+ | 0.2827 | 16000 | 0.3427 |
1350
 
1351
  </details>
1352
 
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e3d55e45825a3c654f0b7eaf0ef140162fe612ee219ff9374e5295592d1444b9
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5fd95a7943e2d7fca893eb5bdbe9b3d01703e4d80ed047d04c1a67e2b9b33397
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b3a74062f2a6f56b8b0e799cc086809df8bd6dad796e1d4cdc42ce905c2701af
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:35f4813f7d86633bd1ed04417d2d1313c405edfb90b56a8c930cfc1d1cf2addb
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d06578a61ae44cb9a0de8333b92d3619c8147705d79a090a8054c07810546369
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9f746250cbdbcfc4b3753e05fc3f2d0b47904bb4b557a3820295b22d838b42f6
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9e95ff6f2b0a235804a0c3d7872a59d6fa2f6701ff13d24c3cdd11982303ea58
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:218ae04f7dbf6951d970ca21a27b311e58e61f1cd335681a08b187b9413a828c
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:adfca4433908d3fab5c9a1fa33bf6028dd834c726d10f65fd18b1dbca2367df8
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c56b223eeb93b57918d558b5af382f71a700beb8d1cf640c27db1796abbd5d2f
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.27919633864041987,
6
  "eval_steps": 500,
7
- "global_step": 15800,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -2220,6 +2220,34 @@
2220
  "learning_rate": 4.00492823624119e-05,
2221
  "loss": 0.375,
2222
  "step": 15800
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2223
  }
2224
  ],
2225
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.28273046950928593,
6
  "eval_steps": 500,
7
+ "global_step": 16000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
2220
  "learning_rate": 4.00492823624119e-05,
2221
  "loss": 0.375,
2222
  "step": 15800
2223
+ },
2224
+ {
2225
+ "epoch": 0.2800798713576364,
2226
+ "grad_norm": 1.9363830089569092,
2227
+ "learning_rate": 4.0000196344073355e-05,
2228
+ "loss": 0.3339,
2229
+ "step": 15850
2230
+ },
2231
+ {
2232
+ "epoch": 0.2809634040748529,
2233
+ "grad_norm": 2.208641767501831,
2234
+ "learning_rate": 3.995111032573482e-05,
2235
+ "loss": 0.348,
2236
+ "step": 15900
2237
+ },
2238
+ {
2239
+ "epoch": 0.2818469367920694,
2240
+ "grad_norm": 1.5789657831192017,
2241
+ "learning_rate": 3.9902024307396284e-05,
2242
+ "loss": 0.367,
2243
+ "step": 15950
2244
+ },
2245
+ {
2246
+ "epoch": 0.28273046950928593,
2247
+ "grad_norm": 1.6666336059570312,
2248
+ "learning_rate": 3.985293828905775e-05,
2249
+ "loss": 0.3427,
2250
+ "step": 16000
2251
  }
2252
  ],
2253
  "logging_steps": 50,