guyhadad01 commited on
Commit
b5d9218
·
verified ·
1 Parent(s): 2853dfc

Training in progress, step 16200, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1347,6 +1347,10 @@ You can finetune this model on your own dataset.
1347
  | 0.2810 | 15900 | 0.348 |
1348
  | 0.2818 | 15950 | 0.367 |
1349
  | 0.2827 | 16000 | 0.3427 |
 
 
 
 
1350
 
1351
  </details>
1352
 
 
1347
  | 0.2810 | 15900 | 0.348 |
1348
  | 0.2818 | 15950 | 0.367 |
1349
  | 0.2827 | 16000 | 0.3427 |
1350
+ | 0.2836 | 16050 | 0.3637 |
1351
+ | 0.2845 | 16100 | 0.3489 |
1352
+ | 0.2854 | 16150 | 0.4209 |
1353
+ | 0.2863 | 16200 | 0.2984 |
1354
 
1355
  </details>
1356
 
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5fd95a7943e2d7fca893eb5bdbe9b3d01703e4d80ed047d04c1a67e2b9b33397
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f4d75f43e43417714c9eb673b4140e3bc3180d809cd3703e268b196479d4e674
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:35f4813f7d86633bd1ed04417d2d1313c405edfb90b56a8c930cfc1d1cf2addb
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1f5b8a814f3aeefa5d532770d34674995a259b1d0de80bb9f90ec6188099e03c
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9f746250cbdbcfc4b3753e05fc3f2d0b47904bb4b557a3820295b22d838b42f6
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:47f7e685ed786d075ed1cbf16f75ee06ff18af8652d59bebd10628b722f2e5f2
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:218ae04f7dbf6951d970ca21a27b311e58e61f1cd335681a08b187b9413a828c
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c70ce39dc0484a07cf26175c01edd45d7187b33cf3b7426ec3e7187e560fe7f9
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c56b223eeb93b57918d558b5af382f71a700beb8d1cf640c27db1796abbd5d2f
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:198e9c5abe5151f1b8f98a22fd77ae2770a4aa017bd01877ffccc20b1cae28be
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.28273046950928593,
6
  "eval_steps": 500,
7
- "global_step": 16000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -2248,6 +2248,34 @@
2248
  "learning_rate": 3.985293828905775e-05,
2249
  "loss": 0.3427,
2250
  "step": 16000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2251
  }
2252
  ],
2253
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.286264600378152,
6
  "eval_steps": 500,
7
+ "global_step": 16200,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
2248
  "learning_rate": 3.985293828905775e-05,
2249
  "loss": 0.3427,
2250
  "step": 16000
2251
+ },
2252
+ {
2253
+ "epoch": 0.28361400222650246,
2254
+ "grad_norm": 3.725020170211792,
2255
+ "learning_rate": 3.980385227071921e-05,
2256
+ "loss": 0.3637,
2257
+ "step": 16050
2258
+ },
2259
+ {
2260
+ "epoch": 0.284497534943719,
2261
+ "grad_norm": 1.5958735942840576,
2262
+ "learning_rate": 3.975476625238068e-05,
2263
+ "loss": 0.3489,
2264
+ "step": 16100
2265
+ },
2266
+ {
2267
+ "epoch": 0.28538106766093546,
2268
+ "grad_norm": 1.3779951333999634,
2269
+ "learning_rate": 3.9705680234042136e-05,
2270
+ "loss": 0.4209,
2271
+ "step": 16150
2272
+ },
2273
+ {
2274
+ "epoch": 0.286264600378152,
2275
+ "grad_norm": 1.6636724472045898,
2276
+ "learning_rate": 3.96565942157036e-05,
2277
+ "loss": 0.2984,
2278
+ "step": 16200
2279
  }
2280
  ],
2281
  "logging_steps": 50,