guyhadad01 committed on
Commit
a6a4a9e
·
verified ·
1 Parent(s): e58a791

Training in progress, step 9200, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1205,6 +1205,10 @@ You can finetune this model on your own dataset.
1205
  | 0.1573 | 8900 | 0.4081 |
1206
  | 0.1582 | 8950 | 0.4648 |
1207
  | 0.1590 | 9000 | 0.4321 |
 
 
 
 
1208
 
1209
 
1210
  ### Framework Versions
 
1205
  | 0.1573 | 8900 | 0.4081 |
1206
  | 0.1582 | 8950 | 0.4648 |
1207
  | 0.1590 | 9000 | 0.4321 |
1208
+ | 0.1599 | 9050 | 0.4226 |
1209
+ | 0.1608 | 9100 | 0.3634 |
1210
+ | 0.1617 | 9150 | 0.4252 |
1211
+ | 0.1626 | 9200 | 0.3899 |
1212
 
1213
 
1214
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6833db3941c48530d63f16a4641cb58d29681db52bfc4aaba9787486862f28a0
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:880e624eb7279ea2c15d3d6797440086ddb9b6116f0e9bd2fea229b00f3eafcc
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fc8f323339f8042019b8128089add42f66d2a56c4dfd5f02e68b4884b9f08cad
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b8dea7d6f8279c47cc3d797dc40c5bd4cbb324255364a56bfc64a2536ad6b318
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d8b31b0e1d81266033020b3fd3836c1b6a14642adb57f047a1bc520e453a6aba
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:beb5381b8cfab2c43d778d817204fe174c7b328e5f3861902f2432aa4cc89685
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c0a063eb0473b3b545a1a6d08a6917737011cdcb54e4175440233b96c566f83c
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:df2589efb63b68f20dc42380f13074262282edb3a23f326bcb9e05c733236848
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f78894f5196d0952d3fc803e041442456b12fd7839191717af3aecab8279af9f
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aeb87116cd3b0b49516d866a0e3b848d38858f80863640384bfc6aab2a1d3a1d
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.15903588909897334,
6
  "eval_steps": 500,
7
- "global_step": 9000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -1268,6 +1268,34 @@
1268
  "learning_rate": 4.672203569535254e-05,
1269
  "loss": 0.4321,
1270
  "step": 9000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1271
  }
1272
  ],
1273
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.1625700199678394,
6
  "eval_steps": 500,
7
+ "global_step": 9200,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
1268
  "learning_rate": 4.672203569535254e-05,
1269
  "loss": 0.4321,
1270
  "step": 9000
1271
+ },
1272
+ {
1273
+ "epoch": 0.15991942181618984,
1274
+ "grad_norm": 1.8130481243133545,
1275
+ "learning_rate": 4.6672949677014e-05,
1276
+ "loss": 0.4226,
1277
+ "step": 9050
1278
+ },
1279
+ {
1280
+ "epoch": 0.16080295453340637,
1281
+ "grad_norm": 2.4127371311187744,
1282
+ "learning_rate": 4.6623863658675464e-05,
1283
+ "loss": 0.3634,
1284
+ "step": 9100
1285
+ },
1286
+ {
1287
+ "epoch": 0.1616864872506229,
1288
+ "grad_norm": 2.362494707107544,
1289
+ "learning_rate": 4.657477764033693e-05,
1290
+ "loss": 0.4252,
1291
+ "step": 9150
1292
+ },
1293
+ {
1294
+ "epoch": 0.1625700199678394,
1295
+ "grad_norm": 1.855000615119934,
1296
+ "learning_rate": 4.6525691621998393e-05,
1297
+ "loss": 0.3899,
1298
+ "step": 9200
1299
  }
1300
  ],
1301
  "logging_steps": 50,