guyhadad01 committed on
Commit
5bdad33
·
verified ·
1 Parent(s): 10068a7

Training in progress, step 45800, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1205,6 +1205,10 @@ You can finetune this model on your own dataset.
1205
  | 0.8040 | 45500 | 0.306 |
1206
  | 0.8049 | 45550 | 0.2888 |
1207
  | 0.8058 | 45600 | 0.3101 |
 
 
 
 
1208
 
1209
 
1210
  ### Framework Versions
 
1205
  | 0.8040 | 45500 | 0.306 |
1206
  | 0.8049 | 45550 | 0.2888 |
1207
  | 0.8058 | 45600 | 0.3101 |
1208
+ | 0.8067 | 45650 | 0.3148 |
1209
+ | 0.8075 | 45700 | 0.3975 |
1210
+ | 0.8084 | 45750 | 0.391 |
1211
+ | 0.8093 | 45800 | 0.3055 |
1212
 
1213
 
1214
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dafa20b9ee08adc30b1b45605dd3458876a74a9a04d0a242b2d07bff11ffcfd4
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8cd5b7a0c7bbd9cd3c1ef7b582da35f4528606a4ac86bb04de178a7045ffef85
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3e30656e2446cf01ec70d3edee1d105134bd862bca3236ab9a8c0b6f570bdcc1
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:229981f79739c953722cfecdcfd1ea3bc38fb99e716343cc7272446d9e5bd67a
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3642579a8c93faba29891bb437590b2fc3296379ded34bad3a25d71b44ae26dc
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0858441a43126cd8171b6b37146cb192258791649fae1dc1b48ff841ebace857
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:803966f189174fdab2c5da9165b86bf3a54e44aa7c1402617aaf37d70a2c35b6
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:791a23171b5f58ee5e75b5820d77158a2c7a8600431496a1df7bd6fb2c50e26f
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2db50723dd4d547a9dfd33b0f7da5dabf8169af1f05c3a349b52d1ff0ca949ad
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb572362d72f52e385494a9e0afaacf81d8323c35f20a7a978751625112b3a58
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.8057818381014649,
6
  "eval_steps": 500,
7
- "global_step": 45600,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -6392,6 +6392,34 @@
6392
  "learning_rate": 1.0807759517778957e-05,
6393
  "loss": 0.3101,
6394
  "step": 45600
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
6395
  }
6396
  ],
6397
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.809315968970331,
6
  "eval_steps": 500,
7
+ "global_step": 45800,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
6392
  "learning_rate": 1.0807759517778957e-05,
6393
  "loss": 0.3101,
6394
  "step": 45600
6395
+ },
6396
+ {
6397
+ "epoch": 0.8066653708186814,
6398
+ "grad_norm": 1.2750502824783325,
6399
+ "learning_rate": 1.075867349944042e-05,
6400
+ "loss": 0.3148,
6401
+ "step": 45650
6402
+ },
6403
+ {
6404
+ "epoch": 0.8075489035358979,
6405
+ "grad_norm": 2.6815085411071777,
6406
+ "learning_rate": 1.0709587481101884e-05,
6407
+ "loss": 0.3975,
6408
+ "step": 45700
6409
+ },
6410
+ {
6411
+ "epoch": 0.8084324362531145,
6412
+ "grad_norm": 1.3361300230026245,
6413
+ "learning_rate": 1.0660501462763347e-05,
6414
+ "loss": 0.391,
6415
+ "step": 45750
6416
+ },
6417
+ {
6418
+ "epoch": 0.809315968970331,
6419
+ "grad_norm": 1.438496470451355,
6420
+ "learning_rate": 1.061141544442481e-05,
6421
+ "loss": 0.3055,
6422
+ "step": 45800
6423
  }
6424
  ],
6425
  "logging_steps": 50,