guyhadad01 committed on
Commit
673ef3a
·
verified ·
1 Parent(s): 2d1b2da

Training in progress, step 43200, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1379,6 +1379,10 @@ You can finetune this model on your own dataset.
1379
  | 0.7581 | 42900 | 0.2956 |
1380
  | 0.7590 | 42950 | 0.3038 |
1381
  | 0.7598 | 43000 | 0.2195 |
 
 
 
 
1382
 
1383
  </details>
1384
 
 
1379
  | 0.7581 | 42900 | 0.2956 |
1380
  | 0.7590 | 42950 | 0.3038 |
1381
  | 0.7598 | 43000 | 0.2195 |
1382
+ | 0.7607 | 43050 | 0.2588 |
1383
+ | 0.7616 | 43100 | 0.3065 |
1384
+ | 0.7625 | 43150 | 0.3252 |
1385
+ | 0.7634 | 43200 | 0.2418 |
1386
 
1387
  </details>
1388
 
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:75caeec9f53b9b891200013c0a2fd18951ed97d80436096583e4cb1480de71e5
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c0c9a0b1262140e82733d51fe5efff8b0e4a0984fb8df6ff90e910c2afd4ab8
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b1f4e8d78cc6baa416d9c6a87aa0b3025829063989d02f0b2a8b88b559ded826
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b83e7c31a2c3e589b653cbf5d4ef5a6592e9733967f1d138904e5d044c5d5848
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4be9a690b209a02eb17ce8e3f85da6cd14d4dc8a1275cbf619841edc0fbfa444
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9579fa0231ee8c937aa4751dd1de3d5d49af35716658dc3ccf0f0e2d1f420d45
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6cac2489bb213d35fe01f779a670cf1cba6053f86765e6ddff3ab2ce908e2308
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e689eacce1d8ee34e87120437a30d68097f39c37749fc244a0885289f69d33c
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:beb8449b565ba883e76cbff731d0f062ded7c2721b6cab570d00dd75a772df6d
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b0456f284ad1b7efca7712b00a843898c6fb37f599b5c1b8ffce60a83dcfa662
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.7598381368062059,
6
  "eval_steps": 500,
7
- "global_step": 43000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -6028,6 +6028,34 @@
6028
  "learning_rate": 1.335925075101608e-05,
6029
  "loss": 0.2195,
6030
  "step": 43000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
6031
  }
6032
  ],
6033
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.763372267675072,
6
  "eval_steps": 500,
7
+ "global_step": 43200,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
6028
  "learning_rate": 1.335925075101608e-05,
6029
  "loss": 0.2195,
6030
  "step": 43000
6031
+ },
6032
+ {
6033
+ "epoch": 0.7607216695234225,
6034
+ "grad_norm": 1.4077396392822266,
6035
+ "learning_rate": 1.3310164732677543e-05,
6036
+ "loss": 0.2588,
6037
+ "step": 43050
6038
+ },
6039
+ {
6040
+ "epoch": 0.761605202240639,
6041
+ "grad_norm": 2.881322145462036,
6042
+ "learning_rate": 1.326107871433901e-05,
6043
+ "loss": 0.3065,
6044
+ "step": 43100
6045
+ },
6046
+ {
6047
+ "epoch": 0.7624887349578555,
6048
+ "grad_norm": 1.5936981439590454,
6049
+ "learning_rate": 1.3211992696000472e-05,
6050
+ "loss": 0.3252,
6051
+ "step": 43150
6052
+ },
6053
+ {
6054
+ "epoch": 0.763372267675072,
6055
+ "grad_norm": 1.4670791625976562,
6056
+ "learning_rate": 1.3162906677661935e-05,
6057
+ "loss": 0.2418,
6058
+ "step": 43200
6059
  }
6060
  ],
6061
  "logging_steps": 50,