guyhadad01 commited on
Commit
dc3c2d8
·
verified ·
1 Parent(s): 3ffe500

Training in progress, step 41600, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1347,6 +1347,10 @@ You can finetune this model on your own dataset.
1347
  | 0.7298 | 41300 | 0.3289 |
1348
  | 0.7307 | 41350 | 0.3119 |
1349
  | 0.7316 | 41400 | 0.3007 |
 
 
 
 
1350
 
1351
  </details>
1352
 
 
1347
  | 0.7298 | 41300 | 0.3289 |
1348
  | 0.7307 | 41350 | 0.3119 |
1349
  | 0.7316 | 41400 | 0.3007 |
1350
+ | 0.7324 | 41450 | 0.3499 |
1351
+ | 0.7333 | 41500 | 0.3016 |
1352
+ | 0.7342 | 41550 | 0.3232 |
1353
+ | 0.7351 | 41600 | 0.2577 |
1354
 
1355
  </details>
1356
 
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f43c6066a3ed8a797462ed1304e6dd3a538745bae56d08936296e98af5636e68
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5968fa9233e27ceab0b50d025526b14878df9c3a5cc0dd8ab8e3bfb4e8731159
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a1672d02aa4d93aaa27f89d6d65e2a20859a6cb3dd9c4432eeb82f6752f1dfc2
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9f9b287a89c14a672aa169e1144107274fac0f234f450dc15728e411970cfec4
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7960809e3d7046461ba4b9405b6f71ec0619b99775d0184c422fcc4823ed73f8
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:29c7015785925a4c92109508d00189934d2658c038f9a9b3126f34a88d70d109
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:590d2263ee28ffeb3fc18603d4b5a73198cf1c208cbf77110c99f455e29bc8ec
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd530e72b22c1ce77a70b73b0e2553d90cdc69cb660d5df5b7ea28fe660cd767
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1b3482c7848cfcb119d950c3c5d13bc2dc1e7095a6ad4e7fc2a9ca4e5c264983
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:36751f2c6aca47874fa4d1553b1d00dffae813bb24cca7967068d98d45a147e3
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.7315650898552774,
6
  "eval_steps": 500,
7
- "global_step": 41400,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -5804,6 +5804,34 @@
5804
  "learning_rate": 1.4929021617482478e-05,
5805
  "loss": 0.3007,
5806
  "step": 41400
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5807
  }
5808
  ],
5809
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.7350992207241435,
6
  "eval_steps": 500,
7
+ "global_step": 41600,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
5804
  "learning_rate": 1.4929021617482478e-05,
5805
  "loss": 0.3007,
5806
  "step": 41400
5807
+ },
5808
+ {
5809
+ "epoch": 0.7324486225724939,
5810
+ "grad_norm": 2.910383939743042,
5811
+ "learning_rate": 1.4879935599143941e-05,
5812
+ "loss": 0.3499,
5813
+ "step": 41450
5814
+ },
5815
+ {
5816
+ "epoch": 0.7333321552897104,
5817
+ "grad_norm": 1.0191997289657593,
5818
+ "learning_rate": 1.4830849580805404e-05,
5819
+ "loss": 0.3016,
5820
+ "step": 41500
5821
+ },
5822
+ {
5823
+ "epoch": 0.7342156880069269,
5824
+ "grad_norm": 0.9859305620193481,
5825
+ "learning_rate": 1.4781763562466869e-05,
5826
+ "loss": 0.3232,
5827
+ "step": 41550
5828
+ },
5829
+ {
5830
+ "epoch": 0.7350992207241435,
5831
+ "grad_norm": 1.4275975227355957,
5832
+ "learning_rate": 1.4732677544128332e-05,
5833
+ "loss": 0.2577,
5834
+ "step": 41600
5835
  }
5836
  ],
5837
  "logging_steps": 50,