guyhadad01 commited on
Commit
93bdb5a
·
verified ·
1 Parent(s): f64ee03

Training in progress, step 22600, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1475,6 +1475,10 @@ You can finetune this model on your own dataset.
1475
  | 0.3941 | 22300 | 0.3211 |
1476
  | 0.3949 | 22350 | 0.2505 |
1477
  | 0.3958 | 22400 | 0.3824 |
 
 
 
 
1478
 
1479
  </details>
1480
 
 
1475
  | 0.3941 | 22300 | 0.3211 |
1476
  | 0.3949 | 22350 | 0.2505 |
1477
  | 0.3958 | 22400 | 0.3824 |
1478
+ | 0.3967 | 22450 | 0.331 |
1479
+ | 0.3976 | 22500 | 0.3136 |
1480
+ | 0.3985 | 22550 | 0.297 |
1481
+ | 0.3994 | 22600 | 0.2933 |
1482
 
1483
  </details>
1484
 
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4f1b271b327c67d5e5cbcfe8f4ced2720b67a2ad4b86d7e49064afada335f989
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:497b7a6acdb3a5a1604b3f8ab3267058baa92f80bee7efa6e237ea075655a4d8
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:26d8d52c8f794240dfe200811cae13f3270be5d7cc20f4372d66fcdeb02f2c84
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e163c7782d125cbae55d87a883f0afe29090c268911a4edc6e746df10bc1f663
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d33d0eca02823fd38f9f6cbfa8199ab5481b75e21905025d31754984da79697e
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6edf8471c36d7596b23118388dc68d9d67f46cc4a6b1356e1a12264545ade3b8
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9af5256c96c40ab41bd91dd8bfffa192e31a7c4ee253a2eb604282e3fbc22ea6
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d9f128257bebc4cb3f00ccba35e93cf76368736113fc2faf057244a587c9ee62
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b1c0f9c08fc5a654c07e97009bca360a3a7487ba6dd7aed26e14bcde767a3c57
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f8b0e2d20704f293e6229a166caadb9f1aabe09be5b221f331974406b383c826
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.3958226573130003,
6
  "eval_steps": 500,
7
- "global_step": 22400,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -3144,6 +3144,34 @@
3144
  "learning_rate": 3.357287310282539e-05,
3145
  "loss": 0.3824,
3146
  "step": 22400
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3147
  }
3148
  ],
3149
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.3993567881818664,
6
  "eval_steps": 500,
7
+ "global_step": 22600,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
3144
  "learning_rate": 3.357287310282539e-05,
3145
  "loss": 0.3824,
3146
  "step": 22400
3147
+ },
3148
+ {
3149
+ "epoch": 0.39670619003021684,
3150
+ "grad_norm": 2.3490004539489746,
3151
+ "learning_rate": 3.352378708448686e-05,
3152
+ "loss": 0.331,
3153
+ "step": 22450
3154
+ },
3155
+ {
3156
+ "epoch": 0.3975897227474333,
3157
+ "grad_norm": 1.5686146020889282,
3158
+ "learning_rate": 3.3474701066148316e-05,
3159
+ "loss": 0.3136,
3160
+ "step": 22500
3161
+ },
3162
+ {
3163
+ "epoch": 0.39847325546464984,
3164
+ "grad_norm": 1.5068285465240479,
3165
+ "learning_rate": 3.342561504780978e-05,
3166
+ "loss": 0.297,
3167
+ "step": 22550
3168
+ },
3169
+ {
3170
+ "epoch": 0.3993567881818664,
3171
+ "grad_norm": 1.81602942943573,
3172
+ "learning_rate": 3.337652902947125e-05,
3173
+ "loss": 0.2933,
3174
+ "step": 22600
3175
  }
3176
  ],
3177
  "logging_steps": 50,