guyhadad01 committed on
Commit
00a697d
·
verified ·
1 Parent(s): 9cac277

Training in progress, step 22800, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1479,6 +1479,10 @@ You can finetune this model on your own dataset.
1479
  | 0.3976 | 22500 | 0.3136 |
1480
  | 0.3985 | 22550 | 0.297 |
1481
  | 0.3994 | 22600 | 0.2933 |
 
 
 
 
1482
 
1483
  </details>
1484
 
 
1479
  | 0.3976 | 22500 | 0.3136 |
1480
  | 0.3985 | 22550 | 0.297 |
1481
  | 0.3994 | 22600 | 0.2933 |
1482
+ | 0.4002 | 22650 | 0.4026 |
1483
+ | 0.4011 | 22700 | 0.3567 |
1484
+ | 0.4020 | 22750 | 0.3711 |
1485
+ | 0.4029 | 22800 | 0.378 |
1486
 
1487
  </details>
1488
 
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:497b7a6acdb3a5a1604b3f8ab3267058baa92f80bee7efa6e237ea075655a4d8
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c0d300e6229f3196e296d216f86e3dd9be751afa58c003b8627129e48bb13ede
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e163c7782d125cbae55d87a883f0afe29090c268911a4edc6e746df10bc1f663
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:12655e53ef206d715a3442591f73e41f1140d40b95f274af76ba0a35f493edb8
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6edf8471c36d7596b23118388dc68d9d67f46cc4a6b1356e1a12264545ade3b8
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d13ae5493c4db5b0f6cf3aad8b771f4e49fde2a92cb50952dbcb5b64ecf9ff46
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d9f128257bebc4cb3f00ccba35e93cf76368736113fc2faf057244a587c9ee62
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d1df82080c2918595026373e489d29f4cedf15be12e39f7a209676e04ceaf08e
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f8b0e2d20704f293e6229a166caadb9f1aabe09be5b221f331974406b383c826
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0e0f6905bb46dec1582dbcee904a68ad035cd8e9d18fe2b7fb6877bd69d63c7d
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.3993567881818664,
6
  "eval_steps": 500,
7
- "global_step": 22600,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -3172,6 +3172,34 @@
3172
  "learning_rate": 3.337652902947125e-05,
3173
  "loss": 0.2933,
3174
  "step": 22600
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3175
  }
3176
  ],
3177
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.40289091905073243,
6
  "eval_steps": 500,
7
+ "global_step": 22800,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
3172
  "learning_rate": 3.337652902947125e-05,
3173
  "loss": 0.2933,
3174
  "step": 22600
3175
+ },
3176
+ {
3177
+ "epoch": 0.4002403208990829,
3178
+ "grad_norm": 3.4516189098358154,
3179
+ "learning_rate": 3.332744301113271e-05,
3180
+ "loss": 0.4026,
3181
+ "step": 22650
3182
+ },
3183
+ {
3184
+ "epoch": 0.40112385361629943,
3185
+ "grad_norm": 1.5759230852127075,
3186
+ "learning_rate": 3.3278356992794174e-05,
3187
+ "loss": 0.3567,
3188
+ "step": 22700
3189
+ },
3190
+ {
3191
+ "epoch": 0.4020073863335159,
3192
+ "grad_norm": 1.9385254383087158,
3193
+ "learning_rate": 3.322927097445564e-05,
3194
+ "loss": 0.3711,
3195
+ "step": 22750
3196
+ },
3197
+ {
3198
+ "epoch": 0.40289091905073243,
3199
+ "grad_norm": 1.6334116458892822,
3200
+ "learning_rate": 3.31801849561171e-05,
3201
+ "loss": 0.378,
3202
+ "step": 22800
3203
  }
3204
  ],
3205
  "logging_steps": 50,