guyhadad01 commited on
Commit
3ed04d1
·
verified ·
1 Parent(s): 544fa58

Training in progress, step 15000, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1323,6 +1323,10 @@ You can finetune this model on your own dataset.
1323
  | 0.2598 | 14700 | 0.3622 |
1324
  | 0.2606 | 14750 | 0.2782 |
1325
  | 0.2615 | 14800 | 0.36 |
 
 
 
 
1326
 
1327
  </details>
1328
 
 
1323
  | 0.2598 | 14700 | 0.3622 |
1324
  | 0.2606 | 14750 | 0.2782 |
1325
  | 0.2615 | 14800 | 0.36 |
1326
+ | 0.2624 | 14850 | 0.486 |
1327
+ | 0.2633 | 14900 | 0.406 |
1328
+ | 0.2642 | 14950 | 0.357 |
1329
+ | 0.2651 | 15000 | 0.2855 |
1330
 
1331
  </details>
1332
 
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f8e3fa7de06aa25ef9e92bb424c00fdc808b42dd23a9e9bb43d0a3c2c3136371
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:62a5255fda70735f530277b068143dfdac403e8121852574084f116cd8a54ad2
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:092bf8b9d76f58d80effc72b6148feaeea3102b809911377eb0d572cb5bf7575
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6061f93c451e2da3513d0e7ebb36b42a40ee13e63c2294272c5bca7237bb74f6
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:97edb58b8967751d3dda12e8eb802aa7613cd23fb975e45f9749685794078420
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:58d6a61e95480d63adba518dcc060210f3fb21899a87b9a86415b16500e0e3bf
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f13f9cc3a0ef2dfdf6369b4685eb176c05f57535fd4a80cceb72b81393a5eb1b
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b117d26681ce36f6295204f3c0c1542a5dbd8eba633804a8fd8e040b3e8c6050
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:29d3d14fe806d58e2a7b675de49d429f0f4e1b8b1cfd250c3c74b902fbff4430
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4647cbe535a4ae95aadfbebe85aa748dcd49df21d2f520f23e9e1a18d456097d
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.26152568429608947,
6
  "eval_steps": 500,
7
- "global_step": 14800,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -2080,6 +2080,34 @@
2080
  "learning_rate": 4.103002100881585e-05,
2081
  "loss": 0.36,
2082
  "step": 14800
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2083
  }
2084
  ],
2085
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.2650598151649556,
6
  "eval_steps": 500,
7
+ "global_step": 15000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
2080
  "learning_rate": 4.103002100881585e-05,
2081
  "loss": 0.36,
2082
  "step": 14800
2083
+ },
2084
+ {
2085
+ "epoch": 0.262409217013306,
2086
+ "grad_norm": 1.5133942365646362,
2087
+ "learning_rate": 4.098093499047732e-05,
2088
+ "loss": 0.486,
2089
+ "step": 14850
2090
+ },
2091
+ {
2092
+ "epoch": 0.2632927497305225,
2093
+ "grad_norm": 1.848177194595337,
2094
+ "learning_rate": 4.0932830692505546e-05,
2095
+ "loss": 0.406,
2096
+ "step": 14900
2097
+ },
2098
+ {
2099
+ "epoch": 0.26417628244773905,
2100
+ "grad_norm": 3.320469379425049,
2101
+ "learning_rate": 4.088374467416701e-05,
2102
+ "loss": 0.357,
2103
+ "step": 14950
2104
+ },
2105
+ {
2106
+ "epoch": 0.2650598151649556,
2107
+ "grad_norm": 1.417015790939331,
2108
+ "learning_rate": 4.0834658655828475e-05,
2109
+ "loss": 0.2855,
2110
+ "step": 15000
2111
  }
2112
  ],
2113
  "logging_steps": 50,