guyhadad01 committed on
Commit
d3044f2
·
verified ·
1 Parent(s): 24d11d3

Training in progress, step 14600, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1315,6 +1315,10 @@ You can finetune this model on your own dataset.
1315
  | 0.2527 | 14300 | 0.4161 |
1316
  | 0.2536 | 14350 | 0.3431 |
1317
  | 0.2545 | 14400 | 0.3576 |
 
 
 
 
1318
 
1319
  </details>
1320
 
 
1315
  | 0.2527 | 14300 | 0.4161 |
1316
  | 0.2536 | 14350 | 0.3431 |
1317
  | 0.2545 | 14400 | 0.3576 |
1318
+ | 0.2553 | 14450 | 0.3563 |
1319
+ | 0.2562 | 14500 | 0.3406 |
1320
+ | 0.2571 | 14550 | 0.4397 |
1321
+ | 0.2580 | 14600 | 0.411 |
1322
 
1323
  </details>
1324
 
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c70d1baeacb306a6e3e4e7da1daf6668ef9a846b36b36844f97182da49b7189d
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:861228ee1e7303d55d206ed18a0e9a9f72cd4fceb74ae8597ddd8227ba4baaa6
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6c7cc231dc6a04e0cb1fde6371ac1117217c084c2ff5861f99992f6271b0b2ae
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:01e800f5f76e35b4a2c15cb36bcf0bae4a36cc21e80874b3eade1a26b448ee14
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1575cd53f4b8b110d92e8c23aa79a7bcf9dc9c336882843030d5971034763624
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ffe6d2e694b6c2093052ae77ba6c6348d6c889151265b032757dc965de9eabd
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:97511a6060aacb39a58a4067ef60a5d731c4117afaf40a314802e695ac048d50
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d2d1981a845c6e1942265cf518562623d63fa9e701ce29d4ce24d1e25e2691cb
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:696c7475f37eb1308f8246ec63f84866eb3d506203673b38e04a231cb4eacd6d
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:71ef9de9a97c35ae1f236f3cf953b678aeb5931825d667a15b405ae0448fa416
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.25445742255835735,
6
  "eval_steps": 500,
7
- "global_step": 14400,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -2024,6 +2024,34 @@
2024
  "learning_rate": 4.142270915552414e-05,
2025
  "loss": 0.3576,
2026
  "step": 14400
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2027
  }
2028
  ],
2029
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.2579915534272234,
6
  "eval_steps": 500,
7
+ "global_step": 14600,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
2024
  "learning_rate": 4.142270915552414e-05,
2025
  "loss": 0.3576,
2026
  "step": 14400
2027
+ },
2028
+ {
2029
+ "epoch": 0.2553409552755739,
2030
+ "grad_norm": 1.3540493249893188,
2031
+ "learning_rate": 4.137362313718561e-05,
2032
+ "loss": 0.3563,
2033
+ "step": 14450
2034
+ },
2035
+ {
2036
+ "epoch": 0.25622448799279035,
2037
+ "grad_norm": 1.7373064756393433,
2038
+ "learning_rate": 4.1324537118847066e-05,
2039
+ "loss": 0.3406,
2040
+ "step": 14500
2041
+ },
2042
+ {
2043
+ "epoch": 0.2571080207100069,
2044
+ "grad_norm": 2.6311392784118652,
2045
+ "learning_rate": 4.127545110050853e-05,
2046
+ "loss": 0.4397,
2047
+ "step": 14550
2048
+ },
2049
+ {
2050
+ "epoch": 0.2579915534272234,
2051
+ "grad_norm": 1.845186471939087,
2052
+ "learning_rate": 4.122636508217e-05,
2053
+ "loss": 0.411,
2054
+ "step": 14600
2055
  }
2056
  ],
2057
  "logging_steps": 50,