guyhadad01 commited on
Commit
235349e
·
verified ·
1 Parent(s): 8803ac1

Training in progress, step 14800, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1319,6 +1319,10 @@ You can finetune this model on your own dataset.
1319
  | 0.2562 | 14500 | 0.3406 |
1320
  | 0.2571 | 14550 | 0.4397 |
1321
  | 0.2580 | 14600 | 0.411 |
 
 
 
 
1322
 
1323
  </details>
1324
 
 
1319
  | 0.2562 | 14500 | 0.3406 |
1320
  | 0.2571 | 14550 | 0.4397 |
1321
  | 0.2580 | 14600 | 0.411 |
1322
+ | 0.2589 | 14650 | 0.3742 |
1323
+ | 0.2598 | 14700 | 0.3622 |
1324
+ | 0.2606 | 14750 | 0.2782 |
1325
+ | 0.2615 | 14800 | 0.36 |
1326
 
1327
  </details>
1328
 
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:861228ee1e7303d55d206ed18a0e9a9f72cd4fceb74ae8597ddd8227ba4baaa6
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f8e3fa7de06aa25ef9e92bb424c00fdc808b42dd23a9e9bb43d0a3c2c3136371
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:01e800f5f76e35b4a2c15cb36bcf0bae4a36cc21e80874b3eade1a26b448ee14
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:092bf8b9d76f58d80effc72b6148feaeea3102b809911377eb0d572cb5bf7575
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4ffe6d2e694b6c2093052ae77ba6c6348d6c889151265b032757dc965de9eabd
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:97edb58b8967751d3dda12e8eb802aa7613cd23fb975e45f9749685794078420
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d2d1981a845c6e1942265cf518562623d63fa9e701ce29d4ce24d1e25e2691cb
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f13f9cc3a0ef2dfdf6369b4685eb176c05f57535fd4a80cceb72b81393a5eb1b
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:71ef9de9a97c35ae1f236f3cf953b678aeb5931825d667a15b405ae0448fa416
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:29d3d14fe806d58e2a7b675de49d429f0f4e1b8b1cfd250c3c74b902fbff4430
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.2579915534272234,
6
  "eval_steps": 500,
7
- "global_step": 14600,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -2052,6 +2052,34 @@
2052
  "learning_rate": 4.122636508217e-05,
2053
  "loss": 0.411,
2054
  "step": 14600
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2055
  }
2056
  ],
2057
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.26152568429608947,
6
  "eval_steps": 500,
7
+ "global_step": 14800,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
2052
  "learning_rate": 4.122636508217e-05,
2053
  "loss": 0.411,
2054
  "step": 14600
2055
+ },
2056
+ {
2057
+ "epoch": 0.25887508614443994,
2058
+ "grad_norm": 1.5897334814071655,
2059
+ "learning_rate": 4.117727906383146e-05,
2060
+ "loss": 0.3742,
2061
+ "step": 14650
2062
+ },
2063
+ {
2064
+ "epoch": 0.25975861886165647,
2065
+ "grad_norm": 3.667428970336914,
2066
+ "learning_rate": 4.1128193045492924e-05,
2067
+ "loss": 0.3622,
2068
+ "step": 14700
2069
+ },
2070
+ {
2071
+ "epoch": 0.26064215157887294,
2072
+ "grad_norm": 1.7393996715545654,
2073
+ "learning_rate": 4.107910702715439e-05,
2074
+ "loss": 0.2782,
2075
+ "step": 14750
2076
+ },
2077
+ {
2078
+ "epoch": 0.26152568429608947,
2079
+ "grad_norm": 1.6495802402496338,
2080
+ "learning_rate": 4.103002100881585e-05,
2081
+ "loss": 0.36,
2082
+ "step": 14800
2083
  }
2084
  ],
2085
  "logging_steps": 50,