guyhadad01 committed on
Commit
70aabbf
·
verified ·
1 Parent(s): 9e8ba20

Training in progress, step 41800, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1351,6 +1351,10 @@ You can finetune this model on your own dataset.
1351
  | 0.7333 | 41500 | 0.3016 |
1352
  | 0.7342 | 41550 | 0.3232 |
1353
  | 0.7351 | 41600 | 0.2577 |
 
 
 
 
1354
 
1355
  </details>
1356
 
 
1351
  | 0.7333 | 41500 | 0.3016 |
1352
  | 0.7342 | 41550 | 0.3232 |
1353
  | 0.7351 | 41600 | 0.2577 |
1354
+ | 0.7360 | 41650 | 0.2928 |
1355
+ | 0.7369 | 41700 | 0.2814 |
1356
+ | 0.7377 | 41750 | 0.2962 |
1357
+ | 0.7386 | 41800 | 0.2756 |
1358
 
1359
  </details>
1360
 
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5968fa9233e27ceab0b50d025526b14878df9c3a5cc0dd8ab8e3bfb4e8731159
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:abfcfd3f457cbe51abbd61ecc95245359c5208d8775c26e09de127916a470d92
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9f9b287a89c14a672aa169e1144107274fac0f234f450dc15728e411970cfec4
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb67670e66bb3f0f4adc4b392b33cd6c165031c08ca7ad68859e8241c86a12f3
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:29c7015785925a4c92109508d00189934d2658c038f9a9b3126f34a88d70d109
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3ac5b3de4f8e2849792c1b106634d8b16fc3919a657dbd8cbb3d224121e1301
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dd530e72b22c1ce77a70b73b0e2553d90cdc69cb660d5df5b7ea28fe660cd767
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8814987cfbe269e51b2a3098b07850feb46aab6ef117c55c4f2b6aaf9ac85aa0
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:36751f2c6aca47874fa4d1553b1d00dffae813bb24cca7967068d98d45a147e3
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bcfbb3dbbb2ba7d17dd131f713778ca8f3b0e144d05efa9885ea8327cd9b4a6f
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.7350992207241435,
6
  "eval_steps": 500,
7
- "global_step": 41600,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -5832,6 +5832,34 @@
5832
  "learning_rate": 1.4732677544128332e-05,
5833
  "loss": 0.2577,
5834
  "step": 41600
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5835
  }
5836
  ],
5837
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.7386333515930095,
6
  "eval_steps": 500,
7
+ "global_step": 41800,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
5832
  "learning_rate": 1.4732677544128332e-05,
5833
  "loss": 0.2577,
5834
  "step": 41600
5835
+ },
5836
+ {
5837
+ "epoch": 0.7359827534413599,
5838
+ "grad_norm": 1.0362133979797363,
5839
+ "learning_rate": 1.4683591525789795e-05,
5840
+ "loss": 0.2928,
5841
+ "step": 41650
5842
+ },
5843
+ {
5844
+ "epoch": 0.7368662861585764,
5845
+ "grad_norm": 2.07706618309021,
5846
+ "learning_rate": 1.4634505507451258e-05,
5847
+ "loss": 0.2814,
5848
+ "step": 41700
5849
+ },
5850
+ {
5851
+ "epoch": 0.7377498188757929,
5852
+ "grad_norm": 1.6817320585250854,
5853
+ "learning_rate": 1.4585419489112722e-05,
5854
+ "loss": 0.2962,
5855
+ "step": 41750
5856
+ },
5857
+ {
5858
+ "epoch": 0.7386333515930095,
5859
+ "grad_norm": 2.021404981613159,
5860
+ "learning_rate": 1.4536333470774185e-05,
5861
+ "loss": 0.2756,
5862
+ "step": 41800
5863
  }
5864
  ],
5865
  "logging_steps": 50,