guyhadad01 commited on
Commit
df80535
·
verified ·
1 Parent(s): d680b24

Training in progress, step 42800, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1371,6 +1371,10 @@ You can finetune this model on your own dataset.
1371
  | 0.7510 | 42500 | 0.3433 |
1372
  | 0.7519 | 42550 | 0.3273 |
1373
  | 0.7528 | 42600 | 0.3123 |
 
 
 
 
1374
 
1375
  </details>
1376
 
 
1371
  | 0.7510 | 42500 | 0.3433 |
1372
  | 0.7519 | 42550 | 0.3273 |
1373
  | 0.7528 | 42600 | 0.3123 |
1374
+ | 0.7537 | 42650 | 0.29 |
1375
+ | 0.7545 | 42700 | 0.3352 |
1376
+ | 0.7554 | 42750 | 0.3143 |
1377
+ | 0.7563 | 42800 | 0.2833 |
1378
 
1379
  </details>
1380
 
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8ff54d76c9ebf490f12ff8e20aef5fa2ede05719c3e5676b2c4b70743a6ddb70
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:947ad26bf0a1ea98a40d7847b1d4081968d0ea03f777dd415d118a3341c7d595
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e1bcc3dd859b5b30a53288025a1e1562aaecb27ca1c5f50de5231f42624b5be4
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fbe6b037eef5d6174a1e64a06f40631b730395d9ff0774dfc1245b870b5a756f
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:283d0e72fe96a15f8f83fa6413bf75a47c1e9923215c4159761e62486061e4d6
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0a0a70fc822cbf0577f57f474f054d71e07e1660e7791d186284f5053153721d
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a6825a6ad95d754623a78051fc89a4d4e41f2bf2218e7b695b249c975dc4ba73
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:31395f18239b3bc788fb9174ae1acda597a1a3b63f5595848ade3391438691e5
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:052884290aaf5bd113167914e5b98e8e8eb63821927d0e64cb92a12102bb9c25
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff01474c5f0e5dbd5aec03f387f08f61e0a9ae8d77c69168920103f17f16f317
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.7527698750684738,
6
  "eval_steps": 500,
7
- "global_step": 42600,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -5972,6 +5972,34 @@
5972
  "learning_rate": 1.3750957177357601e-05,
5973
  "loss": 0.3123,
5974
  "step": 42600
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5975
  }
5976
  ],
5977
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.7563040059373398,
6
  "eval_steps": 500,
7
+ "global_step": 42800,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
5972
  "learning_rate": 1.3750957177357601e-05,
5973
  "loss": 0.3123,
5974
  "step": 42600
5975
+ },
5976
+ {
5977
+ "epoch": 0.7536534077856903,
5978
+ "grad_norm": 4.600383758544922,
5979
+ "learning_rate": 1.3701871159019066e-05,
5980
+ "loss": 0.29,
5981
+ "step": 42650
5982
+ },
5983
+ {
5984
+ "epoch": 0.7545369405029069,
5985
+ "grad_norm": 4.080932140350342,
5986
+ "learning_rate": 1.3652785140680529e-05,
5987
+ "loss": 0.3352,
5988
+ "step": 42700
5989
+ },
5990
+ {
5991
+ "epoch": 0.7554204732201233,
5992
+ "grad_norm": 1.4026703834533691,
5993
+ "learning_rate": 1.3603699122341992e-05,
5994
+ "loss": 0.3143,
5995
+ "step": 42750
5996
+ },
5997
+ {
5998
+ "epoch": 0.7563040059373398,
5999
+ "grad_norm": 1.4037362337112427,
6000
+ "learning_rate": 1.3555594824370226e-05,
6001
+ "loss": 0.2833,
6002
+ "step": 42800
6003
  }
6004
  ],
6005
  "logging_steps": 50,