guyhadad01 commited on
Commit
14f3d6a
·
verified ·
1 Parent(s): c2191b5

Training in progress, step 37400, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1261,6 +1261,10 @@ You can finetune this model on your own dataset.
1261
  | 0.6556 | 37100 | 0.3814 |
1262
  | 0.6565 | 37150 | 0.4174 |
1263
  | 0.6573 | 37200 | 0.3473 |
 
 
 
 
1264
 
1265
 
1266
  ### Framework Versions
 
1261
  | 0.6556 | 37100 | 0.3814 |
1262
  | 0.6565 | 37150 | 0.4174 |
1263
  | 0.6573 | 37200 | 0.3473 |
1264
+ | 0.6582 | 37250 | 0.3598 |
1265
+ | 0.6591 | 37300 | 0.2822 |
1266
+ | 0.6600 | 37350 | 0.2538 |
1267
+ | 0.6609 | 37400 | 0.2212 |
1268
 
1269
 
1270
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:078012c454ea4b152c3db74341399805978d346a3159daf28a1763d42680059c
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:682fa9590e06a4b4fccae7f5f773e5cc53952c5e99d2335a76b83158b65098ed
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:06f250b4f70e94e35dd162d4656e5953ae96031e8d6e24791ea917a2422dac3a
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9245c8c24824eb122166f727d92f67c72576954b6b177342efb7c87cca99916e
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b2134ce16464c1d7c26a8d74b225ed50e24c2ef21aefdbfa44036477c7f93a57
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4055cc979b2b5391466d56f1b911260413ca5d1e7980d72b0ab4b419cbf9b1f2
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0af84d11cf9a350709c490c3f7b9bde1e09340d958fac411ecff8f1d22ce1e52
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:88bd0768fb513693c45a5dd657bdd8c5632ab92debcf304b18dc0e31cdbf92a9
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2ffdf18d69e9e8219490bafd2eb8c151c526102e648991721d9f0d64d7104e24
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e0f778ab4b27197de7dc711e3e33f3210ad38a94a9b2fa894dde1075de7a2d68
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.6573483416090898,
6
  "eval_steps": 500,
7
- "global_step": 37200,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -5216,6 +5216,34 @@
5216
  "learning_rate": 1.9050283717185998e-05,
5217
  "loss": 0.3473,
5218
  "step": 37200
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5219
  }
5220
  ],
5221
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.6608824724779558,
6
  "eval_steps": 500,
7
+ "global_step": 37400,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
5216
  "learning_rate": 1.9050283717185998e-05,
5217
  "loss": 0.3473,
5218
  "step": 37200
5219
+ },
5220
+ {
5221
+ "epoch": 0.6582318743263063,
5222
+ "grad_norm": 1.6960564851760864,
5223
+ "learning_rate": 1.9001197698847463e-05,
5224
+ "loss": 0.3598,
5225
+ "step": 37250
5226
+ },
5227
+ {
5228
+ "epoch": 0.6591154070435228,
5229
+ "grad_norm": 1.8127328157424927,
5230
+ "learning_rate": 1.8952111680508924e-05,
5231
+ "loss": 0.2822,
5232
+ "step": 37300
5233
+ },
5234
+ {
5235
+ "epoch": 0.6599989397607393,
5236
+ "grad_norm": 1.7553006410598755,
5237
+ "learning_rate": 1.890302566217039e-05,
5238
+ "loss": 0.2538,
5239
+ "step": 37350
5240
+ },
5241
+ {
5242
+ "epoch": 0.6608824724779558,
5243
+ "grad_norm": 1.111005187034607,
5244
+ "learning_rate": 1.8853939643831853e-05,
5245
+ "loss": 0.2212,
5246
+ "step": 37400
5247
  }
5248
  ],
5249
  "logging_steps": 50,