guyhadad01 commited on
Commit
9b37318
·
verified ·
1 Parent(s): 62fb630

Training in progress, step 37200, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1257,6 +1257,10 @@ You can finetune this model on your own dataset.
1257
  | 0.6520 | 36900 | 0.3572 |
1258
  | 0.6529 | 36950 | 0.3085 |
1259
  | 0.6538 | 37000 | 0.2647 |
 
 
 
 
1260
 
1261
 
1262
  ### Framework Versions
 
1257
  | 0.6520 | 36900 | 0.3572 |
1258
  | 0.6529 | 36950 | 0.3085 |
1259
  | 0.6538 | 37000 | 0.2647 |
1260
+ | 0.6547 | 37050 | 0.2622 |
1261
+ | 0.6556 | 37100 | 0.3814 |
1262
+ | 0.6565 | 37150 | 0.4174 |
1263
+ | 0.6573 | 37200 | 0.3473 |
1264
 
1265
 
1266
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5aa3e074a25abb8c340316265b8419fb45e38d5ea71e4312b6d0194cb38cc86b
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:078012c454ea4b152c3db74341399805978d346a3159daf28a1763d42680059c
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a86c17b77d1cfac3584af9a6619882b78c1f9bc7dcb85e0259432165076b9f36
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:06f250b4f70e94e35dd162d4656e5953ae96031e8d6e24791ea917a2422dac3a
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3da82f98ab298f77c390cd353b9bced87815dd73e91293360907ff091eb61d4e
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b2134ce16464c1d7c26a8d74b225ed50e24c2ef21aefdbfa44036477c7f93a57
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:952a0b2337ddfcc5838b84a78a584c51460d6072b3d324731f0a62584e450719
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0af84d11cf9a350709c490c3f7b9bde1e09340d958fac411ecff8f1d22ce1e52
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a249cc3fbdfe88ea20fb6dbfcb1191ec424d82ef41e7dafc1d1c85f14b5994e9
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ffdf18d69e9e8219490bafd2eb8c151c526102e648991721d9f0d64d7104e24
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.6538142107402237,
6
  "eval_steps": 500,
7
- "global_step": 37000,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -5188,6 +5188,34 @@
5188
  "learning_rate": 1.9246627790540143e-05,
5189
  "loss": 0.2647,
5190
  "step": 37000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5191
  }
5192
  ],
5193
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.6573483416090898,
6
  "eval_steps": 500,
7
+ "global_step": 37200,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
5188
  "learning_rate": 1.9246627790540143e-05,
5189
  "loss": 0.2647,
5190
  "step": 37000
5191
+ },
5192
+ {
5193
+ "epoch": 0.6546977434574403,
5194
+ "grad_norm": 1.230721354484558,
5195
+ "learning_rate": 1.9197541772201607e-05,
5196
+ "loss": 0.2622,
5197
+ "step": 37050
5198
+ },
5199
+ {
5200
+ "epoch": 0.6555812761746568,
5201
+ "grad_norm": 1.6303822994232178,
5202
+ "learning_rate": 1.9148455753863072e-05,
5203
+ "loss": 0.3814,
5204
+ "step": 37100
5205
+ },
5206
+ {
5207
+ "epoch": 0.6564648088918733,
5208
+ "grad_norm": 1.2327115535736084,
5209
+ "learning_rate": 1.9099369735524533e-05,
5210
+ "loss": 0.4174,
5211
+ "step": 37150
5212
+ },
5213
+ {
5214
+ "epoch": 0.6573483416090898,
5215
+ "grad_norm": 1.4918360710144043,
5216
+ "learning_rate": 1.9050283717185998e-05,
5217
+ "loss": 0.3473,
5218
+ "step": 37200
5219
  }
5220
  ],
5221
  "logging_steps": 50,