guyhadad01 committed on
Commit
b3f9aee
·
verified ·
1 Parent(s): 1cdb5b2

Training in progress, step 17400, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1371,6 +1371,10 @@ You can finetune this model on your own dataset.
1371
  | 0.3022 | 17100 | 0.4207 |
1372
  | 0.3031 | 17150 | 0.3849 |
1373
  | 0.3039 | 17200 | 0.3272 |
 
 
 
 
1374
 
1375
  </details>
1376
 
 
1371
  | 0.3022 | 17100 | 0.4207 |
1372
  | 0.3031 | 17150 | 0.3849 |
1373
  | 0.3039 | 17200 | 0.3272 |
1374
+ | 0.3048 | 17250 | 0.3037 |
1375
+ | 0.3057 | 17300 | 0.2924 |
1376
+ | 0.3066 | 17350 | 0.4029 |
1377
+ | 0.3075 | 17400 | 0.5016 |
1378
 
1379
  </details>
1380
 
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c8aa8eabf0bd95daa104946b416f3292c9a92c6053a47e54e8098083f61f3874
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:45090e53ca13162f5dfed87da6ebea51548a6f3908cbbefc66a73c68e67f368f
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:550870691770e56b635695a47badd3d85105a2abddd01d2f68ac682eb4779cfb
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5ca6aad37af14fa05240de5a73f6854c9f991ab7d94bccdddb3bd4a0e3ff149d
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9642b48564b74a9ef3023b3677305007ed89dfb95240067ad9d1be72f7d2692a
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:23fe6d223e7616989ffc698a28faceb780fedfcab150f455b3003f3664a9d548
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4c157b3717ebad1d1c4deed2f4a1e630570eeaf89e281bb553ac41881d02a28e
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c2780f904a141afb4c77d183d8b90351cd99dc707535728f23c895b86a7cd2bb
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fcdcffdcd8983b3d6481c27ecbd4b8783b8846e8b39268fee55aae8ba8b88e41
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9d388bf9897e62191d89d430ec5647330caf741ec214058515a40e21a614b139
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.3039352547224824,
6
  "eval_steps": 500,
7
- "global_step": 17200,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -2416,6 +2416,34 @@
2416
  "learning_rate": 3.867585556929964e-05,
2417
  "loss": 0.3272,
2418
  "step": 17200
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2419
  }
2420
  ],
2421
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.30746938559134845,
6
  "eval_steps": 500,
7
+ "global_step": 17400,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
2416
  "learning_rate": 3.867585556929964e-05,
2417
  "loss": 0.3272,
2418
  "step": 17200
2419
+ },
2420
+ {
2421
+ "epoch": 0.30481878743969887,
2422
+ "grad_norm": 1.5218919515609741,
2423
+ "learning_rate": 3.862676955096111e-05,
2424
+ "loss": 0.3037,
2425
+ "step": 17250
2426
+ },
2427
+ {
2428
+ "epoch": 0.3057023201569154,
2429
+ "grad_norm": 1.5864076614379883,
2430
+ "learning_rate": 3.857768353262257e-05,
2431
+ "loss": 0.2924,
2432
+ "step": 17300
2433
+ },
2434
+ {
2435
+ "epoch": 0.3065858528741319,
2436
+ "grad_norm": 1.8895894289016724,
2437
+ "learning_rate": 3.852859751428403e-05,
2438
+ "loss": 0.4029,
2439
+ "step": 17350
2440
+ },
2441
+ {
2442
+ "epoch": 0.30746938559134845,
2443
+ "grad_norm": 1.4156498908996582,
2444
+ "learning_rate": 3.8479511495945495e-05,
2445
+ "loss": 0.5016,
2446
+ "step": 17400
2447
  }
2448
  ],
2449
  "logging_steps": 50,