guyhadad01 committed on
Commit
b148562
·
verified ·
1 Parent(s): 1c152be

Training in progress, step 43400, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1383,6 +1383,10 @@ You can finetune this model on your own dataset.
1383
  | 0.7616 | 43100 | 0.3065 |
1384
  | 0.7625 | 43150 | 0.3252 |
1385
  | 0.7634 | 43200 | 0.2418 |
 
 
 
 
1386
 
1387
  </details>
1388
 
 
1383
  | 0.7616 | 43100 | 0.3065 |
1384
  | 0.7625 | 43150 | 0.3252 |
1385
  | 0.7634 | 43200 | 0.2418 |
1386
+ | 0.7643 | 43250 | 0.4002 |
1387
+ | 0.7651 | 43300 | 0.3379 |
1388
+ | 0.7660 | 43350 | 0.3574 |
1389
+ | 0.7669 | 43400 | 0.3664 |
1390
 
1391
  </details>
1392
 
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8c0c9a0b1262140e82733d51fe5efff8b0e4a0984fb8df6ff90e910c2afd4ab8
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a485f5135dbf7941d9dcd8b8fc45b11939ecd8d30155eb2ca9556cbce39f7319
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b83e7c31a2c3e589b653cbf5d4ef5a6592e9733967f1d138904e5d044c5d5848
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c10cdbf25dd441e6bb32bd4c10385f309c62ad905ef0798b745b11cff9a1720f
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9579fa0231ee8c937aa4751dd1de3d5d49af35716658dc3ccf0f0e2d1f420d45
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:83302e5118655d454ab8451ea7900b6308bc7d6e9ac3f9707bf02a76f063afd4
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7e689eacce1d8ee34e87120437a30d68097f39c37749fc244a0885289f69d33c
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0daa70100b5915dc065db5369cf2e73a99b71868d4f3cbde645519f2b7941b1f
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b0456f284ad1b7efca7712b00a843898c6fb37f599b5c1b8ffce60a83dcfa662
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:84574c094748f0062cf1157bf6aedafea7577270e5b0318bc110f644f7a5512b
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.763372267675072,
6
  "eval_steps": 500,
7
- "global_step": 43200,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -6056,6 +6056,34 @@
6056
  "learning_rate": 1.3162906677661935e-05,
6057
  "loss": 0.2418,
6058
  "step": 43200
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
6059
  }
6060
  ],
6061
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.766906398543938,
6
  "eval_steps": 500,
7
+ "global_step": 43400,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
6056
  "learning_rate": 1.3162906677661935e-05,
6057
  "loss": 0.2418,
6058
  "step": 43200
6059
+ },
6060
+ {
6061
+ "epoch": 0.7642558003922886,
6062
+ "grad_norm": 1.6417291164398193,
6063
+ "learning_rate": 1.31138206593234e-05,
6064
+ "loss": 0.4002,
6065
+ "step": 43250
6066
+ },
6067
+ {
6068
+ "epoch": 0.765139333109505,
6069
+ "grad_norm": 1.5653693675994873,
6070
+ "learning_rate": 1.3064734640984863e-05,
6071
+ "loss": 0.3379,
6072
+ "step": 43300
6073
+ },
6074
+ {
6075
+ "epoch": 0.7660228658267215,
6076
+ "grad_norm": 1.279615879058838,
6077
+ "learning_rate": 1.3015648622646326e-05,
6078
+ "loss": 0.3574,
6079
+ "step": 43350
6080
+ },
6081
+ {
6082
+ "epoch": 0.766906398543938,
6083
+ "grad_norm": 1.693057894706726,
6084
+ "learning_rate": 1.2966562604307789e-05,
6085
+ "loss": 0.3664,
6086
+ "step": 43400
6087
  }
6088
  ],
6089
  "logging_steps": 50,