guyhadad01 committed on
Commit
3efaf4d
·
verified ·
1 Parent(s): 87a45db

Training in progress, step 43800, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1391,6 +1391,10 @@ You can finetune this model on your own dataset.
1391
  | 0.7687 | 43500 | 0.2443 |
1392
  | 0.7696 | 43550 | 0.2998 |
1393
  | 0.7704 | 43600 | 0.3619 |
 
 
 
 
1394
 
1395
  </details>
1396
 
 
1391
  | 0.7687 | 43500 | 0.2443 |
1392
  | 0.7696 | 43550 | 0.2998 |
1393
  | 0.7704 | 43600 | 0.3619 |
1394
+ | 0.7713 | 43650 | 0.2586 |
1395
+ | 0.7722 | 43700 | 0.251 |
1396
+ | 0.7731 | 43750 | 0.3154 |
1397
+ | 0.7740 | 43800 | 0.3309 |
1398
 
1399
  </details>
1400
 
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:582d7207fbae78615ca0e36023c8110cb512dfcbe185f219cdbef0f8c88f6707
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:87245a00c511204e0c66583191ab9429ad97c78538541227c616f90b8381119e
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:38bd1bddb06afe7bdefce01320f5544bdf1fc670f6d4527df71f8729233aad04
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8b6c1541af87dcd1797f9d736a3cac898e50e3ecafd501e98798ccab543ede07
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5ec0767005b2ab07f761617d9b9ec8dd40511cb9cacfed18b38312ca707add4f
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:69c36e80b730b2d3f19367fe96dc275025a093a975c30683cdcf06771c2e520f
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f1a993fdfb900c15fe63d9947d4534a020649b78ba75ceb8b6036bf3ab2fc94f
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0c2a170b686e6b3841063ec2a8f0cf18b4985f4986723acd35709abf15d5c19e
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c6d4bed09415fa87d626fafe2a8875f4460b02e4d1ca2a4d5c36913f61694143
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a1960f4f5d6f42011bfc954842f6c57ccfbbc8ac7380b9fbe5cdcbb8bd1b0029
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.7704405294128042,
6
  "eval_steps": 500,
7
- "global_step": 43600,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -6112,6 +6112,34 @@
6112
  "learning_rate": 1.2770218530953642e-05,
6113
  "loss": 0.3619,
6114
  "step": 43600
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
6115
  }
6116
  ],
6117
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.7739746602816703,
6
  "eval_steps": 500,
7
+ "global_step": 43800,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
6112
  "learning_rate": 1.2770218530953642e-05,
6113
  "loss": 0.3619,
6114
  "step": 43600
6115
+ },
6116
+ {
6117
+ "epoch": 0.7713240621300207,
6118
+ "grad_norm": 2.726393461227417,
6119
+ "learning_rate": 1.2721132512615109e-05,
6120
+ "loss": 0.2586,
6121
+ "step": 43650
6122
+ },
6123
+ {
6124
+ "epoch": 0.7722075948472372,
6125
+ "grad_norm": 1.146583080291748,
6126
+ "learning_rate": 1.2672046494276572e-05,
6127
+ "loss": 0.251,
6128
+ "step": 43700
6129
+ },
6130
+ {
6131
+ "epoch": 0.7730911275644538,
6132
+ "grad_norm": 1.2839117050170898,
6133
+ "learning_rate": 1.2622960475938033e-05,
6134
+ "loss": 0.3154,
6135
+ "step": 43750
6136
+ },
6137
+ {
6138
+ "epoch": 0.7739746602816703,
6139
+ "grad_norm": 1.3681036233901978,
6140
+ "learning_rate": 1.25738744575995e-05,
6141
+ "loss": 0.3309,
6142
+ "step": 43800
6143
  }
6144
  ],
6145
  "logging_steps": 50,