guyhadad01 committed on
Commit
887da02
·
verified ·
1 Parent(s): 92946bf

Training in progress, step 29600, checkpoint

Browse files
last-checkpoint/README.md CHANGED
@@ -1249,6 +1249,10 @@ You can finetune this model on your own dataset.
1249
  | 0.5178 | 29300 | 0.3492 |
1250
  | 0.5186 | 29350 | 0.3304 |
1251
  | 0.5195 | 29400 | 0.3557 |
 
 
 
 
1252
 
1253
 
1254
  ### Framework Versions
 
1249
  | 0.5178 | 29300 | 0.3492 |
1250
  | 0.5186 | 29350 | 0.3304 |
1251
  | 0.5195 | 29400 | 0.3557 |
1252
+ | 0.5204 | 29450 | 0.3389 |
1253
+ | 0.5213 | 29500 | 0.3322 |
1254
+ | 0.5222 | 29550 | 0.3053 |
1255
+ | 0.5231 | 29600 | 0.2486 |
1256
 
1257
 
1258
  ### Framework Versions
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:52be879aebe70d6a3b2a056beedca08f2be73f61ebc46f06911a85e46d41c0c2
3
  size 90864192
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:144dc908d4b1ad90ee4a018b09fcaa7382467917152ff08210428196e07231f5
3
  size 90864192
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:06028c42fad3044c4b23353b232592f0571645864a036fae7f9a4aff967be12e
3
  size 180609210
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:61ca3e8ce7625e03c0718ab68f669eeba24f2a5b3e90913a5232a2578f9fb9e5
3
  size 180609210
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:83cd1380c57226aa3ea98011ce1f02c69976c7ca7a80455b341682a640b1d651
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:029654d250d0a06a53ab2b4254f6c488ff21281306f583e5ec84fbf77c6593a0
3
  size 14244
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c77541b39dbb71635c2f0939f339b7fa24c5c0af9ad45520c78a03f92ccdb59e
3
  size 988
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b527e96b4627964f9c26d5047552177b51a31ae414fb5194c8647b133292f2b4
3
  size 988
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5f226454d5f7fa5a1b29f0c7888dfe13f17698107b349cee7ac0fbf136bdbea6
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:786920dde07982614e5d3db4362f9f0f309e2cae4493573be6138429ecf70b07
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.5195172377233129,
6
  "eval_steps": 500,
7
- "global_step": 29400,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -4124,6 +4124,34 @@
4124
  "learning_rate": 2.6703775696530603e-05,
4125
  "loss": 0.3557,
4126
  "step": 29400
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
4127
  }
4128
  ],
4129
  "logging_steps": 50,
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.5230513685921789,
6
  "eval_steps": 500,
7
+ "global_step": 29600,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
4124
  "learning_rate": 2.6703775696530603e-05,
4125
  "loss": 0.3557,
4126
  "step": 29400
4127
+ },
4128
+ {
4129
+ "epoch": 0.5204007704405295,
4130
+ "grad_norm": 1.787463665008545,
4131
+ "learning_rate": 2.665468967819206e-05,
4132
+ "loss": 0.3389,
4133
+ "step": 29450
4134
+ },
4135
+ {
4136
+ "epoch": 0.5212843031577459,
4137
+ "grad_norm": 3.174107789993286,
4138
+ "learning_rate": 2.660560365985353e-05,
4139
+ "loss": 0.3322,
4140
+ "step": 29500
4141
+ },
4142
+ {
4143
+ "epoch": 0.5221678358749624,
4144
+ "grad_norm": 1.648913025856018,
4145
+ "learning_rate": 2.6556517641514994e-05,
4146
+ "loss": 0.3053,
4147
+ "step": 29550
4148
+ },
4149
+ {
4150
+ "epoch": 0.5230513685921789,
4151
+ "grad_norm": 1.648561954498291,
4152
+ "learning_rate": 2.6507431623176455e-05,
4153
+ "loss": 0.2486,
4154
+ "step": 29600
4155
  }
4156
  ],
4157
  "logging_steps": 50,