baby-dev committed on
Commit
d78afd8
·
verified ·
1 Parent(s): 8829acc

Training in progress, step 700, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:daaff03669a032b7c022a482789b2f3c995b01f72ad79b3cc8068b8f1e434c60
3
  size 335604696
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:96e509696c55084c5f68db216b08c236034352729f9a35d54304177b2d7c5d59
3
  size 335604696
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3c0ce3f9ee64b0c869751a3b334d7eed8318d1c81a574dbeacadb98868be199f
3
  size 170920532
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c5c6ad648686c9545cc7cf5739ee01d7d5df372baebe9043894c7b1ad989beb9
3
  size 170920532
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8a5b7fc8ba333afed8a1a8bd04eb95e00d2bd168f67ada07b2962cd70cb734ce
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:16c92660cd9919724ef2fa3ec4b8340423c04523460cd45e086b483ace36dd17
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:02db3dbfb390a8f0700b2ea5550de43719bf1ee696229ad5e263b02923655626
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2b38320f40535085de37905499e1385aa34aad6a41a68078b15be5cc295f0a80
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 2.30838942527771,
3
  "best_model_checkpoint": "miner_id_24/checkpoint-500",
4
- "epoch": 0.08191685439279131,
5
  "eval_steps": 100,
6
- "global_step": 600,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -147,6 +147,28 @@
147
  "eval_samples_per_second": 35.138,
148
  "eval_steps_per_second": 8.784,
149
  "step": 600
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
150
  }
151
  ],
152
  "logging_steps": 50,
@@ -161,7 +183,7 @@
161
  "early_stopping_threshold": 0.0
162
  },
163
  "attributes": {
164
- "early_stopping_patience_counter": 1
165
  }
166
  },
167
  "TrainerControl": {
@@ -170,12 +192,12 @@
170
  "should_evaluate": false,
171
  "should_log": false,
172
  "should_save": true,
173
- "should_training_stop": false
174
  },
175
  "attributes": {}
176
  }
177
  },
178
- "total_flos": 2.121758001856512e+17,
179
  "train_batch_size": 4,
180
  "trial_name": null,
181
  "trial_params": null
 
1
  {
2
  "best_metric": 2.30838942527771,
3
  "best_model_checkpoint": "miner_id_24/checkpoint-500",
4
+ "epoch": 0.09556966345825654,
5
  "eval_steps": 100,
6
+ "global_step": 700,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
147
  "eval_samples_per_second": 35.138,
148
  "eval_steps_per_second": 8.784,
149
  "step": 600
150
+ },
151
+ {
152
+ "epoch": 0.08874325892552393,
153
+ "grad_norm": 78.84331512451172,
154
+ "learning_rate": 0.00025,
155
+ "loss": 9.1057,
156
+ "step": 650
157
+ },
158
+ {
159
+ "epoch": 0.09556966345825654,
160
+ "grad_norm": 82.10652923583984,
161
+ "learning_rate": 0.00025,
162
+ "loss": 9.2502,
163
+ "step": 700
164
+ },
165
+ {
166
+ "epoch": 0.09556966345825654,
167
+ "eval_loss": 2.4388105869293213,
168
+ "eval_runtime": 175.7023,
169
+ "eval_samples_per_second": 35.105,
170
+ "eval_steps_per_second": 8.776,
171
+ "step": 700
172
  }
173
  ],
174
  "logging_steps": 50,
 
183
  "early_stopping_threshold": 0.0
184
  },
185
  "attributes": {
186
+ "early_stopping_patience_counter": 2
187
  }
188
  },
189
  "TrainerControl": {
 
192
  "should_evaluate": false,
193
  "should_log": false,
194
  "should_save": true,
195
+ "should_training_stop": true
196
  },
197
  "attributes": {}
198
  }
199
  },
200
+ "total_flos": 2.475384335499264e+17,
201
  "train_batch_size": 4,
202
  "trial_name": null,
203
  "trial_params": null