yueqis committed on
Commit
55a0f2a
·
verified ·
1 Parent(s): 537a2c9

Upload trainer_state.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. trainer_state.json +38 -3
trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.7351252010107971,
6
  "eval_steps": 500,
7
- "global_step": 200,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -148,6 +148,41 @@
148
  "learning_rate": 4.504523224581762e-05,
149
  "loss": 0.864,
150
  "step": 200
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
151
  }
152
  ],
153
  "logging_steps": 10,
@@ -167,7 +202,7 @@
167
  "attributes": {}
168
  }
169
  },
170
- "total_flos": 6662970335559680.0,
171
  "train_batch_size": 1,
172
  "trial_name": null,
173
  "trial_params": null
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.9189065012634965,
6
  "eval_steps": 500,
7
+ "global_step": 250,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
148
  "learning_rate": 4.504523224581762e-05,
149
  "loss": 0.864,
150
  "step": 200
151
+ },
152
+ {
153
+ "epoch": 0.771881461061337,
154
+ "grad_norm": 0.38919857144355774,
155
+ "learning_rate": 4.442333322822028e-05,
156
+ "loss": 0.8375,
157
+ "step": 210
158
+ },
159
+ {
160
+ "epoch": 0.8086377211118768,
161
+ "grad_norm": 0.3908405303955078,
162
+ "learning_rate": 4.376952172513046e-05,
163
+ "loss": 0.8642,
164
+ "step": 220
165
+ },
166
+ {
167
+ "epoch": 0.8453939811624167,
168
+ "grad_norm": 0.37455061078071594,
169
+ "learning_rate": 4.308487194713097e-05,
170
+ "loss": 0.8775,
171
+ "step": 230
172
+ },
173
+ {
174
+ "epoch": 0.8821502412129566,
175
+ "grad_norm": 0.3894438147544861,
176
+ "learning_rate": 4.2370508772009334e-05,
177
+ "loss": 0.8454,
178
+ "step": 240
179
+ },
180
+ {
181
+ "epoch": 0.9189065012634965,
182
+ "grad_norm": 0.40810340642929077,
183
+ "learning_rate": 4.162760589658649e-05,
184
+ "loss": 0.8399,
185
+ "step": 250
186
  }
187
  ],
188
  "logging_steps": 10,
 
202
  "attributes": {}
203
  }
204
  },
205
+ "total_flos": 8336347341258752.0,
206
  "train_batch_size": 1,
207
  "trial_name": null,
208
  "trial_params": null