youssefedweqd commited on
Commit
abfb812
·
verified ·
1 Parent(s): e76b8b5

Training in progress, step 900, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5d5cc6bdc71dee79bf87e76cccd7c5f022d94f50f86f182ae3b19cd6f89d1a18
3
  size 161533160
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c29fe4a0133197cda139441a6bba43ba30a0a16566dcea0b7516ede214fd5573
3
  size 161533160
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1c3d111a59096d88a8938996f72eaa582bdc17c62954716fedb95eaeb752fe76
3
  size 323292202
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c5b38eb68908f60759797c8127974582cae417043d2969c2c60105311ef3ecf1
3
  size 323292202
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bb014c34717cc705cc26abab664b6e113f17c41373b9a6cee14bcf66f7b85a9e
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d3492512c1ba7e98d86dc7e3d6cf87a55ddfe936908da4ab0ab28461f25075b9
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.13245033112582782,
6
  "eval_steps": 100,
7
- "global_step": 800,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -136,6 +136,20 @@
136
  "learning_rate": 4.4094922737306846e-05,
137
  "loss": 0.7668,
138
  "step": 800
 
 
 
 
 
 
 
 
 
 
 
 
 
 
139
  }
140
  ],
141
  "logging_steps": 50,
@@ -155,7 +169,7 @@
155
  "attributes": {}
156
  }
157
  },
158
- "total_flos": 6269184126222336.0,
159
  "train_batch_size": 1,
160
  "trial_name": null,
161
  "trial_params": null
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.1490066225165563,
6
  "eval_steps": 100,
7
+ "global_step": 900,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
136
  "learning_rate": 4.4094922737306846e-05,
137
  "loss": 0.7668,
138
  "step": 800
139
+ },
140
+ {
141
+ "epoch": 0.14072847682119205,
142
+ "grad_norm": 1.9555529356002808,
143
+ "learning_rate": 4.685430463576159e-05,
144
+ "loss": 0.7684,
145
+ "step": 850
146
+ },
147
+ {
148
+ "epoch": 0.1490066225165563,
149
+ "grad_norm": 2.308894157409668,
150
+ "learning_rate": 4.961368653421634e-05,
151
+ "loss": 0.7661,
152
+ "step": 900
153
  }
154
  ],
155
  "logging_steps": 50,
 
169
  "attributes": {}
170
  }
171
  },
172
+ "total_flos": 7039716814749696.0,
173
  "train_batch_size": 1,
174
  "trial_name": null,
175
  "trial_params": null