Reggie committed on
Commit
99ce141
·
verified ·
1 Parent(s): 66d57c1

Training in progress, step 800, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8f12882e795e48b5e34ae38b2a3dc13d970ae8ed794446b433b285dcae5e4b45
3
  size 69782384
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aac60fa61b1371f0628e4cdce110bd39a12e57e9c460d701427e8c58e754e7e9
3
  size 69782384
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0f41bf5ac8dd82b27bccf99bb00806066e352c1bf853a1398026d130ed323742
3
  size 139790651
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a63b11235c95638e0ee559b2345b5d8f7a103f5995eca48cb715fe2ba2cac47e
3
  size 139790651
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1b5b7c38c3608ce56ea60cd8715a5aebe62a252c04517ce9587d7d3c27fbbbdf
3
  size 14645
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bb0516b0656c487c351bad1057295186b5e3e00c79529207cd235ce5be6a5d40
3
  size 14645
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b60382b672a7ee5b1056446dd64188b841f33ae83dfad90e6f0c3d3114911f38
3
  size 1465
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e4f1426694c38acbbdcb00f1a570a9712c4816b9dc6fb937a5303ba759aa3ab7
3
  size 1465
last-checkpoint/trainer_state.json CHANGED
@@ -1,10 +1,10 @@
1
  {
2
- "best_global_step": 600,
3
- "best_metric": 2.2626566886901855,
4
- "best_model_checkpoint": "./outputs/checkpoint-600",
5
- "epoch": 0.6514657980456026,
6
  "eval_steps": 200,
7
- "global_step": 600,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -116,6 +116,42 @@
116
  "eval_samples_per_second": 82.072,
117
  "eval_steps_per_second": 2.59,
118
  "step": 600
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
119
  }
120
  ],
121
  "logging_steps": 50,
@@ -144,7 +180,7 @@
144
  "attributes": {}
145
  }
146
  },
147
- "total_flos": 1.6793449133565542e+17,
148
  "train_batch_size": 32,
149
  "trial_name": null,
150
  "trial_params": null
 
1
  {
2
+ "best_global_step": 800,
3
+ "best_metric": 2.2396719455718994,
4
+ "best_model_checkpoint": "./outputs/checkpoint-800",
5
+ "epoch": 0.8686210640608035,
6
  "eval_steps": 200,
7
+ "global_step": 800,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
116
  "eval_samples_per_second": 82.072,
117
  "eval_steps_per_second": 2.59,
118
  "step": 600
119
+ },
120
+ {
121
+ "epoch": 0.7057546145494028,
122
+ "grad_norm": 0.6320544481277466,
123
+ "learning_rate": 0.00017689312963021044,
124
+ "loss": 2.2678,
125
+ "step": 650
126
+ },
127
+ {
128
+ "epoch": 0.760043431053203,
129
+ "grad_norm": 0.7033542990684509,
130
+ "learning_rate": 0.00017306469320835707,
131
+ "loss": 2.2667,
132
+ "step": 700
133
+ },
134
+ {
135
+ "epoch": 0.8143322475570033,
136
+ "grad_norm": 0.6568920612335205,
137
+ "learning_rate": 0.00016899139196021397,
138
+ "loss": 2.2727,
139
+ "step": 750
140
+ },
141
+ {
142
+ "epoch": 0.8686210640608035,
143
+ "grad_norm": 0.7634288668632507,
144
+ "learning_rate": 0.00016468687691418833,
145
+ "loss": 2.2482,
146
+ "step": 800
147
+ },
148
+ {
149
+ "epoch": 0.8686210640608035,
150
+ "eval_loss": 2.2396719455718994,
151
+ "eval_runtime": 7.3506,
152
+ "eval_samples_per_second": 81.898,
153
+ "eval_steps_per_second": 2.585,
154
+ "step": 800
155
  }
156
  ],
157
  "logging_steps": 50,
 
180
  "attributes": {}
181
  }
182
  },
183
+ "total_flos": 2.2399365411628646e+17,
184
  "train_batch_size": 32,
185
  "trial_name": null,
186
  "trial_params": null