Reggie commited on
Commit
102d82e
·
verified ·
1 Parent(s): 7680c3a

Training in progress, step 600, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1f8dea4d325a4635d3c239e793bad657771e2130c83b3dfef9813d57f5058df9
3
  size 69782384
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f12882e795e48b5e34ae38b2a3dc13d970ae8ed794446b433b285dcae5e4b45
3
  size 69782384
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a691a2dd0083ffd45de8f8ba46f1319a1176b01199ed67ae21c5b8f4c7c5d65a
3
  size 139790651
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0f41bf5ac8dd82b27bccf99bb00806066e352c1bf853a1398026d130ed323742
3
  size 139790651
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:77af5db692d8169680b37a82ccaf2369394b341d2c152f145639fd25a259d63f
3
  size 14645
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1b5b7c38c3608ce56ea60cd8715a5aebe62a252c04517ce9587d7d3c27fbbbdf
3
  size 14645
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:14206d6f39047b8dbff5f90ecc0ad71bc03ad9f0a166b1d0248ef5714395ce2a
3
  size 1465
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b60382b672a7ee5b1056446dd64188b841f33ae83dfad90e6f0c3d3114911f38
3
  size 1465
last-checkpoint/trainer_state.json CHANGED
@@ -1,10 +1,10 @@
1
  {
2
- "best_global_step": 400,
3
- "best_metric": 2.2951860427856445,
4
- "best_model_checkpoint": "./outputs/checkpoint-400",
5
- "epoch": 0.43431053203040176,
6
  "eval_steps": 200,
7
- "global_step": 400,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -80,6 +80,42 @@
80
  "eval_samples_per_second": 81.949,
81
  "eval_steps_per_second": 2.586,
82
  "step": 400
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
83
  }
84
  ],
85
  "logging_steps": 50,
@@ -108,7 +144,7 @@
108
  "attributes": {}
109
  }
110
  },
111
- "total_flos": 1.1185423411367117e+17,
112
  "train_batch_size": 32,
113
  "trial_name": null,
114
  "trial_params": null
 
1
  {
2
+ "best_global_step": 600,
3
+ "best_metric": 2.2626566886901855,
4
+ "best_model_checkpoint": "./outputs/checkpoint-600",
5
+ "epoch": 0.6514657980456026,
6
  "eval_steps": 200,
7
+ "global_step": 600,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
80
  "eval_samples_per_second": 81.949,
81
  "eval_steps_per_second": 2.586,
82
  "step": 400
83
+ },
84
+ {
85
+ "epoch": 0.48859934853420195,
86
+ "grad_norm": 0.6011854410171509,
87
+ "learning_rate": 0.00018951481098083322,
88
+ "loss": 2.2901,
89
+ "step": 450
90
+ },
91
+ {
92
+ "epoch": 0.5428881650380022,
93
+ "grad_norm": 0.6126257181167603,
94
+ "learning_rate": 0.00018678530414333524,
95
+ "loss": 2.3023,
96
+ "step": 500
97
+ },
98
+ {
99
+ "epoch": 0.5971769815418024,
100
+ "grad_norm": 0.6901931762695312,
101
+ "learning_rate": 0.00018376495001023636,
102
+ "loss": 2.2943,
103
+ "step": 550
104
+ },
105
+ {
106
+ "epoch": 0.6514657980456026,
107
+ "grad_norm": 0.6403626203536987,
108
+ "learning_rate": 0.00018046387082331516,
109
+ "loss": 2.2696,
110
+ "step": 600
111
+ },
112
+ {
113
+ "epoch": 0.6514657980456026,
114
+ "eval_loss": 2.2626566886901855,
115
+ "eval_runtime": 7.335,
116
+ "eval_samples_per_second": 82.072,
117
+ "eval_steps_per_second": 2.59,
118
+ "step": 600
119
  }
120
  ],
121
  "logging_steps": 50,
 
144
  "attributes": {}
145
  }
146
  },
147
+ "total_flos": 1.6793449133565542e+17,
148
  "train_batch_size": 32,
149
  "trial_name": null,
150
  "trial_params": null