ccore committed on
Commit
a5b7a27
·
verified ·
1 Parent(s): 232175d

Training in progress, epoch 11, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f7885054e8acee224f47a6214787de54a8e17c44666a2e5e04f3e50bca0784d9
3
  size 500979600
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:507e45593144bb2cf41c0598515e2ea5832f9e83502a991e35ca1fd8897d4b7b
3
  size 500979600
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:eba41fe33bf5d3cc182639775a215fcb12d809754c66c097a8ecaa8b888aef54
3
  size 1002078330
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:08bee2e0984bbf63dd98e3afe5ce279648b51a871ad71dbaa9c855446f016deb
3
  size 1002078330
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a28e556a4b8cdf7354da0e380ee4ea62220dba2a79a4bfa40e71ebba35883c5a
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2816efc9f4c1de5a16c78e02f2554b79cf809e4fff588f530d63512ba1508099
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:aa7ea7d3411b48ce3a693531a3b9df8c7497b173d8cca394cb86cb6010b5fee6
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:667845ec98850da2da09c9709aecd8f85bd67e83fe7c6e52d5a2e2d27bb40110
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "best_metric": 0.995110273361206,
3
- "best_model_checkpoint": "./opt_trained/checkpoint-2010",
4
- "epoch": 10.0,
5
  "eval_steps": 500,
6
- "global_step": 2010,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -115,6 +115,14 @@
115
  "eval_samples_per_second": 37.072,
116
  "eval_steps_per_second": 9.268,
117
  "step": 2010
 
 
 
 
 
 
 
 
118
  }
119
  ],
120
  "logging_steps": 500,
@@ -134,7 +142,7 @@
134
  "attributes": {}
135
  }
136
  },
137
- "total_flos": 6.76635109632e+16,
138
  "train_batch_size": 16,
139
  "trial_name": null,
140
  "trial_params": null
 
1
  {
2
+ "best_metric": 0.9924370050430298,
3
+ "best_model_checkpoint": "./opt_trained/checkpoint-2211",
4
+ "epoch": 11.0,
5
  "eval_steps": 500,
6
+ "global_step": 2211,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
115
  "eval_samples_per_second": 37.072,
116
  "eval_steps_per_second": 9.268,
117
  "step": 2010
118
+ },
119
+ {
120
+ "epoch": 11.0,
121
+ "eval_loss": 0.9924370050430298,
122
+ "eval_runtime": 77.2049,
123
+ "eval_samples_per_second": 36.992,
124
+ "eval_steps_per_second": 9.248,
125
+ "step": 2211
126
  }
127
  ],
128
  "logging_steps": 500,
 
142
  "attributes": {}
143
  }
144
  },
145
+ "total_flos": 7.442986205952e+16,
146
  "train_batch_size": 16,
147
  "trial_name": null,
148
  "trial_params": null