zeras141a committed on
Commit
2565297
·
verified ·
1 Parent(s): 630d4d7

Run 4. Outer Step 50. Inner Step 9.

Browse files
Files changed (3) hide show
  1. config.json +18 -24
  2. inner_optimizer.pt +1 -1
  3. model.safetensors +1 -1
config.json CHANGED
@@ -268,36 +268,30 @@
268
  "AutoModelForCausalLM": "distributed/optimized-gpt2-500m--modeling_gpt_optimized.GPTOptim"
269
  },
270
  "block_list": [
271
- 5571801,
272
- 5571803,
273
- 5571804,
274
- 5571806,
275
- 5571807,
276
- 5571808,
277
- 5571810,
278
- 5571811,
279
- 5571812,
280
- 5571813,
281
- 5571814,
282
- 5571816,
283
- 5571818,
284
- 5571820,
285
- 5571821,
286
- 5571823,
287
- 5571824,
288
- 5571824,
289
- 5571825,
290
- 5571827,
291
- 5571828,
292
- 5571829,
293
- 5571830
294
  ],
295
  "block_size": 1024,
296
  "bos_token_id": 50256,
297
  "embd_pdrop": 0.1,
298
  "eos_token_id": 50256,
299
  "initializer_range": 0.02,
300
- "inner_step": 7,
301
  "inner_steps": 0,
302
  "last_allreduce_block": 5571611,
303
  "layer_norm_epsilon": 1e-05,
 
268
  "AutoModelForCausalLM": "distributed/optimized-gpt2-500m--modeling_gpt_optimized.GPTOptim"
269
  },
270
  "block_list": [
271
+ 5571832,
272
+ 5571834,
273
+ 5571835,
274
+ 5571836,
275
+ 5571836,
276
+ 5571838,
277
+ 5571839,
278
+ 5571840,
279
+ 5571842,
280
+ 5571843,
281
+ 5571845,
282
+ 5571846,
283
+ 5571848,
284
+ 5571850,
285
+ 5571851,
286
+ 5571853,
287
+ 5571854
 
 
 
 
 
 
288
  ],
289
  "block_size": 1024,
290
  "bos_token_id": 50256,
291
  "embd_pdrop": 0.1,
292
  "eos_token_id": 50256,
293
  "initializer_range": 0.02,
294
+ "inner_step": 9,
295
  "inner_steps": 0,
296
  "last_allreduce_block": 5571611,
297
  "layer_norm_epsilon": 1e-05,
inner_optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:88c03c430c8c03d57ae1e2173aea9c670149f68fb9157bd74a80510057be40fd
3
  size 8081782026
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6af042dd22fdb5d636501c5541404ff58c6476ac83ac99c9bcc51be0a11bedc4
3
  size 8081782026
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:18de05fc3d1e3f03e1e5893c87ce32417ab8036e2da92411a919ed572a6825d3
3
  size 4040701744
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e0760b860d6d5ae102e2a6515d4a3f1e0203e471e39f81d51a92b12fe7c475c5
3
  size 4040701744