snoopsy committed on
Commit
07ca79b
·
verified ·
1 Parent(s): 98eec5e

Run 4. Outer Step 46. Inner Step 16.

Browse files
Files changed (3) hide show
  1. config.json +31 -34
  2. inner_optimizer.pt +1 -1
  3. model.safetensors +1 -1
config.json CHANGED
@@ -268,46 +268,43 @@
268
  "AutoModelForCausalLM": "distributed/optimized-gpt2-500m--modeling_gpt_optimized.GPTOptim"
269
  },
270
  "block_list": [
271
- 5567569,
272
- 5567570,
273
- 5567571,
274
- 5567571,
275
- 5567573,
276
- 5567573,
277
- 5567574,
278
- 5567575,
279
- 5567577,
280
- 5567577,
281
- 5567578,
282
- 5567579,
283
- 5567580,
284
- 5567580,
285
- 5567581,
286
- 5567582,
287
- 5567582,
288
- 5567583,
289
- 5567584,
290
- 5567585,
291
- 5567586,
292
- 5567587,
293
- 5567587,
294
- 5567588,
295
- 5567589,
296
- 5567590,
297
- 5567591,
298
- 5567592,
299
- 5567592,
300
- 5567593,
301
- 5567593,
302
- 5567594,
303
- 5567595
304
  ],
305
  "block_size": 1024,
306
  "bos_token_id": 50256,
307
  "embd_pdrop": 0.1,
308
  "eos_token_id": 50256,
309
  "initializer_range": 0.02,
310
- "inner_step": 14,
311
  "inner_steps": 0,
312
  "last_allreduce_block": 5566279,
313
  "layer_norm_epsilon": 1e-05,
 
268
  "AutoModelForCausalLM": "distributed/optimized-gpt2-500m--modeling_gpt_optimized.GPTOptim"
269
  },
270
  "block_list": [
271
+ 5567596,
272
+ 5567597,
273
+ 5567598,
274
+ 5567599,
275
+ 5567600,
276
+ 5567601,
277
+ 5567602,
278
+ 5567603,
279
+ 5567604,
280
+ 5567605,
281
+ 5567606,
282
+ 5567607,
283
+ 5567608,
284
+ 5567609,
285
+ 5567611,
286
+ 5567612,
287
+ 5567613,
288
+ 5567613,
289
+ 5567614,
290
+ 5567615,
291
+ 5567615,
292
+ 5567616,
293
+ 5567617,
294
+ 5567617,
295
+ 5567618,
296
+ 5567619,
297
+ 5567620,
298
+ 5567620,
299
+ 5567621,
300
+ 5567622
 
 
 
301
  ],
302
  "block_size": 1024,
303
  "bos_token_id": 50256,
304
  "embd_pdrop": 0.1,
305
  "eos_token_id": 50256,
306
  "initializer_range": 0.02,
307
+ "inner_step": 16,
308
  "inner_steps": 0,
309
  "last_allreduce_block": 5566279,
310
  "layer_norm_epsilon": 1e-05,
inner_optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9905698f2a72e79b10ecbc75e844388b5878cf3a27e1f3f7a756b2a6f685fe98
3
  size 8081782503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:afa103cbb63652d755057adc425bac80ca33b6299976ccea4cf33f0ab76234e3
3
  size 8081782503
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:490fa0b753a3ddd9809d15688b52fd5f2b4f54ed46ed559539a075e3cacc3ab5
3
  size 4040701744
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f9c79707caece442f204d06e498e5b25501bb998baae822f9f3abd31061dd0c
3
  size 4040701744