zeras141a committed on
Commit
0683843
·
verified ·
1 Parent(s): 196dbb0

Run 4. Outer Step 49. Inner Step 54.

Browse files
Files changed (3) hide show
  1. config.json +28 -16
  2. inner_optimizer.pt +1 -1
  3. model.safetensors +1 -1
config.json CHANGED
@@ -268,28 +268,40 @@
268
  "AutoModelForCausalLM": "distributed/optimized-gpt2-500m--modeling_gpt_optimized.GPTOptim"
269
  },
270
  "block_list": [
271
- 5571272,
272
- 5571274,
273
- 5571275,
274
- 5571276,
275
- 5571277,
276
- 5571278,
277
- 5571279,
278
- 5571281,
279
- 5571283,
280
- 5571285,
281
- 5571287,
282
- 5571288,
283
- 5571289,
284
- 5571291,
285
- 5571293
 
 
 
 
 
 
 
 
 
 
 
 
286
  ],
287
  "block_size": 1024,
288
  "bos_token_id": 50256,
289
  "embd_pdrop": 0.1,
290
  "eos_token_id": 50256,
291
  "initializer_range": 0.02,
292
- "inner_step": 52,
293
  "inner_steps": 0,
294
  "last_allreduce_block": 5568918,
295
  "layer_norm_epsilon": 1e-05,
 
268
  "AutoModelForCausalLM": "distributed/optimized-gpt2-500m--modeling_gpt_optimized.GPTOptim"
269
  },
270
  "block_list": [
271
+ 5571296,
272
+ 5571298,
273
+ 5571299,
274
+ 5571300,
275
+ 5571303,
276
+ 5571304,
277
+ 5571306,
278
+ 5571307,
279
+ 5571309,
280
+ 5571311,
281
+ 5571312,
282
+ 5571314,
283
+ 5571316,
284
+ 5571317,
285
+ 5571318,
286
+ 5571319,
287
+ 5571320,
288
+ 5571321,
289
+ 5571323,
290
+ 5571324,
291
+ 5571326,
292
+ 5571327,
293
+ 5571328,
294
+ 5571330,
295
+ 5571332,
296
+ 5571333,
297
+ 5571335
298
  ],
299
  "block_size": 1024,
300
  "bos_token_id": 50256,
301
  "embd_pdrop": 0.1,
302
  "eos_token_id": 50256,
303
  "initializer_range": 0.02,
304
+ "inner_step": 54,
305
  "inner_steps": 0,
306
  "last_allreduce_block": 5568918,
307
  "layer_norm_epsilon": 1e-05,
inner_optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4ca75ae6bbf0d88a5f7989f5db1b1a41f21068e7f264507b15f3168272f64452
3
  size 8081782026
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c8bd33d05f200e3c04ebef7866597940ccc29202850a7d1fcd3703a2c661cda7
3
  size 8081782026
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:27d5adc7e5b91c2ab80a82e96c08798da11bbf633e1132c11dae4cb4d8788cbe
3
  size 4040701744
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:81f9e848e246bc067e07266cf453d8f578a04e65b8296b98cb912250b52cb176
3
  size 4040701744