philip324mark committed on
Commit
d79b99e
·
verified ·
1 Parent(s): 1467de4

Run 4. Outer Step 51. Inner Step 0.

Browse files
Files changed (3) hide show
  1. config.json +2 -9
  2. inner_optimizer.pt +1 -1
  3. model.safetensors +1 -1
config.json CHANGED
@@ -267,20 +267,13 @@
267
  "AutoConfig": "distributed/optimized-gpt2-500m--configuration_gpt_optimized.GPTOptimConfig",
268
  "AutoModelForCausalLM": "distributed/optimized-gpt2-500m--modeling_gpt_optimized.GPTOptim"
269
  },
270
- "block_list": [
271
- 5573117,
272
- 5573121,
273
- 5573125,
274
- 5573129,
275
- 5573133,
276
- 5573137
277
- ],
278
  "block_size": 1024,
279
  "bos_token_id": 50256,
280
  "embd_pdrop": 0.1,
281
  "eos_token_id": 50256,
282
  "initializer_range": 0.02,
283
- "inner_step": 53,
284
  "inner_steps": 0,
285
  "last_allreduce_block": 5556551,
286
  "layer_norm_epsilon": 1e-05,
 
267
  "AutoConfig": "distributed/optimized-gpt2-500m--configuration_gpt_optimized.GPTOptimConfig",
268
  "AutoModelForCausalLM": "distributed/optimized-gpt2-500m--modeling_gpt_optimized.GPTOptim"
269
  },
270
+ "block_list": [],
 
 
 
 
 
 
 
271
  "block_size": 1024,
272
  "bos_token_id": 50256,
273
  "embd_pdrop": 0.1,
274
  "eos_token_id": 50256,
275
  "initializer_range": 0.02,
276
+ "inner_step": 0,
277
  "inner_steps": 0,
278
  "last_allreduce_block": 5556551,
279
  "layer_norm_epsilon": 1e-05,
inner_optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9e60c70db34033cef47a282570bd190631172a788868d6c616aedd1c7b9c5b5c
3
  size 8081782026
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:afc1022d06288f80cfe8d9e8af1bf135177ba6d81ef37d497d50a46a3f47888d
3
  size 8081782026
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3363d277addb0ef7dc3e3f59c7f166f20f5fce0c21e5373223224f5c47d002f1
3
  size 4040701744
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:77e590ef20a1bd176a3f886e26b681c4fb6b45e332f2f1e36379c41fce91f1e7
3
  size 4040701744