tensorwa commited on
Commit
69edc90
·
verified ·
1 Parent(s): f8ce117

Run 5. Outer Step 100. Inner Step 7.

Browse files
Files changed (3) hide show
  1. config.json +3 -3
  2. inner_optimizer.pt +1 -1
  3. model.safetensors +1 -1
config.json CHANGED
@@ -264,15 +264,15 @@
264
  "attention_bias": false,
265
  "attention_dropout": 0.0,
266
  "block_list": [
267
- 5870545,
268
- 5870577
269
  ],
270
  "bos_token_id": 1,
271
  "eos_token_id": 2,
272
  "hidden_act": "silu",
273
  "hidden_size": 2048,
274
  "initializer_range": 0.02,
275
- "inner_step": 5,
276
  "intermediate_size": 5632,
277
  "last_allreduce_block": 5864939,
278
  "max_position_embeddings": 2048,
 
264
  "attention_bias": false,
265
  "attention_dropout": 0.0,
266
  "block_list": [
267
+ 5870623,
268
+ 5870653
269
  ],
270
  "bos_token_id": 1,
271
  "eos_token_id": 2,
272
  "hidden_act": "silu",
273
  "hidden_size": 2048,
274
  "initializer_range": 0.02,
275
+ "inner_step": 7,
276
  "intermediate_size": 5632,
277
  "last_allreduce_block": 5864939,
278
  "max_position_embeddings": 2048,
inner_optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4bf3a3a5c2267481d10fd1234419857653d935283e163986028296b5c6716610
3
  size 8800564561
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ad54ac71aa1f660b9b5077757ff8dca398ecb9a40a6760e8806529fef3f0693d
3
  size 8800564561
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a0ece02bdadf0ed94cd73dfe040fdfa77c0ab14de57c8cc12faa241bc91aa604
3
  size 4400216536
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:69556e1311ccafa88f8451b528474449af8f5eae2a7a01f06d835b97e4142e02
3
  size 4400216536