mizzaay committed on
Commit
89a13f0
·
verified ·
1 Parent(s): da734c0

Run 8. Outer Step 46. Inner Step 86.

Browse files
Files changed (4) hide show
  1. config.json +16 -8
  2. gradients.pt +1 -1
  3. inner_optimizer.pt +1 -1
  4. model.safetensors +1 -1
config.json CHANGED
@@ -264,20 +264,28 @@
264
  "attention_bias": false,
265
  "attention_dropout": 0.0,
266
  "block_list": [
267
- 6371686,
268
- 6371707,
269
- 6371728,
270
- 6371747,
271
- 6371767,
272
- 6371786,
273
- 6371806
 
 
 
 
 
 
 
 
274
  ],
275
  "bos_token_id": 1,
276
  "eos_token_id": 2,
277
  "hidden_act": "silu",
278
  "hidden_size": 2048,
279
  "initializer_range": 0.02,
280
- "inner_step": 47,
281
  "intermediate_size": 5632,
282
  "last_allreduce_block": 6371430,
283
  "max_position_embeddings": 2048,
 
264
  "attention_bias": false,
265
  "attention_dropout": 0.0,
266
  "block_list": [
267
+ 6371841,
268
+ 6371852,
269
+ 6371861,
270
+ 6371870,
271
+ 6371878,
272
+ 6371885,
273
+ 6371896,
274
+ 6371906,
275
+ 6371915,
276
+ 6371925,
277
+ 6371932,
278
+ 6371940,
279
+ 6371950,
280
+ 6371959,
281
+ 6371969
282
  ],
283
  "bos_token_id": 1,
284
  "eos_token_id": 2,
285
  "hidden_act": "silu",
286
  "hidden_size": 2048,
287
  "initializer_range": 0.02,
288
+ "inner_step": 85,
289
  "intermediate_size": 5632,
290
  "last_allreduce_block": 6371430,
291
  "max_position_embeddings": 2048,
gradients.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c7de41930fafd3b14a63efedd48513f0dbcd1f589b8aa004470131996584d4f8
3
  size 88389626
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f02d21fa0f07f63081c471bcfca98f96c752cd1f7bcc8f443b92e1d4e5ea3c5
3
  size 88389626
inner_optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:33f07ddcb35b8f567b1354130b85bc7ef893ddbfc75e50be6772591de9f906b1
3
  size 4924926906
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:63e14c00572674953b077f60a4e379ae878ca60ba963d8ecfb1588c40649c8ba
3
  size 4924926906
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c784889993bb46851a5d32d5e6d26f503268ec1bda646d4825da6f259dc31b5e
3
  size 4400216536
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cf31ee2003bd0272a5071ae1da513686abc6740262ab38fde5eec5cac02229c1
3
  size 4400216536