zeras141a committed on
Commit
ebc031f
·
verified ·
1 Parent(s): f046064

Run 8. Outer Step 40. Inner Step 200.

Browse files
Files changed (4) hide show
  1. config.json +3 -18
  2. gradients.pt +1 -1
  3. inner_optimizer.pt +1 -1
  4. model.safetensors +1 -1
config.json CHANGED
@@ -264,30 +264,15 @@
264
  "attention_bias": false,
265
  "attention_dropout": 0.0,
266
  "block_list": [
267
- 6365538,
268
- 6365557,
269
- 6365573,
270
- 6365593,
271
- 6365614,
272
- 6365634,
273
- 6365656,
274
- 6365676,
275
- 6365696,
276
- 6365717,
277
- 6365739,
278
- 6365759,
279
- 6365779,
280
- 6365801,
281
- 6365824,
282
- 6365845,
283
- 6365870
284
  ],
285
  "bos_token_id": 1,
286
  "eos_token_id": 2,
287
  "hidden_act": "silu",
288
  "hidden_size": 2048,
289
  "initializer_range": 0.02,
290
- "inner_step": 195,
291
  "intermediate_size": 5632,
292
  "last_allreduce_block": 6361535,
293
  "max_position_embeddings": 2048,
 
264
  "attention_bias": false,
265
  "attention_dropout": 0.0,
266
  "block_list": [
267
+ 6366247,
268
+ 6366266
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
269
  ],
270
  "bos_token_id": 1,
271
  "eos_token_id": 2,
272
  "hidden_act": "silu",
273
  "hidden_size": 2048,
274
  "initializer_range": 0.02,
275
+ "inner_step": 200,
276
  "intermediate_size": 5632,
277
  "last_allreduce_block": 6361535,
278
  "max_position_embeddings": 2048,
gradients.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c60723145730314d77498a424f0ebef6b2310f772753117bed4ff90f0fbe1d4f
3
  size 88389626
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:25562e9ccd7b575224f68d6e32f63ae6613ca7969d72716e113b81e2e67533a8
3
  size 88389626
inner_optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b7e1372483948c55a0c351f72f935853e863fc605a9bd4f3c02dbd42f85269fa
3
  size 4924926906
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4306ddbd60691f266ebd0ce73b65f1253a4890e03696392238c0acd844915bac
3
  size 4924926906
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7c57be6c0ecaabdf0b5ada8372cd478ee99986fea3039bc025959a7a013604b5
3
  size 4400216536
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c95f0cce0db66ab358376c30c792df4e00fcc4ac64db69582c16ac23bbfb6e0c
3
  size 4400216536