kmfoda committed on
Commit
48918e6
·
verified ·
1 Parent(s): 963652e

Run 4. Outer Step 18. Inner Step 0. Peers 94.

Browse files
Files changed (4) hide show
  1. config.json +22 -22
  2. inner_optimizer.pt +1 -1
  3. model.safetensors +1 -1
  4. outer_optimizer.pt +1 -1
config.json CHANGED
@@ -11,8 +11,8 @@
11
  "103": "NON_PARTICIPATING",
12
  "104": "NON_PARTICIPATING",
13
  "105": "NON_PARTICIPATING",
14
- "106": "NON_PARTICIPATING",
15
- "107": "SUCCESS",
16
  "108": "NON_PARTICIPATING",
17
  "109": "SUCCESS",
18
  "11": "NON_PARTICIPATING",
@@ -26,24 +26,24 @@
26
  "117": "NON_PARTICIPATING",
27
  "118": "NON_PARTICIPATING",
28
  "119": "NON_PARTICIPATING",
29
- "12": "FAIL",
30
  "120": "SUCCESS",
31
  "121": "NON_PARTICIPATING",
32
  "122": "NON_PARTICIPATING",
33
- "123": "NON_PARTICIPATING",
34
  "124": "NON_PARTICIPATING",
35
  "125": "NON_PARTICIPATING",
36
  "126": "NON_PARTICIPATING",
37
  "127": "SUCCESS",
38
  "128": "NON_PARTICIPATING",
39
- "129": "SUCCESS",
40
  "13": "NON_PARTICIPATING",
41
  "130": "NON_PARTICIPATING",
42
  "131": "NON_PARTICIPATING",
43
  "132": "SUCCESS",
44
  "133": "NON_PARTICIPATING",
45
  "134": "NON_PARTICIPATING",
46
- "135": "SUCCESS",
47
  "136": "NON_PARTICIPATING",
48
  "137": "NON_PARTICIPATING",
49
  "138": "NON_PARTICIPATING",
@@ -58,14 +58,14 @@
58
  "146": "NON_PARTICIPATING",
59
  "147": "SUCCESS",
60
  "148": "SUCCESS",
61
- "149": "NON_PARTICIPATING",
62
  "15": "SUCCESS",
63
  "150": "SUCCESS",
64
  "151": "NON_PARTICIPATING",
65
  "152": "NON_PARTICIPATING",
66
  "153": "NON_PARTICIPATING",
67
  "154": "SUCCESS",
68
- "155": "SUCCESS",
69
  "156": "SUCCESS",
70
  "157": "NON_PARTICIPATING",
71
  "158": "NON_PARTICIPATING",
@@ -78,7 +78,7 @@
78
  "164": "NON_PARTICIPATING",
79
  "165": "NON_PARTICIPATING",
80
  "166": "NON_PARTICIPATING",
81
- "167": "NON_PARTICIPATING",
82
  "168": "SUCCESS",
83
  "169": "NON_PARTICIPATING",
84
  "17": "SUCCESS",
@@ -99,7 +99,7 @@
99
  "183": "NON_PARTICIPATING",
100
  "184": "NON_PARTICIPATING",
101
  "185": "NON_PARTICIPATING",
102
- "186": "SUCCESS",
103
  "187": "SUCCESS",
104
  "188": "NON_PARTICIPATING",
105
  "189": "NON_PARTICIPATING",
@@ -109,7 +109,7 @@
109
  "192": "SUCCESS",
110
  "193": "SUCCESS",
111
  "194": "NON_PARTICIPATING",
112
- "195": "NON_PARTICIPATING",
113
  "196": "NON_PARTICIPATING",
114
  "197": "NON_PARTICIPATING",
115
  "198": "NON_PARTICIPATING",
@@ -148,7 +148,7 @@
148
  "227": "NON_PARTICIPATING",
149
  "228": "NON_PARTICIPATING",
150
  "229": "NON_PARTICIPATING",
151
- "23": "SUCCESS",
152
  "230": "NON_PARTICIPATING",
153
  "231": "SUCCESS",
154
  "232": "NON_PARTICIPATING",
@@ -161,10 +161,10 @@
161
  "239": "NON_PARTICIPATING",
162
  "24": "SUCCESS",
163
  "240": "NON_PARTICIPATING",
164
- "241": "SUCCESS",
165
  "242": "NON_PARTICIPATING",
166
  "243": "NON_PARTICIPATING",
167
- "244": "NON_PARTICIPATING",
168
  "245": "NON_PARTICIPATING",
169
  "246": "NON_PARTICIPATING",
170
  "247": "SUCCESS",
@@ -179,7 +179,7 @@
179
  "255": "NON_PARTICIPATING",
180
  "26": "SUCCESS",
181
  "27": "SUCCESS",
182
- "28": "NON_PARTICIPATING",
183
  "29": "SUCCESS",
184
  "3": "NON_PARTICIPATING",
185
  "30": "NON_PARTICIPATING",
@@ -193,7 +193,7 @@
193
  "38": "NON_PARTICIPATING",
194
  "39": "NON_PARTICIPATING",
195
  "4": "NON_PARTICIPATING",
196
- "40": "FAIL",
197
  "41": "SUCCESS",
198
  "42": "NON_PARTICIPATING",
199
  "43": "SUCCESS",
@@ -211,12 +211,12 @@
211
  "54": "NON_PARTICIPATING",
212
  "55": "SUCCESS",
213
  "56": "SUCCESS",
214
- "57": "NON_PARTICIPATING",
215
  "58": "SUCCESS",
216
  "59": "NON_PARTICIPATING",
217
- "6": "SUCCESS",
218
  "60": "NON_PARTICIPATING",
219
- "61": "SUCCESS",
220
  "62": "SUCCESS",
221
  "63": "SUCCESS",
222
  "64": "NON_PARTICIPATING",
@@ -242,7 +242,7 @@
242
  "82": "SUCCESS",
243
  "83": "NON_PARTICIPATING",
244
  "84": "SUCCESS",
245
- "85": "SUCCESS",
246
  "86": "NON_PARTICIPATING",
247
  "87": "SUCCESS",
248
  "88": "SUCCESS",
@@ -256,7 +256,7 @@
256
  "95": "SUCCESS",
257
  "96": "SUCCESS",
258
  "97": "NON_PARTICIPATING",
259
- "98": "SUCCESS",
260
  "99": "SUCCESS"
261
  },
262
  "architectures": [
@@ -275,7 +275,7 @@
275
  "initializer_range": 0.02,
276
  "inner_step": 0,
277
  "inner_steps": 0,
278
- "last_allreduce_block": 5519126,
279
  "layer_norm_epsilon": 1e-05,
280
  "model_type": "gpt_optimized",
281
  "n_embd": 1280,
 
11
  "103": "NON_PARTICIPATING",
12
  "104": "NON_PARTICIPATING",
13
  "105": "NON_PARTICIPATING",
14
+ "106": "SUCCESS",
15
+ "107": "NON_PARTICIPATING",
16
  "108": "NON_PARTICIPATING",
17
  "109": "SUCCESS",
18
  "11": "NON_PARTICIPATING",
 
26
  "117": "NON_PARTICIPATING",
27
  "118": "NON_PARTICIPATING",
28
  "119": "NON_PARTICIPATING",
29
+ "12": "SUCCESS",
30
  "120": "SUCCESS",
31
  "121": "NON_PARTICIPATING",
32
  "122": "NON_PARTICIPATING",
33
+ "123": "SUCCESS",
34
  "124": "NON_PARTICIPATING",
35
  "125": "NON_PARTICIPATING",
36
  "126": "NON_PARTICIPATING",
37
  "127": "SUCCESS",
38
  "128": "NON_PARTICIPATING",
39
+ "129": "NON_PARTICIPATING",
40
  "13": "NON_PARTICIPATING",
41
  "130": "NON_PARTICIPATING",
42
  "131": "NON_PARTICIPATING",
43
  "132": "SUCCESS",
44
  "133": "NON_PARTICIPATING",
45
  "134": "NON_PARTICIPATING",
46
+ "135": "FAIL",
47
  "136": "NON_PARTICIPATING",
48
  "137": "NON_PARTICIPATING",
49
  "138": "NON_PARTICIPATING",
 
58
  "146": "NON_PARTICIPATING",
59
  "147": "SUCCESS",
60
  "148": "SUCCESS",
61
+ "149": "SUCCESS",
62
  "15": "SUCCESS",
63
  "150": "SUCCESS",
64
  "151": "NON_PARTICIPATING",
65
  "152": "NON_PARTICIPATING",
66
  "153": "NON_PARTICIPATING",
67
  "154": "SUCCESS",
68
+ "155": "NON_PARTICIPATING",
69
  "156": "SUCCESS",
70
  "157": "NON_PARTICIPATING",
71
  "158": "NON_PARTICIPATING",
 
78
  "164": "NON_PARTICIPATING",
79
  "165": "NON_PARTICIPATING",
80
  "166": "NON_PARTICIPATING",
81
+ "167": "SUCCESS",
82
  "168": "SUCCESS",
83
  "169": "NON_PARTICIPATING",
84
  "17": "SUCCESS",
 
99
  "183": "NON_PARTICIPATING",
100
  "184": "NON_PARTICIPATING",
101
  "185": "NON_PARTICIPATING",
102
+ "186": "NON_PARTICIPATING",
103
  "187": "SUCCESS",
104
  "188": "NON_PARTICIPATING",
105
  "189": "NON_PARTICIPATING",
 
109
  "192": "SUCCESS",
110
  "193": "SUCCESS",
111
  "194": "NON_PARTICIPATING",
112
+ "195": "SUCCESS",
113
  "196": "NON_PARTICIPATING",
114
  "197": "NON_PARTICIPATING",
115
  "198": "NON_PARTICIPATING",
 
148
  "227": "NON_PARTICIPATING",
149
  "228": "NON_PARTICIPATING",
150
  "229": "NON_PARTICIPATING",
151
+ "23": "NON_PARTICIPATING",
152
  "230": "NON_PARTICIPATING",
153
  "231": "SUCCESS",
154
  "232": "NON_PARTICIPATING",
 
161
  "239": "NON_PARTICIPATING",
162
  "24": "SUCCESS",
163
  "240": "NON_PARTICIPATING",
164
+ "241": "NON_PARTICIPATING",
165
  "242": "NON_PARTICIPATING",
166
  "243": "NON_PARTICIPATING",
167
+ "244": "SUCCESS",
168
  "245": "NON_PARTICIPATING",
169
  "246": "NON_PARTICIPATING",
170
  "247": "SUCCESS",
 
179
  "255": "NON_PARTICIPATING",
180
  "26": "SUCCESS",
181
  "27": "SUCCESS",
182
+ "28": "SUCCESS",
183
  "29": "SUCCESS",
184
  "3": "NON_PARTICIPATING",
185
  "30": "NON_PARTICIPATING",
 
193
  "38": "NON_PARTICIPATING",
194
  "39": "NON_PARTICIPATING",
195
  "4": "NON_PARTICIPATING",
196
+ "40": "SUCCESS",
197
  "41": "SUCCESS",
198
  "42": "NON_PARTICIPATING",
199
  "43": "SUCCESS",
 
211
  "54": "NON_PARTICIPATING",
212
  "55": "SUCCESS",
213
  "56": "SUCCESS",
214
+ "57": "SUCCESS",
215
  "58": "SUCCESS",
216
  "59": "NON_PARTICIPATING",
217
+ "6": "NON_PARTICIPATING",
218
  "60": "NON_PARTICIPATING",
219
+ "61": "NON_PARTICIPATING",
220
  "62": "SUCCESS",
221
  "63": "SUCCESS",
222
  "64": "NON_PARTICIPATING",
 
242
  "82": "SUCCESS",
243
  "83": "NON_PARTICIPATING",
244
  "84": "SUCCESS",
245
+ "85": "NON_PARTICIPATING",
246
  "86": "NON_PARTICIPATING",
247
  "87": "SUCCESS",
248
  "88": "SUCCESS",
 
256
  "95": "SUCCESS",
257
  "96": "SUCCESS",
258
  "97": "NON_PARTICIPATING",
259
+ "98": "NON_PARTICIPATING",
260
  "99": "SUCCESS"
261
  },
262
  "architectures": [
 
275
  "initializer_range": 0.02,
276
  "inner_step": 0,
277
  "inner_steps": 0,
278
+ "last_allreduce_block": 5521055,
279
  "layer_norm_epsilon": 1e-05,
280
  "model_type": "gpt_optimized",
281
  "n_embd": 1280,
inner_optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:10830bc00559ccf8a293f4be576a18f1352821f549e0dced9436d1ad2cf3c773
3
  size 8081782026
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3fad8d26d218d5febfefa226730354b8b78ed19eac1eaacdc2751d68aa1369b7
3
  size 8081782026
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:145efa78d321610330e93c04f650bbd8d5b72dab897e00c1fb1b65c643ef605c
3
  size 4040701744
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d6c772547e50bb8df295b8a3259781cb1a77ba735054f047b439999536613083
3
  size 4040701744
outer_optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ceb8520c44989f8d9ea4f58fb94ce8c77eaec5d17461ff9c3d91fb928b24cd31
3
  size 4040805354
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ad0f50c612952d8c3a9ce40d1612d0d3d28481b3a19cafba711c54c209864af
3
  size 4040805354