File size: 7,258 Bytes
9495b81
1295fd4
9495b81
e55ee3b
f17ccee
e314b01
e55ee3b
6eaa44b
 
 
dc38cce
6eaa44b
76de68e
6eaa44b
76de68e
6eaa44b
76de68e
54133c5
e314b01
6eaa44b
 
 
7778629
6eaa44b
 
 
 
7b242bb
458b9b9
6eaa44b
 
 
 
 
 
e314b01
 
6eaa44b
54133c5
fff2230
e55ee3b
bb53b84
458b9b9
fc1e620
e314b01
6eaa44b
dae6c16
aae2ad2
76de68e
458b9b9
e314b01
861fbe5
76de68e
a3dc34f
76de68e
dae6c16
7b242bb
e314b01
995231e
54133c5
 
347d701
e55ee3b
fc1e620
6eaa44b
54133c5
 
e314b01
 
76de68e
83d63d4
fff2230
42d3475
7b242bb
fc1e620
6eaa44b
dae6c16
458b9b9
6eaa44b
76de68e
e314b01
7b242bb
6eaa44b
76de68e
e314b01
dc38cce
54133c5
458b9b9
6eaa44b
e55ee3b
7b242bb
6eaa44b
458b9b9
fc1e620
a1dbcb4
0f3cdb5
6eaa44b
1f4f982
e314b01
 
aae2ad2
6eaa44b
e314b01
0f2628a
54133c5
 
458b9b9
76de68e
 
cf4f37b
42d3475
6eaa44b
54133c5
7778629
76de68e
fc1e620
6eaa44b
 
fc1e620
54133c5
 
e55ee3b
6eaa44b
 
e55ee3b
9f1a5c2
76de68e
6eaa44b
7778629
6eaa44b
 
a3dc34f
6eaa44b
a3dc34f
0f2628a
76de68e
9b2c8e0
861fbe5
b775329
6eaa44b
 
54133c5
6eaa44b
e55ee3b
8eb3baa
76de68e
6eaa44b
 
2667f12
995231e
76de68e
54133c5
6eaa44b
cf2d0a5
6eaa44b
861fbe5
76de68e
6eaa44b
e314b01
861fbe5
83d63d4
e314b01
7b242bb
fc1e620
dae6c16
e55ee3b
76de68e
7b242bb
36dd80f
e314b01
2259eb9
76de68e
6eaa44b
1295fd4
6eaa44b
458b9b9
861fbe5
6eaa44b
995231e
36dd80f
e314b01
7778629
76de68e
531b490
7b242bb
fc1e620
e55ee3b
54133c5
7778629
531b490
6eaa44b
7b242bb
54133c5
76de68e
7b242bb
0f3cdb5
6eaa44b
0f2628a
f17ccee
54133c5
6eaa44b
e314b01
87a0f87
a3dc34f
6cc7786
861fbe5
8eb3baa
76de68e
6eaa44b
fc1e620
458b9b9
7b242bb
6eaa44b
42d3475
6eaa44b
76de68e
e314b01
 
76de68e
e314b01
6eaa44b
 
76de68e
6eaa44b
 
76de68e
6eaa44b
 
e314b01
6eaa44b
cf2d0a5
6eaa44b
54133c5
eea1c17
fc1e620
 
7b242bb
6eaa44b
76de68e
e55ee3b
e314b01
fc1e620
e314b01
76de68e
6eaa44b
 
531b490
c7bc7ef
76de68e
fc1e620
76de68e
6eaa44b
557febf
e314b01
dae6c16
e314b01
fc1e620
e314b01
6eaa44b
9495b81
 
 
 
 
 
0b557d2
13ddfc7
 
0b557d2
9495b81
 
 
 
 
13ddfc7
9495b81
6eaa44b
9495b81
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
{
  "_name_or_path": "distributed/llama-1b",
  "all_reduce_scores": {
    "0": "NOT_ALIVE",
    "1": "NON_PARTICIPATING",
    "10": "NON_PARTICIPATING",
    "100": "NOT_ALIVE",
    "101": "NON_PARTICIPATING",
    "102": "FAIL",
    "103": "NON_PARTICIPATING",
    "104": "NOT_ALIVE",
    "105": "FAIL",
    "106": "SUCCESS",
    "107": "FAIL",
    "108": "NON_PARTICIPATING",
    "109": "SUCCESS",
    "11": "NON_PARTICIPATING",
    "110": "NOT_ALIVE",
    "111": "SUCCESS",
    "112": "FAIL",
    "113": "FAIL",
    "114": "FAIL",
    "115": "NON_PARTICIPATING",
    "116": "NON_PARTICIPATING",
    "117": "NOT_ALIVE",
    "118": "FAIL",
    "119": "NOT_ALIVE",
    "12": "NON_PARTICIPATING",
    "120": "NOT_ALIVE",
    "121": "SUCCESS",
    "122": "NOT_ALIVE",
    "123": "FAIL",
    "124": "SUCCESS",
    "125": "FAIL",
    "126": "NOT_ALIVE",
    "127": "NON_PARTICIPATING",
    "128": "SUCCESS",
    "129": "NOT_ALIVE",
    "13": "SUCCESS",
    "130": "NOT_ALIVE",
    "131": "NOT_ALIVE",
    "132": "NOT_ALIVE",
    "133": "NOT_ALIVE",
    "134": "NOT_ALIVE",
    "135": "NON_PARTICIPATING",
    "136": "SUCCESS",
    "137": "NOT_ALIVE",
    "138": "NOT_ALIVE",
    "139": "NON_PARTICIPATING",
    "14": "NOT_ALIVE",
    "140": "SUCCESS",
    "141": "NON_PARTICIPATING",
    "142": "NON_PARTICIPATING",
    "143": "NOT_ALIVE",
    "144": "NON_PARTICIPATING",
    "145": "NOT_ALIVE",
    "146": "NON_PARTICIPATING",
    "147": "NON_PARTICIPATING",
    "148": "NON_PARTICIPATING",
    "149": "NOT_ALIVE",
    "15": "NOT_ALIVE",
    "150": "NOT_ALIVE",
    "151": "NOT_ALIVE",
    "152": "NOT_ALIVE",
    "153": "FAIL",
    "154": "NON_PARTICIPATING",
    "155": "NOT_ALIVE",
    "156": "NON_PARTICIPATING",
    "157": "NON_PARTICIPATING",
    "158": "NON_PARTICIPATING",
    "159": "SUCCESS",
    "16": "NOT_ALIVE",
    "160": "NOT_ALIVE",
    "161": "SUCCESS",
    "162": "NOT_ALIVE",
    "163": "NOT_ALIVE",
    "164": "NOT_ALIVE",
    "165": "NOT_ALIVE",
    "166": "NON_PARTICIPATING",
    "167": "NON_PARTICIPATING",
    "168": "SUCCESS",
    "169": "NON_PARTICIPATING",
    "17": "NOT_ALIVE",
    "170": "SUCCESS",
    "171": "NON_PARTICIPATING",
    "172": "NOT_ALIVE",
    "173": "NOT_ALIVE",
    "174": "NOT_ALIVE",
    "175": "SUCCESS",
    "176": "NOT_ALIVE",
    "177": "NOT_ALIVE",
    "178": "NON_PARTICIPATING",
    "179": "NOT_ALIVE",
    "18": "NOT_ALIVE",
    "180": "NOT_ALIVE",
    "181": "NOT_ALIVE",
    "182": "NOT_ALIVE",
    "183": "NOT_ALIVE",
    "184": "FAIL",
    "185": "SUCCESS",
    "186": "NOT_ALIVE",
    "187": "NON_PARTICIPATING",
    "188": "SUCCESS",
    "189": "NOT_ALIVE",
    "19": "NOT_ALIVE",
    "190": "NOT_ALIVE",
    "191": "NOT_ALIVE",
    "192": "NOT_ALIVE",
    "193": "NON_PARTICIPATING",
    "194": "NOT_ALIVE",
    "195": "NOT_ALIVE",
    "196": "FAIL",
    "197": "NOT_ALIVE",
    "198": "SUCCESS",
    "199": "NON_PARTICIPATING",
    "2": "NOT_ALIVE",
    "20": "NON_PARTICIPATING",
    "200": "NOT_ALIVE",
    "201": "NOT_ALIVE",
    "202": "NOT_ALIVE",
    "203": "NOT_ALIVE",
    "204": "NOT_ALIVE",
    "205": "FAIL",
    "206": "SUCCESS",
    "207": "NOT_ALIVE",
    "208": "NOT_ALIVE",
    "209": "NON_PARTICIPATING",
    "21": "NON_PARTICIPATING",
    "210": "NON_PARTICIPATING",
    "211": "NON_PARTICIPATING",
    "212": "FAIL",
    "213": "NOT_ALIVE",
    "214": "NON_PARTICIPATING",
    "215": "NOT_ALIVE",
    "216": "NOT_ALIVE",
    "217": "NON_PARTICIPATING",
    "218": "NOT_ALIVE",
    "219": "NON_PARTICIPATING",
    "22": "NOT_ALIVE",
    "220": "NOT_ALIVE",
    "221": "NOT_ALIVE",
    "222": "NOT_ALIVE",
    "223": "NON_PARTICIPATING",
    "224": "NOT_ALIVE",
    "225": "NON_PARTICIPATING",
    "226": "NON_PARTICIPATING",
    "227": "NON_PARTICIPATING",
    "228": "NOT_ALIVE",
    "229": "NOT_ALIVE",
    "23": "NON_PARTICIPATING",
    "230": "NON_PARTICIPATING",
    "231": "SUCCESS",
    "232": "NOT_ALIVE",
    "233": "NON_PARTICIPATING",
    "234": "NOT_ALIVE",
    "235": "NOT_ALIVE",
    "236": "NON_PARTICIPATING",
    "237": "NOT_ALIVE",
    "238": "NON_PARTICIPATING",
    "239": "NON_PARTICIPATING",
    "24": "NOT_ALIVE",
    "240": "NON_PARTICIPATING",
    "241": "NOT_ALIVE",
    "242": "NOT_ALIVE",
    "243": "NOT_ALIVE",
    "244": "NOT_ALIVE",
    "245": "NON_PARTICIPATING",
    "246": "SUCCESS",
    "247": "NOT_ALIVE",
    "248": "SUCCESS",
    "249": "NOT_ALIVE",
    "25": "SUCCESS",
    "250": "NOT_ALIVE",
    "251": "NOT_ALIVE",
    "252": "NOT_ALIVE",
    "253": "NOT_ALIVE",
    "254": "NON_PARTICIPATING",
    "255": "FAIL",
    "26": "SUCCESS",
    "27": "NOT_ALIVE",
    "28": "SUCCESS",
    "29": "NON_PARTICIPATING",
    "3": "NOT_ALIVE",
    "30": "NON_PARTICIPATING",
    "31": "NON_PARTICIPATING",
    "32": "NOT_ALIVE",
    "33": "NOT_ALIVE",
    "34": "NOT_ALIVE",
    "35": "SUCCESS",
    "36": "NON_PARTICIPATING",
    "37": "NON_PARTICIPATING",
    "38": "NOT_ALIVE",
    "39": "NON_PARTICIPATING",
    "4": "NON_PARTICIPATING",
    "40": "SUCCESS",
    "41": "NOT_ALIVE",
    "42": "NOT_ALIVE",
    "43": "NOT_ALIVE",
    "44": "SUCCESS",
    "45": "NON_PARTICIPATING",
    "46": "NON_PARTICIPATING",
    "47": "NOT_ALIVE",
    "48": "NOT_ALIVE",
    "49": "NOT_ALIVE",
    "5": "NOT_ALIVE",
    "50": "NON_PARTICIPATING",
    "51": "NON_PARTICIPATING",
    "52": "SUCCESS",
    "53": "FAIL",
    "54": "NOT_ALIVE",
    "55": "NOT_ALIVE",
    "56": "NON_PARTICIPATING",
    "57": "SUCCESS",
    "58": "NOT_ALIVE",
    "59": "FAIL",
    "6": "NON_PARTICIPATING",
    "60": "NON_PARTICIPATING",
    "61": "SUCCESS",
    "62": "NON_PARTICIPATING",
    "63": "SUCCESS",
    "64": "FAIL",
    "65": "NOT_ALIVE",
    "66": "SUCCESS",
    "67": "NON_PARTICIPATING",
    "68": "NON_PARTICIPATING",
    "69": "NON_PARTICIPATING",
    "7": "FAIL",
    "70": "NON_PARTICIPATING",
    "71": "SUCCESS",
    "72": "SUCCESS",
    "73": "NOT_ALIVE",
    "74": "FAIL",
    "75": "NOT_ALIVE",
    "76": "NOT_ALIVE",
    "77": "NOT_ALIVE",
    "78": "NOT_ALIVE",
    "79": "NON_PARTICIPATING",
    "8": "FAIL",
    "80": "NON_PARTICIPATING",
    "81": "NOT_ALIVE",
    "82": "NON_PARTICIPATING",
    "83": "NOT_ALIVE",
    "84": "SUCCESS",
    "85": "NOT_ALIVE",
    "86": "FAIL",
    "87": "SUCCESS",
    "88": "NOT_ALIVE",
    "89": "SUCCESS",
    "9": "NON_PARTICIPATING",
    "90": "NOT_ALIVE",
    "91": "SUCCESS",
    "92": "FAIL",
    "93": "NOT_ALIVE",
    "94": "SUCCESS",
    "95": "NOT_ALIVE",
    "96": "SUCCESS",
    "97": "NOT_ALIVE",
    "98": "NOT_ALIVE",
    "99": "FAIL"
  },
  "architectures": [
    "LlamaForCausalLM"
  ],
  "attention_bias": false,
  "attention_dropout": 0.0,
  "block_list": [
    6517429,
    6517463
  ],
  "bos_token_id": 1,
  "eos_token_id": 2,
  "hidden_act": "silu",
  "hidden_size": 2048,
  "initializer_range": 0.02,
  "inner_step": 36,
  "intermediate_size": 5632,
  "last_allreduce_block": 6517148,
  "max_position_embeddings": 2048,
  "mlp_bias": false,
  "model_type": "llama",
  "num_attention_heads": 32,
  "num_hidden_layers": 22,
  "num_key_value_heads": 4,
  "pretraining_tp": 1,
  "rms_norm_eps": 1e-05,
  "rope_scaling": null,
  "rope_theta": 10000.0,
  "tie_word_embeddings": false,
  "torch_dtype": "float32",
  "transformers_version": "4.39.3",
  "use_cache": false,
  "vocab_size": 32000
}