File size: 7,740 Bytes
c8c4408
 
 
 
 
 
fd607f3
c8c4408
fd607f3
cb22076
f30a816
c9779cd
c8c4408
79fa11f
c8c4408
 
 
 
9293ca0
c9779cd
c8c4408
 
9293ca0
c8c4408
f30a816
791d9d9
8f27b49
c8c4408
fa7ee81
c8c4408
791d9d9
fd607f3
e45db3d
c8c4408
 
a00a99e
5eeb558
532a9e0
c8c4408
 
 
9293ca0
fa7ee81
 
9293ca0
a00a99e
ca41a79
5eeb558
a00a99e
c8c4408
791d9d9
cb22076
791d9d9
79fa11f
a00a99e
79fa11f
fd607f3
c8c4408
a00a99e
 
791d9d9
c8c4408
a00a99e
c8c4408
f30a816
791d9d9
 
c9779cd
c8c4408
79fa11f
791d9d9
c8c4408
fa7ee81
c8c4408
a00a99e
 
791d9d9
79fa11f
a00a99e
f30a816
a00a99e
 
c8c4408
fa7ee81
9293ca0
cb22076
fd607f3
79fa11f
cb22076
c8c4408
 
9293ca0
c8c4408
 
a00a99e
fd607f3
a00a99e
 
d6a657e
79fa11f
791d9d9
79fa11f
a00a99e
d6a657e
c8c4408
cb22076
a00a99e
 
791d9d9
c8c4408
 
 
79fa11f
c9779cd
c8c4408
5eeb558
c8c4408
5eeb558
9293ca0
fa7ee81
79fa11f
d6a657e
a00a99e
cb22076
c8c4408
 
fd607f3
c8c4408
79fa11f
e45db3d
 
cb22076
9293ca0
fd607f3
da64111
791d9d9
fa7ee81
791d9d9
c8c4408
8f27b49
c8c4408
 
fa7ee81
ca41a79
791d9d9
a00a99e
c8c4408
fd607f3
c8c4408
 
a00a99e
c8c4408
 
79fa11f
f426a39
c8c4408
fd607f3
a00a99e
fa7ee81
ca41a79
c8c4408
 
e45db3d
791d9d9
c8c4408
9293ca0
c8c4408
a00a99e
c9779cd
c8c4408
 
 
a00a99e
c8c4408
fa7ee81
791d9d9
a00a99e
791d9d9
532a9e0
e45db3d
791d9d9
 
79fa11f
c8c4408
f30a816
fa7ee81
cb22076
ca41a79
da64111
a00a99e
9293ca0
c8c4408
 
 
f30a816
fd607f3
791d9d9
da64111
a00a99e
9293ca0
f30a816
c8c4408
532a9e0
a00a99e
c8c4408
 
 
f30a816
fa7ee81
c8c4408
a00a99e
d6a657e
c8c4408
 
a00a99e
c8c4408
da64111
c8c4408
 
fa7ee81
c9779cd
79fa11f
c9779cd
c8c4408
 
5eeb558
c8c4408
fa7ee81
fd607f3
c8c4408
f30a816
fd607f3
532a9e0
79fa11f
791d9d9
a00a99e
c8c4408
 
 
a00a99e
cb22076
791d9d9
f426a39
c8c4408
a00a99e
c8c4408
 
 
 
 
 
79fa11f
fa7ee81
a00a99e
5eeb558
a00a99e
c8c4408
fd607f3
791d9d9
c8c4408
 
 
 
 
 
 
ab16e39
 
c8c4408
 
 
 
 
 
ab16e39
c8c4408
a00a99e
c8c4408
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
{
  "_name_or_path": "distributed/llama-1b",
  "all_reduce_scores": {
    "0": "NOT_ALIVE",
    "1": "NOT_ALIVE",
    "10": "NOT_ALIVE",
    "100": "NON_PARTICIPATING",
    "101": "NOT_ALIVE",
    "102": "NON_PARTICIPATING",
    "103": "NON_PARTICIPATING",
    "104": "NOT_ALIVE",
    "105": "NON_PARTICIPATING",
    "106": "NOT_ALIVE",
    "107": "NOT_ALIVE",
    "108": "NON_PARTICIPATING",
    "109": "NOT_ALIVE",
    "11": "NOT_ALIVE",
    "110": "NOT_ALIVE",
    "111": "NON_PARTICIPATING",
    "112": "NON_PARTICIPATING",
    "113": "NOT_ALIVE",
    "114": "NOT_ALIVE",
    "115": "NON_PARTICIPATING",
    "116": "NOT_ALIVE",
    "117": "NOT_ALIVE",
    "118": "NON_PARTICIPATING",
    "119": "NON_PARTICIPATING",
    "12": "NOT_ALIVE",
    "120": "NOT_ALIVE",
    "121": "NOT_ALIVE",
    "122": "NON_PARTICIPATING",
    "123": "NON_PARTICIPATING",
    "124": "NON_PARTICIPATING",
    "125": "NOT_ALIVE",
    "126": "NOT_ALIVE",
    "127": "NOT_ALIVE",
    "128": "NON_PARTICIPATING",
    "129": "NOT_ALIVE",
    "13": "NOT_ALIVE",
    "130": "NOT_ALIVE",
    "131": "NOT_ALIVE",
    "132": "NOT_ALIVE",
    "133": "NON_PARTICIPATING",
    "134": "NOT_ALIVE",
    "135": "NON_PARTICIPATING",
    "136": "NON_PARTICIPATING",
    "137": "NON_PARTICIPATING",
    "138": "NON_PARTICIPATING",
    "139": "SUCCESS",
    "14": "NOT_ALIVE",
    "140": "NON_PARTICIPATING",
    "141": "NON_PARTICIPATING",
    "142": "NON_PARTICIPATING",
    "143": "NOT_ALIVE",
    "144": "NOT_ALIVE",
    "145": "NOT_ALIVE",
    "146": "NON_PARTICIPATING",
    "147": "NOT_ALIVE",
    "148": "SUCCESS",
    "149": "NON_PARTICIPATING",
    "15": "SUCCESS",
    "150": "NOT_ALIVE",
    "151": "NOT_ALIVE",
    "152": "NOT_ALIVE",
    "153": "NOT_ALIVE",
    "154": "NON_PARTICIPATING",
    "155": "NON_PARTICIPATING",
    "156": "NOT_ALIVE",
    "157": "NOT_ALIVE",
    "158": "NON_PARTICIPATING",
    "159": "NON_PARTICIPATING",
    "16": "NOT_ALIVE",
    "160": "NON_PARTICIPATING",
    "161": "NON_PARTICIPATING",
    "162": "NOT_ALIVE",
    "163": "NON_PARTICIPATING",
    "164": "NON_PARTICIPATING",
    "165": "NON_PARTICIPATING",
    "166": "NON_PARTICIPATING",
    "167": "NOT_ALIVE",
    "168": "NOT_ALIVE",
    "169": "NOT_ALIVE",
    "17": "NOT_ALIVE",
    "170": "NON_PARTICIPATING",
    "171": "NON_PARTICIPATING",
    "172": "NOT_ALIVE",
    "173": "NON_PARTICIPATING",
    "174": "NON_PARTICIPATING",
    "175": "NON_PARTICIPATING",
    "176": "NOT_ALIVE",
    "177": "NOT_ALIVE",
    "178": "NON_PARTICIPATING",
    "179": "NON_PARTICIPATING",
    "18": "NOT_ALIVE",
    "180": "NON_PARTICIPATING",
    "181": "NOT_ALIVE",
    "182": "NOT_ALIVE",
    "183": "NON_PARTICIPATING",
    "184": "NON_PARTICIPATING",
    "185": "NON_PARTICIPATING",
    "186": "NON_PARTICIPATING",
    "187": "NOT_ALIVE",
    "188": "NOT_ALIVE",
    "189": "NON_PARTICIPATING",
    "19": "NOT_ALIVE",
    "190": "NOT_ALIVE",
    "191": "NON_PARTICIPATING",
    "192": "NOT_ALIVE",
    "193": "SUCCESS",
    "194": "NON_PARTICIPATING",
    "195": "NON_PARTICIPATING",
    "196": "NOT_ALIVE",
    "197": "NOT_ALIVE",
    "198": "NON_PARTICIPATING",
    "199": "NOT_ALIVE",
    "2": "NOT_ALIVE",
    "20": "NOT_ALIVE",
    "200": "NON_PARTICIPATING",
    "201": "NOT_ALIVE",
    "202": "NOT_ALIVE",
    "203": "NON_PARTICIPATING",
    "204": "NON_PARTICIPATING",
    "205": "NON_PARTICIPATING",
    "206": "NON_PARTICIPATING",
    "207": "NOT_ALIVE",
    "208": "NOT_ALIVE",
    "209": "NON_PARTICIPATING",
    "21": "NOT_ALIVE",
    "210": "NOT_ALIVE",
    "211": "NON_PARTICIPATING",
    "212": "NOT_ALIVE",
    "213": "NOT_ALIVE",
    "214": "NON_PARTICIPATING",
    "215": "NON_PARTICIPATING",
    "216": "NON_PARTICIPATING",
    "217": "NON_PARTICIPATING",
    "218": "NON_PARTICIPATING",
    "219": "NON_PARTICIPATING",
    "22": "NOT_ALIVE",
    "220": "NOT_ALIVE",
    "221": "NOT_ALIVE",
    "222": "NOT_ALIVE",
    "223": "NOT_ALIVE",
    "224": "NON_PARTICIPATING",
    "225": "NON_PARTICIPATING",
    "226": "NON_PARTICIPATING",
    "227": "NOT_ALIVE",
    "228": "NON_PARTICIPATING",
    "229": "NOT_ALIVE",
    "23": "NOT_ALIVE",
    "230": "NOT_ALIVE",
    "231": "NOT_ALIVE",
    "232": "NOT_ALIVE",
    "233": "NOT_ALIVE",
    "234": "NON_PARTICIPATING",
    "235": "NOT_ALIVE",
    "236": "NON_PARTICIPATING",
    "237": "NOT_ALIVE",
    "238": "NOT_ALIVE",
    "239": "NON_PARTICIPATING",
    "24": "NOT_ALIVE",
    "240": "NOT_ALIVE",
    "241": "NON_PARTICIPATING",
    "242": "NON_PARTICIPATING",
    "243": "NOT_ALIVE",
    "244": "NON_PARTICIPATING",
    "245": "NOT_ALIVE",
    "246": "NON_PARTICIPATING",
    "247": "NON_PARTICIPATING",
    "248": "NOT_ALIVE",
    "249": "NOT_ALIVE",
    "25": "SUCCESS",
    "250": "NOT_ALIVE",
    "251": "NOT_ALIVE",
    "252": "NOT_ALIVE",
    "253": "NOT_ALIVE",
    "254": "NOT_ALIVE",
    "255": "NOT_ALIVE",
    "26": "NON_PARTICIPATING",
    "27": "NON_PARTICIPATING",
    "28": "NON_PARTICIPATING",
    "29": "NOT_ALIVE",
    "3": "NOT_ALIVE",
    "30": "NOT_ALIVE",
    "31": "NOT_ALIVE",
    "32": "NOT_ALIVE",
    "33": "NON_PARTICIPATING",
    "34": "NON_PARTICIPATING",
    "35": "NON_PARTICIPATING",
    "36": "NON_PARTICIPATING",
    "37": "NON_PARTICIPATING",
    "38": "NOT_ALIVE",
    "39": "NOT_ALIVE",
    "4": "NOT_ALIVE",
    "40": "NON_PARTICIPATING",
    "41": "NON_PARTICIPATING",
    "42": "NOT_ALIVE",
    "43": "NON_PARTICIPATING",
    "44": "SUCCESS",
    "45": "NON_PARTICIPATING",
    "46": "NON_PARTICIPATING",
    "47": "NOT_ALIVE",
    "48": "NON_PARTICIPATING",
    "49": "NOT_ALIVE",
    "5": "NOT_ALIVE",
    "50": "NOT_ALIVE",
    "51": "NOT_ALIVE",
    "52": "NOT_ALIVE",
    "53": "NOT_ALIVE",
    "54": "NOT_ALIVE",
    "55": "NON_PARTICIPATING",
    "56": "NON_PARTICIPATING",
    "57": "NON_PARTICIPATING",
    "58": "NOT_ALIVE",
    "59": "NON_PARTICIPATING",
    "6": "NOT_ALIVE",
    "60": "NON_PARTICIPATING",
    "61": "NOT_ALIVE",
    "62": "NOT_ALIVE",
    "63": "NOT_ALIVE",
    "64": "NON_PARTICIPATING",
    "65": "NON_PARTICIPATING",
    "66": "NOT_ALIVE",
    "67": "NOT_ALIVE",
    "68": "NOT_ALIVE",
    "69": "NON_PARTICIPATING",
    "7": "NOT_ALIVE",
    "70": "NOT_ALIVE",
    "71": "NON_PARTICIPATING",
    "72": "NOT_ALIVE",
    "73": "NOT_ALIVE",
    "74": "NOT_ALIVE",
    "75": "NON_PARTICIPATING",
    "76": "NOT_ALIVE",
    "77": "NON_PARTICIPATING",
    "78": "SUCCESS",
    "79": "NOT_ALIVE",
    "8": "NOT_ALIVE",
    "80": "NOT_ALIVE",
    "81": "NON_PARTICIPATING",
    "82": "NON_PARTICIPATING",
    "83": "NON_PARTICIPATING",
    "84": "NON_PARTICIPATING",
    "85": "NOT_ALIVE",
    "86": "NON_PARTICIPATING",
    "87": "NOT_ALIVE",
    "88": "NOT_ALIVE",
    "89": "NOT_ALIVE",
    "9": "NOT_ALIVE",
    "90": "NOT_ALIVE",
    "91": "NOT_ALIVE",
    "92": "NON_PARTICIPATING",
    "93": "NOT_ALIVE",
    "94": "NON_PARTICIPATING",
    "95": "NON_PARTICIPATING",
    "96": "NOT_ALIVE",
    "97": "NOT_ALIVE",
    "98": "NON_PARTICIPATING",
    "99": "NON_PARTICIPATING"
  },
  "architectures": [
    "LlamaForCausalLM"
  ],
  "attention_bias": false,
  "attention_dropout": 0.0,
  "block_list": [
    6187956,
    6187972
  ],
  "bos_token_id": 1,
  "eos_token_id": 2,
  "hidden_act": "silu",
  "hidden_size": 2048,
  "initializer_range": 0.02,
  "inner_step": 62,
  "intermediate_size": 5632,
  "last_allreduce_block": 6187448,
  "max_position_embeddings": 2048,
  "mlp_bias": false,
  "model_type": "llama",
  "num_attention_heads": 32,
  "num_hidden_layers": 22,
  "num_key_value_heads": 4,
  "pretraining_tp": 1,
  "rms_norm_eps": 1e-05,
  "rope_scaling": null,
  "rope_theta": 10000.0,
  "tie_word_embeddings": false,
  "torch_dtype": "float32",
  "transformers_version": "4.39.3",
  "use_cache": false,
  "vocab_size": 32000
}