File size: 7,779 Bytes
c10913b
c19416a
c10913b
 
508359a
79a8068
c10913b
aa63d04
7c1f985
8326b15
508359a
3f57e04
a2623c5
17a6cff
00fc568
ed147bd
508359a
3d04152
c5321ab
415e586
7c1f985
8c83a4e
c5321ab
508359a
3d04152
8c83a4e
3d04152
8326b15
3d04152
c19416a
508359a
aa63d04
c5b8406
79a8068
ed147bd
8c83a4e
7c1f985
c5b8406
a2f59e0
b5389ae
c10913b
508359a
 
28c6dbb
b5389ae
508359a
 
 
 
 
c19416a
0ad9b8d
00fc568
c5b8406
508359a
ece081c
732bb9b
3d04152
415e586
 
79a8068
508359a
c10913b
3f57e04
508359a
 
3d04152
a2f59e0
3d04152
 
508359a
8326b15
 
 
508359a
8c83a4e
508359a
3d04152
508359a
8c83a4e
3d04152
732bb9b
8c83a4e
3d04152
34a4f02
8326b15
508359a
8c83a4e
17a6cff
c10913b
00fc568
65c296d
79a8068
8c83a4e
deacb6b
c19416a
069c347
508359a
3d04152
c5321ab
508359a
aa63d04
8326b15
c10913b
a930bf4
a2f59e0
c10913b
8326b15
 
 
ece081c
3d04152
508359a
3d04152
 
8326b15
508359a
28c6dbb
c19416a
aa63d04
 
508359a
415e586
c5b8406
c10913b
508359a
65c296d
c19416a
508359a
ece081c
3f57e04
508359a
8e2b160
508359a
3d04152
508359a
00fc568
508359a
8e2b160
34a4f02
a930bf4
00fc568
508359a
c10913b
415e586
a930bf4
3f57e04
 
a2f59e0
415e586
 
65c296d
ed147bd
508359a
c5321ab
8326b15
00fc568
3d04152
508359a
8c83a4e
3d04152
7c1f985
a2623c5
508359a
65c296d
3d04152
508359a
3d04152
415e586
65c296d
3f57e04
c10913b
508359a
3f57e04
508359a
8c83a4e
ec8f399
508359a
3d04152
508359a
79a8068
b5389ae
ec8f399
3d04152
508359a
 
c10913b
0ad9b8d
508359a
a2623c5
069c347
508359a
 
b5389ae
508359a
 
c5321ab
b5389ae
8326b15
ed147bd
c19416a
79a8068
508359a
415e586
508359a
 
ece081c
508359a
3d04152
508359a
8e2b160
508359a
8326b15
3d04152
 
b5389ae
508359a
aa63d04
508359a
 
c5321ab
8326b15
79a8068
17a6cff
508359a
c5321ab
508359a
3d04152
415e586
8326b15
508359a
3d04152
8326b15
ec8f399
a2623c5
79a8068
a2623c5
79a8068
508359a
 
 
8c83a4e
a2623c5
79a8068
8c83a4e
c19416a
8326b15
a930bf4
c19416a
b5389ae
00fc568
8326b15
a2623c5
508359a
17a6cff
508359a
8326b15
b5389ae
069c347
c10913b
 
 
 
 
 
 
508359a
 
c10913b
 
 
 
 
 
508359a
c10913b
508359a
c10913b
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
{
  "_name_or_path": "distributed/llama-1b",
  "all_reduce_scores": {
    "0": "NOT_ALIVE",
    "1": "NOT_ALIVE",
    "10": "NOT_ALIVE",
    "100": "NOT_ALIVE",
    "101": "NON_PARTICIPATING",
    "102": "NON_PARTICIPATING",
    "103": "NON_PARTICIPATING",
    "104": "NON_PARTICIPATING",
    "105": "NON_PARTICIPATING",
    "106": "NON_PARTICIPATING",
    "107": "NOT_ALIVE",
    "108": "NOT_ALIVE",
    "109": "NOT_ALIVE",
    "11": "NOT_ALIVE",
    "110": "SUCCESS",
    "111": "NON_PARTICIPATING",
    "112": "SUCCESS",
    "113": "NOT_ALIVE",
    "114": "NON_PARTICIPATING",
    "115": "NOT_ALIVE",
    "116": "NON_PARTICIPATING",
    "117": "NON_PARTICIPATING",
    "118": "NOT_ALIVE",
    "119": "NON_PARTICIPATING",
    "12": "NOT_ALIVE",
    "120": "NON_PARTICIPATING",
    "121": "NOT_ALIVE",
    "122": "NON_PARTICIPATING",
    "123": "NOT_ALIVE",
    "124": "NON_PARTICIPATING",
    "125": "NON_PARTICIPATING",
    "126": "NOT_ALIVE",
    "127": "NOT_ALIVE",
    "128": "NOT_ALIVE",
    "129": "NON_PARTICIPATING",
    "13": "NOT_ALIVE",
    "130": "NON_PARTICIPATING",
    "131": "NOT_ALIVE",
    "132": "NON_PARTICIPATING",
    "133": "FAIL",
    "134": "NON_PARTICIPATING",
    "135": "NON_PARTICIPATING",
    "136": "NON_PARTICIPATING",
    "137": "NON_PARTICIPATING",
    "138": "SUCCESS",
    "139": "NON_PARTICIPATING",
    "14": "NOT_ALIVE",
    "140": "NOT_ALIVE",
    "141": "NOT_ALIVE",
    "142": "NON_PARTICIPATING",
    "143": "NON_PARTICIPATING",
    "144": "NOT_ALIVE",
    "145": "NON_PARTICIPATING",
    "146": "NON_PARTICIPATING",
    "147": "NON_PARTICIPATING",
    "148": "NON_PARTICIPATING",
    "149": "NON_PARTICIPATING",
    "15": "NOT_ALIVE",
    "150": "NON_PARTICIPATING",
    "151": "NOT_ALIVE",
    "152": "NOT_ALIVE",
    "153": "SUCCESS",
    "154": "SUCCESS",
    "155": "NOT_ALIVE",
    "156": "NOT_ALIVE",
    "157": "NOT_ALIVE",
    "158": "NON_PARTICIPATING",
    "159": "NON_PARTICIPATING",
    "16": "NON_PARTICIPATING",
    "160": "NON_PARTICIPATING",
    "161": "NON_PARTICIPATING",
    "162": "NOT_ALIVE",
    "163": "NOT_ALIVE",
    "164": "NON_PARTICIPATING",
    "165": "NON_PARTICIPATING",
    "166": "NOT_ALIVE",
    "167": "NOT_ALIVE",
    "168": "SUCCESS",
    "169": "NOT_ALIVE",
    "17": "NOT_ALIVE",
    "170": "NON_PARTICIPATING",
    "171": "NOT_ALIVE",
    "172": "NON_PARTICIPATING",
    "173": "SUCCESS",
    "174": "NOT_ALIVE",
    "175": "NOT_ALIVE",
    "176": "NOT_ALIVE",
    "177": "NOT_ALIVE",
    "178": "NON_PARTICIPATING",
    "179": "NOT_ALIVE",
    "18": "NOT_ALIVE",
    "180": "NOT_ALIVE",
    "181": "NOT_ALIVE",
    "182": "NOT_ALIVE",
    "183": "NON_PARTICIPATING",
    "184": "NON_PARTICIPATING",
    "185": "NON_PARTICIPATING",
    "186": "NON_PARTICIPATING",
    "187": "NON_PARTICIPATING",
    "188": "NON_PARTICIPATING",
    "189": "NOT_ALIVE",
    "19": "NOT_ALIVE",
    "190": "NON_PARTICIPATING",
    "191": "NOT_ALIVE",
    "192": "NON_PARTICIPATING",
    "193": "NON_PARTICIPATING",
    "194": "NON_PARTICIPATING",
    "195": "NON_PARTICIPATING",
    "196": "NON_PARTICIPATING",
    "197": "FAIL",
    "198": "NON_PARTICIPATING",
    "199": "NON_PARTICIPATING",
    "2": "NON_PARTICIPATING",
    "20": "NON_PARTICIPATING",
    "200": "NOT_ALIVE",
    "201": "NOT_ALIVE",
    "202": "NOT_ALIVE",
    "203": "NOT_ALIVE",
    "204": "NOT_ALIVE",
    "205": "NON_PARTICIPATING",
    "206": "NON_PARTICIPATING",
    "207": "NOT_ALIVE",
    "208": "NON_PARTICIPATING",
    "209": "NOT_ALIVE",
    "21": "NOT_ALIVE",
    "210": "NOT_ALIVE",
    "211": "NON_PARTICIPATING",
    "212": "NON_PARTICIPATING",
    "213": "NOT_ALIVE",
    "214": "NON_PARTICIPATING",
    "215": "SUCCESS",
    "216": "NON_PARTICIPATING",
    "217": "NON_PARTICIPATING",
    "218": "NON_PARTICIPATING",
    "219": "NOT_ALIVE",
    "22": "NON_PARTICIPATING",
    "220": "NON_PARTICIPATING",
    "221": "NOT_ALIVE",
    "222": "NOT_ALIVE",
    "223": "NON_PARTICIPATING",
    "224": "NOT_ALIVE",
    "225": "NOT_ALIVE",
    "226": "NOT_ALIVE",
    "227": "NON_PARTICIPATING",
    "228": "NON_PARTICIPATING",
    "229": "NON_PARTICIPATING",
    "23": "NON_PARTICIPATING",
    "230": "NOT_ALIVE",
    "231": "NOT_ALIVE",
    "232": "NOT_ALIVE",
    "233": "NOT_ALIVE",
    "234": "NON_PARTICIPATING",
    "235": "NON_PARTICIPATING",
    "236": "NOT_ALIVE",
    "237": "SUCCESS",
    "238": "SUCCESS",
    "239": "NOT_ALIVE",
    "24": "NOT_ALIVE",
    "240": "NOT_ALIVE",
    "241": "NOT_ALIVE",
    "242": "NOT_ALIVE",
    "243": "NOT_ALIVE",
    "244": "NOT_ALIVE",
    "245": "NOT_ALIVE",
    "246": "NON_PARTICIPATING",
    "247": "NON_PARTICIPATING",
    "248": "NOT_ALIVE",
    "249": "NOT_ALIVE",
    "25": "SUCCESS",
    "250": "NON_PARTICIPATING",
    "251": "NOT_ALIVE",
    "252": "NOT_ALIVE",
    "253": "NOT_ALIVE",
    "254": "NON_PARTICIPATING",
    "255": "FAIL",
    "26": "NON_PARTICIPATING",
    "27": "NOT_ALIVE",
    "28": "NOT_ALIVE",
    "29": "NON_PARTICIPATING",
    "3": "NON_PARTICIPATING",
    "30": "SUCCESS",
    "31": "NON_PARTICIPATING",
    "32": "NOT_ALIVE",
    "33": "NOT_ALIVE",
    "34": "NOT_ALIVE",
    "35": "NOT_ALIVE",
    "36": "NOT_ALIVE",
    "37": "NOT_ALIVE",
    "38": "SUCCESS",
    "39": "NOT_ALIVE",
    "4": "NON_PARTICIPATING",
    "40": "NOT_ALIVE",
    "41": "NON_PARTICIPATING",
    "42": "NON_PARTICIPATING",
    "43": "NON_PARTICIPATING",
    "44": "NON_PARTICIPATING",
    "45": "NOT_ALIVE",
    "46": "NOT_ALIVE",
    "47": "NON_PARTICIPATING",
    "48": "NON_PARTICIPATING",
    "49": "NON_PARTICIPATING",
    "5": "NON_PARTICIPATING",
    "50": "NON_PARTICIPATING",
    "51": "NON_PARTICIPATING",
    "52": "NOT_ALIVE",
    "53": "NON_PARTICIPATING",
    "54": "NOT_ALIVE",
    "55": "NOT_ALIVE",
    "56": "FAIL",
    "57": "NON_PARTICIPATING",
    "58": "NON_PARTICIPATING",
    "59": "NON_PARTICIPATING",
    "6": "NON_PARTICIPATING",
    "60": "SUCCESS",
    "61": "NON_PARTICIPATING",
    "62": "NOT_ALIVE",
    "63": "SUCCESS",
    "64": "NOT_ALIVE",
    "65": "NON_PARTICIPATING",
    "66": "NOT_ALIVE",
    "67": "NOT_ALIVE",
    "68": "NON_PARTICIPATING",
    "69": "NOT_ALIVE",
    "7": "NON_PARTICIPATING",
    "70": "NON_PARTICIPATING",
    "71": "NON_PARTICIPATING",
    "72": "NON_PARTICIPATING",
    "73": "SUCCESS",
    "74": "NON_PARTICIPATING",
    "75": "NON_PARTICIPATING",
    "76": "NON_PARTICIPATING",
    "77": "NON_PARTICIPATING",
    "78": "NOT_ALIVE",
    "79": "NOT_ALIVE",
    "8": "NOT_ALIVE",
    "80": "NON_PARTICIPATING",
    "81": "NON_PARTICIPATING",
    "82": "NOT_ALIVE",
    "83": "NON_PARTICIPATING",
    "84": "NON_PARTICIPATING",
    "85": "NON_PARTICIPATING",
    "86": "NOT_ALIVE",
    "87": "NON_PARTICIPATING",
    "88": "NON_PARTICIPATING",
    "89": "NOT_ALIVE",
    "9": "NOT_ALIVE",
    "90": "NON_PARTICIPATING",
    "91": "NOT_ALIVE",
    "92": "NOT_ALIVE",
    "93": "NON_PARTICIPATING",
    "94": "NOT_ALIVE",
    "95": "NOT_ALIVE",
    "96": "SUCCESS",
    "97": "NON_PARTICIPATING",
    "98": "NON_PARTICIPATING",
    "99": "NOT_ALIVE"
  },
  "architectures": [
    "LlamaForCausalLM"
  ],
  "attention_bias": false,
  "attention_dropout": 0.0,
  "block_list": [
    5968830,
    5968837
  ],
  "bos_token_id": 1,
  "eos_token_id": 2,
  "hidden_act": "silu",
  "hidden_size": 2048,
  "initializer_range": 0.02,
  "inner_step": 1,
  "intermediate_size": 5632,
  "last_allreduce_block": 5968672,
  "max_position_embeddings": 2048,
  "mlp_bias": false,
  "model_type": "llama",
  "num_attention_heads": 32,
  "num_hidden_layers": 22,
  "num_key_value_heads": 4,
  "pretraining_tp": 1,
  "rms_norm_eps": 1e-05,
  "rope_scaling": null,
  "rope_theta": 10000.0,
  "tie_word_embeddings": false,
  "torch_dtype": "float32",
  "transformers_version": "4.39.3",
  "use_cache": false,
  "vocab_size": 32000
}