File size: 7,416 Bytes
a6a8118
 
 
 
7bd5677
a6a8118
bf5b5cb
a6a8118
82d6dd1
8051477
a6a8118
7bd5677
a6a8118
 
9d535bc
a6a8118
 
 
02776e6
d84d27a
b0b0e73
7329f91
66e9475
a6a8118
 
bf5b5cb
 
a6a8118
7329f91
f013510
4a18dca
9d535bc
 
a6a8118
7bd5677
8051477
 
b0b0e73
a6a8118
d84d27a
a6a8118
 
d84d27a
7329f91
4a18dca
bf5b5cb
7329f91
9d535bc
66e9475
a6a8118
7329f91
4a18dca
 
d84d27a
a6a8118
82d6dd1
7bd5677
a6a8118
4a18dca
02776e6
 
9539a4f
9d535bc
a6a8118
 
d84d27a
9d535bc
a6a8118
 
82d6dd1
 
a6a8118
9d535bc
9539a4f
a1eb558
9d535bc
d84d27a
9d535bc
 
a6a8118
02776e6
66e9475
a6a8118
d84d27a
 
a6a8118
9d535bc
a1eb558
9539a4f
a6a8118
 
02776e6
9539a4f
a6a8118
5b94713
a6a8118
02776e6
9539a4f
a1eb558
9d535bc
 
7329f91
82d6dd1
d84d27a
a6a8118
 
9539a4f
f013510
9539a4f
d84d27a
9d535bc
a6a8118
 
d84d27a
af5f1c0
9d535bc
a6a8118
63a021e
8051477
7329f91
a1eb558
9d535bc
a1eb558
9539a4f
a6a8118
 
7329f91
a6a8118
 
458f1d4
9d535bc
a6a8118
d84d27a
9d535bc
 
 
7bd5677
d84d27a
a6a8118
9d535bc
af5f1c0
a6a8118
 
 
9d535bc
9539a4f
a6a8118
f013510
a6a8118
d84d27a
9d535bc
a6a8118
 
 
 
 
9539a4f
9d535bc
7329f91
d84d27a
a6a8118
 
9539a4f
9d535bc
a6a8118
9d535bc
a6a8118
4a18dca
 
a6a8118
 
 
d84d27a
 
7329f91
9d535bc
 
 
 
 
 
a6a8118
 
66e9475
fdffe98
7329f91
63a021e
82d6dd1
9d535bc
af5f1c0
458f1d4
a6a8118
 
 
d84d27a
a1eb558
9d535bc
9539a4f
9d535bc
02776e6
d84d27a
a6a8118
9d535bc
5b94713
a6a8118
 
 
7bd5677
4b7eece
a6a8118
4a18dca
d84d27a
bf5b5cb
a6a8118
9d535bc
a6a8118
9d535bc
4a18dca
a6a8118
7329f91
4b7eece
d84d27a
7329f91
d84d27a
a6a8118
4a18dca
a6a8118
7329f91
9d535bc
a6a8118
02776e6
a6a8118
fdffe98
a6a8118
7bd5677
f013510
a6a8118
 
 
a1eb558
02776e6
f9def3a
d84d27a
a6a8118
d84d27a
bf5b5cb
a6a8118
 
 
 
 
d84d27a
7329f91
9d535bc
 
b0b0e73
a6a8118
bf5b5cb
fdffe98
a6a8118
 
 
 
 
 
 
5087440
 
a6a8118
 
 
 
 
 
5087440
a6a8118
9d535bc
a6a8118
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
{
  "_name_or_path": "distributed/llama-1b",
  "all_reduce_scores": {
    "0": "NOT_ALIVE",
    "1": "NOT_ALIVE",
    "10": "NOT_ALIVE",
    "100": "NON_PARTICIPATING",
    "101": "NOT_ALIVE",
    "102": "NON_PARTICIPATING",
    "103": "NOT_ALIVE",
    "104": "NOT_ALIVE",
    "105": "NON_PARTICIPATING",
    "106": "NOT_ALIVE",
    "107": "NOT_ALIVE",
    "108": "NOT_ALIVE",
    "109": "NOT_ALIVE",
    "11": "NOT_ALIVE",
    "110": "NOT_ALIVE",
    "111": "NOT_ALIVE",
    "112": "NON_PARTICIPATING",
    "113": "NOT_ALIVE",
    "114": "NOT_ALIVE",
    "115": "NOT_ALIVE",
    "116": "NOT_ALIVE",
    "117": "NOT_ALIVE",
    "118": "NON_PARTICIPATING",
    "119": "NON_PARTICIPATING",
    "12": "NOT_ALIVE",
    "120": "NOT_ALIVE",
    "121": "NOT_ALIVE",
    "122": "NON_PARTICIPATING",
    "123": "NOT_ALIVE",
    "124": "NOT_ALIVE",
    "125": "NOT_ALIVE",
    "126": "NOT_ALIVE",
    "127": "NOT_ALIVE",
    "128": "NOT_ALIVE",
    "129": "NOT_ALIVE",
    "13": "NOT_ALIVE",
    "130": "NOT_ALIVE",
    "131": "NOT_ALIVE",
    "132": "NOT_ALIVE",
    "133": "SUCCESS",
    "134": "NOT_ALIVE",
    "135": "NOT_ALIVE",
    "136": "NON_PARTICIPATING",
    "137": "NON_PARTICIPATING",
    "138": "NOT_ALIVE",
    "139": "NOT_ALIVE",
    "14": "NOT_ALIVE",
    "140": "NON_PARTICIPATING",
    "141": "NON_PARTICIPATING",
    "142": "NON_PARTICIPATING",
    "143": "SUCCESS",
    "144": "NOT_ALIVE",
    "145": "NOT_ALIVE",
    "146": "NON_PARTICIPATING",
    "147": "NOT_ALIVE",
    "148": "NON_PARTICIPATING",
    "149": "NOT_ALIVE",
    "15": "NOT_ALIVE",
    "150": "SUCCESS",
    "151": "NOT_ALIVE",
    "152": "NOT_ALIVE",
    "153": "NOT_ALIVE",
    "154": "NON_PARTICIPATING",
    "155": "NOT_ALIVE",
    "156": "NOT_ALIVE",
    "157": "NOT_ALIVE",
    "158": "NON_PARTICIPATING",
    "159": "NON_PARTICIPATING",
    "16": "NOT_ALIVE",
    "160": "NOT_ALIVE",
    "161": "NON_PARTICIPATING",
    "162": "NOT_ALIVE",
    "163": "NON_PARTICIPATING",
    "164": "NON_PARTICIPATING",
    "165": "NON_PARTICIPATING",
    "166": "FAIL",
    "167": "NOT_ALIVE",
    "168": "NON_PARTICIPATING",
    "169": "NON_PARTICIPATING",
    "17": "NOT_ALIVE",
    "170": "NON_PARTICIPATING",
    "171": "NOT_ALIVE",
    "172": "NOT_ALIVE",
    "173": "NON_PARTICIPATING",
    "174": "NOT_ALIVE",
    "175": "NON_PARTICIPATING",
    "176": "NOT_ALIVE",
    "177": "NOT_ALIVE",
    "178": "NOT_ALIVE",
    "179": "NON_PARTICIPATING",
    "18": "NOT_ALIVE",
    "180": "NOT_ALIVE",
    "181": "NOT_ALIVE",
    "182": "NOT_ALIVE",
    "183": "NON_PARTICIPATING",
    "184": "NOT_ALIVE",
    "185": "NOT_ALIVE",
    "186": "NON_PARTICIPATING",
    "187": "NOT_ALIVE",
    "188": "NOT_ALIVE",
    "189": "NOT_ALIVE",
    "19": "NOT_ALIVE",
    "190": "NOT_ALIVE",
    "191": "NON_PARTICIPATING",
    "192": "NON_PARTICIPATING",
    "193": "NON_PARTICIPATING",
    "194": "NON_PARTICIPATING",
    "195": "NOT_ALIVE",
    "196": "NOT_ALIVE",
    "197": "NOT_ALIVE",
    "198": "NON_PARTICIPATING",
    "199": "NOT_ALIVE",
    "2": "SUCCESS",
    "20": "NOT_ALIVE",
    "200": "NOT_ALIVE",
    "201": "NOT_ALIVE",
    "202": "NOT_ALIVE",
    "203": "NOT_ALIVE",
    "204": "NON_PARTICIPATING",
    "205": "NOT_ALIVE",
    "206": "NON_PARTICIPATING",
    "207": "NOT_ALIVE",
    "208": "NOT_ALIVE",
    "209": "NOT_ALIVE",
    "21": "NOT_ALIVE",
    "210": "NOT_ALIVE",
    "211": "NON_PARTICIPATING",
    "212": "NOT_ALIVE",
    "213": "NOT_ALIVE",
    "214": "SUCCESS",
    "215": "NOT_ALIVE",
    "216": "NOT_ALIVE",
    "217": "NOT_ALIVE",
    "218": "NON_PARTICIPATING",
    "219": "NON_PARTICIPATING",
    "22": "NOT_ALIVE",
    "220": "NON_PARTICIPATING",
    "221": "NOT_ALIVE",
    "222": "NOT_ALIVE",
    "223": "NOT_ALIVE",
    "224": "NON_PARTICIPATING",
    "225": "NOT_ALIVE",
    "226": "NON_PARTICIPATING",
    "227": "NOT_ALIVE",
    "228": "NON_PARTICIPATING",
    "229": "NOT_ALIVE",
    "23": "NOT_ALIVE",
    "230": "NOT_ALIVE",
    "231": "NOT_ALIVE",
    "232": "NOT_ALIVE",
    "233": "NOT_ALIVE",
    "234": "NON_PARTICIPATING",
    "235": "NOT_ALIVE",
    "236": "NON_PARTICIPATING",
    "237": "NOT_ALIVE",
    "238": "NOT_ALIVE",
    "239": "NON_PARTICIPATING",
    "24": "NOT_ALIVE",
    "240": "NOT_ALIVE",
    "241": "SUCCESS",
    "242": "SUCCESS",
    "243": "NOT_ALIVE",
    "244": "NOT_ALIVE",
    "245": "NOT_ALIVE",
    "246": "NON_PARTICIPATING",
    "247": "NON_PARTICIPATING",
    "248": "NOT_ALIVE",
    "249": "NOT_ALIVE",
    "25": "SUCCESS",
    "250": "NON_PARTICIPATING",
    "251": "NOT_ALIVE",
    "252": "NOT_ALIVE",
    "253": "NON_PARTICIPATING",
    "254": "NON_PARTICIPATING",
    "255": "NOT_ALIVE",
    "26": "NON_PARTICIPATING",
    "27": "NON_PARTICIPATING",
    "28": "NOT_ALIVE",
    "29": "NOT_ALIVE",
    "3": "NOT_ALIVE",
    "30": "NOT_ALIVE",
    "31": "NOT_ALIVE",
    "32": "NOT_ALIVE",
    "33": "NOT_ALIVE",
    "34": "NOT_ALIVE",
    "35": "NOT_ALIVE",
    "36": "NOT_ALIVE",
    "37": "NON_PARTICIPATING",
    "38": "NOT_ALIVE",
    "39": "NOT_ALIVE",
    "4": "NOT_ALIVE",
    "40": "SUCCESS",
    "41": "NOT_ALIVE",
    "42": "NON_PARTICIPATING",
    "43": "NON_PARTICIPATING",
    "44": "NOT_ALIVE",
    "45": "NOT_ALIVE",
    "46": "NOT_ALIVE",
    "47": "NOT_ALIVE",
    "48": "NON_PARTICIPATING",
    "49": "NOT_ALIVE",
    "5": "NOT_ALIVE",
    "50": "NOT_ALIVE",
    "51": "NOT_ALIVE",
    "52": "NOT_ALIVE",
    "53": "NOT_ALIVE",
    "54": "NOT_ALIVE",
    "55": "NON_PARTICIPATING",
    "56": "NOT_ALIVE",
    "57": "NON_PARTICIPATING",
    "58": "NOT_ALIVE",
    "59": "NON_PARTICIPATING",
    "6": "NOT_ALIVE",
    "60": "NOT_ALIVE",
    "61": "NON_PARTICIPATING",
    "62": "NOT_ALIVE",
    "63": "NOT_ALIVE",
    "64": "NON_PARTICIPATING",
    "65": "NON_PARTICIPATING",
    "66": "NOT_ALIVE",
    "67": "NON_PARTICIPATING",
    "68": "NOT_ALIVE",
    "69": "NON_PARTICIPATING",
    "7": "NOT_ALIVE",
    "70": "NOT_ALIVE",
    "71": "NOT_ALIVE",
    "72": "NOT_ALIVE",
    "73": "NOT_ALIVE",
    "74": "NOT_ALIVE",
    "75": "SUCCESS",
    "76": "NOT_ALIVE",
    "77": "SUCCESS",
    "78": "NON_PARTICIPATING",
    "79": "NOT_ALIVE",
    "8": "NOT_ALIVE",
    "80": "NOT_ALIVE",
    "81": "NOT_ALIVE",
    "82": "NOT_ALIVE",
    "83": "NOT_ALIVE",
    "84": "NON_PARTICIPATING",
    "85": "NOT_ALIVE",
    "86": "NON_PARTICIPATING",
    "87": "NOT_ALIVE",
    "88": "NOT_ALIVE",
    "89": "NOT_ALIVE",
    "9": "NOT_ALIVE",
    "90": "NOT_ALIVE",
    "91": "NOT_ALIVE",
    "92": "NON_PARTICIPATING",
    "93": "NOT_ALIVE",
    "94": "NOT_ALIVE",
    "95": "NOT_ALIVE",
    "96": "NON_PARTICIPATING",
    "97": "NOT_ALIVE",
    "98": "NON_PARTICIPATING",
    "99": "NON_PARTICIPATING"
  },
  "architectures": [
    "LlamaForCausalLM"
  ],
  "attention_bias": false,
  "attention_dropout": 0.0,
  "block_list": [
    6211347,
    6211364
  ],
  "bos_token_id": 1,
  "eos_token_id": 2,
  "hidden_act": "silu",
  "hidden_size": 2048,
  "initializer_range": 0.02,
  "inner_step": 248,
  "intermediate_size": 5632,
  "last_allreduce_block": 6209387,
  "max_position_embeddings": 2048,
  "mlp_bias": false,
  "model_type": "llama",
  "num_attention_heads": 32,
  "num_hidden_layers": 22,
  "num_key_value_heads": 4,
  "pretraining_tp": 1,
  "rms_norm_eps": 1e-05,
  "rope_scaling": null,
  "rope_theta": 10000.0,
  "tie_word_embeddings": false,
  "torch_dtype": "float32",
  "transformers_version": "4.39.3",
  "use_cache": false,
  "vocab_size": 32000
}