File size: 7,954 Bytes
a3e83de
d6862da
a3e83de
 
 
6ea9dea
a3e83de
6ea9dea
5b8a6a1
b00dc3a
7561c4b
a2d1b9f
5b8a6a1
a2d1b9f
163efaf
5b8a6a1
a2d1b9f
79cce97
61d3812
a2d1b9f
6ea9dea
b00dc3a
a3e83de
163efaf
b00dc3a
a2d1b9f
a3e83de
5b8a6a1
a2d1b9f
 
d6862da
16f8dad
2be892e
5b8a6a1
d6862da
a2d1b9f
a3e83de
a2d1b9f
 
d6862da
a3e83de
b00dc3a
d6862da
f70dff0
a2d1b9f
79cce97
7561c4b
a2d1b9f
79cce97
7561c4b
 
f70dff0
d6862da
a2d1b9f
163efaf
16f8dad
 
a2d1b9f
163efaf
a2d1b9f
b00dc3a
 
a3e83de
 
a2d1b9f
5b8a6a1
163efaf
d6862da
a2d1b9f
7561c4b
61d3812
a3e83de
a2d1b9f
43d4ad6
a3e83de
a2d1b9f
b00dc3a
a2d1b9f
 
f70dff0
79cce97
 
61d3812
a2d1b9f
d6862da
a2d1b9f
 
79cce97
163efaf
a3e83de
a2d1b9f
 
7561c4b
5b8a6a1
163efaf
b00dc3a
 
163efaf
7561c4b
b00dc3a
7561c4b
f70dff0
163efaf
a3e83de
a2d1b9f
16f8dad
a3e83de
f70dff0
a2d1b9f
7561c4b
6ea9dea
a3e83de
a2d1b9f
 
b00dc3a
a2d1b9f
a3e83de
a2d1b9f
d6862da
 
f70dff0
a2d1b9f
5b8a6a1
d6862da
a3e83de
a2d1b9f
2be892e
a2d1b9f
d6862da
 
a3e83de
a2d1b9f
a3e83de
a2d1b9f
7561c4b
5b8a6a1
163efaf
2be892e
a2d1b9f
f70dff0
b00dc3a
f70dff0
a2d1b9f
a3e83de
a2d1b9f
5b8a6a1
79cce97
d6862da
 
f70dff0
7561c4b
2be892e
5b8a6a1
a2d1b9f
 
d6862da
a2d1b9f
7561c4b
b00dc3a
a3e83de
79cce97
43d4ad6
7561c4b
a2d1b9f
f70dff0
43d4ad6
79cce97
163efaf
a3e83de
b00dc3a
a2d1b9f
a3e83de
5b8a6a1
61d3812
5b8a6a1
f70dff0
5b8a6a1
a3e83de
b00dc3a
f70dff0
 
a2d1b9f
d6862da
a2d1b9f
 
163efaf
a3e83de
a2d1b9f
 
43d4ad6
f70dff0
a2d1b9f
 
 
 
 
d6862da
f70dff0
a2d1b9f
b00dc3a
79cce97
a2d1b9f
d6862da
16f8dad
a2d1b9f
 
 
a3e83de
 
2be892e
79cce97
b00dc3a
61d3812
a2d1b9f
 
 
 
a3e83de
a2d1b9f
 
a3e83de
f70dff0
61d3812
a2d1b9f
 
 
 
7561c4b
 
5b8a6a1
163efaf
 
d6862da
a3e83de
 
163efaf
f70dff0
2be892e
a2d1b9f
5b8a6a1
a2d1b9f
 
 
a3e83de
a2d1b9f
f70dff0
a2d1b9f
 
f70dff0
a2d1b9f
79cce97
a2d1b9f
b00dc3a
5b8a6a1
a2d1b9f
5b8a6a1
43d4ad6
61d3812
a2d1b9f
a3e83de
 
 
 
 
 
 
408d7ee
 
a3e83de
 
 
 
 
 
408d7ee
a3e83de
a2d1b9f
a3e83de
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
{
  "_name_or_path": "distributed/llama-1b",
  "all_reduce_scores": {
    "0": "NOT_ALIVE",
    "1": "NON_PARTICIPATING",
    "10": "NON_PARTICIPATING",
    "100": "NOT_ALIVE",
    "101": "NON_PARTICIPATING",
    "102": "NOT_ALIVE",
    "103": "NON_PARTICIPATING",
    "104": "NOT_ALIVE",
    "105": "NON_PARTICIPATING",
    "106": "NOT_ALIVE",
    "107": "NON_PARTICIPATING",
    "108": "NON_PARTICIPATING",
    "109": "NON_PARTICIPATING",
    "11": "NOT_ALIVE",
    "110": "NON_PARTICIPATING",
    "111": "NON_PARTICIPATING",
    "112": "NON_PARTICIPATING",
    "113": "NON_PARTICIPATING",
    "114": "NON_PARTICIPATING",
    "115": "NOT_ALIVE",
    "116": "NON_PARTICIPATING",
    "117": "NON_PARTICIPATING",
    "118": "NOT_ALIVE",
    "119": "NOT_ALIVE",
    "12": "NON_PARTICIPATING",
    "120": "SUCCESS",
    "121": "SUCCESS",
    "122": "NON_PARTICIPATING",
    "123": "NON_PARTICIPATING",
    "124": "NON_PARTICIPATING",
    "125": "NOT_ALIVE",
    "126": "NON_PARTICIPATING",
    "127": "NON_PARTICIPATING",
    "128": "NOT_ALIVE",
    "129": "NOT_ALIVE",
    "13": "SUCCESS",
    "130": "NON_PARTICIPATING",
    "131": "NOT_ALIVE",
    "132": "NON_PARTICIPATING",
    "133": "NON_PARTICIPATING",
    "134": "NON_PARTICIPATING",
    "135": "NOT_ALIVE",
    "136": "NON_PARTICIPATING",
    "137": "NOT_ALIVE",
    "138": "NON_PARTICIPATING",
    "139": "NON_PARTICIPATING",
    "14": "NOT_ALIVE",
    "140": "NOT_ALIVE",
    "141": "NON_PARTICIPATING",
    "142": "NON_PARTICIPATING",
    "143": "NON_PARTICIPATING",
    "144": "NON_PARTICIPATING",
    "145": "NON_PARTICIPATING",
    "146": "NON_PARTICIPATING",
    "147": "NOT_ALIVE",
    "148": "NON_PARTICIPATING",
    "149": "NOT_ALIVE",
    "15": "NON_PARTICIPATING",
    "150": "NON_PARTICIPATING",
    "151": "NOT_ALIVE",
    "152": "NON_PARTICIPATING",
    "153": "NON_PARTICIPATING",
    "154": "NOT_ALIVE",
    "155": "NON_PARTICIPATING",
    "156": "NON_PARTICIPATING",
    "157": "NOT_ALIVE",
    "158": "NOT_ALIVE",
    "159": "NON_PARTICIPATING",
    "16": "NON_PARTICIPATING",
    "160": "SUCCESS",
    "161": "NON_PARTICIPATING",
    "162": "NON_PARTICIPATING",
    "163": "NOT_ALIVE",
    "164": "NON_PARTICIPATING",
    "165": "NON_PARTICIPATING",
    "166": "SUCCESS",
    "167": "NON_PARTICIPATING",
    "168": "NON_PARTICIPATING",
    "169": "NON_PARTICIPATING",
    "17": "NON_PARTICIPATING",
    "170": "NON_PARTICIPATING",
    "171": "NOT_ALIVE",
    "172": "SUCCESS",
    "173": "NON_PARTICIPATING",
    "174": "NOT_ALIVE",
    "175": "NON_PARTICIPATING",
    "176": "NOT_ALIVE",
    "177": "NOT_ALIVE",
    "178": "NOT_ALIVE",
    "179": "NON_PARTICIPATING",
    "18": "NON_PARTICIPATING",
    "180": "NON_PARTICIPATING",
    "181": "NON_PARTICIPATING",
    "182": "NOT_ALIVE",
    "183": "NON_PARTICIPATING",
    "184": "NOT_ALIVE",
    "185": "NON_PARTICIPATING",
    "186": "NOT_ALIVE",
    "187": "NON_PARTICIPATING",
    "188": "NOT_ALIVE",
    "189": "NOT_ALIVE",
    "19": "NOT_ALIVE",
    "190": "NON_PARTICIPATING",
    "191": "NOT_ALIVE",
    "192": "NON_PARTICIPATING",
    "193": "NOT_ALIVE",
    "194": "NOT_ALIVE",
    "195": "NOT_ALIVE",
    "196": "NOT_ALIVE",
    "197": "NOT_ALIVE",
    "198": "FAIL",
    "199": "NOT_ALIVE",
    "2": "SUCCESS",
    "20": "NOT_ALIVE",
    "200": "SUCCESS",
    "201": "NON_PARTICIPATING",
    "202": "NON_PARTICIPATING",
    "203": "NON_PARTICIPATING",
    "204": "NON_PARTICIPATING",
    "205": "NOT_ALIVE",
    "206": "NON_PARTICIPATING",
    "207": "NOT_ALIVE",
    "208": "SUCCESS",
    "209": "NON_PARTICIPATING",
    "21": "NON_PARTICIPATING",
    "210": "NON_PARTICIPATING",
    "211": "NOT_ALIVE",
    "212": "NOT_ALIVE",
    "213": "NON_PARTICIPATING",
    "214": "NON_PARTICIPATING",
    "215": "NON_PARTICIPATING",
    "216": "NOT_ALIVE",
    "217": "NON_PARTICIPATING",
    "218": "NON_PARTICIPATING",
    "219": "NON_PARTICIPATING",
    "22": "NOT_ALIVE",
    "220": "NON_PARTICIPATING",
    "221": "NOT_ALIVE",
    "222": "NON_PARTICIPATING",
    "223": "NON_PARTICIPATING",
    "224": "NOT_ALIVE",
    "225": "NON_PARTICIPATING",
    "226": "NOT_ALIVE",
    "227": "NOT_ALIVE",
    "228": "NON_PARTICIPATING",
    "229": "NOT_ALIVE",
    "23": "NON_PARTICIPATING",
    "230": "NOT_ALIVE",
    "231": "NON_PARTICIPATING",
    "232": "NOT_ALIVE",
    "233": "FAIL",
    "234": "SUCCESS",
    "235": "NOT_ALIVE",
    "236": "NON_PARTICIPATING",
    "237": "NON_PARTICIPATING",
    "238": "NOT_ALIVE",
    "239": "NON_PARTICIPATING",
    "24": "NON_PARTICIPATING",
    "240": "NON_PARTICIPATING",
    "241": "NON_PARTICIPATING",
    "242": "SUCCESS",
    "243": "NON_PARTICIPATING",
    "244": "NON_PARTICIPATING",
    "245": "NOT_ALIVE",
    "246": "NON_PARTICIPATING",
    "247": "NON_PARTICIPATING",
    "248": "NON_PARTICIPATING",
    "249": "SUCCESS",
    "25": "SUCCESS",
    "250": "NON_PARTICIPATING",
    "251": "NON_PARTICIPATING",
    "252": "NON_PARTICIPATING",
    "253": "NON_PARTICIPATING",
    "254": "NOT_ALIVE",
    "255": "NON_PARTICIPATING",
    "26": "NOT_ALIVE",
    "27": "NON_PARTICIPATING",
    "28": "NON_PARTICIPATING",
    "29": "SUCCESS",
    "3": "NON_PARTICIPATING",
    "30": "NON_PARTICIPATING",
    "31": "SUCCESS",
    "32": "NON_PARTICIPATING",
    "33": "NOT_ALIVE",
    "34": "NOT_ALIVE",
    "35": "NON_PARTICIPATING",
    "36": "NON_PARTICIPATING",
    "37": "NON_PARTICIPATING",
    "38": "NON_PARTICIPATING",
    "39": "NON_PARTICIPATING",
    "4": "SUCCESS",
    "40": "NON_PARTICIPATING",
    "41": "NON_PARTICIPATING",
    "42": "NON_PARTICIPATING",
    "43": "NON_PARTICIPATING",
    "44": "NOT_ALIVE",
    "45": "NOT_ALIVE",
    "46": "NOT_ALIVE",
    "47": "SUCCESS",
    "48": "NON_PARTICIPATING",
    "49": "NON_PARTICIPATING",
    "5": "NON_PARTICIPATING",
    "50": "SUCCESS",
    "51": "SUCCESS",
    "52": "NOT_ALIVE",
    "53": "NOT_ALIVE",
    "54": "NON_PARTICIPATING",
    "55": "NON_PARTICIPATING",
    "56": "NON_PARTICIPATING",
    "57": "NON_PARTICIPATING",
    "58": "NOT_ALIVE",
    "59": "NON_PARTICIPATING",
    "6": "NON_PARTICIPATING",
    "60": "NON_PARTICIPATING",
    "61": "NOT_ALIVE",
    "62": "SUCCESS",
    "63": "NON_PARTICIPATING",
    "64": "NON_PARTICIPATING",
    "65": "NON_PARTICIPATING",
    "66": "NON_PARTICIPATING",
    "67": "NOT_ALIVE",
    "68": "SUCCESS",
    "69": "NOT_ALIVE",
    "7": "NOT_ALIVE",
    "70": "NOT_ALIVE",
    "71": "NON_PARTICIPATING",
    "72": "NOT_ALIVE",
    "73": "NON_PARTICIPATING",
    "74": "NON_PARTICIPATING",
    "75": "NON_PARTICIPATING",
    "76": "NON_PARTICIPATING",
    "77": "NOT_ALIVE",
    "78": "NON_PARTICIPATING",
    "79": "NON_PARTICIPATING",
    "8": "NON_PARTICIPATING",
    "80": "NOT_ALIVE",
    "81": "NOT_ALIVE",
    "82": "FAIL",
    "83": "SUCCESS",
    "84": "NOT_ALIVE",
    "85": "NOT_ALIVE",
    "86": "NOT_ALIVE",
    "87": "NON_PARTICIPATING",
    "88": "NOT_ALIVE",
    "89": "NOT_ALIVE",
    "9": "NON_PARTICIPATING",
    "90": "NON_PARTICIPATING",
    "91": "NOT_ALIVE",
    "92": "NOT_ALIVE",
    "93": "NON_PARTICIPATING",
    "94": "NON_PARTICIPATING",
    "95": "SUCCESS",
    "96": "NON_PARTICIPATING",
    "97": "NON_PARTICIPATING",
    "98": "NON_PARTICIPATING",
    "99": "SUCCESS"
  },
  "architectures": [
    "LlamaForCausalLM"
  ],
  "attention_bias": false,
  "attention_dropout": 0.0,
  "block_list": [
    5925170,
    5925199
  ],
  "bos_token_id": 1,
  "eos_token_id": 2,
  "hidden_act": "silu",
  "hidden_size": 2048,
  "initializer_range": 0.02,
  "inner_step": 4,
  "intermediate_size": 5632,
  "last_allreduce_block": 5924869,
  "max_position_embeddings": 2048,
  "mlp_bias": false,
  "model_type": "llama",
  "num_attention_heads": 32,
  "num_hidden_layers": 22,
  "num_key_value_heads": 4,
  "pretraining_tp": 1,
  "rms_norm_eps": 1e-05,
  "rope_scaling": null,
  "rope_theta": 10000.0,
  "tie_word_embeddings": false,
  "torch_dtype": "float32",
  "transformers_version": "4.39.3",
  "use_cache": false,
  "vocab_size": 32000
}