File size: 8,113 Bytes
6eef298
429d5ff
6eef298
7e5ea14
c35d264
8d3dbf4
7e5ea14
a539b9d
cb33af1
c35d264
42d891d
 
a539b9d
9ef837a
a539b9d
8d3dbf4
cb33af1
8d3dbf4
a539b9d
 
cb33af1
bb4efa0
42d891d
c684f2d
a539b9d
76cbf3d
c35d264
76cbf3d
bb4efa0
c35d264
9ef837a
f4af88c
c35d264
a539b9d
8d3dbf4
c684f2d
cb33af1
42d891d
c684f2d
42d891d
7e5ea14
c35d264
a539b9d
76cbf3d
c684f2d
c35d264
a539b9d
 
5df8360
a539b9d
c35d264
bb4efa0
a539b9d
0ab939b
33157ad
821c87f
 
a539b9d
42d891d
 
c35d264
42d891d
7e5ea14
42d891d
 
cb33af1
33157ad
a539b9d
f4af88c
e1b3014
bb4efa0
33157ad
a539b9d
 
42d891d
33157ad
a539b9d
 
33157ad
c684f2d
a539b9d
821c87f
cb33af1
42d891d
580089d
a539b9d
 
bb4efa0
9ef837a
7e5ea14
a539b9d
bb4efa0
cb33af1
bb4efa0
e1b3014
c35d264
abff122
a539b9d
 
bb4efa0
42d891d
c35d264
a539b9d
7e5ea14
7afd507
9b29cab
000194a
a539b9d
 
e1b3014
 
42d891d
a539b9d
42d891d
a539b9d
8d3dbf4
bb4efa0
76cbf3d
c35d264
0ab939b
42d891d
92812c4
42d891d
580089d
7e5ea14
bb4efa0
 
c35d264
bb4efa0
 
42d891d
8d3dbf4
bb4efa0
a539b9d
e1b3014
8d3dbf4
a539b9d
42d891d
c684f2d
84ea336
abff122
a539b9d
92812c4
7e5ea14
a539b9d
e2f6c24
42d891d
 
a539b9d
c684f2d
a539b9d
bb4efa0
8d3dbf4
a539b9d
 
 
 
bb4efa0
a539b9d
 
 
cb33af1
 
42d891d
bb4efa0
c35d264
9ef837a
cb33af1
42d891d
bb4efa0
42d891d
6eef298
bb4efa0
42d891d
a539b9d
bb4efa0
f4af88c
c35d264
42d891d
84ea336
a539b9d
9ef837a
f4af88c
a539b9d
7afd507
a539b9d
7e5ea14
a539b9d
 
 
21cc838
a539b9d
 
bb4efa0
 
42d891d
 
a539b9d
bb4efa0
8d3dbf4
c35d264
bb4efa0
33157ad
c35d264
a539b9d
8d3dbf4
42d891d
 
a539b9d
42d891d
 
a539b9d
c35d264
8d3dbf4
42d891d
 
a539b9d
c35d264
a539b9d
 
42d891d
a539b9d
 
9ef837a
a539b9d
bb4efa0
a539b9d
42d891d
76cbf3d
42d891d
821c87f
c35d264
c684f2d
f4af88c
a539b9d
bb4efa0
84ea336
f4af88c
a539b9d
42d891d
bb4efa0
a539b9d
cb33af1
42d891d
8d3dbf4
c35d264
f4af88c
92812c4
c35d264
 
a539b9d
 
42d891d
a539b9d
9ef837a
a539b9d
bb4efa0
a539b9d
21cc838
6eef298
 
 
 
 
 
 
5aeb8a6
 
 
6eef298
 
 
 
 
 
5aeb8a6
6eef298
a539b9d
6eef298
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
{
  "_name_or_path": "penguin102/c67-h18",
  "all_reduce_scores": {
    "0": "NOT_ALIVE",
    "1": "NON_PARTICIPATING",
    "10": "NON_PARTICIPATING",
    "100": "NOT_ALIVE",
    "101": "NON_PARTICIPATING",
    "102": "NON_PARTICIPATING",
    "103": "NON_PARTICIPATING",
    "104": "NON_PARTICIPATING",
    "105": "NON_PARTICIPATING",
    "106": "NOT_ALIVE",
    "107": "NOT_ALIVE",
    "108": "NOT_ALIVE",
    "109": "NOT_ALIVE",
    "11": "SUCCESS",
    "110": "NOT_ALIVE",
    "111": "NON_PARTICIPATING",
    "112": "SUCCESS",
    "113": "NOT_ALIVE",
    "114": "NON_PARTICIPATING",
    "115": "NON_PARTICIPATING",
    "116": "NON_PARTICIPATING",
    "117": "SUCCESS",
    "118": "NON_PARTICIPATING",
    "119": "NON_PARTICIPATING",
    "12": "NON_PARTICIPATING",
    "120": "NON_PARTICIPATING",
    "121": "NOT_ALIVE",
    "122": "NON_PARTICIPATING",
    "123": "NON_PARTICIPATING",
    "124": "NON_PARTICIPATING",
    "125": "NOT_ALIVE",
    "126": "NOT_ALIVE",
    "127": "NON_PARTICIPATING",
    "128": "NOT_ALIVE",
    "129": "NON_PARTICIPATING",
    "13": "NON_PARTICIPATING",
    "130": "NON_PARTICIPATING",
    "131": "NOT_ALIVE",
    "132": "NON_PARTICIPATING",
    "133": "SUCCESS",
    "134": "NON_PARTICIPATING",
    "135": "NON_PARTICIPATING",
    "136": "NON_PARTICIPATING",
    "137": "SUCCESS",
    "138": "NON_PARTICIPATING",
    "139": "NON_PARTICIPATING",
    "14": "NON_PARTICIPATING",
    "140": "NOT_ALIVE",
    "141": "NON_PARTICIPATING",
    "142": "NON_PARTICIPATING",
    "143": "NON_PARTICIPATING",
    "144": "NON_PARTICIPATING",
    "145": "NON_PARTICIPATING",
    "146": "NON_PARTICIPATING",
    "147": "NON_PARTICIPATING",
    "148": "NON_PARTICIPATING",
    "149": "NON_PARTICIPATING",
    "15": "NON_PARTICIPATING",
    "150": "NON_PARTICIPATING",
    "151": "NOT_ALIVE",
    "152": "NOT_ALIVE",
    "153": "SUCCESS",
    "154": "NON_PARTICIPATING",
    "155": "NON_PARTICIPATING",
    "156": "NOT_ALIVE",
    "157": "NON_PARTICIPATING",
    "158": "NON_PARTICIPATING",
    "159": "NON_PARTICIPATING",
    "16": "NON_PARTICIPATING",
    "160": "NON_PARTICIPATING",
    "161": "NOT_ALIVE",
    "162": "NON_PARTICIPATING",
    "163": "NON_PARTICIPATING",
    "164": "SUCCESS",
    "165": "NON_PARTICIPATING",
    "166": "NON_PARTICIPATING",
    "167": "NON_PARTICIPATING",
    "168": "NON_PARTICIPATING",
    "169": "NOT_ALIVE",
    "17": "NON_PARTICIPATING",
    "170": "NON_PARTICIPATING",
    "171": "NOT_ALIVE",
    "172": "SUCCESS",
    "173": "SUCCESS",
    "174": "NON_PARTICIPATING",
    "175": "NOT_ALIVE",
    "176": "NOT_ALIVE",
    "177": "NOT_ALIVE",
    "178": "NON_PARTICIPATING",
    "179": "NON_PARTICIPATING",
    "18": "NON_PARTICIPATING",
    "180": "NOT_ALIVE",
    "181": "NOT_ALIVE",
    "182": "NOT_ALIVE",
    "183": "NON_PARTICIPATING",
    "184": "NON_PARTICIPATING",
    "185": "NON_PARTICIPATING",
    "186": "NOT_ALIVE",
    "187": "NON_PARTICIPATING",
    "188": "NOT_ALIVE",
    "189": "NOT_ALIVE",
    "19": "NOT_ALIVE",
    "190": "NON_PARTICIPATING",
    "191": "NOT_ALIVE",
    "192": "NOT_ALIVE",
    "193": "NOT_ALIVE",
    "194": "NON_PARTICIPATING",
    "195": "NON_PARTICIPATING",
    "196": "NON_PARTICIPATING",
    "197": "NON_PARTICIPATING",
    "198": "NON_PARTICIPATING",
    "199": "NON_PARTICIPATING",
    "2": "NON_PARTICIPATING",
    "20": "NON_PARTICIPATING",
    "200": "NOT_ALIVE",
    "201": "NOT_ALIVE",
    "202": "NON_PARTICIPATING",
    "203": "NON_PARTICIPATING",
    "204": "NON_PARTICIPATING",
    "205": "NOT_ALIVE",
    "206": "NON_PARTICIPATING",
    "207": "NOT_ALIVE",
    "208": "NON_PARTICIPATING",
    "209": "NOT_ALIVE",
    "21": "NOT_ALIVE",
    "210": "NOT_ALIVE",
    "211": "NON_PARTICIPATING",
    "212": "NON_PARTICIPATING",
    "213": "NON_PARTICIPATING",
    "214": "NON_PARTICIPATING",
    "215": "NON_PARTICIPATING",
    "216": "NON_PARTICIPATING",
    "217": "NON_PARTICIPATING",
    "218": "NON_PARTICIPATING",
    "219": "NON_PARTICIPATING",
    "22": "NON_PARTICIPATING",
    "220": "NON_PARTICIPATING",
    "221": "NOT_ALIVE",
    "222": "NOT_ALIVE",
    "223": "NON_PARTICIPATING",
    "224": "NOT_ALIVE",
    "225": "NOT_ALIVE",
    "226": "NOT_ALIVE",
    "227": "NON_PARTICIPATING",
    "228": "NON_PARTICIPATING",
    "229": "NOT_ALIVE",
    "23": "NON_PARTICIPATING",
    "230": "NOT_ALIVE",
    "231": "NOT_ALIVE",
    "232": "NOT_ALIVE",
    "233": "NON_PARTICIPATING",
    "234": "NON_PARTICIPATING",
    "235": "NON_PARTICIPATING",
    "236": "NOT_ALIVE",
    "237": "NON_PARTICIPATING",
    "238": "NON_PARTICIPATING",
    "239": "NON_PARTICIPATING",
    "24": "NON_PARTICIPATING",
    "240": "NOT_ALIVE",
    "241": "NON_PARTICIPATING",
    "242": "NOT_ALIVE",
    "243": "NOT_ALIVE",
    "244": "NON_PARTICIPATING",
    "245": "NON_PARTICIPATING",
    "246": "NON_PARTICIPATING",
    "247": "NON_PARTICIPATING",
    "248": "NOT_ALIVE",
    "249": "NOT_ALIVE",
    "25": "SUCCESS",
    "250": "NON_PARTICIPATING",
    "251": "NOT_ALIVE",
    "252": "NON_PARTICIPATING",
    "253": "NON_PARTICIPATING",
    "254": "NON_PARTICIPATING",
    "255": "NOT_ALIVE",
    "26": "NON_PARTICIPATING",
    "27": "NON_PARTICIPATING",
    "28": "NON_PARTICIPATING",
    "29": "NON_PARTICIPATING",
    "3": "NON_PARTICIPATING",
    "30": "SUCCESS",
    "31": "NON_PARTICIPATING",
    "32": "SUCCESS",
    "33": "NOT_ALIVE",
    "34": "NON_PARTICIPATING",
    "35": "NOT_ALIVE",
    "36": "SUCCESS",
    "37": "NOT_ALIVE",
    "38": "NON_PARTICIPATING",
    "39": "NON_PARTICIPATING",
    "4": "NON_PARTICIPATING",
    "40": "NON_PARTICIPATING",
    "41": "SUCCESS",
    "42": "NON_PARTICIPATING",
    "43": "NOT_ALIVE",
    "44": "NON_PARTICIPATING",
    "45": "NOT_ALIVE",
    "46": "NOT_ALIVE",
    "47": "NON_PARTICIPATING",
    "48": "NON_PARTICIPATING",
    "49": "NON_PARTICIPATING",
    "5": "SUCCESS",
    "50": "NON_PARTICIPATING",
    "51": "NON_PARTICIPATING",
    "52": "NON_PARTICIPATING",
    "53": "NOT_ALIVE",
    "54": "NON_PARTICIPATING",
    "55": "NOT_ALIVE",
    "56": "SUCCESS",
    "57": "NON_PARTICIPATING",
    "58": "NON_PARTICIPATING",
    "59": "NON_PARTICIPATING",
    "6": "NON_PARTICIPATING",
    "60": "NOT_ALIVE",
    "61": "NON_PARTICIPATING",
    "62": "NON_PARTICIPATING",
    "63": "NOT_ALIVE",
    "64": "NON_PARTICIPATING",
    "65": "NOT_ALIVE",
    "66": "NON_PARTICIPATING",
    "67": "NOT_ALIVE",
    "68": "NON_PARTICIPATING",
    "69": "NON_PARTICIPATING",
    "7": "FAIL",
    "70": "NON_PARTICIPATING",
    "71": "NON_PARTICIPATING",
    "72": "NON_PARTICIPATING",
    "73": "NON_PARTICIPATING",
    "74": "NON_PARTICIPATING",
    "75": "NON_PARTICIPATING",
    "76": "NON_PARTICIPATING",
    "77": "NON_PARTICIPATING",
    "78": "NON_PARTICIPATING",
    "79": "NON_PARTICIPATING",
    "8": "NON_PARTICIPATING",
    "80": "NOT_ALIVE",
    "81": "NON_PARTICIPATING",
    "82": "NON_PARTICIPATING",
    "83": "NOT_ALIVE",
    "84": "NON_PARTICIPATING",
    "85": "NON_PARTICIPATING",
    "86": "NON_PARTICIPATING",
    "87": "NON_PARTICIPATING",
    "88": "NON_PARTICIPATING",
    "89": "NOT_ALIVE",
    "9": "NOT_ALIVE",
    "90": "NON_PARTICIPATING",
    "91": "NOT_ALIVE",
    "92": "NON_PARTICIPATING",
    "93": "NOT_ALIVE",
    "94": "NOT_ALIVE",
    "95": "NOT_ALIVE",
    "96": "NOT_ALIVE",
    "97": "NON_PARTICIPATING",
    "98": "NOT_ALIVE",
    "99": "NOT_ALIVE"
  },
  "architectures": [
    "LlamaForCausalLM"
  ],
  "attention_bias": false,
  "attention_dropout": 0.0,
  "block_list": [
    5947237,
    5947241,
    5947245
  ],
  "bos_token_id": 1,
  "eos_token_id": 2,
  "hidden_act": "silu",
  "hidden_size": 2048,
  "initializer_range": 0.02,
  "inner_step": 139,
  "intermediate_size": 5632,
  "last_allreduce_block": 5946293,
  "max_position_embeddings": 2048,
  "mlp_bias": false,
  "model_type": "llama",
  "num_attention_heads": 32,
  "num_hidden_layers": 22,
  "num_key_value_heads": 4,
  "pretraining_tp": 1,
  "rms_norm_eps": 1e-05,
  "rope_scaling": null,
  "rope_theta": 10000.0,
  "tie_word_embeddings": false,
  "torch_dtype": "float32",
  "transformers_version": "4.39.3",
  "use_cache": false,
  "vocab_size": 32000
}