File size: 8,038 Bytes
e5897f8
b1afe42
e5897f8
12db233
4da8067
761c1ef
12db233
b1afe42
47da96a
548f0cd
08106c0
 
b1afe42
47158b3
f9831f5
761c1ef
4da8067
b1afe42
4da8067
 
47da96a
1810e14
08106c0
4da8067
 
0f9973c
548f0cd
0f9973c
1810e14
548f0cd
4da8067
2265fa2
548f0cd
b1afe42
761c1ef
ff51a4a
47da96a
08106c0
ff51a4a
08106c0
12db233
4da8067
b1afe42
0f9973c
ff51a4a
548f0cd
b1afe42
4da8067
b1afe42
 
548f0cd
b1afe42
f9831f5
7b11a18
4da8067
5c10b84
 
b1afe42
08106c0
 
548f0cd
08106c0
12db233
08106c0
b1afe42
4da8067
 
b1afe42
2265fa2
4da8067
 
 
f9831f5
4da8067
08106c0
01d6022
f9831f5
 
01d6022
ff51a4a
4da8067
5c10b84
47da96a
08106c0
5b096e8
4da8067
b1afe42
1810e14
47158b3
12db233
f9831f5
1810e14
47da96a
4da8067
c61bb5c
548f0cd
a0d16ca
4da8067
f9831f5
4da8067
b1afe42
 
f9831f5
12db233
184f0ad
5b096e8
1f7774c
b1afe42
 
c61bb5c
 
4da8067
 
 
 
761c1ef
1810e14
0f9973c
548f0cd
7b11a18
08106c0
e80f1c3
b1afe42
4da8067
12db233
4da8067
1810e14
548f0cd
4da8067
1810e14
08106c0
4da8067
 
 
 
761c1ef
f9831f5
08106c0
4da8067
39c38b5
a0d16ca
f9831f5
e80f1c3
12db233
b1afe42
b2fe2ee
08106c0
 
4da8067
ff51a4a
b1afe42
1810e14
761c1ef
f9831f5
 
 
 
1810e14
f9831f5
 
 
47da96a
 
b1afe42
1810e14
548f0cd
4da8067
47da96a
4da8067
1810e14
08106c0
e5897f8
1810e14
08106c0
4da8067
1810e14
2265fa2
548f0cd
08106c0
39c38b5
4da8067
47158b3
2265fa2
4da8067
184f0ad
4da8067
12db233
b1afe42
f9831f5
4da8067
10b97ac
4da8067
b1afe42
4da8067
1810e14
4da8067
 
b1afe42
1810e14
761c1ef
548f0cd
1810e14
b1afe42
548f0cd
f9831f5
761c1ef
08106c0
 
b1afe42
 
4da8067
 
548f0cd
761c1ef
4da8067
08106c0
4da8067
 
b1afe42
4da8067
08106c0
b1afe42
f9831f5
47158b3
4da8067
 
 
08106c0
0f9973c
08106c0
5c10b84
b1afe42
4da8067
2265fa2
f9831f5
1810e14
39c38b5
2265fa2
f9831f5
08106c0
4da8067
b1afe42
4da8067
08106c0
761c1ef
548f0cd
2265fa2
e80f1c3
548f0cd
 
f9831f5
4da8067
08106c0
b1afe42
47158b3
f9831f5
4da8067
f9831f5
10b97ac
e5897f8
 
 
 
 
 
3c62c07
b40d939
 
 
3c62c07
e5897f8
 
 
 
 
b40d939
e5897f8
4da8067
e5897f8
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
{
  "_name_or_path": "distributed/llama-1b",
  "all_reduce_scores": {
    "0": "NOT_ALIVE",
    "1": "NON_PARTICIPATING",
    "10": "NON_PARTICIPATING",
    "100": "NOT_ALIVE",
    "101": "NOT_ALIVE",
    "102": "NON_PARTICIPATING",
    "103": "NON_PARTICIPATING",
    "104": "NON_PARTICIPATING",
    "105": "NON_PARTICIPATING",
    "106": "NON_PARTICIPATING",
    "107": "NOT_ALIVE",
    "108": "NOT_ALIVE",
    "109": "NOT_ALIVE",
    "11": "NON_PARTICIPATING",
    "110": "NON_PARTICIPATING",
    "111": "NON_PARTICIPATING",
    "112": "NOT_ALIVE",
    "113": "NOT_ALIVE",
    "114": "NON_PARTICIPATING",
    "115": "NON_PARTICIPATING",
    "116": "NOT_ALIVE",
    "117": "NON_PARTICIPATING",
    "118": "NON_PARTICIPATING",
    "119": "NON_PARTICIPATING",
    "12": "NON_PARTICIPATING",
    "120": "NON_PARTICIPATING",
    "121": "NOT_ALIVE",
    "122": "NOT_ALIVE",
    "123": "NON_PARTICIPATING",
    "124": "NON_PARTICIPATING",
    "125": "NON_PARTICIPATING",
    "126": "NOT_ALIVE",
    "127": "NON_PARTICIPATING",
    "128": "NOT_ALIVE",
    "129": "NON_PARTICIPATING",
    "13": "NON_PARTICIPATING",
    "130": "NON_PARTICIPATING",
    "131": "NOT_ALIVE",
    "132": "NON_PARTICIPATING",
    "133": "NON_PARTICIPATING",
    "134": "NON_PARTICIPATING",
    "135": "NON_PARTICIPATING",
    "136": "NON_PARTICIPATING",
    "137": "NON_PARTICIPATING",
    "138": "NON_PARTICIPATING",
    "139": "NOT_ALIVE",
    "14": "SUCCESS",
    "140": "NOT_ALIVE",
    "141": "NOT_ALIVE",
    "142": "NON_PARTICIPATING",
    "143": "NON_PARTICIPATING",
    "144": "NOT_ALIVE",
    "145": "NON_PARTICIPATING",
    "146": "NON_PARTICIPATING",
    "147": "NOT_ALIVE",
    "148": "NON_PARTICIPATING",
    "149": "NON_PARTICIPATING",
    "15": "NON_PARTICIPATING",
    "150": "NON_PARTICIPATING",
    "151": "NOT_ALIVE",
    "152": "NOT_ALIVE",
    "153": "NON_PARTICIPATING",
    "154": "NON_PARTICIPATING",
    "155": "NON_PARTICIPATING",
    "156": "NON_PARTICIPATING",
    "157": "NON_PARTICIPATING",
    "158": "NOT_ALIVE",
    "159": "NON_PARTICIPATING",
    "16": "NOT_ALIVE",
    "160": "NON_PARTICIPATING",
    "161": "NON_PARTICIPATING",
    "162": "NON_PARTICIPATING",
    "163": "NON_PARTICIPATING",
    "164": "SUCCESS",
    "165": "NON_PARTICIPATING",
    "166": "NON_PARTICIPATING",
    "167": "NON_PARTICIPATING",
    "168": "NON_PARTICIPATING",
    "169": "NOT_ALIVE",
    "17": "NON_PARTICIPATING",
    "170": "NON_PARTICIPATING",
    "171": "NOT_ALIVE",
    "172": "NOT_ALIVE",
    "173": "NON_PARTICIPATING",
    "174": "NON_PARTICIPATING",
    "175": "NOT_ALIVE",
    "176": "NOT_ALIVE",
    "177": "NOT_ALIVE",
    "178": "NON_PARTICIPATING",
    "179": "NON_PARTICIPATING",
    "18": "NOT_ALIVE",
    "180": "NOT_ALIVE",
    "181": "NOT_ALIVE",
    "182": "NOT_ALIVE",
    "183": "SUCCESS",
    "184": "NON_PARTICIPATING",
    "185": "NON_PARTICIPATING",
    "186": "NON_PARTICIPATING",
    "187": "NOT_ALIVE",
    "188": "NOT_ALIVE",
    "189": "NOT_ALIVE",
    "19": "NOT_ALIVE",
    "190": "NON_PARTICIPATING",
    "191": "NOT_ALIVE",
    "192": "NON_PARTICIPATING",
    "193": "NON_PARTICIPATING",
    "194": "NON_PARTICIPATING",
    "195": "NON_PARTICIPATING",
    "196": "NON_PARTICIPATING",
    "197": "NOT_ALIVE",
    "198": "NOT_ALIVE",
    "199": "NON_PARTICIPATING",
    "2": "NON_PARTICIPATING",
    "20": "NON_PARTICIPATING",
    "200": "NOT_ALIVE",
    "201": "NOT_ALIVE",
    "202": "NON_PARTICIPATING",
    "203": "NON_PARTICIPATING",
    "204": "NON_PARTICIPATING",
    "205": "NON_PARTICIPATING",
    "206": "NON_PARTICIPATING",
    "207": "NOT_ALIVE",
    "208": "NOT_ALIVE",
    "209": "NOT_ALIVE",
    "21": "NOT_ALIVE",
    "210": "NOT_ALIVE",
    "211": "NON_PARTICIPATING",
    "212": "NON_PARTICIPATING",
    "213": "NON_PARTICIPATING",
    "214": "NON_PARTICIPATING",
    "215": "SUCCESS",
    "216": "NOT_ALIVE",
    "217": "NON_PARTICIPATING",
    "218": "NON_PARTICIPATING",
    "219": "NON_PARTICIPATING",
    "22": "NON_PARTICIPATING",
    "220": "NON_PARTICIPATING",
    "221": "NOT_ALIVE",
    "222": "NOT_ALIVE",
    "223": "NON_PARTICIPATING",
    "224": "NOT_ALIVE",
    "225": "NON_PARTICIPATING",
    "226": "NOT_ALIVE",
    "227": "NON_PARTICIPATING",
    "228": "NON_PARTICIPATING",
    "229": "NON_PARTICIPATING",
    "23": "NON_PARTICIPATING",
    "230": "NON_PARTICIPATING",
    "231": "NOT_ALIVE",
    "232": "NOT_ALIVE",
    "233": "NON_PARTICIPATING",
    "234": "NON_PARTICIPATING",
    "235": "NON_PARTICIPATING",
    "236": "NOT_ALIVE",
    "237": "NON_PARTICIPATING",
    "238": "NON_PARTICIPATING",
    "239": "NON_PARTICIPATING",
    "24": "NON_PARTICIPATING",
    "240": "NOT_ALIVE",
    "241": "NON_PARTICIPATING",
    "242": "NON_PARTICIPATING",
    "243": "NOT_ALIVE",
    "244": "NON_PARTICIPATING",
    "245": "SUCCESS",
    "246": "NON_PARTICIPATING",
    "247": "NON_PARTICIPATING",
    "248": "NOT_ALIVE",
    "249": "NOT_ALIVE",
    "25": "SUCCESS",
    "250": "NON_PARTICIPATING",
    "251": "NOT_ALIVE",
    "252": "NON_PARTICIPATING",
    "253": "NON_PARTICIPATING",
    "254": "NON_PARTICIPATING",
    "255": "NOT_ALIVE",
    "26": "NON_PARTICIPATING",
    "27": "NON_PARTICIPATING",
    "28": "NOT_ALIVE",
    "29": "NON_PARTICIPATING",
    "3": "NON_PARTICIPATING",
    "30": "SUCCESS",
    "31": "NON_PARTICIPATING",
    "32": "NON_PARTICIPATING",
    "33": "NOT_ALIVE",
    "34": "NOT_ALIVE",
    "35": "NOT_ALIVE",
    "36": "SUCCESS",
    "37": "NOT_ALIVE",
    "38": "SUCCESS",
    "39": "SUCCESS",
    "4": "NOT_ALIVE",
    "40": "NON_PARTICIPATING",
    "41": "NOT_ALIVE",
    "42": "SUCCESS",
    "43": "NON_PARTICIPATING",
    "44": "NON_PARTICIPATING",
    "45": "NOT_ALIVE",
    "46": "NOT_ALIVE",
    "47": "NON_PARTICIPATING",
    "48": "NOT_ALIVE",
    "49": "NON_PARTICIPATING",
    "5": "SUCCESS",
    "50": "NON_PARTICIPATING",
    "51": "NON_PARTICIPATING",
    "52": "NON_PARTICIPATING",
    "53": "NON_PARTICIPATING",
    "54": "NOT_ALIVE",
    "55": "NOT_ALIVE",
    "56": "SUCCESS",
    "57": "NON_PARTICIPATING",
    "58": "NON_PARTICIPATING",
    "59": "SUCCESS",
    "6": "NON_PARTICIPATING",
    "60": "NOT_ALIVE",
    "61": "NOT_ALIVE",
    "62": "SUCCESS",
    "63": "SUCCESS",
    "64": "NON_PARTICIPATING",
    "65": "NON_PARTICIPATING",
    "66": "NON_PARTICIPATING",
    "67": "NOT_ALIVE",
    "68": "NON_PARTICIPATING",
    "69": "NON_PARTICIPATING",
    "7": "SUCCESS",
    "70": "NON_PARTICIPATING",
    "71": "NON_PARTICIPATING",
    "72": "NON_PARTICIPATING",
    "73": "NON_PARTICIPATING",
    "74": "NOT_ALIVE",
    "75": "NOT_ALIVE",
    "76": "NON_PARTICIPATING",
    "77": "NON_PARTICIPATING",
    "78": "NON_PARTICIPATING",
    "79": "NON_PARTICIPATING",
    "8": "NON_PARTICIPATING",
    "80": "NOT_ALIVE",
    "81": "NON_PARTICIPATING",
    "82": "NOT_ALIVE",
    "83": "NON_PARTICIPATING",
    "84": "NOT_ALIVE",
    "85": "NON_PARTICIPATING",
    "86": "NON_PARTICIPATING",
    "87": "NON_PARTICIPATING",
    "88": "NON_PARTICIPATING",
    "89": "NOT_ALIVE",
    "9": "NOT_ALIVE",
    "90": "NON_PARTICIPATING",
    "91": "NOT_ALIVE",
    "92": "NOT_ALIVE",
    "93": "NOT_ALIVE",
    "94": "NON_PARTICIPATING",
    "95": "NOT_ALIVE",
    "96": "NOT_ALIVE",
    "97": "NON_PARTICIPATING",
    "98": "NOT_ALIVE",
    "99": "NOT_ALIVE"
  },
  "architectures": [
    "LlamaForCausalLM"
  ],
  "attention_bias": false,
  "attention_dropout": 0.0,
  "block_list": [
    5950315,
    5950318,
    5950322
  ],
  "bos_token_id": 1,
  "eos_token_id": 2,
  "hidden_act": "silu",
  "hidden_size": 2048,
  "initializer_range": 0.02,
  "inner_step": 237,
  "intermediate_size": 5632,
  "last_allreduce_block": 5948952,
  "max_position_embeddings": 2048,
  "mlp_bias": false,
  "model_type": "llama",
  "num_attention_heads": 32,
  "num_hidden_layers": 22,
  "num_key_value_heads": 4,
  "pretraining_tp": 1,
  "rms_norm_eps": 1e-05,
  "rope_scaling": null,
  "rope_theta": 10000.0,
  "tie_word_embeddings": false,
  "torch_dtype": "float32",
  "transformers_version": "4.39.3",
  "use_cache": false,
  "vocab_size": 32000
}