File size: 7,752 Bytes
525340d
cbcf2e3
525340d
 
cbcf2e3
6a78ed2
525340d
ecbfbb9
1121183
f93b459
1121183
cbcf2e3
e561b78
3b61827
e561b78
cbcf2e3
d0cde57
20daea4
f93b459
e561b78
 
 
 
 
 
 
0e87ac8
1121183
ecbfbb9
2c2c984
cbcf2e3
 
2c2c984
117ce68
e561b78
 
1121183
cbcf2e3
0558cd7
117ce68
525340d
ecbfbb9
e561b78
0e87ac8
 
a1c4112
e561b78
117ce68
e561b78
 
 
 
 
cbcf2e3
fbd5bc6
117ce68
1121183
cbcf2e3
117ce68
cbcf2e3
e561b78
20daea4
525340d
f93b459
ecbfbb9
117ce68
e561b78
 
e2c9402
1121183
f681d26
20daea4
a1c4112
e561b78
ecbfbb9
578e39d
e561b78
 
f93b459
e561b78
a1c4112
b6c484d
578e39d
2c2c984
525340d
e561b78
2c2c984
cbcf2e3
3b61827
525340d
a1c4112
f14291b
6a78ed2
f93b459
f681d26
491335c
525340d
ecbfbb9
1418c24
9b135ac
1121183
cbcf2e3
 
525340d
117ce68
e561b78
0e87ac8
f93b459
e561b78
2c2c984
e561b78
 
 
 
f93b459
a1c4112
117ce68
6480b16
ecbfbb9
2c2c984
cf4a545
e561b78
cbcf2e3
117ce68
525340d
cbcf2e3
2c2c984
491335c
e561b78
117ce68
ecbfbb9
f93b459
a1c4112
117ce68
1121183
e561b78
 
b12e878
0e87ac8
f93b459
e561b78
 
9b135ac
525340d
ecbfbb9
525340d
1121183
f93b459
2c2c984
9b135ac
e561b78
 
6f7bf24
e351beb
b12e878
e561b78
 
117ce68
 
 
e2c9402
0e87ac8
117ce68
 
e561b78
8e104eb
cbcf2e3
2c2c984
e351beb
2c2c984
117ce68
a1c4112
117ce68
20daea4
ecbfbb9
578e39d
e561b78
e2c9402
f93b459
e2c9402
b12e878
1121183
0e87ac8
e561b78
ecbfbb9
e561b78
525340d
e2c9402
e561b78
cbcf2e3
525340d
e561b78
 
 
ecbfbb9
117ce68
1121183
f14291b
f93b459
 
491335c
117ce68
 
e561b78
 
 
f93b459
ecbfbb9
cbcf2e3
fbd5bc6
fcf80cc
a1c4112
e561b78
ecbfbb9
 
9d76d54
1121183
cbcf2e3
0e87ac8
117ce68
b12e878
2c2c984
a1c4112
3b61827
e2c9402
b12e878
e561b78
e2c9402
f93b459
cbcf2e3
e561b78
1121183
ecbfbb9
1121183
e561b78
 
1121183
6a78ed2
a1c4112
cbcf2e3
e351beb
a1c4112
cbcf2e3
117ce68
ecbfbb9
 
e561b78
525340d
cbcf2e3
1121183
e561b78
 
0ffd0ce
e561b78
3b61827
e561b78
cbcf2e3
1121183
525340d
 
 
 
 
 
 
 
2a3c26a
 
525340d
 
 
 
 
 
2a3c26a
525340d
e561b78
525340d
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
{
  "_name_or_path": "distributed/llama-1b",
  "all_reduce_scores": {
    "0": "NOT_ALIVE",
    "1": "NON_PARTICIPATING",
    "10": "NOT_ALIVE",
    "100": "NOT_ALIVE",
    "101": "NOT_ALIVE",
    "102": "NON_PARTICIPATING",
    "103": "NON_PARTICIPATING",
    "104": "NOT_ALIVE",
    "105": "NON_PARTICIPATING",
    "106": "NON_PARTICIPATING",
    "107": "NOT_ALIVE",
    "108": "SUCCESS",
    "109": "NON_PARTICIPATING",
    "11": "NOT_ALIVE",
    "110": "NOT_ALIVE",
    "111": "NON_PARTICIPATING",
    "112": "SUCCESS",
    "113": "NON_PARTICIPATING",
    "114": "NOT_ALIVE",
    "115": "NON_PARTICIPATING",
    "116": "NOT_ALIVE",
    "117": "NOT_ALIVE",
    "118": "NOT_ALIVE",
    "119": "NON_PARTICIPATING",
    "12": "NOT_ALIVE",
    "120": "NON_PARTICIPATING",
    "121": "NON_PARTICIPATING",
    "122": "NON_PARTICIPATING",
    "123": "NON_PARTICIPATING",
    "124": "NON_PARTICIPATING",
    "125": "NON_PARTICIPATING",
    "126": "NOT_ALIVE",
    "127": "NOT_ALIVE",
    "128": "NON_PARTICIPATING",
    "129": "NON_PARTICIPATING",
    "13": "NOT_ALIVE",
    "130": "NON_PARTICIPATING",
    "131": "NOT_ALIVE",
    "132": "NON_PARTICIPATING",
    "133": "NON_PARTICIPATING",
    "134": "NON_PARTICIPATING",
    "135": "NON_PARTICIPATING",
    "136": "NON_PARTICIPATING",
    "137": "NOT_ALIVE",
    "138": "NON_PARTICIPATING",
    "139": "NOT_ALIVE",
    "14": "SUCCESS",
    "140": "NON_PARTICIPATING",
    "141": "NOT_ALIVE",
    "142": "NOT_ALIVE",
    "143": "NON_PARTICIPATING",
    "144": "NOT_ALIVE",
    "145": "NON_PARTICIPATING",
    "146": "NOT_ALIVE",
    "147": "NON_PARTICIPATING",
    "148": "NOT_ALIVE",
    "149": "NON_PARTICIPATING",
    "15": "NON_PARTICIPATING",
    "150": "NOT_ALIVE",
    "151": "NOT_ALIVE",
    "152": "NON_PARTICIPATING",
    "153": "NOT_ALIVE",
    "154": "NON_PARTICIPATING",
    "155": "NON_PARTICIPATING",
    "156": "NOT_ALIVE",
    "157": "NOT_ALIVE",
    "158": "NOT_ALIVE",
    "159": "NOT_ALIVE",
    "16": "NON_PARTICIPATING",
    "160": "NON_PARTICIPATING",
    "161": "NOT_ALIVE",
    "162": "NON_PARTICIPATING",
    "163": "NOT_ALIVE",
    "164": "NOT_ALIVE",
    "165": "NOT_ALIVE",
    "166": "NON_PARTICIPATING",
    "167": "NOT_ALIVE",
    "168": "NON_PARTICIPATING",
    "169": "NOT_ALIVE",
    "17": "NOT_ALIVE",
    "170": "NOT_ALIVE",
    "171": "NOT_ALIVE",
    "172": "NON_PARTICIPATING",
    "173": "NON_PARTICIPATING",
    "174": "NON_PARTICIPATING",
    "175": "NOT_ALIVE",
    "176": "NOT_ALIVE",
    "177": "NOT_ALIVE",
    "178": "NOT_ALIVE",
    "179": "NOT_ALIVE",
    "18": "NON_PARTICIPATING",
    "180": "NOT_ALIVE",
    "181": "NOT_ALIVE",
    "182": "NOT_ALIVE",
    "183": "SUCCESS",
    "184": "NON_PARTICIPATING",
    "185": "NOT_ALIVE",
    "186": "NOT_ALIVE",
    "187": "NON_PARTICIPATING",
    "188": "NON_PARTICIPATING",
    "189": "NOT_ALIVE",
    "19": "NON_PARTICIPATING",
    "190": "NON_PARTICIPATING",
    "191": "NON_PARTICIPATING",
    "192": "NON_PARTICIPATING",
    "193": "NOT_ALIVE",
    "194": "NON_PARTICIPATING",
    "195": "NOT_ALIVE",
    "196": "NON_PARTICIPATING",
    "197": "NOT_ALIVE",
    "198": "NOT_ALIVE",
    "199": "NON_PARTICIPATING",
    "2": "NON_PARTICIPATING",
    "20": "NOT_ALIVE",
    "200": "NOT_ALIVE",
    "201": "NOT_ALIVE",
    "202": "NON_PARTICIPATING",
    "203": "NOT_ALIVE",
    "204": "NOT_ALIVE",
    "205": "NON_PARTICIPATING",
    "206": "NON_PARTICIPATING",
    "207": "NOT_ALIVE",
    "208": "NON_PARTICIPATING",
    "209": "NOT_ALIVE",
    "21": "NOT_ALIVE",
    "210": "NON_PARTICIPATING",
    "211": "NON_PARTICIPATING",
    "212": "SUCCESS",
    "213": "NON_PARTICIPATING",
    "214": "NON_PARTICIPATING",
    "215": "SUCCESS",
    "216": "NOT_ALIVE",
    "217": "NOT_ALIVE",
    "218": "NOT_ALIVE",
    "219": "NOT_ALIVE",
    "22": "NON_PARTICIPATING",
    "220": "NON_PARTICIPATING",
    "221": "NOT_ALIVE",
    "222": "NOT_ALIVE",
    "223": "NOT_ALIVE",
    "224": "NOT_ALIVE",
    "225": "NON_PARTICIPATING",
    "226": "NOT_ALIVE",
    "227": "NOT_ALIVE",
    "228": "NOT_ALIVE",
    "229": "NON_PARTICIPATING",
    "23": "NON_PARTICIPATING",
    "230": "NON_PARTICIPATING",
    "231": "SUCCESS",
    "232": "NOT_ALIVE",
    "233": "NOT_ALIVE",
    "234": "NOT_ALIVE",
    "235": "NON_PARTICIPATING",
    "236": "NOT_ALIVE",
    "237": "NON_PARTICIPATING",
    "238": "NON_PARTICIPATING",
    "239": "NOT_ALIVE",
    "24": "NOT_ALIVE",
    "240": "NON_PARTICIPATING",
    "241": "SUCCESS",
    "242": "NON_PARTICIPATING",
    "243": "NON_PARTICIPATING",
    "244": "NOT_ALIVE",
    "245": "NON_PARTICIPATING",
    "246": "NOT_ALIVE",
    "247": "NON_PARTICIPATING",
    "248": "NON_PARTICIPATING",
    "249": "NON_PARTICIPATING",
    "25": "SUCCESS",
    "250": "SUCCESS",
    "251": "NOT_ALIVE",
    "252": "NOT_ALIVE",
    "253": "NOT_ALIVE",
    "254": "NON_PARTICIPATING",
    "255": "NOT_ALIVE",
    "26": "NON_PARTICIPATING",
    "27": "NOT_ALIVE",
    "28": "NOT_ALIVE",
    "29": "NON_PARTICIPATING",
    "3": "NON_PARTICIPATING",
    "30": "NOT_ALIVE",
    "31": "NON_PARTICIPATING",
    "32": "NON_PARTICIPATING",
    "33": "NOT_ALIVE",
    "34": "NOT_ALIVE",
    "35": "NON_PARTICIPATING",
    "36": "NON_PARTICIPATING",
    "37": "NOT_ALIVE",
    "38": "NON_PARTICIPATING",
    "39": "SUCCESS",
    "4": "NOT_ALIVE",
    "40": "NON_PARTICIPATING",
    "41": "NON_PARTICIPATING",
    "42": "NOT_ALIVE",
    "43": "NOT_ALIVE",
    "44": "NOT_ALIVE",
    "45": "NOT_ALIVE",
    "46": "NOT_ALIVE",
    "47": "SUCCESS",
    "48": "NON_PARTICIPATING",
    "49": "NON_PARTICIPATING",
    "5": "NON_PARTICIPATING",
    "50": "NOT_ALIVE",
    "51": "NOT_ALIVE",
    "52": "SUCCESS",
    "53": "NON_PARTICIPATING",
    "54": "NOT_ALIVE",
    "55": "NOT_ALIVE",
    "56": "NON_PARTICIPATING",
    "57": "NOT_ALIVE",
    "58": "NON_PARTICIPATING",
    "59": "NON_PARTICIPATING",
    "6": "NON_PARTICIPATING",
    "60": "NOT_ALIVE",
    "61": "NON_PARTICIPATING",
    "62": "NON_PARTICIPATING",
    "63": "SUCCESS",
    "64": "NOT_ALIVE",
    "65": "NON_PARTICIPATING",
    "66": "NON_PARTICIPATING",
    "67": "NOT_ALIVE",
    "68": "NOT_ALIVE",
    "69": "NOT_ALIVE",
    "7": "NOT_ALIVE",
    "70": "NOT_ALIVE",
    "71": "NON_PARTICIPATING",
    "72": "NON_PARTICIPATING",
    "73": "NOT_ALIVE",
    "74": "NOT_ALIVE",
    "75": "NON_PARTICIPATING",
    "76": "NOT_ALIVE",
    "77": "SUCCESS",
    "78": "NON_PARTICIPATING",
    "79": "NON_PARTICIPATING",
    "8": "NOT_ALIVE",
    "80": "NOT_ALIVE",
    "81": "NON_PARTICIPATING",
    "82": "NON_PARTICIPATING",
    "83": "NON_PARTICIPATING",
    "84": "NON_PARTICIPATING",
    "85": "NON_PARTICIPATING",
    "86": "NON_PARTICIPATING",
    "87": "NOT_ALIVE",
    "88": "NON_PARTICIPATING",
    "89": "NOT_ALIVE",
    "9": "NON_PARTICIPATING",
    "90": "NOT_ALIVE",
    "91": "NOT_ALIVE",
    "92": "SUCCESS",
    "93": "NOT_ALIVE",
    "94": "SUCCESS",
    "95": "NOT_ALIVE",
    "96": "NOT_ALIVE",
    "97": "NON_PARTICIPATING",
    "98": "NOT_ALIVE",
    "99": "NOT_ALIVE"
  },
  "architectures": [
    "LlamaForCausalLM"
  ],
  "attention_bias": false,
  "attention_dropout": 0.0,
  "block_list": [
    6018914,
    6018944
  ],
  "bos_token_id": 1,
  "eos_token_id": 2,
  "hidden_act": "silu",
  "hidden_size": 2048,
  "initializer_range": 0.02,
  "inner_step": 46,
  "intermediate_size": 5632,
  "last_allreduce_block": 6016469,
  "max_position_embeddings": 2048,
  "mlp_bias": false,
  "model_type": "llama",
  "num_attention_heads": 32,
  "num_hidden_layers": 22,
  "num_key_value_heads": 4,
  "pretraining_tp": 1,
  "rms_norm_eps": 1e-05,
  "rope_scaling": null,
  "rope_theta": 10000.0,
  "tie_word_embeddings": false,
  "torch_dtype": "float32",
  "transformers_version": "4.39.3",
  "use_cache": false,
  "vocab_size": 32000
}