File size: 7,712 Bytes
ffb00a7
 
 
 
2485426
ffb00a7
1bf57a0
ffb00a7
821c035
 
3cf3ab9
821c035
ffb00a7
3cf3ab9
a13a11d
ffb00a7
 
 
2485426
724213f
ffb00a7
724213f
3cf3ab9
ffb00a7
0df8392
ffb00a7
 
 
18d559f
821c035
bfa93f8
f79f103
18d559f
ffb00a7
81a8a0c
a13a11d
724213f
7c5c047
ffb00a7
 
 
 
a13a11d
 
f79f103
724213f
a13a11d
a3a5487
724213f
ffb00a7
724213f
bfa93f8
f79f103
5f664db
18d559f
821c035
 
ffb00a7
3cf3ab9
d2decd4
ffb00a7
 
724213f
ffb00a7
 
724213f
3cf3ab9
821c035
ffb00a7
a13a11d
0df8392
ffb00a7
3cf3ab9
2485426
f79f103
821c035
 
724213f
3cf3ab9
724213f
81a8a0c
0df8392
ffb00a7
724213f
f79f103
724213f
3cf3ab9
f79f103
0df8392
ffb00a7
 
724213f
 
ffb00a7
724213f
7c5c047
ffb00a7
3cf3ab9
ffb00a7
7c5c047
724213f
 
ffb00a7
724213f
ffb00a7
f79f103
3cf3ab9
7c5c047
f79f103
821c035
7c5c047
ffb00a7
821c035
8755095
ffb00a7
a13a11d
ffb00a7
f79f103
18d559f
821c035
f79f103
ffb00a7
f79f103
821c035
ffb00a7
 
 
 
7c5c047
2485426
724213f
7c5c047
8755095
18d559f
724213f
 
 
3cf3ab9
ffb00a7
 
 
 
2485426
5f664db
18d559f
bfa93f8
ffb00a7
821c035
ffb00a7
 
7c5c047
ffb00a7
 
 
2485426
ffb00a7
 
a3a5487
bfa93f8
724213f
ffb00a7
 
a3a5487
821c035
ffb00a7
724213f
18d559f
f79f103
ffb00a7
 
 
 
bfa93f8
ffb00a7
8755095
7c5c047
ffb00a7
7c5c047
0df8392
 
3cf3ab9
2485426
 
ffb00a7
2485426
724213f
2485426
724213f
f79f103
 
0df8392
ffb00a7
 
 
 
0df8392
7c5c047
724213f
ffb00a7
821c035
bfa93f8
ffb00a7
0df8392
3cf3ab9
ffb00a7
 
 
18d559f
 
 
ffb00a7
a3a5487
ffb00a7
 
d2decd4
ffb00a7
f79f103
724213f
ffb00a7
3cf3ab9
18d559f
3cf3ab9
724213f
bfa93f8
ffb00a7
 
 
2485426
d137aed
1bf57a0
724213f
a13a11d
724213f
d137aed
724213f
bfa93f8
724213f
ffb00a7
 
f79f103
3cf3ab9
821c035
d137aed
ffb00a7
7c5c047
18d559f
ffb00a7
 
 
 
 
821c035
a13a11d
7c5c047
5f664db
724213f
ffb00a7
0df8392
821c035
ffb00a7
 
 
 
 
 
 
54c9173
 
ffb00a7
 
 
 
 
 
54c9173
ffb00a7
724213f
ffb00a7
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
{
  "_name_or_path": "distributed/llama-1b",
  "all_reduce_scores": {
    "0": "NOT_ALIVE",
    "1": "SUCCESS",
    "10": "NOT_ALIVE",
    "100": "NON_PARTICIPATING",
    "101": "NOT_ALIVE",
    "102": "NOT_ALIVE",
    "103": "NON_PARTICIPATING",
    "104": "NON_PARTICIPATING",
    "105": "NON_PARTICIPATING",
    "106": "NOT_ALIVE",
    "107": "NON_PARTICIPATING",
    "108": "NON_PARTICIPATING",
    "109": "NOT_ALIVE",
    "11": "NOT_ALIVE",
    "110": "NOT_ALIVE",
    "111": "NON_PARTICIPATING",
    "112": "NON_PARTICIPATING",
    "113": "NOT_ALIVE",
    "114": "NOT_ALIVE",
    "115": "NON_PARTICIPATING",
    "116": "NOT_ALIVE",
    "117": "NON_PARTICIPATING",
    "118": "NOT_ALIVE",
    "119": "NON_PARTICIPATING",
    "12": "NOT_ALIVE",
    "120": "NON_PARTICIPATING",
    "121": "NON_PARTICIPATING",
    "122": "NOT_ALIVE",
    "123": "NOT_ALIVE",
    "124": "NON_PARTICIPATING",
    "125": "NOT_ALIVE",
    "126": "NOT_ALIVE",
    "127": "NON_PARTICIPATING",
    "128": "NOT_ALIVE",
    "129": "NON_PARTICIPATING",
    "13": "NOT_ALIVE",
    "130": "NOT_ALIVE",
    "131": "NOT_ALIVE",
    "132": "NOT_ALIVE",
    "133": "SUCCESS",
    "134": "NON_PARTICIPATING",
    "135": "NOT_ALIVE",
    "136": "NON_PARTICIPATING",
    "137": "NON_PARTICIPATING",
    "138": "NON_PARTICIPATING",
    "139": "NON_PARTICIPATING",
    "14": "NOT_ALIVE",
    "140": "SUCCESS",
    "141": "NOT_ALIVE",
    "142": "NOT_ALIVE",
    "143": "NON_PARTICIPATING",
    "144": "NOT_ALIVE",
    "145": "NOT_ALIVE",
    "146": "NON_PARTICIPATING",
    "147": "NOT_ALIVE",
    "148": "NON_PARTICIPATING",
    "149": "NON_PARTICIPATING",
    "15": "NOT_ALIVE",
    "150": "NOT_ALIVE",
    "151": "NOT_ALIVE",
    "152": "NOT_ALIVE",
    "153": "NON_PARTICIPATING",
    "154": "NON_PARTICIPATING",
    "155": "NON_PARTICIPATING",
    "156": "NOT_ALIVE",
    "157": "NOT_ALIVE",
    "158": "NON_PARTICIPATING",
    "159": "NON_PARTICIPATING",
    "16": "NOT_ALIVE",
    "160": "NON_PARTICIPATING",
    "161": "NON_PARTICIPATING",
    "162": "NOT_ALIVE",
    "163": "NON_PARTICIPATING",
    "164": "NON_PARTICIPATING",
    "165": "NON_PARTICIPATING",
    "166": "SUCCESS",
    "167": "NOT_ALIVE",
    "168": "NON_PARTICIPATING",
    "169": "NON_PARTICIPATING",
    "17": "NOT_ALIVE",
    "170": "NON_PARTICIPATING",
    "171": "NOT_ALIVE",
    "172": "NOT_ALIVE",
    "173": "NOT_ALIVE",
    "174": "NOT_ALIVE",
    "175": "NON_PARTICIPATING",
    "176": "NOT_ALIVE",
    "177": "NOT_ALIVE",
    "178": "NON_PARTICIPATING",
    "179": "NOT_ALIVE",
    "18": "NOT_ALIVE",
    "180": "NOT_ALIVE",
    "181": "NON_PARTICIPATING",
    "182": "NON_PARTICIPATING",
    "183": "NON_PARTICIPATING",
    "184": "NOT_ALIVE",
    "185": "NOT_ALIVE",
    "186": "NON_PARTICIPATING",
    "187": "NON_PARTICIPATING",
    "188": "NOT_ALIVE",
    "189": "NON_PARTICIPATING",
    "19": "NOT_ALIVE",
    "190": "NOT_ALIVE",
    "191": "NON_PARTICIPATING",
    "192": "NON_PARTICIPATING",
    "193": "NOT_ALIVE",
    "194": "NON_PARTICIPATING",
    "195": "NON_PARTICIPATING",
    "196": "NOT_ALIVE",
    "197": "NON_PARTICIPATING",
    "198": "NON_PARTICIPATING",
    "199": "NOT_ALIVE",
    "2": "NOT_ALIVE",
    "20": "NOT_ALIVE",
    "200": "NOT_ALIVE",
    "201": "SUCCESS",
    "202": "NON_PARTICIPATING",
    "203": "NOT_ALIVE",
    "204": "NOT_ALIVE",
    "205": "NOT_ALIVE",
    "206": "NON_PARTICIPATING",
    "207": "NOT_ALIVE",
    "208": "NOT_ALIVE",
    "209": "NOT_ALIVE",
    "21": "NOT_ALIVE",
    "210": "NON_PARTICIPATING",
    "211": "NOT_ALIVE",
    "212": "NOT_ALIVE",
    "213": "NOT_ALIVE",
    "214": "NON_PARTICIPATING",
    "215": "NON_PARTICIPATING",
    "216": "NOT_ALIVE",
    "217": "NOT_ALIVE",
    "218": "NOT_ALIVE",
    "219": "NON_PARTICIPATING",
    "22": "NOT_ALIVE",
    "220": "NOT_ALIVE",
    "221": "NOT_ALIVE",
    "222": "NOT_ALIVE",
    "223": "NON_PARTICIPATING",
    "224": "NON_PARTICIPATING",
    "225": "NON_PARTICIPATING",
    "226": "NON_PARTICIPATING",
    "227": "NOT_ALIVE",
    "228": "NOT_ALIVE",
    "229": "NOT_ALIVE",
    "23": "NOT_ALIVE",
    "230": "NON_PARTICIPATING",
    "231": "NOT_ALIVE",
    "232": "NOT_ALIVE",
    "233": "NOT_ALIVE",
    "234": "NON_PARTICIPATING",
    "235": "NOT_ALIVE",
    "236": "NOT_ALIVE",
    "237": "NON_PARTICIPATING",
    "238": "NON_PARTICIPATING",
    "239": "NOT_ALIVE",
    "24": "NOT_ALIVE",
    "240": "NOT_ALIVE",
    "241": "NON_PARTICIPATING",
    "242": "NON_PARTICIPATING",
    "243": "NOT_ALIVE",
    "244": "NOT_ALIVE",
    "245": "NOT_ALIVE",
    "246": "NON_PARTICIPATING",
    "247": "NON_PARTICIPATING",
    "248": "NOT_ALIVE",
    "249": "NOT_ALIVE",
    "25": "SUCCESS",
    "250": "NON_PARTICIPATING",
    "251": "NOT_ALIVE",
    "252": "NON_PARTICIPATING",
    "253": "NON_PARTICIPATING",
    "254": "NOT_ALIVE",
    "255": "NON_PARTICIPATING",
    "26": "NON_PARTICIPATING",
    "27": "NON_PARTICIPATING",
    "28": "NON_PARTICIPATING",
    "29": "NON_PARTICIPATING",
    "3": "NOT_ALIVE",
    "30": "NOT_ALIVE",
    "31": "SUCCESS",
    "32": "NOT_ALIVE",
    "33": "NON_PARTICIPATING",
    "34": "NOT_ALIVE",
    "35": "NOT_ALIVE",
    "36": "NOT_ALIVE",
    "37": "NOT_ALIVE",
    "38": "NOT_ALIVE",
    "39": "NOT_ALIVE",
    "4": "NOT_ALIVE",
    "40": "NON_PARTICIPATING",
    "41": "NON_PARTICIPATING",
    "42": "NOT_ALIVE",
    "43": "NOT_ALIVE",
    "44": "NOT_ALIVE",
    "45": "NON_PARTICIPATING",
    "46": "NON_PARTICIPATING",
    "47": "NOT_ALIVE",
    "48": "NON_PARTICIPATING",
    "49": "NON_PARTICIPATING",
    "5": "NOT_ALIVE",
    "50": "NOT_ALIVE",
    "51": "NOT_ALIVE",
    "52": "NON_PARTICIPATING",
    "53": "NON_PARTICIPATING",
    "54": "NOT_ALIVE",
    "55": "NON_PARTICIPATING",
    "56": "NON_PARTICIPATING",
    "57": "NON_PARTICIPATING",
    "58": "NOT_ALIVE",
    "59": "NOT_ALIVE",
    "6": "NOT_ALIVE",
    "60": "NON_PARTICIPATING",
    "61": "NOT_ALIVE",
    "62": "NOT_ALIVE",
    "63": "NON_PARTICIPATING",
    "64": "NON_PARTICIPATING",
    "65": "NON_PARTICIPATING",
    "66": "NON_PARTICIPATING",
    "67": "NOT_ALIVE",
    "68": "NOT_ALIVE",
    "69": "NON_PARTICIPATING",
    "7": "NOT_ALIVE",
    "70": "NON_PARTICIPATING",
    "71": "NON_PARTICIPATING",
    "72": "NOT_ALIVE",
    "73": "NON_PARTICIPATING",
    "74": "NON_PARTICIPATING",
    "75": "NOT_ALIVE",
    "76": "NON_PARTICIPATING",
    "77": "NOT_ALIVE",
    "78": "NON_PARTICIPATING",
    "79": "NOT_ALIVE",
    "8": "NOT_ALIVE",
    "80": "NOT_ALIVE",
    "81": "NOT_ALIVE",
    "82": "NON_PARTICIPATING",
    "83": "SUCCESS",
    "84": "NON_PARTICIPATING",
    "85": "NOT_ALIVE",
    "86": "NON_PARTICIPATING",
    "87": "NOT_ALIVE",
    "88": "NOT_ALIVE",
    "89": "NOT_ALIVE",
    "9": "NOT_ALIVE",
    "90": "NOT_ALIVE",
    "91": "NOT_ALIVE",
    "92": "NOT_ALIVE",
    "93": "NON_PARTICIPATING",
    "94": "NOT_ALIVE",
    "95": "NON_PARTICIPATING",
    "96": "NOT_ALIVE",
    "97": "NOT_ALIVE",
    "98": "NON_PARTICIPATING",
    "99": "SUCCESS"
  },
  "architectures": [
    "LlamaForCausalLM"
  ],
  "attention_bias": false,
  "attention_dropout": 0.0,
  "block_list": [
    6173328,
    6173364
  ],
  "bos_token_id": 1,
  "eos_token_id": 2,
  "hidden_act": "silu",
  "hidden_size": 2048,
  "initializer_range": 0.02,
  "inner_step": 35,
  "intermediate_size": 5632,
  "last_allreduce_block": 6172668,
  "max_position_embeddings": 2048,
  "mlp_bias": false,
  "model_type": "llama",
  "num_attention_heads": 32,
  "num_hidden_layers": 22,
  "num_key_value_heads": 4,
  "pretraining_tp": 1,
  "rms_norm_eps": 1e-05,
  "rope_scaling": null,
  "rope_theta": 10000.0,
  "tie_word_embeddings": false,
  "torch_dtype": "float32",
  "transformers_version": "4.39.3",
  "use_cache": false,
  "vocab_size": 32000
}