File size: 7,630 Bytes
3e14650
499ceb5
3e14650
 
c4caab2
197772a
3e14650
2a109f1
b095aeb
a6de76c
186a4ae
 
 
d87e190
fce7390
 
ecec6f4
4592c74
186a4ae
a6de76c
fce7390
2a109f1
186a4ae
2a109f1
fce7390
8969aca
b095aeb
c4caab2
b095aeb
499ceb5
4592c74
67abc5b
2a109f1
f9acf08
fce7390
8969aca
b0f58de
3c89c92
dee89c3
c4caab2
3e14650
fce7390
a6de76c
fce7390
 
a6de76c
88322b9
a6de76c
3c89c92
a6de76c
186a4ae
fce7390
2a109f1
f9acf08
88322b9
fce7390
3c89c92
2a109f1
fce7390
200b7b4
a6de76c
4592c74
3e14650
0c50bdc
2a109f1
186a4ae
fce7390
dee89c3
fce7390
2a109f1
f9acf08
e738bd7
3c89c92
fce7390
a6de76c
8969aca
fce7390
 
a6de76c
fce7390
4592c74
445d97b
8969aca
2a109f1
3e14650
b095aeb
fce7390
186a4ae
d87e190
3e14650
5472281
a6de76c
197772a
8969aca
f9acf08
499ceb5
a801e82
fce7390
186a4ae
c4caab2
f9acf08
b095aeb
fce7390
3e14650
d8cff93
dee89c3
3e14650
b095aeb
4592c74
fce7390
2a109f1
a6de76c
2a109f1
b095aeb
fce7390
b095aeb
c4caab2
5afff4c
85b6324
67abc5b
 
a6de76c
fce7390
 
3e14650
186a4ae
b095aeb
499ceb5
fce7390
186a4ae
2a109f1
fce7390
b095aeb
2a109f1
186a4ae
ecec6f4
88322b9
b095aeb
 
2a109f1
238e681
5472281
c4caab2
3e14650
200b7b4
3e14650
b095aeb
3c89c92
186a4ae
c4caab2
a6de76c
85b6324
e76c0fb
66eb166
b095aeb
f9acf08
5472281
fce7390
88322b9
8969aca
fce7390
b0f58de
88322b9
b095aeb
2a109f1
52fa8ef
2a109f1
85b6324
66eb166
a6de76c
0c50bdc
3e14650
a6de76c
4592c74
a6de76c
8969aca
2a109f1
fce7390
3c89c92
fce7390
b095aeb
c4caab2
fce7390
2a109f1
 
fce7390
3e14650
fce7390
2a109f1
1f2ceb5
a801e82
4592c74
2a109f1
b095aeb
2a109f1
c4caab2
 
a6de76c
4592c74
e76c0fb
499ceb5
fce7390
 
66eb166
a6de76c
b095aeb
a6de76c
fce7390
 
88322b9
36a5a33
66eb166
e738bd7
a6de76c
fce7390
2a109f1
a6de76c
186a4ae
b095aeb
fce7390
b095aeb
88322b9
197772a
d87e190
fce7390
b095aeb
fce7390
 
186a4ae
b095aeb
fce7390
3c89c92
4592c74
fce7390
85b6324
197772a
1f2ceb5
197772a
4592c74
b095aeb
66eb166
b095aeb
fce7390
 
 
85b6324
3c89c92
238e681
4592c74
a6de76c
88322b9
2a109f1
3c89c92
fce7390
d87e190
fce7390
4592c74
2447bb4
a801e82
3e14650
 
 
 
 
 
 
e12e32f
 
3e14650
 
 
 
 
 
e12e32f
3e14650
fce7390
3e14650
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
{
  "_name_or_path": "distributed/llama-1b",
  "all_reduce_scores": {
    "0": "NOT_ALIVE",
    "1": "NOT_ALIVE",
    "10": "NOT_ALIVE",
    "100": "NOT_ALIVE",
    "101": "NON_PARTICIPATING",
    "102": "NOT_ALIVE",
    "103": "NON_PARTICIPATING",
    "104": "NON_PARTICIPATING",
    "105": "NON_PARTICIPATING",
    "106": "NON_PARTICIPATING",
    "107": "NOT_ALIVE",
    "108": "SUCCESS",
    "109": "NOT_ALIVE",
    "11": "NOT_ALIVE",
    "110": "NON_PARTICIPATING",
    "111": "NON_PARTICIPATING",
    "112": "NON_PARTICIPATING",
    "113": "NOT_ALIVE",
    "114": "NON_PARTICIPATING",
    "115": "NON_PARTICIPATING",
    "116": "NON_PARTICIPATING",
    "117": "NON_PARTICIPATING",
    "118": "NOT_ALIVE",
    "119": "NOT_ALIVE",
    "12": "NON_PARTICIPATING",
    "120": "NOT_ALIVE",
    "121": "NOT_ALIVE",
    "122": "NON_PARTICIPATING",
    "123": "NOT_ALIVE",
    "124": "SUCCESS",
    "125": "NON_PARTICIPATING",
    "126": "NOT_ALIVE",
    "127": "NOT_ALIVE",
    "128": "NOT_ALIVE",
    "129": "NON_PARTICIPATING",
    "13": "NOT_ALIVE",
    "130": "NOT_ALIVE",
    "131": "NOT_ALIVE",
    "132": "NOT_ALIVE",
    "133": "NON_PARTICIPATING",
    "134": "NOT_ALIVE",
    "135": "NON_PARTICIPATING",
    "136": "NON_PARTICIPATING",
    "137": "NON_PARTICIPATING",
    "138": "SUCCESS",
    "139": "NON_PARTICIPATING",
    "14": "SUCCESS",
    "140": "NON_PARTICIPATING",
    "141": "NON_PARTICIPATING",
    "142": "NOT_ALIVE",
    "143": "NON_PARTICIPATING",
    "144": "NOT_ALIVE",
    "145": "NOT_ALIVE",
    "146": "NON_PARTICIPATING",
    "147": "NON_PARTICIPATING",
    "148": "SUCCESS",
    "149": "NON_PARTICIPATING",
    "15": "SUCCESS",
    "150": "NOT_ALIVE",
    "151": "NOT_ALIVE",
    "152": "NOT_ALIVE",
    "153": "SUCCESS",
    "154": "NON_PARTICIPATING",
    "155": "SUCCESS",
    "156": "NOT_ALIVE",
    "157": "NOT_ALIVE",
    "158": "NON_PARTICIPATING",
    "159": "NOT_ALIVE",
    "16": "NON_PARTICIPATING",
    "160": "NON_PARTICIPATING",
    "161": "NON_PARTICIPATING",
    "162": "NOT_ALIVE",
    "163": "NOT_ALIVE",
    "164": "SUCCESS",
    "165": "SUCCESS",
    "166": "NOT_ALIVE",
    "167": "NON_PARTICIPATING",
    "168": "SUCCESS",
    "169": "NOT_ALIVE",
    "17": "NOT_ALIVE",
    "170": "NON_PARTICIPATING",
    "171": "NOT_ALIVE",
    "172": "NOT_ALIVE",
    "173": "SUCCESS",
    "174": "NON_PARTICIPATING",
    "175": "NOT_ALIVE",
    "176": "NOT_ALIVE",
    "177": "NOT_ALIVE",
    "178": "NOT_ALIVE",
    "179": "NOT_ALIVE",
    "18": "NOT_ALIVE",
    "180": "NOT_ALIVE",
    "181": "NOT_ALIVE",
    "182": "NOT_ALIVE",
    "183": "SUCCESS",
    "184": "NON_PARTICIPATING",
    "185": "NOT_ALIVE",
    "186": "NON_PARTICIPATING",
    "187": "NOT_ALIVE",
    "188": "NOT_ALIVE",
    "189": "NOT_ALIVE",
    "19": "NOT_ALIVE",
    "190": "NON_PARTICIPATING",
    "191": "NOT_ALIVE",
    "192": "NOT_ALIVE",
    "193": "NOT_ALIVE",
    "194": "NOT_ALIVE",
    "195": "NOT_ALIVE",
    "196": "NON_PARTICIPATING",
    "197": "SUCCESS",
    "198": "NOT_ALIVE",
    "199": "NON_PARTICIPATING",
    "2": "NOT_ALIVE",
    "20": "NOT_ALIVE",
    "200": "NOT_ALIVE",
    "201": "NON_PARTICIPATING",
    "202": "NOT_ALIVE",
    "203": "NOT_ALIVE",
    "204": "SUCCESS",
    "205": "NOT_ALIVE",
    "206": "NOT_ALIVE",
    "207": "NOT_ALIVE",
    "208": "NON_PARTICIPATING",
    "209": "NOT_ALIVE",
    "21": "NOT_ALIVE",
    "210": "NOT_ALIVE",
    "211": "NON_PARTICIPATING",
    "212": "NON_PARTICIPATING",
    "213": "NON_PARTICIPATING",
    "214": "NON_PARTICIPATING",
    "215": "SUCCESS",
    "216": "NON_PARTICIPATING",
    "217": "NON_PARTICIPATING",
    "218": "NON_PARTICIPATING",
    "219": "NOT_ALIVE",
    "22": "NOT_ALIVE",
    "220": "NON_PARTICIPATING",
    "221": "NOT_ALIVE",
    "222": "NOT_ALIVE",
    "223": "NOT_ALIVE",
    "224": "NOT_ALIVE",
    "225": "NOT_ALIVE",
    "226": "NOT_ALIVE",
    "227": "NON_PARTICIPATING",
    "228": "NON_PARTICIPATING",
    "229": "NON_PARTICIPATING",
    "23": "NON_PARTICIPATING",
    "230": "NON_PARTICIPATING",
    "231": "NOT_ALIVE",
    "232": "NOT_ALIVE",
    "233": "NOT_ALIVE",
    "234": "NOT_ALIVE",
    "235": "NON_PARTICIPATING",
    "236": "NOT_ALIVE",
    "237": "SUCCESS",
    "238": "NON_PARTICIPATING",
    "239": "NOT_ALIVE",
    "24": "NOT_ALIVE",
    "240": "NOT_ALIVE",
    "241": "NON_PARTICIPATING",
    "242": "NOT_ALIVE",
    "243": "NON_PARTICIPATING",
    "244": "NOT_ALIVE",
    "245": "NOT_ALIVE",
    "246": "NON_PARTICIPATING",
    "247": "NON_PARTICIPATING",
    "248": "NON_PARTICIPATING",
    "249": "NOT_ALIVE",
    "25": "SUCCESS",
    "250": "SUCCESS",
    "251": "NON_PARTICIPATING",
    "252": "NON_PARTICIPATING",
    "253": "NOT_ALIVE",
    "254": "SUCCESS",
    "255": "NOT_ALIVE",
    "26": "NON_PARTICIPATING",
    "27": "NOT_ALIVE",
    "28": "NOT_ALIVE",
    "29": "NOT_ALIVE",
    "3": "NOT_ALIVE",
    "30": "NOT_ALIVE",
    "31": "NON_PARTICIPATING",
    "32": "SUCCESS",
    "33": "NOT_ALIVE",
    "34": "NOT_ALIVE",
    "35": "NON_PARTICIPATING",
    "36": "NOT_ALIVE",
    "37": "NOT_ALIVE",
    "38": "NOT_ALIVE",
    "39": "NON_PARTICIPATING",
    "4": "NOT_ALIVE",
    "40": "NON_PARTICIPATING",
    "41": "NON_PARTICIPATING",
    "42": "NON_PARTICIPATING",
    "43": "NOT_ALIVE",
    "44": "NON_PARTICIPATING",
    "45": "NOT_ALIVE",
    "46": "NOT_ALIVE",
    "47": "NOT_ALIVE",
    "48": "NON_PARTICIPATING",
    "49": "NON_PARTICIPATING",
    "5": "SUCCESS",
    "50": "NOT_ALIVE",
    "51": "NOT_ALIVE",
    "52": "NOT_ALIVE",
    "53": "NON_PARTICIPATING",
    "54": "NOT_ALIVE",
    "55": "NOT_ALIVE",
    "56": "NON_PARTICIPATING",
    "57": "NON_PARTICIPATING",
    "58": "NON_PARTICIPATING",
    "59": "NON_PARTICIPATING",
    "6": "NON_PARTICIPATING",
    "60": "NON_PARTICIPATING",
    "61": "NON_PARTICIPATING",
    "62": "NOT_ALIVE",
    "63": "NON_PARTICIPATING",
    "64": "NOT_ALIVE",
    "65": "NON_PARTICIPATING",
    "66": "NOT_ALIVE",
    "67": "NOT_ALIVE",
    "68": "NOT_ALIVE",
    "69": "NOT_ALIVE",
    "7": "NON_PARTICIPATING",
    "70": "NOT_ALIVE",
    "71": "NON_PARTICIPATING",
    "72": "NOT_ALIVE",
    "73": "NOT_ALIVE",
    "74": "NON_PARTICIPATING",
    "75": "NOT_ALIVE",
    "76": "NON_PARTICIPATING",
    "77": "NON_PARTICIPATING",
    "78": "NOT_ALIVE",
    "79": "NOT_ALIVE",
    "8": "NOT_ALIVE",
    "80": "NON_PARTICIPATING",
    "81": "NOT_ALIVE",
    "82": "NON_PARTICIPATING",
    "83": "NOT_ALIVE",
    "84": "NON_PARTICIPATING",
    "85": "NOT_ALIVE",
    "86": "NON_PARTICIPATING",
    "87": "NON_PARTICIPATING",
    "88": "NON_PARTICIPATING",
    "89": "NOT_ALIVE",
    "9": "NOT_ALIVE",
    "90": "NON_PARTICIPATING",
    "91": "NON_PARTICIPATING",
    "92": "NON_PARTICIPATING",
    "93": "NOT_ALIVE",
    "94": "NOT_ALIVE",
    "95": "NOT_ALIVE",
    "96": "NON_PARTICIPATING",
    "97": "NON_PARTICIPATING",
    "98": "NON_PARTICIPATING",
    "99": "NOT_ALIVE"
  },
  "architectures": [
    "LlamaForCausalLM"
  ],
  "attention_bias": false,
  "attention_dropout": 0.0,
  "block_list": [
    5987895,
    5987913
  ],
  "bos_token_id": 1,
  "eos_token_id": 2,
  "hidden_act": "silu",
  "hidden_size": 2048,
  "initializer_range": 0.02,
  "inner_step": 33,
  "intermediate_size": 5632,
  "last_allreduce_block": 5986899,
  "max_position_embeddings": 2048,
  "mlp_bias": false,
  "model_type": "llama",
  "num_attention_heads": 32,
  "num_hidden_layers": 22,
  "num_key_value_heads": 4,
  "pretraining_tp": 1,
  "rms_norm_eps": 1e-05,
  "rope_scaling": null,
  "rope_theta": 10000.0,
  "tie_word_embeddings": false,
  "torch_dtype": "float32",
  "transformers_version": "4.39.3",
  "use_cache": false,
  "vocab_size": 32000
}