File size: 7,630 Bytes
1ede1ce
cc7430d
1ede1ce
 
ce63d64
bd9f740
1ede1ce
191d8c5
637d8b0
92405b9
7a85024
 
 
4bb0b85
97bc2be
 
ea600b4
741c7a3
7a85024
92405b9
97bc2be
191d8c5
7a85024
191d8c5
97bc2be
5259e06
637d8b0
ce63d64
637d8b0
cc7430d
741c7a3
b0bd316
191d8c5
c81bac3
97bc2be
5259e06
98340f7
e03f18d
f4428ba
ce63d64
1ede1ce
97bc2be
92405b9
97bc2be
 
92405b9
c9ba51a
92405b9
e03f18d
92405b9
7a85024
97bc2be
191d8c5
c81bac3
c9ba51a
97bc2be
e03f18d
191d8c5
97bc2be
340e872
92405b9
741c7a3
1ede1ce
27f0692
191d8c5
7a85024
97bc2be
f4428ba
97bc2be
191d8c5
c81bac3
fbb5874
e03f18d
97bc2be
92405b9
5259e06
97bc2be
 
92405b9
97bc2be
741c7a3
62f4f04
5259e06
191d8c5
dc6eda3
637d8b0
97bc2be
7a85024
4bb0b85
1ede1ce
05d5257
92405b9
bd9f740
5259e06
c81bac3
cc7430d
0999059
97bc2be
7a85024
ce63d64
c81bac3
637d8b0
97bc2be
1ede1ce
9c80b38
f4428ba
1ede1ce
637d8b0
741c7a3
97bc2be
191d8c5
92405b9
191d8c5
637d8b0
97bc2be
637d8b0
ce63d64
cf5a3c3
50c0498
b0bd316
 
92405b9
97bc2be
 
1ede1ce
7a85024
637d8b0
cc7430d
97bc2be
7a85024
191d8c5
97bc2be
637d8b0
191d8c5
7a85024
ea600b4
c9ba51a
637d8b0
 
191d8c5
9c80b38
05d5257
ce63d64
1ede1ce
340e872
9c80b38
637d8b0
e03f18d
7a85024
ce63d64
92405b9
50c0498
942b7a0
78acc49
637d8b0
c81bac3
05d5257
97bc2be
c9ba51a
5259e06
97bc2be
98340f7
c9ba51a
637d8b0
191d8c5
70662de
191d8c5
50c0498
78acc49
92405b9
27f0692
1ede1ce
92405b9
741c7a3
92405b9
5259e06
191d8c5
97bc2be
e03f18d
97bc2be
637d8b0
ce63d64
97bc2be
191d8c5
 
97bc2be
1ede1ce
97bc2be
191d8c5
292119e
0999059
741c7a3
191d8c5
637d8b0
191d8c5
ce63d64
 
92405b9
741c7a3
942b7a0
cc7430d
97bc2be
 
78acc49
92405b9
637d8b0
92405b9
97bc2be
 
c9ba51a
e8a1019
78acc49
fbb5874
92405b9
97bc2be
191d8c5
92405b9
7a85024
637d8b0
97bc2be
637d8b0
c9ba51a
bd9f740
4bb0b85
97bc2be
637d8b0
97bc2be
 
7a85024
637d8b0
97bc2be
e03f18d
741c7a3
97bc2be
50c0498
bd9f740
292119e
bd9f740
741c7a3
637d8b0
78acc49
637d8b0
97bc2be
 
 
50c0498
e03f18d
9c80b38
741c7a3
92405b9
c9ba51a
191d8c5
e03f18d
97bc2be
4bb0b85
97bc2be
741c7a3
7a69042
0999059
1ede1ce
 
 
 
 
 
 
1529b58
 
1ede1ce
 
 
 
 
 
1529b58
1ede1ce
97bc2be
1ede1ce
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
{
  "_name_or_path": "distributed/llama-1b",
  "all_reduce_scores": {
    "0": "NOT_ALIVE",
    "1": "NOT_ALIVE",
    "10": "NOT_ALIVE",
    "100": "NOT_ALIVE",
    "101": "NON_PARTICIPATING",
    "102": "NOT_ALIVE",
    "103": "NON_PARTICIPATING",
    "104": "NON_PARTICIPATING",
    "105": "NON_PARTICIPATING",
    "106": "NON_PARTICIPATING",
    "107": "NOT_ALIVE",
    "108": "SUCCESS",
    "109": "NOT_ALIVE",
    "11": "NOT_ALIVE",
    "110": "NON_PARTICIPATING",
    "111": "NON_PARTICIPATING",
    "112": "NON_PARTICIPATING",
    "113": "NOT_ALIVE",
    "114": "NON_PARTICIPATING",
    "115": "NON_PARTICIPATING",
    "116": "NON_PARTICIPATING",
    "117": "NON_PARTICIPATING",
    "118": "NOT_ALIVE",
    "119": "NOT_ALIVE",
    "12": "NON_PARTICIPATING",
    "120": "NOT_ALIVE",
    "121": "NOT_ALIVE",
    "122": "NON_PARTICIPATING",
    "123": "NOT_ALIVE",
    "124": "SUCCESS",
    "125": "NON_PARTICIPATING",
    "126": "NOT_ALIVE",
    "127": "NOT_ALIVE",
    "128": "NOT_ALIVE",
    "129": "NON_PARTICIPATING",
    "13": "NOT_ALIVE",
    "130": "NOT_ALIVE",
    "131": "NOT_ALIVE",
    "132": "NOT_ALIVE",
    "133": "NON_PARTICIPATING",
    "134": "NOT_ALIVE",
    "135": "NON_PARTICIPATING",
    "136": "NON_PARTICIPATING",
    "137": "NON_PARTICIPATING",
    "138": "SUCCESS",
    "139": "NON_PARTICIPATING",
    "14": "SUCCESS",
    "140": "NON_PARTICIPATING",
    "141": "NON_PARTICIPATING",
    "142": "NOT_ALIVE",
    "143": "NON_PARTICIPATING",
    "144": "NOT_ALIVE",
    "145": "NOT_ALIVE",
    "146": "NON_PARTICIPATING",
    "147": "NON_PARTICIPATING",
    "148": "SUCCESS",
    "149": "NON_PARTICIPATING",
    "15": "SUCCESS",
    "150": "NOT_ALIVE",
    "151": "NOT_ALIVE",
    "152": "NOT_ALIVE",
    "153": "SUCCESS",
    "154": "NON_PARTICIPATING",
    "155": "SUCCESS",
    "156": "NOT_ALIVE",
    "157": "NOT_ALIVE",
    "158": "NON_PARTICIPATING",
    "159": "NOT_ALIVE",
    "16": "NON_PARTICIPATING",
    "160": "NON_PARTICIPATING",
    "161": "NON_PARTICIPATING",
    "162": "NOT_ALIVE",
    "163": "NOT_ALIVE",
    "164": "SUCCESS",
    "165": "SUCCESS",
    "166": "NOT_ALIVE",
    "167": "NON_PARTICIPATING",
    "168": "SUCCESS",
    "169": "NOT_ALIVE",
    "17": "NOT_ALIVE",
    "170": "NON_PARTICIPATING",
    "171": "NOT_ALIVE",
    "172": "NOT_ALIVE",
    "173": "SUCCESS",
    "174": "NON_PARTICIPATING",
    "175": "NOT_ALIVE",
    "176": "NOT_ALIVE",
    "177": "NOT_ALIVE",
    "178": "NOT_ALIVE",
    "179": "NOT_ALIVE",
    "18": "NOT_ALIVE",
    "180": "NOT_ALIVE",
    "181": "NOT_ALIVE",
    "182": "NOT_ALIVE",
    "183": "SUCCESS",
    "184": "NON_PARTICIPATING",
    "185": "NOT_ALIVE",
    "186": "NON_PARTICIPATING",
    "187": "NOT_ALIVE",
    "188": "NOT_ALIVE",
    "189": "NOT_ALIVE",
    "19": "NOT_ALIVE",
    "190": "NON_PARTICIPATING",
    "191": "NOT_ALIVE",
    "192": "NOT_ALIVE",
    "193": "NOT_ALIVE",
    "194": "NOT_ALIVE",
    "195": "NOT_ALIVE",
    "196": "NON_PARTICIPATING",
    "197": "SUCCESS",
    "198": "NOT_ALIVE",
    "199": "NON_PARTICIPATING",
    "2": "NOT_ALIVE",
    "20": "NOT_ALIVE",
    "200": "NOT_ALIVE",
    "201": "NON_PARTICIPATING",
    "202": "NOT_ALIVE",
    "203": "NOT_ALIVE",
    "204": "SUCCESS",
    "205": "NOT_ALIVE",
    "206": "NOT_ALIVE",
    "207": "NOT_ALIVE",
    "208": "NON_PARTICIPATING",
    "209": "NOT_ALIVE",
    "21": "NOT_ALIVE",
    "210": "NOT_ALIVE",
    "211": "NON_PARTICIPATING",
    "212": "NON_PARTICIPATING",
    "213": "NON_PARTICIPATING",
    "214": "NON_PARTICIPATING",
    "215": "SUCCESS",
    "216": "NON_PARTICIPATING",
    "217": "NON_PARTICIPATING",
    "218": "NON_PARTICIPATING",
    "219": "NOT_ALIVE",
    "22": "NOT_ALIVE",
    "220": "NON_PARTICIPATING",
    "221": "NOT_ALIVE",
    "222": "NOT_ALIVE",
    "223": "NOT_ALIVE",
    "224": "NOT_ALIVE",
    "225": "NOT_ALIVE",
    "226": "NOT_ALIVE",
    "227": "NON_PARTICIPATING",
    "228": "NON_PARTICIPATING",
    "229": "NON_PARTICIPATING",
    "23": "NON_PARTICIPATING",
    "230": "NON_PARTICIPATING",
    "231": "NOT_ALIVE",
    "232": "NOT_ALIVE",
    "233": "NOT_ALIVE",
    "234": "NOT_ALIVE",
    "235": "NON_PARTICIPATING",
    "236": "NOT_ALIVE",
    "237": "SUCCESS",
    "238": "NON_PARTICIPATING",
    "239": "NOT_ALIVE",
    "24": "NOT_ALIVE",
    "240": "NOT_ALIVE",
    "241": "NON_PARTICIPATING",
    "242": "NOT_ALIVE",
    "243": "NON_PARTICIPATING",
    "244": "NOT_ALIVE",
    "245": "NOT_ALIVE",
    "246": "NON_PARTICIPATING",
    "247": "NON_PARTICIPATING",
    "248": "NON_PARTICIPATING",
    "249": "NOT_ALIVE",
    "25": "SUCCESS",
    "250": "SUCCESS",
    "251": "NON_PARTICIPATING",
    "252": "NON_PARTICIPATING",
    "253": "NOT_ALIVE",
    "254": "SUCCESS",
    "255": "NOT_ALIVE",
    "26": "NON_PARTICIPATING",
    "27": "NOT_ALIVE",
    "28": "NOT_ALIVE",
    "29": "NOT_ALIVE",
    "3": "NOT_ALIVE",
    "30": "NOT_ALIVE",
    "31": "NON_PARTICIPATING",
    "32": "SUCCESS",
    "33": "NOT_ALIVE",
    "34": "NOT_ALIVE",
    "35": "NON_PARTICIPATING",
    "36": "NOT_ALIVE",
    "37": "NOT_ALIVE",
    "38": "NOT_ALIVE",
    "39": "NON_PARTICIPATING",
    "4": "NOT_ALIVE",
    "40": "NON_PARTICIPATING",
    "41": "NON_PARTICIPATING",
    "42": "NON_PARTICIPATING",
    "43": "NOT_ALIVE",
    "44": "NON_PARTICIPATING",
    "45": "NOT_ALIVE",
    "46": "NOT_ALIVE",
    "47": "NOT_ALIVE",
    "48": "NON_PARTICIPATING",
    "49": "NON_PARTICIPATING",
    "5": "SUCCESS",
    "50": "NOT_ALIVE",
    "51": "NOT_ALIVE",
    "52": "NOT_ALIVE",
    "53": "NON_PARTICIPATING",
    "54": "NOT_ALIVE",
    "55": "NOT_ALIVE",
    "56": "NON_PARTICIPATING",
    "57": "NON_PARTICIPATING",
    "58": "NON_PARTICIPATING",
    "59": "NON_PARTICIPATING",
    "6": "NON_PARTICIPATING",
    "60": "NON_PARTICIPATING",
    "61": "NON_PARTICIPATING",
    "62": "NOT_ALIVE",
    "63": "NON_PARTICIPATING",
    "64": "NOT_ALIVE",
    "65": "NON_PARTICIPATING",
    "66": "NOT_ALIVE",
    "67": "NOT_ALIVE",
    "68": "NOT_ALIVE",
    "69": "NOT_ALIVE",
    "7": "NON_PARTICIPATING",
    "70": "NOT_ALIVE",
    "71": "NON_PARTICIPATING",
    "72": "NOT_ALIVE",
    "73": "NOT_ALIVE",
    "74": "NON_PARTICIPATING",
    "75": "NOT_ALIVE",
    "76": "NON_PARTICIPATING",
    "77": "NON_PARTICIPATING",
    "78": "NOT_ALIVE",
    "79": "NOT_ALIVE",
    "8": "NOT_ALIVE",
    "80": "NON_PARTICIPATING",
    "81": "NOT_ALIVE",
    "82": "NON_PARTICIPATING",
    "83": "NOT_ALIVE",
    "84": "NON_PARTICIPATING",
    "85": "NOT_ALIVE",
    "86": "NON_PARTICIPATING",
    "87": "NON_PARTICIPATING",
    "88": "NON_PARTICIPATING",
    "89": "NOT_ALIVE",
    "9": "NOT_ALIVE",
    "90": "NON_PARTICIPATING",
    "91": "NON_PARTICIPATING",
    "92": "NON_PARTICIPATING",
    "93": "NOT_ALIVE",
    "94": "NOT_ALIVE",
    "95": "NOT_ALIVE",
    "96": "NON_PARTICIPATING",
    "97": "NON_PARTICIPATING",
    "98": "NON_PARTICIPATING",
    "99": "NOT_ALIVE"
  },
  "architectures": [
    "LlamaForCausalLM"
  ],
  "attention_bias": false,
  "attention_dropout": 0.0,
  "block_list": [
    5987912,
    5987927
  ],
  "bos_token_id": 1,
  "eos_token_id": 2,
  "hidden_act": "silu",
  "hidden_size": 2048,
  "initializer_range": 0.02,
  "inner_step": 32,
  "intermediate_size": 5632,
  "last_allreduce_block": 5986899,
  "max_position_embeddings": 2048,
  "mlp_bias": false,
  "model_type": "llama",
  "num_attention_heads": 32,
  "num_hidden_layers": 22,
  "num_key_value_heads": 4,
  "pretraining_tp": 1,
  "rms_norm_eps": 1e-05,
  "rope_scaling": null,
  "rope_theta": 10000.0,
  "tie_word_embeddings": false,
  "torch_dtype": "float32",
  "transformers_version": "4.39.3",
  "use_cache": false,
  "vocab_size": 32000
}