File size: 7,752 Bytes
db00f12
80927c4
db00f12
 
dd0efef
9a6205e
db00f12
b7c6e22
3ef4e25
3aee6ce
3ef4e25
dd0efef
0628655
fa1eaa2
0628655
dd0efef
1822881
80927c4
3aee6ce
0628655
 
 
 
 
 
 
3bee20e
3ef4e25
b7c6e22
4f47bf6
dd0efef
 
4f47bf6
82f802a
0628655
 
a740b48
dd0efef
9a6205e
82f802a
db00f12
b7c6e22
0628655
3bee20e
 
20142c7
0628655
82f802a
0628655
 
 
 
 
dd0efef
b9db4b6
82f802a
3ef4e25
dd0efef
82f802a
dd0efef
0628655
80927c4
db00f12
3aee6ce
b7c6e22
82f802a
0628655
 
c44cd13
3ef4e25
efe562e
80927c4
20142c7
0628655
b7c6e22
ad6f2b3
0628655
 
3aee6ce
0628655
20142c7
cab2dfa
ad6f2b3
4f47bf6
db00f12
0628655
4f47bf6
dd0efef
fa1eaa2
db00f12
20142c7
76b8612
9a6205e
3aee6ce
efe562e
b1d6f62
db00f12
b7c6e22
b9db4b6
bdd89fe
3ef4e25
dd0efef
 
db00f12
82f802a
0628655
3bee20e
3aee6ce
0628655
4f47bf6
0628655
 
 
 
3aee6ce
20142c7
82f802a
5f2e2ba
b7c6e22
4f47bf6
ad6f2b3
0628655
dd0efef
82f802a
db00f12
dd0efef
4f47bf6
b1d6f62
0628655
82f802a
b7c6e22
3aee6ce
20142c7
82f802a
3ef4e25
0628655
 
283d334
3bee20e
3aee6ce
0628655
 
bdd89fe
db00f12
b7c6e22
db00f12
3ef4e25
3aee6ce
4f47bf6
bdd89fe
0628655
 
c67bb45
2923822
283d334
0628655
 
82f802a
 
 
c44cd13
3bee20e
82f802a
 
0628655
80268a4
dd0efef
4f47bf6
b9db4b6
4f47bf6
82f802a
20142c7
82f802a
80927c4
b7c6e22
ad6f2b3
0628655
c44cd13
3aee6ce
c44cd13
283d334
979bb0d
3bee20e
0628655
b7c6e22
0628655
db00f12
c44cd13
0628655
dd0efef
db00f12
0628655
 
 
b7c6e22
82f802a
cf9b5a8
76b8612
3aee6ce
 
b1d6f62
82f802a
 
0628655
 
 
3aee6ce
b7c6e22
dd0efef
13df1dc
ad6f2b3
20142c7
0628655
b7c6e22
 
a740b48
7889763
dd0efef
3bee20e
82f802a
283d334
4f47bf6
20142c7
fa1eaa2
c44cd13
283d334
0628655
c44cd13
3aee6ce
dd0efef
0628655
b9db4b6
b7c6e22
a740b48
0628655
 
a740b48
9a6205e
20142c7
dd0efef
2923822
20142c7
dd0efef
82f802a
b7c6e22
 
0628655
db00f12
dd0efef
7889763
0628655
 
6ba22e1
0628655
fa1eaa2
0628655
dd0efef
b2382c7
db00f12
 
 
 
 
 
 
 
216ba55
 
db00f12
 
 
 
 
 
216ba55
db00f12
0628655
db00f12
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
{
  "_name_or_path": "distributed/llama-1b",
  "all_reduce_scores": {
    "0": "NOT_ALIVE",
    "1": "NON_PARTICIPATING",
    "10": "NOT_ALIVE",
    "100": "NOT_ALIVE",
    "101": "NOT_ALIVE",
    "102": "NON_PARTICIPATING",
    "103": "NON_PARTICIPATING",
    "104": "NOT_ALIVE",
    "105": "NON_PARTICIPATING",
    "106": "NON_PARTICIPATING",
    "107": "NOT_ALIVE",
    "108": "SUCCESS",
    "109": "NON_PARTICIPATING",
    "11": "NOT_ALIVE",
    "110": "NOT_ALIVE",
    "111": "NON_PARTICIPATING",
    "112": "SUCCESS",
    "113": "NON_PARTICIPATING",
    "114": "NOT_ALIVE",
    "115": "NON_PARTICIPATING",
    "116": "NOT_ALIVE",
    "117": "NOT_ALIVE",
    "118": "NOT_ALIVE",
    "119": "NON_PARTICIPATING",
    "12": "NOT_ALIVE",
    "120": "NON_PARTICIPATING",
    "121": "NON_PARTICIPATING",
    "122": "NON_PARTICIPATING",
    "123": "NON_PARTICIPATING",
    "124": "NON_PARTICIPATING",
    "125": "NON_PARTICIPATING",
    "126": "NOT_ALIVE",
    "127": "NOT_ALIVE",
    "128": "NON_PARTICIPATING",
    "129": "NON_PARTICIPATING",
    "13": "NOT_ALIVE",
    "130": "NON_PARTICIPATING",
    "131": "NOT_ALIVE",
    "132": "NON_PARTICIPATING",
    "133": "NON_PARTICIPATING",
    "134": "NON_PARTICIPATING",
    "135": "NON_PARTICIPATING",
    "136": "NON_PARTICIPATING",
    "137": "NOT_ALIVE",
    "138": "NON_PARTICIPATING",
    "139": "NOT_ALIVE",
    "14": "SUCCESS",
    "140": "NON_PARTICIPATING",
    "141": "NOT_ALIVE",
    "142": "NOT_ALIVE",
    "143": "NON_PARTICIPATING",
    "144": "NOT_ALIVE",
    "145": "NON_PARTICIPATING",
    "146": "NOT_ALIVE",
    "147": "NON_PARTICIPATING",
    "148": "NOT_ALIVE",
    "149": "NON_PARTICIPATING",
    "15": "NON_PARTICIPATING",
    "150": "NOT_ALIVE",
    "151": "NOT_ALIVE",
    "152": "NON_PARTICIPATING",
    "153": "NOT_ALIVE",
    "154": "NON_PARTICIPATING",
    "155": "NON_PARTICIPATING",
    "156": "NOT_ALIVE",
    "157": "NOT_ALIVE",
    "158": "NOT_ALIVE",
    "159": "NOT_ALIVE",
    "16": "NON_PARTICIPATING",
    "160": "NON_PARTICIPATING",
    "161": "NOT_ALIVE",
    "162": "NON_PARTICIPATING",
    "163": "NOT_ALIVE",
    "164": "NOT_ALIVE",
    "165": "NOT_ALIVE",
    "166": "NON_PARTICIPATING",
    "167": "NOT_ALIVE",
    "168": "NON_PARTICIPATING",
    "169": "NOT_ALIVE",
    "17": "NOT_ALIVE",
    "170": "NOT_ALIVE",
    "171": "NOT_ALIVE",
    "172": "NON_PARTICIPATING",
    "173": "NON_PARTICIPATING",
    "174": "NON_PARTICIPATING",
    "175": "NOT_ALIVE",
    "176": "NOT_ALIVE",
    "177": "NOT_ALIVE",
    "178": "NOT_ALIVE",
    "179": "NOT_ALIVE",
    "18": "NON_PARTICIPATING",
    "180": "NOT_ALIVE",
    "181": "NOT_ALIVE",
    "182": "NOT_ALIVE",
    "183": "SUCCESS",
    "184": "NON_PARTICIPATING",
    "185": "NOT_ALIVE",
    "186": "NOT_ALIVE",
    "187": "NON_PARTICIPATING",
    "188": "NON_PARTICIPATING",
    "189": "NOT_ALIVE",
    "19": "NON_PARTICIPATING",
    "190": "NON_PARTICIPATING",
    "191": "NON_PARTICIPATING",
    "192": "NON_PARTICIPATING",
    "193": "NOT_ALIVE",
    "194": "NON_PARTICIPATING",
    "195": "NOT_ALIVE",
    "196": "NON_PARTICIPATING",
    "197": "NOT_ALIVE",
    "198": "NOT_ALIVE",
    "199": "NON_PARTICIPATING",
    "2": "NON_PARTICIPATING",
    "20": "NOT_ALIVE",
    "200": "NOT_ALIVE",
    "201": "NOT_ALIVE",
    "202": "NON_PARTICIPATING",
    "203": "NOT_ALIVE",
    "204": "NOT_ALIVE",
    "205": "NON_PARTICIPATING",
    "206": "NON_PARTICIPATING",
    "207": "NOT_ALIVE",
    "208": "NON_PARTICIPATING",
    "209": "NOT_ALIVE",
    "21": "NOT_ALIVE",
    "210": "NON_PARTICIPATING",
    "211": "NON_PARTICIPATING",
    "212": "SUCCESS",
    "213": "NON_PARTICIPATING",
    "214": "NON_PARTICIPATING",
    "215": "SUCCESS",
    "216": "NOT_ALIVE",
    "217": "NOT_ALIVE",
    "218": "NOT_ALIVE",
    "219": "NOT_ALIVE",
    "22": "NON_PARTICIPATING",
    "220": "NON_PARTICIPATING",
    "221": "NOT_ALIVE",
    "222": "NOT_ALIVE",
    "223": "NOT_ALIVE",
    "224": "NOT_ALIVE",
    "225": "NON_PARTICIPATING",
    "226": "NOT_ALIVE",
    "227": "NOT_ALIVE",
    "228": "NOT_ALIVE",
    "229": "NON_PARTICIPATING",
    "23": "NON_PARTICIPATING",
    "230": "NON_PARTICIPATING",
    "231": "SUCCESS",
    "232": "NOT_ALIVE",
    "233": "NOT_ALIVE",
    "234": "NOT_ALIVE",
    "235": "NON_PARTICIPATING",
    "236": "NOT_ALIVE",
    "237": "NON_PARTICIPATING",
    "238": "NON_PARTICIPATING",
    "239": "NOT_ALIVE",
    "24": "NOT_ALIVE",
    "240": "NON_PARTICIPATING",
    "241": "SUCCESS",
    "242": "NON_PARTICIPATING",
    "243": "NON_PARTICIPATING",
    "244": "NOT_ALIVE",
    "245": "NON_PARTICIPATING",
    "246": "NOT_ALIVE",
    "247": "NON_PARTICIPATING",
    "248": "NON_PARTICIPATING",
    "249": "NON_PARTICIPATING",
    "25": "SUCCESS",
    "250": "SUCCESS",
    "251": "NOT_ALIVE",
    "252": "NOT_ALIVE",
    "253": "NOT_ALIVE",
    "254": "NON_PARTICIPATING",
    "255": "NOT_ALIVE",
    "26": "NON_PARTICIPATING",
    "27": "NOT_ALIVE",
    "28": "NOT_ALIVE",
    "29": "NON_PARTICIPATING",
    "3": "NON_PARTICIPATING",
    "30": "NOT_ALIVE",
    "31": "NON_PARTICIPATING",
    "32": "NON_PARTICIPATING",
    "33": "NOT_ALIVE",
    "34": "NOT_ALIVE",
    "35": "NON_PARTICIPATING",
    "36": "NON_PARTICIPATING",
    "37": "NOT_ALIVE",
    "38": "NON_PARTICIPATING",
    "39": "SUCCESS",
    "4": "NOT_ALIVE",
    "40": "NON_PARTICIPATING",
    "41": "NON_PARTICIPATING",
    "42": "NOT_ALIVE",
    "43": "NOT_ALIVE",
    "44": "NOT_ALIVE",
    "45": "NOT_ALIVE",
    "46": "NOT_ALIVE",
    "47": "SUCCESS",
    "48": "NON_PARTICIPATING",
    "49": "NON_PARTICIPATING",
    "5": "NON_PARTICIPATING",
    "50": "NOT_ALIVE",
    "51": "NOT_ALIVE",
    "52": "SUCCESS",
    "53": "NON_PARTICIPATING",
    "54": "NOT_ALIVE",
    "55": "NOT_ALIVE",
    "56": "NON_PARTICIPATING",
    "57": "NOT_ALIVE",
    "58": "NON_PARTICIPATING",
    "59": "NON_PARTICIPATING",
    "6": "NON_PARTICIPATING",
    "60": "NOT_ALIVE",
    "61": "NON_PARTICIPATING",
    "62": "NON_PARTICIPATING",
    "63": "SUCCESS",
    "64": "NOT_ALIVE",
    "65": "NON_PARTICIPATING",
    "66": "NON_PARTICIPATING",
    "67": "NOT_ALIVE",
    "68": "NOT_ALIVE",
    "69": "NOT_ALIVE",
    "7": "NOT_ALIVE",
    "70": "NOT_ALIVE",
    "71": "NON_PARTICIPATING",
    "72": "NON_PARTICIPATING",
    "73": "NOT_ALIVE",
    "74": "NOT_ALIVE",
    "75": "NON_PARTICIPATING",
    "76": "NOT_ALIVE",
    "77": "SUCCESS",
    "78": "NON_PARTICIPATING",
    "79": "NON_PARTICIPATING",
    "8": "NOT_ALIVE",
    "80": "NOT_ALIVE",
    "81": "NON_PARTICIPATING",
    "82": "NON_PARTICIPATING",
    "83": "NON_PARTICIPATING",
    "84": "NON_PARTICIPATING",
    "85": "NON_PARTICIPATING",
    "86": "NON_PARTICIPATING",
    "87": "NOT_ALIVE",
    "88": "NON_PARTICIPATING",
    "89": "NOT_ALIVE",
    "9": "NON_PARTICIPATING",
    "90": "NOT_ALIVE",
    "91": "NOT_ALIVE",
    "92": "SUCCESS",
    "93": "NOT_ALIVE",
    "94": "SUCCESS",
    "95": "NOT_ALIVE",
    "96": "NOT_ALIVE",
    "97": "NON_PARTICIPATING",
    "98": "NOT_ALIVE",
    "99": "NOT_ALIVE"
  },
  "architectures": [
    "LlamaForCausalLM"
  ],
  "attention_bias": false,
  "attention_dropout": 0.0,
  "block_list": [
    6018942,
    6018987
  ],
  "bos_token_id": 1,
  "eos_token_id": 2,
  "hidden_act": "silu",
  "hidden_size": 2048,
  "initializer_range": 0.02,
  "inner_step": 37,
  "intermediate_size": 5632,
  "last_allreduce_block": 6016469,
  "max_position_embeddings": 2048,
  "mlp_bias": false,
  "model_type": "llama",
  "num_attention_heads": 32,
  "num_hidden_layers": 22,
  "num_key_value_heads": 4,
  "pretraining_tp": 1,
  "rms_norm_eps": 1e-05,
  "rope_scaling": null,
  "rope_theta": 10000.0,
  "tie_word_embeddings": false,
  "torch_dtype": "float32",
  "transformers_version": "4.39.3",
  "use_cache": false,
  "vocab_size": 32000
}