File size: 7,740 Bytes
123d411
 
 
 
 
 
960da9c
123d411
960da9c
83dbf07
59c8ab8
f3a1e03
123d411
b8e13f9
123d411
 
 
 
75329c2
f3a1e03
123d411
 
75329c2
123d411
59c8ab8
46aa4fd
f56af95
123d411
12339b6
123d411
46aa4fd
960da9c
3daedce
123d411
 
1ca3a7b
e93603e
47f2c85
123d411
 
 
75329c2
12339b6
 
75329c2
1ca3a7b
b5ffd73
e93603e
1ca3a7b
123d411
46aa4fd
83dbf07
46aa4fd
b8e13f9
1ca3a7b
b8e13f9
960da9c
123d411
1ca3a7b
 
46aa4fd
123d411
1ca3a7b
123d411
59c8ab8
46aa4fd
 
f3a1e03
123d411
b8e13f9
46aa4fd
123d411
12339b6
123d411
1ca3a7b
 
46aa4fd
b8e13f9
1ca3a7b
59c8ab8
1ca3a7b
 
123d411
12339b6
75329c2
83dbf07
960da9c
b8e13f9
83dbf07
123d411
 
75329c2
123d411
 
1ca3a7b
960da9c
1ca3a7b
 
c852898
b8e13f9
46aa4fd
b8e13f9
1ca3a7b
c852898
123d411
83dbf07
1ca3a7b
 
46aa4fd
123d411
 
 
b8e13f9
f3a1e03
123d411
e93603e
123d411
e93603e
75329c2
12339b6
b8e13f9
c852898
1ca3a7b
83dbf07
123d411
 
960da9c
123d411
b8e13f9
3daedce
 
83dbf07
75329c2
960da9c
9e17942
46aa4fd
12339b6
46aa4fd
123d411
f56af95
123d411
 
12339b6
b5ffd73
46aa4fd
1ca3a7b
123d411
960da9c
123d411
 
1ca3a7b
123d411
 
b8e13f9
2b471cc
123d411
960da9c
1ca3a7b
12339b6
b5ffd73
123d411
 
3daedce
46aa4fd
123d411
75329c2
123d411
1ca3a7b
f3a1e03
123d411
 
 
1ca3a7b
123d411
12339b6
46aa4fd
1ca3a7b
46aa4fd
47f2c85
3daedce
46aa4fd
 
b8e13f9
123d411
59c8ab8
12339b6
83dbf07
b5ffd73
9e17942
1ca3a7b
75329c2
123d411
 
 
59c8ab8
960da9c
46aa4fd
9e17942
1ca3a7b
75329c2
59c8ab8
123d411
47f2c85
1ca3a7b
123d411
 
 
59c8ab8
12339b6
123d411
1ca3a7b
c852898
123d411
 
1ca3a7b
123d411
9e17942
123d411
 
12339b6
f3a1e03
b8e13f9
f3a1e03
123d411
 
e93603e
123d411
12339b6
960da9c
123d411
59c8ab8
960da9c
47f2c85
b8e13f9
46aa4fd
1ca3a7b
123d411
 
 
1ca3a7b
83dbf07
46aa4fd
2b471cc
123d411
1ca3a7b
123d411
 
 
 
 
 
b8e13f9
12339b6
1ca3a7b
e93603e
1ca3a7b
123d411
960da9c
46aa4fd
123d411
 
 
 
 
 
 
0116e60
 
123d411
 
 
 
 
 
0116e60
123d411
1ca3a7b
123d411
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
{
  "_name_or_path": "distributed/llama-1b",
  "all_reduce_scores": {
    "0": "NOT_ALIVE",
    "1": "NOT_ALIVE",
    "10": "NOT_ALIVE",
    "100": "NON_PARTICIPATING",
    "101": "NOT_ALIVE",
    "102": "NON_PARTICIPATING",
    "103": "NON_PARTICIPATING",
    "104": "NOT_ALIVE",
    "105": "NON_PARTICIPATING",
    "106": "NOT_ALIVE",
    "107": "NOT_ALIVE",
    "108": "NON_PARTICIPATING",
    "109": "NOT_ALIVE",
    "11": "NOT_ALIVE",
    "110": "NOT_ALIVE",
    "111": "NON_PARTICIPATING",
    "112": "NON_PARTICIPATING",
    "113": "NOT_ALIVE",
    "114": "NOT_ALIVE",
    "115": "NON_PARTICIPATING",
    "116": "NOT_ALIVE",
    "117": "NOT_ALIVE",
    "118": "NON_PARTICIPATING",
    "119": "NON_PARTICIPATING",
    "12": "NOT_ALIVE",
    "120": "NOT_ALIVE",
    "121": "NOT_ALIVE",
    "122": "NON_PARTICIPATING",
    "123": "NON_PARTICIPATING",
    "124": "NON_PARTICIPATING",
    "125": "NOT_ALIVE",
    "126": "NOT_ALIVE",
    "127": "NOT_ALIVE",
    "128": "NON_PARTICIPATING",
    "129": "NOT_ALIVE",
    "13": "NOT_ALIVE",
    "130": "NOT_ALIVE",
    "131": "NOT_ALIVE",
    "132": "NOT_ALIVE",
    "133": "NON_PARTICIPATING",
    "134": "NOT_ALIVE",
    "135": "NON_PARTICIPATING",
    "136": "NON_PARTICIPATING",
    "137": "NON_PARTICIPATING",
    "138": "NON_PARTICIPATING",
    "139": "SUCCESS",
    "14": "NOT_ALIVE",
    "140": "NON_PARTICIPATING",
    "141": "NON_PARTICIPATING",
    "142": "NON_PARTICIPATING",
    "143": "NOT_ALIVE",
    "144": "NOT_ALIVE",
    "145": "NOT_ALIVE",
    "146": "NON_PARTICIPATING",
    "147": "NOT_ALIVE",
    "148": "SUCCESS",
    "149": "NON_PARTICIPATING",
    "15": "SUCCESS",
    "150": "NOT_ALIVE",
    "151": "NOT_ALIVE",
    "152": "NOT_ALIVE",
    "153": "NOT_ALIVE",
    "154": "NON_PARTICIPATING",
    "155": "NON_PARTICIPATING",
    "156": "NOT_ALIVE",
    "157": "NOT_ALIVE",
    "158": "NON_PARTICIPATING",
    "159": "NON_PARTICIPATING",
    "16": "NOT_ALIVE",
    "160": "NON_PARTICIPATING",
    "161": "NON_PARTICIPATING",
    "162": "NOT_ALIVE",
    "163": "NON_PARTICIPATING",
    "164": "NON_PARTICIPATING",
    "165": "NON_PARTICIPATING",
    "166": "NON_PARTICIPATING",
    "167": "NOT_ALIVE",
    "168": "NOT_ALIVE",
    "169": "NOT_ALIVE",
    "17": "NOT_ALIVE",
    "170": "NON_PARTICIPATING",
    "171": "NON_PARTICIPATING",
    "172": "NOT_ALIVE",
    "173": "NON_PARTICIPATING",
    "174": "NON_PARTICIPATING",
    "175": "NON_PARTICIPATING",
    "176": "NOT_ALIVE",
    "177": "NOT_ALIVE",
    "178": "NON_PARTICIPATING",
    "179": "NON_PARTICIPATING",
    "18": "NOT_ALIVE",
    "180": "NON_PARTICIPATING",
    "181": "NOT_ALIVE",
    "182": "NOT_ALIVE",
    "183": "NON_PARTICIPATING",
    "184": "NON_PARTICIPATING",
    "185": "NON_PARTICIPATING",
    "186": "NON_PARTICIPATING",
    "187": "NOT_ALIVE",
    "188": "NOT_ALIVE",
    "189": "NON_PARTICIPATING",
    "19": "NOT_ALIVE",
    "190": "NOT_ALIVE",
    "191": "NON_PARTICIPATING",
    "192": "NOT_ALIVE",
    "193": "SUCCESS",
    "194": "NON_PARTICIPATING",
    "195": "NON_PARTICIPATING",
    "196": "NOT_ALIVE",
    "197": "NOT_ALIVE",
    "198": "NON_PARTICIPATING",
    "199": "NOT_ALIVE",
    "2": "NOT_ALIVE",
    "20": "NOT_ALIVE",
    "200": "NON_PARTICIPATING",
    "201": "NOT_ALIVE",
    "202": "NOT_ALIVE",
    "203": "NON_PARTICIPATING",
    "204": "NON_PARTICIPATING",
    "205": "NON_PARTICIPATING",
    "206": "NON_PARTICIPATING",
    "207": "NOT_ALIVE",
    "208": "NOT_ALIVE",
    "209": "NON_PARTICIPATING",
    "21": "NOT_ALIVE",
    "210": "NOT_ALIVE",
    "211": "NON_PARTICIPATING",
    "212": "NOT_ALIVE",
    "213": "NOT_ALIVE",
    "214": "NON_PARTICIPATING",
    "215": "NON_PARTICIPATING",
    "216": "NON_PARTICIPATING",
    "217": "NON_PARTICIPATING",
    "218": "NON_PARTICIPATING",
    "219": "NON_PARTICIPATING",
    "22": "NOT_ALIVE",
    "220": "NOT_ALIVE",
    "221": "NOT_ALIVE",
    "222": "NOT_ALIVE",
    "223": "NOT_ALIVE",
    "224": "NON_PARTICIPATING",
    "225": "NON_PARTICIPATING",
    "226": "NON_PARTICIPATING",
    "227": "NOT_ALIVE",
    "228": "NON_PARTICIPATING",
    "229": "NOT_ALIVE",
    "23": "NOT_ALIVE",
    "230": "NOT_ALIVE",
    "231": "NOT_ALIVE",
    "232": "NOT_ALIVE",
    "233": "NOT_ALIVE",
    "234": "NON_PARTICIPATING",
    "235": "NOT_ALIVE",
    "236": "NON_PARTICIPATING",
    "237": "NOT_ALIVE",
    "238": "NOT_ALIVE",
    "239": "NON_PARTICIPATING",
    "24": "NOT_ALIVE",
    "240": "NOT_ALIVE",
    "241": "NON_PARTICIPATING",
    "242": "NON_PARTICIPATING",
    "243": "NOT_ALIVE",
    "244": "NON_PARTICIPATING",
    "245": "NOT_ALIVE",
    "246": "NON_PARTICIPATING",
    "247": "NON_PARTICIPATING",
    "248": "NOT_ALIVE",
    "249": "NOT_ALIVE",
    "25": "SUCCESS",
    "250": "NOT_ALIVE",
    "251": "NOT_ALIVE",
    "252": "NOT_ALIVE",
    "253": "NOT_ALIVE",
    "254": "NOT_ALIVE",
    "255": "NOT_ALIVE",
    "26": "NON_PARTICIPATING",
    "27": "NON_PARTICIPATING",
    "28": "NON_PARTICIPATING",
    "29": "NOT_ALIVE",
    "3": "NOT_ALIVE",
    "30": "NOT_ALIVE",
    "31": "NOT_ALIVE",
    "32": "NOT_ALIVE",
    "33": "NON_PARTICIPATING",
    "34": "NON_PARTICIPATING",
    "35": "NON_PARTICIPATING",
    "36": "NON_PARTICIPATING",
    "37": "NON_PARTICIPATING",
    "38": "NOT_ALIVE",
    "39": "NOT_ALIVE",
    "4": "NOT_ALIVE",
    "40": "NON_PARTICIPATING",
    "41": "NON_PARTICIPATING",
    "42": "NOT_ALIVE",
    "43": "NON_PARTICIPATING",
    "44": "SUCCESS",
    "45": "NON_PARTICIPATING",
    "46": "NON_PARTICIPATING",
    "47": "NOT_ALIVE",
    "48": "NON_PARTICIPATING",
    "49": "NOT_ALIVE",
    "5": "NOT_ALIVE",
    "50": "NOT_ALIVE",
    "51": "NOT_ALIVE",
    "52": "NOT_ALIVE",
    "53": "NOT_ALIVE",
    "54": "NOT_ALIVE",
    "55": "NON_PARTICIPATING",
    "56": "NON_PARTICIPATING",
    "57": "NON_PARTICIPATING",
    "58": "NOT_ALIVE",
    "59": "NON_PARTICIPATING",
    "6": "NOT_ALIVE",
    "60": "NON_PARTICIPATING",
    "61": "NOT_ALIVE",
    "62": "NOT_ALIVE",
    "63": "NOT_ALIVE",
    "64": "NON_PARTICIPATING",
    "65": "NON_PARTICIPATING",
    "66": "NOT_ALIVE",
    "67": "NOT_ALIVE",
    "68": "NOT_ALIVE",
    "69": "NON_PARTICIPATING",
    "7": "NOT_ALIVE",
    "70": "NOT_ALIVE",
    "71": "NON_PARTICIPATING",
    "72": "NOT_ALIVE",
    "73": "NOT_ALIVE",
    "74": "NOT_ALIVE",
    "75": "NON_PARTICIPATING",
    "76": "NOT_ALIVE",
    "77": "NON_PARTICIPATING",
    "78": "SUCCESS",
    "79": "NOT_ALIVE",
    "8": "NOT_ALIVE",
    "80": "NOT_ALIVE",
    "81": "NON_PARTICIPATING",
    "82": "NON_PARTICIPATING",
    "83": "NON_PARTICIPATING",
    "84": "NON_PARTICIPATING",
    "85": "NOT_ALIVE",
    "86": "NON_PARTICIPATING",
    "87": "NOT_ALIVE",
    "88": "NOT_ALIVE",
    "89": "NOT_ALIVE",
    "9": "NOT_ALIVE",
    "90": "NOT_ALIVE",
    "91": "NOT_ALIVE",
    "92": "NON_PARTICIPATING",
    "93": "NOT_ALIVE",
    "94": "NON_PARTICIPATING",
    "95": "NON_PARTICIPATING",
    "96": "NOT_ALIVE",
    "97": "NOT_ALIVE",
    "98": "NON_PARTICIPATING",
    "99": "NON_PARTICIPATING"
  },
  "architectures": [
    "LlamaForCausalLM"
  ],
  "attention_bias": false,
  "attention_dropout": 0.0,
  "block_list": [
    6187943,
    6187957
  ],
  "bos_token_id": 1,
  "eos_token_id": 2,
  "hidden_act": "silu",
  "hidden_size": 2048,
  "initializer_range": 0.02,
  "inner_step": 62,
  "intermediate_size": 5632,
  "last_allreduce_block": 6187448,
  "max_position_embeddings": 2048,
  "mlp_bias": false,
  "model_type": "llama",
  "num_attention_heads": 32,
  "num_hidden_layers": 22,
  "num_key_value_heads": 4,
  "pretraining_tp": 1,
  "rms_norm_eps": 1e-05,
  "rope_scaling": null,
  "rope_theta": 10000.0,
  "tie_word_embeddings": false,
  "torch_dtype": "float32",
  "transformers_version": "4.39.3",
  "use_cache": false,
  "vocab_size": 32000
}