File size: 7,726 Bytes
dc3fa3f
a025a3f
dc3fa3f
 
bce0141
091164b
dc3fa3f
bce0141
a025a3f
9675b90
a025a3f
1a8edc8
 
a463b49
5b77cb9
ce9a498
faea71c
bce0141
1a8edc8
5b77cb9
 
17f0fb3
 
5b77cb9
ce9a498
135dd72
ce9a498
a025a3f
bce0141
a025a3f
bce0141
17f0fb3
ce9a498
5b77cb9
ce9a498
135dd72
5614586
bce0141
7a1ad5d
bce0141
dc3fa3f
53d7f65
ce9a498
a025a3f
ce9a498
 
4e2b353
bce0141
5b77cb9
 
 
ce9a498
2ba5dea
bce0141
17f0fb3
5b77cb9
a025a3f
2ba5dea
ce9a498
5b77cb9
 
ce9a498
dc3fa3f
5c281b3
ce9a498
 
bce0141
7a1ad5d
53d7f65
a025a3f
63c7bc6
5b77cb9
bce0141
17f0fb3
 
135dd72
5b77cb9
 
 
772348a
5b77cb9
07c5549
135dd72
bce0141
dc3fa3f
bce0141
 
986fb10
a463b49
dc3fa3f
14599da
9675b90
091164b
135dd72
63c7bc6
04c6d68
8d0d88f
5b77cb9
17f0fb3
b74872e
a025a3f
bce0141
a025a3f
dc3fa3f
296af97
17f0fb3
5b77cb9
bce0141
6192736
5b77cb9
bce0141
 
ce9a498
772348a
5b77cb9
bce0141
b74872e
7f8babf
5b77cb9
5d075b6
 
ce9a498
772348a
ce9a498
dc3fa3f
5b77cb9
86bd951
04c6d68
bce0141
772348a
5b77cb9
ce9a498
bce0141
5b77cb9
a025a3f
5b77cb9
bce0141
86bd951
 
bce0141
ce9a498
14599da
b74872e
dc3fa3f
9622d75
dc3fa3f
a025a3f
7a2d54f
5b77cb9
b74872e
9675b90
a075f19
3e61e1f
0cd3953
86bd951
63c7bc6
14599da
ce9a498
 
135dd72
53d7f65
5614586
bce0141
ce9a498
bce0141
ea40209
a025a3f
a075f19
17f0fb3
bce0141
ce9a498
17f0fb3
5b77cb9
 
772348a
135dd72
5b77cb9
53d7f65
7a2d54f
53d7f65
86bd951
5b77cb9
 
ce9a498
 
5b77cb9
dc3fa3f
53d7f65
ce9a498
bce0141
8d0d88f
5b77cb9
 
bce0141
ce9a498
bce0141
986fb10
9675b90
6192736
3e61e1f
04c6d68
5b77cb9
ce9a498
772348a
5b77cb9
86bd951
9675b90
5b77cb9
53d7f65
4e2b353
c6b228b
bce0141
d063ae3
ce9a498
17f0fb3
bce0141
 
 
a025a3f
ce9a498
86bd951
4e2b353
091164b
a463b49
53d7f65
86bd951
986fb10
53d7f65
bce0141
986fb10
5b77cb9
17f0fb3
5b77cb9
17f0fb3
5b77cb9
091164b
94fb6ac
091164b
5b77cb9
 
0cd3953
ce9a498
bce0141
2ba5dea
ce9a498
5b77cb9
 
a1ce0dd
bce0141
 
2ba5dea
5b77cb9
7a2d54f
5b77cb9
a463b49
53d7f65
5b77cb9
772348a
8d0d88f
dc3fa3f
 
 
 
 
 
 
611fae0
 
dc3fa3f
 
 
 
 
 
611fae0
dc3fa3f
5b77cb9
dc3fa3f
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
{
  "_name_or_path": "distributed/llama-1b",
  "all_reduce_scores": {
    "0": "NOT_ALIVE",
    "1": "NON_PARTICIPATING",
    "10": "NOT_ALIVE",
    "100": "NOT_ALIVE",
    "101": "NON_PARTICIPATING",
    "102": "NON_PARTICIPATING",
    "103": "NON_PARTICIPATING",
    "104": "NOT_ALIVE",
    "105": "NON_PARTICIPATING",
    "106": "NON_PARTICIPATING",
    "107": "NOT_ALIVE",
    "108": "SUCCESS",
    "109": "NON_PARTICIPATING",
    "11": "NOT_ALIVE",
    "110": "NON_PARTICIPATING",
    "111": "NON_PARTICIPATING",
    "112": "NON_PARTICIPATING",
    "113": "SUCCESS",
    "114": "NON_PARTICIPATING",
    "115": "NON_PARTICIPATING",
    "116": "NOT_ALIVE",
    "117": "SUCCESS",
    "118": "NOT_ALIVE",
    "119": "NON_PARTICIPATING",
    "12": "NOT_ALIVE",
    "120": "NON_PARTICIPATING",
    "121": "NON_PARTICIPATING",
    "122": "NON_PARTICIPATING",
    "123": "NON_PARTICIPATING",
    "124": "SUCCESS",
    "125": "NOT_ALIVE",
    "126": "SUCCESS",
    "127": "NOT_ALIVE",
    "128": "NOT_ALIVE",
    "129": "NON_PARTICIPATING",
    "13": "NOT_ALIVE",
    "130": "NON_PARTICIPATING",
    "131": "NOT_ALIVE",
    "132": "NOT_ALIVE",
    "133": "NON_PARTICIPATING",
    "134": "NON_PARTICIPATING",
    "135": "NON_PARTICIPATING",
    "136": "NON_PARTICIPATING",
    "137": "NON_PARTICIPATING",
    "138": "NON_PARTICIPATING",
    "139": "NOT_ALIVE",
    "14": "SUCCESS",
    "140": "NOT_ALIVE",
    "141": "NON_PARTICIPATING",
    "142": "NON_PARTICIPATING",
    "143": "NON_PARTICIPATING",
    "144": "NOT_ALIVE",
    "145": "NON_PARTICIPATING",
    "146": "NOT_ALIVE",
    "147": "NON_PARTICIPATING",
    "148": "SUCCESS",
    "149": "NOT_ALIVE",
    "15": "NOT_ALIVE",
    "150": "NOT_ALIVE",
    "151": "NOT_ALIVE",
    "152": "NOT_ALIVE",
    "153": "SUCCESS",
    "154": "SUCCESS",
    "155": "SUCCESS",
    "156": "NOT_ALIVE",
    "157": "NOT_ALIVE",
    "158": "NOT_ALIVE",
    "159": "NOT_ALIVE",
    "16": "NON_PARTICIPATING",
    "160": "NON_PARTICIPATING",
    "161": "NOT_ALIVE",
    "162": "NON_PARTICIPATING",
    "163": "NOT_ALIVE",
    "164": "SUCCESS",
    "165": "SUCCESS",
    "166": "NOT_ALIVE",
    "167": "NON_PARTICIPATING",
    "168": "NON_PARTICIPATING",
    "169": "NOT_ALIVE",
    "17": "NOT_ALIVE",
    "170": "NOT_ALIVE",
    "171": "NOT_ALIVE",
    "172": "NON_PARTICIPATING",
    "173": "NON_PARTICIPATING",
    "174": "NON_PARTICIPATING",
    "175": "NOT_ALIVE",
    "176": "NOT_ALIVE",
    "177": "NOT_ALIVE",
    "178": "NOT_ALIVE",
    "179": "NOT_ALIVE",
    "18": "NOT_ALIVE",
    "180": "NOT_ALIVE",
    "181": "NOT_ALIVE",
    "182": "NOT_ALIVE",
    "183": "NON_PARTICIPATING",
    "184": "NON_PARTICIPATING",
    "185": "NOT_ALIVE",
    "186": "NOT_ALIVE",
    "187": "NON_PARTICIPATING",
    "188": "NON_PARTICIPATING",
    "189": "NOT_ALIVE",
    "19": "NOT_ALIVE",
    "190": "NON_PARTICIPATING",
    "191": "NOT_ALIVE",
    "192": "NON_PARTICIPATING",
    "193": "NOT_ALIVE",
    "194": "NON_PARTICIPATING",
    "195": "NON_PARTICIPATING",
    "196": "NON_PARTICIPATING",
    "197": "SUCCESS",
    "198": "NON_PARTICIPATING",
    "199": "NOT_ALIVE",
    "2": "NON_PARTICIPATING",
    "20": "NOT_ALIVE",
    "200": "NOT_ALIVE",
    "201": "NOT_ALIVE",
    "202": "NOT_ALIVE",
    "203": "NOT_ALIVE",
    "204": "SUCCESS",
    "205": "NON_PARTICIPATING",
    "206": "SUCCESS",
    "207": "NOT_ALIVE",
    "208": "NOT_ALIVE",
    "209": "NOT_ALIVE",
    "21": "NOT_ALIVE",
    "210": "NON_PARTICIPATING",
    "211": "NON_PARTICIPATING",
    "212": "NON_PARTICIPATING",
    "213": "SUCCESS",
    "214": "NON_PARTICIPATING",
    "215": "SUCCESS",
    "216": "NOT_ALIVE",
    "217": "NON_PARTICIPATING",
    "218": "NOT_ALIVE",
    "219": "NOT_ALIVE",
    "22": "NOT_ALIVE",
    "220": "NON_PARTICIPATING",
    "221": "NON_PARTICIPATING",
    "222": "NOT_ALIVE",
    "223": "NOT_ALIVE",
    "224": "NOT_ALIVE",
    "225": "NOT_ALIVE",
    "226": "NOT_ALIVE",
    "227": "NOT_ALIVE",
    "228": "NON_PARTICIPATING",
    "229": "NOT_ALIVE",
    "23": "NON_PARTICIPATING",
    "230": "NON_PARTICIPATING",
    "231": "NOT_ALIVE",
    "232": "NOT_ALIVE",
    "233": "NOT_ALIVE",
    "234": "NOT_ALIVE",
    "235": "NON_PARTICIPATING",
    "236": "NOT_ALIVE",
    "237": "NON_PARTICIPATING",
    "238": "NON_PARTICIPATING",
    "239": "NOT_ALIVE",
    "24": "NOT_ALIVE",
    "240": "NOT_ALIVE",
    "241": "NON_PARTICIPATING",
    "242": "NON_PARTICIPATING",
    "243": "NON_PARTICIPATING",
    "244": "NOT_ALIVE",
    "245": "NON_PARTICIPATING",
    "246": "NON_PARTICIPATING",
    "247": "NON_PARTICIPATING",
    "248": "NON_PARTICIPATING",
    "249": "NON_PARTICIPATING",
    "25": "SUCCESS",
    "250": "NOT_ALIVE",
    "251": "NOT_ALIVE",
    "252": "NON_PARTICIPATING",
    "253": "NOT_ALIVE",
    "254": "NON_PARTICIPATING",
    "255": "NOT_ALIVE",
    "26": "NON_PARTICIPATING",
    "27": "NOT_ALIVE",
    "28": "NOT_ALIVE",
    "29": "NON_PARTICIPATING",
    "3": "NOT_ALIVE",
    "30": "NON_PARTICIPATING",
    "31": "NON_PARTICIPATING",
    "32": "SUCCESS",
    "33": "NOT_ALIVE",
    "34": "NOT_ALIVE",
    "35": "NON_PARTICIPATING",
    "36": "NON_PARTICIPATING",
    "37": "NOT_ALIVE",
    "38": "NON_PARTICIPATING",
    "39": "SUCCESS",
    "4": "NON_PARTICIPATING",
    "40": "NON_PARTICIPATING",
    "41": "NON_PARTICIPATING",
    "42": "NOT_ALIVE",
    "43": "NOT_ALIVE",
    "44": "NON_PARTICIPATING",
    "45": "NOT_ALIVE",
    "46": "NOT_ALIVE",
    "47": "NON_PARTICIPATING",
    "48": "NON_PARTICIPATING",
    "49": "NON_PARTICIPATING",
    "5": "SUCCESS",
    "50": "NOT_ALIVE",
    "51": "NOT_ALIVE",
    "52": "NOT_ALIVE",
    "53": "NON_PARTICIPATING",
    "54": "NOT_ALIVE",
    "55": "NOT_ALIVE",
    "56": "NON_PARTICIPATING",
    "57": "NON_PARTICIPATING",
    "58": "NON_PARTICIPATING",
    "59": "NON_PARTICIPATING",
    "6": "NOT_ALIVE",
    "60": "NOT_ALIVE",
    "61": "NON_PARTICIPATING",
    "62": "NON_PARTICIPATING",
    "63": "NON_PARTICIPATING",
    "64": "NOT_ALIVE",
    "65": "NON_PARTICIPATING",
    "66": "NOT_ALIVE",
    "67": "NOT_ALIVE",
    "68": "NOT_ALIVE",
    "69": "NOT_ALIVE",
    "7": "NON_PARTICIPATING",
    "70": "NOT_ALIVE",
    "71": "NON_PARTICIPATING",
    "72": "NON_PARTICIPATING",
    "73": "NON_PARTICIPATING",
    "74": "NOT_ALIVE",
    "75": "NON_PARTICIPATING",
    "76": "NON_PARTICIPATING",
    "77": "NON_PARTICIPATING",
    "78": "NOT_ALIVE",
    "79": "NOT_ALIVE",
    "8": "NOT_ALIVE",
    "80": "NON_PARTICIPATING",
    "81": "NON_PARTICIPATING",
    "82": "NON_PARTICIPATING",
    "83": "NOT_ALIVE",
    "84": "NON_PARTICIPATING",
    "85": "NON_PARTICIPATING",
    "86": "NON_PARTICIPATING",
    "87": "NON_PARTICIPATING",
    "88": "NOT_ALIVE",
    "89": "NOT_ALIVE",
    "9": "NON_PARTICIPATING",
    "90": "NOT_ALIVE",
    "91": "NOT_ALIVE",
    "92": "NON_PARTICIPATING",
    "93": "NOT_ALIVE",
    "94": "SUCCESS",
    "95": "NOT_ALIVE",
    "96": "NON_PARTICIPATING",
    "97": "NOT_ALIVE",
    "98": "NOT_ALIVE",
    "99": "NOT_ALIVE"
  },
  "architectures": [
    "LlamaForCausalLM"
  ],
  "attention_bias": false,
  "attention_dropout": 0.0,
  "block_list": [
    6002606,
    6002638
  ],
  "bos_token_id": 1,
  "eos_token_id": 2,
  "hidden_act": "silu",
  "hidden_size": 2048,
  "initializer_range": 0.02,
  "inner_step": 34,
  "intermediate_size": 5632,
  "last_allreduce_block": 6000755,
  "max_position_embeddings": 2048,
  "mlp_bias": false,
  "model_type": "llama",
  "num_attention_heads": 32,
  "num_hidden_layers": 22,
  "num_key_value_heads": 4,
  "pretraining_tp": 1,
  "rms_norm_eps": 1e-05,
  "rope_scaling": null,
  "rope_theta": 10000.0,
  "tie_word_embeddings": false,
  "torch_dtype": "float32",
  "transformers_version": "4.39.3",
  "use_cache": false,
  "vocab_size": 32000
}