File size: 7,643 Bytes
81f46ae 5a94dab 81f46ae 29af3aa 31622ba 81f46ae 5a94dab b12371b 7d22a59 0211811 b36280c 06e8302 d8fd059 3b3bbc6 0211811 7d22a59 06e8302 5a94dab 0211811 5a94dab 06e8302 02932c7 b12371b 29af3aa b12371b 8f887aa 3b3bbc6 f0c3414 5a94dab cc3771a 06e8302 02932c7 8c98fcd a94367a 20efbef 29af3aa 81f46ae 06e8302 7d22a59 06e8302 7d22a59 f6a98d4 7d22a59 a94367a 7d22a59 0211811 06e8302 5a94dab cc3771a f6a98d4 06e8302 a94367a 5a94dab 06e8302 3211fdb 7d22a59 3b3bbc6 81f46ae 6521efd 5a94dab 0211811 06e8302 20efbef 06e8302 5a94dab cc3771a 1cd40ac a94367a 06e8302 7d22a59 02932c7 06e8302 7d22a59 06e8302 3b3bbc6 4287490 02932c7 5a94dab 81f46ae b12371b 06e8302 0211811 b36280c 81f46ae 6d59323 7d22a59 31622ba 02932c7 cc3771a 8f887aa 81f46ae 06e8302 0211811 29af3aa cc3771a b12371b 06e8302 81f46ae b0748d4 e852704 81f46ae b12371b 3b3bbc6 06e8302 5a94dab 7d22a59 5a94dab b12371b 06e8302 b12371b 29af3aa ab7896c 926bc46 f0c3414 7d22a59 06e8302 81f46ae 0211811 b12371b 8f887aa 06e8302 0211811 5a94dab 06e8302 b12371b 5a94dab 0211811 d8fd059 f6a98d4 b12371b 5a94dab 81f46ae 6d59323 29af3aa 81f46ae 3211fdb 81f46ae b12371b a94367a 0211811 e852704 7d22a59 926bc46 e7fdf28 fcfa88c b12371b cc3771a 6d59323 06e8302 f6a98d4 02932c7 06e8302 8c98fcd f6a98d4 b12371b 5a94dab 8fef937 5a94dab 926bc46 fcfa88c 7d22a59 6521efd 81f46ae 7d22a59 3b3bbc6 7d22a59 02932c7 5a94dab 06e8302 a94367a 06e8302 b12371b 29af3aa 06e8302 5a94dab 06e8302 81f46ae 06e8302 5a94dab c38724d 03b8370 3b3bbc6 5a94dab b12371b 5a94dab e852704 29af3aa 7d22a59 3b3bbc6 e7fdf28 8f887aa 06e8302 e852704 7d22a59 b12371b 7d22a59 06e8302 f6a98d4 09056e5 e852704 1cd40ac 7d22a59 06e8302 5a94dab 7d22a59 0211811 b12371b 06e8302 b12371b f6a98d4 31622ba b36280c 06e8302 b12371b 06e8302 0211811 b12371b 06e8302 a94367a 3b3bbc6 06e8302 926bc46 31622ba c38724d 31622ba 3b3bbc6 b12371b fcfa88c b12371b 06e8302 926bc46 a94367a 81f46ae 3b3bbc6 7d22a59 f6a98d4 5a94dab a94367a 06e8302 b36280c 06e8302 3b3bbc6 360abed 03b8370 81f46ae 9a1a1e8 81f46ae 9a1a1e8 81f46ae 06e8302 81f46ae |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 |
{
"_name_or_path": "distributed/llama-1b",
"all_reduce_scores": {
"0": "NOT_ALIVE",
"1": "NOT_ALIVE",
"10": "NOT_ALIVE",
"100": "NOT_ALIVE",
"101": "NON_PARTICIPATING",
"102": "NOT_ALIVE",
"103": "NON_PARTICIPATING",
"104": "NON_PARTICIPATING",
"105": "NON_PARTICIPATING",
"106": "NON_PARTICIPATING",
"107": "NOT_ALIVE",
"108": "SUCCESS",
"109": "NOT_ALIVE",
"11": "NOT_ALIVE",
"110": "NON_PARTICIPATING",
"111": "NON_PARTICIPATING",
"112": "NON_PARTICIPATING",
"113": "NOT_ALIVE",
"114": "NON_PARTICIPATING",
"115": "NON_PARTICIPATING",
"116": "NON_PARTICIPATING",
"117": "NON_PARTICIPATING",
"118": "NOT_ALIVE",
"119": "NOT_ALIVE",
"12": "NON_PARTICIPATING",
"120": "NOT_ALIVE",
"121": "NOT_ALIVE",
"122": "NON_PARTICIPATING",
"123": "NOT_ALIVE",
"124": "SUCCESS",
"125": "NON_PARTICIPATING",
"126": "NOT_ALIVE",
"127": "NOT_ALIVE",
"128": "NOT_ALIVE",
"129": "NON_PARTICIPATING",
"13": "NOT_ALIVE",
"130": "NOT_ALIVE",
"131": "NOT_ALIVE",
"132": "NOT_ALIVE",
"133": "NON_PARTICIPATING",
"134": "NOT_ALIVE",
"135": "NON_PARTICIPATING",
"136": "NON_PARTICIPATING",
"137": "NON_PARTICIPATING",
"138": "SUCCESS",
"139": "NON_PARTICIPATING",
"14": "SUCCESS",
"140": "NON_PARTICIPATING",
"141": "NON_PARTICIPATING",
"142": "NOT_ALIVE",
"143": "NON_PARTICIPATING",
"144": "NOT_ALIVE",
"145": "NOT_ALIVE",
"146": "NON_PARTICIPATING",
"147": "NON_PARTICIPATING",
"148": "SUCCESS",
"149": "NON_PARTICIPATING",
"15": "SUCCESS",
"150": "NOT_ALIVE",
"151": "NOT_ALIVE",
"152": "NOT_ALIVE",
"153": "SUCCESS",
"154": "NON_PARTICIPATING",
"155": "SUCCESS",
"156": "NOT_ALIVE",
"157": "NOT_ALIVE",
"158": "NON_PARTICIPATING",
"159": "NOT_ALIVE",
"16": "NON_PARTICIPATING",
"160": "NON_PARTICIPATING",
"161": "NON_PARTICIPATING",
"162": "NOT_ALIVE",
"163": "NOT_ALIVE",
"164": "SUCCESS",
"165": "SUCCESS",
"166": "NOT_ALIVE",
"167": "NON_PARTICIPATING",
"168": "SUCCESS",
"169": "NOT_ALIVE",
"17": "NOT_ALIVE",
"170": "NON_PARTICIPATING",
"171": "NOT_ALIVE",
"172": "NOT_ALIVE",
"173": "SUCCESS",
"174": "NON_PARTICIPATING",
"175": "NOT_ALIVE",
"176": "NOT_ALIVE",
"177": "NOT_ALIVE",
"178": "NOT_ALIVE",
"179": "NOT_ALIVE",
"18": "NOT_ALIVE",
"180": "NOT_ALIVE",
"181": "NOT_ALIVE",
"182": "NOT_ALIVE",
"183": "SUCCESS",
"184": "NON_PARTICIPATING",
"185": "NOT_ALIVE",
"186": "NON_PARTICIPATING",
"187": "NOT_ALIVE",
"188": "NOT_ALIVE",
"189": "NOT_ALIVE",
"19": "NOT_ALIVE",
"190": "NON_PARTICIPATING",
"191": "NOT_ALIVE",
"192": "NOT_ALIVE",
"193": "NOT_ALIVE",
"194": "NOT_ALIVE",
"195": "NOT_ALIVE",
"196": "NON_PARTICIPATING",
"197": "SUCCESS",
"198": "NOT_ALIVE",
"199": "NON_PARTICIPATING",
"2": "NOT_ALIVE",
"20": "NOT_ALIVE",
"200": "NOT_ALIVE",
"201": "NON_PARTICIPATING",
"202": "NOT_ALIVE",
"203": "NOT_ALIVE",
"204": "SUCCESS",
"205": "NOT_ALIVE",
"206": "NOT_ALIVE",
"207": "NOT_ALIVE",
"208": "NON_PARTICIPATING",
"209": "NOT_ALIVE",
"21": "NOT_ALIVE",
"210": "NOT_ALIVE",
"211": "NON_PARTICIPATING",
"212": "NON_PARTICIPATING",
"213": "NON_PARTICIPATING",
"214": "NON_PARTICIPATING",
"215": "SUCCESS",
"216": "NON_PARTICIPATING",
"217": "NON_PARTICIPATING",
"218": "NON_PARTICIPATING",
"219": "NOT_ALIVE",
"22": "NOT_ALIVE",
"220": "NON_PARTICIPATING",
"221": "NOT_ALIVE",
"222": "NOT_ALIVE",
"223": "NOT_ALIVE",
"224": "NOT_ALIVE",
"225": "NOT_ALIVE",
"226": "NOT_ALIVE",
"227": "NON_PARTICIPATING",
"228": "NON_PARTICIPATING",
"229": "NON_PARTICIPATING",
"23": "NON_PARTICIPATING",
"230": "NON_PARTICIPATING",
"231": "NOT_ALIVE",
"232": "NOT_ALIVE",
"233": "NOT_ALIVE",
"234": "NOT_ALIVE",
"235": "NON_PARTICIPATING",
"236": "NOT_ALIVE",
"237": "SUCCESS",
"238": "NON_PARTICIPATING",
"239": "NOT_ALIVE",
"24": "NOT_ALIVE",
"240": "NOT_ALIVE",
"241": "NON_PARTICIPATING",
"242": "NOT_ALIVE",
"243": "NON_PARTICIPATING",
"244": "NOT_ALIVE",
"245": "NOT_ALIVE",
"246": "NON_PARTICIPATING",
"247": "NON_PARTICIPATING",
"248": "NON_PARTICIPATING",
"249": "NOT_ALIVE",
"25": "SUCCESS",
"250": "SUCCESS",
"251": "NON_PARTICIPATING",
"252": "NON_PARTICIPATING",
"253": "NOT_ALIVE",
"254": "SUCCESS",
"255": "NOT_ALIVE",
"26": "NON_PARTICIPATING",
"27": "NOT_ALIVE",
"28": "NOT_ALIVE",
"29": "NOT_ALIVE",
"3": "NOT_ALIVE",
"30": "NOT_ALIVE",
"31": "NON_PARTICIPATING",
"32": "SUCCESS",
"33": "NOT_ALIVE",
"34": "NOT_ALIVE",
"35": "NON_PARTICIPATING",
"36": "NOT_ALIVE",
"37": "NOT_ALIVE",
"38": "NOT_ALIVE",
"39": "NON_PARTICIPATING",
"4": "NOT_ALIVE",
"40": "NON_PARTICIPATING",
"41": "NON_PARTICIPATING",
"42": "NON_PARTICIPATING",
"43": "NOT_ALIVE",
"44": "NON_PARTICIPATING",
"45": "NOT_ALIVE",
"46": "NOT_ALIVE",
"47": "NOT_ALIVE",
"48": "NON_PARTICIPATING",
"49": "NON_PARTICIPATING",
"5": "SUCCESS",
"50": "NOT_ALIVE",
"51": "NOT_ALIVE",
"52": "NOT_ALIVE",
"53": "NON_PARTICIPATING",
"54": "NOT_ALIVE",
"55": "NOT_ALIVE",
"56": "NON_PARTICIPATING",
"57": "NON_PARTICIPATING",
"58": "NON_PARTICIPATING",
"59": "NON_PARTICIPATING",
"6": "NON_PARTICIPATING",
"60": "NON_PARTICIPATING",
"61": "NON_PARTICIPATING",
"62": "NOT_ALIVE",
"63": "NON_PARTICIPATING",
"64": "NOT_ALIVE",
"65": "NON_PARTICIPATING",
"66": "NOT_ALIVE",
"67": "NOT_ALIVE",
"68": "NOT_ALIVE",
"69": "NOT_ALIVE",
"7": "NON_PARTICIPATING",
"70": "NOT_ALIVE",
"71": "NON_PARTICIPATING",
"72": "NOT_ALIVE",
"73": "NOT_ALIVE",
"74": "NON_PARTICIPATING",
"75": "NOT_ALIVE",
"76": "NON_PARTICIPATING",
"77": "NON_PARTICIPATING",
"78": "NOT_ALIVE",
"79": "NOT_ALIVE",
"8": "NOT_ALIVE",
"80": "NON_PARTICIPATING",
"81": "NOT_ALIVE",
"82": "NON_PARTICIPATING",
"83": "NOT_ALIVE",
"84": "NON_PARTICIPATING",
"85": "NOT_ALIVE",
"86": "NON_PARTICIPATING",
"87": "NON_PARTICIPATING",
"88": "NON_PARTICIPATING",
"89": "NOT_ALIVE",
"9": "NOT_ALIVE",
"90": "NON_PARTICIPATING",
"91": "NON_PARTICIPATING",
"92": "NON_PARTICIPATING",
"93": "NOT_ALIVE",
"94": "NOT_ALIVE",
"95": "NOT_ALIVE",
"96": "NON_PARTICIPATING",
"97": "NON_PARTICIPATING",
"98": "NON_PARTICIPATING",
"99": "NOT_ALIVE"
},
"architectures": [
"LlamaForCausalLM"
],
"attention_bias": false,
"attention_dropout": 0.0,
"block_list": [
5987273,
5987277,
5987280
],
"bos_token_id": 1,
"eos_token_id": 2,
"hidden_act": "silu",
"hidden_size": 2048,
"initializer_range": 0.02,
"inner_step": 45,
"intermediate_size": 5632,
"last_allreduce_block": 5986899,
"max_position_embeddings": 2048,
"mlp_bias": false,
"model_type": "llama",
"num_attention_heads": 32,
"num_hidden_layers": 22,
"num_key_value_heads": 4,
"pretraining_tp": 1,
"rms_norm_eps": 1e-05,
"rope_scaling": null,
"rope_theta": 10000.0,
"tie_word_embeddings": false,
"torch_dtype": "float32",
"transformers_version": "4.39.3",
"use_cache": false,
"vocab_size": 32000
}
|