File size: 7,194 Bytes
836b91f a4a231a 836b91f 5d8bea0 549cd33 4a54bdc 5c048a9 549cd33 f38f043 e86c954 5c048a9 f73c6dc 5c048a9 f73c6dc 5c048a9 e86c954 5c048a9 e86c954 96aa97f f38f043 e86c954 5c048a9 e86c954 836b91f ff94ff6 5c048a9 f73c6dc e86c954 a4a231a 836b91f e86c954 5d8bea0 e86c954 df93e4c e86c954 5c048a9 4a54bdc 58a4c56 76910c0 e86c954 ff94ff6 5c048a9 e86c954 5d8bea0 e86c954 5c048a9 549cd33 e86c954 5c048a9 f73c6dc f38f043 f73c6dc 549cd33 e86c954 836b91f 40550d4 5c048a9 f38f043 a4a231a 1adfa33 5d8bea0 f38f043 e86c954 f73c6dc a4a231a e86c954 58a4c56 836b91f 77c205d e86c954 5d8bea0 e86c954 836b91f 58a4c56 e86c954 836b91f e86c954 f38f043 e86c954 5d8bea0 5c048a9 e86c954 a4a231a 5d8bea0 f38f043 f73c6dc e86c954 f38f043 f73c6dc 549cd33 e86c954 836b91f 626b56d 5d8bea0 836b91f e86c954 5d8bea0 e86c954 5d8bea0 88591d9 5c048a9 e86c954 5c048a9 e86c954 5c048a9 88591d9 f38f043 5d8bea0 e86c954 5c048a9 f73c6dc e86c954 df93e4c f38f043 e86c954 5c048a9 549cd33 e86c954 836b91f e86c954 5c048a9 58a4c56 5c048a9 e86c954 f73c6dc e86c954 f73c6dc e86c954 5c048a9 f73c6dc 5d8bea0 e86c954 58a4c56 e86c954 5c048a9 1f6d0f2 836b91f 5c048a9 b28592c e86c954 b28592c f73c6dc e86c954 f73c6dc e86c954 58a4c56 e86c954 836b91f 5c048a9 f73c6dc e86c954 58a4c56 e86c954 5d8bea0 e86c954 f73c6dc 549cd33 58a4c56 b28592c 549cd33 5c048a9 e86c954 77c205d e86c954 5c048a9 e86c954 5c048a9 58a4c56 e86c954 f73c6dc b28592c e86c954 549cd33 5c048a9 e86c954 5d8bea0 f38f043 58a4c56 5d8bea0 88591d9 5d8bea0 e86c954 549cd33 5d8bea0 e86c954 836b91f e86c954 5d8bea0 e86c954 5d8bea0 ff94ff6 4822cbf eddea2e e86c954 f73c6dc e86c954 5c048a9 e86c954 5d8bea0 e86c954 f73c6dc 836b91f 423de4a 836b91f 423de4a 836b91f e86c954 836b91f |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 |
{
"_name_or_path": "distributed/llama-1b",
"all_reduce_scores": {
"0": "NOT_ALIVE",
"1": "SUCCESS",
"10": "NOT_ALIVE",
"100": "NOT_ALIVE",
"101": "SUCCESS",
"102": "NON_PARTICIPATING",
"103": "NON_PARTICIPATING",
"104": "NON_PARTICIPATING",
"105": "NON_PARTICIPATING",
"106": "SUCCESS",
"107": "NON_PARTICIPATING",
"108": "SUCCESS",
"109": "NON_PARTICIPATING",
"11": "SUCCESS",
"110": "NON_PARTICIPATING",
"111": "NON_PARTICIPATING",
"112": "SUCCESS",
"113": "NOT_ALIVE",
"114": "SUCCESS",
"115": "NOT_ALIVE",
"116": "NON_PARTICIPATING",
"117": "SUCCESS",
"118": "NON_PARTICIPATING",
"119": "NOT_ALIVE",
"12": "NOT_ALIVE",
"120": "NON_PARTICIPATING",
"121": "SUCCESS",
"122": "SUCCESS",
"123": "SUCCESS",
"124": "NOT_ALIVE",
"125": "NOT_ALIVE",
"126": "SUCCESS",
"127": "FAIL",
"128": "FAIL",
"129": "NON_PARTICIPATING",
"13": "NOT_ALIVE",
"130": "SUCCESS",
"131": "NON_PARTICIPATING",
"132": "SUCCESS",
"133": "SUCCESS",
"134": "NOT_ALIVE",
"135": "SUCCESS",
"136": "SUCCESS",
"137": "FAIL",
"138": "NOT_ALIVE",
"139": "SUCCESS",
"14": "NOT_ALIVE",
"140": "SUCCESS",
"141": "NOT_ALIVE",
"142": "SUCCESS",
"143": "NON_PARTICIPATING",
"144": "SUCCESS",
"145": "FAIL",
"146": "NON_PARTICIPATING",
"147": "SUCCESS",
"148": "NON_PARTICIPATING",
"149": "SUCCESS",
"15": "SUCCESS",
"150": "SUCCESS",
"151": "NON_PARTICIPATING",
"152": "NON_PARTICIPATING",
"153": "NON_PARTICIPATING",
"154": "SUCCESS",
"155": "SUCCESS",
"156": "NOT_ALIVE",
"157": "NON_PARTICIPATING",
"158": "NON_PARTICIPATING",
"159": "SUCCESS",
"16": "NOT_ALIVE",
"160": "NON_PARTICIPATING",
"161": "SUCCESS",
"162": "NON_PARTICIPATING",
"163": "SUCCESS",
"164": "SUCCESS",
"165": "SUCCESS",
"166": "NOT_ALIVE",
"167": "SUCCESS",
"168": "NON_PARTICIPATING",
"169": "SUCCESS",
"17": "NOT_ALIVE",
"170": "SUCCESS",
"171": "FAIL",
"172": "FAIL",
"173": "NOT_ALIVE",
"174": "SUCCESS",
"175": "NON_PARTICIPATING",
"176": "NOT_ALIVE",
"177": "SUCCESS",
"178": "SUCCESS",
"179": "SUCCESS",
"18": "NOT_ALIVE",
"180": "NON_PARTICIPATING",
"181": "SUCCESS",
"182": "NOT_ALIVE",
"183": "FAIL",
"184": "SUCCESS",
"185": "FAIL",
"186": "SUCCESS",
"187": "NOT_ALIVE",
"188": "SUCCESS",
"189": "SUCCESS",
"19": "NOT_ALIVE",
"190": "NON_PARTICIPATING",
"191": "SUCCESS",
"192": "FAIL",
"193": "NOT_ALIVE",
"194": "NON_PARTICIPATING",
"195": "SUCCESS",
"196": "SUCCESS",
"197": "NON_PARTICIPATING",
"198": "NOT_ALIVE",
"199": "FAIL",
"2": "NOT_ALIVE",
"20": "NOT_ALIVE",
"200": "NON_PARTICIPATING",
"201": "NOT_ALIVE",
"202": "SUCCESS",
"203": "SUCCESS",
"204": "NON_PARTICIPATING",
"205": "NOT_ALIVE",
"206": "NON_PARTICIPATING",
"207": "NON_PARTICIPATING",
"208": "SUCCESS",
"209": "SUCCESS",
"21": "SUCCESS",
"210": "NON_PARTICIPATING",
"211": "SUCCESS",
"212": "SUCCESS",
"213": "SUCCESS",
"214": "FAIL",
"215": "SUCCESS",
"216": "SUCCESS",
"217": "SUCCESS",
"218": "SUCCESS",
"219": "NON_PARTICIPATING",
"22": "FAIL",
"220": "NON_PARTICIPATING",
"221": "SUCCESS",
"222": "SUCCESS",
"223": "NOT_ALIVE",
"224": "NON_PARTICIPATING",
"225": "SUCCESS",
"226": "NON_PARTICIPATING",
"227": "NON_PARTICIPATING",
"228": "NON_PARTICIPATING",
"229": "NOT_ALIVE",
"23": "NOT_ALIVE",
"230": "SUCCESS",
"231": "NOT_ALIVE",
"232": "NOT_ALIVE",
"233": "SUCCESS",
"234": "SUCCESS",
"235": "NOT_ALIVE",
"236": "SUCCESS",
"237": "NON_PARTICIPATING",
"238": "NON_PARTICIPATING",
"239": "NON_PARTICIPATING",
"24": "SUCCESS",
"240": "NON_PARTICIPATING",
"241": "NON_PARTICIPATING",
"242": "SUCCESS",
"243": "SUCCESS",
"244": "NON_PARTICIPATING",
"245": "NON_PARTICIPATING",
"246": "NON_PARTICIPATING",
"247": "FAIL",
"248": "SUCCESS",
"249": "NOT_ALIVE",
"25": "SUCCESS",
"250": "FAIL",
"251": "NOT_ALIVE",
"252": "NON_PARTICIPATING",
"253": "SUCCESS",
"254": "NOT_ALIVE",
"255": "NON_PARTICIPATING",
"26": "NON_PARTICIPATING",
"27": "SUCCESS",
"28": "FAIL",
"29": "SUCCESS",
"3": "NOT_ALIVE",
"30": "FAIL",
"31": "SUCCESS",
"32": "FAIL",
"33": "NOT_ALIVE",
"34": "SUCCESS",
"35": "SUCCESS",
"36": "SUCCESS",
"37": "SUCCESS",
"38": "SUCCESS",
"39": "SUCCESS",
"4": "NOT_ALIVE",
"40": "SUCCESS",
"41": "SUCCESS",
"42": "SUCCESS",
"43": "NOT_ALIVE",
"44": "SUCCESS",
"45": "NOT_ALIVE",
"46": "SUCCESS",
"47": "SUCCESS",
"48": "NOT_ALIVE",
"49": "NON_PARTICIPATING",
"5": "SUCCESS",
"50": "FAIL",
"51": "NOT_ALIVE",
"52": "SUCCESS",
"53": "SUCCESS",
"54": "NON_PARTICIPATING",
"55": "SUCCESS",
"56": "NON_PARTICIPATING",
"57": "SUCCESS",
"58": "NOT_ALIVE",
"59": "NON_PARTICIPATING",
"6": "NOT_ALIVE",
"60": "SUCCESS",
"61": "SUCCESS",
"62": "SUCCESS",
"63": "SUCCESS",
"64": "SUCCESS",
"65": "NON_PARTICIPATING",
"66": "NON_PARTICIPATING",
"67": "NON_PARTICIPATING",
"68": "SUCCESS",
"69": "NON_PARTICIPATING",
"7": "SUCCESS",
"70": "SUCCESS",
"71": "NON_PARTICIPATING",
"72": "NON_PARTICIPATING",
"73": "NON_PARTICIPATING",
"74": "SUCCESS",
"75": "NON_PARTICIPATING",
"76": "FAIL",
"77": "SUCCESS",
"78": "NON_PARTICIPATING",
"79": "SUCCESS",
"8": "NOT_ALIVE",
"80": "NON_PARTICIPATING",
"81": "NON_PARTICIPATING",
"82": "SUCCESS",
"83": "NON_PARTICIPATING",
"84": "NON_PARTICIPATING",
"85": "NON_PARTICIPATING",
"86": "NON_PARTICIPATING",
"87": "SUCCESS",
"88": "NON_PARTICIPATING",
"89": "NON_PARTICIPATING",
"9": "NOT_ALIVE",
"90": "NON_PARTICIPATING",
"91": "NOT_ALIVE",
"92": "SUCCESS",
"93": "NON_PARTICIPATING",
"94": "NON_PARTICIPATING",
"95": "NON_PARTICIPATING",
"96": "NON_PARTICIPATING",
"97": "SUCCESS",
"98": "NOT_ALIVE",
"99": "NON_PARTICIPATING"
},
"architectures": [
"LlamaForCausalLM"
],
"attention_bias": false,
"attention_dropout": 0.0,
"block_list": [
6385383,
6385399,
6385410
],
"bos_token_id": 1,
"eos_token_id": 2,
"hidden_act": "silu",
"hidden_size": 2048,
"initializer_range": 0.02,
"inner_step": 27,
"intermediate_size": 5632,
"last_allreduce_block": 6385112,
"max_position_embeddings": 2048,
"mlp_bias": false,
"model_type": "llama",
"num_attention_heads": 32,
"num_hidden_layers": 22,
"num_key_value_heads": 4,
"pretraining_tp": 1,
"rms_norm_eps": 1e-05,
"rope_scaling": null,
"rope_theta": 10000.0,
"tie_word_embeddings": false,
"torch_dtype": "float32",
"transformers_version": "4.39.3",
"use_cache": false,
"vocab_size": 32000
}
|