File size: 7,574 Bytes
a9159a6 c8953b8 8773dcf c8953b8 45c6851 c8953b8 3d480fd a9159a6 0e0bc0a 5bbcec1 a9159a6 c8953b8 8773dcf a9159a6 d643d7a 94cba48 c8953b8 8773dcf 79dae0d dd9b167 a9159a6 94cba48 8773dcf 0e0bc0a 7458ad2 dd9b167 a9159a6 8773dcf a9159a6 8773dcf 5bbcec1 a9159a6 b8d6f6d dd9b167 c8953b8 5bbcec1 45c6851 c8953b8 a9159a6 b8d6f6d dd9b167 5bbcec1 c8953b8 dd9b167 8773dcf a5147de d643d7a dd9b167 8773dcf d643d7a 8773dcf a5147de a9159a6 49f3440 5bbcec1 a9159a6 7458ad2 8773dcf c8953b8 a9159a6 a5147de dd9b167 7458ad2 c8953b8 8773dcf b8d6f6d d643d7a 8773dcf 49f3440 dd9b167 a9159a6 b8d6f6d 5bbcec1 45c6851 dd9b167 49f3440 a9159a6 8773dcf c8953b8 d643d7a 5bbcec1 a9159a6 b6d1753 8773dcf c8953b8 49f3440 c8953b8 5bbcec1 45c6851 8773dcf 45c6851 5bbcec1 45c6851 a9159a6 d643d7a b6d1753 45c6851 5bbcec1 8773dcf 7458ad2 a9159a6 5bbcec1 c8953b8 d643d7a 49f3440 c8953b8 a9159a6 3d480fd 5bbcec1 45c6851 8773dcf 45c6851 b6d1753 5bbcec1 45c6851 d643d7a 45c6851 a9159a6 7458ad2 d643d7a dd9b167 a9159a6 c8953b8 5bbcec1 8773dcf 45c6851 a9159a6 a5147de d643d7a a5147de a9159a6 a5147de b8d6f6d 8773dcf a9159a6 45c6851 a9159a6 5bbcec1 7458ad2 c8953b8 3d480fd 8773dcf a9159a6 8773dcf 3d480fd 8773dcf 5bbcec1 c8953b8 45c6851 c8953b8 a9159a6 45c6851 a9159a6 45c6851 8773dcf c8953b8 a9159a6 5bbcec1 4f1965a d643d7a a9159a6 5bbcec1 c8953b8 a9159a6 d643d7a 8773dcf d643d7a 0e0bc0a 8773dcf c8953b8 8773dcf 49f3440 a9159a6 49f3440 94cba48 8773dcf a9159a6 a5147de c8953b8 a5147de 7458ad2 d643d7a a9159a6 c8953b8 4f1965a a9159a6 c8953b8 49f3440 8773dcf c8953b8 8773dcf 79dae0d 49f3440 a9159a6 c8953b8 45c6851 a9159a6 dd9b167 49f3440 79dae0d c8953b8 5bbcec1 c8953b8 a9159a6 a5147de a9159a6 8773dcf a9159a6 4f1965a d643d7a 45c6851 a5147de 94cba48 45c6851 a9159a6 82f0290 a9159a6 82f0290 a9159a6 c8953b8 a9159a6 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 |
{
"_name_or_path": "distributed/llama-1b",
"all_reduce_scores": {
"0": "NOT_ALIVE",
"1": "SUCCESS",
"10": "NOT_ALIVE",
"100": "NOT_ALIVE",
"101": "NON_PARTICIPATING",
"102": "NOT_ALIVE",
"103": "NOT_ALIVE",
"104": "NOT_ALIVE",
"105": "NON_PARTICIPATING",
"106": "NOT_ALIVE",
"107": "NOT_ALIVE",
"108": "NON_PARTICIPATING",
"109": "NOT_ALIVE",
"11": "NOT_ALIVE",
"110": "NOT_ALIVE",
"111": "NON_PARTICIPATING",
"112": "NON_PARTICIPATING",
"113": "NOT_ALIVE",
"114": "NOT_ALIVE",
"115": "NOT_ALIVE",
"116": "NOT_ALIVE",
"117": "NOT_ALIVE",
"118": "NON_PARTICIPATING",
"119": "NOT_ALIVE",
"12": "NOT_ALIVE",
"120": "NON_PARTICIPATING",
"121": "NOT_ALIVE",
"122": "NON_PARTICIPATING",
"123": "NOT_ALIVE",
"124": "NON_PARTICIPATING",
"125": "NOT_ALIVE",
"126": "NOT_ALIVE",
"127": "NOT_ALIVE",
"128": "NOT_ALIVE",
"129": "NOT_ALIVE",
"13": "NOT_ALIVE",
"130": "NOT_ALIVE",
"131": "NOT_ALIVE",
"132": "NOT_ALIVE",
"133": "SUCCESS",
"134": "NOT_ALIVE",
"135": "NON_PARTICIPATING",
"136": "NON_PARTICIPATING",
"137": "NON_PARTICIPATING",
"138": "NON_PARTICIPATING",
"139": "NOT_ALIVE",
"14": "NOT_ALIVE",
"140": "SUCCESS",
"141": "NON_PARTICIPATING",
"142": "NON_PARTICIPATING",
"143": "NON_PARTICIPATING",
"144": "SUCCESS",
"145": "NOT_ALIVE",
"146": "NON_PARTICIPATING",
"147": "NON_PARTICIPATING",
"148": "SUCCESS",
"149": "NOT_ALIVE",
"15": "SUCCESS",
"150": "NOT_ALIVE",
"151": "NON_PARTICIPATING",
"152": "NOT_ALIVE",
"153": "NOT_ALIVE",
"154": "NON_PARTICIPATING",
"155": "NON_PARTICIPATING",
"156": "NOT_ALIVE",
"157": "NOT_ALIVE",
"158": "NON_PARTICIPATING",
"159": "NOT_ALIVE",
"16": "NOT_ALIVE",
"160": "NON_PARTICIPATING",
"161": "NON_PARTICIPATING",
"162": "NON_PARTICIPATING",
"163": "NOT_ALIVE",
"164": "NOT_ALIVE",
"165": "NON_PARTICIPATING",
"166": "NON_PARTICIPATING",
"167": "NOT_ALIVE",
"168": "NON_PARTICIPATING",
"169": "NON_PARTICIPATING",
"17": "NOT_ALIVE",
"170": "NON_PARTICIPATING",
"171": "NON_PARTICIPATING",
"172": "NON_PARTICIPATING",
"173": "NON_PARTICIPATING",
"174": "NON_PARTICIPATING",
"175": "NON_PARTICIPATING",
"176": "NOT_ALIVE",
"177": "NOT_ALIVE",
"178": "NOT_ALIVE",
"179": "NOT_ALIVE",
"18": "SUCCESS",
"180": "NON_PARTICIPATING",
"181": "NOT_ALIVE",
"182": "NON_PARTICIPATING",
"183": "NOT_ALIVE",
"184": "NON_PARTICIPATING",
"185": "NON_PARTICIPATING",
"186": "NON_PARTICIPATING",
"187": "SUCCESS",
"188": "SUCCESS",
"189": "SUCCESS",
"19": "NOT_ALIVE",
"190": "NON_PARTICIPATING",
"191": "NON_PARTICIPATING",
"192": "NON_PARTICIPATING",
"193": "NOT_ALIVE",
"194": "NOT_ALIVE",
"195": "NON_PARTICIPATING",
"196": "NOT_ALIVE",
"197": "SUCCESS",
"198": "NON_PARTICIPATING",
"199": "NOT_ALIVE",
"2": "NOT_ALIVE",
"20": "NOT_ALIVE",
"200": "NON_PARTICIPATING",
"201": "SUCCESS",
"202": "NON_PARTICIPATING",
"203": "NON_PARTICIPATING",
"204": "NOT_ALIVE",
"205": "NOT_ALIVE",
"206": "NOT_ALIVE",
"207": "NOT_ALIVE",
"208": "NOT_ALIVE",
"209": "NON_PARTICIPATING",
"21": "SUCCESS",
"210": "NOT_ALIVE",
"211": "NON_PARTICIPATING",
"212": "NON_PARTICIPATING",
"213": "NON_PARTICIPATING",
"214": "NON_PARTICIPATING",
"215": "NOT_ALIVE",
"216": "SUCCESS",
"217": "SUCCESS",
"218": "NON_PARTICIPATING",
"219": "SUCCESS",
"22": "NOT_ALIVE",
"220": "NOT_ALIVE",
"221": "NOT_ALIVE",
"222": "NON_PARTICIPATING",
"223": "NOT_ALIVE",
"224": "NOT_ALIVE",
"225": "NOT_ALIVE",
"226": "NON_PARTICIPATING",
"227": "NON_PARTICIPATING",
"228": "SUCCESS",
"229": "NOT_ALIVE",
"23": "SUCCESS",
"230": "SUCCESS",
"231": "NOT_ALIVE",
"232": "NOT_ALIVE",
"233": "NON_PARTICIPATING",
"234": "NOT_ALIVE",
"235": "NON_PARTICIPATING",
"236": "NOT_ALIVE",
"237": "NON_PARTICIPATING",
"238": "NON_PARTICIPATING",
"239": "NON_PARTICIPATING",
"24": "NOT_ALIVE",
"240": "NOT_ALIVE",
"241": "NON_PARTICIPATING",
"242": "SUCCESS",
"243": "NOT_ALIVE",
"244": "NON_PARTICIPATING",
"245": "NON_PARTICIPATING",
"246": "NON_PARTICIPATING",
"247": "NOT_ALIVE",
"248": "NOT_ALIVE",
"249": "NOT_ALIVE",
"25": "SUCCESS",
"250": "NOT_ALIVE",
"251": "NON_PARTICIPATING",
"252": "NON_PARTICIPATING",
"253": "NON_PARTICIPATING",
"254": "NON_PARTICIPATING",
"255": "NON_PARTICIPATING",
"26": "NON_PARTICIPATING",
"27": "NOT_ALIVE",
"28": "NON_PARTICIPATING",
"29": "NOT_ALIVE",
"3": "SUCCESS",
"30": "NOT_ALIVE",
"31": "NOT_ALIVE",
"32": "FAIL",
"33": "NOT_ALIVE",
"34": "NON_PARTICIPATING",
"35": "NON_PARTICIPATING",
"36": "SUCCESS",
"37": "NOT_ALIVE",
"38": "NON_PARTICIPATING",
"39": "NOT_ALIVE",
"4": "NOT_ALIVE",
"40": "NON_PARTICIPATING",
"41": "NOT_ALIVE",
"42": "NOT_ALIVE",
"43": "NON_PARTICIPATING",
"44": "NON_PARTICIPATING",
"45": "NOT_ALIVE",
"46": "SUCCESS",
"47": "NOT_ALIVE",
"48": "NON_PARTICIPATING",
"49": "NOT_ALIVE",
"5": "NOT_ALIVE",
"50": "SUCCESS",
"51": "NOT_ALIVE",
"52": "NOT_ALIVE",
"53": "NON_PARTICIPATING",
"54": "NOT_ALIVE",
"55": "NON_PARTICIPATING",
"56": "NOT_ALIVE",
"57": "NON_PARTICIPATING",
"58": "NOT_ALIVE",
"59": "NON_PARTICIPATING",
"6": "NOT_ALIVE",
"60": "NOT_ALIVE",
"61": "NON_PARTICIPATING",
"62": "NOT_ALIVE",
"63": "FAIL",
"64": "NOT_ALIVE",
"65": "NON_PARTICIPATING",
"66": "NON_PARTICIPATING",
"67": "NON_PARTICIPATING",
"68": "NOT_ALIVE",
"69": "NOT_ALIVE",
"7": "NOT_ALIVE",
"70": "NOT_ALIVE",
"71": "NON_PARTICIPATING",
"72": "NOT_ALIVE",
"73": "NOT_ALIVE",
"74": "NOT_ALIVE",
"75": "NON_PARTICIPATING",
"76": "NOT_ALIVE",
"77": "NOT_ALIVE",
"78": "NON_PARTICIPATING",
"79": "NOT_ALIVE",
"8": "NOT_ALIVE",
"80": "SUCCESS",
"81": "NON_PARTICIPATING",
"82": "NOT_ALIVE",
"83": "FAIL",
"84": "NOT_ALIVE",
"85": "NOT_ALIVE",
"86": "NOT_ALIVE",
"87": "NOT_ALIVE",
"88": "NON_PARTICIPATING",
"89": "NOT_ALIVE",
"9": "NOT_ALIVE",
"90": "NOT_ALIVE",
"91": "NOT_ALIVE",
"92": "NOT_ALIVE",
"93": "NON_PARTICIPATING",
"94": "NON_PARTICIPATING",
"95": "NOT_ALIVE",
"96": "NOT_ALIVE",
"97": "NON_PARTICIPATING",
"98": "NON_PARTICIPATING",
"99": "SUCCESS"
},
"architectures": [
"LlamaForCausalLM"
],
"attention_bias": false,
"attention_dropout": 0.0,
"block_list": [
6140875,
6140889
],
"bos_token_id": 1,
"eos_token_id": 2,
"hidden_act": "silu",
"hidden_size": 2048,
"initializer_range": 0.02,
"inner_step": 117,
"intermediate_size": 5632,
"last_allreduce_block": 6140120,
"max_position_embeddings": 2048,
"mlp_bias": false,
"model_type": "llama",
"num_attention_heads": 32,
"num_hidden_layers": 22,
"num_key_value_heads": 4,
"pretraining_tp": 1,
"rms_norm_eps": 1e-05,
"rope_scaling": null,
"rope_theta": 10000.0,
"tie_word_embeddings": false,
"torch_dtype": "float32",
"transformers_version": "4.39.3",
"use_cache": false,
"vocab_size": 32000
}
|