File size: 7,482 Bytes
c10913b e64624e c10913b e64624e 79a8068 c10913b 2115498 fec4854 60947ff fec4854 2115498 c1ccecd 17a6cff e64624e c1ccecd 508359a e64624e 2115498 d52deb4 8b84f67 2115498 e64624e 2115498 fec4854 2115498 e64624e 2115498 c1ccecd 2115498 8c83a4e c1ccecd e64624e a2f59e0 e64624e c10913b e9d992d c877292 2115498 e64624e 4868de8 2115498 c1ccecd e64624e 2115498 6610819 e64624e 8b84f67 2115498 fec4854 2115498 c877292 e64624e c1ccecd e64624e c10913b 3f57e04 c1ccecd e64624e a2f59e0 e9d992d fec4854 1d64701 e64624e 8c83a4e 2115498 d52deb4 e64624e 863e5c9 c1ccecd 732bb9b 8c83a4e 2115498 34a4f02 5566e9d 2115498 17a6cff c10913b 00fc568 60947ff 79a8068 8c83a4e 1d64701 c19416a 069c347 2115498 8b84f67 2eb5593 fec4854 e64624e 2115498 c10913b 2115498 c1ccecd 42bc00c e64624e 5566e9d e64624e 2115498 863e5c9 c1ccecd 2115498 2eb5593 28c6dbb e64624e aa63d04 2115498 e64624e c877292 c10913b e64624e 53f58f8 c19416a e64624e 2115498 e64624e fec4854 2115498 53f58f8 2115498 e64624e 00fc568 2eb5593 c10913b 415e586 a930bf4 fec4854 b43c15f e64624e 2eb5593 2115498 581f0e4 ed147bd 1ffca14 53f58f8 1d64701 00fc568 c877292 8c83a4e e9d992d 2115498 5566e9d e64624e 2115498 3d04152 2115498 e64624e 8b84f67 e64624e 8b84f67 c1ccecd e64624e 8c83a4e 2115498 e9d992d 2115498 e9d992d 53f58f8 d52deb4 2115498 e64624e d52deb4 c10913b e9d992d c877292 e64624e 069c347 e64624e d52deb4 5566e9d 2115498 e64624e 7c7e5cf 60947ff 2115498 ed147bd c19416a d52deb4 c877292 2115498 e64624e 53f58f8 60947ff 2115498 e64624e 4868de8 8e2b160 e64624e 8326b15 c877292 8b84f67 c1ccecd 5566e9d 2115498 53f58f8 e64624e 79a8068 17a6cff e9d992d 53f58f8 2115498 e9d992d 2115498 e64624e 8b84f67 e64624e c1ccecd 2115498 79a8068 c1ccecd 79a8068 2115498 1ffca14 2115498 e64624e c877292 e64624e d52deb4 a930bf4 e64624e 5566e9d 6610819 d52deb4 b43c15f c1ccecd 17a6cff 2115498 e64624e 863e5c9 069c347 c10913b 68213f0 c10913b 68213f0 c10913b 2115498 c10913b |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 |
{
"_name_or_path": "distributed/llama-1b",
"all_reduce_scores": {
"0": "NOT_ALIVE",
"1": "NOT_ALIVE",
"10": "NOT_ALIVE",
"100": "NOT_ALIVE",
"101": "NON_PARTICIPATING",
"102": "NON_PARTICIPATING",
"103": "NON_PARTICIPATING",
"104": "NOT_ALIVE",
"105": "NOT_ALIVE",
"106": "NOT_ALIVE",
"107": "NOT_ALIVE",
"108": "NON_PARTICIPATING",
"109": "NOT_ALIVE",
"11": "NOT_ALIVE",
"110": "NOT_ALIVE",
"111": "NOT_ALIVE",
"112": "NON_PARTICIPATING",
"113": "SUCCESS",
"114": "NON_PARTICIPATING",
"115": "NOT_ALIVE",
"116": "NON_PARTICIPATING",
"117": "SUCCESS",
"118": "NOT_ALIVE",
"119": "NON_PARTICIPATING",
"12": "NOT_ALIVE",
"120": "NON_PARTICIPATING",
"121": "NOT_ALIVE",
"122": "NOT_ALIVE",
"123": "NOT_ALIVE",
"124": "SUCCESS",
"125": "NON_PARTICIPATING",
"126": "NON_PARTICIPATING",
"127": "NOT_ALIVE",
"128": "NON_PARTICIPATING",
"129": "NOT_ALIVE",
"13": "NOT_ALIVE",
"130": "NOT_ALIVE",
"131": "NOT_ALIVE",
"132": "NOT_ALIVE",
"133": "NON_PARTICIPATING",
"134": "NON_PARTICIPATING",
"135": "NON_PARTICIPATING",
"136": "NON_PARTICIPATING",
"137": "NON_PARTICIPATING",
"138": "SUCCESS",
"139": "NON_PARTICIPATING",
"14": "SUCCESS",
"140": "NOT_ALIVE",
"141": "NOT_ALIVE",
"142": "NON_PARTICIPATING",
"143": "NOT_ALIVE",
"144": "NOT_ALIVE",
"145": "NOT_ALIVE",
"146": "NOT_ALIVE",
"147": "NOT_ALIVE",
"148": "SUCCESS",
"149": "NOT_ALIVE",
"15": "SUCCESS",
"150": "NOT_ALIVE",
"151": "NOT_ALIVE",
"152": "NOT_ALIVE",
"153": "NON_PARTICIPATING",
"154": "SUCCESS",
"155": "NOT_ALIVE",
"156": "NOT_ALIVE",
"157": "NOT_ALIVE",
"158": "NOT_ALIVE",
"159": "NOT_ALIVE",
"16": "NON_PARTICIPATING",
"160": "NOT_ALIVE",
"161": "NON_PARTICIPATING",
"162": "NON_PARTICIPATING",
"163": "NOT_ALIVE",
"164": "SUCCESS",
"165": "SUCCESS",
"166": "NOT_ALIVE",
"167": "NON_PARTICIPATING",
"168": "SUCCESS",
"169": "NOT_ALIVE",
"17": "NOT_ALIVE",
"170": "NOT_ALIVE",
"171": "NOT_ALIVE",
"172": "NON_PARTICIPATING",
"173": "NON_PARTICIPATING",
"174": "NOT_ALIVE",
"175": "NOT_ALIVE",
"176": "NOT_ALIVE",
"177": "NOT_ALIVE",
"178": "NOT_ALIVE",
"179": "NOT_ALIVE",
"18": "NOT_ALIVE",
"180": "NOT_ALIVE",
"181": "NOT_ALIVE",
"182": "NOT_ALIVE",
"183": "NON_PARTICIPATING",
"184": "NON_PARTICIPATING",
"185": "NOT_ALIVE",
"186": "NOT_ALIVE",
"187": "NOT_ALIVE",
"188": "NOT_ALIVE",
"189": "NOT_ALIVE",
"19": "NON_PARTICIPATING",
"190": "NON_PARTICIPATING",
"191": "NON_PARTICIPATING",
"192": "NOT_ALIVE",
"193": "NOT_ALIVE",
"194": "NON_PARTICIPATING",
"195": "NON_PARTICIPATING",
"196": "NON_PARTICIPATING",
"197": "NOT_ALIVE",
"198": "NON_PARTICIPATING",
"199": "NON_PARTICIPATING",
"2": "NON_PARTICIPATING",
"20": "NOT_ALIVE",
"200": "NOT_ALIVE",
"201": "NON_PARTICIPATING",
"202": "NOT_ALIVE",
"203": "NOT_ALIVE",
"204": "NON_PARTICIPATING",
"205": "NOT_ALIVE",
"206": "SUCCESS",
"207": "NOT_ALIVE",
"208": "NOT_ALIVE",
"209": "NOT_ALIVE",
"21": "NOT_ALIVE",
"210": "NOT_ALIVE",
"211": "NOT_ALIVE",
"212": "SUCCESS",
"213": "SUCCESS",
"214": "NOT_ALIVE",
"215": "SUCCESS",
"216": "NOT_ALIVE",
"217": "NON_PARTICIPATING",
"218": "NON_PARTICIPATING",
"219": "NOT_ALIVE",
"22": "NON_PARTICIPATING",
"220": "NOT_ALIVE",
"221": "NOT_ALIVE",
"222": "NOT_ALIVE",
"223": "NOT_ALIVE",
"224": "NOT_ALIVE",
"225": "NOT_ALIVE",
"226": "NOT_ALIVE",
"227": "NOT_ALIVE",
"228": "NON_PARTICIPATING",
"229": "NON_PARTICIPATING",
"23": "NON_PARTICIPATING",
"230": "NOT_ALIVE",
"231": "NOT_ALIVE",
"232": "NOT_ALIVE",
"233": "NOT_ALIVE",
"234": "NOT_ALIVE",
"235": "NON_PARTICIPATING",
"236": "NOT_ALIVE",
"237": "NON_PARTICIPATING",
"238": "NON_PARTICIPATING",
"239": "NOT_ALIVE",
"24": "NOT_ALIVE",
"240": "NON_PARTICIPATING",
"241": "NON_PARTICIPATING",
"242": "NOT_ALIVE",
"243": "NOT_ALIVE",
"244": "NOT_ALIVE",
"245": "NOT_ALIVE",
"246": "NON_PARTICIPATING",
"247": "NON_PARTICIPATING",
"248": "NOT_ALIVE",
"249": "NOT_ALIVE",
"25": "SUCCESS",
"250": "NON_PARTICIPATING",
"251": "NOT_ALIVE",
"252": "NON_PARTICIPATING",
"253": "NOT_ALIVE",
"254": "NON_PARTICIPATING",
"255": "NOT_ALIVE",
"26": "NOT_ALIVE",
"27": "NOT_ALIVE",
"28": "NOT_ALIVE",
"29": "NON_PARTICIPATING",
"3": "NON_PARTICIPATING",
"30": "NON_PARTICIPATING",
"31": "NON_PARTICIPATING",
"32": "SUCCESS",
"33": "NOT_ALIVE",
"34": "NOT_ALIVE",
"35": "NON_PARTICIPATING",
"36": "NOT_ALIVE",
"37": "NOT_ALIVE",
"38": "NON_PARTICIPATING",
"39": "SUCCESS",
"4": "NON_PARTICIPATING",
"40": "NON_PARTICIPATING",
"41": "NOT_ALIVE",
"42": "NOT_ALIVE",
"43": "NOT_ALIVE",
"44": "NOT_ALIVE",
"45": "NOT_ALIVE",
"46": "NOT_ALIVE",
"47": "NON_PARTICIPATING",
"48": "NON_PARTICIPATING",
"49": "NOT_ALIVE",
"5": "SUCCESS",
"50": "NOT_ALIVE",
"51": "NOT_ALIVE",
"52": "SUCCESS",
"53": "NOT_ALIVE",
"54": "NOT_ALIVE",
"55": "NOT_ALIVE",
"56": "NOT_ALIVE",
"57": "NON_PARTICIPATING",
"58": "NON_PARTICIPATING",
"59": "NON_PARTICIPATING",
"6": "NON_PARTICIPATING",
"60": "NOT_ALIVE",
"61": "NOT_ALIVE",
"62": "NON_PARTICIPATING",
"63": "NON_PARTICIPATING",
"64": "NOT_ALIVE",
"65": "NOT_ALIVE",
"66": "NOT_ALIVE",
"67": "NOT_ALIVE",
"68": "NOT_ALIVE",
"69": "NOT_ALIVE",
"7": "NON_PARTICIPATING",
"70": "NOT_ALIVE",
"71": "NON_PARTICIPATING",
"72": "NOT_ALIVE",
"73": "NOT_ALIVE",
"74": "NOT_ALIVE",
"75": "NON_PARTICIPATING",
"76": "NOT_ALIVE",
"77": "NON_PARTICIPATING",
"78": "NOT_ALIVE",
"79": "NON_PARTICIPATING",
"8": "NOT_ALIVE",
"80": "NOT_ALIVE",
"81": "NOT_ALIVE",
"82": "NON_PARTICIPATING",
"83": "NON_PARTICIPATING",
"84": "NOT_ALIVE",
"85": "NOT_ALIVE",
"86": "NON_PARTICIPATING",
"87": "NOT_ALIVE",
"88": "NOT_ALIVE",
"89": "NOT_ALIVE",
"9": "NOT_ALIVE",
"90": "NOT_ALIVE",
"91": "NOT_ALIVE",
"92": "NON_PARTICIPATING",
"93": "NOT_ALIVE",
"94": "NON_PARTICIPATING",
"95": "NOT_ALIVE",
"96": "NON_PARTICIPATING",
"97": "NOT_ALIVE",
"98": "NOT_ALIVE",
"99": "NOT_ALIVE"
},
"architectures": [
"LlamaForCausalLM"
],
"attention_bias": false,
"attention_dropout": 0.0,
"block_list": [
6007438,
6007476
],
"bos_token_id": 1,
"eos_token_id": 2,
"hidden_act": "silu",
"hidden_size": 2048,
"initializer_range": 0.02,
"inner_step": 25,
"intermediate_size": 5632,
"last_allreduce_block": 6005880,
"max_position_embeddings": 2048,
"mlp_bias": false,
"model_type": "llama",
"num_attention_heads": 32,
"num_hidden_layers": 22,
"num_key_value_heads": 4,
"pretraining_tp": 1,
"rms_norm_eps": 1e-05,
"rope_scaling": null,
"rope_theta": 10000.0,
"tie_word_embeddings": false,
"torch_dtype": "float32",
"transformers_version": "4.39.3",
"use_cache": false,
"vocab_size": 32000
}
|