File size: 7,752 Bytes
bb504cf 9ac2748 bb504cf 9ac2748 e0f94d3 bb504cf 33b55ea 13515ac 90ecc4e 13515ac 9ac2748 bdf8249 b512030 bdf8249 9ac2748 05c4feb e9149c5 90ecc4e bdf8249 ccb0cae 13515ac 33b55ea 9093afa 9ac2748 9093afa 1d62cf3 bdf8249 bad5aa7 9ac2748 e0f94d3 1d62cf3 bb504cf 33b55ea bdf8249 ccb0cae 4980e5b bdf8249 1d62cf3 bdf8249 9ac2748 9d38c9a 1d62cf3 13515ac 9ac2748 1d62cf3 9ac2748 bdf8249 e9149c5 bb504cf 90ecc4e 33b55ea 1d62cf3 bdf8249 36fb06b 13515ac 1d6a33b e9149c5 4980e5b bdf8249 33b55ea e0f94d3 bdf8249 90ecc4e bdf8249 4980e5b 558d678 e0f94d3 9093afa bb504cf bdf8249 9093afa 9ac2748 b512030 bb504cf 4980e5b a3f652f e0f94d3 90ecc4e 1d6a33b 97bb66c ef9f890 33b55ea 9d38c9a 7269158 13515ac 9ac2748 bb504cf 1d62cf3 bdf8249 ccb0cae 90ecc4e bdf8249 9093afa bdf8249 90ecc4e 4980e5b 1d62cf3 558d678 33b55ea 9093afa 60011b4 bdf8249 9ac2748 1d62cf3 bb504cf 9ac2748 9093afa 97bb66c bdf8249 1d62cf3 33b55ea 90ecc4e 4980e5b 1d62cf3 13515ac bdf8249 973ac99 ccb0cae 90ecc4e bdf8249 7269158 bb504cf 33b55ea bb504cf 13515ac 90ecc4e 9093afa 7269158 bdf8249 bc779b1 a13d4a1 973ac99 bdf8249 1d62cf3 36fb06b ccb0cae 1d62cf3 bdf8249 05c4feb 9ac2748 9093afa 9d38c9a 9093afa 1d62cf3 4980e5b 1d62cf3 e9149c5 33b55ea e0f94d3 bdf8249 36fb06b 90ecc4e 36fb06b 973ac99 43ef8f2 ccb0cae bdf8249 33b55ea bdf8249 bb504cf 36fb06b bdf8249 9ac2748 ef9f890 bdf8249 33b55ea 1d62cf3 7cd6bf1 a3f652f 90ecc4e 97bb66c 1d62cf3 bdf8249 90ecc4e 33b55ea 9ac2748 e045c00 fc47272 4980e5b bdf8249 33b55ea bad5aa7 f8ac605 9ac2748 ccb0cae 1d62cf3 973ac99 9093afa 4980e5b b512030 36fb06b 973ac99 bdf8249 36fb06b 90ecc4e 9ac2748 bdf8249 9d38c9a 33b55ea bad5aa7 bdf8249 bad5aa7 e0f94d3 4980e5b 9ac2748 a13d4a1 4980e5b 9ac2748 1d62cf3 33b55ea bdf8249 dd6e298 9ac2748 f8ac605 bdf8249 abbf40d bdf8249 b512030 bdf8249 9ac2748 48cf558 ef9f890 bb504cf 62a5cb9 bb504cf 62a5cb9 bb504cf bdf8249 bb504cf |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 |
{
"_name_or_path": "distributed/llama-1b",
"all_reduce_scores": {
"0": "NOT_ALIVE",
"1": "NON_PARTICIPATING",
"10": "NOT_ALIVE",
"100": "NOT_ALIVE",
"101": "NOT_ALIVE",
"102": "NON_PARTICIPATING",
"103": "NON_PARTICIPATING",
"104": "NOT_ALIVE",
"105": "NON_PARTICIPATING",
"106": "NON_PARTICIPATING",
"107": "NOT_ALIVE",
"108": "SUCCESS",
"109": "NON_PARTICIPATING",
"11": "NOT_ALIVE",
"110": "NOT_ALIVE",
"111": "NON_PARTICIPATING",
"112": "SUCCESS",
"113": "NON_PARTICIPATING",
"114": "NOT_ALIVE",
"115": "NON_PARTICIPATING",
"116": "NOT_ALIVE",
"117": "NOT_ALIVE",
"118": "NOT_ALIVE",
"119": "NON_PARTICIPATING",
"12": "NOT_ALIVE",
"120": "NON_PARTICIPATING",
"121": "NON_PARTICIPATING",
"122": "NON_PARTICIPATING",
"123": "NON_PARTICIPATING",
"124": "NON_PARTICIPATING",
"125": "NON_PARTICIPATING",
"126": "NOT_ALIVE",
"127": "NOT_ALIVE",
"128": "NON_PARTICIPATING",
"129": "NON_PARTICIPATING",
"13": "NOT_ALIVE",
"130": "NON_PARTICIPATING",
"131": "NOT_ALIVE",
"132": "NON_PARTICIPATING",
"133": "NON_PARTICIPATING",
"134": "NON_PARTICIPATING",
"135": "NON_PARTICIPATING",
"136": "NON_PARTICIPATING",
"137": "NOT_ALIVE",
"138": "NON_PARTICIPATING",
"139": "NOT_ALIVE",
"14": "SUCCESS",
"140": "NON_PARTICIPATING",
"141": "NOT_ALIVE",
"142": "NOT_ALIVE",
"143": "NON_PARTICIPATING",
"144": "NOT_ALIVE",
"145": "NON_PARTICIPATING",
"146": "NOT_ALIVE",
"147": "NON_PARTICIPATING",
"148": "NOT_ALIVE",
"149": "NON_PARTICIPATING",
"15": "NON_PARTICIPATING",
"150": "NOT_ALIVE",
"151": "NOT_ALIVE",
"152": "NON_PARTICIPATING",
"153": "NOT_ALIVE",
"154": "NON_PARTICIPATING",
"155": "NON_PARTICIPATING",
"156": "NOT_ALIVE",
"157": "NOT_ALIVE",
"158": "NOT_ALIVE",
"159": "NOT_ALIVE",
"16": "NON_PARTICIPATING",
"160": "NON_PARTICIPATING",
"161": "NOT_ALIVE",
"162": "NON_PARTICIPATING",
"163": "NOT_ALIVE",
"164": "NOT_ALIVE",
"165": "NOT_ALIVE",
"166": "NON_PARTICIPATING",
"167": "NOT_ALIVE",
"168": "NON_PARTICIPATING",
"169": "NOT_ALIVE",
"17": "NOT_ALIVE",
"170": "NOT_ALIVE",
"171": "NOT_ALIVE",
"172": "NON_PARTICIPATING",
"173": "NON_PARTICIPATING",
"174": "NON_PARTICIPATING",
"175": "NOT_ALIVE",
"176": "NOT_ALIVE",
"177": "NOT_ALIVE",
"178": "NOT_ALIVE",
"179": "NOT_ALIVE",
"18": "NON_PARTICIPATING",
"180": "NOT_ALIVE",
"181": "NOT_ALIVE",
"182": "NOT_ALIVE",
"183": "SUCCESS",
"184": "NON_PARTICIPATING",
"185": "NOT_ALIVE",
"186": "NOT_ALIVE",
"187": "NON_PARTICIPATING",
"188": "NON_PARTICIPATING",
"189": "NOT_ALIVE",
"19": "NON_PARTICIPATING",
"190": "NON_PARTICIPATING",
"191": "NON_PARTICIPATING",
"192": "NON_PARTICIPATING",
"193": "NOT_ALIVE",
"194": "NON_PARTICIPATING",
"195": "NOT_ALIVE",
"196": "NON_PARTICIPATING",
"197": "NOT_ALIVE",
"198": "NOT_ALIVE",
"199": "NON_PARTICIPATING",
"2": "NON_PARTICIPATING",
"20": "NOT_ALIVE",
"200": "NOT_ALIVE",
"201": "NOT_ALIVE",
"202": "NON_PARTICIPATING",
"203": "NOT_ALIVE",
"204": "NOT_ALIVE",
"205": "NON_PARTICIPATING",
"206": "NON_PARTICIPATING",
"207": "NOT_ALIVE",
"208": "NON_PARTICIPATING",
"209": "NOT_ALIVE",
"21": "NOT_ALIVE",
"210": "NON_PARTICIPATING",
"211": "NON_PARTICIPATING",
"212": "SUCCESS",
"213": "NON_PARTICIPATING",
"214": "NON_PARTICIPATING",
"215": "SUCCESS",
"216": "NOT_ALIVE",
"217": "NOT_ALIVE",
"218": "NOT_ALIVE",
"219": "NOT_ALIVE",
"22": "NON_PARTICIPATING",
"220": "NON_PARTICIPATING",
"221": "NOT_ALIVE",
"222": "NOT_ALIVE",
"223": "NOT_ALIVE",
"224": "NOT_ALIVE",
"225": "NON_PARTICIPATING",
"226": "NOT_ALIVE",
"227": "NOT_ALIVE",
"228": "NOT_ALIVE",
"229": "NON_PARTICIPATING",
"23": "NON_PARTICIPATING",
"230": "NON_PARTICIPATING",
"231": "SUCCESS",
"232": "NOT_ALIVE",
"233": "NOT_ALIVE",
"234": "NOT_ALIVE",
"235": "NON_PARTICIPATING",
"236": "NOT_ALIVE",
"237": "NON_PARTICIPATING",
"238": "NON_PARTICIPATING",
"239": "NOT_ALIVE",
"24": "NOT_ALIVE",
"240": "NON_PARTICIPATING",
"241": "SUCCESS",
"242": "NON_PARTICIPATING",
"243": "NON_PARTICIPATING",
"244": "NOT_ALIVE",
"245": "NON_PARTICIPATING",
"246": "NOT_ALIVE",
"247": "NON_PARTICIPATING",
"248": "NON_PARTICIPATING",
"249": "NON_PARTICIPATING",
"25": "SUCCESS",
"250": "SUCCESS",
"251": "NOT_ALIVE",
"252": "NOT_ALIVE",
"253": "NOT_ALIVE",
"254": "NON_PARTICIPATING",
"255": "NOT_ALIVE",
"26": "NON_PARTICIPATING",
"27": "NOT_ALIVE",
"28": "NOT_ALIVE",
"29": "NON_PARTICIPATING",
"3": "NON_PARTICIPATING",
"30": "NOT_ALIVE",
"31": "NON_PARTICIPATING",
"32": "NON_PARTICIPATING",
"33": "NOT_ALIVE",
"34": "NOT_ALIVE",
"35": "NON_PARTICIPATING",
"36": "NON_PARTICIPATING",
"37": "NOT_ALIVE",
"38": "NON_PARTICIPATING",
"39": "SUCCESS",
"4": "NOT_ALIVE",
"40": "NON_PARTICIPATING",
"41": "NON_PARTICIPATING",
"42": "NOT_ALIVE",
"43": "NOT_ALIVE",
"44": "NOT_ALIVE",
"45": "NOT_ALIVE",
"46": "NOT_ALIVE",
"47": "SUCCESS",
"48": "NON_PARTICIPATING",
"49": "NON_PARTICIPATING",
"5": "NON_PARTICIPATING",
"50": "NOT_ALIVE",
"51": "NOT_ALIVE",
"52": "SUCCESS",
"53": "NON_PARTICIPATING",
"54": "NOT_ALIVE",
"55": "NOT_ALIVE",
"56": "NON_PARTICIPATING",
"57": "NOT_ALIVE",
"58": "NON_PARTICIPATING",
"59": "NON_PARTICIPATING",
"6": "NON_PARTICIPATING",
"60": "NOT_ALIVE",
"61": "NON_PARTICIPATING",
"62": "NON_PARTICIPATING",
"63": "SUCCESS",
"64": "NOT_ALIVE",
"65": "NON_PARTICIPATING",
"66": "NON_PARTICIPATING",
"67": "NOT_ALIVE",
"68": "NOT_ALIVE",
"69": "NOT_ALIVE",
"7": "NOT_ALIVE",
"70": "NOT_ALIVE",
"71": "NON_PARTICIPATING",
"72": "NON_PARTICIPATING",
"73": "NOT_ALIVE",
"74": "NOT_ALIVE",
"75": "NON_PARTICIPATING",
"76": "NOT_ALIVE",
"77": "SUCCESS",
"78": "NON_PARTICIPATING",
"79": "NON_PARTICIPATING",
"8": "NOT_ALIVE",
"80": "NOT_ALIVE",
"81": "NON_PARTICIPATING",
"82": "NON_PARTICIPATING",
"83": "NON_PARTICIPATING",
"84": "NON_PARTICIPATING",
"85": "NON_PARTICIPATING",
"86": "NON_PARTICIPATING",
"87": "NOT_ALIVE",
"88": "NON_PARTICIPATING",
"89": "NOT_ALIVE",
"9": "NON_PARTICIPATING",
"90": "NOT_ALIVE",
"91": "NOT_ALIVE",
"92": "SUCCESS",
"93": "NOT_ALIVE",
"94": "SUCCESS",
"95": "NOT_ALIVE",
"96": "NOT_ALIVE",
"97": "NON_PARTICIPATING",
"98": "NOT_ALIVE",
"99": "NOT_ALIVE"
},
"architectures": [
"LlamaForCausalLM"
],
"attention_bias": false,
"attention_dropout": 0.0,
"block_list": [
6018883,
6018915
],
"bos_token_id": 1,
"eos_token_id": 2,
"hidden_act": "silu",
"hidden_size": 2048,
"initializer_range": 0.02,
"inner_step": 36,
"intermediate_size": 5632,
"last_allreduce_block": 6016469,
"max_position_embeddings": 2048,
"mlp_bias": false,
"model_type": "llama",
"num_attention_heads": 32,
"num_hidden_layers": 22,
"num_key_value_heads": 4,
"pretraining_tp": 1,
"rms_norm_eps": 1e-05,
"rope_scaling": null,
"rope_theta": 10000.0,
"tie_word_embeddings": false,
"torch_dtype": "float32",
"transformers_version": "4.39.3",
"use_cache": false,
"vocab_size": 32000
}
|