File size: 7,752 Bytes
525340d cbcf2e3 525340d cbcf2e3 6a78ed2 525340d ecbfbb9 1121183 f93b459 1121183 cbcf2e3 e561b78 3b61827 e561b78 cbcf2e3 d0cde57 20daea4 f93b459 e561b78 0e87ac8 1121183 ecbfbb9 2c2c984 cbcf2e3 2c2c984 117ce68 e561b78 1121183 cbcf2e3 0558cd7 117ce68 525340d ecbfbb9 e561b78 0e87ac8 a1c4112 e561b78 117ce68 e561b78 cbcf2e3 fbd5bc6 117ce68 1121183 cbcf2e3 117ce68 cbcf2e3 e561b78 20daea4 525340d f93b459 ecbfbb9 117ce68 e561b78 e2c9402 1121183 f681d26 20daea4 a1c4112 e561b78 ecbfbb9 578e39d e561b78 f93b459 e561b78 a1c4112 b6c484d 578e39d 2c2c984 525340d e561b78 2c2c984 cbcf2e3 3b61827 525340d a1c4112 f14291b 6a78ed2 f93b459 f681d26 491335c 525340d ecbfbb9 1418c24 9b135ac 1121183 cbcf2e3 525340d 117ce68 e561b78 0e87ac8 f93b459 e561b78 2c2c984 e561b78 f93b459 a1c4112 117ce68 6480b16 ecbfbb9 2c2c984 cf4a545 e561b78 cbcf2e3 117ce68 525340d cbcf2e3 2c2c984 491335c e561b78 117ce68 ecbfbb9 f93b459 a1c4112 117ce68 1121183 e561b78 b12e878 0e87ac8 f93b459 e561b78 9b135ac 525340d ecbfbb9 525340d 1121183 f93b459 2c2c984 9b135ac e561b78 6f7bf24 e351beb b12e878 e561b78 117ce68 e2c9402 0e87ac8 117ce68 e561b78 8e104eb cbcf2e3 2c2c984 e351beb 2c2c984 117ce68 a1c4112 117ce68 20daea4 ecbfbb9 578e39d e561b78 e2c9402 f93b459 e2c9402 b12e878 1121183 0e87ac8 e561b78 ecbfbb9 e561b78 525340d e2c9402 e561b78 cbcf2e3 525340d e561b78 ecbfbb9 117ce68 1121183 f14291b f93b459 491335c 117ce68 e561b78 f93b459 ecbfbb9 cbcf2e3 fbd5bc6 fcf80cc a1c4112 e561b78 ecbfbb9 9d76d54 1121183 cbcf2e3 0e87ac8 117ce68 b12e878 2c2c984 a1c4112 3b61827 e2c9402 b12e878 e561b78 e2c9402 f93b459 cbcf2e3 e561b78 1121183 ecbfbb9 1121183 e561b78 1121183 6a78ed2 a1c4112 cbcf2e3 e351beb a1c4112 cbcf2e3 117ce68 ecbfbb9 e561b78 525340d cbcf2e3 1121183 e561b78 0ffd0ce e561b78 3b61827 e561b78 cbcf2e3 1121183 525340d 2a3c26a 525340d 2a3c26a 525340d e561b78 525340d |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 |
{
"_name_or_path": "distributed/llama-1b",
"all_reduce_scores": {
"0": "NOT_ALIVE",
"1": "NON_PARTICIPATING",
"10": "NOT_ALIVE",
"100": "NOT_ALIVE",
"101": "NOT_ALIVE",
"102": "NON_PARTICIPATING",
"103": "NON_PARTICIPATING",
"104": "NOT_ALIVE",
"105": "NON_PARTICIPATING",
"106": "NON_PARTICIPATING",
"107": "NOT_ALIVE",
"108": "SUCCESS",
"109": "NON_PARTICIPATING",
"11": "NOT_ALIVE",
"110": "NOT_ALIVE",
"111": "NON_PARTICIPATING",
"112": "SUCCESS",
"113": "NON_PARTICIPATING",
"114": "NOT_ALIVE",
"115": "NON_PARTICIPATING",
"116": "NOT_ALIVE",
"117": "NOT_ALIVE",
"118": "NOT_ALIVE",
"119": "NON_PARTICIPATING",
"12": "NOT_ALIVE",
"120": "NON_PARTICIPATING",
"121": "NON_PARTICIPATING",
"122": "NON_PARTICIPATING",
"123": "NON_PARTICIPATING",
"124": "NON_PARTICIPATING",
"125": "NON_PARTICIPATING",
"126": "NOT_ALIVE",
"127": "NOT_ALIVE",
"128": "NON_PARTICIPATING",
"129": "NON_PARTICIPATING",
"13": "NOT_ALIVE",
"130": "NON_PARTICIPATING",
"131": "NOT_ALIVE",
"132": "NON_PARTICIPATING",
"133": "NON_PARTICIPATING",
"134": "NON_PARTICIPATING",
"135": "NON_PARTICIPATING",
"136": "NON_PARTICIPATING",
"137": "NOT_ALIVE",
"138": "NON_PARTICIPATING",
"139": "NOT_ALIVE",
"14": "SUCCESS",
"140": "NON_PARTICIPATING",
"141": "NOT_ALIVE",
"142": "NOT_ALIVE",
"143": "NON_PARTICIPATING",
"144": "NOT_ALIVE",
"145": "NON_PARTICIPATING",
"146": "NOT_ALIVE",
"147": "NON_PARTICIPATING",
"148": "NOT_ALIVE",
"149": "NON_PARTICIPATING",
"15": "NON_PARTICIPATING",
"150": "NOT_ALIVE",
"151": "NOT_ALIVE",
"152": "NON_PARTICIPATING",
"153": "NOT_ALIVE",
"154": "NON_PARTICIPATING",
"155": "NON_PARTICIPATING",
"156": "NOT_ALIVE",
"157": "NOT_ALIVE",
"158": "NOT_ALIVE",
"159": "NOT_ALIVE",
"16": "NON_PARTICIPATING",
"160": "NON_PARTICIPATING",
"161": "NOT_ALIVE",
"162": "NON_PARTICIPATING",
"163": "NOT_ALIVE",
"164": "NOT_ALIVE",
"165": "NOT_ALIVE",
"166": "NON_PARTICIPATING",
"167": "NOT_ALIVE",
"168": "NON_PARTICIPATING",
"169": "NOT_ALIVE",
"17": "NOT_ALIVE",
"170": "NOT_ALIVE",
"171": "NOT_ALIVE",
"172": "NON_PARTICIPATING",
"173": "NON_PARTICIPATING",
"174": "NON_PARTICIPATING",
"175": "NOT_ALIVE",
"176": "NOT_ALIVE",
"177": "NOT_ALIVE",
"178": "NOT_ALIVE",
"179": "NOT_ALIVE",
"18": "NON_PARTICIPATING",
"180": "NOT_ALIVE",
"181": "NOT_ALIVE",
"182": "NOT_ALIVE",
"183": "SUCCESS",
"184": "NON_PARTICIPATING",
"185": "NOT_ALIVE",
"186": "NOT_ALIVE",
"187": "NON_PARTICIPATING",
"188": "NON_PARTICIPATING",
"189": "NOT_ALIVE",
"19": "NON_PARTICIPATING",
"190": "NON_PARTICIPATING",
"191": "NON_PARTICIPATING",
"192": "NON_PARTICIPATING",
"193": "NOT_ALIVE",
"194": "NON_PARTICIPATING",
"195": "NOT_ALIVE",
"196": "NON_PARTICIPATING",
"197": "NOT_ALIVE",
"198": "NOT_ALIVE",
"199": "NON_PARTICIPATING",
"2": "NON_PARTICIPATING",
"20": "NOT_ALIVE",
"200": "NOT_ALIVE",
"201": "NOT_ALIVE",
"202": "NON_PARTICIPATING",
"203": "NOT_ALIVE",
"204": "NOT_ALIVE",
"205": "NON_PARTICIPATING",
"206": "NON_PARTICIPATING",
"207": "NOT_ALIVE",
"208": "NON_PARTICIPATING",
"209": "NOT_ALIVE",
"21": "NOT_ALIVE",
"210": "NON_PARTICIPATING",
"211": "NON_PARTICIPATING",
"212": "SUCCESS",
"213": "NON_PARTICIPATING",
"214": "NON_PARTICIPATING",
"215": "SUCCESS",
"216": "NOT_ALIVE",
"217": "NOT_ALIVE",
"218": "NOT_ALIVE",
"219": "NOT_ALIVE",
"22": "NON_PARTICIPATING",
"220": "NON_PARTICIPATING",
"221": "NOT_ALIVE",
"222": "NOT_ALIVE",
"223": "NOT_ALIVE",
"224": "NOT_ALIVE",
"225": "NON_PARTICIPATING",
"226": "NOT_ALIVE",
"227": "NOT_ALIVE",
"228": "NOT_ALIVE",
"229": "NON_PARTICIPATING",
"23": "NON_PARTICIPATING",
"230": "NON_PARTICIPATING",
"231": "SUCCESS",
"232": "NOT_ALIVE",
"233": "NOT_ALIVE",
"234": "NOT_ALIVE",
"235": "NON_PARTICIPATING",
"236": "NOT_ALIVE",
"237": "NON_PARTICIPATING",
"238": "NON_PARTICIPATING",
"239": "NOT_ALIVE",
"24": "NOT_ALIVE",
"240": "NON_PARTICIPATING",
"241": "SUCCESS",
"242": "NON_PARTICIPATING",
"243": "NON_PARTICIPATING",
"244": "NOT_ALIVE",
"245": "NON_PARTICIPATING",
"246": "NOT_ALIVE",
"247": "NON_PARTICIPATING",
"248": "NON_PARTICIPATING",
"249": "NON_PARTICIPATING",
"25": "SUCCESS",
"250": "SUCCESS",
"251": "NOT_ALIVE",
"252": "NOT_ALIVE",
"253": "NOT_ALIVE",
"254": "NON_PARTICIPATING",
"255": "NOT_ALIVE",
"26": "NON_PARTICIPATING",
"27": "NOT_ALIVE",
"28": "NOT_ALIVE",
"29": "NON_PARTICIPATING",
"3": "NON_PARTICIPATING",
"30": "NOT_ALIVE",
"31": "NON_PARTICIPATING",
"32": "NON_PARTICIPATING",
"33": "NOT_ALIVE",
"34": "NOT_ALIVE",
"35": "NON_PARTICIPATING",
"36": "NON_PARTICIPATING",
"37": "NOT_ALIVE",
"38": "NON_PARTICIPATING",
"39": "SUCCESS",
"4": "NOT_ALIVE",
"40": "NON_PARTICIPATING",
"41": "NON_PARTICIPATING",
"42": "NOT_ALIVE",
"43": "NOT_ALIVE",
"44": "NOT_ALIVE",
"45": "NOT_ALIVE",
"46": "NOT_ALIVE",
"47": "SUCCESS",
"48": "NON_PARTICIPATING",
"49": "NON_PARTICIPATING",
"5": "NON_PARTICIPATING",
"50": "NOT_ALIVE",
"51": "NOT_ALIVE",
"52": "SUCCESS",
"53": "NON_PARTICIPATING",
"54": "NOT_ALIVE",
"55": "NOT_ALIVE",
"56": "NON_PARTICIPATING",
"57": "NOT_ALIVE",
"58": "NON_PARTICIPATING",
"59": "NON_PARTICIPATING",
"6": "NON_PARTICIPATING",
"60": "NOT_ALIVE",
"61": "NON_PARTICIPATING",
"62": "NON_PARTICIPATING",
"63": "SUCCESS",
"64": "NOT_ALIVE",
"65": "NON_PARTICIPATING",
"66": "NON_PARTICIPATING",
"67": "NOT_ALIVE",
"68": "NOT_ALIVE",
"69": "NOT_ALIVE",
"7": "NOT_ALIVE",
"70": "NOT_ALIVE",
"71": "NON_PARTICIPATING",
"72": "NON_PARTICIPATING",
"73": "NOT_ALIVE",
"74": "NOT_ALIVE",
"75": "NON_PARTICIPATING",
"76": "NOT_ALIVE",
"77": "SUCCESS",
"78": "NON_PARTICIPATING",
"79": "NON_PARTICIPATING",
"8": "NOT_ALIVE",
"80": "NOT_ALIVE",
"81": "NON_PARTICIPATING",
"82": "NON_PARTICIPATING",
"83": "NON_PARTICIPATING",
"84": "NON_PARTICIPATING",
"85": "NON_PARTICIPATING",
"86": "NON_PARTICIPATING",
"87": "NOT_ALIVE",
"88": "NON_PARTICIPATING",
"89": "NOT_ALIVE",
"9": "NON_PARTICIPATING",
"90": "NOT_ALIVE",
"91": "NOT_ALIVE",
"92": "SUCCESS",
"93": "NOT_ALIVE",
"94": "SUCCESS",
"95": "NOT_ALIVE",
"96": "NOT_ALIVE",
"97": "NON_PARTICIPATING",
"98": "NOT_ALIVE",
"99": "NOT_ALIVE"
},
"architectures": [
"LlamaForCausalLM"
],
"attention_bias": false,
"attention_dropout": 0.0,
"block_list": [
6018914,
6018944
],
"bos_token_id": 1,
"eos_token_id": 2,
"hidden_act": "silu",
"hidden_size": 2048,
"initializer_range": 0.02,
"inner_step": 46,
"intermediate_size": 5632,
"last_allreduce_block": 6016469,
"max_position_embeddings": 2048,
"mlp_bias": false,
"model_type": "llama",
"num_attention_heads": 32,
"num_hidden_layers": 22,
"num_key_value_heads": 4,
"pretraining_tp": 1,
"rms_norm_eps": 1e-05,
"rope_scaling": null,
"rope_theta": 10000.0,
"tie_word_embeddings": false,
"torch_dtype": "float32",
"transformers_version": "4.39.3",
"use_cache": false,
"vocab_size": 32000
}
|