File size: 7,752 Bytes
dcf0c10 c4a70e5 dcf0c10 e5c561f f57af70 dcf0c10 6be8cc1 9eff8fc 082cfb8 9eff8fc e5c561f 9d0bf17 e12fa68 9d0bf17 e5c561f 68796f8 c4a70e5 082cfb8 9d0bf17 8bd70b2 9eff8fc 6be8cc1 f83567a e5c561f f83567a 11e90e6 9d0bf17 e1e1cb3 e5c561f 7d5892b 11e90e6 dcf0c10 6be8cc1 9d0bf17 8bd70b2 8706d38 9d0bf17 11e90e6 9d0bf17 e5c561f 029307d 11e90e6 9eff8fc e5c561f 11e90e6 e5c561f 9d0bf17 c4a70e5 dcf0c10 082cfb8 6be8cc1 11e90e6 9d0bf17 d1d01b9 9eff8fc 468eba8 c4a70e5 8706d38 9d0bf17 6be8cc1 8095a83 9d0bf17 082cfb8 9d0bf17 8706d38 8f8e1e9 8095a83 f83567a dcf0c10 9d0bf17 f83567a e5c561f e12fa68 dcf0c10 8706d38 ff1a487 f57af70 082cfb8 468eba8 c933e66 345addc 6be8cc1 029307d 198e144 9eff8fc e5c561f dcf0c10 11e90e6 9d0bf17 8bd70b2 082cfb8 9d0bf17 f83567a 9d0bf17 082cfb8 8706d38 11e90e6 73216f8 6be8cc1 f83567a 3a064cf 9d0bf17 e5c561f 11e90e6 dcf0c10 e5c561f f83567a c933e66 9d0bf17 11e90e6 6be8cc1 082cfb8 8706d38 11e90e6 9eff8fc 9d0bf17 182425f 8bd70b2 082cfb8 9d0bf17 198e144 dcf0c10 6be8cc1 dcf0c10 9eff8fc 082cfb8 f83567a 198e144 9d0bf17 d6fb51b 8fcb9dd 182425f 9d0bf17 11e90e6 d1d01b9 8bd70b2 11e90e6 9d0bf17 4c7a983 e5c561f f83567a 029307d f83567a 11e90e6 8706d38 11e90e6 c4a70e5 6be8cc1 8095a83 9d0bf17 d1d01b9 082cfb8 d1d01b9 182425f b1ce618 8bd70b2 9d0bf17 6be8cc1 9d0bf17 dcf0c10 d1d01b9 9d0bf17 e5c561f 345addc 9d0bf17 6be8cc1 11e90e6 e2f5a56 ff1a487 082cfb8 c933e66 11e90e6 9d0bf17 082cfb8 6be8cc1 e5c561f d1f3d6a 4a0ef36 8706d38 9d0bf17 6be8cc1 e1e1cb3 0dc0116 e5c561f 8bd70b2 11e90e6 182425f f83567a 8706d38 e12fa68 d1d01b9 182425f 9d0bf17 d1d01b9 082cfb8 e5c561f 9d0bf17 029307d 6be8cc1 e1e1cb3 9d0bf17 e1e1cb3 f57af70 8706d38 e5c561f 8fcb9dd 8706d38 e5c561f 11e90e6 6be8cc1 9d0bf17 dcf0c10 e5c561f 0dc0116 9d0bf17 06c8cc4 9d0bf17 e12fa68 9d0bf17 e5c561f f1900b8 345addc dcf0c10 9eff8fc bd918a7 9eff8fc dcf0c10 bd918a7 dcf0c10 9d0bf17 dcf0c10 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 |
{
"_name_or_path": "distributed/llama-1b",
"all_reduce_scores": {
"0": "NOT_ALIVE",
"1": "NON_PARTICIPATING",
"10": "NOT_ALIVE",
"100": "NOT_ALIVE",
"101": "NOT_ALIVE",
"102": "NON_PARTICIPATING",
"103": "NON_PARTICIPATING",
"104": "NOT_ALIVE",
"105": "NON_PARTICIPATING",
"106": "NON_PARTICIPATING",
"107": "NOT_ALIVE",
"108": "SUCCESS",
"109": "NON_PARTICIPATING",
"11": "NOT_ALIVE",
"110": "NOT_ALIVE",
"111": "NON_PARTICIPATING",
"112": "SUCCESS",
"113": "NON_PARTICIPATING",
"114": "NOT_ALIVE",
"115": "NON_PARTICIPATING",
"116": "NOT_ALIVE",
"117": "NOT_ALIVE",
"118": "NOT_ALIVE",
"119": "NON_PARTICIPATING",
"12": "NOT_ALIVE",
"120": "NON_PARTICIPATING",
"121": "NON_PARTICIPATING",
"122": "NON_PARTICIPATING",
"123": "NON_PARTICIPATING",
"124": "NON_PARTICIPATING",
"125": "NON_PARTICIPATING",
"126": "NOT_ALIVE",
"127": "NOT_ALIVE",
"128": "NON_PARTICIPATING",
"129": "NON_PARTICIPATING",
"13": "NOT_ALIVE",
"130": "NON_PARTICIPATING",
"131": "NOT_ALIVE",
"132": "NON_PARTICIPATING",
"133": "NON_PARTICIPATING",
"134": "NON_PARTICIPATING",
"135": "NON_PARTICIPATING",
"136": "NON_PARTICIPATING",
"137": "NOT_ALIVE",
"138": "NON_PARTICIPATING",
"139": "NOT_ALIVE",
"14": "SUCCESS",
"140": "NON_PARTICIPATING",
"141": "NOT_ALIVE",
"142": "NOT_ALIVE",
"143": "NON_PARTICIPATING",
"144": "NOT_ALIVE",
"145": "NON_PARTICIPATING",
"146": "NOT_ALIVE",
"147": "NON_PARTICIPATING",
"148": "NOT_ALIVE",
"149": "NON_PARTICIPATING",
"15": "NON_PARTICIPATING",
"150": "NOT_ALIVE",
"151": "NOT_ALIVE",
"152": "NON_PARTICIPATING",
"153": "NOT_ALIVE",
"154": "NON_PARTICIPATING",
"155": "NON_PARTICIPATING",
"156": "NOT_ALIVE",
"157": "NOT_ALIVE",
"158": "NOT_ALIVE",
"159": "NOT_ALIVE",
"16": "NON_PARTICIPATING",
"160": "NON_PARTICIPATING",
"161": "NOT_ALIVE",
"162": "NON_PARTICIPATING",
"163": "NOT_ALIVE",
"164": "NOT_ALIVE",
"165": "NOT_ALIVE",
"166": "NON_PARTICIPATING",
"167": "NOT_ALIVE",
"168": "NON_PARTICIPATING",
"169": "NOT_ALIVE",
"17": "NOT_ALIVE",
"170": "NOT_ALIVE",
"171": "NOT_ALIVE",
"172": "NON_PARTICIPATING",
"173": "NON_PARTICIPATING",
"174": "NON_PARTICIPATING",
"175": "NOT_ALIVE",
"176": "NOT_ALIVE",
"177": "NOT_ALIVE",
"178": "NOT_ALIVE",
"179": "NOT_ALIVE",
"18": "NON_PARTICIPATING",
"180": "NOT_ALIVE",
"181": "NOT_ALIVE",
"182": "NOT_ALIVE",
"183": "SUCCESS",
"184": "NON_PARTICIPATING",
"185": "NOT_ALIVE",
"186": "NOT_ALIVE",
"187": "NON_PARTICIPATING",
"188": "NON_PARTICIPATING",
"189": "NOT_ALIVE",
"19": "NON_PARTICIPATING",
"190": "NON_PARTICIPATING",
"191": "NON_PARTICIPATING",
"192": "NON_PARTICIPATING",
"193": "NOT_ALIVE",
"194": "NON_PARTICIPATING",
"195": "NOT_ALIVE",
"196": "NON_PARTICIPATING",
"197": "NOT_ALIVE",
"198": "NOT_ALIVE",
"199": "NON_PARTICIPATING",
"2": "NON_PARTICIPATING",
"20": "NOT_ALIVE",
"200": "NOT_ALIVE",
"201": "NOT_ALIVE",
"202": "NON_PARTICIPATING",
"203": "NOT_ALIVE",
"204": "NOT_ALIVE",
"205": "NON_PARTICIPATING",
"206": "NON_PARTICIPATING",
"207": "NOT_ALIVE",
"208": "NON_PARTICIPATING",
"209": "NOT_ALIVE",
"21": "NOT_ALIVE",
"210": "NON_PARTICIPATING",
"211": "NON_PARTICIPATING",
"212": "SUCCESS",
"213": "NON_PARTICIPATING",
"214": "NON_PARTICIPATING",
"215": "SUCCESS",
"216": "NOT_ALIVE",
"217": "NOT_ALIVE",
"218": "NOT_ALIVE",
"219": "NOT_ALIVE",
"22": "NON_PARTICIPATING",
"220": "NON_PARTICIPATING",
"221": "NOT_ALIVE",
"222": "NOT_ALIVE",
"223": "NOT_ALIVE",
"224": "NOT_ALIVE",
"225": "NON_PARTICIPATING",
"226": "NOT_ALIVE",
"227": "NOT_ALIVE",
"228": "NOT_ALIVE",
"229": "NON_PARTICIPATING",
"23": "NON_PARTICIPATING",
"230": "NON_PARTICIPATING",
"231": "SUCCESS",
"232": "NOT_ALIVE",
"233": "NOT_ALIVE",
"234": "NOT_ALIVE",
"235": "NON_PARTICIPATING",
"236": "NOT_ALIVE",
"237": "NON_PARTICIPATING",
"238": "NON_PARTICIPATING",
"239": "NOT_ALIVE",
"24": "NOT_ALIVE",
"240": "NON_PARTICIPATING",
"241": "SUCCESS",
"242": "NON_PARTICIPATING",
"243": "NON_PARTICIPATING",
"244": "NOT_ALIVE",
"245": "NON_PARTICIPATING",
"246": "NOT_ALIVE",
"247": "NON_PARTICIPATING",
"248": "NON_PARTICIPATING",
"249": "NON_PARTICIPATING",
"25": "SUCCESS",
"250": "SUCCESS",
"251": "NOT_ALIVE",
"252": "NOT_ALIVE",
"253": "NOT_ALIVE",
"254": "NON_PARTICIPATING",
"255": "NOT_ALIVE",
"26": "NON_PARTICIPATING",
"27": "NOT_ALIVE",
"28": "NOT_ALIVE",
"29": "NON_PARTICIPATING",
"3": "NON_PARTICIPATING",
"30": "NOT_ALIVE",
"31": "NON_PARTICIPATING",
"32": "NON_PARTICIPATING",
"33": "NOT_ALIVE",
"34": "NOT_ALIVE",
"35": "NON_PARTICIPATING",
"36": "NON_PARTICIPATING",
"37": "NOT_ALIVE",
"38": "NON_PARTICIPATING",
"39": "SUCCESS",
"4": "NOT_ALIVE",
"40": "NON_PARTICIPATING",
"41": "NON_PARTICIPATING",
"42": "NOT_ALIVE",
"43": "NOT_ALIVE",
"44": "NOT_ALIVE",
"45": "NOT_ALIVE",
"46": "NOT_ALIVE",
"47": "SUCCESS",
"48": "NON_PARTICIPATING",
"49": "NON_PARTICIPATING",
"5": "NON_PARTICIPATING",
"50": "NOT_ALIVE",
"51": "NOT_ALIVE",
"52": "SUCCESS",
"53": "NON_PARTICIPATING",
"54": "NOT_ALIVE",
"55": "NOT_ALIVE",
"56": "NON_PARTICIPATING",
"57": "NOT_ALIVE",
"58": "NON_PARTICIPATING",
"59": "NON_PARTICIPATING",
"6": "NON_PARTICIPATING",
"60": "NOT_ALIVE",
"61": "NON_PARTICIPATING",
"62": "NON_PARTICIPATING",
"63": "SUCCESS",
"64": "NOT_ALIVE",
"65": "NON_PARTICIPATING",
"66": "NON_PARTICIPATING",
"67": "NOT_ALIVE",
"68": "NOT_ALIVE",
"69": "NOT_ALIVE",
"7": "NOT_ALIVE",
"70": "NOT_ALIVE",
"71": "NON_PARTICIPATING",
"72": "NON_PARTICIPATING",
"73": "NOT_ALIVE",
"74": "NOT_ALIVE",
"75": "NON_PARTICIPATING",
"76": "NOT_ALIVE",
"77": "SUCCESS",
"78": "NON_PARTICIPATING",
"79": "NON_PARTICIPATING",
"8": "NOT_ALIVE",
"80": "NOT_ALIVE",
"81": "NON_PARTICIPATING",
"82": "NON_PARTICIPATING",
"83": "NON_PARTICIPATING",
"84": "NON_PARTICIPATING",
"85": "NON_PARTICIPATING",
"86": "NON_PARTICIPATING",
"87": "NOT_ALIVE",
"88": "NON_PARTICIPATING",
"89": "NOT_ALIVE",
"9": "NON_PARTICIPATING",
"90": "NOT_ALIVE",
"91": "NOT_ALIVE",
"92": "SUCCESS",
"93": "NOT_ALIVE",
"94": "SUCCESS",
"95": "NOT_ALIVE",
"96": "NOT_ALIVE",
"97": "NON_PARTICIPATING",
"98": "NOT_ALIVE",
"99": "NOT_ALIVE"
},
"architectures": [
"LlamaForCausalLM"
],
"attention_bias": false,
"attention_dropout": 0.0,
"block_list": [
6018951,
6018988
],
"bos_token_id": 1,
"eos_token_id": 2,
"hidden_act": "silu",
"hidden_size": 2048,
"initializer_range": 0.02,
"inner_step": 37,
"intermediate_size": 5632,
"last_allreduce_block": 6016469,
"max_position_embeddings": 2048,
"mlp_bias": false,
"model_type": "llama",
"num_attention_heads": 32,
"num_hidden_layers": 22,
"num_key_value_heads": 4,
"pretraining_tp": 1,
"rms_norm_eps": 1e-05,
"rope_scaling": null,
"rope_theta": 10000.0,
"tie_word_embeddings": false,
"torch_dtype": "float32",
"transformers_version": "4.39.3",
"use_cache": false,
"vocab_size": 32000
}
|