File size: 7,836 Bytes
7310c18 aa3acc0 7310c18 5e947ad 5509888 7310c18 e16a895 1ffa11a 5e947ad 37472d3 af8a58f 9d9becc c7a16ed e2664e5 d64b147 37472d3 5e947ad e16a895 5e947ad 1ffa11a 8a5b326 36257d8 cafc80f 06abb2a 8a5b326 06abb2a 5e947ad 06abb2a aa3acc0 37472d3 4577879 6d3fe36 5509888 d64b147 8a5b326 1ffa11a 6d3fe36 f0412b2 5e947ad 7310c18 e16a895 5e947ad 32ffa9a 82ea615 e16a895 37472d3 5e947ad 37472d3 5e947ad aa3acc0 5f8de0b e2664e5 6d3fe36 cafc80f cac997d 5e947ad 300aece 5509888 37472d3 7310c18 af8a58f e16a895 5e947ad f0412b2 06abb2a 5e947ad 81f12a7 5e947ad 8a5b326 5e947ad e16a895 5e947ad 257655e 8a5b326 06abb2a 7310c18 81f12a7 e16a895 8a5b326 c7a16ed 7310c18 e2664e5 36efd1a 5509888 8a5b326 7631c93 aa3acc0 7310c18 5e947ad 37472d3 e16a895 81f12a7 7310c18 f0412b2 7310c18 5e947ad e16a895 5e947ad 06abb2a 81f12a7 5e947ad 32ffa9a aa3acc0 4577879 cafc80f 300aece 6d3fe36 7310c18 e16a895 5e947ad aa3acc0 cafc80f 5e947ad e16a895 5e947ad e16a895 37472d3 e2664e5 cafc80f e16a895 5e947ad 7310c18 e2664e5 5e947ad 7310c18 300aece 7310c18 5e947ad af8a58f f0412b2 5e947ad 300aece 5e947ad d64b147 e16a895 36257d8 5e947ad e2664e5 06abb2a 5e947ad 8a5b326 5e947ad 1ffa11a 9d9becc cafc80f 36efd1a 06abb2a e16a895 06abb2a e16a895 36efd1a af8a58f 7310c18 e16a895 af8a58f e16a895 8a5b326 5e947ad e16a895 5e947ad 9752921 e16a895 37472d3 5e947ad 7310c18 5f8de0b 5e947ad 9d9becc 7310c18 5e947ad e16a895 81f12a7 d64b147 aa3acc0 5509888 5e947ad e16a895 5e947ad cafc80f 06abb2a cafc80f 535e387 e16a895 81f12a7 e16a895 5e947ad cafc80f 5e947ad 81f12a7 5509888 c7a16ed 37472d3 5e947ad 06abb2a e16a895 81f12a7 5e947ad 06abb2a 81f12a7 9752921 9d9becc 5509888 9d9becc 5509888 37472d3 e16a895 8a5b326 9d9becc 5509888 8a5b326 aa3acc0 81f12a7 7310c18 aa3acc0 82ea615 5e947ad 9d9becc 5e947ad c7a16ed e16a895 82ea615 7310c18 06a93ec 7310c18 06a93ec 7310c18 5e947ad 7310c18 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 |
{
"_name_or_path": "distributed/llama-1b",
"all_reduce_scores": {
"0": "NOT_ALIVE",
"1": "NOT_ALIVE",
"10": "NOT_ALIVE",
"100": "NOT_ALIVE",
"101": "NOT_ALIVE",
"102": "NON_PARTICIPATING",
"103": "NOT_ALIVE",
"104": "NON_PARTICIPATING",
"105": "NON_PARTICIPATING",
"106": "NON_PARTICIPATING",
"107": "NOT_ALIVE",
"108": "NOT_ALIVE",
"109": "NOT_ALIVE",
"11": "NOT_ALIVE",
"110": "NON_PARTICIPATING",
"111": "NOT_ALIVE",
"112": "SUCCESS",
"113": "NOT_ALIVE",
"114": "NON_PARTICIPATING",
"115": "NOT_ALIVE",
"116": "NOT_ALIVE",
"117": "NON_PARTICIPATING",
"118": "NOT_ALIVE",
"119": "NON_PARTICIPATING",
"12": "NON_PARTICIPATING",
"120": "NON_PARTICIPATING",
"121": "NOT_ALIVE",
"122": "NON_PARTICIPATING",
"123": "NOT_ALIVE",
"124": "NON_PARTICIPATING",
"125": "NON_PARTICIPATING",
"126": "NOT_ALIVE",
"127": "NOT_ALIVE",
"128": "NOT_ALIVE",
"129": "NON_PARTICIPATING",
"13": "NOT_ALIVE",
"130": "NOT_ALIVE",
"131": "NOT_ALIVE",
"132": "NON_PARTICIPATING",
"133": "NON_PARTICIPATING",
"134": "NON_PARTICIPATING",
"135": "NON_PARTICIPATING",
"136": "NON_PARTICIPATING",
"137": "NON_PARTICIPATING",
"138": "SUCCESS",
"139": "NON_PARTICIPATING",
"14": "NOT_ALIVE",
"140": "NOT_ALIVE",
"141": "NOT_ALIVE",
"142": "NON_PARTICIPATING",
"143": "NON_PARTICIPATING",
"144": "NON_PARTICIPATING",
"145": "NON_PARTICIPATING",
"146": "NON_PARTICIPATING",
"147": "NOT_ALIVE",
"148": "NON_PARTICIPATING",
"149": "NON_PARTICIPATING",
"15": "NOT_ALIVE",
"150": "NON_PARTICIPATING",
"151": "NOT_ALIVE",
"152": "NOT_ALIVE",
"153": "NON_PARTICIPATING",
"154": "NON_PARTICIPATING",
"155": "NON_PARTICIPATING",
"156": "NOT_ALIVE",
"157": "NOT_ALIVE",
"158": "NON_PARTICIPATING",
"159": "NON_PARTICIPATING",
"16": "NON_PARTICIPATING",
"160": "NON_PARTICIPATING",
"161": "NOT_ALIVE",
"162": "NON_PARTICIPATING",
"163": "NOT_ALIVE",
"164": "NOT_ALIVE",
"165": "NON_PARTICIPATING",
"166": "NON_PARTICIPATING",
"167": "NON_PARTICIPATING",
"168": "SUCCESS",
"169": "NOT_ALIVE",
"17": "NOT_ALIVE",
"170": "NON_PARTICIPATING",
"171": "NOT_ALIVE",
"172": "NON_PARTICIPATING",
"173": "SUCCESS",
"174": "NOT_ALIVE",
"175": "NOT_ALIVE",
"176": "NOT_ALIVE",
"177": "NOT_ALIVE",
"178": "NON_PARTICIPATING",
"179": "NOT_ALIVE",
"18": "NOT_ALIVE",
"180": "NOT_ALIVE",
"181": "NOT_ALIVE",
"182": "NOT_ALIVE",
"183": "SUCCESS",
"184": "NON_PARTICIPATING",
"185": "NOT_ALIVE",
"186": "NON_PARTICIPATING",
"187": "NON_PARTICIPATING",
"188": "NON_PARTICIPATING",
"189": "NOT_ALIVE",
"19": "NOT_ALIVE",
"190": "NON_PARTICIPATING",
"191": "NOT_ALIVE",
"192": "NON_PARTICIPATING",
"193": "NOT_ALIVE",
"194": "NON_PARTICIPATING",
"195": "NON_PARTICIPATING",
"196": "SUCCESS",
"197": "SUCCESS",
"198": "NON_PARTICIPATING",
"199": "NON_PARTICIPATING",
"2": "NON_PARTICIPATING",
"20": "NOT_ALIVE",
"200": "NOT_ALIVE",
"201": "NOT_ALIVE",
"202": "NOT_ALIVE",
"203": "NOT_ALIVE",
"204": "NON_PARTICIPATING",
"205": "NON_PARTICIPATING",
"206": "NON_PARTICIPATING",
"207": "NOT_ALIVE",
"208": "NON_PARTICIPATING",
"209": "NON_PARTICIPATING",
"21": "NOT_ALIVE",
"210": "NON_PARTICIPATING",
"211": "NOT_ALIVE",
"212": "SUCCESS",
"213": "NON_PARTICIPATING",
"214": "NOT_ALIVE",
"215": "NON_PARTICIPATING",
"216": "NOT_ALIVE",
"217": "NON_PARTICIPATING",
"218": "NON_PARTICIPATING",
"219": "NON_PARTICIPATING",
"22": "NON_PARTICIPATING",
"220": "NOT_ALIVE",
"221": "NOT_ALIVE",
"222": "NOT_ALIVE",
"223": "NOT_ALIVE",
"224": "NOT_ALIVE",
"225": "NOT_ALIVE",
"226": "NOT_ALIVE",
"227": "NOT_ALIVE",
"228": "NON_PARTICIPATING",
"229": "NON_PARTICIPATING",
"23": "NON_PARTICIPATING",
"230": "NOT_ALIVE",
"231": "NOT_ALIVE",
"232": "NOT_ALIVE",
"233": "NOT_ALIVE",
"234": "NON_PARTICIPATING",
"235": "NON_PARTICIPATING",
"236": "NOT_ALIVE",
"237": "SUCCESS",
"238": "SUCCESS",
"239": "NOT_ALIVE",
"24": "NOT_ALIVE",
"240": "NOT_ALIVE",
"241": "NOT_ALIVE",
"242": "NON_PARTICIPATING",
"243": "NOT_ALIVE",
"244": "NOT_ALIVE",
"245": "NOT_ALIVE",
"246": "NON_PARTICIPATING",
"247": "NON_PARTICIPATING",
"248": "NOT_ALIVE",
"249": "NOT_ALIVE",
"25": "SUCCESS",
"250": "SUCCESS",
"251": "NOT_ALIVE",
"252": "NON_PARTICIPATING",
"253": "NOT_ALIVE",
"254": "SUCCESS",
"255": "NOT_ALIVE",
"26": "NON_PARTICIPATING",
"27": "NOT_ALIVE",
"28": "NON_PARTICIPATING",
"29": "NOT_ALIVE",
"3": "NON_PARTICIPATING",
"30": "NON_PARTICIPATING",
"31": "NON_PARTICIPATING",
"32": "SUCCESS",
"33": "NOT_ALIVE",
"34": "NOT_ALIVE",
"35": "NON_PARTICIPATING",
"36": "NOT_ALIVE",
"37": "NOT_ALIVE",
"38": "SUCCESS",
"39": "SUCCESS",
"4": "NON_PARTICIPATING",
"40": "NON_PARTICIPATING",
"41": "NON_PARTICIPATING",
"42": "NON_PARTICIPATING",
"43": "NON_PARTICIPATING",
"44": "NON_PARTICIPATING",
"45": "NOT_ALIVE",
"46": "NOT_ALIVE",
"47": "NON_PARTICIPATING",
"48": "NOT_ALIVE",
"49": "NON_PARTICIPATING",
"5": "NOT_ALIVE",
"50": "NON_PARTICIPATING",
"51": "NOT_ALIVE",
"52": "NON_PARTICIPATING",
"53": "NON_PARTICIPATING",
"54": "NON_PARTICIPATING",
"55": "NOT_ALIVE",
"56": "NON_PARTICIPATING",
"57": "NON_PARTICIPATING",
"58": "SUCCESS",
"59": "NON_PARTICIPATING",
"6": "NON_PARTICIPATING",
"60": "NON_PARTICIPATING",
"61": "NON_PARTICIPATING",
"62": "NON_PARTICIPATING",
"63": "NOT_ALIVE",
"64": "NON_PARTICIPATING",
"65": "NON_PARTICIPATING",
"66": "NOT_ALIVE",
"67": "NOT_ALIVE",
"68": "NON_PARTICIPATING",
"69": "NON_PARTICIPATING",
"7": "NON_PARTICIPATING",
"70": "NON_PARTICIPATING",
"71": "NON_PARTICIPATING",
"72": "NON_PARTICIPATING",
"73": "NON_PARTICIPATING",
"74": "NON_PARTICIPATING",
"75": "NON_PARTICIPATING",
"76": "NON_PARTICIPATING",
"77": "NON_PARTICIPATING",
"78": "NOT_ALIVE",
"79": "NOT_ALIVE",
"8": "NOT_ALIVE",
"80": "NON_PARTICIPATING",
"81": "NON_PARTICIPATING",
"82": "NON_PARTICIPATING",
"83": "NON_PARTICIPATING",
"84": "NON_PARTICIPATING",
"85": "NON_PARTICIPATING",
"86": "NOT_ALIVE",
"87": "NON_PARTICIPATING",
"88": "NON_PARTICIPATING",
"89": "NOT_ALIVE",
"9": "NOT_ALIVE",
"90": "NON_PARTICIPATING",
"91": "NON_PARTICIPATING",
"92": "SUCCESS",
"93": "NON_PARTICIPATING",
"94": "SUCCESS",
"95": "NOT_ALIVE",
"96": "NON_PARTICIPATING",
"97": "NOT_ALIVE",
"98": "NON_PARTICIPATING",
"99": "NOT_ALIVE"
},
"architectures": [
"LlamaForCausalLM"
],
"attention_bias": false,
"attention_dropout": 0.0,
"block_list": [
5972871,
5972886
],
"bos_token_id": 1,
"eos_token_id": 2,
"hidden_act": "silu",
"hidden_size": 2048,
"initializer_range": 0.02,
"inner_step": 21,
"intermediate_size": 5632,
"last_allreduce_block": 5972300,
"max_position_embeddings": 2048,
"mlp_bias": false,
"model_type": "llama",
"num_attention_heads": 32,
"num_hidden_layers": 22,
"num_key_value_heads": 4,
"pretraining_tp": 1,
"rms_norm_eps": 1e-05,
"rope_scaling": null,
"rope_theta": 10000.0,
"tie_word_embeddings": false,
"torch_dtype": "float32",
"transformers_version": "4.39.3",
"use_cache": false,
"vocab_size": 32000
}
|