File size: 7,188 Bytes
de3d43c 05baabe de3d43c 795edf5 de3d43c ecdea1b 395b497 a4ef85e de3d43c 395b497 795edf5 36560cf 795edf5 cec90af 1c7e21f bb4d7eb a4ef85e cec90af 05baabe 1940773 de3d43c 795edf5 de3d43c a4ef85e 1940773 a4ef85e de3d43c bb4d7eb de3d43c 1940773 a4ef85e de3d43c 795edf5 43819d0 795edf5 05baabe de3d43c 795edf5 d9a7f30 ecdea1b de3d43c 1c7e21f cec90af de3d43c 795edf5 de3d43c ecdea1b de3d43c db3229f de3d43c 795edf5 1940773 de3d43c 8a50502 f0b83d3 ecdea1b 1940773 a4ef85e 795edf5 a4ef85e 795edf5 a4ef85e de3d43c 05baabe 1c7e21f a4ef85e 05baabe 795edf5 8eaa722 de3d43c 9fe5111 ecdea1b 1940773 a4ef85e de3d43c 36560cf ecdea1b cec90af de3d43c 1c7e21f a4ef85e de3d43c a4ef85e de3d43c 395b497 ecdea1b 795edf5 f0b83d3 de3d43c 37d1a89 1c7e21f 05baabe a4ef85e de3d43c a4ef85e 1c7e21f 37d1a89 de3d43c ecdea1b de3d43c a4ef85e de3d43c ecdea1b a4ef85e de3d43c 795edf5 de3d43c a4ef85e de3d43c cec90af de3d43c 5c119fc de3d43c 1c7e21f 5c119fc a4ef85e de3d43c 36560cf 795edf5 a4ef85e de3d43c 9fe5111 05baabe de3d43c 05baabe ecdea1b de3d43c a4ef85e de3d43c cec90af a4ef85e ecdea1b de3d43c ecdea1b 36560cf de3d43c 795edf5 9fe5111 de3d43c 36560cf 05baabe de3d43c a4ef85e de3d43c cec90af de3d43c 05baabe de3d43c ecdea1b bb4d7eb de3d43c 1c7e21f 05baabe bb4d7eb de3d43c bb4d7eb cec90af 0e4187a de3d43c a4ef85e ecdea1b de3d43c 05baabe de3d43c f0b83d3 de3d43c a4ef85e de3d43c 5c119fc 05baabe de3d43c 1940773 ecdea1b 05baabe 795edf5 cec90af de3d43c a4ef85e ecdea1b 36560cf 795edf5 1940773 a4ef85e f0b83d3 a4ef85e de3d43c 795edf5 de3d43c a4ef85e ecdea1b de3d43c bb4d7eb a4ef85e 795edf5 05baabe 795edf5 ecdea1b 05baabe a4ef85e de3d43c ecdea1b 395b497 a4ef85e 05baabe ecdea1b cec90af de3d43c 05baabe a4ef85e ecdea1b bb4d7eb 795edf5 05baabe de3d43c 1940773 ecdea1b de3d43c e365aae de3d43c e365aae de3d43c a4ef85e de3d43c |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 |
{
"_name_or_path": "dstrbtd/llama-1b",
"all_reduce_scores": {
"0": "NOT_ALIVE",
"1": "NOT_ALIVE",
"10": "NOT_ALIVE",
"100": "NOT_ALIVE",
"101": "NOT_ALIVE",
"102": "SUCCESS",
"103": "NOT_ALIVE",
"104": "NON_PARTICIPATING",
"105": "SUCCESS",
"106": "NOT_ALIVE",
"107": "NOT_ALIVE",
"108": "NOT_ALIVE",
"109": "SUCCESS",
"11": "NOT_ALIVE",
"110": "NOT_ALIVE",
"111": "SUCCESS",
"112": "NON_PARTICIPATING",
"113": "NON_PARTICIPATING",
"114": "NOT_ALIVE",
"115": "SUCCESS",
"116": "NOT_ALIVE",
"117": "SUCCESS",
"118": "SUCCESS",
"119": "NOT_ALIVE",
"12": "NOT_ALIVE",
"120": "NON_PARTICIPATING",
"121": "NOT_ALIVE",
"122": "NOT_ALIVE",
"123": "NON_PARTICIPATING",
"124": "SUCCESS",
"125": "NOT_ALIVE",
"126": "NON_PARTICIPATING",
"127": "NOT_ALIVE",
"128": "NOT_ALIVE",
"129": "NOT_ALIVE",
"13": "NON_PARTICIPATING",
"130": "SUCCESS",
"131": "NOT_ALIVE",
"132": "NOT_ALIVE",
"133": "NOT_ALIVE",
"134": "NOT_ALIVE",
"135": "SUCCESS",
"136": "NOT_ALIVE",
"137": "NOT_ALIVE",
"138": "NOT_ALIVE",
"139": "SUCCESS",
"14": "NON_PARTICIPATING",
"140": "NOT_ALIVE",
"141": "NOT_ALIVE",
"142": "SUCCESS",
"143": "SUCCESS",
"144": "NOT_ALIVE",
"145": "NOT_ALIVE",
"146": "NOT_ALIVE",
"147": "NOT_ALIVE",
"148": "NOT_ALIVE",
"149": "NON_PARTICIPATING",
"15": "NOT_ALIVE",
"150": "NON_PARTICIPATING",
"151": "NOT_ALIVE",
"152": "NOT_ALIVE",
"153": "SUCCESS",
"154": "NOT_ALIVE",
"155": "NOT_ALIVE",
"156": "NOT_ALIVE",
"157": "SUCCESS",
"158": "SUCCESS",
"159": "NOT_ALIVE",
"16": "NOT_ALIVE",
"160": "NOT_ALIVE",
"161": "NON_PARTICIPATING",
"162": "NOT_ALIVE",
"163": "NOT_ALIVE",
"164": "NOT_ALIVE",
"165": "NOT_ALIVE",
"166": "NON_PARTICIPATING",
"167": "NOT_ALIVE",
"168": "SUCCESS",
"169": "NON_PARTICIPATING",
"17": "NOT_ALIVE",
"170": "NOT_ALIVE",
"171": "NOT_ALIVE",
"172": "NOT_ALIVE",
"173": "NON_PARTICIPATING",
"174": "NON_PARTICIPATING",
"175": "NON_PARTICIPATING",
"176": "NOT_ALIVE",
"177": "NOT_ALIVE",
"178": "NOT_ALIVE",
"179": "NOT_ALIVE",
"18": "NOT_ALIVE",
"180": "NON_PARTICIPATING",
"181": "NOT_ALIVE",
"182": "NOT_ALIVE",
"183": "NOT_ALIVE",
"184": "SUCCESS",
"185": "NON_PARTICIPATING",
"186": "NOT_ALIVE",
"187": "NOT_ALIVE",
"188": "NON_PARTICIPATING",
"189": "NOT_ALIVE",
"19": "NON_PARTICIPATING",
"190": "NOT_ALIVE",
"191": "NOT_ALIVE",
"192": "NOT_ALIVE",
"193": "NOT_ALIVE",
"194": "NOT_ALIVE",
"195": "NOT_ALIVE",
"196": "NON_PARTICIPATING",
"197": "SUCCESS",
"198": "NOT_ALIVE",
"199": "NOT_ALIVE",
"2": "NOT_ALIVE",
"20": "NOT_ALIVE",
"200": "SUCCESS",
"201": "NON_PARTICIPATING",
"202": "NOT_ALIVE",
"203": "NON_PARTICIPATING",
"204": "NOT_ALIVE",
"205": "NON_PARTICIPATING",
"206": "SUCCESS",
"207": "NOT_ALIVE",
"208": "NOT_ALIVE",
"209": "NOT_ALIVE",
"21": "SUCCESS",
"210": "NOT_ALIVE",
"211": "NOT_ALIVE",
"212": "SUCCESS",
"213": "NOT_ALIVE",
"214": "NOT_ALIVE",
"215": "NOT_ALIVE",
"216": "NOT_ALIVE",
"217": "SUCCESS",
"218": "NOT_ALIVE",
"219": "NON_PARTICIPATING",
"22": "NOT_ALIVE",
"220": "NON_PARTICIPATING",
"221": "NON_PARTICIPATING",
"222": "NOT_ALIVE",
"223": "SUCCESS",
"224": "NOT_ALIVE",
"225": "NOT_ALIVE",
"226": "SUCCESS",
"227": "NON_PARTICIPATING",
"228": "NOT_ALIVE",
"229": "NOT_ALIVE",
"23": "NOT_ALIVE",
"230": "NOT_ALIVE",
"231": "NOT_ALIVE",
"232": "NOT_ALIVE",
"233": "NOT_ALIVE",
"234": "NOT_ALIVE",
"235": "NOT_ALIVE",
"236": "NON_PARTICIPATING",
"237": "SUCCESS",
"238": "SUCCESS",
"239": "NOT_ALIVE",
"24": "SUCCESS",
"240": "NOT_ALIVE",
"241": "NOT_ALIVE",
"242": "NOT_ALIVE",
"243": "NOT_ALIVE",
"244": "NOT_ALIVE",
"245": "NOT_ALIVE",
"246": "NON_PARTICIPATING",
"247": "NOT_ALIVE",
"248": "SUCCESS",
"249": "NOT_ALIVE",
"25": "SUCCESS",
"250": "SUCCESS",
"251": "NOT_ALIVE",
"252": "SUCCESS",
"253": "NOT_ALIVE",
"254": "NOT_ALIVE",
"255": "NOT_ALIVE",
"26": "NON_PARTICIPATING",
"27": "SUCCESS",
"28": "NOT_ALIVE",
"29": "NOT_ALIVE",
"3": "SUCCESS",
"30": "NOT_ALIVE",
"31": "SUCCESS",
"32": "NOT_ALIVE",
"33": "NOT_ALIVE",
"34": "SUCCESS",
"35": "NON_PARTICIPATING",
"36": "NOT_ALIVE",
"37": "NOT_ALIVE",
"38": "SUCCESS",
"39": "NON_PARTICIPATING",
"4": "NOT_ALIVE",
"40": "NOT_ALIVE",
"41": "SUCCESS",
"42": "NOT_ALIVE",
"43": "NOT_ALIVE",
"44": "NON_PARTICIPATING",
"45": "NOT_ALIVE",
"46": "NOT_ALIVE",
"47": "NOT_ALIVE",
"48": "SUCCESS",
"49": "SUCCESS",
"5": "NOT_ALIVE",
"50": "NOT_ALIVE",
"51": "NON_PARTICIPATING",
"52": "SUCCESS",
"53": "SUCCESS",
"54": "NOT_ALIVE",
"55": "NON_PARTICIPATING",
"56": "NOT_ALIVE",
"57": "SUCCESS",
"58": "NON_PARTICIPATING",
"59": "NOT_ALIVE",
"6": "NOT_ALIVE",
"60": "NON_PARTICIPATING",
"61": "NOT_ALIVE",
"62": "SUCCESS",
"63": "NOT_ALIVE",
"64": "NOT_ALIVE",
"65": "NOT_ALIVE",
"66": "NOT_ALIVE",
"67": "NOT_ALIVE",
"68": "NOT_ALIVE",
"69": "NON_PARTICIPATING",
"7": "NON_PARTICIPATING",
"70": "NOT_ALIVE",
"71": "NOT_ALIVE",
"72": "NOT_ALIVE",
"73": "SUCCESS",
"74": "NON_PARTICIPATING",
"75": "SUCCESS",
"76": "SUCCESS",
"77": "NOT_ALIVE",
"78": "NON_PARTICIPATING",
"79": "SUCCESS",
"8": "SUCCESS",
"80": "NON_PARTICIPATING",
"81": "NOT_ALIVE",
"82": "NOT_ALIVE",
"83": "SUCCESS",
"84": "NON_PARTICIPATING",
"85": "NOT_ALIVE",
"86": "SUCCESS",
"87": "SUCCESS",
"88": "NON_PARTICIPATING",
"89": "NON_PARTICIPATING",
"9": "NOT_ALIVE",
"90": "SUCCESS",
"91": "NON_PARTICIPATING",
"92": "SUCCESS",
"93": "NON_PARTICIPATING",
"94": "NON_PARTICIPATING",
"95": "NOT_ALIVE",
"96": "NON_PARTICIPATING",
"97": "NOT_ALIVE",
"98": "SUCCESS",
"99": "SUCCESS"
},
"architectures": [
"LlamaForCausalLM"
],
"attention_bias": false,
"attention_dropout": 0.0,
"block_list": [
6574379,
6574411
],
"bos_token_id": 1,
"dtype": "float32",
"eos_token_id": 2,
"head_dim": 64,
"hidden_act": "silu",
"hidden_size": 2048,
"initializer_range": 0.02,
"inner_step": 45,
"intermediate_size": 5632,
"last_allreduce_block": 6574085,
"max_position_embeddings": 2048,
"mlp_bias": false,
"model_type": "llama",
"num_attention_heads": 32,
"num_hidden_layers": 22,
"num_key_value_heads": 4,
"pretraining_tp": 1,
"rms_norm_eps": 1e-05,
"rope_scaling": null,
"rope_theta": 10000.0,
"tie_word_embeddings": false,
"torch_dtype": "float32",
"transformers_version": "4.39.3",
"use_cache": false,
"vocab_size": 32000
}
|