File size: 7,545 Bytes
e0b211e 6643f96 e0b211e 804935d f94eb01 c45a08c 804935d a0fe2e7 f6fbd61 f94eb01 41c8e76 6c48892 c14e127 6c48892 f6fbd61 cfa1ac5 82e51ac 6c48892 f6fbd61 6e346b0 f94eb01 41c8e76 f6fbd61 6e346b0 f6fbd61 6e346b0 f6fbd61 f94eb01 6e346b0 82e51ac 4d5cd3f c45a08c 6c48892 804935d f6fbd61 d0e3c19 6e346b0 f94eb01 f6fbd61 6c48892 6e346b0 ffc92d8 f6fbd61 6c48892 f6fbd61 41c8e76 6c48892 f6fbd61 804935d 1dead14 a0fe2e7 f6fbd61 6c48892 7582dac 41c8e76 e345f96 f94eb01 ffc92d8 6c48892 f2da3af f6fbd61 ffc92d8 f6fbd61 6c48892 4816544 f2da3af d0e3c19 759bed8 f94eb01 f6fbd61 6c48892 c14e127 804935d c784ce6 7a4d383 c45a08c 1dead14 0f93c75 f6fbd61 8448970 f6fbd61 f94eb01 f6fbd61 41c8e76 f94eb01 4d5cd3f 804935d f6fbd61 6c48892 f6fbd61 6e346b0 f94eb01 6c48892 6e346b0 f6fbd61 f94eb01 c784ce6 e43fa59 852f438 a0fe2e7 6e346b0 f5872ab f6fbd61 f94eb01 804935d 6c48892 e345f96 abdde78 6c48892 f94eb01 6e346b0 f6fbd61 41c8e76 6c48892 ffc92d8 e345f96 f94eb01 f6fbd61 6c48892 f6fbd61 bf0f2e6 804935d a0fe2e7 5e6a7fe 41c8e76 f94eb01 6c48892 6e346b0 277df0e 6c48892 e345f96 f94eb01 f6fbd61 6c48892 f94eb01 e43fa59 7582dac f6fbd61 6c48892 f6fbd61 cfa1ac5 6e346b0 4d5cd3f f6fbd61 6c48892 c784ce6 f6fbd61 b7319a2 a0fe2e7 f2da3af f6fbd61 7582dac f6fbd61 7582dac e345f96 f94eb01 d0e3c19 6e346b0 f6fbd61 804935d 7582dac f6fbd61 6c48892 0f93c75 f6fbd61 6c48892 f6fbd61 a0fe2e7 6c48892 fc1357e 7a4d383 f6fbd61 1dead14 6e346b0 f6fbd61 6c48892 ffc92d8 6c48892 f6fbd61 6c48892 2507b83 d2977ad c784ce6 ffc92d8 6c48892 e448c0f 6c48892 f6fbd61 6c48892 e345f96 f94eb01 c784ce6 c14e127 7582dac e345f96 ffc92d8 f6fbd61 1dead14 4d5cd3f f6fbd61 05e3858 f6fbd61 82e51ac 6c48892 ffc92d8 f6fbd61 4d5cd3f 6c48892 f6fbd61 6c48892 f94eb01 a0fe2e7 6c48892 4a87169 f6fbd61 05e3858 6e346b0 6c48892 dffb025 f6fbd61 c14e127 ffc92d8 4d5cd3f e448c0f 0f93c75 e0b211e 5c4eed5 7cbb934 5c4eed5 e0b211e 7cbb934 e0b211e f6fbd61 e0b211e |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 |
{
"_name_or_path": "penguin102/c67-h13",
"all_reduce_scores": {
"0": "NOT_ALIVE",
"1": "NOT_ALIVE",
"10": "NOT_ALIVE",
"100": "NOT_ALIVE",
"101": "NOT_ALIVE",
"102": "NOT_ALIVE",
"103": "NOT_ALIVE",
"104": "NOT_ALIVE",
"105": "NON_PARTICIPATING",
"106": "NON_PARTICIPATING",
"107": "NOT_ALIVE",
"108": "SUCCESS",
"109": "NOT_ALIVE",
"11": "NOT_ALIVE",
"110": "NOT_ALIVE",
"111": "NON_PARTICIPATING",
"112": "SUCCESS",
"113": "NOT_ALIVE",
"114": "NOT_ALIVE",
"115": "NON_PARTICIPATING",
"116": "NON_PARTICIPATING",
"117": "NON_PARTICIPATING",
"118": "NOT_ALIVE",
"119": "NOT_ALIVE",
"12": "NOT_ALIVE",
"120": "NOT_ALIVE",
"121": "NOT_ALIVE",
"122": "NON_PARTICIPATING",
"123": "NON_PARTICIPATING",
"124": "NOT_ALIVE",
"125": "NOT_ALIVE",
"126": "NON_PARTICIPATING",
"127": "NON_PARTICIPATING",
"128": "NON_PARTICIPATING",
"129": "NON_PARTICIPATING",
"13": "NOT_ALIVE",
"130": "NON_PARTICIPATING",
"131": "NOT_ALIVE",
"132": "NOT_ALIVE",
"133": "NON_PARTICIPATING",
"134": "NOT_ALIVE",
"135": "NON_PARTICIPATING",
"136": "NOT_ALIVE",
"137": "NOT_ALIVE",
"138": "NOT_ALIVE",
"139": "NOT_ALIVE",
"14": "NOT_ALIVE",
"140": "NON_PARTICIPATING",
"141": "NON_PARTICIPATING",
"142": "NOT_ALIVE",
"143": "NON_PARTICIPATING",
"144": "NON_PARTICIPATING",
"145": "NON_PARTICIPATING",
"146": "NOT_ALIVE",
"147": "NON_PARTICIPATING",
"148": "NON_PARTICIPATING",
"149": "NON_PARTICIPATING",
"15": "SUCCESS",
"150": "NON_PARTICIPATING",
"151": "NOT_ALIVE",
"152": "NON_PARTICIPATING",
"153": "NOT_ALIVE",
"154": "SUCCESS",
"155": "NON_PARTICIPATING",
"156": "NOT_ALIVE",
"157": "NOT_ALIVE",
"158": "NOT_ALIVE",
"159": "NOT_ALIVE",
"16": "NOT_ALIVE",
"160": "NOT_ALIVE",
"161": "NOT_ALIVE",
"162": "NON_PARTICIPATING",
"163": "NOT_ALIVE",
"164": "NON_PARTICIPATING",
"165": "NOT_ALIVE",
"166": "NOT_ALIVE",
"167": "NOT_ALIVE",
"168": "NOT_ALIVE",
"169": "NOT_ALIVE",
"17": "NOT_ALIVE",
"170": "NOT_ALIVE",
"171": "NOT_ALIVE",
"172": "NOT_ALIVE",
"173": "NON_PARTICIPATING",
"174": "NON_PARTICIPATING",
"175": "NOT_ALIVE",
"176": "NOT_ALIVE",
"177": "NOT_ALIVE",
"178": "NOT_ALIVE",
"179": "NOT_ALIVE",
"18": "NON_PARTICIPATING",
"180": "NOT_ALIVE",
"181": "NOT_ALIVE",
"182": "NOT_ALIVE",
"183": "SUCCESS",
"184": "NOT_ALIVE",
"185": "NOT_ALIVE",
"186": "NOT_ALIVE",
"187": "NON_PARTICIPATING",
"188": "NON_PARTICIPATING",
"189": "NOT_ALIVE",
"19": "NOT_ALIVE",
"190": "NON_PARTICIPATING",
"191": "NOT_ALIVE",
"192": "NON_PARTICIPATING",
"193": "NON_PARTICIPATING",
"194": "NOT_ALIVE",
"195": "NOT_ALIVE",
"196": "NOT_ALIVE",
"197": "NON_PARTICIPATING",
"198": "NOT_ALIVE",
"199": "NON_PARTICIPATING",
"2": "NON_PARTICIPATING",
"20": "NOT_ALIVE",
"200": "NOT_ALIVE",
"201": "NOT_ALIVE",
"202": "NOT_ALIVE",
"203": "NOT_ALIVE",
"204": "SUCCESS",
"205": "NOT_ALIVE",
"206": "NON_PARTICIPATING",
"207": "NOT_ALIVE",
"208": "NON_PARTICIPATING",
"209": "NOT_ALIVE",
"21": "NOT_ALIVE",
"210": "NON_PARTICIPATING",
"211": "NOT_ALIVE",
"212": "NON_PARTICIPATING",
"213": "NOT_ALIVE",
"214": "NOT_ALIVE",
"215": "NON_PARTICIPATING",
"216": "NOT_ALIVE",
"217": "NOT_ALIVE",
"218": "NOT_ALIVE",
"219": "NOT_ALIVE",
"22": "NOT_ALIVE",
"220": "NOT_ALIVE",
"221": "NON_PARTICIPATING",
"222": "NON_PARTICIPATING",
"223": "NOT_ALIVE",
"224": "NOT_ALIVE",
"225": "NON_PARTICIPATING",
"226": "NOT_ALIVE",
"227": "NOT_ALIVE",
"228": "NON_PARTICIPATING",
"229": "NOT_ALIVE",
"23": "NON_PARTICIPATING",
"230": "NON_PARTICIPATING",
"231": "NOT_ALIVE",
"232": "NOT_ALIVE",
"233": "NON_PARTICIPATING",
"234": "NOT_ALIVE",
"235": "NOT_ALIVE",
"236": "NON_PARTICIPATING",
"237": "NON_PARTICIPATING",
"238": "NON_PARTICIPATING",
"239": "NOT_ALIVE",
"24": "NOT_ALIVE",
"240": "NOT_ALIVE",
"241": "NON_PARTICIPATING",
"242": "NON_PARTICIPATING",
"243": "SUCCESS",
"244": "NOT_ALIVE",
"245": "NOT_ALIVE",
"246": "NOT_ALIVE",
"247": "NON_PARTICIPATING",
"248": "NON_PARTICIPATING",
"249": "NON_PARTICIPATING",
"25": "SUCCESS",
"250": "NON_PARTICIPATING",
"251": "NOT_ALIVE",
"252": "NOT_ALIVE",
"253": "NOT_ALIVE",
"254": "SUCCESS",
"255": "NOT_ALIVE",
"26": "NON_PARTICIPATING",
"27": "NOT_ALIVE",
"28": "NOT_ALIVE",
"29": "NOT_ALIVE",
"3": "NON_PARTICIPATING",
"30": "SUCCESS",
"31": "NOT_ALIVE",
"32": "NOT_ALIVE",
"33": "NOT_ALIVE",
"34": "NOT_ALIVE",
"35": "SUCCESS",
"36": "NON_PARTICIPATING",
"37": "NOT_ALIVE",
"38": "NON_PARTICIPATING",
"39": "SUCCESS",
"4": "NOT_ALIVE",
"40": "NON_PARTICIPATING",
"41": "NON_PARTICIPATING",
"42": "NOT_ALIVE",
"43": "NOT_ALIVE",
"44": "NOT_ALIVE",
"45": "NOT_ALIVE",
"46": "NON_PARTICIPATING",
"47": "SUCCESS",
"48": "NOT_ALIVE",
"49": "NON_PARTICIPATING",
"5": "SUCCESS",
"50": "NON_PARTICIPATING",
"51": "NOT_ALIVE",
"52": "NOT_ALIVE",
"53": "NON_PARTICIPATING",
"54": "NOT_ALIVE",
"55": "NOT_ALIVE",
"56": "NON_PARTICIPATING",
"57": "NOT_ALIVE",
"58": "NOT_ALIVE",
"59": "NON_PARTICIPATING",
"6": "NOT_ALIVE",
"60": "NOT_ALIVE",
"61": "NON_PARTICIPATING",
"62": "NOT_ALIVE",
"63": "NON_PARTICIPATING",
"64": "NOT_ALIVE",
"65": "NOT_ALIVE",
"66": "NON_PARTICIPATING",
"67": "NOT_ALIVE",
"68": "NOT_ALIVE",
"69": "NOT_ALIVE",
"7": "NOT_ALIVE",
"70": "NON_PARTICIPATING",
"71": "NON_PARTICIPATING",
"72": "NON_PARTICIPATING",
"73": "NON_PARTICIPATING",
"74": "NOT_ALIVE",
"75": "SUCCESS",
"76": "NOT_ALIVE",
"77": "SUCCESS",
"78": "NON_PARTICIPATING",
"79": "NON_PARTICIPATING",
"8": "NOT_ALIVE",
"80": "NON_PARTICIPATING",
"81": "NON_PARTICIPATING",
"82": "NON_PARTICIPATING",
"83": "NON_PARTICIPATING",
"84": "NOT_ALIVE",
"85": "NON_PARTICIPATING",
"86": "NOT_ALIVE",
"87": "NOT_ALIVE",
"88": "NON_PARTICIPATING",
"89": "NOT_ALIVE",
"9": "NOT_ALIVE",
"90": "NOT_ALIVE",
"91": "NON_PARTICIPATING",
"92": "NOT_ALIVE",
"93": "NOT_ALIVE",
"94": "NOT_ALIVE",
"95": "NOT_ALIVE",
"96": "NOT_ALIVE",
"97": "NON_PARTICIPATING",
"98": "NOT_ALIVE",
"99": "NOT_ALIVE"
},
"architectures": [
"LlamaForCausalLM"
],
"attention_bias": false,
"attention_dropout": 0.0,
"block_list": [
6031159,
6031163
],
"bos_token_id": 1,
"eos_token_id": 2,
"hidden_act": "silu",
"hidden_size": 2048,
"initializer_range": 0.02,
"inner_step": 387,
"intermediate_size": 5632,
"last_allreduce_block": 6028406,
"max_position_embeddings": 2048,
"mlp_bias": false,
"model_type": "llama",
"num_attention_heads": 32,
"num_hidden_layers": 22,
"num_key_value_heads": 4,
"pretraining_tp": 1,
"rms_norm_eps": 1e-05,
"rope_scaling": null,
"rope_theta": 10000.0,
"tie_word_embeddings": false,
"torch_dtype": "float32",
"transformers_version": "4.39.3",
"use_cache": false,
"vocab_size": 32000
}
|