{
  "base_model": "/mnt/1tb/Qwen2.5-14B-Instruct",
  "model_name": "Outlier V3.2",
  "num_layers": 48,
  "hidden_size": 5120,
  "intermediate_size": 13824,
  "moe_layers": [
    11,
    12,
    13,
    14,
    15,
    16,
    17,
    18,
    19,
    20,
    21,
    22,
    23,
    24,
    25,
    26,
    27,
    28,
    29,
    30,
    31,
    32,
    33,
    34,
    35,
    36
  ],
  "experts_per_layer": 8,
  "top_k": 2,
  "representation": "zero-delta ternary expert overlays over dense Qwen2.5 shared MLPs"
}