{
  "model_type": "MixtureOfExperts7M",
  "num_classes": 10,
  "num_experts": 16,
  "input_dim": 64,
  "expert_hidden1": 512,
  "expert_hidden2": 512,
  "expert_output_dim": 256,
  "gate_hidden": 512,
  "parameter_count": 6880282,
  "framework": "pytorch"
}
{
  "model_type": "MixtureOfExperts7M",
  "num_classes": 10,
  "num_experts": 16,
  "input_dim": 64,
  "expert_hidden1": 512,
  "expert_hidden2": 512,
  "expert_output_dim": 256,
  "gate_hidden": 512,
  "parameter_count": 6880282,
  "framework": "pytorch"
}