---
# Mixture-of-experts merge configuration: one shared base model plus a list
# of expert models, each with prompts describing what the expert is good at.
# NOTE(review): the key names match the mergekit-moe config schema — confirm
# against the consuming tool.

# Model that the experts are merged around.
base_model: mistralai/Mistral-7B-Instruct-v0.1

# How the router gates are initialized.
gate_mode: random  # one of "hidden", "cheap_embed", or "random"

dtype: bfloat16  # output dtype (float32, float16, or bfloat16)

## (optional)
# experts_per_token: 2

# One entry per expert. Each entry names the source model and the prompts
# associated with it.
# NOTE(review): all six entries carry the same placeholder prompt text
# (it still refers to "expert_model_1"). Presumably harmless while
# gate_mode is "random"; replace with real per-expert prompts before
# switching to a prompt-driven gate mode — TODO confirm.
experts:
  - source_model: Treza12/Biomistral-Class0-Full
    positive_prompts:
      - "This is a prompt that is demonstrative of what expert_model_1 excels at"
  - source_model: Treza12/Biomistral-Class1-Full
    positive_prompts:
      - "This is a prompt that is demonstrative of what expert_model_1 excels at"
  - source_model: Treza12/Biomistral-Class2-Full
    positive_prompts:
      - "This is a prompt that is demonstrative of what expert_model_1 excels at"
  - source_model: Treza12/Biomistral-Class3-Full
    positive_prompts:
      - "This is a prompt that is demonstrative of what expert_model_1 excels at"
  - source_model: Treza12/Biomistral-Class4-Full
    positive_prompts:
      - "This is a prompt that is demonstrative of what expert_model_1 excels at"
  - source_model: Treza12/Biomistral-Class5-Full
    positive_prompts:
      - "This is a prompt that is demonstrative of what expert_model_1 excels at"