# Mixture-of-experts merge configuration (keys look like a mergekit MoE
# config -- confirm against the consuming tool).

# Model that the expert entries below are combined with.
base_model: mistralai/Mistral-7B-Instruct-v0.1
gate_mode: random  # one of "hidden", "cheap_embed", or "random"
dtype: bfloat16  # output dtype (float32, float16, or bfloat16)

# Optional: uncomment to set the number of experts used per token.
# experts_per_token: 2

# One entry per expert: the model to take it from and the prompts that
# describe what that expert is good at.
# NOTE(review): every prompt still says "expert_model_1" (template
# placeholder text); with gate_mode "random" the prompts presumably do not
# influence gate initialisation -- confirm before switching gate_mode.
experts:
  - source_model: Treza12/Biomistral-Class0-Full
    positive_prompts:
      - "This is a prompt that is demonstrative of what expert_model_1 excels at Screening"
  - source_model: Treza12/Biomistral-Class1-Full
    positive_prompts:
      - "This is a prompt that is demonstrative of what expert_model_1 excels at Diagnosis"
  - source_model: Treza12/Biomistral-Class2-Full
    positive_prompts:
      - "This is a prompt that is demonstrative of what expert_model_1 excels at Staging"
  - source_model: Treza12/Biomistral-Class3-Full
    positive_prompts:
      - "This is a prompt that is demonstrative of what expert_model_1 excels at Treatment Selection"
  - source_model: Treza12/Biomistral-Class4-Full
    positive_prompts:
      - "This is a prompt that is demonstrative of what expert_model_1 excels at Prognosis"
  - source_model: Treza12/Biomistral-Class5-Full
    positive_prompts:
      - "This is a prompt that is demonstrative of what expert_model_1 excels at Follow-up"