# DeepSeek-Coder-Instruct-8x1.3b / mergekit_moe_config.yml
# SanjiWatsuki's picture
# Upload folder using huggingface_hub
# a24af6d verified
# raw
# history blame contribute delete
# No virus
# 785 Bytes
# Mixture-of-experts merge configuration.
# Every expert below is the same checkpoint as base_model, so the merge
# combines eight copies of one model.
base_model: deepseek-ai/deepseek-coder-1.3b-instruct
# NOTE(review): with random gating the prompts below are presumably not
# used to initialise the router -- confirm against the mergekit docs.
gate_mode: random
dtype: bfloat16
# Each list item is one expert: a mapping that carries both its
# source_model and its positive_prompts. The prompt list is nested under
# the item so it belongs to that expert rather than to the top level.
experts:
  - source_model: deepseek-ai/deepseek-coder-1.3b-instruct
    positive_prompts: [""]
  - source_model: deepseek-ai/deepseek-coder-1.3b-instruct
    positive_prompts: [""]
  - source_model: deepseek-ai/deepseek-coder-1.3b-instruct
    positive_prompts: [""]
  - source_model: deepseek-ai/deepseek-coder-1.3b-instruct
    positive_prompts: [""]
  - source_model: deepseek-ai/deepseek-coder-1.3b-instruct
    positive_prompts: [""]
  - source_model: deepseek-ai/deepseek-coder-1.3b-instruct
    positive_prompts: [""]
  - source_model: deepseek-ai/deepseek-coder-1.3b-instruct
    positive_prompts: [""]
  - source_model: deepseek-ai/deepseek-coder-1.3b-instruct
    positive_prompts: [""]