# Qwen2.5-Coder-7B-Chat-8x-MoE / mergekit_moe_config.yml
# BenevolenceMessiah's picture
# Upload 31 files
# b4a6b43 verified
# raw
# history blame
# 701 Bytes
---
# mergekit MoE merge configuration.
# Declares eight expert entries plus one shared expert; every entry points at
# the same checkpoint that is used as `base_model`.
base_model: Qwen/Qwen2.5-Coder-7B
# NOTE(review): `random` presumably initialises the router gates randomly
# instead of deriving them from prompts - confirm against the mergekit docs.
gate_mode: random
dtype: bfloat16
# Output MoE architecture for the merge as a whole.
architecture: qwen

# NOTE(review): the per-entry `architecture` keys below are carried over from
# the original file, now nested under their list items so the document parses.
# Confirm that mergekit accepts (or ignores) this key on expert entries.
experts:
  - source_model: Qwen/Qwen2.5-Coder-7B
    architecture: qwen
  - source_model: Qwen/Qwen2.5-Coder-7B
    architecture: qwen
  - source_model: Qwen/Qwen2.5-Coder-7B
    architecture: qwen
  - source_model: Qwen/Qwen2.5-Coder-7B
    architecture: qwen
  - source_model: Qwen/Qwen2.5-Coder-7B
    architecture: qwen
  - source_model: Qwen/Qwen2.5-Coder-7B
    architecture: qwen
  - source_model: Qwen/Qwen2.5-Coder-7B
    architecture: qwen
  - source_model: Qwen/Qwen2.5-Coder-7B
    architecture: qwen

# A single shared expert, sourced from the same checkpoint as the others.
shared_experts:
  - source_model: Qwen/Qwen2.5-Coder-7B
    architecture: qwen