# Mixture-of-experts merge configuration.
# NOTE(review): the key names match the mergekit-moe config schema; confirm that
# is the tool consuming this file.
#
# Stray "|" table-delimiter characters were removed from every line: they made
# the document invalid YAML and would otherwise have been read as part of each
# value (e.g. "random |").

# Model named as the base of the merge.
base_model: meta-llama/Meta-Llama-3.1-8B-Instruct

# Gate initialisation mode. With "random" no per-expert prompts are listed
# below. NOTE(review): presumably the router gates are randomly initialised and
# the result is meant to be fine-tuned afterwards; verify against the tool docs.
gate_mode: random

# Data type setting for the merge (presumably the output tensor dtype; confirm).
dtype: bfloat16

# Eight expert entries; every one references the same checkpoint as base_model.
experts:
  - source_model: meta-llama/Meta-Llama-3.1-8B-Instruct
  - source_model: meta-llama/Meta-Llama-3.1-8B-Instruct
  - source_model: meta-llama/Meta-Llama-3.1-8B-Instruct
  - source_model: meta-llama/Meta-Llama-3.1-8B-Instruct
  - source_model: meta-llama/Meta-Llama-3.1-8B-Instruct
  - source_model: meta-llama/Meta-Llama-3.1-8B-Instruct
  - source_model: meta-llama/Meta-Llama-3.1-8B-Instruct
  - source_model: meta-llama/Meta-Llama-3.1-8B-Instruct