| base_model: meta-llama/Meta-Llama-3.1-8B-Instruct | |
| gate_mode: random | |
| dtype: bfloat16 | |
| experts: | |
| - source_model: meta-llama/Meta-Llama-3.1-8B-Instruct | |
| - source_model: meta-llama/Meta-Llama-3.1-8B-Instruct | |
| - source_model: meta-llama/Meta-Llama-3.1-8B-Instruct | |
| - source_model: meta-llama/Meta-Llama-3.1-8B-Instruct | |
| - source_model: meta-llama/Meta-Llama-3.1-8B-Instruct | |
| - source_model: meta-llama/Meta-Llama-3.1-8B-Instruct | |
| - source_model: meta-llama/Meta-Llama-3.1-8B-Instruct | |
| - source_model: meta-llama/Meta-Llama-3.1-8B-Instruct | |