File size: 563 Bytes
6ab70fa
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
---
# Mixture-of-experts merge recipe (the keys look like a mergekit-moe config;
# TODO confirm against the tool that consumes this file).
# Every expert listed below is the same checkpoint as the base model, so the
# model ID is written once and referenced through an anchor to stay in sync.
base_model: &base_checkpoint meta-llama/Meta-Llama-3-8B
# NOTE(review): presumably selects random gate/router initialisation; verify.
gate_mode: random
dtype: bfloat16
# Ten experts, each an alias of the base checkpoint.
experts:
  - source_model: *base_checkpoint
  - source_model: *base_checkpoint
  - source_model: *base_checkpoint
  - source_model: *base_checkpoint
  - source_model: *base_checkpoint
  - source_model: *base_checkpoint
  - source_model: *base_checkpoint
  - source_model: *base_checkpoint
  - source_model: *base_checkpoint
  - source_model: *base_checkpoint


# Next step: train the resulting merged model.