File size: 303 Bytes
bb4b4e1
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18

# Mixture-of-experts merge recipe. The key layout looks like a mergekit-moe
# config — TODO confirm against the tool that consumes this file.
# Every model reference below is the same checkpoint, Qwen/Qwen2-7B.
base_model: Qwen/Qwen2-7B
# NOTE(review): presumably selects randomly initialised gates instead of
# prompt-derived ones, which would explain why every positive_prompts list
# in this file is empty — verify.
gate_mode: random
architecture: qwen
dtype: bfloat16
# Two expert entries, both pointing at the same source model as base_model.
experts:
  - source_model: Qwen/Qwen2-7B
    positive_prompts: []

  - source_model: Qwen/Qwen2-7B
    positive_prompts: []

# A single shared-expert entry; the only entry that sets residual_scale.
shared_experts:
  - source_model: Qwen/Qwen2-7B
    positive_prompts: []
    # NOTE(review): presumably scales down this expert's contribution to the
    # output — confirm the exact semantics in the consumer's documentation.
    residual_scale: 0.1