Delete mergekit_moe_config.yml
Browse files
- mergekit_moe_config.yml +0 -14
mergekit_moe_config.yml
DELETED
@@ -1,14 +0,0 @@
-base_model: d:/_Qwen2.5-Coder-7B-Instruct
-gate_mode: random
-architecture: qwen
-dtype: bfloat16
-experts_per_token: 2
-experts:
-  - source_model: d:/_Qwen2.5-Coder-7B-Instruct
-  - source_model: d:/_Qwen2.5-OlympicCoder-7B
-  - source_model: d:/_Qwen2.5-CodeV-R1-Qwen-7B
-  - source_model: d:/_Qwen2.5-VisCoder-7B
-
-shared_experts:
-  - source_model: d:/_Qwen2.5-Coder-7B-Instruct
-    residual_scale: 0.1 # downweight output from shared expert to prevent overcooking the model