warshanks committed on
Commit
b294fce
·
verified ·
1 Parent(s): e5daa68

Upload recipe.yaml with huggingface_hub

Browse files
Files changed (1) hide show
  1. recipe.yaml +16 -0
recipe.yaml ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
+ default_stage:
+   default_modifiers:
+     AWQModifier:
+       targets: [Linear]
+       ignore: [lm_head]
+       scheme: W4A16_ASYM
+       mappings:
+       - smooth_layer: re:.*input_layernorm$
+         balance_layers: ['re:.*q_proj$', 're:.*k_proj$', 're:.*v_proj$']
+       - smooth_layer: re:.*v_proj$
+         balance_layers: ['re:.*o_proj$']
+       - smooth_layer: re:.*post_attention_layernorm$
+         balance_layers: ['re:.*gate_proj$', 're:.*up_proj$']
+       - smooth_layer: re:.*up_proj$
+         balance_layers: ['re:.*down_proj$']
+       duo_scaling: true