# Quantization recipe: a single stage (`default_stage`) holding one modifier,
# `AWQModifier`. Nesting below was restored from a flattened, pipe-wrapped
# dump; every key and value is unchanged.
default_stage:
  default_modifiers:
    AWQModifier:
      targets: [Linear]
      # Second entry is a regex (`re:` prefix) matching names that start with
      # model.layers.<N>.conv. ; single quotes keep the backslashes literal.
      ignore: [lm_head, 're:^model\.layers\.\d+\.conv\.']
      scheme: W4A16_ASYM
      # One entry per (smooth_layer -> balance_layers) pair, listed explicitly
      # for layers 0-15. Every layer has two feed-forward entries
      # (ffn_norm -> w1/w3, and w3 -> w2). Layers 2, 5, 8, 10, 12 and 14 also
      # have an operator_norm -> q_proj/k_proj/v_proj entry.
      # NOTE(review): the remaining layers have no self_attn entry here,
      # presumably because they are the conv layers excluded via `ignore`;
      # confirm against the model definition.
      mappings:
        - smooth_layer: model.layers.0.ffn_norm
          balance_layers: [model.layers.0.feed_forward.w1, model.layers.0.feed_forward.w3]
        - smooth_layer: model.layers.0.feed_forward.w3
          balance_layers: [model.layers.0.feed_forward.w2]
        - smooth_layer: model.layers.1.ffn_norm
          balance_layers: [model.layers.1.feed_forward.w1, model.layers.1.feed_forward.w3]
        - smooth_layer: model.layers.1.feed_forward.w3
          balance_layers: [model.layers.1.feed_forward.w2]
        - smooth_layer: model.layers.2.operator_norm
          balance_layers: [model.layers.2.self_attn.q_proj, model.layers.2.self_attn.k_proj,
            model.layers.2.self_attn.v_proj]
        - smooth_layer: model.layers.2.ffn_norm
          balance_layers: [model.layers.2.feed_forward.w1, model.layers.2.feed_forward.w3]
        - smooth_layer: model.layers.2.feed_forward.w3
          balance_layers: [model.layers.2.feed_forward.w2]
        - smooth_layer: model.layers.3.ffn_norm
          balance_layers: [model.layers.3.feed_forward.w1, model.layers.3.feed_forward.w3]
        - smooth_layer: model.layers.3.feed_forward.w3
          balance_layers: [model.layers.3.feed_forward.w2]
        - smooth_layer: model.layers.4.ffn_norm
          balance_layers: [model.layers.4.feed_forward.w1, model.layers.4.feed_forward.w3]
        - smooth_layer: model.layers.4.feed_forward.w3
          balance_layers: [model.layers.4.feed_forward.w2]
        - smooth_layer: model.layers.5.operator_norm
          balance_layers: [model.layers.5.self_attn.q_proj, model.layers.5.self_attn.k_proj,
            model.layers.5.self_attn.v_proj]
        - smooth_layer: model.layers.5.ffn_norm
          balance_layers: [model.layers.5.feed_forward.w1, model.layers.5.feed_forward.w3]
        - smooth_layer: model.layers.5.feed_forward.w3
          balance_layers: [model.layers.5.feed_forward.w2]
        - smooth_layer: model.layers.6.ffn_norm
          balance_layers: [model.layers.6.feed_forward.w1, model.layers.6.feed_forward.w3]
        - smooth_layer: model.layers.6.feed_forward.w3
          balance_layers: [model.layers.6.feed_forward.w2]
        - smooth_layer: model.layers.7.ffn_norm
          balance_layers: [model.layers.7.feed_forward.w1, model.layers.7.feed_forward.w3]
        - smooth_layer: model.layers.7.feed_forward.w3
          balance_layers: [model.layers.7.feed_forward.w2]
        - smooth_layer: model.layers.8.operator_norm
          balance_layers: [model.layers.8.self_attn.q_proj, model.layers.8.self_attn.k_proj,
            model.layers.8.self_attn.v_proj]
        - smooth_layer: model.layers.8.ffn_norm
          balance_layers: [model.layers.8.feed_forward.w1, model.layers.8.feed_forward.w3]
        - smooth_layer: model.layers.8.feed_forward.w3
          balance_layers: [model.layers.8.feed_forward.w2]
        - smooth_layer: model.layers.9.ffn_norm
          balance_layers: [model.layers.9.feed_forward.w1, model.layers.9.feed_forward.w3]
        - smooth_layer: model.layers.9.feed_forward.w3
          balance_layers: [model.layers.9.feed_forward.w2]
        - smooth_layer: model.layers.10.operator_norm
          balance_layers: [model.layers.10.self_attn.q_proj, model.layers.10.self_attn.k_proj,
            model.layers.10.self_attn.v_proj]
        - smooth_layer: model.layers.10.ffn_norm
          balance_layers: [model.layers.10.feed_forward.w1, model.layers.10.feed_forward.w3]
        - smooth_layer: model.layers.10.feed_forward.w3
          balance_layers: [model.layers.10.feed_forward.w2]
        - smooth_layer: model.layers.11.ffn_norm
          balance_layers: [model.layers.11.feed_forward.w1, model.layers.11.feed_forward.w3]
        - smooth_layer: model.layers.11.feed_forward.w3
          balance_layers: [model.layers.11.feed_forward.w2]
        - smooth_layer: model.layers.12.operator_norm
          balance_layers: [model.layers.12.self_attn.q_proj, model.layers.12.self_attn.k_proj,
            model.layers.12.self_attn.v_proj]
        - smooth_layer: model.layers.12.ffn_norm
          balance_layers: [model.layers.12.feed_forward.w1, model.layers.12.feed_forward.w3]
        - smooth_layer: model.layers.12.feed_forward.w3
          balance_layers: [model.layers.12.feed_forward.w2]
        - smooth_layer: model.layers.13.ffn_norm
          balance_layers: [model.layers.13.feed_forward.w1, model.layers.13.feed_forward.w3]
        - smooth_layer: model.layers.13.feed_forward.w3
          balance_layers: [model.layers.13.feed_forward.w2]
        - smooth_layer: model.layers.14.operator_norm
          balance_layers: [model.layers.14.self_attn.q_proj, model.layers.14.self_attn.k_proj,
            model.layers.14.self_attn.v_proj]
        - smooth_layer: model.layers.14.ffn_norm
          balance_layers: [model.layers.14.feed_forward.w1, model.layers.14.feed_forward.w3]
        - smooth_layer: model.layers.14.feed_forward.w3
          balance_layers: [model.layers.14.feed_forward.w2]
        - smooth_layer: model.layers.15.ffn_norm
          balance_layers: [model.layers.15.feed_forward.w1, model.layers.15.feed_forward.w3]
        - smooth_layer: model.layers.15.feed_forward.w3
          balance_layers: [model.layers.15.feed_forward.w2]
      # NOTE(review): placed as AWQModifier options (siblings of `mappings`);
      # presumably they control the AWQ scale search. Confirm both placement
      # and meaning against the AWQModifier documentation.
      duo_scaling: true
      n_grid: 20