# Quantization recipe: one stage holding one modifier group with a single
# QuantizationModifier entry.
# NOTE(review): nesting was reconstructed from the key order after the original
# indentation was lost and stray trailing "| |" table residue was removed from
# every line — confirm against the tool that emitted this recipe.
DEFAULT_stage:
  DEFAULT_modifiers:
    QuantizationModifier:
      # Module names left out of quantization.
      ignore: [lm_head]
      # Module type the scheme is applied to.
      targets: Linear
      # Preset scheme name; presumably 4-bit weights with 16-bit activations —
      # TODO confirm against the quantization library's preset table.
      scheme: W4A16
      # KV-cache quantization arguments: 8-bit int, symmetric, one scale per
      # tensor, non-dynamic (dynamic: false).
      kv_cache_scheme: {num_bits: 8, type: int, symmetric: true, strategy: tensor, dynamic: false}
# Quantization recipe: one stage holding one modifier group with a single
# QuantizationModifier entry.
# NOTE(review): this mapping repeats, key for key, the DEFAULT_stage recipe on
# the seven lines directly before it. A duplicate top-level key in a single
# YAML document is rejected or silently collapsed depending on the parser —
# confirm whether this is a separate document or an extraction duplicate.
# NOTE(review): nesting was reconstructed from the key order after the original
# indentation was lost and stray trailing "| |" table residue was removed from
# every line — confirm against the tool that emitted this recipe.
DEFAULT_stage:
  DEFAULT_modifiers:
    QuantizationModifier:
      # Module names left out of quantization.
      ignore: [lm_head]
      # Module type the scheme is applied to.
      targets: Linear
      # Preset scheme name; presumably 4-bit weights with 16-bit activations —
      # TODO confirm against the quantization library's preset table.
      scheme: W4A16
      # KV-cache quantization arguments: 8-bit int, symmetric, one scale per
      # tensor, non-dynamic (dynamic: false).
      kv_cache_scheme: {num_bits: 8, type: int, symmetric: true, strategy: tensor, dynamic: false}