# Quantization recipe: a single stage ("quant_stage") containing one
# QuantizationModifier that declares a KV-cache quantization scheme.
# NOTE(review): nesting was reconstructed from a flattened copy of this file
# (indentation lost, stray "| |" table residue on every line) — confirm it
# matches the recipe that was actually used.
quant_stage:
  quant_modifiers:
    QuantizationModifier:
      # Module types selected by the modifier; nothing is excluded.
      targets: [Linear]
      ignore: []
      # Quantization arguments for the KV cache: 8-bit float, symmetric,
      # strategy "tensor", static (dynamic: false), calibrated with the
      # "minmax" observer. Null entries are left unset.
      kv_cache_scheme:
        num_bits: 8
        type: float
        symmetric: true
        group_size: null
        strategy: tensor
        block_structure: null
        dynamic: false
        actorder: null
        observer: minmax
        observer_kwargs: {}