# Quantization recipe: one stage containing a single GPTQModifier entry.
# NOTE(review): the nesting below was reconstructed from a single-line form of
# this file; key names, values and key order are unchanged. Confirm the
# placement of each key against the consumer's schema.
quant_stage:
  quant_modifiers:
    GPTQModifier:
      config_groups:
        group_0:
          targets: [Linear]
          # Weight settings for this group: 4-bit symmetric int, channel
          # strategy, non-dynamic.
          weights:
            num_bits: 4
            type: int
            symmetric: true
            group_size: null
            strategy: channel
            block_structure: null
            dynamic: false
            actorder: null
            scale_dtype: null
            zp_dtype: null
            observer: memoryless_minmax
            observer_kwargs: {}
          # No activation settings are given for this group.
          input_activations: null
          output_activations: null
          format: null
      # Second `targets` key: it must live at a different level than the one
      # in group_0, otherwise it would be a duplicate key.
      # NOTE(review): presumably modifier-level targets/ignore - confirm.
      targets: [Linear]
      ignore: [lm_head]
      # KV-cache settings: 8-bit symmetric float, tensor strategy, non-dynamic.
      kv_cache_scheme:
        num_bits: 8
        type: float
        symmetric: true
        group_size: null
        strategy: tensor
        block_structure: null
        dynamic: false
        actorder: null
        scale_dtype: null
        zp_dtype: null
        observer: memoryless_minmax
        observer_kwargs: {}
      # NOTE(review): the four options below are assumed to belong to the
      # modifier itself rather than to kv_cache_scheme - confirm.
      bypass_divisibility_checks: false
      block_size: 128
      dampening_frac: 0.01
      offload_hessians: false