# Quantization recipe: one stage (default_stage) holding one modifier
# (QuantizationModifier).
# NOTE(review): the nesting below was reconstructed from a flattened
# single-line form. `targets` occurs twice, so the first is placed in
# group_0 and the second on the modifier; `format` is placed in group_0.
# Confirm against the consuming tool's schema.
default_stage:
  default_modifiers:
    QuantizationModifier:
      config_groups:
        group_0:
          targets: [Linear]
          # Weights: 8-bit float, symmetric, non-dynamic, block strategy
          # with a [128, 128] block structure and a minmax observer.
          weights:
            num_bits: 8
            type: float
            symmetric: true
            group_size: null
            strategy: block
            block_structure: [128, 128]
            dynamic: false
            actorder: null
            observer: minmax
            observer_kwargs: {}
          # Input activations: 8-bit float, symmetric, dynamic, group
          # strategy with group_size 128; no observer is configured.
          input_activations:
            num_bits: 8
            type: float
            symmetric: true
            group_size: 128
            strategy: group
            block_structure: null
            dynamic: true
            actorder: null
            observer: null
            observer_kwargs: {}
          # No output-activation settings and no explicit format are given.
          output_activations: null
          format: null
      targets: [Linear]
      # Presumably the modules excluded from quantization; verify against
      # the consumer.
      ignore: [lm_head]
      # KV cache: 8-bit float, symmetric, non-dynamic, tensor strategy
      # with a minmax observer.
      kv_cache_scheme:
        num_bits: 8
        type: float
        symmetric: true
        group_size: null
        strategy: tensor
        block_structure: null
        dynamic: false
        actorder: null
        observer: minmax
        observer_kwargs: {}