---
# Quantization recipe: one stage (`default_stage`) containing a single
# `QuantizationModifier` with one config group (`group_0`).
#
# NOTE(review): this document was previously collapsed onto a single line,
# which does not parse as nested block mappings. The nesting below was
# reconstructed from key order and from the repeated `targets` key (it cannot
# legally appear twice inside `group_0`) -- confirm against the schema of the
# tool that consumes this recipe.
default_stage:
  default_modifiers:
    QuantizationModifier:
      config_groups:
        group_0:
          targets: [Linear]

          # Weights: 4-bit float, symmetric, groups of 16, static
          # (`dynamic: false`), with scales stored as float8_e4m3fn.
          weights:
            num_bits: 4
            type: float
            symmetric: true
            group_size: 16
            strategy: tensor_group
            block_structure: null
            dynamic: false
            actorder: null
            scale_dtype: torch.float8_e4m3fn
            zp_dtype: null
            observer: memoryless_minmax
            observer_kwargs: {}

          # Input activations: same 4-bit float / group-of-16 layout as the
          # weights, but with a different observer and no explicit scale dtype.
          input_activations:
            num_bits: 4
            type: float
            symmetric: true
            group_size: 16
            strategy: tensor_group
            block_structure: null
            # `local` is a plain string here, not a boolean.
            # NOTE(review): presumably selects a partially dynamic mode in
            # the consumer -- confirm the accepted values.
            dynamic: local
            actorder: null
            scale_dtype: null
            zp_dtype: null
            observer: static_minmax
            observer_kwargs: {}

          # Output activations are not configured for this group.
          output_activations: null
          format: null

      # Modifier-level settings.
      # NOTE(review): placed here (not in `group_0`) because `group_0`
      # already defines `targets` -- verify.
      targets: [Linear]
      # Entries carry an `re:` prefix; presumably regular expressions matched
      # against module names to exclude them from quantization -- confirm.
      ignore:
        - 're:.*lm_head'
        - 're:model.multi_modal_projector.*'
        - 're:model.vision_tower.*'
        - 're:.*mlp.gate$'
        - 're:.*self_attn'
      bypass_divisibility_checks: false