# Single-stage configuration: `default_stage.default_modifiers` holds two
# modifier entries, SmoothQuantModifier and GPTQModifier.
# NOTE(review): key order below is kept as found; whether the consumer applies
# the modifiers in this order is not visible here - confirm before reordering.
default_stage:
  default_modifiers:
    SmoothQuantModifier:
      smoothing_strength: 0.8
      # Each mapping is a 2-element tuple: a list of patterns, then a single
      # pattern. Presumably (projection layers, the norm layer feeding them)
      # - TODO confirm against the modifier's documentation.
      # NOTE(review): `!!python/tuple` is a Python-specific tag; safe YAML
      # loaders reject it, so this file needs a loader that defines the tag.
      mappings:
        - !!python/tuple
          - ['re:.*q_proj', 're:.*k_proj', 're:.*v_proj']
          - 're:.*input_layernorm'
        - !!python/tuple
          - ['re:.*gate_proj', 're:.*up_proj']
          - 're:.*post_attention_layernorm'
      # Patterns anchored at names starting with `audio_projector.` or
      # `audio_encoder.`; single quotes keep the backslashes literal.
      ignore: ['re:^audio_projector\..*', 're:^audio_encoder\..*']
    GPTQModifier:
      targets: [Linear]
      # Same audio patterns as the SmoothQuantModifier ignore list, plus the
      # literal name `decoder.lm_head`.
      ignore:
        - decoder.lm_head
        - 're:^audio_projector\..*'
        - 're:^audio_encoder\..*'
      # Presumably 4-bit weights / 16-bit activations - verify against the
      # consumer's list of preset scheme names.
      scheme: W4A16
      sequential_update: true
      block_size: 128
      dampening_frac: 0.01
      offload_hessians: false