diff --git a/auto_gptq/modeling/qwen.py b/auto_gptq/modeling/qwen.py index 8ac32eb..1572bb1 100644 --- a/auto_gptq/modeling/qwen.py +++ b/auto_gptq/modeling/qwen.py @@ -4,7 +4,7 @@ from ._base import * class QwenGPTQForCausalLM(BaseGPTQForCausalLM): layer_type = "QWenBlock" layers_block_name = "transformer.h" - outside_layer_modules = ["transformer.wte", "transformer.wpe", "transformer.ln_f"] + outside_layer_modules = ["transformer.wte", "transformer.wpe", "transformer.ln_f", "transformer.visual"] inside_layer_modules = [ ["attn.c_attn"], ["attn.c_proj"],