diff --git a/vllm/model_executor/models/mllama.py b/vllm/model_executor/models/mllama.py index 475364f3..44ef4972 100644 --- a/vllm/model_executor/models/mllama.py +++ b/vllm/model_executor/models/mllama.py @@ -1053,7 +1053,8 @@ class MllamaForConditionalGeneration(nn.Module, SupportsMultiModal): self.image_size = config.vision_config.image_size self.vision_model = MllamaVisionModel(config.vision_config, - quant_config) + quant_config, + prefix="vision_model") self.language_model = MllamaForCausalLM( config.text_config, cache_config=cache_config,