From ab9e8488d57687d1144e7b4802d195f35882ecdc Mon Sep 17 00:00:00 2001 From: forpanyang <138085590+forpanyang@users.noreply.github.com> Date: Fri, 10 Nov 2023 03:47:14 +0800 Subject: [PATCH] Add Yi model to quantization support (#1600) --- vllm/model_executor/model_loader.py | 1 + 1 file changed, 1 insertion(+) diff --git a/vllm/model_executor/model_loader.py b/vllm/model_executor/model_loader.py index 7fca7ebd..b18f9922 100644 --- a/vllm/model_executor/model_loader.py +++ b/vllm/model_executor/model_loader.py @@ -41,6 +41,7 @@ _MODEL_REGISTRY = { _MODEL_CLASSES_SUPPORT_QUANTIZATION = [ LlamaForCausalLM, MistralForCausalLM, + YiForCausalLM, ]