From 00e6a2dc535c89ac7c92551ef9b92acd8664df02 Mon Sep 17 00:00:00 2001
From: Ali Panahi <64020589+c3-ali@users.noreply.github.com>
Date: Tue, 11 Jun 2024 10:40:23 -0700
Subject: [PATCH] [Bugfix] fix lora_dtype value type in arg_utils.py (#5398)

---
 vllm/engine/arg_utils.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/vllm/engine/arg_utils.py b/vllm/engine/arg_utils.py
index e0aadece..f87ee130 100644
--- a/vllm/engine/arg_utils.py
+++ b/vllm/engine/arg_utils.py
@@ -68,7 +68,7 @@ class EngineArgs:
     fully_sharded_loras: bool = False
     lora_extra_vocab_size: int = 256
     long_lora_scaling_factors: Optional[Tuple[float]] = None
-    lora_dtype = 'auto'
+    lora_dtype: str = 'auto'
     max_cpu_loras: Optional[int] = None
     device: str = 'auto'
     ray_workers_use_nsight: bool = False