From 1ac4ccf73c91370f1fcb4f60c1117646cd7a7502 Mon Sep 17 00:00:00 2001 From: Woosuk Kwon Date: Thu, 21 Sep 2023 00:52:47 -0700 Subject: [PATCH] Add float16 and float32 (#1115) --- vllm/engine/arg_utils.py | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/vllm/engine/arg_utils.py b/vllm/engine/arg_utils.py index a03155a4..65a5d74f 100644 --- a/vllm/engine/arg_utils.py +++ b/vllm/engine/arg_utils.py @@ -93,7 +93,9 @@ class EngineArgs: '--dtype', type=str, default=EngineArgs.dtype, - choices=['auto', 'half', 'bfloat16', 'float'], + choices=[ + 'auto', 'half', 'float16', 'bfloat16', 'float', 'float32' + ], help='data type for model weights and activations. ' 'The "auto" option will use FP16 precision ' 'for FP32 and FP16 models, and BF16 precision '