enforce eager mode with bnb quantization temporarily (#6846)

This commit is contained in:
chenqianfzh 2024-07-26 18:32:20 -07:00 committed by GitHub
parent b5f49ee55b
commit bb5494676f
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@@ -282,6 +282,10 @@ class ModelConfig:
raise ValueError(
"BitAndBytes quantization with TP or PP is not supported yet.")
if self.quantization == "bitsandbytes" and self.enforce_eager is False:
raise ValueError(
"BitAndBytes with enforce_eager = False is not supported yet.")
def get_hf_config_sliding_window(self) -> Optional[int]:
"""Get the sliding window size, or None if disabled."""