[Core/Bugfix] pass VLLM_ATTENTION_BACKEND to ray workers (#8172)

This commit is contained in:
William Lin 2024-09-10 16:46:08 -07:00 committed by GitHub
parent 22f3a4bc6c
commit 1d5e397aa4
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@@ -242,6 +242,9 @@ class RayGPUExecutor(DistributedGPUExecutor):
VLLM_INSTANCE_ID,
"VLLM_TRACE_FUNCTION":
str(envs.VLLM_TRACE_FUNCTION),
**({
"VLLM_ATTENTION_BACKEND": envs.VLLM_ATTENTION_BACKEND
} if envs.VLLM_ATTENTION_BACKEND is not None else {})
}, ) for (node_id, _) in worker_node_and_gpu_ids]
self._env_vars_for_all_workers = (