diff --git a/vllm/executor/ray_gpu_executor.py b/vllm/executor/ray_gpu_executor.py index 1c2c6f5f40de8..4e32730cf5c6a 100644 --- a/vllm/executor/ray_gpu_executor.py +++ b/vllm/executor/ray_gpu_executor.py @@ -242,8 +242,9 @@ def sort_by_driver_then_worker_ip(worker): VLLM_INSTANCE_ID, "VLLM_TRACE_FUNCTION": str(envs.VLLM_TRACE_FUNCTION), - "VLLM_ATTENTION_BACKEND": (str(envs.VLLM_ATTENTION_BACKEND) if - envs.VLLM_ATTENTION_BACKEND else None), + "VLLM_ATTENTION_BACKEND": + (envs.VLLM_ATTENTION_BACKEND + if envs.VLLM_ATTENTION_BACKEND else "FLASH_ATTN"), }, ) for (node_id, _) in worker_node_and_gpu_ids] self._env_vars_for_all_workers = (