Skip to content

Commit

Permalink
Use FLASH_ATTN as the default VLLM_ATTENTION_BACKEND for Ray workers
Browse files Browse the repository at this point in the history
  • Loading branch information
SolitaryThinker committed Sep 6, 2024
1 parent 3e2cb99 commit e144cb6
Showing 1 changed file with 3 additions and 2 deletions.
5 changes: 3 additions & 2 deletions vllm/executor/ray_gpu_executor.py
Original file line number Diff line number Diff line change
Expand Up @@ -242,8 +242,9 @@ def sort_by_driver_then_worker_ip(worker):
VLLM_INSTANCE_ID,
"VLLM_TRACE_FUNCTION":
str(envs.VLLM_TRACE_FUNCTION),
- "VLLM_ATTENTION_BACKEND": (str(envs.VLLM_ATTENTION_BACKEND) if
- envs.VLLM_ATTENTION_BACKEND else None),
+ "VLLM_ATTENTION_BACKEND":
+ (envs.VLLM_ATTENTION_BACKEND
+ if envs.VLLM_ATTENTION_BACKEND else "FLASH_ATTN"),
}, ) for (node_id, _) in worker_node_and_gpu_ids]

self._env_vars_for_all_workers = (
Expand Down

0 comments on commit e144cb6

Please sign in to comment.