Skip to content

Commit 7d46886

Browse files
committed
change condition
1 parent 24a9474 commit 7d46886

File tree

1 file changed

+5
-5
lines changed

1 file changed

+5
-5
lines changed

vllm/platforms/rocm.py

Lines changed: 5 additions & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -184,14 +184,14 @@ def get_attn_backend_cls(cls, selected_backend, head_size, dtype,
184 184
selected_backend = (_Backend.ROCM_FLASH if selected_backend
185 185
== _Backend.FLASH_ATTN else selected_backend)
186 186
if envs.VLLM_USE_V1:
187-
if envs.VLLM_USE_TRITON_FLASH_ATTN:
188-
logger.info("Using Triton Attention backend on V1 engine.")
189-
return ("vllm.v1.attention.backends."
190-
"triton_attn.TritonAttentionBackend")
191-
else:
187+
if envs.VLLM_ROCM_USE_AITER:
192 188
logger.info("Using Flash Attention backend on V1 engine.")
193 189
return ("vllm.v1.attention.backends."
194 190
"flash_attn.FlashAttentionBackend")
191+
else:
192+
logger.info("Using Triton Attention backend on V1 engine.")
193+
return ("vllm.v1.attention.backends."
194+
"triton_attn.TritonAttentionBackend")
195 195
if selected_backend == _Backend.ROCM_FLASH:
196 196
if not cls.has_device_capability(90):
197 197
# not Instinct series GPUs.

0 commit comments

Comments
 (0)