Skip to content

Commit 3523ce5

Browse files
committed
use MLA on rocm
Signed-off-by: Hongxia Yang <[email protected]>
1 parent 2fa8a9d commit 3523ce5

File tree

1 file changed

+0
-3
lines changed

1 file changed

+0
-3
lines changed

vllm/platforms/rocm.py

Lines changed: 0 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -78,9 +78,6 @@ def get_attn_backend_cls(cls, selected_backend, head_size, dtype,
78 78
kv_cache_dtype, block_size, use_v1,
79 79
use_mla) -> str:
80 80
if use_mla:
81-
if selected_backend and selected_backend != _Backend.TRITON_MLA:
82-
logger.warning(f"Cannot use {selected_backend.name} "
83-
"backend for MLA.")
84 81
logger.info("Using Triton MLA backend.")
85 82
return "vllm.attention.backends.triton_mla.TritonMLABackend"
86 83
selected_backend = (_Backend.ROCM_FLASH if selected_backend

0 commit comments

Comments
 (0)