Skip to content

Commit

Permalink
use MLA on rocm
Browse files Browse the repository at this point in the history
Signed-off-by: Hongxia Yang <hongxia.yang@amd.com>
  • Loading branch information
hongxiayang committed Feb 2, 2025
1 parent 0c1cc40 commit 3b84895
Showing 1 changed file with 0 additions and 3 deletions.
3 changes: 0 additions & 3 deletions vllm/platforms/rocm.py
Original file line number Diff line number Diff line change
Expand Up @@ -78,9 +78,6 @@ def get_attn_backend_cls(cls, selected_backend, head_size, dtype,
kv_cache_dtype, block_size, use_v1,
use_mla) -> str:
if use_mla:
if selected_backend and selected_backend != _Backend.TRITON_MLA:
logger.warning(f"Cannot use {selected_backend.name} "
"backend for MLA.")
logger.info("Using Triton MLA backend.")
return "vllm.attention.backends.triton_mla.TritonMLABackend"
selected_backend = (_Backend.ROCM_FLASH if selected_backend
Expand Down

0 comments on commit 3b84895

Please sign in to comment.