We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent c0de053 commit 2dee3ab Copy full SHA for 2dee3ab
vllm_ascend/patch/platform/patch_platform.py
vllm_ascend/platform.py
@@ -388,6 +388,9 @@ def get_attn_backend_cls(
388
use_mla,
389
has_sink=False,
390
use_sparse=False,
391
+ # NOTE: Please pay special attention to the order of these parameters.
392
+ # Although we are only using some of them so far,
393
+ # vllm passes them in sequence when using this interface.
394
use_mm_prefix: bool = False,
395
attn_type: str | None = None,
396
):
0 commit comments