We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent e5f1f4a, commit d6f3c79 (Copy full SHA for d6f3c79)
tests/v1/spec_decode/test_max_len.py
@@ -47,7 +47,7 @@ def test_eagle_max_len(
47
"multi-token eagle spec decode on current platform"
48
)
49
50
- if attn_backend == "FLASH_ATTN" and current_platform.is_rocm():
+ if attn_backend == "ROCM_AITER_FA" and current_platform.is_rocm():
51
m.setenv("VLLM_ROCM_USE_AITER", "1")
52
53
llm = LLM(
0 commit comments