We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
get_cu_count
1 parent 86d15bf, commit 8da2f28. Copy full SHA for 8da2f28
vllm/v1/attention/backends/rocm_aiter_fa.py
@@ -18,6 +18,7 @@
18
from vllm.logger import init_logger
19
from vllm.platforms import current_platform
20
from vllm.utils.math_utils import cdiv
21
+from vllm.utils.platform_utils import get_cu_count
22
from vllm.v1.attention.backends.utils import (
23
AttentionCGSupport,
24
AttentionMetadataBuilder,
@@ -38,7 +39,7 @@ def block_size(x, head_dim):
38
39
return min(65536 // x.element_size(), triton.next_power_of_2(head_dim))
40
41
def num_programs(total_tokens):
- return min(total_tokens, current_platform.get_cu_count())
42
+ return min(total_tokens, get_cu_count())
43
44
@triton.jit
45
def cp_mha_gather_cache_kernel(
0 commit comments