We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent b3a0d01 commit 64862d1 (Copy full SHA for 64862d1)
vllm/attention/ops/prefix_prefill.py
@@ -11,7 +11,7 @@
11
12
# Static kernels parameters
13
BASE_BLOCK = 128 if current_platform.has_device_capability(80) else 64
14
-NUM_WARPS = 8
+NUM_WARPS = 4 if current_platform.is_rocm() else 8
15
16
# To check compatibility
17
IS_TURING = current_platform.get_device_capability() == (7, 5)
0 commit comments