We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent a5bd54a · commit 9a17437 (copy full SHA for 9a17437)
vllm/v1/worker/utils.py
@@ -316,11 +316,7 @@ def bind_kv_cache(
     # TODO - analyze where runner_kv_caches is used and the right
     # way to ensure it properly reflects multiple attention layers
     # in the same decoder block.
-    if (
-        current_platform.is_cuda()
-        or current_platform.is_xpu()
-        or current_platform.is_rocm()
-    ):
+    if current_platform.is_cuda_alike() or current_platform.is_xpu():
        # We know that the GPU runner is not impacted by this
        # case. Some test code depends on runner_kv_caches, but
        # not in a way that's impacted by ignoring this.
0 commit comments