Only enable the hybrid KV cache allocator on the CUDA platform

heheda12345 · heheda12345 · commit e5cb02e6755c · 2025-04-25T23:57:46.000-07:00
Signed-off-by: Chen Zhang <zhangch99@outlook.com>
diff --git a/vllm/v1/core/kv_cache_utils.py b/vllm/v1/core/kv_cache_utils.py
@@ -801,7 +801,8 @@ def get_kv_cache_config(vllm_config: VllmConfig,
         The generated KVCacheConfigs
     """
     check_enough_kv_cache_memory(vllm_config, kv_cache_spec, available_memory)
-    if vllm_config.cache_config.disable_hybrid_allocator:
+    if (vllm_config.cache_config.disable_hybrid_allocator
+            or vllm_config.device_config.device.type != "cuda"):
         unify_hybrid_kv_cache_specs(kv_cache_spec)
     if is_kv_cache_type_uniform(kv_cache_spec):
         # KV cache of all layers are the same, which is true for