Skip to content

Commit 0044c40

Browse files
[BugFix][DeepSeek-V3.2] Fix backend selection logic for Blackwell (#30195)
1 parent b952f4d commit 0044c40

File tree

1 file changed

+2
-2
lines changed

1 file changed

+2
-2
lines changed

vllm/platforms/cuda.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -182,8 +182,8 @@ def check_and_update_config(cls, vllm_config: "VllmConfig") -> None:
182 182

183 183
if vllm_config.attention_config.backend is None:
184 184
# Default case
185-
if cls.is_device_capability(100):
186-
# Blackwell => Force CutlassMLA.
185+
if cls.is_device_capability(100) and not use_sparse:
186+
# Blackwell => Force CutlassMLA (unless sparse, i.e. DSv3.2).
187 187
use_cutlass_mla = True
188 188
# Set the backend in AttentionConfig so it's used during
189 189
# backend selection

0 commit comments

Comments
 (0)