mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2025-12-09 07:14:58 +08:00
[BugFix][DeepSeek-V3.2] Fix backend selection logic for Blackwell (#30195)
This commit is contained in:
parent
b952f4d3c3
commit
0044c4038c
@@ -182,8 +182,8 @@ class CudaPlatformBase(Platform):
|
||||
|
||||
if vllm_config.attention_config.backend is None:
|
||||
# Default case
|
||||
if cls.is_device_capability(100):
|
||||
# Blackwell => Force CutlassMLA.
|
||||
if cls.is_device_capability(100) and not use_sparse:
|
||||
# Blackwell => Force CutlassMLA (unless sparse, i.e. DSv3.2).
|
||||
use_cutlass_mla = True
|
||||
# Set the backend in AttentionConfig so it's used during
|
||||
# backend selection
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user