mirror of
https://git.datalinker.icu/vllm-project/vllm.git
synced 2026-05-25 01:24:27 +08:00
[Bug] Fix attention_backend arg string parsing (#30534)
Signed-off-by: mgoin <mgoin64@gmail.com>
This commit is contained in:
parent
dc13c99eed
commit
09ad3b76b3
@@ -1649,7 +1649,13 @@ class EngineArgs:
|
|||||||
"attention_backend and attention_config.backend "
|
"attention_backend and attention_config.backend "
|
||||||
"are mutually exclusive"
|
"are mutually exclusive"
|
||||||
)
|
)
|
||||||
attention_config.backend = self.attention_backend
|
# Convert string to enum if needed (CLI parsing returns a string)
|
||||||
|
if isinstance(self.attention_backend, str):
|
||||||
|
attention_config.backend = AttentionBackendEnum[
|
||||||
|
self.attention_backend.upper()
|
||||||
|
]
|
||||||
|
else:
|
||||||
|
attention_config.backend = self.attention_backend
|
||||||
|
|
||||||
load_config = self.create_load_config()
|
load_config = self.create_load_config()
|
||||||
|
|
||||||
|
|||||||
Loading…
x
Reference in New Issue
Block a user