[Bug] Fix attention_backend arg string parsing (#30534)
Signed-off-by: mgoin <mgoin64@gmail.com>
This commit is contained in:
@@ -1649,6 +1649,12 @@ class EngineArgs:
                     "attention_backend and attention_config.backend "
                     "are mutually exclusive"
                 )
-            attention_config.backend = self.attention_backend
+            # Convert string to enum if needed (CLI parsing returns a string)
+            if isinstance(self.attention_backend, str):
+                attention_config.backend = AttentionBackendEnum[
+                    self.attention_backend.upper()
+                ]
+            else:
+                attention_config.backend = self.attention_backend
 
         load_config = self.create_load_config()
Reference in New Issue
Block a user