[Core] Priority-based scheduling in async engine (#8850)
This commit is contained in:
committed by
GitHub
parent
18e60d7d13
commit
bd429f2b75
@@ -796,7 +796,7 @@ class LLMEngine:
             raise ValueError(f"Got lora_request {lora_request} but LoRA is "
                              "not enabled!")
 
-        if priority > 0 and not self.scheduler_config.policy == "priority":
+        if priority != 0 and not self.scheduler_config.policy == "priority":
             raise ValueError(f"Got priority {priority} but "
                              "Priority scheduling is not enabled.")
 
Reference in New Issue
Block a user