[Bugfix][Model] Jamba assertions and no chunked prefill by default for Jamba (#6784)
This commit is contained in:
@@ -644,6 +644,11 @@ class JambaForCausalLM(nn.Module, HasInnerState):
|
||||
lora_config: Optional[LoRAConfig] = None,
|
||||
scheduler_config: Optional[SchedulerConfig] = None,
|
||||
) -> None:
|
||||
assert not scheduler_config.chunked_prefill_enabled, \
|
||||
"Jamba currently does not support chunked prefill"
|
||||
assert not cache_config.enable_prefix_caching, \
|
||||
"Jamba currently does not support prefix caching"
|
||||
|
||||
super().__init__()
|
||||
self.config = config
|
||||
self.scheduler_config = scheduler_config
|
||||
|
||||
Reference in New Issue
Block a user