[Misc] LoRA + Chunked Prefill (#9057)

This commit is contained in:
Aurick Qiao
2024-12-10 21:09:20 -05:00
committed by GitHub
parent 9a93973708
commit d5c5154fcf
12 changed files with 49 additions and 20 deletions

View File

@@ -53,7 +53,8 @@ def test_phi2_lora(phi2_lora_files):
max_model_len=1024,
enable_lora=True,
max_loras=2,
-enforce_eager=True)
+enforce_eager=True,
+enable_chunked_prefill=True)
expected_lora_output = [
"SELECT catalog_publisher, COUNT(*) as num_catalogs FROM catalogs GROUP BY catalog_publisher ORDER BY num_catalogs DESC LIMIT 1;", # noqa: E501