Fix/async chat serving (#2727)
This commit is contained in:
committed by
GitHub
parent
7e65477e5e
commit
f8e7adda21
@@ -150,7 +150,7 @@ def server(zephyr_lora_files):
|
||||
ray.shutdown()
|
||||
|
||||
|
||||
@pytest.fixture(scope="session")
|
||||
@pytest.fixture(scope="module")
|
||||
def client():
|
||||
client = openai.AsyncOpenAI(
|
||||
base_url="http://localhost:8000/v1",
|
||||
|
||||
Reference in New Issue
Block a user