[Frontend] Adjust try/except blocks in API impl (#10056)

Signed-off-by: Nick Hill <nhill@redhat.com>
This commit is contained in:
Nick Hill
2024-11-07 04:07:51 +00:00
committed by GitHub
parent d3859f1891
commit 29862b884b
2 changed files with 5 additions and 11 deletions

View File

@@ -189,13 +189,7 @@ class OpenAIServingCompletion(OpenAIServing):
try:
async for i, res in result_generator:
final_res_batch[i] = res
-except asyncio.CancelledError:
-return self.create_error_response("Client disconnected")
-except ValueError as e:
-# TODO: Use a vllm-specific Validation Error
-return self.create_error_response(str(e))
-try:
for i, final_res in enumerate(final_res_batch):
assert final_res is not None
@@ -217,6 +211,8 @@ class OpenAIServingCompletion(OpenAIServing):
tokenizer,
request_metadata,
)
+except asyncio.CancelledError:
+return self.create_error_response("Client disconnected")
except ValueError as e:
# TODO: Use a vllm-specific Validation Error
return self.create_error_response(str(e))