[Misc] Make Serving Benchmark More User-friendly (#5044)

This commit is contained in:
Roger Wang
2024-05-25 10:28:16 -07:00
committed by GitHub
parent d5a1697772
commit f17a1a8f96
2 changed files with 32 additions and 3 deletions

View File

@@ -89,6 +89,9 @@ async def async_request_tgi(
output.latency = most_recent_timestamp - st
output.success = True
output.generated_text = data["generated_text"]
else:
output.error = response.reason or ""
output.success = False
except Exception:
output.success = False
exc_info = sys.exc_info()
@@ -276,6 +279,9 @@ async def async_request_openai_completions(
output.generated_text = generated_text
output.success = True
output.latency = latency
else:
output.error = response.reason or ""
output.success = False
except Exception:
output.success = False
exc_info = sys.exc_info()