Add script for benchmarking serving throughput (#145)

This commit is contained in:
Woosuk Kwon
2023-06-14 19:55:38 -07:00
committed by GitHub
parent da5ddcd544
commit 311490a720
10 changed files with 421 additions and 415 deletions

View File

@@ -120,6 +120,7 @@ class ServerArgs:
class AsyncServerArgs(ServerArgs):
"""Arguments for asynchronous CacheFlow servers."""
server_use_ray: bool = False
disable_log_requests: bool = False
@staticmethod
def add_cli_args(
@@ -129,4 +130,6 @@ class AsyncServerArgs(ServerArgs):
parser.add_argument('--server-use-ray', action='store_true',
help='use Ray to start the LLM server in a '
'separate process as the web server process.')
parser.add_argument('--disable-log-requests', action='store_true',
help='disable logging requests')
return parser