Add throughput benchmarking script (#133)

This commit is contained in:
Woosuk Kwon
2023-05-28 03:20:05 -07:00
committed by GitHub
parent 337871c6fd
commit 211318d44a
12 changed files with 145 additions and 257 deletions

View File

@@ -1,5 +1,5 @@
from cacheflow.entrypoints.llm import LLM
-from cacheflow.outputs import RequestOutput
+from cacheflow.outputs import RequestOutput, CompletionOutput
from cacheflow.sampling_params import SamplingParams
from cacheflow.server.arg_utils import ServerArgs
from cacheflow.server.llm_server import LLMServer
@@ -9,6 +9,7 @@ __all__ = [
"LLM",
"SamplingParams",
"RequestOutput",
+"CompletionOutput",
"LLMServer",
"ServerArgs",
"initialize_cluster",