Port metrics from aioprometheus to prometheus_client (#2730)

This commit is contained in:
Harry Mellor
2024-02-25 19:54:00 +00:00
committed by GitHub
parent f7c1234990
commit ef978fe411
9 changed files with 130 additions and 84 deletions

View File

@@ -165,6 +165,7 @@ class VllmRunner:
dtype: str = "half",
disable_log_stats: bool = True,
tensor_parallel_size: int = 1,
**kwargs,
) -> None:
self.model = LLM(
model=model_name,
@@ -174,6 +175,7 @@ class VllmRunner:
swap_space=0,
disable_log_stats=disable_log_stats,
tensor_parallel_size=tensor_parallel_size,
**kwargs,
)
def generate(