Port metrics from aioprometheus to prometheus_client (#2730)
This commit is contained in:
@@ -165,6 +165,7 @@ class VllmRunner:
|
||||
dtype: str = "half",
|
||||
disable_log_stats: bool = True,
|
||||
tensor_parallel_size: int = 1,
|
||||
**kwargs,
|
||||
) -> None:
|
||||
self.model = LLM(
|
||||
model=model_name,
|
||||
@@ -174,6 +175,7 @@ class VllmRunner:
|
||||
swap_space=0,
|
||||
disable_log_stats=disable_log_stats,
|
||||
tensor_parallel_size=tensor_parallel_size,
|
||||
**kwargs,
|
||||
)
|
||||
|
||||
def generate(
|
||||
|
||||
Reference in New Issue
Block a user