[Bugfix][benchmarks] Fix input token calculation for rerank benchmark metrics (#30596)
Signed-off-by: vensen <vensenmu@gmail.com>
This commit is contained in:
@@ -235,7 +235,9 @@ async def get_request(
|
|||||||
|
|
||||||
|
|
||||||
def calculate_metrics_for_embeddings(
|
def calculate_metrics_for_embeddings(
|
||||||
outputs: list[RequestFuncOutput], dur_s: float, selected_percentiles: list[float]
|
outputs: list[RequestFuncOutput],
|
||||||
|
dur_s: float,
|
||||||
|
selected_percentiles: list[float],
|
||||||
) -> EmbedBenchmarkMetrics:
|
) -> EmbedBenchmarkMetrics:
|
||||||
"""Calculate the metrics for the embedding requests.
|
"""Calculate the metrics for the embedding requests.
|
||||||
|
|
||||||
|
|||||||
@@ -120,6 +120,7 @@ class RerankResult(BaseModel):
|
|||||||
|
|
||||||
|
|
||||||
class RerankUsage(BaseModel):
|
class RerankUsage(BaseModel):
|
||||||
|
prompt_tokens: int
|
||||||
total_tokens: int
|
total_tokens: int
|
||||||
|
|
||||||
|
|
||||||
|
|||||||
@@ -502,5 +502,7 @@ class ServingScores(OpenAIServing):
|
|||||||
id=request_id,
|
id=request_id,
|
||||||
model=model_name,
|
model=model_name,
|
||||||
results=results,
|
results=results,
|
||||||
usage=RerankUsage(total_tokens=num_prompt_tokens),
|
usage=RerankUsage(
|
||||||
|
total_tokens=num_prompt_tokens, prompt_tokens=num_prompt_tokens
|
||||||
|
),
|
||||||
)
|
)
|
||||||
|
|||||||
Reference in New Issue
Block a user