Refactor Prometheus and Add Request Level Metrics (#2316)

This commit is contained in:
Robert Shaw
2024-01-31 14:58:07 -08:00
committed by GitHub
parent d0d93b92b1
commit 93b38bea5d
7 changed files with 1230 additions and 98 deletions

View File

@@ -0,0 +1,10 @@
# prometheus.yaml
# Prometheus configuration defining a single scrape job named "vllm".
global:
  # Default interval between scrapes of each target.
  scrape_interval: 5s
  # Interval between rule evaluations.
  evaluation_interval: 30s

scrape_configs:
  - job_name: vllm
    static_configs:
      - targets:
          # NOTE(review): host.docker.internal suggests Prometheus runs in a
          # Docker container and scrapes a server on the host's port 8000;
          # confirm this matches your deployment.
          - 'host.docker.internal:8000'