From 76c66f56a46b321d82af0f5f0296b965522e0bb0 Mon Sep 17 00:00:00 2001 From: Rob Scott Date: Fri, 28 Mar 2025 23:35:54 +0000 Subject: [PATCH] Removing Obsolete Portion of Metrics Guide --- site-src/guides/metrics.md | 23 ++--------------------- 1 file changed, 2 insertions(+), 21 deletions(-) diff --git a/site-src/guides/metrics.md b/site-src/guides/metrics.md index 12ff892ec..fca43dd61 100644 --- a/site-src/guides/metrics.md +++ b/site-src/guides/metrics.md @@ -4,26 +4,7 @@ This guide describes the current state of exposed metrics and how to scrape them ## Requirements -To have response metrics, set the body mode to `Buffered` or `Streamed`: -``` -apiVersion: gateway.envoyproxy.io/v1alpha1 -kind: EnvoyExtensionPolicy -metadata: - name: ext-proc-policy - namespace: default -spec: - extProc: - - backendRefs: - - group: "" - kind: Service - name: inference-gateway-ext-proc - port: 9002 - processingMode: - request: - body: Buffered - response: - body: Buffered -``` +To have response metrics, ensure the body mode is set to `Buffered` or `Streamed` (this should be the default behavior for all implementations). If you want to include usage metrics for vLLM model server streaming request, send the request with `include_usage`: @@ -40,7 +21,7 @@ curl -i ${IP}:${PORT}/v1/completions -H 'Content-Type: application/json' -d '{ ## Exposed metrics -| **Metric name** | **Metric Type** |
**Description**
|
**Labels**
| **Status** | +| **Metric name** | **Metric Type** |
**Description**
|
**Labels**
| **Status** | |:---------------------------------------------|:-----------------|:------------------------------------------------------------------|:-----------------------------------------------------------------------------------|:------------| | inference_model_request_total | Counter | The counter of requests broken out for each model. | `model_name`=<model-name>
`target_model_name`=<target-model-name> | ALPHA | | inference_model_request_error_total | Counter | The counter of requests errors broken out for each model. | `model_name`=<model-name>
`target_model_name`=<target-model-name> | ALPHA |