@@ -10,14 +10,15 @@ import (
10
10
extProcPb "github.com/envoyproxy/go-control-plane/envoy/service/ext_proc/v3"
11
11
"inference.networking.x-k8s.io/gateway-api-inference-extension/pkg/ext-proc/backend"
12
12
"inference.networking.x-k8s.io/gateway-api-inference-extension/pkg/ext-proc/scheduling"
13
+ logutil "inference.networking.x-k8s.io/gateway-api-inference-extension/pkg/ext-proc/util/logging"
13
14
klog "k8s.io/klog/v2"
14
15
)
15
16
16
17
// HandleRequestBody handles the body of the request to the backend server, such as parsing the "model"
17
18
// parameter.
18
19
// Envoy sends the request body to ext proc before sending the request to the backend server.
19
20
func (s * Server ) HandleRequestBody (reqCtx * RequestContext , req * extProcPb.ProcessingRequest ) (* extProcPb.ProcessingResponse , error ) {
20
- klog .V (3 ).Infof ("Handling request body" )
21
+ klog .V (logutil . VERBOSE ).Infof ("Handling request body" )
21
22
22
23
// Unmarshal request body (must be JSON).
23
24
v := req .Request .(* extProcPb.ProcessingRequest_RequestBody )
@@ -26,14 +27,14 @@ func (s *Server) HandleRequestBody(reqCtx *RequestContext, req *extProcPb.Proces
26
27
klog .Errorf ("Error unmarshaling request body: %v" , err )
27
28
return nil , fmt .Errorf ("error unmarshaling request body: %v" , err )
28
29
}
29
- klog .V (3 ).Infof ("Request body: %v" , rb )
30
+ klog .V (logutil . VERBOSE ).Infof ("Request body: %v" , rb )
30
31
31
32
// Resolve target models.
32
33
model , ok := rb ["model" ].(string )
33
34
if ! ok {
34
35
return nil , errors .New ("model not found in request" )
35
36
}
36
- klog .V (3 ).Infof ("Model requested: %v" , model )
37
+ klog .V (logutil . VERBOSE ).Infof ("Model requested: %v" , model )
37
38
modelName := model
38
39
39
40
// NOTE: The nil checking for the modelObject means that we DO allow passthrough currently.
@@ -54,7 +55,7 @@ func (s *Server) HandleRequestBody(reqCtx *RequestContext, req *extProcPb.Proces
54
55
ResolvedTargetModel : modelName ,
55
56
Critical : backend .IsCritical (modelObj ),
56
57
}
57
- klog .V (3 ).Infof ("LLM Request: %+v" , llmReq )
58
+ klog .V (logutil . VERBOSE ).Infof ("LLM Request: %+v" , llmReq )
58
59
59
60
requestBody := v .RequestBody .Body
60
61
var err error
@@ -66,14 +67,14 @@ func (s *Server) HandleRequestBody(reqCtx *RequestContext, req *extProcPb.Proces
66
67
klog .Errorf ("Error marshaling request body: %v" , err )
67
68
return nil , fmt .Errorf ("error marshaling request body: %v" , err )
68
69
}
69
- klog .V (3 ).Infof ("Updated body: %v" , string (requestBody ))
70
+ klog .V (logutil . VERBOSE ).Infof ("Updated body: %v" , string (requestBody ))
70
71
}
71
72
72
73
targetPod , err := s .scheduler .Schedule (llmReq )
73
74
if err != nil {
74
75
return nil , fmt .Errorf ("failed to find target pod: %w" , err )
75
76
}
76
- klog .V (3 ).Infof ("Selected target model %v in target pod: %v\n " , llmReq .ResolvedTargetModel , targetPod )
77
+ klog .V (logutil . VERBOSE ).Infof ("Selected target model %v in target pod: %v\n " , llmReq .ResolvedTargetModel , targetPod )
77
78
78
79
reqCtx .Model = llmReq .Model
79
80
reqCtx .ResolvedTargetModel = llmReq .ResolvedTargetModel
@@ -99,7 +100,7 @@ func (s *Server) HandleRequestBody(reqCtx *RequestContext, req *extProcPb.Proces
99
100
}
100
101
// Print headers for debugging
101
102
for _ , header := range headers {
102
- klog .V (3 ).Infof ("[request_body] Header Key: %s, Header Value: %s\n " , header .Header .Key , header .Header .RawValue )
103
+ klog .V (logutil . VERBOSE ).Infof ("[request_body] Header Key: %s, Header Value: %s\n " , header .Header .Key , header .Header .RawValue )
103
104
}
104
105
105
106
resp := & extProcPb.ProcessingResponse {
@@ -122,10 +123,10 @@ func (s *Server) HandleRequestBody(reqCtx *RequestContext, req *extProcPb.Proces
122
123
}
123
124
124
125
func HandleRequestHeaders (reqCtx * RequestContext , req * extProcPb.ProcessingRequest ) * extProcPb.ProcessingResponse {
125
- klog .V (3 ).Info ("Handling request headers ..." )
126
+ klog .V (logutil . VERBOSE ).Info ("Handling request headers ..." )
126
127
r := req .Request
127
128
h := r .(* extProcPb.ProcessingRequest_RequestHeaders )
128
- klog .V (3 ).Infof ("Headers: %+v\n " , h )
129
+ klog .V (logutil . VERBOSE ).Infof ("Headers: %+v\n " , h )
129
130
130
131
resp := & extProcPb.ProcessingResponse {
131
132
Response : & extProcPb.ProcessingResponse_RequestHeaders {
0 commit comments