@@ -10,14 +10,15 @@ import (
1010 extProcPb "github.com/envoyproxy/go-control-plane/envoy/service/ext_proc/v3"
1111 "inference.networking.x-k8s.io/gateway-api-inference-extension/pkg/ext-proc/backend"
1212 "inference.networking.x-k8s.io/gateway-api-inference-extension/pkg/ext-proc/scheduling"
13+ logutil "inference.networking.x-k8s.io/gateway-api-inference-extension/pkg/ext-proc/util/logging"
1314 klog "k8s.io/klog/v2"
1415)
1516
1617// HandleRequestBody handles the body of the request to the backend server, such as parsing the "model"
1718// parameter.
1819// Envoy sends the request body to ext proc before sending the request to the backend server.
1920func (s * Server ) HandleRequestBody (reqCtx * RequestContext , req * extProcPb.ProcessingRequest ) (* extProcPb.ProcessingResponse , error ) {
20- klog .V (3 ).Infof ("Handling request body" )
21+ klog .V (logutil . VERBOSE ).Infof ("Handling request body" )
2122
2223 // Unmarshal request body (must be JSON).
2324 v := req .Request .(* extProcPb.ProcessingRequest_RequestBody )
@@ -26,14 +27,14 @@ func (s *Server) HandleRequestBody(reqCtx *RequestContext, req *extProcPb.Proces
2627 klog .Errorf ("Error unmarshaling request body: %v" , err )
2728 return nil , fmt .Errorf ("error unmarshaling request body: %v" , err )
2829 }
29- klog .V (3 ).Infof ("Request body: %v" , rb )
30+ klog .V (logutil . VERBOSE ).Infof ("Request body: %v" , rb )
3031
3132 // Resolve target models.
3233 model , ok := rb ["model" ].(string )
3334 if ! ok {
3435 return nil , errors .New ("model not found in request" )
3536 }
36- klog .V (3 ).Infof ("Model requested: %v" , model )
37+ klog .V (logutil . VERBOSE ).Infof ("Model requested: %v" , model )
3738 modelName := model
3839
3940 // NOTE: The nil checking for the modelObject means that we DO allow passthrough currently.
@@ -54,7 +55,7 @@ func (s *Server) HandleRequestBody(reqCtx *RequestContext, req *extProcPb.Proces
5455 ResolvedTargetModel : modelName ,
5556 Critical : backend .IsCritical (modelObj ),
5657 }
57- klog .V (3 ).Infof ("LLM Request: %+v" , llmReq )
58+ klog .V (logutil . VERBOSE ).Infof ("LLM Request: %+v" , llmReq )
5859
5960 requestBody := v .RequestBody .Body
6061 var err error
@@ -66,14 +67,14 @@ func (s *Server) HandleRequestBody(reqCtx *RequestContext, req *extProcPb.Proces
6667 klog .Errorf ("Error marshaling request body: %v" , err )
6768 return nil , fmt .Errorf ("error marshaling request body: %v" , err )
6869 }
69- klog .V (3 ).Infof ("Updated body: %v" , string (requestBody ))
70+ klog .V (logutil . VERBOSE ).Infof ("Updated body: %v" , string (requestBody ))
7071 }
7172
7273 targetPod , err := s .scheduler .Schedule (llmReq )
7374 if err != nil {
7475 return nil , fmt .Errorf ("failed to find target pod: %w" , err )
7576 }
76- klog .V (3 ).Infof ("Selected target model %v in target pod: %v\n " , llmReq .ResolvedTargetModel , targetPod )
77+ klog .V (logutil . VERBOSE ).Infof ("Selected target model %v in target pod: %v\n " , llmReq .ResolvedTargetModel , targetPod )
7778
7879 reqCtx .Model = llmReq .Model
7980 reqCtx .ResolvedTargetModel = llmReq .ResolvedTargetModel
@@ -99,7 +100,7 @@ func (s *Server) HandleRequestBody(reqCtx *RequestContext, req *extProcPb.Proces
99100 }
100101 // Print headers for debugging
101102 for _ , header := range headers {
102- klog .V (3 ).Infof ("[request_body] Header Key: %s, Header Value: %s\n " , header .Header .Key , header .Header .RawValue )
103+ klog .V (logutil . VERBOSE ).Infof ("[request_body] Header Key: %s, Header Value: %s\n " , header .Header .Key , header .Header .RawValue )
103104 }
104105
105106 resp := & extProcPb.ProcessingResponse {
@@ -122,10 +123,10 @@ func (s *Server) HandleRequestBody(reqCtx *RequestContext, req *extProcPb.Proces
122123}
123124
124125func HandleRequestHeaders (reqCtx * RequestContext , req * extProcPb.ProcessingRequest ) * extProcPb.ProcessingResponse {
125- klog .V (3 ).Info ("Handling request headers ..." )
126+ klog .V (logutil . VERBOSE ).Info ("Handling request headers ..." )
126127 r := req .Request
127128 h := r .(* extProcPb.ProcessingRequest_RequestHeaders )
128- klog .V (3 ).Infof ("Headers: %+v\n " , h )
129+ klog .V (logutil . VERBOSE ).Infof ("Headers: %+v\n " , h )
129130
130131 resp := & extProcPb.ProcessingResponse {
131132 Response : & extProcPb.ProcessingResponse_RequestHeaders {
0 commit comments