Skip to content

Commit f38b7b5

Browse files
committed
feat: switch validation of request body based on request type
1 parent 884ace8 commit f38b7b5

File tree

3 files changed

+43
-33
lines changed

3 files changed

+43
-33
lines changed

pkg/plugins/gateway/gateway_req_body.go

Lines changed: 16 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -31,23 +31,27 @@ import (
3131
)
3232

3333
func (s *Server) HandleRequestBody(ctx context.Context, requestID string, requestPath string, req *extProcPb.ProcessingRequest,
34-
user utils.User, routingAlgorithm types.RoutingAlgorithm) (*extProcPb.ProcessingResponse, string, *types.RoutingContext, bool, int64) {
34+
user utils.User, routingAlgorithm types.RoutingAlgorithm,
35+
) (*extProcPb.ProcessingResponse, string, *types.RoutingContext, bool, OpenAiRequestType, int64) {
3536
var routingCtx *types.RoutingContext
3637
var term int64 // Identify the trace window
3738

39+
requestType := NewOpenAiRequestTypeFromPath(requestPath)
40+
3841
body := req.Request.(*extProcPb.ProcessingRequest_RequestBody)
39-
model, message, stream, errRes := validateRequestBody(requestID, requestPath, body.RequestBody.GetBody(), user)
42+
model, message, stream, errRes := validateRequestBody(requestID, requestType, body.RequestBody.GetBody(), user)
4043
if errRes != nil {
41-
return errRes, model, routingCtx, stream, term
44+
return errRes, model, routingCtx, stream, requestType, term
4245
}
4346

4447
// early reject the request if model doesn't exist.
4548
if !s.cache.HasModel(model) {
4649
klog.ErrorS(nil, "model doesn't exist in cache, probably wrong model name", "requestID", requestID, "model", model)
4750
return generateErrorResponse(envoyTypePb.StatusCode_BadRequest,
4851
[]*configPb.HeaderValueOption{{Header: &configPb.HeaderValue{
49-
Key: HeaderErrorNoModelBackends, RawValue: []byte(model)}}},
50-
fmt.Sprintf("model %s does not exist", model)), model, routingCtx, stream, term
52+
Key: HeaderErrorNoModelBackends, RawValue: []byte(model),
53+
}}},
54+
fmt.Sprintf("model %s does not exist", model)), model, routingCtx, stream, requestType, term
5155
}
5256

5357
// early reject if no pods are ready to accept request for a model
@@ -56,8 +60,9 @@ func (s *Server) HandleRequestBody(ctx context.Context, requestID string, reques
5660
klog.ErrorS(err, "no ready pod available", "requestID", requestID, "model", model)
5761
return generateErrorResponse(envoyTypePb.StatusCode_ServiceUnavailable,
5862
[]*configPb.HeaderValueOption{{Header: &configPb.HeaderValue{
59-
Key: HeaderErrorNoModelBackends, RawValue: []byte("true")}}},
60-
fmt.Sprintf("error on getting pods for model %s", model)), model, routingCtx, stream, term
63+
Key: HeaderErrorNoModelBackends, RawValue: []byte("true"),
64+
}}},
65+
fmt.Sprintf("error on getting pods for model %s", model)), model, routingCtx, stream, requestType, term
6166
}
6267

6368
routingCtx = types.NewRoutingContext(ctx, routingAlgorithm, model, message, requestID, user.Name)
@@ -72,8 +77,9 @@ func (s *Server) HandleRequestBody(ctx context.Context, requestID string, reques
7277
return generateErrorResponse(
7378
envoyTypePb.StatusCode_ServiceUnavailable,
7479
[]*configPb.HeaderValueOption{{Header: &configPb.HeaderValue{
75-
Key: HeaderErrorRouting, RawValue: []byte("true")}}},
76-
"error on selecting target pod"), model, routingCtx, stream, term
80+
Key: HeaderErrorRouting, RawValue: []byte("true"),
81+
}}},
82+
"error on selecting target pod"), model, routingCtx, stream, requestType, term
7783
}
7884
headers = buildEnvoyProxyHeaders(headers,
7985
HeaderRoutingStrategy, string(routingAlgorithm),
@@ -93,5 +99,5 @@ func (s *Server) HandleRequestBody(ctx context.Context, requestID string, reques
9399
},
94100
},
95101
},
96-
}, model, routingCtx, stream, term
102+
}, model, routingCtx, stream, requestType, term
97103
}

pkg/plugins/gateway/util.go

Lines changed: 11 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -34,11 +34,13 @@ import (
3434
// see https://platform.openai.com/docs/api-reference/embeddings/create#embeddings-create-input
3535
var maxEmbeddingInputArraySize = 2048
3636

37-
// validateRequestBody validates input by unmarshaling request body into respective openai-golang struct based on requestpath.
37+
// validateRequestBody validates input by unmarshaling request body into respective openai-golang struct based on requestType.
3838
// nolint:nakedret
39-
func validateRequestBody(requestID, requestPath string, requestBody []byte, user utils.User) (model, message string, stream bool, errRes *extProcPb.ProcessingResponse) {
39+
func validateRequestBody(requestID string, requestType OpenAiRequestType, requestBody []byte, user utils.User) (model, message string, stream bool, errRes *extProcPb.ProcessingResponse) {
4040
var streamOptions openai.ChatCompletionStreamOptionsParam
41-
if requestPath == "/v1/chat/completions" {
41+
switch requestType {
42+
43+
case OpenAiRequestChatCompletionsType:
4244
var jsonMap map[string]json.RawMessage
4345
if err := json.Unmarshal(requestBody, &jsonMap); err != nil {
4446
klog.ErrorS(err, "error to unmarshal request body", "requestID", requestID, "requestBody", string(requestBody))
@@ -59,7 +61,8 @@ func validateRequestBody(requestID, requestPath string, requestBody []byte, user
5961
if errRes = validateStreamOptions(requestID, user, &stream, streamOptions, jsonMap); errRes != nil {
6062
return
6163
}
62-
} else if requestPath == "/v1/completions" {
64+
65+
case OpenAiRequestCompletionsType:
6366
// openai.CompletionsNewParams does not support json unmarshal for CompletionNewParamsPromptUnion in release v0.1.0-beta.10
6467
// once supported, input request will be directly unmarshal into openai.CompletionsNewParams
6568
type Completion struct {
@@ -75,7 +78,8 @@ func validateRequestBody(requestID, requestPath string, requestBody []byte, user
7578
}
7679
model = completionObj.Model
7780
message = completionObj.Prompt
78-
} else if requestPath == "/v1/embeddings" {
81+
82+
case OpenAiRequestEmbeddingsType:
7983
message = "" // prefix_cache algorithms are not relevant for embeddings
8084
var jsonMap map[string]json.RawMessage
8185
if err := json.Unmarshal(requestBody, &jsonMap); err != nil {
@@ -93,12 +97,12 @@ func validateRequestBody(requestID, requestPath string, requestBody []byte, user
9397
if errRes = checkEmbeddingInputSequenceLen(requestID, embeddingObj); errRes != nil {
9498
return
9599
}
96-
} else {
100+
case OpenAiRequestUnknownType:
97101
errRes = buildErrorResponse(envoyTypePb.StatusCode_NotImplemented, "unknown request path", HeaderErrorRequestBodyProcessing, "true")
98102
return
99103
}
100104

101-
klog.V(4).InfoS("validateRequestBody", "requestID", requestID, "requestPath", requestPath, "model", model, "message", message, "stream", stream, "streamOptions", streamOptions)
105+
klog.V(4).InfoS("validateRequestBody", "requestID", requestID, "requestType", requestType, "model", model, "message", message, "stream", stream, "streamOptions", streamOptions)
102106
return
103107
}
104108

pkg/plugins/gateway/util_test.go

Lines changed: 16 additions & 16 deletions
Original file line numberDiff line numberDiff line change
@@ -28,7 +28,7 @@ import (
2828
func Test_ValidateRequestBody(t *testing.T) {
2929
testCases := []struct {
3030
message string
31-
requestPath string
31+
requestType OpenAiRequestType
3232
requestBody []byte
3333
model string
3434
messages string
@@ -38,95 +38,95 @@ func Test_ValidateRequestBody(t *testing.T) {
3838
}{
3939
{
4040
message: "unknown path",
41-
requestPath: "/v1/unknown",
41+
requestType: OpenAiRequestUnknownType,
4242
statusCode: envoyTypePb.StatusCode_NotImplemented,
4343
},
4444
{
4545
message: "/v1/chat/completions json unmarshal error",
46-
requestPath: "/v1/chat/completions",
46+
requestType: OpenAiRequestChatCompletionsType,
4747
requestBody: []byte("bad_request"),
4848
statusCode: envoyTypePb.StatusCode_BadRequest,
4949
},
5050
{
5151
message: "/v1/chat/completions json unmarshal ChatCompletionsNewParams",
52-
requestPath: "/v1/chat/completions",
52+
requestType: OpenAiRequestChatCompletionsType,
5353
requestBody: []byte(`{"model": 1}`),
5454
statusCode: envoyTypePb.StatusCode_BadRequest,
5555
},
5656
{
5757
message: "/v1/chat/completions json unmarshal no messages",
58-
requestPath: "/v1/chat/completions",
58+
requestType: OpenAiRequestChatCompletionsType,
5959
requestBody: []byte(`{"model": "llama2-7b"}`),
6060
statusCode: envoyTypePb.StatusCode_BadRequest,
6161
},
6262
{
6363
message: "/v1/chat/completions json unmarshal valid messages",
64-
requestPath: "/v1/chat/completions",
64+
requestType: OpenAiRequestChatCompletionsType,
6565
requestBody: []byte(`{"model": "llama2-7b", "messages": [{"role": "system", "content": "this is system"},{"role": "user", "content": "say this is test"}]}`),
6666
model: "llama2-7b",
6767
messages: "this is system say this is test",
6868
statusCode: envoyTypePb.StatusCode_OK,
6969
},
7070
{
7171
message: "/v1/chat/completions json unmarshal invalid messages with complex content",
72-
requestPath: "/v1/chat/completions",
72+
requestType: OpenAiRequestChatCompletionsType,
7373
requestBody: []byte(`{"model": "llama2-7b", "messages": [{"role": "system", "content": "this is system"},{"role": "user", "content": {"type": "text", "text": "say this is test", "complex": make(chan int)}}]}`),
7474
statusCode: envoyTypePb.StatusCode_BadRequest,
7575
},
7676
{
7777
message: "/v1/chat/completions json unmarshal valid messages with complex content",
78-
requestPath: "/v1/chat/completions",
78+
requestType: OpenAiRequestChatCompletionsType,
7979
requestBody: []byte(`{"model": "llama2-7b", "messages": [{"role": "system", "content": "this is system"},{"role": "user", "content": [{"type": "text", "text": "say this is test"}, {"type": "text", "text": "say this is test"}]}]}`),
8080
model: "llama2-7b",
8181
messages: "this is system [{\"text\":\"say this is test\",\"type\":\"text\"},{\"text\":\"say this is test\",\"type\":\"text\"}]",
8282
statusCode: envoyTypePb.StatusCode_OK,
8383
},
8484
{
8585
message: "/v1/chat/completions json unmarshal valid messages with stop string param",
86-
requestPath: "/v1/chat/completions",
86+
requestType: OpenAiRequestChatCompletionsType,
8787
requestBody: []byte(`{"model": "llama2-7b", "messages": [{"role": "system", "content": "this is system"},{"role": "user", "content": "say this is test"}], "stop": "stop"}`),
8888
model: "llama2-7b",
8989
messages: "this is system say this is test",
9090
statusCode: envoyTypePb.StatusCode_OK,
9191
},
9292
{
9393
message: "/v1/chat/completions json unmarshal valid messages with stop array param",
94-
requestPath: "/v1/chat/completions",
94+
requestType: OpenAiRequestChatCompletionsType,
9595
requestBody: []byte(`{"model": "llama2-7b", "messages": [{"role": "system", "content": "this is system"},{"role": "user", "content": "say this is test"}], "stop": ["stop"]}`),
9696
model: "llama2-7b",
9797
messages: "this is system say this is test",
9898
statusCode: envoyTypePb.StatusCode_OK,
9999
},
100100
{
101101
message: "/v1/chat/completions json unmarshal invalid stream bool",
102-
requestPath: "/v1/chat/completions",
102+
requestType: OpenAiRequestChatCompletionsType,
103103
requestBody: []byte(`{"model": "llama2-7b", "stream": "true", "messages": [{"role": "system", "content": "this is system"}]}`),
104104
statusCode: envoyTypePb.StatusCode_BadRequest,
105105
},
106106
{
107107
message: "/v1/chat/completions json unmarshal stream options is null",
108-
requestPath: "/v1/chat/completions",
108+
requestType: OpenAiRequestChatCompletionsType,
109109
user: utils.User{Tpm: 1},
110110
requestBody: []byte(`{"model": "llama2-7b", "stream": true, "messages": [{"role": "system", "content": "this is system"}]}`),
111111
statusCode: envoyTypePb.StatusCode_BadRequest,
112112
},
113113
{
114114
message: "/v1/chat/completions stream_options.include_usage == false with user.TPM >= 1 is NOT OK",
115115
user: utils.User{Tpm: 1},
116-
requestPath: "/v1/chat/completions",
116+
requestType: OpenAiRequestChatCompletionsType,
117117
requestBody: []byte(`{"model": "llama2-7b", "stream": true, "stream_options": {"include_usage": false}, "messages": [{"role": "system", "content": "this is system"}]}`),
118118
statusCode: envoyTypePb.StatusCode_BadRequest,
119119
},
120120
{
121121
message: "/v1/chat/completions stream_options.include_usage == false with user.TPM == 0 is OK",
122-
requestPath: "/v1/chat/completions",
122+
requestType: OpenAiRequestChatCompletionsType,
123123
requestBody: []byte(`{"model": "llama2-7b", "stream": true, "stream_options": {"include_usage": false}, "messages": [{"role": "system", "content": "this is system"}]}`),
124124
statusCode: envoyTypePb.StatusCode_OK,
125125
},
126126
{
127127
message: "/v1/chat/completions valid request body",
128128
user: utils.User{Tpm: 1},
129-
requestPath: "/v1/chat/completions",
129+
requestType: OpenAiRequestChatCompletionsType,
130130
requestBody: []byte(`{"model": "llama2-7b", "stream": true, "stream_options": {"include_usage": true}, "messages": [{"role": "system", "content": "this is system"},{"role": "user", "content": "say this is test"}]}`),
131131
stream: true,
132132
model: "llama2-7b",
@@ -136,7 +136,7 @@ func Test_ValidateRequestBody(t *testing.T) {
136136
}
137137

138138
for _, tt := range testCases {
139-
model, messages, stream, errRes := validateRequestBody("1", tt.requestPath, tt.requestBody, tt.user)
139+
model, messages, stream, errRes := validateRequestBody("1", tt.requestType, tt.requestBody, tt.user)
140140

141141
if tt.statusCode == 200 {
142142
assert.Equal(t, (*extProcPb.ProcessingResponse)(nil), errRes, tt.message)

0 commit comments

Comments
 (0)