fix: accurate apiFormats declarations based on verified provider capabilities

vivekk16 · vivekk16 · commit 7040ab8f1c9a · 2026-06-05T14:49:12.000-04:00
Signed-off-by: Vivek Karunai Kiri Ragavan <vkarunai@redhat.com>
diff --git a/backend/src/test/fixtures.ts b/backend/src/test/fixtures.ts
@@ -167,7 +167,7 @@ export const mockInferenceProviderConfig = {
   spec: {
     capabilities: {
       engines: [
-        { name: 'vllm', servingModes: ['aggregated'], apiFormats: ['openai-chat'], gpuSupport: true, cpuSupport: false },
+        { name: 'vllm', servingModes: ['aggregated'], apiFormats: ['openai-chat', 'openai-responses', 'anthropic-messages'], gpuSupport: true, cpuSupport: false },
         { name: 'llamacpp', servingModes: ['aggregated'], apiFormats: ['openai-chat'], gpuSupport: true, cpuSupport: true },
       ],
     },
diff --git a/controller/config/samples/airunway_v1alpha1_inferenceproviderconfig.yaml b/controller/config/samples/airunway_v1alpha1_inferenceproviderconfig.yaml
@@ -14,7 +14,7 @@ spec:
     engines:
       - name: vllm
         servingModes: [aggregated]
-        apiFormats: [openai-chat]
+        apiFormats: [openai-chat, openai-responses, anthropic-messages]
         gpuSupport: true
       - name: llamacpp
         servingModes: [aggregated]
@@ -42,7 +42,7 @@ spec:
     engines:
       - name: vllm
         servingModes: [aggregated, disaggregated]
-        apiFormats: [openai-chat, anthropic-messages]
+        apiFormats: [openai-chat, openai-responses, anthropic-messages]
         gpuSupport: true
         gateway:
           managesInferencePool: true
@@ -58,7 +58,7 @@ spec:
           inferencePoolNamespace: "{namespace}"
       - name: trtllm
         servingModes: [aggregated]
-        apiFormats: [openai-chat]
+        apiFormats: [openai-chat, openai-responses]
         gpuSupport: true
         gateway:
           managesInferencePool: true
@@ -110,7 +110,7 @@ spec:
     engines:
       - name: vllm
         servingModes: [aggregated, disaggregated]
-        apiFormats: [openai-chat]
+        apiFormats: [openai-chat, openai-responses, anthropic-messages]
         gpuSupport: true
         requiresCRD: false
   selectionRules: []
diff --git a/providers/dynamo/config.go b/providers/dynamo/config.go
@@ -111,15 +111,16 @@ func GetProviderConfigSpec() airunwayv1alpha1.InferenceProviderConfigSpec {
 					airunwayv1alpha1.ServingModeAggregated,
 					airunwayv1alpha1.ServingModeDisaggregated,
 				},
-				APIFormats: []airunwayv1alpha1.APIFormat{
-					airunwayv1alpha1.APIFormatOpenAIChat,
-					airunwayv1alpha1.APIFormatAnthropicMessages,
-				},
-				GPUSupport: true,
-				Gateway:    dynamoGatewayCapabilities(),
+			APIFormats: []airunwayv1alpha1.APIFormat{
+				airunwayv1alpha1.APIFormatOpenAIChat,
+				airunwayv1alpha1.APIFormatOpenAIResponses,
+				airunwayv1alpha1.APIFormatAnthropicMessages,
 			},
-			{
-				Name: airunwayv1alpha1.EngineTypeSGLang,
+			GPUSupport: true,
+			Gateway:    dynamoGatewayCapabilities(),
+		},
+		{
+			Name: airunwayv1alpha1.EngineTypeSGLang,
 				ServingModes: []airunwayv1alpha1.ServingMode{
 					airunwayv1alpha1.ServingModeAggregated,
 					airunwayv1alpha1.ServingModeDisaggregated,
@@ -132,13 +133,14 @@ func GetProviderConfigSpec() airunwayv1alpha1.InferenceProviderConfigSpec {
 				Gateway:    dynamoGatewayCapabilities(),
 			},
 			{
-				Name: airunwayv1alpha1.EngineTypeTRTLLM,
-				ServingModes: []airunwayv1alpha1.ServingMode{
-					airunwayv1alpha1.ServingModeAggregated,
-				},
-				APIFormats: []airunwayv1alpha1.APIFormat{
-					airunwayv1alpha1.APIFormatOpenAIChat,
-				},
+			Name: airunwayv1alpha1.EngineTypeTRTLLM,
+			ServingModes: []airunwayv1alpha1.ServingMode{
+				airunwayv1alpha1.ServingModeAggregated,
+			},
+			APIFormats: []airunwayv1alpha1.APIFormat{
+				airunwayv1alpha1.APIFormatOpenAIChat,
+				airunwayv1alpha1.APIFormatOpenAIResponses,
+			},
 				GPUSupport: true,
 				Gateway:    dynamoGatewayCapabilities(),
 			},
diff --git a/providers/dynamo/config_test.go b/providers/dynamo/config_test.go
@@ -46,6 +46,7 @@ func TestGetProviderConfigSpec(t *testing.T) {
 	}
 	expectedVLLMFormats := []airunwayv1alpha1.APIFormat{
 		airunwayv1alpha1.APIFormatOpenAIChat,
+		airunwayv1alpha1.APIFormatOpenAIResponses,
 		airunwayv1alpha1.APIFormatAnthropicMessages,
 	}
 	if len(vllmCap.APIFormats) != len(expectedVLLMFormats) {
@@ -104,8 +105,24 @@ func TestGetProviderConfigSpec(t *testing.T) {
 	if len(trtllmCap.ServingModes) != 1 || trtllmCap.ServingModes[0] != airunwayv1alpha1.ServingModeAggregated {
 		t.Errorf("expected trtllm to support only aggregated serving mode")
 	}
-	if len(trtllmCap.APIFormats) != 1 || trtllmCap.APIFormats[0] != airunwayv1alpha1.APIFormatOpenAIChat {
-		t.Errorf("expected trtllm to support only openai-chat API format")
+	expectedTRTLLMFormats := []airunwayv1alpha1.APIFormat{
+		airunwayv1alpha1.APIFormatOpenAIChat,
+		airunwayv1alpha1.APIFormatOpenAIResponses,
+	}
+	if len(trtllmCap.APIFormats) != len(expectedTRTLLMFormats) {
+		t.Fatalf("expected trtllm to support %d API formats, got %d", len(expectedTRTLLMFormats), len(trtllmCap.APIFormats))
+	}
+	for _, expected := range expectedTRTLLMFormats {
+		found := false
+		for _, actual := range trtllmCap.APIFormats {
+			if actual == expected {
+				found = true
+				break
+			}
+		}
+		if !found {
+			t.Errorf("expected trtllm to support API format %s", expected)
+		}
 	}
 
 	if len(spec.SelectionRules) != 4 {
diff --git a/providers/kaito/config.go b/providers/kaito/config.go
@@ -70,13 +70,15 @@ func GetProviderConfigSpec() airunwayv1alpha1.InferenceProviderConfigSpec {
 				ServingModes: []airunwayv1alpha1.ServingMode{
 					airunwayv1alpha1.ServingModeAggregated,
 				},
-				APIFormats: []airunwayv1alpha1.APIFormat{
-					airunwayv1alpha1.APIFormatOpenAIChat,
-				},
-				GPUSupport: true,
+			APIFormats: []airunwayv1alpha1.APIFormat{
+				airunwayv1alpha1.APIFormatOpenAIChat,
+				airunwayv1alpha1.APIFormatOpenAIResponses,
+				airunwayv1alpha1.APIFormatAnthropicMessages,
 			},
-			{
-				Name: airunwayv1alpha1.EngineTypeLlamaCpp,
+			GPUSupport: true,
+		},
+		{
+			Name: airunwayv1alpha1.EngineTypeLlamaCpp,
 				ServingModes: []airunwayv1alpha1.ServingMode{
 					airunwayv1alpha1.ServingModeAggregated,
 				},
diff --git a/providers/kaito/config_test.go b/providers/kaito/config_test.go
@@ -50,8 +50,25 @@ func TestGetProviderConfigSpec(t *testing.T) {
 	if len(vllmCap.ServingModes) != 1 || vllmCap.ServingModes[0] != airunwayv1alpha1.ServingModeAggregated {
 		t.Errorf("expected vllm to support only aggregated serving mode")
 	}
-	if len(vllmCap.APIFormats) != 1 || vllmCap.APIFormats[0] != airunwayv1alpha1.APIFormatOpenAIChat {
-		t.Errorf("expected vllm to support openai-chat API format")
+	expectedVLLMFormats := []airunwayv1alpha1.APIFormat{
+		airunwayv1alpha1.APIFormatOpenAIChat,
+		airunwayv1alpha1.APIFormatOpenAIResponses,
+		airunwayv1alpha1.APIFormatAnthropicMessages,
+	}
+	if len(vllmCap.APIFormats) != len(expectedVLLMFormats) {
+		t.Fatalf("expected vllm to support %d API formats, got %d", len(expectedVLLMFormats), len(vllmCap.APIFormats))
+	}
+	for _, expected := range expectedVLLMFormats {
+		found := false
+		for _, actual := range vllmCap.APIFormats {
+			if actual == expected {
+				found = true
+				break
+			}
+		}
+		if !found {
+			t.Errorf("expected vllm to support API format %s", expected)
+		}
 	}
 
 	llamaCap := spec.Capabilities.GetEngineCapability(airunwayv1alpha1.EngineTypeLlamaCpp)
diff --git a/providers/kuberay/config.go b/providers/kuberay/config.go
@@ -77,10 +77,10 @@ func GetProviderConfigSpec() airunwayv1alpha1.InferenceProviderConfigSpec {
 					airunwayv1alpha1.ServingModeAggregated,
 					airunwayv1alpha1.ServingModeDisaggregated,
 				},
-				APIFormats: []airunwayv1alpha1.APIFormat{
-					airunwayv1alpha1.APIFormatOpenAIChat,
-				},
-				GPUSupport: true,
+			APIFormats: []airunwayv1alpha1.APIFormat{
+				airunwayv1alpha1.APIFormatOpenAIChat,
+			},
+			GPUSupport: true,
 			},
 			},
 		},
diff --git a/providers/kuberay/config_test.go b/providers/kuberay/config_test.go
@@ -38,7 +38,7 @@ func TestGetProviderConfigSpec(t *testing.T) {
 		t.Fatalf("expected vllm to support 2 serving modes, got %d", len(vllmCap.ServingModes))
 	}
 	if len(vllmCap.APIFormats) != 1 || vllmCap.APIFormats[0] != airunwayv1alpha1.APIFormatOpenAIChat {
-		t.Errorf("expected vllm to support openai-chat API format")
+		t.Errorf("expected vllm to support only openai-chat API format, got %v", vllmCap.APIFormats)
 	}
 
 	if len(spec.SelectionRules) != 1 {
diff --git a/providers/llmd/config.go b/providers/llmd/config.go
@@ -70,9 +70,11 @@ func GetProviderConfigSpec() airunwayv1alpha1.InferenceProviderConfigSpec {
 					airunwayv1alpha1.ServingModeAggregated,
 					airunwayv1alpha1.ServingModeDisaggregated,
 				},
-				APIFormats: []airunwayv1alpha1.APIFormat{
-					airunwayv1alpha1.APIFormatOpenAIChat,
-				},
+			APIFormats: []airunwayv1alpha1.APIFormat{
+				airunwayv1alpha1.APIFormatOpenAIChat,
+				airunwayv1alpha1.APIFormatOpenAIResponses,
+				airunwayv1alpha1.APIFormatAnthropicMessages,
+			},
 				GPUSupport:  true,
 				RequiresCRD: &requiresCRD,
 			},
diff --git a/providers/llmd/config_test.go b/providers/llmd/config_test.go
@@ -36,8 +36,25 @@ func TestGetProviderConfigSpec(t *testing.T) {
 	}
 
 	// API formats (per-engine)
-	if len(vllmCap.APIFormats) != 1 || vllmCap.APIFormats[0] != airunwayv1alpha1.APIFormatOpenAIChat {
-		t.Errorf("expected vllm to support openai-chat API format")
+	expectedVLLMFormats := []airunwayv1alpha1.APIFormat{
+		airunwayv1alpha1.APIFormatOpenAIChat,
+		airunwayv1alpha1.APIFormatOpenAIResponses,
+		airunwayv1alpha1.APIFormatAnthropicMessages,
+	}
+	if len(vllmCap.APIFormats) != len(expectedVLLMFormats) {
+		t.Fatalf("expected vllm to support %d API formats, got %d", len(expectedVLLMFormats), len(vllmCap.APIFormats))
+	}
+	for _, expected := range expectedVLLMFormats {
+		found := false
+		for _, actual := range vllmCap.APIFormats {
+			if actual == expected {
+				found = true
+				break
+			}
+		}
+		if !found {
+			t.Errorf("expected vllm to support API format %s", expected)
+		}
 	}
 
 	// Serving modes (per-engine)

Original file line number	Diff line number	Diff line change
`@@ -38,7 +38,7 @@ func TestGetProviderConfigSpec(t *testing.T) {`
`38`	`38`	`t.Fatalf("expected vllm to support 2 serving modes, got %d", len(vllmCap.ServingModes))`
`39`	`39`	`}`
`40`	`40`	`if len(vllmCap.APIFormats) != 1 \|\| vllmCap.APIFormats[0] != airunwayv1alpha1.APIFormatOpenAIChat {`
`41`		`- t.Errorf("expected vllm to support openai-chat API format")`
	`41`	`+ t.Errorf("expected vllm to support only openai-chat API format, got %v", vllmCap.APIFormats)`
`42`	`42`	`}`
`43`	`43`
`44`	`44`	`if len(spec.SelectionRules) != 1 {`