Skip to content

Commit 4c1f949

Browse files
committed
Make vLLM port number explicit in InferenceServerConfig
Signed-off-by: Jun Duan <jun.duan.phd@outlook.com>
1 parent c070b6d commit 4c1f949

File tree

3 files changed

+23
-2
lines changed

3 files changed

+23
-2
lines changed

api/fma/v1alpha1/inferenceserverconfig_types.go

Lines changed: 5 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -33,7 +33,11 @@ type InferenceServerConfigSpec struct {
3333

3434
// ModelServerConfig defines the configuration for a model server
3535
type ModelServerConfig struct {
36-
// Options are the vLLM startup options
36+
// Port is the port on which the vLLM server will listen
37+
// In particular, management of vLLM instances' sleep state is done through this port
38+
Port int32 `json:"port"`
39+
40+
// Options are the vLLM startup options, excluding Port
3741
// +optional
3842
Options string `json:"options,omitempty"`
3943

config/crd/fma.llm-d.ai_inferenceserverconfigs.yaml

Lines changed: 9 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -66,8 +66,16 @@ spec:
6666
type: string
6767
type: object
6868
options:
69-
description: Options are the vLLM startup options
69+
description: Options are the vLLM startup options, excluding Port
7070
type: string
71+
port:
72+
description: |-
73+
Port is the port on which the vLLM server will listen
74+
In particular, management of vLLM instances' sleep state is done through this port
75+
format: int32
76+
type: integer
77+
required:
78+
- port
7179
type: object
7280
required:
7381
- launcherConfigName

pkg/generated/applyconfiguration/fma/v1alpha1/modelserverconfig.go

Lines changed: 9 additions & 0 deletions
Some generated files are not rendered by default. Learn more about customizing how changed files appear on GitHub.

0 commit comments

Comments
 (0)