@@ -591,7 +591,8 @@ spec:
591591 alive or ready to receive traffic.
592592 properties :
593593 exec :
594- description : Exec specifies the action to take.
594+ description : Exec specifies a command to execute
595+ in the container.
595596 properties :
596597 command :
597598 description : |-
@@ -612,8 +613,7 @@ spec:
612613 format : int32
613614 type : integer
614615 grpc :
615- description : GRPC specifies an action involving
616- a GRPC port.
616+ description : GRPC specifies a GRPC HealthCheckRequest.
617617 properties :
618618 port :
619619 description : Port number of the gRPC service.
@@ -632,7 +632,7 @@ spec:
632632 - port
633633 type : object
634634 httpGet :
635- description : HTTPGet specifies the http request
635+ description : HTTPGet specifies an HTTP GET request
636636 to perform.
637637 properties :
638638 host :
@@ -700,7 +700,7 @@ spec:
700700 format : int32
701701 type : integer
702702 tcpSocket :
703- description : TCPSocket specifies an action involving
703+ description : TCPSocket specifies a connection to
704704 a TCP port.
705705 properties :
706706 host :
@@ -776,6 +776,32 @@ spec:
776776 type : string
777777 type : object
778778 type : object
779+ multiNode :
780+ description : MultiNode specifies the multi-node configuration for NIMService using LeaderWorkerSet.
781+ properties :
782+ clusterStartTimeout :
783+ default : 300
784+ description : ClusterStartTimeout specifies the timeout
785+ in seconds for starting the cluster.
786+ type : integer
787+ gpusPerNode :
788+ default : 1
789+ description : GPUsPerNode specifies the number of GPUs
790+ for each pod. In most cases, this should match `resources.limits.nvidia.com/gpu`.
791+ type : integer
792+ workers :
793+ default : 2
794+ description : Workers specifies how many worker pods
795+ per multi-node replica to launch.
796+ minimum : 2
797+ type : integer
798+ required :
799+ - clusterStartTimeout
800+ type : object
801+ x-kubernetes-validations :
802+ - message : scale.enabled must be false when multiNode is
803+ not nil
804+ rule : ' !has(self.multiNode) || !self.scale.enabled'
779805 nodeSelector :
780806 additionalProperties :
781807 type : string
@@ -1166,7 +1192,8 @@ spec:
11661192 alive or ready to receive traffic.
11671193 properties :
11681194 exec :
1169- description : Exec specifies the action to take.
1195+ description : Exec specifies a command to execute
1196+ in the container.
11701197 properties :
11711198 command :
11721199 description : |-
@@ -1187,8 +1214,7 @@ spec:
11871214 format : int32
11881215 type : integer
11891216 grpc :
1190- description : GRPC specifies an action involving
1191- a GRPC port.
1217+ description : GRPC specifies a GRPC HealthCheckRequest.
11921218 properties :
11931219 port :
11941220 description : Port number of the gRPC service.
@@ -1207,7 +1233,7 @@ spec:
12071233 - port
12081234 type : object
12091235 httpGet :
1210- description : HTTPGet specifies the http request
1236+ description : HTTPGet specifies an HTTP GET request
12111237 to perform.
12121238 properties :
12131239 host :
@@ -1275,7 +1301,7 @@ spec:
12751301 format : int32
12761302 type : integer
12771303 tcpSocket :
1278- description : TCPSocket specifies an action involving
1304+ description : TCPSocket specifies a connection to
12791305 a TCP port.
12801306 properties :
12811307 host :
@@ -1531,7 +1557,6 @@ spec:
15311557 each pod of the current scale target (e.g. CPU or memory). Such metrics are
15321558 built in to Kubernetes, and have special scaling options on top of those
15331559 available to normal per-pod metrics using the "pods" source.
1534- This is an alpha feature and can be enabled by the HPAContainerMetrics feature flag.
15351560 properties :
15361561 container :
15371562 description : container is the name of
@@ -1994,8 +2019,6 @@ spec:
19942019 description : |-
19952020 type is the type of metric source. It should be one of "ContainerResource", "External",
19962021 "Object", "Pods" or "Resource", each mapping to a matching field in the object.
1997- Note: "ContainerResource" type is available on when the feature-gate
1998- HPAContainerMetrics is enabled
19992022 type : string
20002023 required :
20012024 - type
@@ -2022,7 +2045,8 @@ spec:
20222045 alive or ready to receive traffic.
20232046 properties :
20242047 exec :
2025- description : Exec specifies the action to take.
2048+ description : Exec specifies a command to execute
2049+ in the container.
20262050 properties :
20272051 command :
20282052 description : |-
@@ -2043,8 +2067,7 @@ spec:
20432067 format : int32
20442068 type : integer
20452069 grpc :
2046- description : GRPC specifies an action involving
2047- a GRPC port.
2070+ description : GRPC specifies a GRPC HealthCheckRequest.
20482071 properties :
20492072 port :
20502073 description : Port number of the gRPC service.
@@ -2063,7 +2086,7 @@ spec:
20632086 - port
20642087 type : object
20652088 httpGet :
2066- description : HTTPGet specifies the http request
2089+ description : HTTPGet specifies an HTTP GET request
20672090 to perform.
20682091 properties :
20692092 host :
@@ -2131,7 +2154,7 @@ spec:
21312154 format : int32
21322155 type : integer
21332156 tcpSocket :
2134- description : TCPSocket specifies an action involving
2157+ description : TCPSocket specifies a connection to
21352158 a TCP port.
21362159 properties :
21372160 host :
0 commit comments