Skip to content

Commit 0889693

Browse files
committed
Add configurable gateway replicas via gateway.gatewayParameters.replicas
Signed-off-by: nicole-lihui <nicole.li@daocloud.io>
1 parent 4f0f8d0 commit 0889693

File tree

6 files changed

+20
-0
lines changed

6 files changed

+20
-0
lines changed

charts/llm-d-infra/README.md

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -122,6 +122,7 @@ Kubernetes: `>= 1.28.0-0`
122122
| gateway.gatewayParameters.istio | Istio-specific parameters rendered into the gateway ConfigMap when gateway.provider resolves to "istio" | object | `{"accessLogging":true}` |
123123
| gateway.gatewayParameters.istio.accessLogging | Whether Istio access logging is enabled | bool | `true` |
124124
| gateway.gatewayParameters.logLevel | Log level for provider-managed gateway data plane components | string | `"warn"` |
125+
| gateway.gatewayParameters.replicas | Number of replicas for the gateway | int | `1` |
125126
| gateway.gatewayParameters.resources | Resource requests/limits <br /> Ref: https://kubernetes.io/docs/concepts/configuration/manage-resources-containers/#resource-requests-and-limits-of-pod-and-container | object | `{"limits":{"cpu":"2","memory":"1Gi"},"requests":{"cpu":"100m","memory":"128Mi"}}` |
126127
| gateway.labels | Additional labels provided to the Gateway resource | object | `{}` |
127128
| gateway.listeners | Set of listeners exposed via the Gateway, also propagated to the Ingress if enabled | list | `[{"allowedRoutes":{"namespaces":{"from":"All"}},"name":"default","port":80,"protocol":"HTTP"}]` |

charts/llm-d-infra/templates/gateway-infrastructure/agentgatewayparameters.yaml

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -47,4 +47,7 @@ spec:
4747
{{- if .Values.gateway.service.loadBalancerClass }}
4848
loadBalancerClass: {{ .Values.gateway.service.loadBalancerClass | quote }}
4949
{{- end }}
50+
deployment:
51+
spec:
52+
replicas: {{ .Values.gateway.gatewayParameters.replicas }}
5053
{{- end}}

charts/llm-d-infra/templates/gateway-infrastructure/configmap.yaml

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -22,6 +22,7 @@ data:
2222
{{- if eq $provider "istio" }}
2323
deployment: |
2424
spec:
25+
replicas: {{ .Values.gateway.gatewayParameters.replicas }}
2526
template:
2627
spec:
2728
containers:

charts/llm-d-infra/values.schema.json

Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -241,6 +241,12 @@
241241
"required": [],
242242
"title": "logLevel"
243243
},
244+
"replicas": {
245+
"default": "1",
246+
"description": "Number of replicas for the gateway",
247+
"required": [],
248+
"title": "replicas"
249+
},
244250
"resources": {
245251
"description": "ResourceRequirements describes the compute resource requirements.",
246252
"properties": {

charts/llm-d-infra/values.schema.tmpl.json

Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -241,6 +241,12 @@
241241
"required": [],
242242
"title": "logLevel"
243243
},
244+
"replicas": {
245+
"default": "1",
246+
"description": "Number of replicas for the gateway",
247+
"required": [],
248+
"title": "replicas"
249+
},
244250
"resources": {
245251
"$ref": "https://raw.githubusercontent.com/yannh/kubernetes-json-schema/master/master/_definitions.json#/definitions/io.k8s.api.core.v1.ResourceRequirements",
246252
"description": "Resource requests/limits \u003cbr /\u003e Ref: https://kubernetes.io/docs/concepts/configuration/manage-resources-containers/#resource-requests-and-limits-of-pod-and-container",

charts/llm-d-infra/values.yaml

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -98,6 +98,9 @@ gateway:
9898
# -- Log level for provider-managed gateway data plane components
9999
logLevel: warn
100100

101+
# -- Number of replicas for the gateway
102+
replicas: 1
103+
101104
# @schema
102105
# $ref: https://raw.githubusercontent.com/yannh/kubernetes-json-schema/master/master/_definitions.json#/definitions/io.k8s.api.core.v1.ResourceRequirements
103106
# @schema

0 commit comments

Comments
 (0)