File tree Expand file tree Collapse file tree 2 files changed +12
-14
lines changed
config/charts/inferencepool Expand file tree Collapse file tree 2 files changed +12
-14
lines changed Original file line number Diff line number Diff line change 1- {{- range .Values.inferencePool.inferenceObjectives }}
2- {{- $group := "inference.networking.k8s.io" -}}
3- {{- if eq $.Values.inferencePool.apiVersion "inference.networking.x-k8s.io/v1alpha2" -}}
4- {{- $group = "inference.networking.x-k8s.io" -}}
5- {{- end -}}
1+ {{- range .Values.inferenceObjectives }}
62---
73apiVersion : inference.networking.x-k8s.io/v1alpha2
84kind : InferenceObjective
Original file line number Diff line number Diff line change @@ -167,15 +167,7 @@ inferencePool:
167167 # This will soon be deprecated when upstream GW providers support v1, just doing something simple for now.
168168 targetPortNumber : 8000
169169
170- # Optional: Define multiple InferenceObjectives for this InferencePool.
171- # Each InferenceObjective associates a name and priority with this InferencePool.
172- # Users reference these objectives by name in their request headers.
173- # inferenceObjectives:
174- # - name: high-priority
175- # priority: 1
176- # - name: low-priority
177- # priority: 5
178- inferenceObjectives : []
170+
179171
180172# Options: ["gke", "istio", "none"]
181173provider :
@@ -209,3 +201,13 @@ istio:
209201 # connectionPool:
210202 # http:
211203 # maxRequestsPerConnection: 256000
204+
205+
206+ # Optional: Define multiple InferenceObjectives for this InferencePool.
207+ # Each InferenceObjective associates a name and priority with this InferencePool.
208+ # Users reference these objectives by name in their request headers.
209+ inferenceObjectives : []
210+ # - name: high-priority
211+ # priority: 1
212+ # - name: low-priority
213+ # priority: 5
You can’t perform that action at this time.
0 commit comments