Skip to content

Commit 412f835

Browse files
committed
Updates artifacts for v1.1.0-rc.1 release
Signed-off-by: Kellen Swain <[email protected]>
1 parent 6f84d17 commit 412f835

File tree

12 files changed

+22
-22
lines changed

12 files changed

+22
-22
lines changed

config/charts/body-based-routing/values.yaml

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -3,8 +3,8 @@ bbr:
33
replicas: 1
44
image:
55
name: bbr
6-
hub: us-central1-docker.pkg.dev/k8s-staging-images/gateway-api-inference-extension
7-
tag: main
6+
hub: registry.k8s.io/gateway-api-inference-extension
7+
tag: v1.1.0-rc.1
88
pullPolicy: Always
99
port: 9004
1010
healthCheckPort: 9005

config/charts/inferencepool/values.yaml

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -2,8 +2,8 @@ inferenceExtension:
22
replicas: 1
33
image:
44
name: epp
5-
hub: us-central1-docker.pkg.dev/k8s-staging-images/gateway-api-inference-extension
6-
tag: main
5+
hub: registry.k8s.io/gateway-api-inference-extension
6+
tag: v1.1.0-rc.1
77
pullPolicy: Always
88
extProcPort: 9002
99
env: []

config/crd/bases/inference.networking.k8s.io_inferencepools.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -3,7 +3,7 @@ kind: CustomResourceDefinition
33
metadata:
44
annotations:
55
api-approved.kubernetes.io: https://github.com/kubernetes-sigs/gateway-api-inference-extension/pull/1173
6-
inference.networking.k8s.io/bundle-version: main-dev
6+
inference.networking.k8s.io/bundle-version: v1.1.0-rc.1
77
name: inferencepools.inference.networking.k8s.io
88
spec:
99
group: inference.networking.k8s.io

config/crd/bases/inference.networking.x-k8s.io_inferenceobjectives.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -2,7 +2,7 @@ apiVersion: apiextensions.k8s.io/v1
22
kind: CustomResourceDefinition
33
metadata:
44
annotations:
5-
inference.networking.k8s.io/bundle-version: main-dev
5+
inference.networking.k8s.io/bundle-version: v1.1.0-rc.1
66
name: inferenceobjectives.inference.networking.x-k8s.io
77
spec:
88
group: inference.networking.x-k8s.io

config/crd/bases/inference.networking.x-k8s.io_inferencepoolimports.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -2,7 +2,7 @@ apiVersion: apiextensions.k8s.io/v1
22
kind: CustomResourceDefinition
33
metadata:
44
annotations:
5-
inference.networking.k8s.io/bundle-version: main-dev
5+
inference.networking.k8s.io/bundle-version: v1.1.0-rc.1
66
name: inferencepoolimports.inference.networking.x-k8s.io
77
spec:
88
group: inference.networking.x-k8s.io

config/crd/bases/inference.networking.x-k8s.io_inferencepools.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -3,7 +3,7 @@ kind: CustomResourceDefinition
33
metadata:
44
annotations:
55
api-approved.kubernetes.io: unapproved, experimental-only
6-
inference.networking.k8s.io/bundle-version: main-dev
6+
inference.networking.k8s.io/bundle-version: v1.1.0-rc.1
77
name: inferencepools.inference.networking.x-k8s.io
88
spec:
99
group: inference.networking.x-k8s.io

config/manifests/vllm/cpu-deployment.yaml

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -14,8 +14,8 @@ spec:
1414
spec:
1515
containers:
1616
- name: lora
17-
image: "public.ecr.aws/q9t5s3a7/vllm-cpu-release-repo:v0.8.5" # formal images can be found in https://gallery.ecr.aws/q9t5s3a7/vllm-cpu-release-repo
18-
imagePullPolicy: Always
17+
image: "public.ecr.aws/q9t5s3a7/vllm-cpu-release-repo:v0.9.3" # formal images can be found in https://gallery.ecr.aws/q9t5s3a7/vllm-cpu-release-repo
18+
imagePullPolicy: IfNotPresent
1919
command: ["python3", "-m", "vllm.entrypoints.openai.api_server"]
2020
args:
2121
- "--model"
@@ -77,8 +77,8 @@ spec:
7777
- name: lora-adapter-syncer
7878
tty: true
7979
stdin: true
80-
image: us-central1-docker.pkg.dev/k8s-staging-images/gateway-api-inference-extension/lora-syncer:main
81-
restartPolicy: Always
80+
image: registry.k8s.io/gateway-api-inference-extension/lora-syncer:v1.1.0-rc.1
81+
restartPolicy: Always
8282
imagePullPolicy: Always
8383
env:
8484
- name: DYNAMIC_LORA_ROLLOUT_CONFIG

config/manifests/vllm/gpu-deployment.yaml

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -15,7 +15,7 @@ spec:
1515
containers:
1616
- name: vllm
1717
image: "vllm/vllm-openai:v0.8.5"
18-
imagePullPolicy: Always
18+
imagePullPolicy: IfNotPresent
1919
command: ["python3", "-m", "vllm.entrypoints.openai.api_server"]
2020
args:
2121
- "--model"
@@ -155,8 +155,8 @@ spec:
155155
- name: lora-adapter-syncer
156156
tty: true
157157
stdin: true
158-
image: us-central1-docker.pkg.dev/k8s-staging-images/gateway-api-inference-extension/lora-syncer:main
159-
restartPolicy: Always
158+
image: registry.k8s.io/gateway-api-inference-extension/lora-syncer:v1.1.0-rc.1
159+
restartPolicy: Always
160160
imagePullPolicy: Always
161161
env:
162162
- name: DYNAMIC_LORA_ROLLOUT_CONFIG

config/manifests/vllm/sim-deployment.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -15,7 +15,7 @@ spec:
1515
containers:
1616
- name: vllm-sim
1717
image: ghcr.io/llm-d/llm-d-inference-sim:v0.5.0
18-
imagePullPolicy: Always
18+
imagePullPolicy: IfNotPresent
1919
args:
2020
- --model
2121
- meta-llama/Llama-3.1-8B-Instruct

conformance/resources/base.yaml

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -200,8 +200,8 @@ spec:
200200
terminationGracePeriodSeconds: 130
201201
containers:
202202
- name: epp
203-
image: us-central1-docker.pkg.dev/k8s-staging-images/gateway-api-inference-extension/epp:v1.0.0
204-
imagePullPolicy: Always
203+
image: registry.k8s.io/gateway-api-inference-extension/epp:v1.1.0-rc.1
204+
imagePullPolicy: IfNotPresent
205205
args:
206206
- --pool-name
207207
- "primary-inference-pool"
@@ -298,8 +298,8 @@ spec:
298298
terminationGracePeriodSeconds: 130
299299
containers:
300300
- name: epp
301-
image: us-central1-docker.pkg.dev/k8s-staging-images/gateway-api-inference-extension/epp:v1.0.0
302-
imagePullPolicy: Always
301+
image: registry.k8s.io/gateway-api-inference-extension/epp:v1.1.0-rc.1
302+
imagePullPolicy: IfNotPresent
303303
args:
304304
- --pool-name
305305
- "secondary-inference-pool"

0 commit comments

Comments
 (0)