Skip to content

Commit 35f4570

Browse files
committed
move routing-sidecar from initContainer to a regular container
1 parent 1519a28 commit 35f4570

File tree

6 files changed

+6
-12
lines changed

6 files changed

+6
-12
lines changed

deploy/components/vllm-sim-pd/deployments.yaml

Lines changed: 1 addition & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -69,7 +69,7 @@ spec:
6969
app: ${POOL_NAME}
7070
llm-d.ai/role: decode
7171
spec:
72-
initContainers:
72+
containers:
7373
- name: routing-sidecar
7474
image: ${SIDECAR_IMAGE}
7575
imagePullPolicy: IfNotPresent
@@ -110,7 +110,6 @@ spec:
110110
valueFrom:
111111
fieldRef:
112112
fieldPath: status.podIP
113-
containers:
114113
- name: vllm
115114
image: ${VLLM_SIMULATOR_IMAGE}
116115
imagePullPolicy: IfNotPresent

deploy/components/vllm-sim/deployments.yaml

Lines changed: 1 addition & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -14,7 +14,7 @@ spec:
1414
labels:
1515
app: ${POOL_NAME}
1616
spec:
17-
initContainers:
17+
containers:
1818
- name: routing-sidecar
1919
image: ${SIDECAR_IMAGE}
2020
imagePullPolicy: IfNotPresent
@@ -55,7 +55,6 @@ spec:
5555
valueFrom:
5656
fieldRef:
5757
fieldPath: status.podIP
58-
containers:
5958
- name: vllm
6059
image: ${VLLM_SIMULATOR_IMAGE}
6160
imagePullPolicy: IfNotPresent

test/e2e/yaml/vllm-sim-dp.yaml

Lines changed: 1 addition & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -15,7 +15,7 @@ spec:
1515
app: ${POOL_NAME}
1616
llm-d.ai/role: decode
1717
spec:
18-
initContainers:
18+
containers:
1919
- name: routing-sidecar
2020
image: ${SIDECAR_IMAGE}
2121
imagePullPolicy: IfNotPresent
@@ -39,7 +39,6 @@ spec:
3939
valueFrom:
4040
fieldRef:
4141
fieldPath: status.podIP
42-
containers:
4342
- name: vllm
4443
image: ${VLLM_SIMULATOR_IMAGE}
4544
imagePullPolicy: IfNotPresent

test/e2e/yaml/vllm-sim-pd.yaml

Lines changed: 1 addition & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -58,7 +58,7 @@ spec:
5858
app: ${POOL_NAME}
5959
llm-d.ai/role: decode
6060
spec:
61-
initContainers:
61+
containers:
6262
- name: routing-sidecar
6363
image: ${SIDECAR_IMAGE}
6464
imagePullPolicy: IfNotPresent
@@ -72,7 +72,6 @@ spec:
7272
- containerPort: 8000
7373
protocol: TCP
7474
restartPolicy: Always
75-
containers:
7675
- name: vllm
7776
image: ${VLLM_SIMULATOR_IMAGE}
7877
imagePullPolicy: IfNotPresent

test/sidecar/config/base/pod-qwen.yaml

Lines changed: 1 addition & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -3,7 +3,7 @@ kind: Pod
33
metadata:
44
name: qwen2-0--5b
55
spec:
6-
initContainers:
6+
containers:
77
- name: routing-proxy
88
image: routing-proxy
99
args:
@@ -22,7 +22,6 @@ spec:
2222
# - "true"
2323
# initialDelaySeconds: 1
2424
# periodSeconds: 360
25-
containers:
2625
- name: vllm
2726
image: vllm/vllm-openai:v0.8.2
2827
args:

test/sidecar/config/nixl/qwen-decoder-pod.yaml

Lines changed: 1 addition & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -17,7 +17,7 @@ spec:
1717
operator: In
1818
values:
1919
- NVIDIA-A100-SXM4-80GB
20-
initContainers:
20+
containers:
2121
- name: routing-proxy
2222
image: routing-proxy
2323
securityContext:
@@ -33,7 +33,6 @@ spec:
3333
protocol: TCP
3434
restartPolicy: Always
3535
imagePullPolicy: Always
36-
containers:
3736
- name: vllm
3837
image: vllm-openai
3938
securityContext:

0 commit comments

Comments
 (0)