6 files changed: +6 -12 lines changed
Original file line number | Diff line number | Diff line change
69 69 app: ${POOL_NAME}
70 70 llm-d.ai/role: decode
71 71 spec:
72 - initContainers:
72 + containers:
73 73 - name: routing-sidecar
74 74 image: ${SIDECAR_IMAGE}
75 75 imagePullPolicy: IfNotPresent
@@ -110,7 +110,6 @@ spec:
110 110 valueFrom:
111 111 fieldRef:
112 112 fieldPath: status.podIP
113 - containers:
114 113 - name: vllm
115 114 image: ${VLLM_SIMULATOR_IMAGE}
116 115 imagePullPolicy: IfNotPresent
Original file line number | Diff line number | Diff line change
14 14 labels:
15 15 app: ${POOL_NAME}
16 16 spec:
17 - initContainers:
17 + containers:
18 18 - name: routing-sidecar
19 19 image: ${SIDECAR_IMAGE}
20 20 imagePullPolicy: IfNotPresent
55 55 valueFrom:
56 56 fieldRef:
57 57 fieldPath: status.podIP
58 - containers:
59 58 - name: vllm
60 59 image: ${VLLM_SIMULATOR_IMAGE}
61 60 imagePullPolicy: IfNotPresent
Original file line number | Diff line number | Diff line change
15 15 app: ${POOL_NAME}
16 16 llm-d.ai/role: decode
17 17 spec:
18 - initContainers:
18 + containers:
19 19 - name: routing-sidecar
20 20 image: ${SIDECAR_IMAGE}
21 21 imagePullPolicy: IfNotPresent
39 39 valueFrom:
40 40 fieldRef:
41 41 fieldPath: status.podIP
42 - containers:
43 42 - name: vllm
44 43 image: ${VLLM_SIMULATOR_IMAGE}
45 44 imagePullPolicy: IfNotPresent
Original file line number | Diff line number | Diff line change
58 58 app: ${POOL_NAME}
59 59 llm-d.ai/role: decode
60 60 spec:
61 - initContainers:
61 + containers:
62 62 - name: routing-sidecar
63 63 image: ${SIDECAR_IMAGE}
64 64 imagePullPolicy: IfNotPresent
72 72 - containerPort: 8000
73 73 protocol: TCP
74 74 restartPolicy: Always
75 - containers:
76 75 - name: vllm
77 76 image: ${VLLM_SIMULATOR_IMAGE}
78 77 imagePullPolicy: IfNotPresent
Original file line number | Diff line number | Diff line change
@@ -3,7 +3,7 @@ kind: Pod
3 3 metadata:
4 4 name: qwen2-0--5b
5 5 spec:
6 - initContainers:
6 + containers:
7 7 - name: routing-proxy
8 8 image: routing-proxy
9 9 args:
22 22 # - "true"
23 23 # initialDelaySeconds: 1
24 24 # periodSeconds: 360
25 - containers:
26 25 - name: vllm
27 26 image: vllm/vllm-openai:v0.8.2
28 27 args:
Original file line number | Diff line number | Diff line change
17 17 operator: In
18 18 values:
19 19 - NVIDIA-A100-SXM4-80GB
20 - initContainers:
20 + containers:
21 21 - name: routing-proxy
22 22 image: routing-proxy
23 23 securityContext:
33 33 protocol: TCP
34 34 restartPolicy: Always
35 35 imagePullPolicy: Always
36 - containers:
37 36 - name: vllm
38 37 image: vllm-openai
39 38 securityContext:
You can’t perform that action at this time.
0 commit comments