Skip to content

Commit b2d1f04

Browse files
committed
Improvements to the launcher-based tests
Signed-off-by: Jun Duan <jun.duan.phd@outlook.com>
1 parent baef9d8 commit b2d1f04

File tree

2 files changed

+2
-11
lines changed

2 files changed

+2
-11
lines changed

test/e2e/mkobjs.sh

Lines changed: 0 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -17,7 +17,6 @@ spec:
1717
options: "--model HuggingFaceTB/SmolLM2-360M-Instruct"
1818
env_vars:
1919
VLLM_SERVER_DEV_MODE: "1"
20-
VLLM_USE_V1: "1"
2120
VLLM_LOGGING_LEVEL: "DEBUG"
2221
VLLM_CPU_KVCACHE_SPACE: "1" # GiB
2322
labels:
@@ -38,7 +37,6 @@ spec:
3837
options: "--model Qwen/Qwen2.5-0.5B-Instruct"
3938
env_vars:
4039
VLLM_SERVER_DEV_MODE: "1"
41-
VLLM_USE_V1: "1"
4240
VLLM_LOGGING_LEVEL: "DEBUG"
4341
VLLM_CPU_KVCACHE_SPACE: "1" # GiB
4442
labels:
@@ -59,7 +57,6 @@ spec:
5957
options: "--model TinyLlama/TinyLlama-1.1B-Chat-v1.0"
6058
env_vars:
6159
VLLM_SERVER_DEV_MODE: "1"
62-
VLLM_USE_V1: "1"
6360
VLLM_LOGGING_LEVEL: "DEBUG"
6461
VLLM_CPU_KVCACHE_SPACE: "1" # GiB
6562
labels:

test/e2e/run-launcher-based.sh

Lines changed: 2 additions & 8 deletions
Original file line number | Diff line number | Diff line change
@@ -278,12 +278,9 @@ expect '[ "$(kubectl get pod $reqlb3 -o jsonpath={.metadata.labels.dual-pods\\.l
278278
# Verify launcher is bound to new requester
279279
expect '[ "$(kubectl get pod $launcherlb -o jsonpath={.metadata.labels.dual-pods\\.llm-d\\.ai/dual})" == "$reqlb3" ]'
280280

281-
# Verify the new requester is using isc2
282-
expect '[ "$(kubectl get pod $reqlb3 -o jsonpath={.metadata.annotations.dual-pods\\.llm-d\\.ai/inference-server-config})" == "'$isc2'" ]'
283-
284281
# Wait for requester to be ready (launcher should already be ready)
285282
date
286-
kubectl wait --for condition=Ready pod/$reqlb3 --timeout=30s
283+
kubectl wait --for condition=Ready pod/$reqlb3 --timeout=120s
287284
kubectl wait --for condition=Ready pod/$launcherlb --timeout=5s
288285

289286
cheer Successful multiple instances sharing one launcher
@@ -321,12 +318,9 @@ expect '[ "$(kubectl get pod $reqlb4 -o jsonpath={.metadata.labels.dual-pods\\.l
321318
# Verify launcher is bound to new requester
322319
expect '[ "$(kubectl get pod $launcherlb -o jsonpath={.metadata.labels.dual-pods\\.llm-d\\.ai/dual})" == "$reqlb4" ]'
323320

324-
# Verify the new requester is using original isc
325-
expect '[ "$(kubectl get pod $reqlb4 -o jsonpath={.metadata.annotations.dual-pods\\.llm-d\\.ai/inference-server-config})" == "'$isc'" ]'
326-
327321
# Wait for requester to be ready (launcher should already be ready)
328322
date
329-
kubectl wait --for condition=Ready pod/$reqlb4 --timeout=30s
323+
kubectl wait --for condition=Ready pod/$reqlb4 --timeout=120s
330324
kubectl wait --for condition=Ready pod/$launcherlb --timeout=5s
331325

332326
cheer Successful switching instances in one launcher

0 commit comments

Comments
 (0)