Skip to content

Commit a051054

Browse files
committed
improve naming
1 parent 3c86b86 commit a051054

File tree

2 files changed: +6 −8 lines changed

tests/model_serving/model_server/llmd/test_singlenode_precise_prefix_cache.py

Lines changed: 5 additions & 7 deletions
Original file line number | Diff line number | Diff line change
@@ -20,7 +20,7 @@
     get_llmd_workload_pods,
     verify_gateway_status,
     verify_llm_service_status,
-    verify_singlenode_prefix_cache_routing,
+    verify_singlenode_precise_prefix_cache_routing,
 )
 from simple_logger.logger import get_logger
 
@@ -31,7 +31,7 @@
 
 @pytest.mark.parametrize(
     "unprivileged_model_namespace",
-    [pytest.param({"name": "singlenode-prefix-cache-test"})],
+    [pytest.param({"name": "llmd-singlenode-prefix-cache-test"})],
     indirect=True,
 )
 @pytest.mark.parametrize(
@@ -60,23 +60,21 @@ def test_singlenode_precise_prefix_cache(
     if gpu_count_on_cluster < 2:
         pytest.skip(f"Test requires at least 2 GPUs (found {gpu_count_on_cluster})")
 
-    # Verify gateway and service are ready
+    # Verify infrastructure is ready before testing routing
     assert verify_gateway_status(llmd_gateway), "Gateway should be ready"
     assert verify_llm_service_status(singlenode_precise_prefix_cache), "LLMInferenceService should be ready"
 
-    # Verify router-scheduler pod exists and is running
     router_scheduler_pod = get_llmd_router_scheduler_pod(
         client=unprivileged_client, llmisvc=singlenode_precise_prefix_cache
     )
     assert router_scheduler_pod is not None, "Router-scheduler pod should exist"
     assert router_scheduler_pod.instance.status.phase == "Running", "Router-scheduler pod should be running"
 
-    # Verify workload pods
     workload_pods = get_llmd_workload_pods(client=unprivileged_client, llmisvc=singlenode_precise_prefix_cache)
     assert len(workload_pods) == 2, f"Expected 2 workload pods, found {len(workload_pods)}"
 
-    # Test prefix cache routing (includes assertions for routing affinity)
-    verify_singlenode_prefix_cache_routing(
+    # Verify prefix cache routing behavior
+    verify_singlenode_precise_prefix_cache_routing(
         llmisvc=singlenode_precise_prefix_cache,
         token=authenticated_llmisvc_token,
         workload_pods=workload_pods,

tests/model_serving/model_server/llmd/utils.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -313,7 +313,7 @@ def get_pod_that_handled_request(workload_pods: list[Pod], baseline_counts: dict
     return None
 
 
-def verify_singlenode_prefix_cache_routing(
+def verify_singlenode_precise_prefix_cache_routing(
     llmisvc: LLMInferenceService,
     token: str,
     workload_pods: list[Pod],

0 commit comments

Comments
 (0)