skip tests conditionally + linting

threcc · threcc · commit 066ea91feb57 · 2026-03-27T14:41:06.000+01:00
Signed-off-by: threcc <trecchiu@redhat.com>
diff --git a/tests/model_serving/model_server/llmd/test_llmd_auth.py b/tests/model_serving/model_server/llmd/test_llmd_auth.py
@@ -33,7 +33,10 @@ def test_llmisvc_authorized(self, llmisvc_auth_pair):
 
         for entry in [entry_a, entry_b]:
             status, body = send_chat_completions(
-                llmisvc=entry.service, prompt=prompt, token=entry.token, insecure=False
+                llmisvc=entry.service,
+                prompt=prompt,
+                token=entry.token,
+                insecure=False,
             )
             assert status == 200, f"Authorized request failed with {status}: {body}"
             completion = parse_completion_text(response_body=body)
diff --git a/tests/model_serving/model_server/llmd/test_llmd_connection_cpu.py b/tests/model_serving/model_server/llmd/test_llmd_connection_cpu.py
@@ -21,7 +21,7 @@
     ],
     indirect=True,
 )
-@pytest.mark.usefixtures("valid_aws_config")
+@pytest.mark.usefixtures("valid_aws_config", "skip_if_disconnected")
 class TestLlmdConnectionCpu:
     """Deploy TinyLlama on CPU via S3 and HuggingFace and verify chat completions."""
 
diff --git a/tests/model_serving/model_server/llmd/test_llmd_connection_gpu.py b/tests/model_serving/model_server/llmd/test_llmd_connection_gpu.py
@@ -21,7 +21,7 @@
     ],
     indirect=True,
 )
-@pytest.mark.usefixtures("valid_aws_config", "skip_if_no_gpu_available")
+@pytest.mark.usefixtures("valid_aws_config", "skip_if_no_gpu_available", "skip_if_disconnected")
 class TestLlmdConnectionGpu:
     """Deploy Qwen on GPU via S3 and HuggingFace and verify chat completions."""
 
diff --git a/tests/model_serving/model_server/llmd/test_llmd_no_scheduler.py b/tests/model_serving/model_server/llmd/test_llmd_no_scheduler.py
@@ -26,7 +26,7 @@ def router_config(cls):
     [({"name": NAMESPACE}, S3GpuNoSchedulerConfig)],
     indirect=True,
 )
-@pytest.mark.usefixtures("valid_aws_config", "skip_if_no_gpu_available")
+@pytest.mark.usefixtures("valid_aws_config", "skip_if_no_gpu_available", "skip_if_disconnected")
 class TestLlmdNoScheduler:
     """Deploy Qwen on GPU with the scheduler disabled and verify chat completions."""
 
diff --git a/tests/model_serving/model_server/llmd/test_llmd_prefill_decode.py b/tests/model_serving/model_server/llmd/test_llmd_prefill_decode.py
@@ -18,7 +18,7 @@
     [({"name": NAMESPACE}, PrefillDecodeConfig)],
     indirect=True,
 )
-@pytest.mark.usefixtures("valid_aws_config", "skip_if_no_gpu_available")
+@pytest.mark.usefixtures("valid_aws_config", "skip_if_no_gpu_available", "skip_if_disconnected")
 class TestLlmdPrefillDecode:
     """Deploy Qwen on GPU with prefill-decode disaggregation and verify chat completions."""
 
diff --git a/tests/model_serving/model_server/llmd/test_llmd_singlenode_estimated_prefix_cache.py b/tests/model_serving/model_server/llmd/test_llmd_singlenode_estimated_prefix_cache.py
@@ -30,7 +30,7 @@
     [({"name": NAMESPACE}, EstimatedPrefixCacheConfig)],
     indirect=True,
 )
-@pytest.mark.usefixtures("valid_aws_config", "skip_if_less_than_2_gpus")
+@pytest.mark.usefixtures("valid_aws_config", "skip_if_less_than_2_gpus", "skip_if_disconnected")
 class TestSingleNodeEstimatedPrefixCache:
     """Deploy Qwen on GPU with 2 replicas and estimated prefix cache routing,
     then verify cache hits via Prometheus metrics.
@@ -58,7 +58,10 @@ def test_singlenode_estimated_prefix_cache(
         assert len(workload_pods) == 2, f"Expected 2 workload pods, found {len(workload_pods)}"
 
         successful = send_prefix_cache_requests(
-            llmisvc=llmisvc, prompt=PREFIX_CACHE_PROMPT, token=llmisvc_token, count=NUM_REQUESTS
+            llmisvc=llmisvc,
+            prompt=PREFIX_CACHE_PROMPT,
+            token=llmisvc_token,
+            count=NUM_REQUESTS,
         )
         assert successful == NUM_REQUESTS, f"Expected all {NUM_REQUESTS} requests to succeed, got {successful}"
 
diff --git a/tests/model_serving/model_server/llmd/test_llmd_singlenode_precise_prefix_cache.py b/tests/model_serving/model_server/llmd/test_llmd_singlenode_precise_prefix_cache.py
@@ -31,7 +31,7 @@
     [({"name": NAMESPACE}, PrecisePrefixCacheConfig)],
     indirect=True,
 )
-@pytest.mark.usefixtures("valid_aws_config", "skip_if_less_than_2_gpus")
+@pytest.mark.usefixtures("valid_aws_config", "skip_if_less_than_2_gpus", "skip_if_disconnected")
 class TestSingleNodePrecisePrefixCache:
     """Deploy Qwen on GPU with 2 replicas and precise prefix cache routing,
     then verify cache hits via Prometheus metrics.
@@ -60,7 +60,10 @@ def test_singlenode_precise_prefix_cache(
         assert len(workload_pods) == 2, f"Expected 2 workload pods, found {len(workload_pods)}"
 
         successful = send_prefix_cache_requests(
-            llmisvc=llmisvc, prompt=PREFIX_CACHE_PROMPT, token=llmisvc_token, count=NUM_REQUESTS
+            llmisvc=llmisvc,
+            prompt=PREFIX_CACHE_PROMPT,
+            token=llmisvc_token,
+            count=NUM_REQUESTS,
         )
         assert successful == NUM_REQUESTS, f"Expected all {NUM_REQUESTS} requests to succeed, got {successful}"
 

Original file line number	Diff line number	Diff line change
`@@ -21,7 +21,7 @@`
`21`	`21`	`],`
`22`	`22`	`indirect=True,`
`23`	`23`	`)`
`24`		`-@pytest.mark.usefixtures("valid_aws_config")`
	`24`	`+@pytest.mark.usefixtures("valid_aws_config", "skip_if_disconnected")`
`25`	`25`	`class TestLlmdConnectionCpu:`
`26`	`26`	`"""Deploy TinyLlama on CPU via S3 and HuggingFace and verify chat completions."""`
`27`	`27`
Original file line number	Diff line number	Diff line change
`@@ -26,7 +26,7 @@ def router_config(cls):`
`26`	`26`	`[({"name": NAMESPACE}, S3GpuNoSchedulerConfig)],`
`27`	`27`	`indirect=True,`
`28`	`28`	`)`
`29`		`-@pytest.mark.usefixtures("valid_aws_config", "skip_if_no_gpu_available")`
	`29`	`+@pytest.mark.usefixtures("valid_aws_config", "skip_if_no_gpu_available", "skip_if_disconnected")`
`30`	`30`	`class TestLlmdNoScheduler:`
`31`	`31`	`"""Deploy Qwen on GPU with the scheduler disabled and verify chat completions."""`
`32`	`32`
Original file line number	Diff line number	Diff line change
`@@ -18,7 +18,7 @@`
`18`	`18`	`[({"name": NAMESPACE}, PrefillDecodeConfig)],`
`19`	`19`	`indirect=True,`
`20`	`20`	`)`
`21`		`-@pytest.mark.usefixtures("valid_aws_config", "skip_if_no_gpu_available")`
	`21`	`+@pytest.mark.usefixtures("valid_aws_config", "skip_if_no_gpu_available", "skip_if_disconnected")`
`22`	`22`	`class TestLlmdPrefillDecode:`
`23`	`23`	`"""Deploy Qwen on GPU with prefill-decode disaggregation and verify chat completions."""`
`24`	`24`