Use correct image for VLLM CPU runtime (#650)

sheltoncyril · web-flow · commit c9fc5aa685ca · 2025-09-29T08:32:25.000-04:00
* fix: use the right vLLM CPU image for disconnected

* fix: guardrails tests now handle empty (null) warnings/detections in the response

* fix: guardrails fix
diff --git a/tests/model_explainability/guardrails/conftest.py b/tests/model_explainability/guardrails/conftest.py
@@ -129,7 +129,7 @@ def vllm_runtime(
         template_name=RuntimeTemplates.VLLM_CUDA,
         deployment_type=KServeDeploymentType.RAW_DEPLOYMENT,
         runtime_image="quay.io/rh-aiservices-bu/vllm-cpu-openai-ubi9"
-        "@sha256:d680ff8becb6bbaf83dfee7b2d9b8a2beb130db7fd5aa7f9a6d8286a58cebbfd",
+        "@sha256:ada6b3ba98829eb81ae4f89364d9b431c0222671eafb9a04aa16f31628536af2",
         containers={
             "kserve-container": {
                 "args": [
diff --git a/tests/model_explainability/guardrails/test_guardrails.py b/tests/model_explainability/guardrails/test_guardrails.py
@@ -114,7 +114,7 @@ def test_guardrails_builtin_detectors_unsuitable_output(
             url=f"https://{guardrails_orchestrator_route.host}{PII_ENDPOINT}{OpenAIEnpoints.CHAT_COMPLETIONS}",
             headers=get_auth_headers(token=current_client_token),
             json=get_chat_payload(
-                content="Hi, write three and only three examples of email adresses "
+                content="Hi, write three and only three examples of email addresses "
                 "that I can use to create an account for an online service."
                 "Don't provide any additional explanation."
             ),
diff --git a/tests/model_explainability/guardrails/utils.py b/tests/model_explainability/guardrails/utils.py
@@ -146,24 +146,25 @@ def verify_builtin_detector_unsuitable_output_response(
 
     unsuitable_output_warning = "UNSUITABLE_OUTPUT"
     warnings = response_data.get("warnings", [])
-    if len(warnings) != 1:
-        errors.append(f"Expected 1 warning in response, got {len(warnings)}")
-    elif warnings[0]["type"] != unsuitable_output_warning:
-        errors.append(f"Expected warning type {unsuitable_output_warning}, got {warnings[0]['type']}")
-
-    output_detections = response_data.get("detections", {}).get("output", [])
-
-    if len(output_detections) < 1:
-        errors.append(f"Expected at least one output detection, but got {len(output_detections)}.")
-    else:
-        errors.extend(
-            verify_detection(
-                detections_list=output_detections,
-                detector_id=detector_id,
-                detection_name=detection_name,
-                detection_type=detection_type,
+    if warnings is not None:
+        if len(warnings) != 1:
+            errors.append(f"Expected 1 warning in response, got {len(warnings)}")
+        elif warnings[0]["type"] != unsuitable_output_warning:
+            errors.append(f"Expected warning type {unsuitable_output_warning}, got {warnings[0]['type']}")
+    output_detections = response_data.get("detections", {})
+    if output_detections is not None:
+        output_detections = output_detections.get("output", [])
+        if len(output_detections) < 1:
+            errors.append(f"Expected at least one output detection, but got {len(output_detections)}.")
+        else:
+            errors.extend(
+                verify_detection(
+                    detections_list=output_detections,
+                    detector_id=detector_id,
+                    detection_name=detection_name,
+                    detection_type=detection_type,
+                )
             )
-        )
 
     assert_no_errors(errors=errors, failure_message_prefix="Unsuitable output detection verification failed")
 
diff --git a/tests/model_explainability/lm_eval/conftest.py b/tests/model_explainability/lm_eval/conftest.py
@@ -325,6 +325,12 @@ def lmeval_minio_copy_pod(
                 "command": ["/bin/sh", "-c"],
                 "args": ["cp -r /mnt/data /shared"],
                 "volumeMounts": [{"name": "shared-data", "mountPath": "/shared"}],
+                "securityContext": {
+                    "allowPrivilegeEscalation": False,
+                    "capabilities": {"drop": ["ALL"]},
+                    "runAsNonRoot": True,
+                    "seccompProfile": {"type": "RuntimeDefault"},
+                },
             }
         ],
         containers=[
@@ -338,7 +344,14 @@ def lmeval_minio_copy_pod(
                     "mc mb --ignore-existing myminio/models &&\n"
                     "mc cp --recursive /shared/data/ myminio/models"
                 ],
+                "env": [{"name": "MC_CONFIG_DIR", "value": "/tmp/.mc"}],
                 "volumeMounts": [{"name": "shared-data", "mountPath": "/shared"}],
+                "securityContext": {
+                    "allowPrivilegeEscalation": False,
+                    "capabilities": {"drop": ["ALL"]},
+                    "runAsNonRoot": True,
+                    "seccompProfile": {"type": "RuntimeDefault"},
+                },
             }
         ],
         wait_for_resource=True,