|
"""
Test module for the Python model served by Triton via KServe.

Validates inference using REST and gRPC protocols with both raw and serverless deployment modes.
"""
| 6 | + |
| 7 | +from typing import Any |
| 8 | + |
| 9 | +import pytest |
| 10 | +from ocp_resources.inference_service import InferenceService |
| 11 | +from ocp_resources.pod import Pod |
| 12 | +from simple_logger.logger import get_logger |
| 13 | + |
| 14 | +from utilities.constants import Protocols |
| 15 | +from tests.model_serving.model_runtime.triton.basic_model_deployment.utils import validate_inference_request, load_json |
| 16 | +from tests.model_serving.model_runtime.triton.constant import ( |
| 17 | + BASE_RAW_DEPLOYMENT_CONFIG, |
| 18 | + BASE_SERVERLESS_DEPLOYMENT_CONFIG, |
| 19 | + MODEL_PATH_PREFIX, |
| 20 | + TRITON_GRPC_PYTHON_INPUT_PATH, |
| 21 | + TRITON_REST_PYTHON_INPUT_PATH, |
| 22 | +) |
| 23 | + |
LOGGER = get_logger(name=__name__)

# Name of the model directory as registered with the Triton model repository.
PYTHON_MODEL_NAME = "python"

# Storage location handed to the s3_models_storage_uri fixture.
# NOTE: the original wrapped MODEL_PATH_PREFIX in a redundant f-string
# (f"{MODEL_PATH_PREFIX}"); the constant is used directly instead.
MODEL_STORAGE_URI_DICT = {"model-dir": MODEL_PATH_PREFIX}

# Fixtures required by every test in this module: working directory, AWS
# credentials, and both (REST and gRPC) Triton serving-runtime templates.
pytestmark = pytest.mark.usefixtures(
    "root_dir", "valid_aws_config", "triton_rest_serving_runtime_template", "triton_grpc_serving_runtime_template"
)
| 33 | + |
| 34 | + |
def _python_model_params() -> list:
    """Build the pytest.param matrix: {raw, serverless} x {REST, gRPC} deployments."""
    matrix = []
    for mode, base_config in (
        ("raw", BASE_RAW_DEPLOYMENT_CONFIG),
        ("serverless", BASE_SERVERLESS_DEPLOYMENT_CONFIG),
    ):
        for proto_label, proto in (("rest", Protocols.REST), ("grpc", Protocols.GRPC)):
            matrix.append(
                pytest.param(
                    {"protocol_type": proto},
                    {"name": f"python-{mode}"},
                    MODEL_STORAGE_URI_DICT,
                    {**base_config},
                    {"name": f"python-{mode}-{proto_label}", **base_config},
                    id=f"python-{mode}-{proto_label}-deployment",
                )
            )
    return matrix


@pytest.mark.parametrize(
    ("protocol", "model_namespace", "s3_models_storage_uri", "triton_serving_runtime", "triton_inference_service"),
    _python_model_params(),
    indirect=True,
)
class TestPythonModel:
    """
    Test class for python inference using Triton on KServe.

    Covers:
    - REST and gRPC protocols
    - Raw and serverless modes
    - Snapshot validation of inference results
    """

    def test_python_inference(
        self,
        triton_inference_service: InferenceService,
        triton_pod_resource: Pod,
        triton_response_snapshot: Any,
        protocol: str,
        root_dir: str,
    ) -> None:
        """
        Run inference and validate against snapshot.

        Args:
            triton_inference_service: The deployed InferenceService object
            triton_pod_resource: The pod running the model server
            triton_response_snapshot: Expected response snapshot
            protocol: REST or gRPC
            root_dir: Root directory for test execution
        """
        # Each protocol ships its own canned request payload.
        if protocol == Protocols.GRPC:
            query_path = TRITON_GRPC_PYTHON_INPUT_PATH
        else:
            query_path = TRITON_REST_PYTHON_INPUT_PATH
        payload = load_json(path=query_path)

        validate_inference_request(
            pod_name=triton_pod_resource.name,
            isvc=triton_inference_service,
            response_snapshot=triton_response_snapshot,
            input_query=payload,
            model_name=PYTHON_MODEL_NAME,
            protocol=protocol,
            root_dir=root_dir,
        )
0 commit comments