Merge branch 'main' into trustyai-upgrade

rnetser · web-flow · commit 4a5b1c921893 · 2025-04-26T11:58:51.000+03:00
diff --git a/.github/workflows/add-remove-labels.yml b/.github/workflows/add-remove-labels.yml
@@ -37,7 +37,7 @@ jobs:
       - uses: actions/checkout@v4
 
       - name: Install uv
-        uses: astral-sh/setup-uv@v5
+        uses: astral-sh/setup-uv@v6
 
       - name: Run add remove labels
         env:
diff --git a/.github/workflows/add-welcome-comment-set-assignee.yml b/.github/workflows/add-welcome-comment-set-assignee.yml
@@ -15,7 +15,7 @@ jobs:
       - uses: actions/checkout@v4
 
       - name: Install uv
-        uses: astral-sh/setup-uv@v5
+        uses: astral-sh/setup-uv@v6
 
       - name: Run add welcome comment
         env:
diff --git a/.github/workflows/on-review-add-label.yml b/.github/workflows/on-review-add-label.yml
@@ -80,7 +80,7 @@ jobs:
       - uses: actions/checkout@v4
 
       - name: Install uv
-        uses: astral-sh/setup-uv@v5
+        uses: astral-sh/setup-uv@v6
       - name: 'Run add-remove-labels action'
         env:
           GITHUB_TOKEN: ${{ secrets.OPENDATAHUB_TESTS_BOT_PAT }}
diff --git a/.github/workflows/size-labeler.yml b/.github/workflows/size-labeler.yml
@@ -15,7 +15,7 @@ jobs:
       - uses: actions/checkout@v4
 
       - name: Install uv
-        uses: astral-sh/setup-uv@v5
+        uses: astral-sh/setup-uv@v6
 
       - name: Run size labeler
         env:
diff --git a/.github/workflows/tox-tests.yml b/.github/workflows/tox-tests.yml
@@ -12,7 +12,7 @@ jobs:
     - uses: actions/checkout@v4
 
     - name: Install uv
-      uses: astral-sh/setup-uv@v5
+      uses: astral-sh/setup-uv@v6
 
     - name: Install tox-uv
       run: |
diff --git a/pyproject.toml b/pyproject.toml
@@ -66,7 +66,7 @@ dependencies = [
     "openshift-python-wrapper>=11.0.38",
     "semver>=3.0.4",
     "pytest-order>=1.3.0",
-    "marshmallow==3.26.1",  # this version is needed for pytest-jira
+    "marshmallow==3.26.1,<4", # this version is needed for pytest-jira
 ]
 
 [project.urls]
diff --git a/tests/model_serving/model_server/authentication/test_model_mesh_authentication.py b/tests/model_serving/model_server/authentication/test_model_mesh_authentication.py
@@ -25,7 +25,6 @@
 class TestModelMeshAuthentication:
     """Model Mesh Authentication is based on the created Service; cross-model authentication is not blocked"""
 
-    @pytest.mark.ocp_interop
     @pytest.mark.dependency(name="test_model_mesh_model_authentication_openvino_inference_with_tensorflow")
     def test_model_mesh_model_authentication_openvino_inference_with_tensorflow(
         self,
diff --git a/tests/model_serving/model_server/conftest.py b/tests/model_serving/model_server/conftest.py
@@ -368,16 +368,18 @@ def ovms_kserve_inference_service(
     if env_vars := request.param.get("env-vars"):
         isvc_kwargs["model_env_variables"] = env_vars
 
-    if min_replicas := request.param.get("min-replicas"):
+    if (min_replicas := request.param.get("min-replicas")) is not None:
         isvc_kwargs["min_replicas"] = min_replicas
+        if min_replicas == 0:
+            isvc_kwargs["wait_for_predictor_pods"] = False
 
     if max_replicas := request.param.get("max-replicas"):
         isvc_kwargs["max_replicas"] = max_replicas
 
     if scale_metric := request.param.get("scale-metric"):
         isvc_kwargs["scale_metric"] = scale_metric
 
-    if scale_target := request.param.get("scale-target"):
+    if (scale_target := request.param.get("scale-target")) is not None:
         isvc_kwargs["scale_target"] = scale_target
 
     with create_isvc(**isvc_kwargs) as isvc:
diff --git a/tests/model_serving/model_server/model_mesh/test_model_mesh_multi_models.py b/tests/model_serving/model_server/model_mesh/test_model_mesh_multi_models.py
@@ -10,15 +10,16 @@
 from utilities.inference_utils import Inference
 from utilities.manifests.openvino import OPENVINO_INFERENCE_CONFIG
 
-pytestmark = [pytest.mark.modelmesh, pytest.mark.sanity]
+pytestmark = [pytest.mark.modelmesh, pytest.mark.sanity, pytest.mark.ocp_interop]
 
 
 @pytest.mark.parametrize(
-    "model_namespace, http_s3_openvino_model_mesh_inference_service, "
+    "model_namespace, http_s3_ovms_model_mesh_serving_runtime, http_s3_openvino_model_mesh_inference_service, "
     "http_s3_openvino_second_model_mesh_inference_service",
     [
         pytest.param(
             {"name": "model-mesh-multi-model", "modelmesh-enabled": True},
+            {"enable_external_route": True},
             {"model-path": ModelStoragePath.OPENVINO_EXAMPLE_MODEL},
             {
                 "model-path": ModelStoragePath.OPENVINO_VEHICLE_DETECTION,
diff --git a/tests/model_serving/model_server/serverless/test_zero_initial_scale.py b/tests/model_serving/model_server/serverless/test_zero_initial_scale.py
@@ -0,0 +1,93 @@
+import pytest
+from ocp_resources.deployment import Deployment
+
+from tests.model_serving.model_server.serverless.constants import (
+    ONNX_SERVERLESS_INFERENCE_SERVICE_CONFIG,
+)
+from tests.model_serving.model_server.serverless.utils import verify_no_inference_pods
+from tests.model_serving.model_server.utils import verify_inference_response
+from utilities.constants import (
+    Protocols,
+    RunTimeConfigs,
+)
+from utilities.exceptions import DeploymentValidationError
+from utilities.general import create_isvc_label_selector_str
+from utilities.inference_utils import Inference
+from utilities.manifests.onnx import ONNX_INFERENCE_CONFIG
+
+pytestmark = [
+    pytest.mark.serverless,
+    pytest.mark.sanity,
+    pytest.mark.usefixtures("valid_aws_config"),
+]
+
+
+@pytest.mark.serverless
+@pytest.mark.parametrize(
+    "model_namespace, ovms_kserve_serving_runtime, ovms_kserve_inference_service",
+    [
+        pytest.param(
+            {"name": "serverless-initial-scale-zero"},
+            RunTimeConfigs.ONNX_OPSET13_RUNTIME_CONFIG,
+            {
+                **ONNX_SERVERLESS_INFERENCE_SERVICE_CONFIG,
+                "min-replicas": 0,
+            },
+        )
+    ],
+    indirect=True,
+)
+class TestServerlessInitialScaleZero:
+    @pytest.mark.dependency(name="test_no_serverless_pods_created_for_zero_initial_scale")
+    def test_no_serverless_pods_created_for_zero_initial_scale(self, admin_client, ovms_kserve_inference_service):
+        """Verify no pods are created when inference service initial scale is zero, i.e. zero min-replicas requested."""
+        verify_no_inference_pods(client=admin_client, isvc=ovms_kserve_inference_service)
+
+    @pytest.mark.dependency(name="test_no_serverless_replicas_created_for_zero_initial_scale")
+    def test_no_serverless_replicas_created_for_zero_initial_scale(
+        self, admin_client, ovms_kserve_inference_service, ovms_kserve_serving_runtime
+    ):
+        """Verify replica count is zero when inference service initial scale is zero."""
+        labels = [
+            "serving.knative.dev/configurationGeneration=1",
+            create_isvc_label_selector_str(
+                isvc=ovms_kserve_inference_service,
+                resource_type="deployment",
+                runtime_name=ovms_kserve_serving_runtime.name,
+            ),
+        ]
+
+        deployments = list(
+            Deployment.get(
+                label_selector=",".join(labels), client=admin_client, namespace=ovms_kserve_inference_service.namespace
+            )
+        )
+
+        if not deployments:
+            raise DeploymentValidationError(
+                f"Inference Service {ovms_kserve_inference_service.name} new deployment not found"
+            )
+
+        if deployments[0].instance.spec.replicas == 0:
+            deployments[0].wait_for_replicas(deployed=False)
+            return
+
+        raise DeploymentValidationError(
+            f"Inference Service {ovms_kserve_inference_service.name} deployment should have 0 replicas when created"
+        )
+
+    @pytest.mark.dependency(
+        depends=[
+            "test_no_serverless_pods_created_for_zero_initial_scale",
+            "test_no_serverless_replicas_created_for_zero_initial_scale",
+        ]
+    )
+    def test_serverless_inference_after_zero_initial_scale(self, ovms_kserve_inference_service):
+        """Verify model can be queried after being created with an initial scale of zero."""
+        verify_inference_response(
+            inference_service=ovms_kserve_inference_service,
+            inference_config=ONNX_INFERENCE_CONFIG,
+            inference_type=Inference.INFER,
+            protocol=Protocols.HTTPS,
+            use_default_query=True,
+        )
diff --git a/uv.lock b/uv.lock

Original file line number	Diff line number	Diff line change
`@@ -66,7 +66,7 @@ dependencies = [`
`66`	`66`	`"openshift-python-wrapper>=11.0.38",`
`67`	`67`	`"semver>=3.0.4",`
`68`	`68`	`"pytest-order>=1.3.0",`
`69`		`- "marshmallow==3.26.1", # this version is needed for pytest-jira`
	`69`	`+ "marshmallow==3.26.1,<4", # this version is needed for pytest-jira`
`70`	`70`	`]`
`71`	`71`
`72`	`72`	`[project.urls]`