test: update filter options validation for numeric properties (#886)

fege · dbasunag · web-flow · commit e2ae95a15ce2 · 2025-12-01T14:28:31.000Z
* test: update filter options validation for numeric properties

- Update SQL query to match new materialized views
- Add support for numeric properties with range validation (double_value, int_value)
- Update property naming convention for artifact properties (artifacts.{name}.{type})
- Add metricsType and model_id to excluded filter fields

* fix: add back the test_idp_user fixture to properly test the non-admin user case

---------

Co-authored-by: Debarati Basu-Nag <dbasunag@redhat.com>
diff --git a/tests/model_registry/model_catalog/db_constants.py b/tests/model_registry/model_catalog/db_constants.py
@@ -1,38 +1,49 @@
 # Constants useful for querying the model catalog database and parsing its responses
 
 # SQL query for filter_options endpoint database validation
-# Replicates the exact database query used by GetFilterableProperties for the filter_options endpoint
-# in kubeflow/model-registry catalog/internal/db/service/catalog_model.go
-# Note: Uses dynamic type_id lookup via 'kf.CatalogModel' name since type_id appears to be dynamic
+# Queries materialized views (context_property_options, artifact_property_options) that aggregate
+# filterable properties for CatalogModel. Based on GetFilterableProperties in
+# kubeflow/model-registry catalog/internal/db/service/catalog_model.go (PR #1875)
+#
+# Property naming:
+# - Context properties: base name only (special case: 'validated_on.array_value' for arrays)
+# - Artifact properties: 'artifacts.{name}.{type}' where type is string_value/array_value/double_value/int_value
+#
+# Return format:
+# - String/array properties: text array of values
+# - Numeric properties: 2-element text array [min, max] converted from double/int columns
 FILTER_OPTIONS_DB_QUERY = """
-SELECT name, array_agg(string_value) FROM (
-    SELECT
-        name,
-        string_value
-    FROM "ContextProperty" WHERE
-        context_id IN (
-            SELECT id FROM "Context" WHERE type_id = (
-                SELECT id FROM "Type" WHERE name = 'kf.CatalogModel'
-            )
-        )
-        AND string_value IS NOT NULL
-        AND string_value != ''
-        AND string_value IS NOT JSON ARRAY
+SELECT
+    CASE
+        WHEN name = 'validated_on' AND array_value IS NOT NULL THEN name || '.array_value'
+        ELSE name
+    END AS name,
+    COALESCE(string_value, array_value, '{}'::text[]) AS array_agg
+FROM context_property_options
+WHERE type_id = (SELECT id FROM "Type" WHERE name = 'kf.CatalogModel')
 
-    UNION
+UNION ALL
 
-    SELECT
-        name,
-        json_array_elements_text(string_value::json) AS string_value
-    FROM "ContextProperty" WHERE
-        context_id IN (
-            SELECT id FROM "Context" WHERE type_id = (
-                SELECT id FROM "Type" WHERE name = 'kf.CatalogModel'
-            )
-        )
-        AND string_value IS JSON ARRAY
-)
-GROUP BY name HAVING MAX(CHAR_LENGTH(string_value)) <= 100;
+SELECT
+    'artifacts.' ||
+    CASE
+        WHEN string_value IS NOT NULL THEN name || '.string_value'
+        WHEN array_value IS NOT NULL THEN name || '.array_value'
+        WHEN min_double_value IS NOT NULL THEN name || '.double_value'
+        WHEN min_int_value IS NOT NULL THEN name || '.int_value'
+        ELSE name
+    END AS name,
+    CASE
+        WHEN min_double_value IS NOT NULL THEN
+            ARRAY[min_double_value::text, max_double_value::text]
+        WHEN min_int_value IS NOT NULL THEN
+            ARRAY[min_int_value::text, max_int_value::text]
+        ELSE
+            COALESCE(string_value, array_value, '{}'::text[])
+    END AS array_agg
+FROM artifact_property_options
+
+ORDER BY name;
 """
 
 # SQL query for search functionality database validation
@@ -155,5 +166,12 @@
 """
 
 # Fields that are explicitly filtered out by the filter_options endpoint API
-# From db_catalog.go:204-206 in kubeflow/model-registry GetFilterOptions method
-API_EXCLUDED_FILTER_FIELDS = {"source_id", "logo", "license_link"}
+# From db_catalog.go in kubeflow/model-registry GetFilterOptions method
+# Updated with PR #1875 to include metricsType and model_id exclusions
+API_EXCLUDED_FILTER_FIELDS = {
+    "source_id",
+    "logo",
+    "license_link",
+    "artifacts.metricsType.string_value",  # artifact property with full name
+    "artifacts.model_id.string_value",  # artifact property with full name
+}
diff --git a/tests/model_registry/model_catalog/test_filter_options_endpoint.py b/tests/model_registry/model_catalog/test_filter_options_endpoint.py
@@ -95,7 +95,6 @@ def test_filter_options_endpoint_validation(
         ],
         indirect=["user_token_for_api_calls"],
     )
-    @pytest.mark.xfail(strict=True, reason="RHOAIENG-37069: backend/API discrepancy expected")
     def test_comprehensive_coverage_against_database(
         self: Self,
         model_catalog_rest_url: list[str],
diff --git a/tests/model_registry/model_catalog/utils.py b/tests/model_registry/model_catalog/utils.py
@@ -417,32 +417,71 @@ def compare_filter_options_with_database(
     # Log detailed comparison for each property
     for prop_name in sorted(set(expected_properties.keys()) | set(api_filters.keys())):
         if prop_name in expected_properties and prop_name in api_filters:
-            db_values = set(expected_properties[prop_name])
-            api_values = set(api_filters[prop_name]["values"])
-
-            missing_values = db_values - api_values
-            extra_values = api_values - db_values
-
-            if missing_values:
-                error_msg = (
-                    f"Property '{prop_name}': DB has {len(missing_values)} values missing from API: {missing_values}"
-                )
-                LOGGER.error(error_msg)
-                comparison_errors.append(error_msg)
-            if extra_values:
-                error_msg = (
-                    f"Property '{prop_name}': API has {len(extra_values)} values missing from DB: {extra_values}"
-                )
-                LOGGER.error(error_msg)
-                comparison_errors.append(error_msg)
-            if not missing_values and not extra_values:
-                LOGGER.info(f"Property '{prop_name}': Perfect match ({len(api_values)} values)")
+            db_data = expected_properties[prop_name]
+            api_filter = api_filters[prop_name]
+
+            # Check if this is a numeric property (has "range" in API response)
+            if "range" in api_filter:
+                # Numeric property: DB has [min, max] as 2-element array
+                if len(db_data) == 2:
+                    try:
+                        db_min, db_max = float(db_data[0]), float(db_data[1])
+                        api_min = api_filter["range"]["min"]
+                        api_max = api_filter["range"]["max"]
+
+                        if db_min != api_min or db_max != api_max:
+                            error_msg = (
+                                f"Property '{prop_name}': Range mismatch - DB: [{db_min}, {db_max}], "
+                                f"API: [{api_min}, {api_max}]"
+                            )
+                            LOGGER.error(error_msg)
+                            comparison_errors.append(error_msg)
+                        else:
+                            LOGGER.info(f"Property '{prop_name}': Perfect range match (min={api_min}, max={api_max})")
+                    except (ValueError, TypeError) as e:
+                        error_msg = f"Property '{prop_name}': Failed to parse numeric values - {e}"
+                        LOGGER.error(error_msg)
+                        comparison_errors.append(error_msg)
+                else:
+                    error_msg = f"Property '{prop_name}': Expected 2 values for range, got {len(db_data)}"
+                    LOGGER.error(error_msg)
+                    comparison_errors.append(error_msg)
+            else:
+                # String/array property: compare values as sets
+                db_values = set(db_data)
+                api_values = set(api_filter["values"])
+
+                missing_values = db_values - api_values
+                extra_values = api_values - db_values
+
+                if missing_values:
+                    error_msg = (
+                        f"Property '{prop_name}': DB has {len(missing_values)} "
+                        f"values missing from API: {missing_values}"
+                    )
+                    LOGGER.error(error_msg)
+                    comparison_errors.append(error_msg)
+                if extra_values:
+                    error_msg = (
+                        f"Property '{prop_name}': API has {len(extra_values)} values missing from DB: {extra_values}"
+                    )
+                    LOGGER.error(error_msg)
+                    comparison_errors.append(error_msg)
+                if not missing_values and not extra_values:
+                    LOGGER.info(f"Property '{prop_name}': Perfect match ({len(api_values)} values)")
         elif prop_name in expected_properties:
             error_msg = f"Property '{prop_name}': In DB ({len(expected_properties[prop_name])} values) but NOT in API"
             LOGGER.error(error_msg)
             comparison_errors.append(error_msg)
         elif prop_name in api_filters:
-            error_msg = f"Property '{prop_name}': In API ({len(api_filters[prop_name]['values'])} values) but NOT in DB"
+            LOGGER.info(f"Property name: '{prop_name}' in API filters: {api_filters[prop_name]}")
+            # For properties only in API, we can't reliably get DB values, so skip logging them
+            if "range" in api_filters[prop_name]:
+                error_msg = f"Property '{prop_name}': In API (range property) but NOT in DB"
+            else:
+                error_msg = (
+                    f"Property '{prop_name}': In API ({len(api_filters[prop_name]['values'])} values) but NOT in DB"
+                )
             LOGGER.error(error_msg)
             comparison_errors.append(error_msg)
 

Original file line number	Diff line number	Diff line change
`@@ -95,7 +95,6 @@ def test_filter_options_endpoint_validation(`
`95`	`95`	`],`
`96`	`96`	`indirect=["user_token_for_api_calls"],`
`97`	`97`	`)`
`98`		`- @pytest.mark.xfail(strict=True, reason="RHOAIENG-37069: backend/API discrepancy expected")`
`99`	`98`	`def test_comprehensive_coverage_against_database(`
`100`	`99`	`self: Self,`
`101`	`100`	`model_catalog_rest_url: list[str],`