Skip to content

Commit 1309792

Browse files
[Standup] Compatibility with the new istio (1.28.1) (llm-d#567)
* [Standup] Compatibility with the new `istio` (1.28.1)

  Signed-off-by: maugustosilva <maugusto.silva@gmail.com>

* Make `istio` the default for `LLMDBENCH_VLLM_MODELSERVICE_GATEWAY_CLASS_NAME`

  Signed-off-by: maugustosilva <maugusto.silva@gmail.com>

---------

Signed-off-by: maugustosilva <maugusto.silva@gmail.com>
1 parent dac6929 commit 1309792

7 files changed

Lines changed: 29 additions & 25 deletions

File tree

.github/actions/markdown-link-checker/action.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -7,7 +7,7 @@ inputs:
77
args:
88
description: Arguments to pass to markdown-link-check
99
required: false
10-
default: "--quiet --retry"
10+
default: "--retry"
1111

1212
runs:
1313
using: "composite"

README.md

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -7,8 +7,8 @@ This repository provides an automated workflow for benchmarking LLM inference us
77
Provide a single source of automation for repeatable and reproducible experiments and performance evaluation on `llm-d`.
88

99

10-
## Prerequisites
11-
Please refer to the official [llm-d prerequisites](https://github.com/llm-d/llm-d?tab=readme-ov-file#pre-requisites) for the most up-to-date requirements.
10+
## Prerequisites
11+
Please refer to the official [llm-d prerequisites](https://github.com/llm-d/llm-d/blob/main/README.md#pre-requisites) for the most up-to-date requirements.
1212
For the client setup, the provided `install-deps.sh` will download and install the necessary tools.
1313

1414
### Administrative Requirements

setup/env.sh

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -91,8 +91,8 @@ export LLMDBENCH_DEPLOY_METHODS=${LLMDBENCH_DEPLOY_METHODS:-"modelservice"}
9191
# Gateway provider specific variables
9292
export LLMDBENCH_GATEWAY_PROVIDER_KGATEWAY_HELM_REPOSITORY_URL=${LLMDBENCH_GATEWAY_PROVIDER_KGATEWAY_HELM_REPOSITORY_URL:-"oci://cr.kgateway.dev/kgateway-dev/charts"}
9393
export LLMDBENCH_GATEWAY_PROVIDER_KGATEWAY_CHART_VERSION=${LLMDBENCH_GATEWAY_PROVIDER_KGATEWAY_CHART_VERSION:-"v2.0.3"}
94-
export LLMDBENCH_GATEWAY_PROVIDER_ISTIO_HELM_REPOSITORY_URL=${LLMDBENCH_GATEWAY_PROVIDER_ISTIO_HELM_REPOSITORY_URL:-"oci://gcr.io/istio-testing/charts"}
95-
export LLMDBENCH_GATEWAY_PROVIDER_ISTIO_CHART_VERSION=${LLMDBENCH_GATEWAY_PROVIDER_ISTIO_CHART_VERSION:-"1.28-alpha.89f30b26ba71bf5e538083a4720d0bc2d8c06401"}
94+
export LLMDBENCH_GATEWAY_PROVIDER_ISTIO_HELM_REPOSITORY_URL=${LLMDBENCH_GATEWAY_PROVIDER_ISTIO_HELM_REPOSITORY_URL:-"https://istio-release.storage.googleapis.com/charts"}
95+
export LLMDBENCH_GATEWAY_PROVIDER_ISTIO_CHART_VERSION=${LLMDBENCH_GATEWAY_PROVIDER_ISTIO_CHART_VERSION:-"1.28.1"}
9696

9797
# Applicable to both standalone and modelservice
9898
export LLMDBENCH_IGNORE_FAILED_VALIDATION="${LLMDBENCH_IGNORE_FAILED_VALIDATION:-true}" # default is to continue deployment if validation fails
@@ -187,7 +187,7 @@ export LLMDBENCH_VLLM_MODELSERVICE_CHART_NAME=${LLMDBENCH_VLLM_MODELSERVICE_CHAR
187187
export LLMDBENCH_VLLM_MODELSERVICE_HELM_REPOSITORY=${LLMDBENCH_VLLM_MODELSERVICE_HELM_REPOSITORY:-"llm-d-modelservice"}
188188
export LLMDBENCH_VLLM_MODELSERVICE_HELM_REPOSITORY_URL=${LLMDBENCH_VLLM_MODELSERVICE_HELM_REPOSITORY_URL:-"https://llm-d-incubation.github.io/llm-d-modelservice/"}
189189
export LLMDBENCH_VLLM_MODELSERVICE_URI_PROTOCOL=${LLMDBENCH_VLLM_MODELSERVICE_URI_PROTOCOL:-"pvc"}
190-
export LLMDBENCH_VLLM_MODELSERVICE_GATEWAY_CLASS_NAME=${LLMDBENCH_VLLM_MODELSERVICE_GATEWAY_CLASS_NAME:-kgateway}
190+
export LLMDBENCH_VLLM_MODELSERVICE_GATEWAY_CLASS_NAME=${LLMDBENCH_VLLM_MODELSERVICE_GATEWAY_CLASS_NAME:-"istio"}
191191
export LLMDBENCH_VLLM_MODELSERVICE_GATEWAY_SERVICE_TYPE=${LLMDBENCH_VLLM_MODELSERVICE_GATEWAY_SERVICE_TYPE:-NodePort}
192192
export LLMDBENCH_VLLM_MODELSERVICE_ROUTE=${LLMDBENCH_VLLM_MODELSERVICE_ROUTE:-false}
193193
# Endpoint Picker Parameters

setup/steps/02_ensure_gateway_provider.py

Lines changed: 16 additions & 12 deletions
Original file line numberDiff line numberDiff line change
@@ -113,7 +113,7 @@ def get_latest_chart_version(
113113

114114
if result.returncode != 0:
115115
if verbose:
116-
announce(f" Helm search failed: {result.stderr}")
116+
announce(f"ERROR: Helm search failed: {result.stderr}")
117117
return ""
118118

119119
# Parse output to get version (equivalent to: tail -1 | awk '{print $2}')
@@ -269,7 +269,7 @@ def install_kgateway(
269269
install_cmd = f"helmfile apply -f {helmfile_path}"
270270
ecode = llmdbench_execute_cmd(actual_cmd=install_cmd, dry_run=ev["control_dry_run"], verbose=ev["control_verbose"])
271271
if ecode != 0:
272-
announce(f"ERROR: Failed while running \"{install_cmd}\" (exit code: {result})")
272+
announce(f"ERROR: Failed while running \"{install_cmd}\" (exit code: {ecode})")
273273
announce(f"✅ kgateway ({ev['gateway_provider_kgateway_chart_version']}) installed")
274274
else :
275275
announce(f"✅ kgateway (unknown version) already installed (*.kgateway.dev CRDs found)")
@@ -299,9 +299,12 @@ def install_istio(
299299
helmfile_path = helm_base_dir / f'helmfile-{ev["current_step"]}.yaml'
300300
with open(helmfile_path, 'w') as f:
301301
f.write(f"""
302+
repositories:
303+
- name: istio
304+
url: {ev["gateway_provider_istio_helm_repository_url"]}
302305
releases:
303306
- name: istio-base
304-
chart: {ev["gateway_provider_istio_helm_repository_url"]}/base
307+
chart: istio/base
305308
version: {ev["gateway_provider_istio_chart_version"]}
306309
namespace: istio-system
307310
installed: true
@@ -310,7 +313,7 @@ def install_istio(
310313
kind: gateway-crds
311314
312315
- name: istiod
313-
chart: {ev["gateway_provider_istio_helm_repository_url"]}/istiod
316+
chart: istio/istiod
314317
version: {ev["gateway_provider_istio_chart_version"]}
315318
namespace: istio-system
316319
installed: true
@@ -320,12 +323,12 @@ def install_istio(
320323
- meshConfig:
321324
defaultConfig:
322325
proxyMetadata:
323-
SUPPORT_GATEWAY_API_INFERENCE_EXTENSION: true
326+
ENABLE_GATEWAY_API_INFERENCE_EXTENSION: true
324327
pilot:
325328
env:
326-
SUPPORT_GATEWAY_API_INFERENCE_EXTENSION: true
329+
ENABLE_GATEWAY_API_INFERENCE_EXTENSION: true
327330
tag: {ev["gateway_provider_istio_chart_version"]}
328-
hub: "gcr.io/istio-testing"
331+
hub: "docker.io/istio"
329332
labels:
330333
type: gateway-provider
331334
kind: gateway-control-plane
@@ -342,7 +345,7 @@ def install_istio(
342345
announce(f"🚀 Installing istio helm charts from {ev['gateway_provider_istio_helm_repository_url']} ({ev['gateway_provider_istio_chart_version']})")
343346
ecode = llmdbench_execute_cmd(actual_cmd=install_cmd, dry_run=ev["control_dry_run"], verbose=ev["control_verbose"])
344347
if ecode != 0:
345-
announce(f"ERROR: Failed while running \"{install_cmd}\" (exit code: {result})")
348+
announce(f"ERROR: Failed while running \"{install_cmd}\" (exit code: {ecode})")
346349
announce(f"✅ istio ({ev['gateway_provider_istio_chart_version']}) installed")
347350
else :
348351
announce(f"✅ isto (unknown version) already installed (*.istio.io CRDs found)")
@@ -392,7 +395,8 @@ def install_gateway_control_plane(
392395
"telemetries.telemetry.istio.io", \
393396
"virtualservices.networking.istio.io", \
394397
"wasmplugins.extensions.istio.io", \
395-
"workloadgroups.networking.istio.io" ] :
398+
"workloadgroups.networking.istio.io", \
399+
"telemetry.istio.io/v1" ] :
396400
if i not in crds :
397401
should_install_gateway_control_plane = True
398402

@@ -470,10 +474,10 @@ def ensure_gateway_provider(
470474
return result
471475

472476
should_install_gateway_api_extension_crds = False
473-
for i in [ "inferenceobjectives.inference.networking.x-k8s.io", \
474-
"inferencepoolimports.inference.networking.x-k8s.io", \
477+
for i in [ "inferenceobjectives.inference.networking.k8s.io", \
478+
"inferencepoolimports.inference.networking.k8s.io", \
475479
"inferencepools.inference.networking.k8s.io", \
476-
"inferencepools.inference.networking.x-k8s.io" ] :
480+
"inferencepools.inference.networking.k8s.io" ] :
477481
if i not in crd_names :
478482
should_install_gateway_api_extension_crds = True
479483

setup/steps/07_deploy_setup.py

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -74,17 +74,17 @@ def auto_detect_version(ev, chart, version_key, repo_key) -> int:
7474
announce(f"📦 Auto-detected chart version: {version}")
7575
return 0
7676
else:
77-
announce(" Unable to parse version from helm search output")
77+
announce("ERROR: Unable to parse version from helm search output")
7878
return 1
7979
else:
80-
announce(" No charts found in helm search output")
80+
announce("ERROR: No charts found in helm search output")
8181
return 1
8282
else:
83-
announce(" Unable to find a version for model service helm chart!")
83+
announce("ERROR: Unable to find a version for model service helm chart!")
8484
return 1
8585

8686
except Exception as e:
87-
announce(f" Error auto-detecting {chart} chart version: {e}")
87+
announce(f"ERROR: Error auto-detecting {chart} chart version: {e}")
8888
return 1
8989
return 0
9090

setup/steps/08_deploy_gaie.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -150,7 +150,7 @@ def main():
150150
inferencePool:
151151
targetPortNumber: {ev['vllm_common_inference_port']}
152152
modelServerType: vllm
153-
apiVersion: "inference.networking.x-k8s.io/v1alpha2"
153+
apiVersion: "inference.networking.k8s.io/v1"
154154
modelServers:
155155
matchLabels:
156156
llm-d.ai/inferenceServing: "true"

setup/steps/09_deploy_via_modelservice.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -393,7 +393,7 @@ def define_httproute(
393393
name: infra-{release}-inference-gateway
394394
rules:
395395
- backendRefs:
396-
- group: inference.networking.x-k8s.io
396+
- group: inference.networking.k8s.io
397397
kind: InferencePool
398398
name: {model_id_label}-gaie
399399
port: {service_port}
@@ -416,7 +416,7 @@ def define_httproute(
416416
if single_model:
417417
manifest = f"""{manifest}
418418
- backendRefs:
419-
- group: inference.networking.x-k8s.io
419+
- group: inference.networking.k8s.io
420420
kind: InferencePool
421421
name: {model_id_label}-gaie
422422
port: {service_port}

0 commit comments

Comments (0)