From 8b82642302b049708c97e029113a85d28899ea70 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?S=C3=A9bastien=20Han?= Date: Fri, 12 Sep 2025 17:10:05 +0200 Subject: [PATCH 1/2] feat: add watsonx inference provider MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit New provider: the env variables WATSONX_API_KEY and WATSONX_PROJECT_ID are expected to be populated to enable the provider. Relates to: RHAIENG-1026 Signed-off-by: Sébastien Han --- distribution/Containerfile | 1 + distribution/build.yaml | 1 + distribution/run.yaml | 6 ++++++ 3 files changed, 8 insertions(+) diff --git a/distribution/Containerfile b/distribution/Containerfile index 70cb42891..ad144e9e7 100644 --- a/distribution/Containerfile +++ b/distribution/Containerfile @@ -15,6 +15,7 @@ RUN pip install \ fastapi \ fire \ httpx \ + ibm_watsonx_ai \ matplotlib \ mcp>=1.8.1 \ nltk \ diff --git a/distribution/build.yaml b/distribution/build.yaml index 188db93bf..304087b03 100644 --- a/distribution/build.yaml +++ b/distribution/build.yaml @@ -6,6 +6,7 @@ distribution_spec: - provider_type: remote::vllm - provider_type: remote::bedrock - provider_type: inline::sentence-transformers + - provider_type: remote::watsonx vector_io: - provider_type: inline::milvus - provider_type: remote::milvus diff --git a/distribution/run.yaml b/distribution/run.yaml index 0d8eee44d..5a27d66f4 100644 --- a/distribution/run.yaml +++ b/distribution/run.yaml @@ -36,6 +36,12 @@ providers: - provider_id: sentence-transformers provider_type: inline::sentence-transformers config: {} + - provider_id: watsonx + provider_type: remote::watsonx + config: + url: ${env.WATSONX_BASE_URL:=https://us-south.ml.cloud.ibm.com} + api_key: ${env.WATSONX_API_KEY:=} + project_id: ${env.WATSONX_PROJECT_ID:=} vector_io: - provider_id: milvus provider_type: inline::milvus From ffce08d1f1ba9195054d8b8dbfc4475ec420021d Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?S=C3=A9bastien=20Han?= Date: Fri, 12 Sep 2025 17:22:21 +0200 Subject: 
[PATCH 2/2] chore: bump trustyai_fms MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Bump llama_stack_provider_trustyai_fms from 0.2.1 to 0.2.2 to fix auth token propagation in the safety provider. Relates to: RHOAIENG-34050 Signed-off-by: Sébastien Han --- distribution/Containerfile | 2 +- distribution/build.yaml | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/distribution/Containerfile b/distribution/Containerfile index ad144e9e7..9ae8598b0 100644 --- a/distribution/Containerfile +++ b/distribution/Containerfile @@ -41,7 +41,7 @@ RUN pip install \ RUN pip install \ llama_stack_provider_lmeval==0.2.4 RUN pip install \ - llama_stack_provider_trustyai_fms==0.2.1 + llama_stack_provider_trustyai_fms==0.2.2 RUN pip install --extra-index-url https://download.pytorch.org/whl/cpu torch torchao>=0.12.0 torchvision RUN pip install --no-deps sentence-transformers RUN pip install --no-cache llama-stack==0.2.21 diff --git a/distribution/build.yaml b/distribution/build.yaml index 304087b03..490b2b60c 100644 --- a/distribution/build.yaml +++ b/distribution/build.yaml @@ -12,7 +12,7 @@ distribution_spec: - provider_type: remote::milvus safety: - provider_type: remote::trustyai_fms - module: llama_stack_provider_trustyai_fms==0.2.1 + module: llama_stack_provider_trustyai_fms==0.2.2 agents: - provider_type: inline::meta-reference eval: