NVIDIA-NeMo
diff --git a/‎docs/_static/css/custom.css‎
Lines changed: 90 additions & 0 deletions b/‎docs/_static/css/custom.css‎
Lines changed: 90 additions & 0 deletions
diff --git a/‎docs/_static/js/table-expander.js‎
Lines changed: 119 additions & 0 deletions b/‎docs/_static/js/table-expander.js‎
Lines changed: 119 additions & 0 deletions
diff --git a/‎docs/about/release-notes.md‎
Lines changed: 26 additions & 0 deletions b/‎docs/about/release-notes.md‎
Lines changed: 26 additions & 0 deletions
diff --git a/‎docs/about/supported-llms.md‎
Lines changed: 48 additions & 36 deletions b/‎docs/about/supported-llms.md‎
Lines changed: 48 additions & 36 deletions
diff --git a/‎docs/conf.py‎
Lines changed: 3 additions & 0 deletions b/‎docs/conf.py‎
Lines changed: 3 additions & 0 deletions
@@ -27,3 +27,93 @@
 .sd-equal-height .sd-card-body {
     flex: 1;
 }
+
+/* Button that opens the table following it in the expanded (modal) view. */
+.table-expand-button {
+    /* Layout: icon and label share one line, separated by a small gap. */
+    display: inline-flex;
+    align-items: center;
+    gap: 0.4rem;
+    margin: 0.25rem 0 0.75rem;
+    padding: 0.45rem 0.75rem;
+    /* Appearance: solid green pill with white, semi-bold text. */
+    background: #76b900;
+    border: 0;
+    border-radius: 4px;
+    color: #fff;
+    cursor: pointer;
+    font-weight: 600;
+}
+
+/* Darker green while hovered or focused. */
+.table-expand-button:focus,
+.table-expand-button:hover {
+    background: #5f9500;
+}
+
+/* Dark focus ring, offset so it does not touch the green fill. */
+.table-expand-button:focus {
+    outline: 2px solid #1a1a1a;
+    outline-offset: 2px;
+}
+
+/* Full-viewport backdrop for the expanded table. Hidden until the script
+   adds the .is-open class. */
+.table-expander-modal {
+    background: rgba(0, 0, 0, 0.65);
+    display: none;
+    inset: 0;
+    padding: 2rem;
+    position: fixed;
+    z-index: 10000;
+}
+
+/* Open state. justify-content centers the dialog horizontally; with the flex
+   default (flex-start) the dialog is pinned to the left edge whenever the
+   viewport is wider than the dialog's 1200px cap. */
+.table-expander-modal.is-open {
+    display: flex;
+    justify-content: center;
+}
+
+/* The dialog panel: a column of header + scrollable body, capped in both
+   dimensions so it never exceeds the viewport. */
+.table-expander-modal__dialog {
+    background: #fff;
+    border-radius: 6px;
+    box-shadow: 0 1rem 3rem rgba(0, 0, 0, 0.35);
+    display: flex;
+    flex-direction: column;
+    max-height: 90vh;
+    width: min(1200px, 96vw);
+}
+
+/* Header row: title on the left, close button on the right. */
+.table-expander-modal__header {
+    display: flex;
+    align-items: center;
+    justify-content: space-between;
+    padding: 1rem 1.25rem;
+    border-bottom: 1px solid #d9d9d9;
+}
+
+/* Dialog title text. */
+.table-expander-modal__title {
+    margin: 0;
+    font-size: 1.2rem;
+    font-weight: 700;
+}
+
+/* Borderless close control in the header. */
+.table-expander-modal__close {
+    padding: 0.1rem 0.35rem;
+    background: transparent;
+    border: 0;
+    cursor: pointer;
+    font-size: 1.8rem;
+    line-height: 1;
+}
+
+/* Scroll container for the cloned table. */
+.table-expander-modal__body {
+    padding: 1rem 1.25rem 1.25rem;
+    overflow: auto;
+}
+
+/* Keep the table at least 1000px wide; the body above scrolls when the
+   dialog is narrower than that. */
+.table-expander-modal__body table {
+    min-width: 1000px;
+    margin: 0;
+}
+
+/* Added to <body> by the script while the modal is open, so the page behind
+   the backdrop does not scroll. */
+body.table-expander-modal-open {
+    overflow: hidden;
+}
+
+/* Narrow viewports: shrink the backdrop padding to give the dialog more room. */
+@media (max-width: 768px) {
+    .table-expander-modal {
+        padding: 0.75rem;
+    }
+}
@@ -0,0 +1,119 @@
+// SPDX-FileCopyrightText: Copyright (c) 2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+// SPDX-License-Identifier: Apache-2.0
+
+(function () {
+    function findNextTable(button) {
+        let current = button.nextElementSibling;
+
+        while (current) {
+            if (current.tagName && current.tagName.toLowerCase() === "table") {
+                return current;
+            }
+
+            const nestedTable = current.querySelector ? current.querySelector("table") : null;
+            if (nestedTable) {
+                return nestedTable;
+            }
+
+            current = current.nextElementSibling;
+        }
+
+        return null;
+    }
+
+    function createModal() {
+        const modal = document.createElement("div");
+        modal.className = "table-expander-modal";
+        modal.setAttribute("role", "dialog");
+        modal.setAttribute("aria-modal", "true");
+        modal.setAttribute("aria-hidden", "true");
+
+        const dialog = document.createElement("div");
+        dialog.className = "table-expander-modal__dialog";
+
+        const header = document.createElement("div");
+        header.className = "table-expander-modal__header";
+
+        const title = document.createElement("p");
+        title.className = "table-expander-modal__title";
+
+        const closeButton = document.createElement("button");
+        closeButton.className = "table-expander-modal__close";
+        closeButton.type = "button";
+        closeButton.setAttribute("aria-label", "Close expanded table");
+        closeButton.textContent = "Close";
+
+        const body = document.createElement("div");
+        body.className = "table-expander-modal__body";
+
+        header.append(title, closeButton);
+        dialog.append(header, body);
+        modal.append(dialog);
+        document.body.append(modal);
+
+        return { body, closeButton, modal, title };
+    }
+
+    function initializeTableExpanders() {
+        const buttons = document.querySelectorAll(".table-expand-button");
+        if (!buttons.length) {
+            return;
+        }
+
+        const modalParts = createModal();
+        let activeButton = null;
+
+        function closeModal() {
+            modalParts.modal.classList.remove("is-open");
+            modalParts.modal.setAttribute("aria-hidden", "true");
+            document.body.classList.remove("table-expander-modal-open");
+            modalParts.body.replaceChildren();
+
+            if (activeButton) {
+                activeButton.focus();
+                activeButton = null;
+            }
+        }
+
+        function openModal(button, table) {
+            const clonedTable = table.cloneNode(true);
+            activeButton = button;
+            modalParts.title.textContent = button.dataset.tableTitle || "Expanded table";
+            modalParts.body.replaceChildren(clonedTable);
+            modalParts.modal.classList.add("is-open");
+            modalParts.modal.setAttribute("aria-hidden", "false");
+            document.body.classList.add("table-expander-modal-open");
+            modalParts.closeButton.focus();
+        }
+
+        buttons.forEach((button) => {
+            const table = findNextTable(button);
+
+            if (!table) {
+                button.hidden = true;
+                return;
+            }
+
+            button.setAttribute("aria-label", "Open table in expanded view");
+            button.addEventListener("click", () => openModal(button, table));
+        });
+
+        modalParts.closeButton.addEventListener("click", closeModal);
+        modalParts.modal.addEventListener("click", (event) => {
+            if (event.target === modalParts.modal) {
+                closeModal();
+            }
+        });
+        document.addEventListener("keydown", (event) => {
+            if (event.key === "Escape" && modalParts.modal.classList.contains("is-open")) {
+                closeModal();
+            }
+        });
+    }
+
+    if (document.readyState === "loading") {
+        document.addEventListener("DOMContentLoaded", initializeTableExpanders);
+    } else {
+        initializeTableExpanders();
+    }
+})();
@@ -25,6 +25,32 @@ For a complete record of changes in a release, refer to the
 
 ---
 
+(v0-22-0)=
+
+## 0.22.0
+
+(v0-22-0-features)=
+
+### Key Features
+
+- LangChain is now optional. `pip install nemoguardrails` no longer pulls
+  LangChain or any provider-specific `langchain-*` packages. The library ships
+  with a built-in client that talks to OpenAI-compatible endpoints directly
+  over `httpx`. Engines whose API isn't OpenAI-compatible (Anthropic, Cohere,
+  Vertex AI, Google Generative AI, in-process Hugging Face, TensorRT-LLM,
+  and others) keep working through LangChain when you opt in with
+  `NEMOGUARDRAILS_LLM_FRAMEWORK=langchain` and install the matching provider
+  package. Most 0.21 configurations keep working unchanged; some configuration
+  shapes need a YAML rewrite. For recipes, refer to [Migrating to 0.22](../migration/0.22.md).
+
+- Public extension points for LLM integration. Two new protocols, `LLMModel`
+  and `LLMFramework` in `nemoguardrails.types`, let you plug in a custom
+  backend or a whole alternative framework without touching internals.
+
+- Public testing surface. The `nemoguardrails.testing` module exposes
+  `FakeLLMModel`, `TestChat`, and pytest fixtures for writing tests against a
+  guardrails configuration without calling a real model.
+
 (v0-21-0)=
 
 ## 0.21.0
 
@@ -2,7 +2,7 @@
 title:
   page: "Supported LLMs"
   nav: "Supported LLMs"
-description: "Connect to NVIDIA NIM, OpenAI, Azure, Anthropic, HuggingFace, and LangChain providers."
+description: "Connect to NVIDIA NIM, OpenAI, Azure, Anthropic, Hugging Face, and LangChain providers."
 keywords: ["llm providers", "nvidia nim", "openai", "langchain", "embedding providers"]
 topics: ["generative_ai", "developer_tools"]
 tags: ["llms", "ai_inference", "pretrained_models", "nlp"]
@@ -22,40 +22,52 @@ Integrating NeMo Guardrails improves safety and security of an Application LLM,
 
 NeMo Guardrails can also call models for a specific guardrail on behalf of the client. Having guardrail-specific models allows the use of smaller fine-tuned models, which are specialized on the guardrails task. For example the NVIDIA Nemoguard collection of models includes [content-safety](https://build.nvidia.com/nvidia/llama-3_1-nemotron-safety-guard-8b-v3), [topic-control](https://build.nvidia.com/nvidia/llama-3_1-nemoguard-8b-topic-control), and [jailbreak-detect](https://build.nvidia.com/nvidia/nemoguard-jailbreak-detect) models. These models can be accessed on [build.nvidia.com](https://build.nvidia.com/) for rapid prototyping, or on [NGC Catalog](https://catalog.ngc.nvidia.com/) for deployment with NIM Docker containers.
 
-## Application LLM Providers
-
-The NeMo Guardrails library supports major LLM providers, including:
-
-- OpenAI
-- Azure OpenAI
-- Anthropic
-- Cohere
-- Google Vertex AI
-
-### Self-Hosted
-
-The NeMo Guardrails library supports the following self-hosted LLM providers:
-
-- HuggingFace Hub
-- HuggingFace Endpoints
-- vLLM
-- Generic
-
-### Providers from LangChain
-
-The NeMo Guardrails library supports LLM providers from the LangChain Community, including both text completion and chat completion providers. Refer to [Chat model integrations](https://docs.langchain.com/oss/python/integrations/chat) in the LangChain documentation. You can also use the [`nemoguardrails find-providers`](find-providers-command) CLI command to discover available providers.
-
-## Embedding Providers
-
-The NeMo Guardrails library supports the following embedding providers:
-
-- NVIDIA NIM
-- NVIDIA AI Endpoints
-- FastEmbed
-- OpenAI
-- Azure OpenAI
-- Cohere
-- SentenceTransformers
-- Google
+## Inference Providers
+
+Each engine is served by a framework that manages the underlying HTTP or SDK calls. NeMo Guardrails ships with a built-in framework that talks to OpenAI-compatible endpoints over `httpx` with no LangChain dependency. For engines whose API is not OpenAI-compatible, opt into the LangChain framework by setting `NEMOGUARDRAILS_LLM_FRAMEWORK=langchain` and installing the matching `langchain-<provider>` package. To add a custom framework, implement the `LLMFramework` protocol from `nemoguardrails.types`.
+
+```{raw} html
+<button type="button" class="table-expand-button" data-table-title="Inference Providers">
+  <span aria-hidden="true" class="table-expand-button__icon">&#x26F6;</span>
+  Expand table
+</button>
+```
+
+| Engine | Framework | Streaming | Tool calls | Reasoning models | Notes |
+| --- | --- | --- | --- | --- | --- |
+| `anthropic` | LangChain (opt-in) | yes | yes | wrapper-dependent | Requires `pip install langchain langchain-anthropic`. |
+| `azure`, `azure_openai` | LangChain (opt-in) | yes | yes | yes | Azure OpenAI is OpenAI-compatible at the wire level. The LangChain path (`langchain-openai`) is the convenient default because it handles the deployment-name URL pattern and `api-version` query string for you. Azure is also reachable through the built-in client by setting `parameters.base_url` to the deployment URL and passing `api-version` via `default_query` and `api-key` via `default_headers`. |
+| `cohere` | LangChain (opt-in) | yes | yes | n/a | Requires `pip install langchain langchain-cohere`. |
+| `google_genai` | LangChain (opt-in) | yes | yes | n/a | Requires `pip install langchain langchain-google-genai`. |
+| `huggingface_endpoint` | LangChain (opt-in) | varies | varies | varies | Default text-generation schema. If your endpoint exposes `/v1/chat/completions`, prefer `engine: openai` with `parameters.base_url` instead. |
+| `huggingface_pipeline`, `huggingface_hub`, `trt_llm`, `self_hosted` | LangChain (opt-in) | varies | varies | varies | In-process pipelines and LangChain wrappers without a native HTTP path. |
+| `nim` | Built-in | yes | yes | yes | Default base URL `https://integrate.api.nvidia.com/v1`. |
+| `nvidia_ai_endpoints` | Built-in | yes | yes | yes | Alias for `nim`. |
+| `ollama` | Built-in | yes | yes | yes (where supported) | Default base URL `http://localhost:11434/v1`. |
+| `openai` | Built-in | yes | yes | yes | OpenAI public API or any OpenAI-compatible endpoint using `parameters.base_url`. For vLLM, TGI, OpenRouter, Together.ai, Fireworks.ai, Groq, DeepSeek, llama.cpp, NVIDIA Nemotron, and similar providers, use `engine: openai` with `parameters.base_url` and `parameters.api_key`. |
+| `vertexai` | LangChain (opt-in) | yes | yes | n/a | Requires `pip install langchain langchain-google-vertexai`. |
+| `vllm_openai`, `deepseek` | LangChain (opt-in) | yes | yes | yes | Legacy LangChain provider engines. They continue to work when you opt into LangChain. For new configurations, use `engine: openai` with `parameters.base_url` when the wire protocol is OpenAI-compatible. |
+| `<provider_name>` | LangChain (opt-in) | varies | varies | varies | Any community provider exposed through LangChain's chat-model integrations. Use the bare provider name as the engine name. |
+
+For migration recipes between the built-in path and the LangChain path, refer to [Migrating to 0.22](../migration/0.22.md).
+
+## LangChain-Backed Providers
+
+The NeMo Guardrails library supports LLM providers from the LangChain Community, including both text completion and chat completion providers. Refer to [Chat model integrations](https://python.langchain.com/docs/integrations/chat/) in the LangChain documentation. You can also use the [`nemoguardrails find-providers`](find-providers-command) CLI command to discover available providers.
+
+## Embedding Model Providers
+
+The NeMo Guardrails library uses embedding models for vector similarity search in dialog rails, `embeddings_only` intent matching, and knowledge base retrieval. The following table lists the supported embedding model providers and their corresponding engine names.
+
+| Provider | Engine | Notes |
+| --- | --- | --- |
+| NVIDIA NIM | `nim` | NVIDIA NIM microservices |
+| NVIDIA AI Endpoints | `nvidia_ai_endpoints` | Alias for `nim` |
+| FastEmbed | `fastembed` | FastEmbed embedding model provider |
+| OpenAI | `openai` | OpenAI embedding model provider |
+| Azure OpenAI | `azure` | Azure OpenAI embedding model provider |
+| Cohere | `cohere` | Cohere embedding model provider |
+| SentenceTransformers | `sentence_transformers` | SentenceTransformers embedding model provider |
+| Google | `google` | Google embedding model provider |
 
 For more information on configuring embedding providers, refer to [Embedding Search Providers](../configure-rails/other-configurations/embedding-search-providers.md).
@@ -258,6 +258,9 @@
 html_copy_source = False
 html_show_sourcelink = False
 html_show_sphinx = False
+html_static_path = ["_static"]  # directory holding the custom static assets
+html_css_files = ["css/custom.css"]  # stylesheet path, relative to the static directory
+html_js_files = ["js/table-expander.js"]  # script path, relative to the static directory
 
 html_domain_indices = False
 html_use_index = False