diff --git a/.env.example b/.env.example index 57dad4963f..fb0a62a3d0 100644 --- a/.env.example +++ b/.env.example @@ -211,6 +211,50 @@ OTEL_EXPORTER_OTLP_ENDPOINT=http://localhost:4317 # MCP_SESSION_POOL_ENABLED=false # ANYIO_CANCEL_DELIVERY_PATCH_ENABLED=false +# Rust MCP (simple) +# RUST_MCP_BUILD=false # build the Rust MCP runtime into Containerfile.lite images +# RUST_MCP_MODE=off # off | shadow | edge | full +# RUST_MCP_LOG=warn # default Rust sidecar log filter for the simple mode flow +# +# RUST_MCP_MODE=shadow -> Rust sidecar enabled, but public /mcp stays on Python for safe fallback +# RUST_MCP_MODE=edge -> direct public /mcp on Rust with managed UDS sidecar defaults +# RUST_MCP_MODE=full -> edge + Rust session/event-store/resume/live-stream/affinity cores +# +# Advanced Rust MCP overrides +# RUST_MCP_SESSION_AUTH_REUSE=false # advanced override for the fast direct public Rust session-auth path; prefer RUST_MCP_MODE presets above +# EXPERIMENTAL_RUST_MCP_RUNTIME_ENABLED= +# EXPERIMENTAL_RUST_MCP_RUNTIME_URL=http://127.0.0.1:8787 +# EXPERIMENTAL_RUST_MCP_RUNTIME_UDS=/tmp/contextforge-mcp-rust.sock +# EXPERIMENTAL_RUST_MCP_RUNTIME_TIMEOUT_SECONDS=30 +# EXPERIMENTAL_RUST_MCP_SESSION_CORE_ENABLED= # enable Rust-owned MCP session metadata/lifecycle increment +# EXPERIMENTAL_RUST_MCP_EVENT_STORE_ENABLED= # enable Rust-owned resumable event-store backend +# EXPERIMENTAL_RUST_MCP_RESUME_CORE_ENABLED= # enable Rust-owned public GET /mcp replay/resume path +# EXPERIMENTAL_RUST_MCP_LIVE_STREAM_CORE_ENABLED= # enable Rust-owned public GET /mcp live SSE path +# EXPERIMENTAL_RUST_MCP_AFFINITY_CORE_ENABLED= # enable Rust-owned session-affinity forwarding path +# EXPERIMENTAL_RUST_MCP_SESSION_AUTH_REUSE_ENABLED= # enable Rust-owned session-bound auth-context reuse +# EXPERIMENTAL_RUST_MCP_RUNTIME_MANAGED= # launcher env, not a Pydantic setting +# ENABLE_RUST_MCP_RMCP_BUILD= # container build arg override for rmcp-enabled Rust MCP binary +# 
MCP_RUST_USE_RMCP_UPSTREAM_CLIENT= # runtime override for official rust-sdk upstream tools/call client +# MCP_RUST_LISTEN_HTTP=127.0.0.1:8787 # runtime env for bundled Rust sidecar +# MCP_RUST_LISTEN_UDS=/tmp/contextforge-mcp-rust.sock +# MCP_RUST_SESSION_CORE_ENABLED= # explicit sidecar env; defaults from EXPERIMENTAL_RUST_MCP_SESSION_CORE_ENABLED +# MCP_RUST_SESSION_TTL_SECONDS=3600 +# MCP_RUST_EVENT_STORE_ENABLED= # explicit sidecar env; defaults from EXPERIMENTAL_RUST_MCP_EVENT_STORE_ENABLED +# MCP_RUST_RESUME_CORE_ENABLED= # explicit sidecar env; defaults from EXPERIMENTAL_RUST_MCP_RESUME_CORE_ENABLED +# MCP_RUST_LIVE_STREAM_CORE_ENABLED= # explicit sidecar env; defaults from EXPERIMENTAL_RUST_MCP_LIVE_STREAM_CORE_ENABLED +# MCP_RUST_AFFINITY_CORE_ENABLED= # explicit sidecar env; defaults from EXPERIMENTAL_RUST_MCP_AFFINITY_CORE_ENABLED +# MCP_RUST_SESSION_AUTH_REUSE_ENABLED= # explicit sidecar env; defaults from EXPERIMENTAL_RUST_MCP_SESSION_AUTH_REUSE_ENABLED +# MCP_RUST_SESSION_AUTH_REUSE_TTL_SECONDS=30 +# MCP_RUST_EVENT_STORE_MAX_EVENTS_PER_STREAM=100 +# MCP_RUST_EVENT_STORE_TTL_SECONDS=3600 +# MCP_RUST_EVENT_STORE_POLL_INTERVAL_MS=250 +# MCP_RUST_LOG= # advanced runtime log override for the bundled Rust sidecar +# MCP_RUST_BACKEND_RPC_URL=http://127.0.0.1:4444/_internal/mcp/rpc +# MCP_RUST_REDIS_URL=redis://redis:6379/0 +# MCP_RUST_CACHE_PREFIX=mcpgw: +# MCP_RUST_DATABASE_URL=postgresql://postgres:mysecretpassword@pgbouncer:6432/mcp +# MCP_RUST_DB_POOL_MAX_SIZE=20 + # ============================================================================= # Performance Tuning (quick reference) # ============================================================================= @@ -1773,16 +1817,20 @@ OTEL_EXPORTER_OTLP_ENDPOINT=http://localhost:4317 # ============================================================================= # Caches authentication data (user, team, revocation) to reduce database queries # Uses Redis when available, falls back to in-memory cache +# 
Applies to both Python MCP and Rust MCP because public MCP auth still runs in Python first # Enable Redis/in-memory caching for authentication data (default: true) # Significantly reduces database queries during authentication +# Disabling this also disables the shared auth cache benefit for RUST_MCP_MODE=edge/full # AUTH_CACHE_ENABLED=true # TTL in seconds for cached user data (default: 60, range: 10-300) +# Also affects MCP Streamable HTTP auth, including Rust-fronted MCP requests # AUTH_CACHE_USER_TTL=60 # TTL in seconds for token revocation cache (default: 30, range: 5-120) # Security-critical: keep short to limit exposure window for revoked tokens +# Also affects MCP auth on both Python and Rust runtime modes # AUTH_CACHE_REVOCATION_TTL=30 # TTL in seconds for team membership cache (default: 60, range: 10-300) @@ -1794,6 +1842,7 @@ OTEL_EXPORTER_OTLP_ENDPOINT=http://localhost:4317 # Enable caching for get_user_teams() (default: true) # Set to false to disable teams list caching (useful for debugging) +# Also affects session-token MCP auth on Python and Rust modes # AUTH_CACHE_TEAMS_ENABLED=true # TTL in seconds for user teams list cache (default: 60, range: 10-300) @@ -1802,6 +1851,7 @@ OTEL_EXPORTER_OTLP_ENDPOINT=http://localhost:4317 # Batch auth DB queries into single call (default: true) # Reduces 3 separate queries to 1, improving performance under load +# Streamable HTTP MCP auth uses this too before falling back to per-query checks # AUTH_CACHE_BATCH_QUERIES=true # Registry Cache Configuration diff --git a/.gitignore b/.gitignore index 434720af3d..8c2e75f5ff 100644 --- a/.gitignore +++ b/.gitignore @@ -298,6 +298,7 @@ TODO.md FIXMEs # Upgrade validation outputs +artifacts/ artifacts/upgrade-validation*/ # Debug & profiling artifacts @@ -354,6 +355,12 @@ docs/docs/test/license-check-report.json nginx.conf docker-compose.perf.yml +# Rust MCP runtime profiling artifacts +tools_rust/mcp_runtime/profiles/ +tools_rust/mcp_runtime/flamegraph*.svg 
+tools_rust/mcp_runtime/flamegraph*.html +tools_rust/mcp_runtime/perf.data* + # JMeter test results and local installation tests/jmeter/results/*.jtl tests/jmeter/results/*/ diff --git a/Containerfile.lite b/Containerfile.lite index f7270a963e..9b5dfc39d8 100644 --- a/Containerfile.lite +++ b/Containerfile.lite @@ -20,6 +20,7 @@ # Python major.minor series to track ARG PYTHON_VERSION=3.12 ARG ENABLE_RUST=false +ARG ENABLE_RUST_MCP_RMCP=false # Enable profiling tools (memray, py-spy) - off by default for smaller images # To enable: docker build --build-arg ENABLE_PROFILING=true -f Containerfile.lite . # Usage after enabling: @@ -36,6 +37,7 @@ ARG ENABLE_PROFILING=false ############################################################################### FROM quay.io/pypa/manylinux2014:2026.03.06-3 AS rust-builder-base ARG ENABLE_RUST +ARG ENABLE_RUST_MCP_RMCP # Set shell with pipefail for safety SHELL ["/bin/bash", "-o", "pipefail", "-c"] @@ -43,7 +45,11 @@ SHELL ["/bin/bash", "-o", "pipefail", "-c"] # Only build if ENABLE_RUST=true RUN if [ "$ENABLE_RUST" != "true" ]; then \ echo "⏭️ Rust builds disabled (set --build-arg ENABLE_RUST=true to enable)"; \ - mkdir -p /build/rust-wheels; \ + mkdir -p /build/rust-wheels /build/tools_rust/mcp_runtime/target/release; \ + printf '#!/usr/bin/env sh\n' > /build/tools_rust/mcp_runtime/target/release/contextforge-mcp-runtime; \ + printf 'echo "Rust MCP runtime not built into this image. Rebuild with --build-arg ENABLE_RUST=true." 
>&2\n' >> /build/tools_rust/mcp_runtime/target/release/contextforge-mcp-runtime; \ + printf 'exit 1\n' >> /build/tools_rust/mcp_runtime/target/release/contextforge-mcp-runtime; \ + chmod +x /build/tools_rust/mcp_runtime/target/release/contextforge-mcp-runtime; \ exit 0; \ fi @@ -55,8 +61,9 @@ ENV PATH="/root/.cargo/bin:$PATH" WORKDIR /build -# Copy only Rust plugin files (only if ENABLE_RUST=true) +# Copy only Rust plugin/runtime files (only if ENABLE_RUST=true) COPY plugins_rust/ /build/plugins_rust/ +COPY tools_rust/mcp_runtime/ /build/tools_rust/mcp_runtime/ # Build each Rust plugin independently using Python 3.12 from manylinux image RUN if [ "$ENABLE_RUST" = "true" ]; then \ @@ -74,6 +81,21 @@ RUN if [ "$ENABLE_RUST" = "true" ]; then \ echo "⏭️ Skipping Rust plugin build"; \ fi +WORKDIR /build/tools_rust/mcp_runtime + +# Build the experimental Rust MCP runtime binary (only if ENABLE_RUST=true) +RUN if [ "$ENABLE_RUST" = "true" ]; then \ + if [ "$ENABLE_RUST_MCP_RMCP" = "true" ]; then \ + cargo build --release --features rmcp-upstream-client; \ + else \ + cargo build --release; \ + fi && \ + cp target/release/contextforge_mcp_runtime target/release/contextforge-mcp-runtime && \ + echo "✅ Rust MCP runtime built successfully"; \ + else \ + echo "⏭️ Skipping Rust MCP runtime build"; \ + fi + FROM rust-builder-base AS rust-builder ########################### @@ -127,6 +149,7 @@ COPY pyproject.toml /app/ # Copy Rust plugin wheels from rust-builder stage (if any exist) # ---------------------------------------------------------------------------- COPY --from=rust-builder /build/rust-wheels/ /tmp/rust-wheels/ +COPY --from=rust-builder /build/tools_rust/mcp_runtime/target/release/contextforge-mcp-runtime /app/bin/contextforge-mcp-runtime # ---------------------------------------------------------------------------- # Create and populate virtual environment @@ -139,6 +162,7 @@ COPY --from=rust-builder /build/rust-wheels/ /tmp/rust-wheels/ # - Remove build caches and 
build artifacts # ---------------------------------------------------------------------------- ARG ENABLE_RUST=false +ARG ENABLE_RUST_MCP_RMCP=false ARG ENABLE_PROFILING=false RUN set -euo pipefail \ && . /etc/profile.d/use-openssl.sh \ @@ -219,6 +243,8 @@ RUN chown -R 1001:0 /app \ FROM registry.access.redhat.com/ubi10/ubi-minimal:10.1-1772441549 AS runtime ARG PYTHON_VERSION=3.12 +ARG ENABLE_RUST=false +ARG ENABLE_RUST_MCP_RMCP=false ARG ENABLE_PROFILING=false # ---------------------------------------------------------------------------- @@ -285,6 +311,8 @@ COPY --from=builder --chown=1001:0 /app /app # - Disable pip version check to reduce startup time # ---------------------------------------------------------------------------- ENV PATH="/app/.venv/bin:${PATH}" \ + CONTEXTFORGE_ENABLE_RUST_BUILD=${ENABLE_RUST} \ + CONTEXTFORGE_ENABLE_RUST_MCP_RMCP_BUILD=${ENABLE_RUST_MCP_RMCP} \ PYTHONDONTWRITEBYTECODE=1 \ PYTHONUNBUFFERED=1 \ PYTHONHASHSEED=random \ diff --git a/Makefile b/Makefile index d46436d5a3..9f80881ee7 100644 --- a/Makefile +++ b/Makefile @@ -19,6 +19,10 @@ SHELL := /bin/bash # Rust build configuration (set to 1 to enable Rust builds, 0 to disable) # Default is disabled to avoid requiring Rust toolchain for standard builds ENABLE_RUST_BUILD ?= 0 +ENABLE_RUST_MCP_RMCP_BUILD ?= +RUST_MCP_BUILD ?= 0 +RUST_MCP_MODE ?= off +RUST_MCP_LOG ?= warn # Project variables PROJECT_NAME = mcpgateway @@ -646,13 +650,14 @@ clean: # help: query-log-analyze - Analyze query log for N+1 patterns and slow queries # help: query-log-clear - Clear database query log files -.PHONY: smoketest test-mcp-cli test-mcp-rbac test test-verbose test-profile coverage test-docs pytest-examples test-curl htmlcov doctest doctest-verbose doctest-coverage doctest-check test-db-perf test-db-perf-verbose 2025-11-25 2025-11-25-core 2025-11-25-tasks 2025-11-25-auth 2025-11-25-report dev-query-log query-log-tail query-log-analyze query-log-clear load-test load-test-ui load-test-light 
load-test-heavy load-test-sustained load-test-stress load-test-report load-test-compose load-test-timeserver load-test-fasttime load-test-1000 load-test-summary load-test-baseline load-test-baseline-ui load-test-baseline-stress load-test-agentgateway-mcp-server-time +.PHONY: smoketest test-mcp-cli test-mcp-rbac test-mcp-plugin-parity test-mcp-access-matrix test-mcp-session-isolation test-mcp-session-isolation-load test test-verbose test-profile coverage test-docs pytest-examples test-curl htmlcov doctest doctest-verbose doctest-coverage doctest-check test-db-perf test-db-perf-verbose 2025-11-25 2025-11-25-core 2025-11-25-tasks 2025-11-25-auth 2025-11-25-report dev-query-log query-log-tail query-log-analyze query-log-clear load-test load-test-ui load-test-light load-test-heavy load-test-sustained load-test-stress load-test-report load-test-compose load-test-timeserver load-test-fasttime load-test-1000 load-test-summary load-test-baseline load-test-baseline-ui load-test-baseline-stress load-test-agentgateway-mcp-server-time # Dirs/files always excluded from standard pytest runs PYTEST_IGNORE := tests/fuzz tests/manual test.py \ tests/e2e/test_entra_id_integration.py \ tests/e2e/test_mcp_cli_protocol.py \ - tests/e2e/test_mcp_rbac_transport.py + tests/e2e/test_mcp_rbac_transport.py \ + tests/e2e_rust # Expand to --ignore= flags for pytest CLI PYTEST_IGNORE_FLAGS := $(foreach p,$(PYTEST_IGNORE),--ignore=$(p)) @@ -683,6 +688,51 @@ test-mcp-rbac: ## RBAC + multi-transport MCP protocol tests (needs live gateway || { echo "❌ MCP RBAC transport tests failed!"; exit 1; }; \ echo "✅ MCP RBAC transport tests passed!"' +test-mcp-access-matrix: ## Detailed Rust MCP role/access matrix test with strong tool/resource/prompt sentinels + @echo "🧪 Running MCP role/access matrix tests against $${MCP_CLI_BASE_URL:-http://localhost:8080}..." 
+ @echo " Requires: docker-compose stack rebuilt in Rust edge/full mode" + @/bin/bash -c 'source $(VENV_DIR)/bin/activate && \ + uv run --active pytest tests/e2e_rust/test_mcp_access_matrix.py -v -s --tb=short \ + || { echo "❌ MCP role/access matrix tests failed!"; exit 1; }; \ + echo "✅ MCP role/access matrix tests passed!"' + +test-mcp-plugin-parity: ## MCP plugin parity E2E for current Python or Rust stack using a test-specific plugin config + @echo "🧪 Running MCP plugin parity tests against $${MCP_CLI_BASE_URL:-http://localhost:8080}..." + @echo " Requires: stack started with PLUGINS_CONFIG_FILE=plugins/plugin_parity_config.yaml" + @/bin/bash -c 'source $(VENV_DIR)/bin/activate && \ + uv run --active pytest tests/e2e/test_mcp_plugin_parity.py -v -s --tb=short \ + || { echo "❌ MCP plugin parity tests failed!"; exit 1; }; \ + echo "✅ MCP plugin parity tests passed!"' + +test-mcp-session-isolation: ## MCP session/auth isolation tests for the Rust public transport path + @echo "🧪 Running MCP session/auth isolation tests against $${MCP_CLI_BASE_URL:-http://localhost:8080}..." + @echo " Requires: docker-compose stack rebuilt in Rust edge/full mode" + @/bin/bash -c 'source $(VENV_DIR)/bin/activate && \ + uv run --active pytest tests/e2e_rust/test_mcp_session_isolation.py -v -s --tb=short \ + || { echo "❌ MCP session/auth isolation tests failed!"; exit 1; }; \ + echo "✅ MCP session/auth isolation tests passed!"' + +MCP_ISOLATION_LOCUSTFILE ?= tests/loadtest/locustfile_mcp_isolation.py +MCP_ISOLATION_LOAD_HOST ?= http://localhost:8080 +MCP_ISOLATION_LOAD_USERS ?= 12 +MCP_ISOLATION_LOAD_SPAWN_RATE ?= 3 +MCP_ISOLATION_LOAD_RUN_TIME ?= 60s + +test-mcp-session-isolation-load: ## Multi-user MCP session/auth isolation correctness load test + @echo "🧪 Running MCP session/auth isolation load test against $(MCP_ISOLATION_LOAD_HOST)..." 
+ @echo " Requires: docker-compose stack rebuilt in Rust full mode" + @test -d "$(VENV_DIR)" || $(MAKE) venv + @/bin/bash -eu -o pipefail -c 'source $(VENV_DIR)/bin/activate && \ + locust -f $(MCP_ISOLATION_LOCUSTFILE) \ + --host=$(MCP_ISOLATION_LOAD_HOST) \ + --users=$(MCP_ISOLATION_LOAD_USERS) \ + --spawn-rate=$(MCP_ISOLATION_LOAD_SPAWN_RATE) \ + --run-time=$(MCP_ISOLATION_LOAD_RUN_TIME) \ + --headless \ + --stop-timeout=30 \ + --exit-code-on-error=1 \ + --only-summary' + test: @echo "🧪 Running tests..." @test -d "$(VENV_DIR)" || $(MAKE) venv @@ -1289,6 +1339,39 @@ testing-up: ## Start testing stack (Locust + A2A @echo " Next:" @echo " • Open Locust: http://localhost:8089 (default host is http://nginx:80)" +.PHONY: testing-up-rust +testing-up-rust: ## Start testing stack with RUST_MCP_MODE=edge + @RUST_MCP_MODE=edge RUST_MCP_LOG=$(RUST_MCP_LOG) $(MAKE) testing-up + +.PHONY: testing-up-rust-shadow +testing-up-rust-shadow: ## Start testing stack with RUST_MCP_MODE=shadow + @RUST_MCP_MODE=shadow RUST_MCP_LOG=$(RUST_MCP_LOG) $(MAKE) testing-up + +.PHONY: testing-up-rust-full +testing-up-rust-full: ## Start testing stack with RUST_MCP_MODE=full + @RUST_MCP_MODE=full RUST_MCP_LOG=$(RUST_MCP_LOG) $(MAKE) testing-up + +.PHONY: testing-rebuild-rust +testing-rebuild-rust: ## Rebuild Rust image with no cache, then start testing stack in edge mode + @$(MAKE) testing-down + @$(MAKE) compose-clean + @$(MAKE) docker-prod-rust-no-cache + @RUST_MCP_MODE=edge RUST_MCP_LOG=$(RUST_MCP_LOG) $(MAKE) testing-up + +.PHONY: testing-rebuild-rust-shadow +testing-rebuild-rust-shadow: ## Rebuild Rust image with no cache, then start testing stack in shadow mode + @$(MAKE) testing-down + @$(MAKE) compose-clean + @$(MAKE) docker-prod-rust-no-cache + @RUST_MCP_MODE=shadow RUST_MCP_LOG=$(RUST_MCP_LOG) $(MAKE) testing-up + +.PHONY: testing-rebuild-rust-full +testing-rebuild-rust-full: ## Rebuild Rust image with no cache, then start testing stack in full mode + @$(MAKE) testing-down + @$(MAKE) 
compose-clean + @$(MAKE) docker-prod-rust-no-cache + @RUST_MCP_MODE=full RUST_MCP_LOG=$(RUST_MCP_LOG) $(MAKE) testing-up + .PHONY: testing-down testing-down: ## Stop testing stack @echo "🧪 Stopping testing stack..." @@ -2238,6 +2321,19 @@ load-test-agentgateway-mcp-server-time: ## Load test external MCP server (loc MCP_PROTOCOL_LOCUSTFILE ?= tests/loadtest/locustfile_mcp_protocol.py MCP_PROTOCOL_HOST ?= http://localhost:4444 +MCP_BENCHMARK_HOST ?= http://localhost:8080 +MCP_BENCHMARK_SERVER_ID ?= 9779b6698cbd4b4995ee04a4fab38737 +MCP_BENCHMARK_USERS ?= 125 +MCP_BENCHMARK_SPAWN_RATE ?= 30 +MCP_BENCHMARK_RUN_TIME ?= 60s +MCP_BENCHMARK_HIGH_USERS ?= 300 +MCP_BENCHMARK_HIGH_SPAWN_RATE ?= 50 +MCP_BENCHMARK_HIGH_RUN_TIME ?= 60s +MCP_BENCHMARK_WORKERS ?= 4 +MCP_BENCHMARK_MIXED_MASTER_PORT ?= 5567 +MCP_BENCHMARK_TOOLS_MASTER_PORT ?= 5569 +MCP_BENCHMARK_LOCUST_LOG_LEVEL ?= ERROR +MCP_BENCHMARK_WORKER_LOG_DIR ?= reports/mcp_benchmark_workers load-test-mcp-protocol: ## MCP Streamable HTTP protocol test (150 users, 2min) @echo "🔬 Running MCP STREAMABLE HTTP protocol load test..." @@ -2274,6 +2370,119 @@ load-test-mcp-protocol-ui: ## MCP Streamable HTTP protocol test --run-time=120s \ --class-picker' +# help: benchmark-mcp-mixed - Quick mixed MCP benchmark against the testing stack +# help: benchmark-mcp-tools - Quick tools-only MCP benchmark against the testing stack +# help: benchmark-mcp-mixed-300 - Distributed 300-user mixed MCP benchmark +# help: benchmark-mcp-tools-300 - Distributed 300-user tools-only MCP benchmark + +.PHONY: benchmark-mcp-mixed +benchmark-mcp-mixed: ## Quick mixed MCP benchmark against the testing stack + @echo "📊 Running mixed MCP benchmark..." 
+ @echo " Host: $(MCP_BENCHMARK_HOST)" + @echo " Server: $(MCP_BENCHMARK_SERVER_ID)" + @echo " Users: $(MCP_BENCHMARK_USERS), Spawn: $(MCP_BENCHMARK_SPAWN_RATE)/s, Duration: $(MCP_BENCHMARK_RUN_TIME)" + @test -d "$(VENV_DIR)" || $(MAKE) venv + @/bin/bash -eu -o pipefail -c 'source $(VENV_DIR)/bin/activate && \ + LOCUST_LOG_LEVEL=$(MCP_BENCHMARK_LOCUST_LOG_LEVEL) MCP_SERVER_ID=$(MCP_BENCHMARK_SERVER_ID) \ + locust -f $(MCP_PROTOCOL_LOCUSTFILE) \ + --host=$(MCP_BENCHMARK_HOST) \ + --users=$(MCP_BENCHMARK_USERS) \ + --spawn-rate=$(MCP_BENCHMARK_SPAWN_RATE) \ + --run-time=$(MCP_BENCHMARK_RUN_TIME) \ + --headless \ + --only-summary' + +.PHONY: benchmark-mcp-tools +benchmark-mcp-tools: ## Quick tools-only MCP benchmark against the testing stack + @echo "📊 Running tools-only MCP benchmark..." + @echo " Host: $(MCP_BENCHMARK_HOST)" + @echo " Server: $(MCP_BENCHMARK_SERVER_ID)" + @echo " Users: $(MCP_BENCHMARK_USERS), Spawn: $(MCP_BENCHMARK_SPAWN_RATE)/s, Duration: $(MCP_BENCHMARK_RUN_TIME)" + @test -d "$(VENV_DIR)" || $(MAKE) venv + @/bin/bash -eu -o pipefail -c 'source $(VENV_DIR)/bin/activate && \ + LOCUST_LOG_LEVEL=$(MCP_BENCHMARK_LOCUST_LOG_LEVEL) MCP_SERVER_ID=$(MCP_BENCHMARK_SERVER_ID) \ + locust -f $(MCP_PROTOCOL_LOCUSTFILE) \ + --host=$(MCP_BENCHMARK_HOST) \ + --users=$(MCP_BENCHMARK_USERS) \ + --spawn-rate=$(MCP_BENCHMARK_SPAWN_RATE) \ + --run-time=$(MCP_BENCHMARK_RUN_TIME) \ + --headless \ + --only-summary \ + MCPToolCallerUser' + +.PHONY: benchmark-mcp-mixed-300 +benchmark-mcp-mixed-300: ## Distributed 300-user mixed MCP benchmark + @echo "📊 Running distributed mixed MCP benchmark..." 
+ @echo " Host: $(MCP_BENCHMARK_HOST)" + @echo " Server: $(MCP_BENCHMARK_SERVER_ID)" + @echo " Users: $(MCP_BENCHMARK_HIGH_USERS), Spawn: $(MCP_BENCHMARK_HIGH_SPAWN_RATE)/s, Duration: $(MCP_BENCHMARK_HIGH_RUN_TIME), Workers: $(MCP_BENCHMARK_WORKERS)" + @test -d "$(VENV_DIR)" || $(MAKE) venv + @mkdir -p $(MCP_BENCHMARK_WORKER_LOG_DIR) + @/bin/bash -eu -o pipefail -c 'source $(VENV_DIR)/bin/activate; \ + pids=""; \ + cleanup() { \ + for pid in $$pids; do kill $$pid 2>/dev/null || true; done; \ + wait $$pids 2>/dev/null || true; \ + }; \ + trap cleanup EXIT INT TERM; \ + for i in $$(seq 1 $(MCP_BENCHMARK_WORKERS)); do \ + LOCUST_LOG_LEVEL=$(MCP_BENCHMARK_LOCUST_LOG_LEVEL) MCP_SERVER_ID=$(MCP_BENCHMARK_SERVER_ID) \ + locust -f $(MCP_PROTOCOL_LOCUSTFILE) \ + --worker \ + --master-host=127.0.0.1 \ + --master-port=$(MCP_BENCHMARK_MIXED_MASTER_PORT) \ + > $(MCP_BENCHMARK_WORKER_LOG_DIR)/mixed_worker_$$i.log 2>&1 & \ + pids="$$pids $$!"; \ + done; \ + LOCUST_LOG_LEVEL=$(MCP_BENCHMARK_LOCUST_LOG_LEVEL) MCP_SERVER_ID=$(MCP_BENCHMARK_SERVER_ID) \ + locust -f $(MCP_PROTOCOL_LOCUSTFILE) \ + --host=$(MCP_BENCHMARK_HOST) \ + --master \ + --headless \ + --expect-workers=$(MCP_BENCHMARK_WORKERS) \ + --master-bind-port=$(MCP_BENCHMARK_MIXED_MASTER_PORT) \ + --users=$(MCP_BENCHMARK_HIGH_USERS) \ + --spawn-rate=$(MCP_BENCHMARK_HIGH_SPAWN_RATE) \ + --run-time=$(MCP_BENCHMARK_HIGH_RUN_TIME) \ + --only-summary' + +.PHONY: benchmark-mcp-tools-300 +benchmark-mcp-tools-300: ## Distributed 300-user tools-only MCP benchmark + @echo "📊 Running distributed tools-only MCP benchmark..." 
+ @echo " Host: $(MCP_BENCHMARK_HOST)" + @echo " Server: $(MCP_BENCHMARK_SERVER_ID)" + @echo " Users: $(MCP_BENCHMARK_HIGH_USERS), Spawn: $(MCP_BENCHMARK_HIGH_SPAWN_RATE)/s, Duration: $(MCP_BENCHMARK_HIGH_RUN_TIME), Workers: $(MCP_BENCHMARK_WORKERS)" + @test -d "$(VENV_DIR)" || $(MAKE) venv + @mkdir -p $(MCP_BENCHMARK_WORKER_LOG_DIR) + @/bin/bash -eu -o pipefail -c 'source $(VENV_DIR)/bin/activate; \ + pids=""; \ + cleanup() { \ + for pid in $$pids; do kill $$pid 2>/dev/null || true; done; \ + wait $$pids 2>/dev/null || true; \ + }; \ + trap cleanup EXIT INT TERM; \ + for i in $$(seq 1 $(MCP_BENCHMARK_WORKERS)); do \ + LOCUST_LOG_LEVEL=$(MCP_BENCHMARK_LOCUST_LOG_LEVEL) MCP_SERVER_ID=$(MCP_BENCHMARK_SERVER_ID) \ + locust -f $(MCP_PROTOCOL_LOCUSTFILE) \ + --worker \ + --master-host=127.0.0.1 \ + --master-port=$(MCP_BENCHMARK_TOOLS_MASTER_PORT) \ + > $(MCP_BENCHMARK_WORKER_LOG_DIR)/tools_worker_$$i.log 2>&1 & \ + pids="$$pids $$!"; \ + done; \ + LOCUST_LOG_LEVEL=$(MCP_BENCHMARK_LOCUST_LOG_LEVEL) MCP_SERVER_ID=$(MCP_BENCHMARK_SERVER_ID) \ + locust -f $(MCP_PROTOCOL_LOCUSTFILE) \ + --host=$(MCP_BENCHMARK_HOST) \ + --master \ + --headless \ + --expect-workers=$(MCP_BENCHMARK_WORKERS) \ + --master-bind-port=$(MCP_BENCHMARK_TOOLS_MASTER_PORT) \ + --users=$(MCP_BENCHMARK_HIGH_USERS) \ + --spawn-rate=$(MCP_BENCHMARK_HIGH_SPAWN_RATE) \ + --run-time=$(MCP_BENCHMARK_HIGH_RUN_TIME) \ + --only-summary \ + MCPToolCallerUser' + load-test-mcp-protocol-heavy: ## MCP Streamable HTTP protocol heavy test (500 users, 5min) @echo "🔬 Running MCP STREAMABLE HTTP protocol HEAVY load test..." @echo " Host: $(MCP_PROTOCOL_HOST)" @@ -4605,13 +4814,26 @@ PLATFORM ?= linux/$(shell uname -m | sed 's/x86_64/amd64/;s/aarch64/arm64/') container-build: @echo "🔨 Building with $(CONTAINER_RUNTIME) for platform $(PLATFORM)..." 
- @RUST_ARG=""; PROFILING_ARG=""; \ - if [ "$(ENABLE_RUST_BUILD)" = "1" ]; then \ + @RUST_BUILD_VALUE="$(ENABLE_RUST_BUILD)"; RMCP_BUILD_VALUE="$(ENABLE_RUST_MCP_RMCP_BUILD)"; RUST_ARG=""; RMCP_ARG=""; PROFILING_ARG=""; \ + if [ "$(RUST_MCP_BUILD)" = "1" ] || [ "$(RUST_MCP_BUILD)" = "true" ]; then \ + RUST_BUILD_VALUE="1"; \ + if [ -z "$$RMCP_BUILD_VALUE" ] || [ "$$RMCP_BUILD_VALUE" = "0" ] || [ "$$RMCP_BUILD_VALUE" = "false" ]; then \ + RMCP_BUILD_VALUE="1"; \ + fi; \ + fi; \ + if [ "$$RUST_BUILD_VALUE" = "1" ] || [ "$$RUST_BUILD_VALUE" = "true" ]; then \ echo "🦀 Building container WITH Rust plugins..."; \ RUST_ARG="--build-arg ENABLE_RUST=true"; \ + if [ "$$RMCP_BUILD_VALUE" = "1" ] || [ "$$RMCP_BUILD_VALUE" = "true" ]; then \ + echo "🦀 Enabling rmcp support in the Rust MCP runtime..."; \ + RMCP_ARG="--build-arg ENABLE_RUST_MCP_RMCP=true"; \ + else \ + RMCP_ARG="--build-arg ENABLE_RUST_MCP_RMCP=false"; \ + fi; \ else \ - echo "⏭️ Building container WITHOUT Rust plugins (set ENABLE_RUST_BUILD=1 to enable)"; \ + echo "⏭️ Building container WITHOUT Rust plugins (set RUST_MCP_BUILD=1 or ENABLE_RUST_BUILD=1 to enable)"; \ RUST_ARG="--build-arg ENABLE_RUST=false"; \ + RMCP_ARG="--build-arg ENABLE_RUST_MCP_RMCP=false"; \ fi; \ if [ "$(ENABLE_PROFILING_BUILD)" = "1" ]; then \ echo "📊 Building container WITH profiling tools (memray)..."; \ @@ -4623,7 +4845,9 @@ container-build: --platform=$(PLATFORM) \ -f $(CONTAINER_FILE) \ $$RUST_ARG \ + $$RMCP_ARG \ $$PROFILING_ARG \ + $(DOCKER_BUILD_ARGS) \ --tag $(IMAGE_BASE):$(IMAGE_TAG) \ . 
@echo "✅ Built image: $(call get_image_name)" @@ -5123,6 +5347,12 @@ docker: docker-prod: @DOCKER_CONTENT_TRUST=1 $(MAKE) container-build CONTAINER_RUNTIME=docker CONTAINER_FILE=Containerfile.lite +docker-prod-rust: + @DOCKER_CONTENT_TRUST=1 $(MAKE) container-build CONTAINER_RUNTIME=docker CONTAINER_FILE=Containerfile.lite RUST_MCP_BUILD=1 + +docker-prod-rust-no-cache: + @DOCKER_CONTENT_TRUST=1 $(MAKE) container-build CONTAINER_RUNTIME=docker CONTAINER_FILE=Containerfile.lite RUST_MCP_BUILD=1 DOCKER_BUILD_ARGS="--no-cache" + # Build production image with profiling tools (memray) for performance debugging # Usage: make docker-prod-profiling # Then run with SYS_PTRACE capability: @@ -5763,7 +5993,7 @@ MINIKUBE_ADDONS ?= ingress ingress-dns metrics-server dashboard registry regist # mcpgateway/mcpgateway:latest. Override with IMAGE= to use a # remote registry (e.g. ghcr.io/ibm/mcp-context-forge:v0.9.0). TAG ?= latest # override with TAG= -IMAGE ?= $(IMG):$(TAG) # or IMAGE=ghcr.io/ibm/mcp-context-forge:$(TAG) +IMAGE ?= $(IMAGE_LOCAL) # or IMAGE=ghcr.io/ibm/mcp-context-forge:$(TAG) # ----------------------------------------------------------------------------- # 🆘 HELP TARGETS (parsed by `make help`) @@ -5854,7 +6084,7 @@ minikube-dashboard: .PHONY: minikube-context minikube-context: @echo "🎯 Switching kubectl context to Minikube ..." - kubectl config use-context minikube + kubectl config use-context $(MINIKUBE_PROFILE) .PHONY: minikube-ssh minikube-ssh: @@ -7730,7 +7960,7 @@ migration-test-all: migration-setup ## Run comprehensive migration test s @echo "📋 Testing PostgreSQL migrations..." @/bin/bash -c "source $(VENV_DIR)/bin/activate && \ pytest $(MIGRATION_TEST_DIR)/test_compose_postgres_migrations.py \ - -v --tb=short --maxfail=3 -m 'not slow' \ + -v --tb=short --maxfail=3 \ --log-cli-level=INFO --log-cli-format='%(asctime)s [%(levelname)s] %(name)s: %(message)s'" @echo "" @echo "📊 Generating migration test report..." 
@@ -7752,7 +7982,7 @@ migration-test-postgres: ## Run PostgreSQL compose migration t @test -d "$(VENV_DIR)" || $(MAKE) venv @/bin/bash -c "source $(VENV_DIR)/bin/activate && \ pytest $(MIGRATION_TEST_DIR)/test_compose_postgres_migrations.py \ - -v --tb=short --log-cli-level=INFO -m 'not slow'" + -v --tb=short --log-cli-level=INFO" @echo "✅ PostgreSQL migration tests complete!" migration-test-performance: ## Run migration performance benchmarking @@ -7864,10 +8094,14 @@ upgrade-validate: ## Validate fresh + upgrade DB startup # help: rust-build-all-platforms - Build for all platforms (Linux, macOS, Windows) # help: rust-cross - Install targets + build all Linux (convenience) # help: rust-cross-install-build - Install targets + build all platforms (one command) +# help: rust-mcp-runtime-build - Build the experimental Rust MCP runtime +# help: rust-mcp-runtime-test - Run tests for the experimental Rust MCP runtime +# help: rust-mcp-runtime-run - Run the experimental Rust MCP runtime against local gateway /rpc .PHONY: rust-build rust-dev rust-test rust-test-integration rust-python-test rust-test-all rust-bench rust-bench-compare rust-compare rust-check rust-clean rust-verify rust-verify-stubs .PHONY: rust-ensure-deps rust-install-deps rust-install-targets rust-install .PHONY: rust-build-all-linux rust-build-all-platforms rust-cross rust-cross-install-build +.PHONY: rust-mcp-runtime-build rust-mcp-runtime-test rust-mcp-runtime-run rust-ensure-deps: ## Ensure Rust toolchain, maturin, and all plugins are installed @if ! 
command -v rustup > /dev/null 2>&1; then \ @@ -7994,6 +8228,18 @@ rust-cross: rust-install-targets rust-build-all-linux ## Install targets + buil rust-cross-install-build: rust-install-deps rust-install-targets rust-build-all-platforms ## Install targets + build all platforms (one command) @echo "✅ Full cross-compilation setup and build complete" +rust-mcp-runtime-build: ## Build the experimental Rust MCP runtime + @echo "🦀 Building experimental Rust MCP runtime..." + @cd tools_rust/mcp_runtime && cargo build --release + +rust-mcp-runtime-test: ## Run tests for the experimental Rust MCP runtime + @echo "🧪 Running Rust MCP runtime tests..." + @cd tools_rust/mcp_runtime && cargo test --release + +rust-mcp-runtime-run: ## Run the experimental Rust MCP runtime against local gateway /rpc + @echo "🚀 Starting Rust MCP runtime on http://127.0.0.1:8787 with backend http://127.0.0.1:4444/rpc" + @cd tools_rust/mcp_runtime && cargo run --release -- --backend-rpc-url http://127.0.0.1:4444/rpc --listen-http 127.0.0.1:8787 + .PHONY: conc-02-gateways conc-02-gateways: ## Run CONC-02 gateways read-during-write check (manual env/token setup required) @/bin/bash tests/manual/concurrency/run_conc_02_gateways.sh diff --git a/charts/mcp-stack/templates/configmap-nginx-proxy.yaml b/charts/mcp-stack/templates/configmap-nginx-proxy.yaml index d4bc1da10b..35cdb248d4 100644 --- a/charts/mcp-stack/templates/configmap-nginx-proxy.yaml +++ b/charts/mcp-stack/templates/configmap-nginx-proxy.yaml @@ -56,6 +56,28 @@ data: allow all; } + location ~ ^(/mcp/?|/servers/.*/mcp/?)$ { + proxy_http_version 1.1; + proxy_set_header Host $http_host; + proxy_set_header X-Real-IP $remote_addr; + proxy_set_header X-Forwarded-For $proxy_add_x_forwarded_for; + proxy_set_header X-Forwarded-Proto $forwarded_proto; + proxy_set_header X-Forwarded-Host $http_host; + proxy_set_header Connection ""; + + proxy_request_buffering off; + proxy_buffering off; + proxy_cache off; + add_header X-Accel-Buffering "no" always; + + 
proxy_connect_timeout 1h; + proxy_read_timeout 1h; + proxy_send_timeout 1h; + send_timeout {{ .Values.nginxProxy.config.sendTimeout }}; + + proxy_pass http://gateway_upstream; + } + location / { proxy_http_version 1.1; proxy_set_header Host $http_host; diff --git a/charts/mcp-stack/templates/registration-jobs.yaml b/charts/mcp-stack/templates/registration-jobs.yaml index c4a8f2cb8d..44e6fc9212 100644 --- a/charts/mcp-stack/templates/registration-jobs.yaml +++ b/charts/mcp-stack/templates/registration-jobs.yaml @@ -142,6 +142,8 @@ spec: print("fast_time registration complete") PY + + exit 0 {{- end }} {{- if and .Values.testing.enabled $registrationEnabled .Values.testing.fastTest.register.enabled .Values.testing.fastTestServer.enabled }} @@ -236,6 +238,8 @@ spec: api_request("POST", "/gateways", {"name": gateway_name, "url": gateway_url, "transport": transport}) print("fast_test registration complete") PY + + exit 0 {{- end }} {{- if and .Values.testing.enabled $registrationEnabled .Values.testing.a2a.register.enabled .Values.testing.a2aEchoAgent.enabled }} @@ -344,6 +348,8 @@ spec: api_request("POST", "/a2a", payload) print("a2a echo registration complete") PY + + exit 0 {{- end }} {{- if and .Values.benchmark.enabled .Values.benchmark.register.enabled $registrationEnabled }} @@ -441,4 +447,6 @@ spec: print("benchmark registration complete") PY + + exit 0 {{- end }} diff --git a/charts/mcp-stack/values-minikube.yaml b/charts/mcp-stack/values-minikube.yaml index f784fc1fff..00ebc530d1 100644 --- a/charts/mcp-stack/values-minikube.yaml +++ b/charts/mcp-stack/values-minikube.yaml @@ -58,6 +58,12 @@ mcpContextForge: PASSWORD_REQUIRE_SPECIAL: "false" REQUIRE_STRONG_SECRETS: "false" +migration: + image: + repository: ghcr.io/ibm/mcp-context-forge + tag: "1.0.0-RC-2" + pullPolicy: Never + # Disable TLS on fast-time-server ingress for minikube mcpFastTimeServer: ingress: diff --git a/docker-compose-embedded.yml b/docker-compose-embedded.yml index dd428eb6cd..e549c80868 
100644 --- a/docker-compose-embedded.yml +++ b/docker-compose-embedded.yml @@ -45,7 +45,7 @@ services: - ./infra/iframe-test/nginx-embedded.conf:/etc/nginx/nginx.conf:ro gateway: - image: ghcr.io/ibm/mcp-context-forge:1ba8130f7fb82e6f393435be8d064879f234ace1 + image: ${IMAGE_LOCAL:-mcpgateway/mcpgateway:latest} environment: # ── Embedded UI ── - MCPGATEWAY_UI_EMBEDDED=true @@ -147,7 +147,7 @@ services: # Benchmark services: inherited from base compose (profiles: ["benchmark"]) # Activated via --profile benchmark in Makefile targets register_benchmark: - image: ghcr.io/ibm/mcp-context-forge:1ba8130f7fb82e6f393435be8d064879f234ace1 + image: ${IMAGE_LOCAL:-mcpgateway/mcpgateway:latest} environment: - JWT_SECRET_KEY=${JWT_SECRET_KEY:-my-test-key} - BENCHMARK_SERVER_COUNT=${BENCHMARK_SERVER_COUNT:-10} diff --git a/docker-compose.yml b/docker-compose.yml index d5cfc2bd47..b5f93cc18c 100644 --- a/docker-compose.yml +++ b/docker-compose.yml @@ -117,6 +117,9 @@ services: build: context: . dockerfile: Containerfile.lite # Same one the Makefile builds + args: + ENABLE_RUST: ${ENABLE_RUST_BUILD:-${RUST_MCP_BUILD:-false}} + ENABLE_RUST_MCP_RMCP: ${ENABLE_RUST_MCP_RMCP_BUILD:-${RUST_MCP_BUILD:-false}} restart: unless-stopped # NOTE: When using replicas > 1, access via nginx:8080 instead of direct port 4444 # ports: @@ -139,13 +142,65 @@ services: # Both achieve same RPS when database is the bottleneck. 
# ═══════════════════════════════════════════════════════════════════════════ # - HTTP_SERVER=granian # Rust-based, native backpressure, +47% memory, -8% CPU - - HTTP_SERVER=gunicorn # Python-based, battle-tested, lower memory usage + - HTTP_SERVER=${HTTP_SERVER:-gunicorn} # Python-based by default; set granian to benchmark the Rust ASGI front door - HOST=0.0.0.0 - PORT=4444 # Domain for CORS/cookies (nginx default at http://localhost:8080) - APP_DOMAIN=${APP_DOMAIN:-http://localhost:8080} # Transport: sse, streamablehttp, http, or all (default: all) - TRANSPORT_TYPE=streamablehttp + # High-level Rust MCP UX: + # RUST_MCP_MODE=off -> Python MCP transport + # RUST_MCP_MODE=shadow -> Rust sidecar is present, but public /mcp stays on Python for safe fallback + # RUST_MCP_MODE=edge -> direct public /mcp on Rust with managed UDS sidecar defaults + # RUST_MCP_MODE=full -> edge + Rust session/event-store/resume/live-stream/affinity cores + # Advanced EXPERIMENTAL_/MCP_RUST_* env vars below still work as explicit overrides. + - RUST_MCP_MODE=${RUST_MCP_MODE:-off} + - RUST_MCP_LOG=${RUST_MCP_LOG:-warn} + # Advanced override: force the session-auth-reuse fast path on/off + # independently of RUST_MCP_MODE. Prefer the mode presets above. + - RUST_MCP_SESSION_AUTH_REUSE=${RUST_MCP_SESSION_AUTH_REUSE:-} + # Experimental Rust MCP runtime internals. Leave unset for the simple + # RUST_MCP_MODE=shadow/edge/full paths; set explicitly only to override. 
+ - EXPERIMENTAL_RUST_MCP_RUNTIME_ENABLED=${EXPERIMENTAL_RUST_MCP_RUNTIME_ENABLED:-} + - EXPERIMENTAL_RUST_MCP_RUNTIME_MANAGED=${EXPERIMENTAL_RUST_MCP_RUNTIME_MANAGED:-} + - EXPERIMENTAL_RUST_MCP_RUNTIME_URL=${EXPERIMENTAL_RUST_MCP_RUNTIME_URL:-} + - EXPERIMENTAL_RUST_MCP_RUNTIME_UDS=${EXPERIMENTAL_RUST_MCP_RUNTIME_UDS:-} + - EXPERIMENTAL_RUST_MCP_RUNTIME_TIMEOUT_SECONDS=${EXPERIMENTAL_RUST_MCP_RUNTIME_TIMEOUT_SECONDS:-30} + - EXPERIMENTAL_RUST_MCP_SESSION_CORE_ENABLED=${EXPERIMENTAL_RUST_MCP_SESSION_CORE_ENABLED:-} + - EXPERIMENTAL_RUST_MCP_EVENT_STORE_ENABLED=${EXPERIMENTAL_RUST_MCP_EVENT_STORE_ENABLED:-} + - EXPERIMENTAL_RUST_MCP_RESUME_CORE_ENABLED=${EXPERIMENTAL_RUST_MCP_RESUME_CORE_ENABLED:-} + - EXPERIMENTAL_RUST_MCP_LIVE_STREAM_CORE_ENABLED=${EXPERIMENTAL_RUST_MCP_LIVE_STREAM_CORE_ENABLED:-} + - EXPERIMENTAL_RUST_MCP_AFFINITY_CORE_ENABLED=${EXPERIMENTAL_RUST_MCP_AFFINITY_CORE_ENABLED:-} + - EXPERIMENTAL_RUST_MCP_SESSION_AUTH_REUSE_ENABLED=${EXPERIMENTAL_RUST_MCP_SESSION_AUTH_REUSE_ENABLED:-} + # Sidecar-level knobs. These default from the mode-derived experimental settings above. 
+ - MCP_RUST_LISTEN_HTTP=${MCP_RUST_LISTEN_HTTP:-} + - MCP_RUST_LISTEN_UDS=${MCP_RUST_LISTEN_UDS:-} + - MCP_RUST_PUBLIC_LISTEN_HTTP=${MCP_RUST_PUBLIC_LISTEN_HTTP:-} + - MCP_RUST_BACKEND_RPC_URL=${MCP_RUST_BACKEND_RPC_URL:-http://127.0.0.1:4444/_internal/mcp/rpc} + - MCP_RUST_REDIS_URL=${MCP_RUST_REDIS_URL:-} + - MCP_RUST_CACHE_PREFIX=${MCP_RUST_CACHE_PREFIX:-mcpgw:} + - MCP_RUST_DATABASE_URL=${MCP_RUST_DATABASE_URL:-} + - MCP_RUST_DB_POOL_MAX_SIZE=${MCP_RUST_DB_POOL_MAX_SIZE:-20} + - MCP_RUST_SESSION_CORE_ENABLED=${MCP_RUST_SESSION_CORE_ENABLED:-} + - MCP_RUST_SESSION_TTL_SECONDS=${MCP_RUST_SESSION_TTL_SECONDS:-3600} + - MCP_RUST_EVENT_STORE_ENABLED=${MCP_RUST_EVENT_STORE_ENABLED:-} + - MCP_RUST_RESUME_CORE_ENABLED=${MCP_RUST_RESUME_CORE_ENABLED:-} + - MCP_RUST_LIVE_STREAM_CORE_ENABLED=${MCP_RUST_LIVE_STREAM_CORE_ENABLED:-} + - MCP_RUST_AFFINITY_CORE_ENABLED=${MCP_RUST_AFFINITY_CORE_ENABLED:-} + - MCP_RUST_SESSION_AUTH_REUSE_ENABLED=${MCP_RUST_SESSION_AUTH_REUSE_ENABLED:-} + - MCP_RUST_SESSION_AUTH_REUSE_TTL_SECONDS=${MCP_RUST_SESSION_AUTH_REUSE_TTL_SECONDS:-30} + - MCP_RUST_EVENT_STORE_MAX_EVENTS_PER_STREAM=${MCP_RUST_EVENT_STORE_MAX_EVENTS_PER_STREAM:-100} + - MCP_RUST_EVENT_STORE_TTL_SECONDS=${MCP_RUST_EVENT_STORE_TTL_SECONDS:-3600} + - MCP_RUST_EVENT_STORE_POLL_INTERVAL_MS=${MCP_RUST_EVENT_STORE_POLL_INTERVAL_MS:-250} + - MCP_RUST_LOG=${MCP_RUST_LOG:-} + - MCP_RUST_CLIENT_CONNECT_TIMEOUT_MS=${MCP_RUST_CLIENT_CONNECT_TIMEOUT_MS:-5000} + - MCP_RUST_CLIENT_POOL_IDLE_TIMEOUT_SECONDS=${MCP_RUST_CLIENT_POOL_IDLE_TIMEOUT_SECONDS:-90} + - MCP_RUST_CLIENT_POOL_MAX_IDLE_PER_HOST=${MCP_RUST_CLIENT_POOL_MAX_IDLE_PER_HOST:-1024} + - MCP_RUST_CLIENT_TCP_KEEPALIVE_SECONDS=${MCP_RUST_CLIENT_TCP_KEEPALIVE_SECONDS:-30} + - MCP_RUST_TOOLS_CALL_PLAN_TTL_SECONDS=${MCP_RUST_TOOLS_CALL_PLAN_TTL_SECONDS:-30} + - MCP_RUST_UPSTREAM_SESSION_TTL_SECONDS=${MCP_RUST_UPSTREAM_SESSION_TTL_SECONDS:-300} + - MCP_RUST_USE_RMCP_UPSTREAM_CLIENT=${MCP_RUST_USE_RMCP_UPSTREAM_CLIENT:-} # WebSocket 
transport features (disabled by default; opt-in only) - MCPGATEWAY_WS_RELAY_ENABLED=${MCPGATEWAY_WS_RELAY_ENABLED:-false} - MCPGATEWAY_REVERSE_PROXY_ENABLED=${MCPGATEWAY_REVERSE_PROXY_ENABLED:-false} @@ -338,6 +393,7 @@ services: # - KEY_FILE_PASSWORD=${KEY_FILE_PASSWORD} # Uncomment to enable plugins - PLUGINS_ENABLED=true + - PLUGINS_CONFIG_FILE=${PLUGINS_CONFIG_FILE:-plugins/config.yaml} # Uncomment to enable catalog - MCPGATEWAY_CATALOG_ENABLED=true - MCPGATEWAY_CATALOG_FILE=/app/mcp-catalog.yml @@ -422,14 +478,14 @@ services: # ═══════════════════════════════════════════════════════════════════════════ # Gunicorn Configuration (used when HTTP_SERVER=gunicorn) # ═══════════════════════════════════════════════════════════════════════════ - - GUNICORN_WORKERS=${GUNICORN_WORKERS:-24} # Worker processes per replica - - GUNICORN_TIMEOUT=120 # Worker timeout in seconds - - GUNICORN_GRACEFUL_TIMEOUT=60 # Grace period for worker shutdown - - GUNICORN_KEEP_ALIVE=30 # Keep-alive timeout (matches SSE keepalive) + - GUNICORN_WORKERS=${GUNICORN_WORKERS:-24} # Worker processes (match CPU cores) + - GUNICORN_TIMEOUT=${GUNICORN_TIMEOUT:-120} # Worker timeout in seconds + - GUNICORN_GRACEFUL_TIMEOUT=${GUNICORN_GRACEFUL_TIMEOUT:-60} # Grace period for worker shutdown + - GUNICORN_KEEP_ALIVE=${GUNICORN_KEEP_ALIVE:-30} # Keep-alive timeout (matches SSE keepalive) # Worker recycling cleans up MCP SDK stuck task groups (anyio#695 workaround) - - GUNICORN_MAX_REQUESTS=1000000 # Recycle workers after 1M requests - - GUNICORN_MAX_REQUESTS_JITTER=100000 # ±100000 jitter prevents thundering herd - - GUNICORN_BACKLOG=4096 # Connection queue depth + - GUNICORN_MAX_REQUESTS=${GUNICORN_MAX_REQUESTS:-1000000} # Recycle workers after 1M requests + - GUNICORN_MAX_REQUESTS_JITTER=${GUNICORN_MAX_REQUESTS_JITTER:-100000} # ±100000 jitter prevents thundering herd + - GUNICORN_BACKLOG=${GUNICORN_BACKLOG:-4096} # Connection queue depth # 
═══════════════════════════════════════════════════════════════════════════ # Granian Backpressure Configuration (used when HTTP_SERVER=granian) # ═══════════════════════════════════════════════════════════════════════════ @@ -437,11 +493,11 @@ services: # immediate 503 responses instead of queuing them (which can cause OOM/timeouts). # Total capacity = GRANIAN_WORKERS × GRANIAN_BACKPRESSURE = 16 × 128 = 2048 concurrent # Requests beyond this limit receive immediate 503 (no queuing, no OOM) - - GRANIAN_WORKERS=16 - - GRANIAN_BACKLOG=4096 - - GRANIAN_BACKPRESSURE=128 - - GRANIAN_HTTP1_BUFFER_SIZE=524288 - - GRANIAN_RESPAWN_FAILED=true + - GRANIAN_WORKERS=${GRANIAN_WORKERS:-16} + - GRANIAN_BACKLOG=${GRANIAN_BACKLOG:-4096} + - GRANIAN_BACKPRESSURE=${GRANIAN_BACKPRESSURE:-128} + - GRANIAN_HTTP1_BUFFER_SIZE=${GRANIAN_HTTP1_BUFFER_SIZE:-524288} + - GRANIAN_RESPAWN_FAILED=${GRANIAN_RESPAWN_FAILED:-true} # ─────────────────────────────────────────────────────────────────────── # Granian Worker Lifecycle (recycling to prevent resource leaks) # ─────────────────────────────────────────────────────────────────────── @@ -1340,17 +1396,18 @@ services: echo "Generating JWT token..." 
echo "Environment: JWT_SECRET_KEY=$$JWT_SECRET_KEY" - echo "Running: python3 -m mcpgateway.utils.create_jwt_token --username admin@example.com --exp 10080 --secret my-test-key --algo HS256" + echo "Running: python3 -m mcpgateway.utils.create_jwt_token --username admin@example.com --admin --exp 10080 --secret my-test-key --algo HS256" # Only capture stdout (the token), let warnings go to stderr - export MCPGATEWAY_BEARER_TOKEN=$$(python3 -m mcpgateway.utils.create_jwt_token --username admin@example.com --exp 10080 --secret my-test-key --algo HS256 2>/dev/null) + export MCPGATEWAY_BEARER_TOKEN=$$(python3 -m mcpgateway.utils.create_jwt_token --username admin@example.com --admin --exp 10080 --secret my-test-key --algo HS256 2>/dev/null) echo "Generated token: $$MCPGATEWAY_BEARER_TOKEN" # Decode the token to verify it has expiration echo "Decoding token to verify claims..." python3 -m mcpgateway.utils.create_jwt_token --decode "$$MCPGATEWAY_BEARER_TOKEN" 2>/dev/null || echo "Failed to decode token" - # Test authentication first - echo "Testing authentication..." + # Wait for authenticated gateway readiness. /health goes green before the + # admin/bootstrap path is fully ready for authenticated registration calls. + echo "Waiting for authenticated gateway readiness..." 
# Use Python to make HTTP requests python3 -c " @@ -1374,27 +1431,38 @@ services: with urllib.request.urlopen(req) as response: return json.loads(response.read().decode('utf-8')) - # Test version endpoint without auth - print('Checking gateway config...') - try: - with urllib.request.urlopen('http://gateway:4444/version') as response: - data = response.read().decode('utf-8') - print(f'Gateway version response (no auth): {data[:200]}') - except Exception as e: - print(f'Version check failed: {e}') - - # Test version endpoint with auth - print('Testing authentication...') - try: - req = urllib.request.Request('http://gateway:4444/version') - req.add_header('Authorization', f'Bearer {token}') - with urllib.request.urlopen(req) as response: - data = response.read().decode('utf-8') - print(f'Auth test response: SUCCESS') - auth_success = True - except Exception as e: - print(f'Auth test response: FAILED - {e}') - auth_success = False + def api_request_with_retry(method, path, data=None, retries=30, delay=2, retry_statuses=(401, 502, 503)): + '''Retry authenticated API requests while gateway workers settle.''' + for attempt in range(1, retries + 1): + try: + return api_request(method, path, data) + except urllib.error.HTTPError as exc: + if exc.code in retry_statuses and attempt < retries: + print(f'Retrying {method} {path} after HTTP {exc.code} ({attempt}/{retries})') + time.sleep(delay) + continue + raise + except Exception: + if attempt < retries: + print(f'Retrying {method} {path} after transient error ({attempt}/{retries})') + time.sleep(delay) + continue + raise + + print('Checking authenticated gateway readiness...') + for i in range(1, 61): + try: + gateways = api_request('GET', '/gateways') + print(f'✅ Authenticated gateway readiness confirmed ({len(gateways)} gateways visible)') + break + except urllib.error.HTTPError as exc: + print(f'Authenticated readiness not ready yet ({i}/60): HTTP {exc.code}') + except Exception as exc: + print(f'Authenticated readiness 
not ready yet ({i}/60): {exc}') + time.sleep(2) + else: + print('❌ Gateway authenticated readiness check failed') + sys.exit(1) # Register fast_time_server with gateway using Streamable HTTP transport print('Registering fast_time_server with gateway (Streamable HTTP)...') @@ -1402,11 +1470,11 @@ services: # First check if gateway already exists and delete it gateway_id = None try: - gateways = api_request('GET', '/gateways') + gateways = api_request_with_retry('GET', '/gateways') for gw in gateways: if gw.get('name') == 'fast_time': print(f'Found existing gateway {gw[\"id\"]}, deleting...') - api_request('DELETE', f'/gateways/{gw[\"id\"]}') + api_request_with_retry('DELETE', f'/gateways/{gw[\"id\"]}', retry_statuses=(401, 502, 503)) print('Deleted existing gateway') except Exception as e: print(f'Note: Could not check/delete existing gateway: {e}') @@ -1414,14 +1482,14 @@ services: # Delete existing virtual server if present (using fixed ID) VIRTUAL_SERVER_ID = '9779b6698cbd4b4995ee04a4fab38737' try: - api_request('DELETE', f'/servers/{VIRTUAL_SERVER_ID}') + api_request_with_retry('DELETE', f'/servers/{VIRTUAL_SERVER_ID}', retry_statuses=(401, 502, 503)) print(f'Deleted existing virtual server {VIRTUAL_SERVER_ID}') except Exception as e: print(f'Note: No existing virtual server to delete (or error: {e})') # Register the gateway try: - result = api_request('POST', '/gateways', { + result = api_request_with_retry('POST', '/gateways', { 'name': 'fast_time', 'url': 'http://fast_time_server:8080/http', 'transport': 'STREAMABLEHTTP' @@ -1499,7 +1567,7 @@ services: 'associated_prompts': prompt_ids } } - result = api_request('POST', '/servers', server_payload) + result = api_request_with_retry('POST', '/servers', server_payload) print(f'Virtual server created: {result}') print(f'✅ Successfully created virtual server with {len(tool_ids)} tools, {len(resource_ids)} resources, {len(prompt_ids)} prompts') except Exception as e: @@ -1536,7 +1604,7 @@ services: echo "Registering 
fast_time_server SSE transport with gateway..." # Generate JWT token - export MCPGATEWAY_BEARER_TOKEN=$$(python3 -m mcpgateway.utils.create_jwt_token --username admin@example.com --exp 10080 --secret my-test-key --algo HS256 2>/dev/null) + export MCPGATEWAY_BEARER_TOKEN=$$(python3 -m mcpgateway.utils.create_jwt_token --username admin@example.com --admin --exp 10080 --secret my-test-key --algo HS256 2>/dev/null) python3 -c " import json @@ -1707,7 +1775,7 @@ services: echo "Registering slow_time_server with gateway..." # Generate JWT token - export MCPGATEWAY_BEARER_TOKEN=$$(python3 -m mcpgateway.utils.create_jwt_token --username admin@example.com --exp 10080 --secret my-test-key --algo HS256 2>/dev/null) + export MCPGATEWAY_BEARER_TOKEN=$$(python3 -m mcpgateway.utils.create_jwt_token --username admin@example.com --admin --exp 10080 --secret my-test-key --algo HS256 2>/dev/null) python3 -c " import urllib.request @@ -1820,6 +1888,7 @@ services: # Register using Python python3 -c " + import urllib.error import urllib.request import json import os @@ -1837,13 +1906,45 @@ services: with urllib.request.urlopen(req) as response: return json.loads(response.read().decode('utf-8')) + def api_request_with_retry(method, path, data=None, retries=30, delay=2, retry_statuses=(401, 403, 502, 503)): + for attempt in range(1, retries + 1): + try: + return api_request(method, path, data) + except urllib.error.HTTPError as exc: + if exc.code in retry_statuses and attempt < retries: + print(f'Retrying {method} {path} after HTTP {exc.code} ({attempt}/{retries})') + time.sleep(delay) + continue + raise + except Exception: + if attempt < retries: + print(f'Retrying {method} {path} after transient error ({attempt}/{retries})') + time.sleep(delay) + continue + raise + + print('Waiting for authenticated gateway readiness...') + for i in range(1, 61): + try: + gateways = api_request('GET', '/gateways') + print(f'✅ Authenticated gateway readiness confirmed ({len(gateways)} gateways visible)') 
+ break + except urllib.error.HTTPError as exc: + print(f'Authenticated readiness not ready yet ({i}/60): HTTP {exc.code}') + except Exception as exc: + print(f'Authenticated readiness not ready yet ({i}/60): {exc}') + time.sleep(2) + else: + print('❌ Gateway authenticated readiness check failed') + exit(1) + # Delete existing gateway if present try: - gateways = api_request('GET', '/gateways') + gateways = api_request_with_retry('GET', '/gateways') for gw in gateways: if gw.get('name') == 'fast_test': print(f'Deleting existing gateway {gw[\"id\"]}...') - api_request('DELETE', f'/gateways/{gw[\"id\"]}') + api_request_with_retry('DELETE', f'/gateways/{gw[\"id\"]}') except Exception as e: print(f'Note: {e}') @@ -1851,14 +1952,14 @@ services: # Delete existing virtual server if present try: - api_request('DELETE', f'/servers/{VIRTUAL_SERVER_ID}') + api_request_with_retry('DELETE', f'/servers/{VIRTUAL_SERVER_ID}') print(f'Deleted existing virtual server {VIRTUAL_SERVER_ID}') except Exception as e: print(f'Note: No existing virtual server to delete (or error: {e})') # Register the gateway try: - result = api_request('POST', '/gateways', { + result = api_request_with_retry('POST', '/gateways', { 'name': 'fast_test', 'url': 'http://fast_test_server:8880/mcp', 'transport': 'STREAMABLEHTTP' @@ -1874,7 +1975,7 @@ services: for i in range(30): time.sleep(1) try: - tools = api_request('GET', '/tools') + tools = api_request_with_retry('GET', '/tools') fast_test_tools = [t for t in tools if t.get('gatewayId') == gateway_id] if fast_test_tools: print(f'Found {len(fast_test_tools)} tools from fast_test gateway') @@ -1888,7 +1989,7 @@ services: # Collect tool IDs from the fast_test gateway tool_ids = [] try: - tools = api_request('GET', '/tools') + tools = api_request_with_retry('GET', '/tools') tool_ids = [t['id'] for t in tools if t.get('gatewayId') == gateway_id] print(f'Tools: {[t[\"name\"] for t in tools if t.get(\"gatewayId\") == gateway_id]}') except Exception as e: @@ 
-1907,7 +2008,7 @@ services: 'associated_prompts': [] } } - result = api_request('POST', '/servers', server_payload) + result = api_request_with_retry('POST', '/servers', server_payload) print(f'✅ Virtual server created: {VIRTUAL_SERVER_ID} with {len(tool_ids)} tools') except Exception as e: print(f'❌ Failed to create virtual server: {e}') diff --git a/docker-entrypoint.sh b/docker-entrypoint.sh index 9dc26c5b53..f7fe94db54 100755 --- a/docker-entrypoint.sh +++ b/docker-entrypoint.sh @@ -1,37 +1,403 @@ #!/usr/bin/env bash -#─────────────────────────────────────────────────────────────────────────────── -# Script : docker-entrypoint.sh -# Purpose: Container entrypoint that allows switching between HTTP servers -# -# Environment Variables: -# HTTP_SERVER : Which HTTP server to use (default: gunicorn) -# - gunicorn : Python-based with Uvicorn workers (default) -# - granian : Rust-based HTTP server (alternative) -# -# Usage: -# # Run with Gunicorn (default) -# docker run -e HTTP_SERVER=gunicorn mcpgateway -# -# # Run with Granian -# docker run -e HTTP_SERVER=granian mcpgateway -#─────────────────────────────────────────────────────────────────────────────── - set -euo pipefail HTTP_SERVER="${HTTP_SERVER:-gunicorn}" +RUST_MCP_MODE="${RUST_MCP_MODE:-off}" +RUST_MCP_LOG="${RUST_MCP_LOG:-warn}" +RUST_MCP_SESSION_AUTH_REUSE="${RUST_MCP_SESSION_AUTH_REUSE:-}" +EXPERIMENTAL_RUST_MCP_RUNTIME_ENABLED="${EXPERIMENTAL_RUST_MCP_RUNTIME_ENABLED:-}" +EXPERIMENTAL_RUST_MCP_RUNTIME_MANAGED="${EXPERIMENTAL_RUST_MCP_RUNTIME_MANAGED:-}" +EXPERIMENTAL_RUST_MCP_RUNTIME_URL="${EXPERIMENTAL_RUST_MCP_RUNTIME_URL:-}" +EXPERIMENTAL_RUST_MCP_RUNTIME_UDS="${EXPERIMENTAL_RUST_MCP_RUNTIME_UDS:-}" +EXPERIMENTAL_RUST_MCP_SESSION_CORE_ENABLED="${EXPERIMENTAL_RUST_MCP_SESSION_CORE_ENABLED:-}" +EXPERIMENTAL_RUST_MCP_EVENT_STORE_ENABLED="${EXPERIMENTAL_RUST_MCP_EVENT_STORE_ENABLED:-}" +EXPERIMENTAL_RUST_MCP_RESUME_CORE_ENABLED="${EXPERIMENTAL_RUST_MCP_RESUME_CORE_ENABLED:-}" 
+EXPERIMENTAL_RUST_MCP_LIVE_STREAM_CORE_ENABLED="${EXPERIMENTAL_RUST_MCP_LIVE_STREAM_CORE_ENABLED:-}" +EXPERIMENTAL_RUST_MCP_AFFINITY_CORE_ENABLED="${EXPERIMENTAL_RUST_MCP_AFFINITY_CORE_ENABLED:-}" +EXPERIMENTAL_RUST_MCP_SESSION_AUTH_REUSE_ENABLED="${EXPERIMENTAL_RUST_MCP_SESSION_AUTH_REUSE_ENABLED:-}" +CONTEXTFORGE_ENABLE_RUST_BUILD="${CONTEXTFORGE_ENABLE_RUST_BUILD:-false}" +CONTEXTFORGE_ENABLE_RUST_MCP_RMCP_BUILD="${CONTEXTFORGE_ENABLE_RUST_MCP_RMCP_BUILD:-false}" +MCP_RUST_LISTEN_HTTP="${MCP_RUST_LISTEN_HTTP:-}" +MCP_RUST_LISTEN_UDS="${MCP_RUST_LISTEN_UDS:-}" +MCP_RUST_PUBLIC_LISTEN_HTTP="${MCP_RUST_PUBLIC_LISTEN_HTTP:-}" +MCP_RUST_LOG="${MCP_RUST_LOG:-}" +MCP_RUST_USE_RMCP_UPSTREAM_CLIENT="${MCP_RUST_USE_RMCP_UPSTREAM_CLIENT:-}" +MCP_RUST_SESSION_CORE_ENABLED="${MCP_RUST_SESSION_CORE_ENABLED:-}" +MCP_RUST_EVENT_STORE_ENABLED="${MCP_RUST_EVENT_STORE_ENABLED:-}" +MCP_RUST_RESUME_CORE_ENABLED="${MCP_RUST_RESUME_CORE_ENABLED:-}" +MCP_RUST_LIVE_STREAM_CORE_ENABLED="${MCP_RUST_LIVE_STREAM_CORE_ENABLED:-}" +MCP_RUST_AFFINITY_CORE_ENABLED="${MCP_RUST_AFFINITY_CORE_ENABLED:-}" +MCP_RUST_SESSION_AUTH_REUSE_ENABLED="${MCP_RUST_SESSION_AUTH_REUSE_ENABLED:-}" +MCP_RUST_SESSION_AUTH_REUSE_TTL_SECONDS="${MCP_RUST_SESSION_AUTH_REUSE_TTL_SECONDS:-}" + +SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)" +cd "${SCRIPT_DIR}" || { + echo "ERROR: Cannot change to script directory: ${SCRIPT_DIR}" + exit 1 +} + +RUST_MCP_PID="" +SERVER_PID="" + +apply_rust_mcp_mode_defaults() { + local normalized_mode="${RUST_MCP_MODE,,}" + local runtime_enabled_default="false" + local managed_default="true" + local session_core_default="false" + local event_store_default="false" + local resume_core_default="false" + local live_stream_core_default="false" + local affinity_core_default="false" + local session_auth_reuse_default="false" + + case "${normalized_mode}" in + ""|off) + ;; + shadow) + runtime_enabled_default="true" + ;; + edge) + runtime_enabled_default="true" + 
session_auth_reuse_default="true" + ;; + full) + runtime_enabled_default="true" + session_core_default="true" + event_store_default="true" + resume_core_default="true" + live_stream_core_default="true" + affinity_core_default="true" + session_auth_reuse_default="true" + ;; + *) + echo "ERROR: Unknown RUST_MCP_MODE value: ${RUST_MCP_MODE}" + echo "Valid options: off, shadow, edge, full" + exit 1 + ;; + esac + + if [[ -z "${EXPERIMENTAL_RUST_MCP_RUNTIME_ENABLED}" ]]; then + EXPERIMENTAL_RUST_MCP_RUNTIME_ENABLED="${runtime_enabled_default}" + fi + if [[ -z "${EXPERIMENTAL_RUST_MCP_RUNTIME_MANAGED}" ]]; then + EXPERIMENTAL_RUST_MCP_RUNTIME_MANAGED="${managed_default}" + fi + if [[ -z "${EXPERIMENTAL_RUST_MCP_RUNTIME_URL}" ]]; then + EXPERIMENTAL_RUST_MCP_RUNTIME_URL="http://127.0.0.1:8787" + fi + if [[ -z "${EXPERIMENTAL_RUST_MCP_SESSION_CORE_ENABLED}" ]]; then + EXPERIMENTAL_RUST_MCP_SESSION_CORE_ENABLED="${session_core_default}" + fi + if [[ -z "${EXPERIMENTAL_RUST_MCP_EVENT_STORE_ENABLED}" ]]; then + EXPERIMENTAL_RUST_MCP_EVENT_STORE_ENABLED="${event_store_default}" + fi + if [[ -z "${EXPERIMENTAL_RUST_MCP_RESUME_CORE_ENABLED}" ]]; then + EXPERIMENTAL_RUST_MCP_RESUME_CORE_ENABLED="${resume_core_default}" + fi + if [[ -z "${EXPERIMENTAL_RUST_MCP_LIVE_STREAM_CORE_ENABLED}" ]]; then + EXPERIMENTAL_RUST_MCP_LIVE_STREAM_CORE_ENABLED="${live_stream_core_default}" + fi + if [[ -z "${EXPERIMENTAL_RUST_MCP_AFFINITY_CORE_ENABLED}" ]]; then + EXPERIMENTAL_RUST_MCP_AFFINITY_CORE_ENABLED="${affinity_core_default}" + fi + if [[ -z "${EXPERIMENTAL_RUST_MCP_SESSION_AUTH_REUSE_ENABLED}" ]]; then + if [[ -n "${RUST_MCP_SESSION_AUTH_REUSE}" ]]; then + EXPERIMENTAL_RUST_MCP_SESSION_AUTH_REUSE_ENABLED="${RUST_MCP_SESSION_AUTH_REUSE}" + else + EXPERIMENTAL_RUST_MCP_SESSION_AUTH_REUSE_ENABLED="${session_auth_reuse_default}" + fi + fi + if [[ -z "${EXPERIMENTAL_RUST_MCP_RUNTIME_UDS}" && "${EXPERIMENTAL_RUST_MCP_RUNTIME_ENABLED}" = "true" && "${EXPERIMENTAL_RUST_MCP_RUNTIME_MANAGED}" = 
"true" ]]; then + EXPERIMENTAL_RUST_MCP_RUNTIME_UDS="/tmp/contextforge-mcp-rust.sock" + fi + if [[ -z "${MCP_RUST_LISTEN_HTTP}" ]]; then + MCP_RUST_LISTEN_HTTP="127.0.0.1:8787" + fi + if [[ -z "${MCP_RUST_PUBLIC_LISTEN_HTTP}" \ + && "${EXPERIMENTAL_RUST_MCP_RUNTIME_ENABLED}" = "true" \ + && "${EXPERIMENTAL_RUST_MCP_RUNTIME_MANAGED}" = "true" \ + && "${EXPERIMENTAL_RUST_MCP_SESSION_AUTH_REUSE_ENABLED}" = "true" ]]; then + MCP_RUST_PUBLIC_LISTEN_HTTP="0.0.0.0:8787" + fi + if [[ -z "${MCP_RUST_LISTEN_UDS}" && -n "${EXPERIMENTAL_RUST_MCP_RUNTIME_UDS}" ]]; then + MCP_RUST_LISTEN_UDS="${EXPERIMENTAL_RUST_MCP_RUNTIME_UDS}" + fi + if [[ -z "${MCP_RUST_USE_RMCP_UPSTREAM_CLIENT}" ]]; then + if [[ "${CONTEXTFORGE_ENABLE_RUST_MCP_RMCP_BUILD}" = "true" ]]; then + MCP_RUST_USE_RMCP_UPSTREAM_CLIENT="true" + else + MCP_RUST_USE_RMCP_UPSTREAM_CLIENT="false" + fi + fi + if [[ -z "${MCP_RUST_LOG}" ]]; then + MCP_RUST_LOG="${RUST_MCP_LOG}" + fi + if [[ -z "${MCP_RUST_SESSION_CORE_ENABLED}" ]]; then + MCP_RUST_SESSION_CORE_ENABLED="${EXPERIMENTAL_RUST_MCP_SESSION_CORE_ENABLED}" + fi + if [[ -z "${MCP_RUST_EVENT_STORE_ENABLED}" ]]; then + MCP_RUST_EVENT_STORE_ENABLED="${EXPERIMENTAL_RUST_MCP_EVENT_STORE_ENABLED}" + fi + if [[ -z "${MCP_RUST_RESUME_CORE_ENABLED}" ]]; then + MCP_RUST_RESUME_CORE_ENABLED="${EXPERIMENTAL_RUST_MCP_RESUME_CORE_ENABLED}" + fi + if [[ -z "${MCP_RUST_LIVE_STREAM_CORE_ENABLED}" ]]; then + MCP_RUST_LIVE_STREAM_CORE_ENABLED="${EXPERIMENTAL_RUST_MCP_LIVE_STREAM_CORE_ENABLED}" + fi + if [[ -z "${MCP_RUST_AFFINITY_CORE_ENABLED}" ]]; then + MCP_RUST_AFFINITY_CORE_ENABLED="${EXPERIMENTAL_RUST_MCP_AFFINITY_CORE_ENABLED}" + fi + if [[ -z "${MCP_RUST_SESSION_AUTH_REUSE_ENABLED}" ]]; then + MCP_RUST_SESSION_AUTH_REUSE_ENABLED="${EXPERIMENTAL_RUST_MCP_SESSION_AUTH_REUSE_ENABLED}" + fi + if [[ -z "${MCP_RUST_SESSION_AUTH_REUSE_TTL_SECONDS}" ]]; then + MCP_RUST_SESSION_AUTH_REUSE_TTL_SECONDS="30" + fi + + export RUST_MCP_MODE + export RUST_MCP_LOG + export 
RUST_MCP_SESSION_AUTH_REUSE + export EXPERIMENTAL_RUST_MCP_RUNTIME_ENABLED + export EXPERIMENTAL_RUST_MCP_RUNTIME_MANAGED + export EXPERIMENTAL_RUST_MCP_RUNTIME_URL + export EXPERIMENTAL_RUST_MCP_RUNTIME_UDS + export EXPERIMENTAL_RUST_MCP_SESSION_CORE_ENABLED + export EXPERIMENTAL_RUST_MCP_EVENT_STORE_ENABLED + export EXPERIMENTAL_RUST_MCP_RESUME_CORE_ENABLED + export EXPERIMENTAL_RUST_MCP_LIVE_STREAM_CORE_ENABLED + export EXPERIMENTAL_RUST_MCP_AFFINITY_CORE_ENABLED + export EXPERIMENTAL_RUST_MCP_SESSION_AUTH_REUSE_ENABLED + export MCP_RUST_LISTEN_HTTP + export MCP_RUST_LISTEN_UDS + export MCP_RUST_PUBLIC_LISTEN_HTTP + export MCP_RUST_LOG + export MCP_RUST_USE_RMCP_UPSTREAM_CLIENT + export MCP_RUST_SESSION_CORE_ENABLED + export MCP_RUST_EVENT_STORE_ENABLED + export MCP_RUST_RESUME_CORE_ENABLED + export MCP_RUST_LIVE_STREAM_CORE_ENABLED + export MCP_RUST_AFFINITY_CORE_ENABLED + export MCP_RUST_SESSION_AUTH_REUSE_ENABLED + export MCP_RUST_SESSION_AUTH_REUSE_TTL_SECONDS +} + +cleanup() { + local pids=() + + if [[ -n "${SERVER_PID}" ]] && kill -0 "${SERVER_PID}" 2>/dev/null; then + pids+=("${SERVER_PID}") + fi + if [[ -n "${RUST_MCP_PID}" ]] && kill -0 "${RUST_MCP_PID}" 2>/dev/null; then + pids+=("${RUST_MCP_PID}") + fi + + if [[ ${#pids[@]} -gt 0 ]]; then + kill "${pids[@]}" 2>/dev/null || true + wait "${pids[@]}" 2>/dev/null || true + fi +} + +print_mcp_runtime_mode() { + local runtime_mode="python" + local upstream_client_mode="native" + local session_core_mode="python" + local event_store_mode="python" + local resume_core_mode="python" + local live_stream_core_mode="python" + local affinity_core_mode="python" + local session_auth_reuse_mode="python" + + if [[ "${MCP_RUST_USE_RMCP_UPSTREAM_CLIENT}" = "true" ]]; then + upstream_client_mode="rmcp" + fi + if [[ "${MCP_RUST_SESSION_CORE_ENABLED}" = "true" && "${EXPERIMENTAL_RUST_MCP_RUNTIME_ENABLED}" = "true" ]]; then + session_core_mode="rust" + fi + if [[ "${MCP_RUST_EVENT_STORE_ENABLED}" = "true" && 
"${EXPERIMENTAL_RUST_MCP_RUNTIME_ENABLED}" = "true" ]]; then + event_store_mode="rust" + fi + if [[ "${MCP_RUST_RESUME_CORE_ENABLED}" = "true" && "${EXPERIMENTAL_RUST_MCP_RUNTIME_ENABLED}" = "true" ]]; then + resume_core_mode="rust" + fi + if [[ "${MCP_RUST_LIVE_STREAM_CORE_ENABLED}" = "true" && "${EXPERIMENTAL_RUST_MCP_RUNTIME_ENABLED}" = "true" ]]; then + live_stream_core_mode="rust" + fi + if [[ "${MCP_RUST_AFFINITY_CORE_ENABLED}" = "true" && "${EXPERIMENTAL_RUST_MCP_RUNTIME_ENABLED}" = "true" ]]; then + affinity_core_mode="rust" + fi + if [[ "${MCP_RUST_SESSION_AUTH_REUSE_ENABLED}" = "true" && "${EXPERIMENTAL_RUST_MCP_RUNTIME_ENABLED}" = "true" ]]; then + session_auth_reuse_mode="rust" + fi + + if [[ "${EXPERIMENTAL_RUST_MCP_RUNTIME_ENABLED}" = "true" ]]; then + if [[ "${EXPERIMENTAL_RUST_MCP_RUNTIME_MANAGED}" = "true" ]]; then + runtime_mode="rust-managed" + echo "MCP runtime mode: ${runtime_mode} (sidecar managed in this container, upstream client: ${upstream_client_mode}, session core: ${session_core_mode}, event store: ${event_store_mode}, resume core: ${resume_core_mode}, live stream core: ${live_stream_core_mode}, affinity core: ${affinity_core_mode}, session auth reuse: ${session_auth_reuse_mode})" + else + runtime_mode="rust-external" + echo "MCP runtime mode: ${runtime_mode} (external sidecar target: ${EXPERIMENTAL_RUST_MCP_RUNTIME_UDS:-${EXPERIMENTAL_RUST_MCP_RUNTIME_URL}}, upstream client: ${upstream_client_mode}, session core: ${session_core_mode}, event store: ${event_store_mode}, resume core: ${resume_core_mode}, live stream core: ${live_stream_core_mode}, affinity core: ${affinity_core_mode}, session auth reuse: ${session_auth_reuse_mode})" + fi + + if [[ "${MCP_RUST_USE_RMCP_UPSTREAM_CLIENT}" = "true" && "${CONTEXTFORGE_ENABLE_RUST_MCP_RMCP_BUILD}" != "true" ]]; then + echo "ERROR: MCP_RUST_USE_RMCP_UPSTREAM_CLIENT=true but this image was built without rmcp support." 
+ echo "Rebuild with RUST_MCP_BUILD=1 or --build-arg ENABLE_RUST_MCP_RMCP=true." + exit 1 + fi + return + fi + + if [[ "${CONTEXTFORGE_ENABLE_RUST_BUILD}" = "true" ]]; then + runtime_mode="python-rust-built-disabled" + echo "WARNING: MCP runtime mode: ${runtime_mode}" + echo "WARNING: Rust MCP artifacts are present in this image, but EXPERIMENTAL_RUST_MCP_RUNTIME_ENABLED=false so /mcp will run on the Python transport." + echo "WARNING: Set RUST_MCP_MODE=shadow, RUST_MCP_MODE=edge, or RUST_MCP_MODE=full to activate the Rust MCP runtime." + return + fi + + echo "MCP runtime mode: ${runtime_mode} (Rust MCP artifacts not built into this image)" +} -case "${HTTP_SERVER}" in - granian) - echo "Starting ContextForge with Granian (Rust-based HTTP server)..." - exec ./run-granian.sh "$@" - ;; - gunicorn) - echo "Starting ContextForge with Gunicorn + Uvicorn..." - exec ./run-gunicorn.sh "$@" - ;; - *) - echo "ERROR: Unknown HTTP_SERVER value: ${HTTP_SERVER}" - echo "Valid options: granian, gunicorn" +build_server_command() { + case "${HTTP_SERVER}" in + granian) + echo "Starting ContextForge with Granian (Rust-based HTTP server)..." + SERVER_CMD=(./run-granian.sh "$@") + ;; + gunicorn) + echo "Starting ContextForge with Gunicorn + Uvicorn..." 
+ SERVER_CMD=(./run-gunicorn.sh "$@") + ;; + *) + echo "ERROR: Unknown HTTP_SERVER value: ${HTTP_SERVER}" + echo "Valid options: granian, gunicorn" + exit 1 + ;; + esac +} + +start_managed_rust_mcp_runtime() { + local runtime_bin="/app/bin/contextforge-mcp-runtime" + local rust_listen_http="${MCP_RUST_LISTEN_HTTP:-127.0.0.1:8787}" + local rust_listen_uds="${MCP_RUST_LISTEN_UDS:-${EXPERIMENTAL_RUST_MCP_RUNTIME_UDS:-}}" + local app_root_path="${APP_ROOT_PATH:-}" + local backend_rpc_url="${MCP_RUST_BACKEND_RPC_URL:-http://127.0.0.1:${PORT:-4444}${app_root_path}/_internal/mcp/rpc}" + local rust_database_url="${MCP_RUST_DATABASE_URL:-}" + local rust_redis_url="${MCP_RUST_REDIS_URL:-${REDIS_URL:-}}" + local rust_cache_prefix="${MCP_RUST_CACHE_PREFIX:-${CACHE_PREFIX:-mcpgw:}}" + local rust_event_store_max="${MCP_RUST_EVENT_STORE_MAX_EVENTS_PER_STREAM:-${STREAMABLE_HTTP_MAX_EVENTS_PER_STREAM:-100}}" + local rust_event_store_ttl="${MCP_RUST_EVENT_STORE_TTL_SECONDS:-${STREAMABLE_HTTP_EVENT_TTL:-3600}}" + + if [[ -z "${rust_database_url}" && -n "${DATABASE_URL:-}" ]]; then + case "${DATABASE_URL}" in + postgresql+psycopg://*) + rust_database_url="${DATABASE_URL/postgresql+psycopg:\/\//postgresql://}" + ;; + postgresql://*|postgres://*) + rust_database_url="${DATABASE_URL}" + ;; + esac + fi + + if [[ "${CONTEXTFORGE_ENABLE_RUST_BUILD}" != "true" ]]; then + echo "ERROR: EXPERIMENTAL_RUST_MCP_RUNTIME_ENABLED=true but this image was built without Rust artifacts." + echo "Rebuild with RUST_MCP_BUILD=1 or --build-arg ENABLE_RUST=true, or set EXPERIMENTAL_RUST_MCP_RUNTIME_MANAGED=false to use an external sidecar." + exit 1 + fi + + if [[ ! 
-x "${runtime_bin}" ]]; then + echo "ERROR: Rust MCP runtime binary not found at ${runtime_bin}" exit 1 - ;; -esac + fi + + export MCP_RUST_LISTEN_HTTP="${rust_listen_http}" + if [[ -n "${rust_listen_uds}" ]]; then + export MCP_RUST_LISTEN_UDS="${rust_listen_uds}" + else + unset MCP_RUST_LISTEN_UDS || true + unset EXPERIMENTAL_RUST_MCP_RUNTIME_UDS || true + fi + if [[ -n "${MCP_RUST_PUBLIC_LISTEN_HTTP:-}" ]]; then + export MCP_RUST_PUBLIC_LISTEN_HTTP="${MCP_RUST_PUBLIC_LISTEN_HTTP}" + else + unset MCP_RUST_PUBLIC_LISTEN_HTTP || true + fi + export MCP_RUST_BACKEND_RPC_URL="${backend_rpc_url}" + export MCP_RUST_SESSION_CORE_ENABLED="${MCP_RUST_SESSION_CORE_ENABLED}" + export MCP_RUST_EVENT_STORE_ENABLED="${MCP_RUST_EVENT_STORE_ENABLED}" + export MCP_RUST_RESUME_CORE_ENABLED="${MCP_RUST_RESUME_CORE_ENABLED}" + export MCP_RUST_LIVE_STREAM_CORE_ENABLED="${MCP_RUST_LIVE_STREAM_CORE_ENABLED}" + export MCP_RUST_SESSION_AUTH_REUSE_ENABLED="${MCP_RUST_SESSION_AUTH_REUSE_ENABLED}" + export MCP_RUST_SESSION_AUTH_REUSE_TTL_SECONDS="${MCP_RUST_SESSION_AUTH_REUSE_TTL_SECONDS}" + export MCP_RUST_CACHE_PREFIX="${rust_cache_prefix}" + export MCP_RUST_EVENT_STORE_MAX_EVENTS_PER_STREAM="${rust_event_store_max}" + export MCP_RUST_EVENT_STORE_TTL_SECONDS="${rust_event_store_ttl}" + if [[ -n "${rust_database_url}" ]]; then + export MCP_RUST_DATABASE_URL="${rust_database_url}" + fi + if [[ -n "${rust_redis_url}" ]]; then + export MCP_RUST_REDIS_URL="${rust_redis_url}" + fi + + if [[ -n "${rust_listen_uds}" ]]; then + echo "Starting experimental Rust MCP runtime on unix://${MCP_RUST_LISTEN_UDS} (backend: ${MCP_RUST_BACKEND_RPC_URL})..." + else + echo "Starting experimental Rust MCP runtime on ${MCP_RUST_LISTEN_HTTP} (backend: ${MCP_RUST_BACKEND_RPC_URL})..." + fi + "${runtime_bin}" & + RUST_MCP_PID=$! 
+ + python3 - <<'PY' +import httpx +import os +import sys +import time +import urllib.error +import urllib.request + +base_url = os.environ.get("EXPERIMENTAL_RUST_MCP_RUNTIME_URL", "http://127.0.0.1:8787").rstrip("/") +health_url = f"{base_url}/health" +uds_path = os.environ.get("EXPERIMENTAL_RUST_MCP_RUNTIME_UDS") or os.environ.get("MCP_RUST_LISTEN_UDS") + +for _ in range(60): + if uds_path: + try: + with httpx.Client(transport=httpx.HTTPTransport(uds=uds_path), timeout=2.0) as client: + response = client.get(health_url) + if response.status_code == 200: + sys.exit(0) + except OSError: + time.sleep(0.5) + except httpx.HTTPError: + time.sleep(0.5) + else: + try: + with urllib.request.urlopen(health_url, timeout=2) as response: + if response.status == 200: + sys.exit(0) + except (OSError, urllib.error.URLError): + time.sleep(0.5) + +print(f"ERROR: Experimental Rust MCP runtime failed health check at {health_url}", file=sys.stderr) +sys.exit(1) +PY +} + +apply_rust_mcp_mode_defaults +build_server_command "$@" +print_mcp_runtime_mode + +if [[ "${EXPERIMENTAL_RUST_MCP_RUNTIME_ENABLED}" = "true" && "${EXPERIMENTAL_RUST_MCP_RUNTIME_MANAGED}" = "true" ]]; then + trap cleanup EXIT INT TERM + start_managed_rust_mcp_runtime + "${SERVER_CMD[@]}" & + SERVER_PID=$! + + set +e + wait -n "${SERVER_PID}" "${RUST_MCP_PID}" + STATUS=$? 
+ set -e + + exit "${STATUS}" +fi + +exec "${SERVER_CMD[@]}" diff --git a/docs/docs/architecture/.pages b/docs/docs/architecture/.pages index 138202e68b..550f9b18c6 100644 --- a/docs/docs/architecture/.pages +++ b/docs/docs/architecture/.pages @@ -2,6 +2,9 @@ nav: - Overview: index.md - Roadmap: roadmap.md - Performance Architecture: performance-architecture.md + - Rust MCP Runtime: rust-mcp-runtime.md + - Modular Runtime Architecture: modular-design.md + - Modular Runtime Specification: modular-runtime - Security Features: security-features.md - Plugin Framework: plugins.md - Export-Import Architecture: export-import-architecture.md diff --git a/docs/docs/architecture/adr/.pages b/docs/docs/architecture/adr/.pages index 298410fa0b..221314a73a 100644 --- a/docs/docs/architecture/adr/.pages +++ b/docs/docs/architecture/adr/.pages @@ -45,3 +45,8 @@ nav: - 40 Flexible Admin UI Section Visibility: 040-flexible-admin-ui-sections.md - 41 Top-Level Rust Workspace: 041-top-level-rust-workspace.md - 42 Enforce Rust in the Build Process: 042-enforce-rust-in-build-process.md + - 43 Rust MCP Runtime Sidecar and Mode Model: 043-rust-mcp-runtime-sidecar-mode-model.md + - 44 Module Communication Protocol: 044-module-communication-protocol.md + - 45 Auth Remains in Core: 045-auth-remains-in-core.md + - 46 Shared-Nothing Between Modules: 046-shared-nothing-between-modules.md + - 47 Incremental Migration Over Rewrite: 047-incremental-migration-over-rewrite.md diff --git a/docs/docs/architecture/adr/038-experimental-rust-transport-backend.md b/docs/docs/architecture/adr/038-experimental-rust-transport-backend.md index 81967ad2dc..256bbf7aac 100644 --- a/docs/docs/architecture/adr/038-experimental-rust-transport-backend.md +++ b/docs/docs/architecture/adr/038-experimental-rust-transport-backend.md @@ -1,11 +1,17 @@ # ADR-038: Experimental Rust Transport Backend (Streamable HTTP) -- *Status:* Proposed +- *Status:* Superseded by ADR-043 - *Date:* 2025-12-26 - *Deciders:* Platform Team 
## Context +!!! warning + This ADR records the original experiment proposal only. The implemented + architecture has moved to a Rust sidecar/runtime with mode-based rollout. + See [ADR-043](043-rust-mcp-runtime-sidecar-mode-model.md) for the current + decision. + ContextForge currently implements its transport layer (stdio, SSE, WebSocket, and Streamable HTTP) in Python using asyncio. While this provides functional correctness, the transport layer experiences performance and memory limitations under higher concurrency due to Python runtime overhead and GIL constraints. Issue #1621 proposes evaluating a Rust-based transport backend to improve throughput, latency, and resource efficiency while preserving the existing Transport API and protocol semantics. diff --git a/docs/docs/architecture/adr/043-rust-mcp-runtime-sidecar-mode-model.md b/docs/docs/architecture/adr/043-rust-mcp-runtime-sidecar-mode-model.md new file mode 100644 index 0000000000..eeb61e9008 --- /dev/null +++ b/docs/docs/architecture/adr/043-rust-mcp-runtime-sidecar-mode-model.md @@ -0,0 +1,112 @@ +# ADR-043: Rust MCP Runtime Sidecar with Mode-Based Rollout + +- *Status:* Accepted +- *Date:* 2026-03-14 +- *Deciders:* Platform Team +- *Supersedes:* ADR-038 (experimental Rust transport backend) + +## Context + +ContextForge's original Rust transport spike began as a narrow experiment around +the streamable HTTP MCP path. 
The implementation has since evolved beyond that +proposal: + +- the runtime is deployed as a separate Rust sidecar/runtime, not as PyO3/FFI +- nginx can route public `/mcp` traffic directly to Rust +- Rust can own session, event-store, resume, live-stream, and affinity MCP + cores in the `full` mode +- Python still remains authoritative for authentication, token scoping, and RBAC +- rollout and rollback are now controlled through a top-level mode model instead + of only through low-level experimental flags + +The older ADR no longer describes the implemented architecture or the operator +experience. + +## Decision + +We standardize on a **Rust MCP runtime sidecar** with a **mode-based rollout +model**. + +### User-facing modes + +`RUST_MCP_MODE` is the primary operational control: + +- `off`: keep the public MCP path on Python +- `shadow`: run the Rust sidecar, but keep public `/mcp` on Python +- `edge`: route public `/mcp` directly from nginx to Rust +- `full`: `edge` plus Rust-owned MCP session/event-store/resume/live-stream and + affinity cores + +### Public ingress model + +In `edge|full`, nginx routes public `GET/POST/DELETE /mcp` traffic directly to +the Rust runtime through a dedicated public listener. + +Rust authenticates public requests through a trusted internal Python endpoint: + +- `POST /_internal/mcp/authenticate` + +Python remains the system of record for: + +- JWT validation +- token scoping / team visibility +- RBAC + +Rust consumes the authenticated context and owns progressively more of the +public MCP runtime path. + +### Session/auth reuse + +Rust may reuse authenticated context per MCP session, but only with explicit +ownership/binding checks. 
Session reuse is: + +- bound to the original authenticated context +- validated against an auth-binding fingerprint +- denied if the auth binding changes for the same `mcp-session-id` +- backed by dedicated session-isolation tests + +### Fallback and safety + +`shadow` is the safety-first rollback/comparison mode. It keeps the public MCP +transport/session path on Python while still running the Rust sidecar +internally. + +Low-level `EXPERIMENTAL_RUST_MCP_*` flags still exist as advanced overrides, but +the documented operator model is the high-level mode switch above. + +## Consequences + +### Positive + +- Clear operational model for rollout, benchmarking, and rollback +- Public MCP ingress can move off Python incrementally without rewriting the + full security/control plane +- `shadow` provides a clean safety mode instead of an ambiguous hybrid path +- Session/auth reuse has a documented security model and dedicated isolation + coverage +- The runtime can own more of the hot MCP path while preserving Python + compatibility fallbacks + +### Negative + +- The architecture is now explicitly multi-process and multi-language +- Rust and Python responsibilities must remain carefully documented and tested +- Health, profiling, and debugging require mode-aware operational knowledge +- Some behavior still depends on narrow internal Python routes and compatibility + seams + +## Alternatives Considered + +| Option | Why Not | +|--------|---------| +| Keep ADR-038 as the canonical description | No longer matches the implementation or rollout model | +| Full Rust rewrite of the entire gateway/security stack | Higher risk and out of scope for the current incremental migration | +| Expose only low-level `EXPERIMENTAL_RUST_MCP_*` flags | Too hard for operators to reason about safely | +| Keep public `/mcp` permanently on Python and use Rust only behind Python | Leaves the Python ingress hop in the hot path and limits the performance gain | + +## References + +- [Rust MCP 
Runtime Architecture](../rust-mcp-runtime.md) +- [Performance Architecture](../performance-architecture.md) +- `tools_rust/mcp_runtime/TESTING-DESIGN.md` in the repository +- `tools_rust/mcp_runtime/README.md` in the repository diff --git a/docs/docs/architecture/adr/044-module-communication-protocol.md b/docs/docs/architecture/adr/044-module-communication-protocol.md new file mode 100644 index 0000000000..581bfac19d --- /dev/null +++ b/docs/docs/architecture/adr/044-module-communication-protocol.md @@ -0,0 +1,75 @@ +# ADR-044: Module Communication Protocol + +- *Status:* Proposed +- *Date:* 2026-03-15 +- *Deciders:* Platform Team +- *Related:* [Modular Runtime Architecture](../modular-design.md), [ADR-043](043-rust-mcp-runtime-sidecar-mode-model.md) + +## Context + +The modular gateway architecture requires protocol modules (MCP, A2A, LLM, +REST/gRPC) to communicate with the core platform over a well-defined boundary. +That boundary must: + +- Support modules written in any language (Python, Rust, Go). +- Handle both request/response and server-streaming patterns (e.g., catalog change subscriptions, SSE relay). +- Keep latency low enough that per-request overhead is negligible relative to upstream calls. +- Align with existing patterns in the codebase (the plugin framework already supports gRPC external runtimes). + +## Decision + +We adopt **gRPC over Unix Domain Socket** as the **target-state default** +module-to-core transport. + +- It is language-neutral via protobuf code generation. +- It supports unary and streaming patterns cleanly. +- It fits host-local sidecar communication well. +- It aligns with the existing external plugin gRPC pattern already present in + the codebase. 
+ +We also allow: + +- **HTTP/JSON** as a fallback where a gRPC toolchain is undesirable +- **direct in-process calls** for embedded runtimes using the same conceptual + contract + +This is important because the currently implemented Rust MCP precedent still +uses trusted internal HTTP over UDS or loopback. That precedent remains valid +during migration, but it does not redefine the longer-term default boundary. + +## Consequences + +### Positive + +- Single contract definition (protobuf) generates client/server stubs for Python, Rust, Go, and other languages. +- Streaming RPCs natively support catalog change subscriptions and session broadcast patterns. +- UDS avoids TCP overhead and keeps traffic host-local. +- Clean process boundary enables crash isolation and independent scaling of modules. + +### Negative + +- Adds a protobuf/gRPC toolchain dependency for module developers. +- Serialization overhead is higher than direct in-process calls. +- Module developers must handle connection lifecycle, deadlines, and + backpressure. + +### Neutral + +- The SPI schemas must be versioned to allow independent evolution. +- Modules that only need request/response can use HTTP/JSON at the cost of a + weaker streaming story. + +## Alternatives Considered + +| Option | Why Not | +|--------|---------| +| **Cap'n Proto** | Better zero-copy performance but significantly less language support and tooling. | +| **Flatbuffers** | No native streaming support; designed for serialization, not RPC. | +| **REST/JSON** | No streaming, higher overhead, no schema enforcement at compile time. | +| **Shared memory** | Too complex, limited to same-host deployment, no language-neutral schema. | +| **PyO3 / CGo (in-process FFI)** | Available as an optimization for embedded modules, but not suitable as the default boundary because it couples module lifecycle to the Python process. 
| + +## References + +- [Modular Runtime Architecture](../modular-design.md) +- `mcpgateway/plugins/framework/external/grpc/` — Existing gRPC external plugin runtime diff --git a/docs/docs/architecture/adr/045-auth-remains-in-core.md b/docs/docs/architecture/adr/045-auth-remains-in-core.md new file mode 100644 index 0000000000..86992b9416 --- /dev/null +++ b/docs/docs/architecture/adr/045-auth-remains-in-core.md @@ -0,0 +1,66 @@ +# ADR-045: Authentication and Authorization Remain in Core + +- *Status:* Proposed +- *Date:* 2026-03-15 +- *Deciders:* Platform Team +- *Related:* [Modular Runtime Architecture](../modular-design.md), [ADR-004](004-combine-jwt-and-basic-auth.md) + +## Context + +The modular gateway architecture introduces protocol modules that can be implemented in different languages and run as separate processes. A key question is whether authentication and authorization logic should be duplicated in each module or centralized in the core platform. + +ContextForge implements a two-layer security model: + +1. **Token Scoping (Layer 1):** `normalize_token_teams()` in `mcpgateway/auth.py` controls what resources a caller can see. +2. **RBAC (Layer 2):** `PermissionService` controls what actions a caller can perform. + +Both layers are security-critical and have non-trivial edge cases (admin bypass, public-only tokens, team hierarchy resolution). + +## Decision + +Authentication and authorization **never move into modules**. The core +platform remains the single source of truth for: + +- JWT verification and token scoping (`normalize_token_teams()`). +- RBAC permission checks (`PermissionService`). +- SSO provider integration (GitHub, Google, Okta, Keycloak, Entra ID, generic OIDC). +- Token revocation checks. +- Rate limiting. + +Modules consume auth through a core-owned auth and policy SPI. 
The exact RPC or +method names are intentionally left open, but the contract must support: + +- resolving a caller into a typed authenticated context +- checking permissions against that context +- preserving token-scoped visibility and deny-path behavior + +Modules receive authenticated context or permission outcomes from the core and +pass that context through subsequent core SPI calls as needed. + +## Consequences + +### Positive + +- Security-critical code has a single implementation — no drift between module auth implementations. +- Simplifies security auditing — one codebase to review, not N per module. +- Modules in any language get the full auth stack without reimplementing it. +- Consistent behavior across all protocols (MCP, A2A, LLM, REST). + +### Negative + +- Every module request that needs auth must make at least one call or cacheable + check against the core-owned auth boundary. +- Auth logic cannot be freely reimplemented per protocol without risking + policy drift. + +### Neutral + +- Auth caching at the core level (ADR-028) can amortize the cost of repeated + checks. +- The current Rust MCP runtime already demonstrates this pattern in practice. 
+ +## References + +- [Modular Runtime Architecture](../modular-design.md) +- `mcpgateway/auth.py` — `normalize_token_teams()`, single source of truth +- [ADR-043](043-rust-mcp-runtime-sidecar-mode-model.md) diff --git a/docs/docs/architecture/adr/046-shared-nothing-between-modules.md b/docs/docs/architecture/adr/046-shared-nothing-between-modules.md new file mode 100644 index 0000000000..dd0ba2457d --- /dev/null +++ b/docs/docs/architecture/adr/046-shared-nothing-between-modules.md @@ -0,0 +1,57 @@ +# ADR-046: Shared-Nothing Between Protocol Modules + +- *Status:* Proposed +- *Date:* 2026-03-15 +- *Deciders:* Platform Team +- *Related:* [Modular Runtime Architecture](../modular-design.md), [ADR-044](044-module-communication-protocol.md) + +## Context + +ContextForge supports multiple protocols (MCP, A2A, LLM, REST/gRPC) that sometimes need cross-protocol behavior: + +- A2A agents are auto-registered as MCP tools. +- LLM chat integrates MCP tools via LangChain. +- REST/gRPC services can be exposed as MCP tools. + +In the current monolithic architecture, this cross-protocol behavior happens via direct Python imports between services. In a modular architecture where modules may be written in different languages and run in separate processes, direct imports are not possible. + +## Decision + +**Modules cannot import or call each other directly.** All cross-protocol +behavior is mediated by the core platform through core-owned catalogs and +policy-aware routing. + +Illustrative example: + +1. an MCP module asks the core to invoke a tool +2. the core determines the owning integration type +3. the core routes to the appropriate protocol runtime +4. the result returns through the core to the original module + +The exact dispatcher shape may evolve, but the architectural rule does not: +modules remain isolated from one another and the core performs the bridging. 
+ +## Consequences + +### Positive + +- Prevents language-specific coupling between modules (Rust MCP module doesn't import Python A2A code). +- Forces clean API boundaries — all cross-protocol contracts go through the Core SPI. +- Enables independent deployment and scaling of modules. +- Modules can be replaced independently (e.g., Go A2A module replaces Python A2A module) without affecting other modules. + +### Negative + +- Cross-protocol calls have additional latency (two IPC hops: module → core → module). +- The core becomes a bottleneck for cross-protocol traffic. +- Some operations that are currently a simple function call become multi-hop IPC chains. + +### Neutral + +- An event bus (future) can provide asynchronous cross-module communication for non-request-path operations (e.g., "agent registered" → "create tool entry"). +- The `integration_type` field already exists on tools in the current schema, so the routing mechanism is a formalization of existing behavior. + +## References + +- [Modular Runtime Architecture](../modular-design.md) +- `mcpgateway/services/tool_service.py` — `_invoke_a2a_tool()` (current cross-protocol call) diff --git a/docs/docs/architecture/adr/047-incremental-migration-over-rewrite.md b/docs/docs/architecture/adr/047-incremental-migration-over-rewrite.md new file mode 100644 index 0000000000..cdc62859db --- /dev/null +++ b/docs/docs/architecture/adr/047-incremental-migration-over-rewrite.md @@ -0,0 +1,66 @@ +# ADR-047: Incremental Migration Over Rewrite + +- *Status:* Proposed +- *Date:* 2026-03-15 +- *Deciders:* Platform Team +- *Related:* [Modular Runtime Architecture](../modular-design.md), [ADR-019](019-modular-architecture-split.md) + +## Context + +The modular gateway architecture requires significant restructuring of the existing monolithic FastAPI application. Two approaches are possible: + +1. **Incremental migration:** Refactor the existing codebase phase-by-phase, keeping the system functional at each step. +2. 
**Ground-up rewrite:** Build the modular architecture from scratch and migrate services over. + +The existing codebase already has: + +- production behavior that cannot be broken casually +- a broad unit, integration, E2E, security, and performance test surface +- cross-cutting concerns such as auth, RBAC, plugins, and admin UI that must + remain coherent while protocol runtimes are extracted +- an implemented Rust MCP sidecar precedent showing that sidecar rollout is + feasible + +## Decision + +We **modularize through phased refactoring**, not a ground-up rewrite. The migration follows five phases: + +1. **Phase 0 — prerequisite refactors:** create cleaner seams inside the + monolith without changing the deployment model +2. **Phase 1 — core SPI definition:** express core/module boundaries as + internal interfaces first +3. **Phase 2 — module lifecycle:** wrap existing runtimes behind a common + lifecycle and capability model +4. **Phase 3 — sidecar transport:** add sidecar-capable communication where it + is justified +5. **Phase 4 — additional modules:** extract or introduce new protocol + runtimes on top of the same contract + +Feature flags and rollout controls may be used during the transition, but this +ADR does not freeze their final names. + +## Consequences + +### Positive + +- The existing test suite provides regression safety at every phase. +- Each phase leaves the system fully functional — no "big bang" cutover. +- Risk is distributed across multiple small PRs instead of one massive change. +- Legacy mode preserves an escape hatch if module mode has issues. +- The implemented Rust MCP runtime sidecar proves the sidecar pattern works before generalizing it. + +### Negative + +- The codebase will temporarily have both legacy and modular code paths. +- Feature flag complexity increases until legacy mode is retired. +- Each phase requires careful testing in both modes. 
+ +### Neutral + +- The migration timeline is longer than a rewrite but carries less risk. +- Legacy mode can be retired once all modules are stable and production-validated. + +## References + +- [Modular Runtime Architecture](../modular-design.md) +- [ADR-043](043-rust-mcp-runtime-sidecar-mode-model.md) diff --git a/docs/docs/architecture/adr/index.md b/docs/docs/architecture/adr/index.md index 73e748f0af..bc1bd73b93 100644 --- a/docs/docs/architecture/adr/index.md +++ b/docs/docs/architecture/adr/index.md @@ -40,10 +40,15 @@ This page tracks all significant design decisions made for ContextForge project, | 0033 | Tool Lookup Cache for invoke_tool | Accepted | Performance | 2025-01-20 | | 0035 | Query Parameter Authentication for Gateways | Accepted | Security | 2026-01-19 | | 0037 | External Plugin STDIO Launch with Command/Env Overrides | Accepted | Extensibility | 2026-01-28 | -| 0038 | Experimental Rust Transport Backend (Streamable HTTP) | Proposed | Performance | 2025-12-26 | +| 0038 | Experimental Rust Transport Backend (Streamable HTTP) | Superseded | Performance | 2025-12-26 | | 0039 | Adopt Fully Independent Plugin Crates Architecture | Accepted | Architecture | 2026-02-13 | | 0040 | Flexible Admin UI Section Visibility | Accepted | User Interface | 2026-02-16 | | 0041 | Top-Level Rust Workspace (Cargo.toml at Repository Root) | Accepted | Architecture | 2026-02-26 | | 0042 | Enforce Rust in the Build Process | Proposed | Build | 2026-02-26 | +| 0043 | Rust MCP Runtime Sidecar with Mode-Based Rollout | Accepted | Architecture | 2026-03-14 | +| 0044 | Module Communication Protocol (gRPC over UDS) | Proposed | Architecture | 2026-03-15 | +| 0045 | Authentication and Authorization Remain in Core | Proposed | Security | 2026-03-15 | +| 0046 | Shared-Nothing Between Protocol Modules | Proposed | Architecture | 2026-03-15 | +| 0047 | Incremental Migration Over Rewrite | Proposed | Architecture | 2026-03-15 | > ✳️ Add new decisions chronologically and link to 
them from this table. diff --git a/docs/docs/architecture/index.md b/docs/docs/architecture/index.md index d119f62e35..54955bda9f 100644 --- a/docs/docs/architecture/index.md +++ b/docs/docs/architecture/index.md @@ -4,7 +4,22 @@ ## High-Level Architecture Summary -**ContextForge** is a comprehensive production-grade gateway built on modern Python technologies with a performance-first approach. For a detailed visual diagram of the high-performance components (Rust-powered libraries, async patterns, caching layers, and Kubernetes scaling), see the [Performance Architecture Diagram](performance-architecture.md). +**ContextForge** is a comprehensive production-grade gateway built on modern +Python technologies with a performance-first approach. The primary control plane +remains Python, but the MCP streamable HTTP hot path can now optionally run +through a dedicated Rust runtime sidecar. For the current Rust MCP runtime +design, see [Rust MCP Runtime](rust-mcp-runtime.md). For the broader +high-performance view, see the +[Performance Architecture Diagram](performance-architecture.md). + +The broader target-state modular runtime architecture is documented separately +in [Modular Runtime Architecture](modular-design.md). That document generalizes +the current Rust MCP sidecar pattern into a reusable core-plus-modules design +for future MCP, A2A, LLM, and REST/gRPC runtimes. The related decisions are +captured in [ADR-043](adr/043-rust-mcp-runtime-sidecar-mode-model.md) through +[ADR-047](adr/047-incremental-migration-over-rewrite.md). The +implementation-ready contract for building new modules lives in the +[Modular Runtime Specification](modular-runtime/index.md). 
## Design Diagrams @@ -35,6 +50,10 @@ The following diagrams are generated by `make docs` and provide a quick visual r - Native **MCP (Model Context Protocol)** server implementation supporting protocol version 2025-03-26 - Transport mechanisms: **HTTP/JSON-RPC**, **Server-Sent Events (SSE)** with keepalive, **WebSocket**, **stdio** (for CLI integration), and **streamable-HTTP** - JSON-RPC 2.0 compliant message handling with bidirectional communication +- Optional **Rust MCP runtime sidecar** for streamable HTTP public ingress with + mode-based rollout (`off`, `shadow`, `edge`, `full`) +- In Rust `edge|full` mode, nginx routes public `/mcp` traffic directly to the + Rust runtime while Python remains authoritative for auth and RBAC **4. Federation & Registry Architecture** diff --git a/docs/docs/architecture/modular-design.md b/docs/docs/architecture/modular-design.md new file mode 100644 index 0000000000..f786b59e7e --- /dev/null +++ b/docs/docs/architecture/modular-design.md @@ -0,0 +1,676 @@ +# ContextForge Modular Runtime Architecture + +**Status:** Proposed target architecture and implementation entry point + +This document defines the target-state modular runtime architecture for +ContextForge. + +It is intended to support: + +- the existing MCP gateway +- the existing A2A gateway +- future LLM gateway runtimes +- future REST and gRPC gateway runtimes +- implementations in different languages, including Python, Rust, and Go + +## Purpose + +ContextForge already contains multiple protocol-facing runtime paths inside one +Python application. The Rust MCP runtime proves that a protocol runtime can be +split out into a separate implementation while the core platform remains the +system of record for security and catalog state. 
+ +This specification generalizes that idea into a reusable architecture: + +- a **core platform** that owns policy, persistence, catalogs, plugins, admin + UI, and observability +- one or more **protocol modules** that own protocol wire behavior and + transport or runtime semantics + +The goal is not to rewrite the product. The goal is to create a stable +architecture that can evolve incrementally from the current codebase. + +## Scope + +This document is about **runtime decomposition**, not package layout. + +It is complementary to +[ADR-019: Modular Architecture Split (14 Independent Modules)](adr/019-modular-architecture-split.md), +which is about packaging and repository structure. + +This document deliberately distinguishes between: + +- **implemented precedent** + The current Rust MCP runtime sidecar and existing external plugin runtimes. +- **target architecture** + The longer-term modular contract that future MCP, A2A, LLM, and REST or gRPC + runtimes should follow. +- **migration guidance** + The phased path from the current monolith to that target. 
+ +## Non-Goals + +This specification does not: + +- require a ground-up rewrite +- require all protocols to be extracted at once +- require all modules to be sidecars immediately +- freeze final protobuf package names or generated SDK layout +- replace protocol-specific documents such as + [Rust MCP Runtime](rust-mcp-runtime.md) + +## Relationship to Existing Architecture Docs + +| Document | Role | +|----------|------| +| [Rust MCP Runtime](rust-mcp-runtime.md) | Describes the currently implemented MCP sidecar/runtime path and rollout modes | +| [ADR-043](adr/043-rust-mcp-runtime-sidecar-mode-model.md) | Records the implemented Rust MCP sidecar and mode model | +| [Multitenancy](multitenancy.md) | Defines team scoping and visibility rules that remain core-owned | +| [OAuth Design](oauth-design.md) | Defines auth and credential handling that remain core-owned | +| [Plugin Framework](plugins.md) | Defines plugin behavior that remains centrally configured and enforced by the core | + +## How to Use This Specification + +Use the documents in this order: + +1. this page for the architectural rules and operating model +2. [Core SPI](modular-runtime/core-spi.md) for the module-to-core contract +3. [Module Descriptor](modular-runtime/module-descriptor.md) and + [Module Lifecycle](modular-runtime/module-lifecycle.md) for module + registration and startup behavior +4. [Error Model](modular-runtime/error-model.md) and + [Conformance](modular-runtime/conformance.md) for compatibility and release + requirements +5. 
the protocol profile for the module being implemented: + - [MCP Module Profile](modular-runtime/mcp-module.md) + - [A2A Module Profile](modular-runtime/a2a-module.md) + - [LLM Module Profile](modular-runtime/llm-module.md) + - [REST/gRPC Module Profile](modular-runtime/rest-grpc-module.md) + +## Key Decisions + +| Decision | Summary | Source | +|----------|---------|--------| +| Core owns policy; modules own protocol | Auth, RBAC, catalogs, plugins, persistence, and admin UI stay in the core; wire protocol and transport behavior move to modules | This document | +| Process boundary first | Sidecars are the default modular boundary; embedded runtimes are an optimization | This document | +| Default IPC transport | gRPC over Unix Domain Socket is the target-state module-to-core transport; HTTP/JSON remains an explicit fallback | [ADR-044](adr/044-module-communication-protocol.md) | +| Auth remains in core | Modules consume authenticated context; they do not become independent auth authorities | [ADR-045](adr/045-auth-remains-in-core.md) | +| Shared-nothing between modules | Modules do not import or call each other directly; cross-protocol behavior is mediated by the core | [ADR-046](adr/046-shared-nothing-between-modules.md) | +| Incremental migration | The architecture is adopted by refactoring the current system in phases, not by rewrite | [ADR-047](adr/047-incremental-migration-over-rewrite.md) | + +## Current Implemented Precedent + +ContextForge today is primarily a monolithic Python application, but two +existing patterns already prove the modular direction: + +1. **Rust MCP runtime sidecar** + The MCP streamable HTTP public path can run through a Rust sidecar while + Python remains authoritative for auth, token scoping, and RBAC. +2. **External plugin runtimes** + Plugins can already run out of process behind a language-neutral transport. + +These are important precedents, but they are not yet the full target modular +contract. 
+ +In particular, the current Rust MCP runtime is a **transition architecture**: + +- it is a real external runtime +- it proves sidecar deployment, direct ingress, and mode-based rollout +- it still contains performance-oriented implementation details that are more + specific than the long-term generic module boundary + +This document defines the steadier target boundary that future modules should +converge on. + +## Implementation Status + +The modular architecture is no longer purely speculative. One protocol module +is already implemented and validated. + +| Protocol family | Module status | Notes | +|-----------------|---------------|-------| +| MCP | Implemented | Rust MCP runtime sidecar exists today with mode-based rollout and direct-ingress support | +| A2A | Not yet extracted | Current A2A runtime remains embedded in Python | +| LLM | Not yet extracted | Current LLM proxy and chat flows remain embedded in Python | +| REST/gRPC | Not yet extracted | Current virtualization and service-management flows remain embedded in Python | + +The important consequence is that this spec is grounded in a working MCP module +rather than a hypothetical first extraction. + +## Current Precedent vs Target State + +The spec must be explicit about what is implemented today versus what future +modules should target. 
+ +| Topic | Implemented today | Target-state default | +|-------|-------------------|----------------------| +| First extracted runtime | Rust MCP sidecar | Additional protocol modules, potentially in Rust, Go, or Python | +| Sidecar transport to core | Narrow internal HTTP over local/private transport, including UDS or loopback depending on path | gRPC over UDS | +| Fallback transport | HTTP/JSON | HTTP/JSON | +| Ingress ownership | Both valid today: Python-owned ingress and direct Rust ingress depending on mode | Both valid patterns remain acceptable | +| Auth authority | Python core | Core platform | +| Plugin parity | Achieved through a mix of direct core-sensitive handling and selective delegation | Explicit SPI or core-delegation contract | +| Data-path optimizations | Rust MCP keeps targeted fast paths | Allowed, but must preserve contract and rollback behavior | + +## Architecture Principles + +1. **Core owns policy; modules own protocol.** + The core platform owns security, persistence, catalogs, plugins, + configuration, observability, and admin UI. Modules own transport, wire + format, session/runtime semantics, capability negotiation, and upstream + protocol behavior. + +2. **Process boundary first.** + The default modular boundary is a sidecar or sibling process. Embedded + in-process runtimes are allowed where justified, but they are not the + default design center. + +3. **Language-neutral contracts.** + Contracts between the core and modules must not depend on Python object + identity, ORM models, or framework internals. + +4. **Shared-nothing between modules.** + Modules do not import or call one another directly. Cross-protocol behavior + flows through the core. + +5. **Compatibility and rollback first.** + Each extraction step must preserve an operational rollback path. + +6. **Incremental migration over rewrite.** + The existing codebase remains the migration source; tests and behavior + remain the regression oracle. 
+ +## Reference Model + +The following diagram is logical, not strictly physical. A module may sit +behind core-managed routing or may own direct public ingress while still using +the core for policy and catalog decisions. + +```mermaid +flowchart TD + client[Client] + ingress[Ingress / Proxy / TLS termination] + core[Core Platform] + mcp[MCP Module] + a2a[A2A Module] + llm[LLM Module] + rest[REST or gRPC Module] + upstream[Upstream service or core-owned catalog action] + + client --> ingress + ingress --> core + ingress --> mcp + core --> mcp + core --> a2a + core --> llm + core --> rest + mcp --> core + a2a --> core + llm --> core + rest --> core + mcp --> upstream + a2a --> upstream + llm --> upstream + rest --> upstream +``` + +Two ingress patterns are valid: + +1. `client -> ingress -> core -> module` + Use when the core remains the public edge and the module is an internal + runtime behind it. +2. `client -> ingress -> module -> core SPI` + Use when the module owns the public protocol edge directly, as the Rust MCP + runtime already does in `edge` and `full` mode. + +### Responsibilities by Plane + +```mermaid +flowchart LR + subgraph ControlPlane[Core platform control and policy plane] + auth[Authentication and RBAC] + scope[Token scoping and visibility] + catalog[Catalogs and CRUD] + plugin[Plugin policy] + config[Config and secrets] + admin[Admin UI and observability] + end + + subgraph RuntimePlane[Protocol runtime plane] + wire[Wire parsing and serialization] + transport[Transport ownership] + session[Session or task runtime] + caps[Capability negotiation] + upstream[Upstream protocol behavior] + end +``` + +## Core Platform Responsibilities + +The core platform remains the common control plane and policy plane. The table +below is representative, not exhaustive. 
+ +| Responsibility | Notes | +|----------------|-------| +| Authentication | JWT verification, SSO integration, token normalization, revocation checks | +| Authorization | RBAC, team scoping, visibility filtering, deny-path behavior | +| Persistence | Database models, migrations, consistency, ownership metadata | +| Catalogs | Tools, resources, prompts, servers, gateways, agents, providers, and other core-owned records | +| CRUD and admin flows | Registration, update, delete, import/export, admin workflows | +| Plugin policy and configuration | Central plugin config, hook selection, hook execution policy | +| Prompt/completion/roots business services | Prompt rendering policy, completion services, roots services, and other catalog-backed non-wire operations | +| LLM and upstream provider control plane | Provider credentials, model configuration, policy-aware routing metadata | +| gRPC and REST control surfaces | Core-owned registration, exposure metadata, and governance for virtualized services | +| Observability | Traces, logs, metrics, audit signals, support bundles | +| Configuration and secrets | Global config precedence, secret resolution, encryption | +| Cross-protocol routing | Mediate calls between protocol modules through core-owned catalogs and services | +| Admin UI | Platform UI remains core-owned even when runtimes are modularized | + +The core does **not** own protocol wire parsing, protocol transport semantics, +or protocol-specific session state machines once those are extracted into a +module. + +## Protocol Module Responsibilities + +Each protocol module owns protocol-facing runtime behavior for one protocol +family. 
+ +| Responsibility | Example | +|----------------|---------| +| Wire parsing and serialization | MCP JSON-RPC, A2A request envelopes, future LLM request formats | +| Protocol transport | streamable HTTP, SSE, WebSocket, stdio, long-poll, push channels | +| Runtime/session semantics | MCP session lifecycle, A2A task state handling, LLM chat session flow | +| Capability negotiation | MCP `initialize`, A2A capability advertisement, future provider capability declarations | +| Upstream protocol behavior | MCP upstream client pooling, A2A invocation behavior, LLM provider relay logic | +| Protocol-specific health and stats | Runtime-owned counters, transport stats, protocol-specific readiness | + +Modules should not become independent sources of truth for security policy, +catalog ownership, or long-term persistence rules. + +## Module Runtime Contract + +The contract has three parts: + +1. **module identity** +2. **module lifecycle** +3. **core SPI service families** + +Those concrete documents live under [Modular Runtime Specification](modular-runtime/index.md). + +### Module Identity + +Every module should declare a stable descriptor with fields equivalent to: + +- module id +- protocol family +- implementation language +- module version +- supported SPI version(s) +- runtime mode + - embedded + - sidecar +- exposed capabilities +- health and stats endpoints or RPCs + +The exact wire schema is implementation detail. The architectural requirement +is that the core can discover what a module is, what contract version it +supports, and how to talk to it. + +### Module Lifecycle + +Every module should support these lifecycle phases: + +1. **register** + The module is discovered and its descriptor is loaded. +2. **initialize** + The core provides configuration, scoped dependencies, and any required + bootstrap state. +3. **ready** + The module can accept live traffic. +4. **drain** + The module stops accepting new work and lets in-flight work complete. +5. 
**shutdown** + The module releases resources and exits cleanly. + +At minimum, the core must be able to ask a module for: + +- readiness +- liveness +- version and capability metadata +- runtime stats + +### Core SPI Service Families + +The exact API surface will evolve, but the module contract should be organized +around stable service families rather than one-off internal endpoints. + +| Service family | What it provides | +|----------------|------------------| +| Auth and policy | Resolve caller context, validate authenticated identity, check permissions, enforce token-scoped visibility | +| Catalog read and invoke | List, fetch, and invoke tools, resources, prompts, agents, servers, gateways, providers, and related core-owned records through policy-aware services | +| Session and event services | Session lookup, ownership checks, replay/event access where the protocol requires shared session or event semantics | +| Plugin services | Execute or delegate plugin-sensitive pre/post operations under core-owned plugin policy | +| Observability | Trace context propagation, structured logging, audit events, module metrics publication | +| Configuration and secrets | Scoped config delivery, secret references, feature flags, core-provided defaults | +| Admin and health integration | Module stats, health, and optional descriptors the core UI can surface | + +Two constraints are intentionally fixed: + +- the architecture does **not** freeze exact final RPC names yet +- the architecture does **not** require one giant interface; multiple smaller + service definitions are preferred + +## Communication Model + +### Default Transport + +The target-state default module-to-core transport is: + +- **gRPC over Unix Domain Socket** + +Why: + +- language-neutral +- streaming support +- well understood code generation story for Python, Rust, and Go +- suitable for host-local sidecar communication + +This is the target-state default, not a claim about every implemented module +today. 
The current Rust MCP runtime is the main precedent and still uses a +mix of narrow internal HTTP over local/private transport depending on the path. + +### Fallback Transport + +The fallback transport is: + +- **HTTP/JSON over loopback or internal network** + +This is acceptable when: + +- a gRPC toolchain is undesirable +- a runtime only needs request/response behavior +- an operator environment prefers plain HTTP for debugging or policy reasons + +### Embedded Mode + +Embedded modules may bypass serialization and call the same conceptual contract +directly in-process. + +This is an optimization, not a different architecture. + +### No Direct Module-to-Module Calls + +Modules do not import or invoke each other directly. + +Cross-protocol behavior must be mediated by the core. + +Example: + +```mermaid +sequenceDiagram + participant MCP as MCP module + participant Core as Core platform + participant A2A as A2A module + + MCP->>Core: Invoke tool by catalog entry + Core->>Core: Apply auth, visibility, RBAC, plugin policy + Core->>A2A: Dispatch invoke to owning protocol runtime + A2A-->>Core: Structured result + Core-->>MCP: Structured result +``` + +That preserves language independence and keeps routing policy in one place. + +## Security and Trust Model + +The modular architecture does **not** distribute trust equally. + +### Core-Owned Security Responsibilities + +The core remains the source of truth for: + +- authentication +- token scoping +- RBAC +- secret storage and decryption +- rate limiting policy +- audit and security logging + +Modules may enforce the outcome of a core decision, but they do not become +independent security authorities. 
+ +### What Modules Receive + +Modules should receive: + +- a typed authenticated context +- permission decisions or permission-check APIs +- scoped resource visibility through catalog calls + +Modules should **not** be expected to: + +- interpret raw JWT claims as the source of truth +- fetch and decrypt stored credentials +- invent their own team-scoping semantics + +### Trust Boundary for Sidecars + +Sidecars must communicate with the core over a trusted local or private +channel. The deployment mechanism may vary, but the architectural +requirements are: + +- the core can authenticate the module channel +- arbitrary external clients cannot call privileged core-internal module APIs +- channel permissions or network policy are explicit + +## Cross-Protocol Mediation + +ContextForge already has cross-protocol behaviors: + +- A2A agents exposed as MCP tools +- LLM chat invoking MCP tools +- REST and gRPC services exposed as virtual servers or tools + +In the modular architecture, those behaviors stay possible, but the routing +belongs to the core. + +The core is responsible for: + +- deciding which catalog entry is being invoked +- determining the owning protocol/runtime +- applying policy, plugin rules, and observability +- dispatching to the appropriate module + +The key consequence is that modules remain isolated, while the product keeps a +single coherent governance model. + +## Plugin Model + +Plugins remain a core-owned concern. + +That means: + +- plugin configuration stays centralized +- the core defines which hooks run +- modules must preserve plugin parity on plugin-sensitive flows + +There are two acceptable implementation patterns: + +1. the module explicitly calls a core plugin SPI around the relevant operation +2. the module delegates a plugin-sensitive flow back to the core when parity + requires it + +This keeps plugin behavior consistent even when the fast path moves into a +different language. 
+ +## Deployment Patterns + +The architecture supports three deployment patterns. + +### 1. Monolithic / Embedded + +The core and modules run in one process. + +Use when: + +- minimizing operational complexity +- migrating incrementally +- performance-sensitive in-process execution is justified + +### 2. Hybrid + +Some protocols remain embedded while others move into sidecars. + +This is the current precedent with the Rust MCP runtime: + +- Python remains the core +- MCP may run through a Rust sidecar +- A2A and other runtime paths remain embedded in Python + +### 3. Full Sidecar Model + +Multiple protocol runtimes run as separate processes, possibly in different +languages, while the core remains the shared control plane. + +This is the long-term extensibility model for future A2A, LLM, and REST/gRPC +modules. + +## Configuration Model + +Configuration remains layered and core-owned. + +The architecture should distinguish: + +- **core-global settings** + Shared platform settings such as auth, database, Redis, plugin config, and + observability. +- **module-scoped settings** + Protocol-specific runtime settings such as protocol version behavior, + transport tuning, or runtime-specific timeouts. + +Module-scoped settings should use explicit namespacing and should be delivered +through the module runtime contract rather than by relying on unrestricted +global process imports. + +## Health, Failure, and Fallback + +Every module should define: + +- how it reports readiness and liveness +- how it reports degraded mode +- what happens if the core becomes unavailable +- what happens if the module becomes unavailable +- whether traffic can fall back to an embedded or legacy path + +This is especially important for incremental rollout. + +The current Rust MCP runtime already demonstrates this pattern through +mode-based rollout and rollback. Future modules should preserve the same +operational discipline. 
+ +## Testing and Release Requirements + +Every protocol module should be expected to prove: + +- contract compatibility with the core SPI +- protocol conformance for its protocol surface +- security deny paths +- fallback and rollback behavior +- plugin parity for plugin-sensitive flows +- performance and degradation characteristics appropriate to the protocol + +Where a module introduces deployment-specific behavior, release validation +should also cover: + +- compose or local stack validation +- Kubernetes or Helm validation where applicable +- upgrade and migration compatibility where applicable + +The concrete target-state test matrix is defined in +[Conformance](modular-runtime/conformance.md). + +## Migration Strategy + +The migration is intentionally phased. + +### Phase 0: Extract seams inside the monolith + +Create clearer boundaries inside the current Python code: + +- isolate protocol dispatch +- isolate policy and catalog boundaries +- reduce direct cross-service coupling where practical + +### Phase 1: Define the core SPI + +Define the first stable internal service families between core and modules. + +At this stage, modules may still be embedded. + +### Phase 2: Wrap existing runtimes behind module lifecycles + +Make protocol runtimes conform to a common lifecycle and capability model even +before all traffic crosses an IPC boundary. + +### Phase 3: Move selected runtimes to sidecars + +Use sidecars where the performance, isolation, or language goals justify it. +The current Rust MCP runtime is the first concrete example of this phase. + +### Phase 4: Add new protocol runtimes + +Introduce new A2A, LLM, and REST/gRPC runtimes behind the same architectural +contract. 
+ +### Phase 5: Optimize + +Only after the boundary is stable should the implementation optimize for: + +- direct hot paths +- embedded fast paths +- selective caching and event-stream ownership + +## What Is Decided vs What Is Still Open + +### Decided in principle + +- ContextForge should evolve toward a core-plus-modules runtime model. +- The core remains the policy and control plane. +- Modules are language-agnostic and process-boundary first. +- Shared-nothing between modules is a design rule. +- Incremental migration is the preferred path. + +### Still intentionally open + +- exact final SPI RPC names +- exact protobuf package layout +- exact module descriptor wire schema +- whether all plugin hooks are always explicit SPI calls versus selective core + delegation for parity-sensitive flows +- how much direct data-path optimization a module may keep before it must be + expressed through the generic SPI + +## Open Questions + +- What is the minimal first stable SPI version that supports both MCP and A2A + without overfitting to either? +- Which cross-module events deserve an event bus rather than synchronous + core-mediated routing? +- How should optional protocol surfaces be classified in release gating versus + follow-up compatibility work? +- What is the right balance between generic SPI purity and targeted fast paths + for performance-sensitive runtimes? 
+ +## Related Documents + +- [Modular Runtime Specification](modular-runtime/index.md) +- [Rust MCP Runtime](rust-mcp-runtime.md) +- [ADR-043: Rust MCP Runtime Sidecar with Mode-Based Rollout](adr/043-rust-mcp-runtime-sidecar-mode-model.md) +- [ADR-044: Module Communication Protocol](adr/044-module-communication-protocol.md) +- [ADR-045: Authentication and Authorization Remain in Core](adr/045-auth-remains-in-core.md) +- [ADR-046: Shared-Nothing Between Protocol Modules](adr/046-shared-nothing-between-modules.md) +- [ADR-047: Incremental Migration Over Rewrite](adr/047-incremental-migration-over-rewrite.md) +- [ADR-019: Modular Architecture Split (14 Independent Modules)](adr/019-modular-architecture-split.md) +- [Multitenancy](multitenancy.md) +- [OAuth Design](oauth-design.md) +- [Plugin Framework](plugins.md) diff --git a/docs/docs/architecture/modular-runtime/.pages b/docs/docs/architecture/modular-runtime/.pages new file mode 100644 index 0000000000..f7862155f3 --- /dev/null +++ b/docs/docs/architecture/modular-runtime/.pages @@ -0,0 +1,12 @@ +title: Modular Runtime Specification +nav: + - Overview: index.md + - Core SPI: core-spi.md + - Module Descriptor: module-descriptor.md + - Module Lifecycle: module-lifecycle.md + - Error Model: error-model.md + - Conformance: conformance.md + - MCP Module Profile: mcp-module.md + - A2A Module Profile: a2a-module.md + - LLM Module Profile: llm-module.md + - REST-gRPC Module Profile: rest-grpc-module.md diff --git a/docs/docs/architecture/modular-runtime/a2a-module.md b/docs/docs/architecture/modular-runtime/a2a-module.md new file mode 100644 index 0000000000..7468edee6c --- /dev/null +++ b/docs/docs/architecture/modular-runtime/a2a-module.md @@ -0,0 +1,85 @@ +# A2A Module Profile + +This profile defines how a future A2A module should map onto the current +ContextForge A2A surface. + +## Current Surface + +Today the A2A HTTP surface is embedded in `main.py` and uses the core service +layer directly. 
+ +Current live endpoints include: + +- `GET /a2a` and `GET /a2a/` for list +- `GET /a2a/{agent_id}` for fetch +- `POST /a2a/{agent_name}/invoke` for invoke + +CRUD endpoints also exist today, but they are core-owned admin operations and +should remain there in the modular design. + +The persisted A2A record already contains the fields a module will depend on: + +- endpoint URL +- protocol version +- capability or config metadata +- auth configuration +- team, owner, and visibility +- associated MCP tool linkage where the agent is exposed cross-protocol + +## What the A2A Module Owns + +The module should own: + +- A2A request parsing and response serialization +- protocol-specific discovery and read surface for agents +- invoke envelope construction and normalization +- outbound A2A transport behavior to target agents +- protocol-specific retries, timeouts, and future streaming or push behavior +- task or runtime state handling where A2A requires it +- protocol-specific metrics and runtime health + +## What Stays in Core + +The core should continue to own: + +- agent CRUD and persistence +- auth and token normalization +- RBAC and visibility filtering +- encrypted auth and OAuth secret storage +- ownership and mutation checks +- cross-protocol exposure of A2A agents as MCP tools + +That last point is important: if an A2A agent is exposed as an MCP tool, the +core still mediates that cross-protocol bridge. 
+ +## Required Policy Semantics + +The A2A module must preserve current product semantics: + +- token scoping remains separate from RBAC +- public-only tokens can only see public records +- team visibility uses normalized token team state +- admin bypass semantics come from the core, not from local JWT parsing +- hidden or inaccessible agents may intentionally use not-found semantics +- feature-flagged query-parameter auth remains a core-governed exception, not a + module-defined bypass + +## Required SPI Usage + +At minimum, an A2A module needs: + +- `AuthPolicyService` +- `CatalogService` for agent discovery and invoke +- `PluginService` for any parity-sensitive A2A hooks +- `ObservabilityService` +- `ConfigSecretsService` for module-scoped transport or timeout settings + +## Conformance Additions + +An A2A module should additionally prove: + +- invoke deny paths for wrong team, wrong owner, and public-only tokens +- correct handling of agent visibility modes +- correct propagation of outbound auth without exposing stored secrets +- correct cross-protocol behavior when an A2A agent is invoked through the MCP + tool bridge diff --git a/docs/docs/architecture/modular-runtime/conformance.md b/docs/docs/architecture/modular-runtime/conformance.md new file mode 100644 index 0000000000..a98ab810eb --- /dev/null +++ b/docs/docs/architecture/modular-runtime/conformance.md @@ -0,0 +1,88 @@ +# Conformance + +Every new protocol module should prove the same categories of correctness +before it is considered release-ready. + +## Minimum Required Gates + +### 1. Contract Compatibility + +The module must prove: + +- descriptor compatibility +- lifecycle compatibility +- SPI version negotiation +- correct startup failure on incompatible SPI + +### 2. 
Security and Policy + +The module must prove: + +- unauthenticated deny paths +- wrong-team deny paths +- insufficient-permission deny paths +- hidden-resource not-found behavior where the product requires it +- trusted-channel behavior for sidecar-only core APIs + +### 3. Protocol Correctness + +The module must prove: + +- required protocol surfaces +- capability negotiation +- correct optional-surface behavior +- stable request and response shapes +- structured error handling + +### 4. Plugin Parity + +The module must prove plugin-sensitive flows still behave correctly. + +For a protocol module, this means: + +- explicitly exercising active plugins, not only plugin-disabled stacks +- proving both the normal path and the parity-sensitive path +- documenting any remaining delegated or unsupported hooks + +### 5. Rollback and Degradation + +The module must prove: + +- health reporting +- degraded-state reporting +- rollback or fallback path +- safe failure when the core is unavailable + +### 6. Performance + +The module must prove: + +- no unacceptable regression on the intended hot paths +- no correctness failures under representative load +- no hidden bypass of policy or plugin behavior in the fast path + +## Environment Matrix + +At minimum, release validation should cover: + +- local or compose deployment +- the intended production deployment mode +- upgrade and migration behavior where the module changes deployment structure + +If the release story includes Helm or Kubernetes, that must be validated too. 
+ +## Suggested Evidence + +- focused unit tests +- live stack-backed E2E tests +- plugin parity tests +- protocol compliance suite where one exists +- benchmark or load sanity checks + +## Protocol Profiles + +Each protocol profile adds its own required checks: + +- [A2A Module Profile](a2a-module.md) +- [LLM Module Profile](llm-module.md) +- [REST/gRPC Module Profile](rest-grpc-module.md) diff --git a/docs/docs/architecture/modular-runtime/core-spi.md b/docs/docs/architecture/modular-runtime/core-spi.md new file mode 100644 index 0000000000..384daed937 --- /dev/null +++ b/docs/docs/architecture/modular-runtime/core-spi.md @@ -0,0 +1,291 @@ +# Core SPI + +This document defines the target-state service families between the core +platform and a protocol module. + +The preferred transport is gRPC over UDS. During transition, HTTP/JSON over a +trusted local channel is also acceptable. The information model below is what +matters. + +## Design Rules + +- Modules do not read the database directly as their primary source of truth. +- Modules do not interpret raw JWT claims as authoritative policy. +- Modules do not fetch or decrypt stored credentials directly. +- Modules call the core for policy-sensitive catalog access. +- Modules may keep protocol-local caches, but cache invalidation still follows + core-owned rules. + +## Service Families + +### Suggested First-Cut IDL Package Layout + +The architecture does not freeze final generated package names, but a new +module should assume a layout equivalent to: + +- `core.spi.auth.v1` +- `core.spi.catalog.v1` +- `core.spi.plugin.v1` +- `core.spi.session.v1` +- `core.spi.config.v1` +- `core.spi.observability.v1` + +This is a useful planning baseline for a Rust A2A module or a Go LLM proxy +module even if the exact final packages evolve. + +### AuthPolicyService + +Provides authenticated context and permission decisions. 
+ +Required operations: + +- `ResolveCaller` +- `CheckPermission` +- `CheckCatalogAccess` +- `ValidateSessionBinding` + +Illustrative request and response shapes: + +```json +{ + "resolveCallerRequest": { + "transport": "streamable_http", + "headers": {"authorization": "Bearer ..."}, + "clientIp": "203.0.113.10", + "requestedServerId": "server-123" + } +} +``` + +```json +{ + "authenticatedContext": { + "subject": { + "userEmail": "alice@example.com", + "isAdmin": false, + "tokenTeams": ["team-alpha"] + }, + "visibilityScope": { + "serverId": "server-123", + "permissions": ["tools.read", "resources.read"], + "ipRestrictions": [], + "timeRestrictions": {} + }, + "trace": { + "requestId": "req-123", + "correlationId": "corr-456" + } + } +} +``` + +The important invariant is semantic, not syntactic: + +- `tokenTeams = null` and `isAdmin = true` means unrestricted admin context +- `tokenTeams = []` means public-only visibility +- team membership and visibility must use the same normalization as the core + +### CatalogService + +Provides policy-aware access to core-owned records. + +Required operation classes: + +- list records +- fetch one record +- invoke a record-backed action +- subscribe to record-change streams where the protocol needs them + +Representative entity families: + +- tools +- resources +- prompts +- agents +- servers +- gateways +- LLM providers and models +- roots + +Illustrative list request: + +```json +{ + "listCatalogRequest": { + "entityType": "prompt", + "serverId": "server-123", + "authenticatedContextRef": "ctx-abc", + "filters": { + "activeOnly": true + } + } +} +``` + +Illustrative invoke request: + +```json +{ + "invokeCatalogRequest": { + "entityType": "tool", + "entityId": "tool-123", + "serverId": "server-123", + "authenticatedContextRef": "ctx-abc", + "arguments": { + "timezone": "UTC" + } + } +} +``` + +### PluginService + +Modules must preserve plugin parity on plugin-sensitive flows. + +Two allowed patterns: + +1. 
explicit hook execution through the SPI +2. full delegation of a parity-sensitive flow back to the core + +Required hook classes: + +- pre-fetch +- post-fetch +- pre-invoke +- post-invoke +- request or response mutation where the product already supports it + +Illustrative hook call: + +```json +{ + "executeHookRequest": { + "hook": "resource_post_fetch", + "entityType": "resource", + "entityName": "time://formats", + "serverId": "server-123", + "authenticatedContextRef": "ctx-abc", + "payload": { + "contents": [{"uri": "time://formats", "mimeType": "text/plain", "text": "UTC"}] + } + } +} +``` + +### SessionEventService + +Needed for protocols with shared session or task state. + +Required when the protocol needs: + +- stable session ownership +- replay or resume +- distributed event history +- ownership validation across workers + +Representative operations: + +- `CreateSession` +- `GetSession` +- `ValidateSessionOwner` +- `AppendEvent` +- `ReplayEvents` +- `DeleteSession` + +### ConfigSecretsService + +Provides module-scoped configuration and secret references. + +Required capabilities: + +- get module config +- resolve core-managed feature flags +- resolve secret references to a usable form without exposing unrelated secrets + +Modules should receive only the settings they need, not a whole-process +configuration dump. + +### ObservabilityService + +Provides structured platform integration. + +Required capabilities: + +- emit structured logs +- publish counters and histograms +- attach trace context +- emit audit events + +Modules may expose protocol-local metrics, but the core remains the system of +record for shared operational visibility. 
+ +## Minimum Service-Family Matrix + +| Module family | Required service families | Usually optional | +|---------------|---------------------------|------------------| +| MCP | AuthPolicy, Catalog, Plugin, SessionEvent, Observability, ConfigSecrets | Additional module-local optimizations | +| A2A | AuthPolicy, Catalog, Observability, ConfigSecrets | Plugin, SessionEvent | +| LLM | AuthPolicy, Catalog, Observability, ConfigSecrets | Plugin, SessionEvent | +| REST/gRPC | AuthPolicy, Catalog, Observability, ConfigSecrets | Plugin, SessionEvent | + +## Authenticated Context + +Every SPI call that depends on caller identity should carry either: + +- a full authenticated context +- a short-lived authenticated-context reference issued by the core + +The minimum fields are: + +- user identity +- admin status +- normalized token team state +- effective server scope if one is already known +- permission or scope restrictions attached to the token +- request and trace correlation identifiers + +## Invocation Envelope + +All invoke-style operations should preserve the same conceptual envelope: + +- target record +- effective server or gateway context +- authenticated context reference +- input arguments +- trace metadata +- optional delegation hints + +That allows a Rust A2A module and a Go LLM module to call the same core +services without inventing a protocol-specific policy seam. 
+ +## Typical Flow + +```mermaid +sequenceDiagram + participant Client + participant Module + participant Core + participant Upstream + + Client->>Module: protocol request + Module->>Core: ResolveCaller + Core-->>Module: AuthenticatedContext + Module->>Core: CheckCatalogAccess / InvokeCatalogAction + Core-->>Module: Policy-approved target and action result + Module->>Upstream: protocol-specific outbound call if needed + Upstream-->>Module: upstream result + Module->>Core: ExecuteHook or emit audit event + Module-->>Client: protocol response +``` + +## Versioning + +The SPI must be explicitly versioned. + +Rules: + +- the core declares supported SPI versions +- the module declares supported SPI versions +- incompatible versions fail at startup +- additive changes are preferred +- protocol capability negotiation is separate from SPI version negotiation diff --git a/docs/docs/architecture/modular-runtime/error-model.md b/docs/docs/architecture/modular-runtime/error-model.md new file mode 100644 index 0000000000..fac25fa23b --- /dev/null +++ b/docs/docs/architecture/modular-runtime/error-model.md @@ -0,0 +1,78 @@ +# Error Model + +Modules in different languages must still present a coherent failure model to +the core and to clients. 
+ +## Canonical Error Categories + +| Category | Meaning | +|----------|---------| +| `INVALID_ARGUMENT` | Client supplied malformed or semantically invalid input | +| `UNAUTHENTICATED` | Caller identity could not be established | +| `PERMISSION_DENIED` | Caller is authenticated but not allowed | +| `NOT_FOUND` | Resource intentionally absent or hidden | +| `CONFLICT` | Request conflicts with current state | +| `FAILED_PRECONDITION` | State is valid but not ready for this operation | +| `RATE_LIMITED` | Policy denied due to rate or quota | +| `UNSUPPORTED` | Optional feature or method is not supported | +| `UNAVAILABLE` | Core, module, or upstream dependency is temporarily unavailable | +| `UPSTREAM_ERROR` | Upstream protocol peer failed | +| `INTERNAL` | Unexpected internal failure | + +## Required Error Envelope + +Every structured module error should include: + +- canonical category +- stable machine-readable code +- human-readable message safe for clients +- origin + - `module` + - `core` + - `plugin` + - `upstream` +- retryability hint +- trace or correlation id when available + +Example: + +```json +{ + "error": { + "category": "PERMISSION_DENIED", + "code": "a2a.invoke.denied", + "message": "Access denied", + "origin": "core", + "retryable": false, + "traceId": "trace-123" + } +} +``` + +## Safety Rules + +- Do not expose stack traces to clients. +- Do not expose raw `err.to_string()` data from internal libraries on public + paths. +- Hide existence where the current product intentionally uses not-found + semantics for protected records. +- Preserve protocol-correct error mapping where the protocol defines it. 
+ +## Mapping Guidance + +| Canonical category | HTTP | gRPC | +|-------------------|------|------| +| `INVALID_ARGUMENT` | `400` | `INVALID_ARGUMENT` | +| `UNAUTHENTICATED` | `401` | `UNAUTHENTICATED` | +| `PERMISSION_DENIED` | `403` | `PERMISSION_DENIED` | +| `NOT_FOUND` | `404` | `NOT_FOUND` | +| `CONFLICT` | `409` | `ALREADY_EXISTS` or `ABORTED` | +| `FAILED_PRECONDITION` | `412` or `400` | `FAILED_PRECONDITION` | +| `RATE_LIMITED` | `429` | `RESOURCE_EXHAUSTED` | +| `UNSUPPORTED` | `400`, `404`, or protocol-specific unsupported response | `UNIMPLEMENTED` | +| `UNAVAILABLE` | `503` | `UNAVAILABLE` | +| `UPSTREAM_ERROR` | `502` | `UNKNOWN` or mapped upstream status | +| `INTERNAL` | `500` | `INTERNAL` | + +Protocol-specific documents may add more precise mappings, but they must not +break these semantics. diff --git a/docs/docs/architecture/modular-runtime/index.md b/docs/docs/architecture/modular-runtime/index.md new file mode 100644 index 0000000000..c6f5c034b7 --- /dev/null +++ b/docs/docs/architecture/modular-runtime/index.md @@ -0,0 +1,66 @@ +# Modular Runtime Specification + +This section turns the [Modular Runtime Architecture](../modular-design.md) +into an implementation-oriented specification that another team can use to +build a protocol module in Rust, Go, or Python. + +The intent is not to freeze every future protobuf field today. The intent is +to define the minimum contract surface clearly enough that: + +- the existing Rust MCP module can be understood as the reference implementation +- a Rust A2A module can be implemented without re-designing the trust model +- a Go LLM proxy module can be implemented without guessing where policy lives +- a REST or gRPC module can be implemented without inventing a different + lifecycle or error model + +## Reading Order + +1. [Core SPI](core-spi.md) +2. [Module Descriptor](module-descriptor.md) +3. [Module Lifecycle](module-lifecycle.md) +4. [Error Model](error-model.md) +5. [Conformance](conformance.md) +6. 
the protocol profile that matches the module being implemented + - [MCP Module Profile](mcp-module.md) + - [A2A Module Profile](a2a-module.md) + - [LLM Module Profile](llm-module.md) + - [REST/gRPC Module Profile](rest-grpc-module.md) + +## Contract Status + +This spec set is **normative at the architecture level**: + +- the boundaries are intended +- the ownership rules are intended +- the lifecycle and required fields are intended + +It is **illustrative at the wire-schema level**: + +- example JSON and proto-like structures define the required information model +- final generated bindings can still evolve as long as they preserve those + semantics + +## Implemented Precedent + +The first implemented precedent is the +[Rust MCP Runtime](../rust-mcp-runtime.md). + +That precedent proves: + +- a protocol runtime can move out of Python +- a module can own direct public ingress +- the core can remain authoritative for auth, token scoping, and RBAC +- plugin parity and rollback can still be preserved + +It does **not** mean that every future module must copy the exact current Rust +MCP seam. The target-state contracts in this section are slightly more generic +than the current implementation. + +## Status by Protocol Family + +| Protocol family | Status | +|-----------------|--------| +| MCP | Implemented as a Rust sidecar/runtime path | +| A2A | Planned against this spec | +| LLM | Planned against this spec | +| REST/gRPC | Planned against this spec | diff --git a/docs/docs/architecture/modular-runtime/llm-module.md b/docs/docs/architecture/modular-runtime/llm-module.md new file mode 100644 index 0000000000..e0e34ce87c --- /dev/null +++ b/docs/docs/architecture/modular-runtime/llm-module.md @@ -0,0 +1,82 @@ +# LLM Module Profile + +This profile defines how a future LLM proxy or chat module should map onto the +current ContextForge LLM surfaces. 
+ +## Current Surface + +Today there are two main LLM-facing surfaces: + +- **OpenAI-compatible proxy** + - `POST /chat/completions` + - `GET /models` +- **Session-oriented chat** + - `/llmchat/connect` + - `/llmchat/chat` + - `/llmchat/disconnect` + - `/llmchat/status/{user_id}` + - `/llmchat/config/{user_id}` + - `/llmchat/gateway/models` + +Those surfaces are currently implemented through Python routers and services. + +The important split is that ContextForge already has both: + +- a direct OpenAI-compatible proxy surface +- a higher-level chat surface that coordinates models, servers, and session + state + +## What the LLM Module Owns + +A future LLM module should own: + +- request parsing for OpenAI-compatible and session-style chat surfaces +- streaming transport behavior +- provider relay runtime behavior +- chat-session orchestration and protocol-local session state +- provider-specific retries, deadlines, and streaming normalization +- protocol-local metrics and runtime health + +## What Stays in Core + +The core should continue to own: + +- provider and model registry CRUD +- provider credentials and secret handling +- auth, RBAC, and token-scope policy +- model visibility and governance +- prompt, tool, and resource catalogs +- plugin policy +- admin UI and provider-management workflows +- any shared governance around which virtual servers or model records are + exposed to which callers + +## Required SPI Usage + +A future LLM module will typically require: + +- `AuthPolicyService` +- `CatalogService` for model lookup and MCP-facing resource access +- `PluginService` where chat or provider flows become plugin-sensitive +- `ObservabilityService` +- `ConfigSecretsService` +- `SessionEventService` if shared chat-session semantics are extracted + +## Cross-Protocol Constraint + +If the LLM module can call MCP tools or prompts, it must not call another +module directly. 
The core still decides: + +- what catalog entry is being invoked +- what protocol owns it +- what policy and plugin rules apply + +## Conformance Additions + +An LLM module should additionally prove: + +- non-streaming and streaming parity +- model visibility and deny paths +- provider-auth failure handling without leaking sensitive details +- correct cross-protocol invocation when chat flows reach MCP-backed tools or + prompts diff --git a/docs/docs/architecture/modular-runtime/mcp-module.md b/docs/docs/architecture/modular-runtime/mcp-module.md new file mode 100644 index 0000000000..8017b09eb2 --- /dev/null +++ b/docs/docs/architecture/modular-runtime/mcp-module.md @@ -0,0 +1,85 @@ +# MCP Module Profile + +This profile maps the implemented Rust MCP module onto the modular runtime +specification and defines what future MCP implementations should preserve. + +## Current Status + +MCP is the first implemented protocol module in ContextForge. + +The current implementation is the +[Rust MCP Runtime](../rust-mcp-runtime.md), which already proves: + +- sidecar deployment +- direct public ingress in `edge` and `full` mode +- core-owned auth, token scoping, and RBAC +- plugin parity on validated flows +- rollback through mode-based rollout + +## What the MCP Module Owns + +The MCP module owns: + +- MCP wire parsing and serialization +- transport behavior for streamable HTTP and related protocol edge behavior +- session lifecycle and capability negotiation +- replay, resume, and live-stream runtime behavior where enabled +- protocol-specific upstream MCP client behavior +- protocol-specific health and stats + +## What Stays in Core + +The core continues to own: + +- authentication and token normalization +- RBAC and visibility filtering +- core-owned catalogs for tools, resources, prompts, servers, and gateways +- plugin configuration and policy +- admin UI and platform observability +- cross-protocol mediation + +## Current Implemented Seam vs Target-State Seam + +The 
current Rust MCP module is the reference implementation, but it is still a +transition architecture in one important respect: + +- implemented today: + - trusted internal HTTP over UDS or loopback on some seams +- target-state default: + - gRPC over UDS for the core SPI + +That difference is acceptable. The current module proves the boundary; the +target-state SPI documents how future modules should converge. + +## Required Invariants + +Any MCP module, including the existing Rust one, must preserve: + +- core-owned auth and RBAC authority +- session ownership and isolation +- plugin parity on plugin-sensitive flows +- rollback and degraded-mode safety +- no direct module-to-module calls for cross-protocol behavior + +## Required SPI Usage + +An MCP module requires: + +- `AuthPolicyService` +- `CatalogService` +- `PluginService` +- `SessionEventService` +- `ObservabilityService` +- `ConfigSecretsService` + +## Release Expectations + +An MCP module should be held to the strongest conformance bar because it is the +first extracted runtime and the precedent for later modules. + +That means: + +- live stack-backed protocol tests +- deny-path and isolation tests +- plugin parity tests +- benchmark validation on the intended hot paths diff --git a/docs/docs/architecture/modular-runtime/module-descriptor.md b/docs/docs/architecture/modular-runtime/module-descriptor.md new file mode 100644 index 0000000000..b8bcb40472 --- /dev/null +++ b/docs/docs/architecture/modular-runtime/module-descriptor.md @@ -0,0 +1,110 @@ +# Module Descriptor + +Every protocol module must expose a stable descriptor that the core can use for +discovery, compatibility checks, health integration, and release validation. 
+ +## Required Fields + +| Field | Meaning | +|-------|---------| +| `moduleId` | Stable module identifier, for example `mcp-rust-runtime` | +| `protocolFamily` | One of `mcp`, `a2a`, `llm`, `rest-grpc`, or a future family | +| `implementationLanguage` | `python`, `rust`, `go`, or another language identifier | +| `moduleVersion` | Module build or release version | +| `spiVersions` | Supported core SPI versions | +| `runtimeModes` | Supported runtime modes such as `embedded`, `sidecar` | +| `ingressModes` | Whether the module can run behind core routing, direct public ingress, or both | +| `capabilities` | Declared protocol and runtime capabilities | +| `health` | How health and readiness are queried | +| `stats` | Optional runtime metrics surface | +| `pluginParity` | Which plugin-sensitive flows are fully supported, delegated, or not yet supported | +| `fallbackStrategy` | Whether rollback to legacy or embedded path exists | + +## Example Descriptor + +```json +{ + "moduleId": "a2a-rust-runtime", + "protocolFamily": "a2a", + "implementationLanguage": "rust", + "moduleVersion": "0.1.0", + "spiVersions": ["v1alpha1"], + "runtimeModes": ["sidecar"], + "ingressModes": ["core-routed"], + "capabilities": { + "discovery": true, + "invoke": true, + "taskState": true, + "streaming": false, + "pushNotifications": false + }, + "health": { + "readiness": "grpc", + "liveness": "grpc" + }, + "pluginParity": { + "preInvoke": "delegate", + "postInvoke": "delegate" + }, + "fallbackStrategy": { + "supportsRollback": true, + "fallbackPath": "python-core" + } +} +``` + +Second illustrative example for a Go LLM proxy module: + +```json +{ + "moduleId": "llm-go-proxy", + "protocolFamily": "llm", + "implementationLanguage": "go", + "moduleVersion": "0.1.0", + "spiVersions": ["v1alpha1"], + "runtimeModes": ["sidecar"], + "ingressModes": ["core-routed"], + "capabilities": { + "chatCompletions": true, + "streaming": true, + "sessionChat": true, + "providerRelay": true + } +} +``` + +## 
Capability Taxonomy + +Capabilities should be declarative, not inferred from language or module name. + +Recommended categories: + +- ingress +- transport +- request or response streaming +- session or task state +- replay or resume +- subscriptions +- prompt rendering +- resource reads +- tool or agent invocation +- provider relay +- plugin parity support + +## Descriptor Rules + +- The descriptor must be available before live traffic. +- Capabilities must be honest. Unsupported optional protocol surfaces must be + declared as unsupported, not silently dropped. +- The descriptor must be sufficient for the core to decide: + - whether the module can be started + - whether a given deployment mode is valid + - whether the module satisfies release policy for the protocol family + +## Protocol-Specific Notes + +- A Rust A2A module should declare task-state and invoke support explicitly. +- A Go LLM proxy module should declare both chat-completion and streaming + support explicitly. +- A REST or gRPC module should declare whether it owns reflection, OpenAPI + import, or only invocation relay. diff --git a/docs/docs/architecture/modular-runtime/module-lifecycle.md b/docs/docs/architecture/modular-runtime/module-lifecycle.md new file mode 100644 index 0000000000..0419239bb5 --- /dev/null +++ b/docs/docs/architecture/modular-runtime/module-lifecycle.md @@ -0,0 +1,87 @@ +# Module Lifecycle + +Every module must support the same lifecycle phases, regardless of language. + +## Lifecycle Phases + +1. **register** + The core discovers the module and reads its descriptor. +2. **initialize** + The core provides module-scoped configuration, trust material, and SPI + connection information. +3. **ready** + The module is healthy and can accept live traffic. +4. **drain** + The module stops accepting new work and lets in-flight work complete. +5. **shutdown** + The module releases resources and exits cleanly. 
+ +## Lifecycle Sequence + +```mermaid +sequenceDiagram + participant Core + participant Module + + Core->>Module: register / descriptor query + Module-->>Core: descriptor + Core->>Module: initialize(config, spi, trust) + Module-->>Core: initialized + Core->>Module: readiness probe + Module-->>Core: ready + Note over Core,Module: live traffic + Core->>Module: drain + Module-->>Core: draining + Core->>Module: shutdown + Module-->>Core: stopped +``` + +## Initialize Payload + +The initialize payload should include: + +- module-scoped configuration +- supported SPI version selected by the core +- how to reach the core SPI +- trace and observability configuration +- any trusted channel or module authentication material +- deployment mode +- explicit fallback expectations + +It should not include unrestricted access to the core configuration model. + +## Readiness Semantics + +A module is not ready merely because the process is listening. + +Ready means: + +- descriptor is loaded +- configuration was accepted +- SPI compatibility was established +- any required warmup completed +- the module can enforce required deny paths safely + +## Drain Semantics + +Drain should: + +- reject new live traffic +- keep ownership checks and in-flight responses correct +- preserve resumable or replayable state where the protocol requires it +- expose a clear draining status to the core + +## Failure Rules + +- If SPI compatibility fails, startup must fail before traffic. +- If the core becomes unavailable, the module must report degraded state. +- If the module cannot preserve protocol correctness safely, it must fail + closed or trigger rollback rather than continue in a partial-trust mode. 
+ +## Rollback Requirement + +Every production-facing extracted module should document: + +- whether rollback to legacy or embedded path exists +- how rollback is triggered +- what state must be preserved during rollback diff --git a/docs/docs/architecture/modular-runtime/rest-grpc-module.md b/docs/docs/architecture/modular-runtime/rest-grpc-module.md new file mode 100644 index 0000000000..2d833428ff --- /dev/null +++ b/docs/docs/architecture/modular-runtime/rest-grpc-module.md @@ -0,0 +1,63 @@ +# REST/gRPC Module Profile + +This profile defines how a future REST or gRPC module should map onto the +current virtualized service surfaces. + +## Current Surface + +Today ContextForge can: + +- expose REST-backed tools and virtual servers +- register and manage gRPC services +- use OpenAPI import or reflection-style discovery to create gateway-managed + records + +This is still largely core-owned today. + +That means a future REST/gRPC module is more likely to be a runtime extraction +than a greenfield subsystem. The registration and governance model already +exists in the core. + +## What the REST/gRPC Module Owns + +A future REST/gRPC module should own: + +- protocol-specific outbound transport behavior +- reflection or discovery runtime behavior where enabled +- protocol-specific request and response normalization +- streaming semantics where the underlying protocol supports them +- runtime metrics, health, and deadlines + +## What Stays in Core + +The core should continue to own: + +- service registration and persistence +- visibility, ownership, and governance policy +- generated tool, prompt, or resource catalog records +- auth, RBAC, and token scoping +- secret storage and TLS material governance +- cross-protocol exposure into MCP or other front-door protocols + +In other words, the module owns protocol behavior, not the registry of record. 
+ +## Required SPI Usage + +At minimum, a REST/gRPC module will usually require: + +- `AuthPolicyService` +- `CatalogService` +- `ObservabilityService` +- `ConfigSecretsService` +- optionally `PluginService` if response mutation or policy hooks are required + +## Conformance Additions + +A REST/gRPC module should additionally prove: + +- SSRF and target-validation rules remain enforced +- TLS and metadata handling preserve the current trust model +- reflection or OpenAPI-derived surfaces do not bypass core visibility or + ownership rules +- virtualized service behavior remains consistent when surfaced through MCP or + another protocol diff --git a/docs/docs/architecture/performance-architecture.md b/docs/docs/architecture/performance-architecture.md index 01f2ef2e77..684dd5a7d4 100644 --- a/docs/docs/architecture/performance-architecture.md +++ b/docs/docs/architecture/performance-architecture.md @@ -169,77 +169,63 @@ This diagram showcases the performance-optimized architecture of ContextForge, h └─────────────────────────────────────────────────────────────────────────────────────────────────────────┘ ``` -## MCP Streamable HTTP Request Path +## MCP Streamable HTTP Request Paths -Every MCP request to `/servers/{server_id}/mcp` passes through these layers: +ContextForge now has two materially different MCP request paths, depending on +the Rust runtime mode. 
+### Mode summary + +| Mode | Public `/mcp` ingress | Session/runtime ownership | +|------|------------------------|---------------------------| +| `off` | Python | Python | +| `shadow` | Python | Python (Rust sidecar present internally only) | +| `edge` | Rust | Mixed: Rust ingress, Python still backs more MCP internals | +| `full` | Rust | Rust ingress plus Rust session/event/resume/live-stream/affinity cores | + +### Python-owned public path (`off`, `shadow`) + +```text +Client Request + -> NGINX + -> Python gateway middleware/auth/token scoping + -> Python MCP session manager + handlers + -> upstream MCP server ``` -Client Request (JSON-RPC over HTTP POST) - │ - ▼ -┌─────────────────────────────────────────────┐ -│ NGINX (Edge/Proxy) │ -│ • least_conn load balancing │ -│ • keepalive 512 per worker │ -│ • No caching for /mcp (POST requests) │ -└─────────────────────────────────────────────┘ - │ - ▼ -┌─────────────────────────────────────────────┐ -│ GATEWAY MIDDLEWARE STACK │ -│ 1. SecurityHeaders, CORS │ -│ 2. MCPPathRewrite + Auth │ -│ • JWT verification (HMAC) │ -│ • Token revocation check (DB/cache) │ -│ • User lookup (DB/cache) │ -│ • Team resolution (DB/cache) │ -│ 3. Token scoping (Layer 1 auth) │ -│ 4. 
Request logging │ -└─────────────────────────────────────────────┘ - │ - ▼ -┌─────────────────────────────────────────────┐ -│ MCP SDK SessionManager │ -│ • JSON-RPC envelope parsing │ -│ • Session tracking (stateless by default) │ -│ • Context variable propagation │ -│ • Handler method routing │ -└─────────────────────────────────────────────┘ - │ - ├── tools/list ─────┐ - ├── tools/call ─────┤ - ├── resources/list ─┤ - ├── prompts/list ───┤ - └── ping ───────────┘ - │ - ▼ -┌─────────────────────────────────────────────┐ -│ MCP HANDLER │ -│ • RBAC permission check (Layer 2 auth) │ -│ • Server/tool lookup (DB query) │ -│ • For tools/call: upstream proxy │ -│ via MCP Session Pool (if enabled) │ -└─────────────────────────────────────────────┘ - │ - ▼ -┌─────────────────────────────────────────────┐ -│ UPSTREAM MCP SERVER │ -│ (fast_test_server, fast_time, plugins) │ -│ • Executes tool logic │ -│ • Returns JSON-RPC result │ -└─────────────────────────────────────────────┘ + +### Rust-owned public path (`edge`, `full`) + +```text +Client Request + -> NGINX + -> Rust public MCP listener + -> trusted Python auth endpoint + -> Rust MCP routing/session/runtime logic + -> upstream MCP server or narrow Python internal route ``` +Important current behavior: + +- Python remains authoritative for JWT auth, token scoping, and RBAC in all + modes. +- `edge|full` remove the old public Python ingress hop by routing nginx + directly to Rust. +- `full` also moves MCP session, event-store, resume, live-stream, and + affinity/owner-worker logic into Rust. +- `shadow` is the safety-first fallback mode: the Rust sidecar is running, but + public `/mcp` stays mounted on Python. 
+ ### Performance Characteristics by Layer | Layer | Typical Latency | Scaling Bottleneck | Key Tunable | |-------|----------------|-------------------|-------------| | nginx | <1ms | Not a bottleneck | `keepalive`, `worker_connections` | -| Middleware + Auth | 5-15ms | Auth DB queries | `AUTH_CACHE_*_TTL`, `AUTH_CACHE_BATCH_QUERIES` | -| MCP SDK SessionManager | 2-5ms | JSON-RPC parsing, context vars | `JSON_RESPONSE_ENABLED` | +| Python auth/control path | 5-15ms | Auth DB/cache queries | `AUTH_CACHE_*`, `AUTH_CACHE_BATCH_QUERIES` | +| Rust public ingress (`edge`, `full`) | low single-digit ms | Syscall/network overhead | keepalive, upstream reuse, request shaping | +| Python MCP session manager (`off`, `shadow`) | 2-5ms | JSON-RPC parsing, context vars | `JSON_RESPONSE_ENABLED` | | RBAC check | 1-5ms | Permission DB queries | Role cache TTL (5 min internal) | -| tools/list (DB) | 5-10ms | Sequential table scans | `REGISTRY_CACHE_TOOLS_TTL` | -| tools/call (upstream) | 10-200ms | Upstream server + network | `MCP_SESSION_POOL_ENABLED` | +| tools/list / resources / prompts | 5-10ms | DB and compatibility paths | cache TTLs, Rust specialized handlers | +| tools/call (upstream) | 10-200ms | Upstream server + network | upstream session reuse, direct execution, RMCP client reuse | ### Feature Flags and Middleware Overhead @@ -249,12 +235,21 @@ The most impactful features to disable when not needed are: admin UI, A2A protoc ### Key Architectural Insight -The `/rpc` endpoint and the `/servers/{id}/mcp` endpoint serve the same logical operations (tools/list, tools/call) but follow different code paths: +The important transport distinction is no longer only `/rpc` versus `/mcp`. +It is now also **Python-owned MCP** versus **Rust-owned public MCP ingress**: + +- **`/rpc`** still benefits heavily from Redis-backed caches and does not follow + the streamable HTTP MCP session path. 
+- **Python MCP (`off`, `shadow`)** still pays the full Python middleware, + session-manager, and handler cost on the public path. +- **Rust MCP (`edge`, `full`)** removes the public Python ingress hop and moves + progressively more MCP session/runtime work to Rust, but Python auth/RBAC + remains part of the control plane. -- **`/rpc`**: Uses Redis-backed caching (registry cache, tool lookup cache) for most lookups. Under load, Redis handles the read pressure, keeping PgBouncer/PostgreSQL near idle. -- **`/mcp`**: Routes through the MCP SDK session manager, which executes its own handler functions. These handlers query the database via SQLAlchemy for server resolution, tool lookup, and RBAC checks. The auth cache (Redis-backed, TTL up to 300s) mitigates some of this, but RBAC and server/tool lookups still hit the database. +This means that scaling MCP throughput now depends on two different concerns: -This means that scaling MCP throughput depends heavily on reducing per-request database queries in the MCP transport handlers. +1. shrinking Python auth/control work that still happens for Rust MCP traffic +2. minimizing per-request transport and upstream costs on the Rust side --- diff --git a/docs/docs/architecture/rust-mcp-runtime.md b/docs/docs/architecture/rust-mcp-runtime.md new file mode 100644 index 0000000000..615cd61350 --- /dev/null +++ b/docs/docs/architecture/rust-mcp-runtime.md @@ -0,0 +1,177 @@ +# Rust MCP Runtime + +The Rust MCP runtime is an optional sidecar/runtime path for ContextForge's +streamable HTTP MCP traffic. It is designed to move the public MCP hot path out +of Python incrementally while keeping Python authoritative for authentication, +token scoping, and RBAC. + +It is also the first concrete precedent for the broader +[Modular Runtime Architecture](modular-design.md): a protocol-specific runtime +that can move out of the Python process while the core platform remains the +shared policy and control plane. 
The generalized implementor-facing contract +for future modules is documented in the +[Modular Runtime Specification](modular-runtime/index.md). + +This page describes the current architecture and the supported rollout modes. + +## Mode Model + +The user-facing control is `RUST_MCP_MODE`: + +| Mode | Public `/mcp` ingress | Rust session/event/resume/live-stream cores | Intended use | +|------|------------------------|--------------------------------------------|--------------| +| `off` | Python | No | Baseline Python MCP path | +| `shadow` | Python | No public Rust ownership | Safety-first rollback/comparison mode with Rust sidecar present | +| `edge` | Rust | No | Direct public Rust ingress with Python still backing more MCP internals | +| `full` | Rust | Yes | Fastest public Rust path with Rust-owned MCP session/runtime cores | + +Use the testing stack wrappers to bring these up locally: + +```bash +make testing-rebuild-rust-shadow +make testing-rebuild-rust +make testing-rebuild-rust-full +``` + +## Request Flows + +### `off` and `shadow` + +In `off` and `shadow`, the public MCP path remains Python-owned: + +```text +client + -> nginx + -> Python gateway transport/auth/token scoping/RBAC + -> Python MCP handlers + -> upstream MCP server +``` + +`shadow` differs from `off` only in that the Rust sidecar is present and can be +used for internal validation and comparison; it does not own the public MCP +transport. + +### `edge` and `full` + +In `edge` and `full`, nginx routes public `GET/POST/DELETE /mcp` directly to +the Rust runtime: + +```text +client + -> nginx + -> Rust public listener + -> trusted Python auth endpoint (internal) + -> Rust MCP routing/execution/session logic + -> upstream MCP server or narrow Python internal endpoint +``` + +Important details: + +- Direct public Rust ingress is enabled by the dedicated public listener set up + from `RUST_MCP_MODE=edge|full`. 
+- Rust authenticates public traffic through the trusted Python internal endpoint + `POST /_internal/mcp/authenticate`. +- Rust strips forwarded/proxy-chain headers on the trusted Rust -> Python hop so + Python evaluates the request as an internal runtime dispatch rather than as an + external client IP. + +## Responsibility Split + +The current split is intentionally conservative: + +| Concern | Python | Rust | +|---------|--------|------| +| JWT authentication | Yes | Via trusted internal Python auth | +| Token scoping / team visibility | Yes | Consumes authenticated context | +| RBAC | Yes | Enforces Python-authenticated result | +| Public MCP HTTP edge | `off`, `shadow` | `edge`, `full` | +| Session registry | Python in `off`, `shadow` | Rust in `full` | +| Event store / replay / resume | Python in `off`, `shadow`, `edge` | Rust in `full` | +| Live `GET /mcp` SSE edge | Python in `off`, `shadow`, `edge` | Rust in `full` | +| Affinity / owner-worker forwarding | Python in `off`, `shadow`, `edge` | Rust in `full` | +| Direct `tools/call` execution | Python fallback still exists | Rust hot path when eligible | + +The important architectural point is that Rust does not currently replace the +full security model. Python remains the authority for auth and RBAC while Rust +owns progressively more of the public MCP transport and session/runtime work. + +## Session/Auth Reuse Model + +To reduce repeated auth overhead on session-bound MCP traffic, Rust can reuse +authenticated context for an established MCP session. This is not a global +per-user cache. It is bound to the MCP session and validated against the +original authenticated context. 
+ +Key invariants: + +- a session belongs to exactly one authenticated caller context +- a different caller cannot reuse the same `mcp-session-id` +- a changed auth binding on the same session is denied rather than reused +- replay/resume and delete operations preserve the same ownership checks + +This model is validated by the dedicated isolation suite: + +```bash +make test-mcp-session-isolation +``` + +See the detailed threat model and test matrix in +`tools_rust/mcp_runtime/TESTING-DESIGN.md` in the repository. + +## Verification + +After bringing up the stack, verify the active mode through `/health`: + +```bash +curl -sD - http://localhost:8080/health -o /dev/null | rg 'x-contextforge-mcp-' +``` + +Representative full-Rust headers: + +```text +x-contextforge-mcp-runtime-mode: rust-managed +x-contextforge-mcp-transport-mounted: rust +x-contextforge-mcp-session-core-mode: rust +x-contextforge-mcp-event-store-mode: rust +x-contextforge-mcp-resume-core-mode: rust +x-contextforge-mcp-live-stream-core-mode: rust +x-contextforge-mcp-affinity-core-mode: rust +x-contextforge-mcp-session-auth-reuse-mode: rust +``` + +Representative shadow-mode headers: + +```text +x-contextforge-mcp-runtime-mode: rust-managed +x-contextforge-mcp-transport-mounted: python +x-contextforge-mcp-session-core-mode: python +x-contextforge-mcp-event-store-mode: python +x-contextforge-mcp-resume-core-mode: python +x-contextforge-mcp-live-stream-core-mode: python +x-contextforge-mcp-affinity-core-mode: python +x-contextforge-mcp-session-auth-reuse-mode: python +``` + +## Validation and Benchmark Workflow + +Recommended stack-backed validation: + +```bash +make testing-rebuild-rust-full +make test-mcp-cli +make test-mcp-rbac +make test-mcp-session-isolation +cargo test --release --manifest-path tools_rust/mcp_runtime/Cargo.toml +``` + +Recommended benchmark wrappers: + +```bash +make benchmark-mcp-mixed +make benchmark-mcp-tools +make benchmark-mcp-mixed-300 +make benchmark-mcp-tools-300 +``` + 
+For Rust-local profiling and crate-level lint/test helpers, see +`tools_rust/mcp_runtime/README.md` in the repository. diff --git a/docs/docs/deployment/compose.md b/docs/docs/deployment/compose.md index b39d8f52e9..ecc96e1ad7 100644 --- a/docs/docs/deployment/compose.md +++ b/docs/docs/deployment/compose.md @@ -179,6 +179,42 @@ curl http://localhost:8080/health # {"status":"healthy"} --- +## Rust MCP Compose Modes + +For the compose-backed testing stack, the Rust MCP runtime is exposed through +mode-specific make targets: + +```bash +make testing-rebuild-rust-shadow +make testing-rebuild-rust +make testing-rebuild-rust-full +``` + +Mode summary: + +- `shadow`: Rust sidecar present, but public `/mcp` stays on Python +- `edge`: public `/mcp` routed directly from nginx to Rust +- `full`: `edge` plus Rust session/event-store/resume/live-stream/affinity + cores + +Verify the active mode via `/health`: + +```bash +curl -sD - http://localhost:8080/health -o /dev/null | rg 'x-contextforge-mcp-' +``` + +Examples: + +- `x-contextforge-mcp-transport-mounted: python` means the public MCP path is + still Python-owned +- `x-contextforge-mcp-transport-mounted: rust` means nginx is routing public + `/mcp` traffic directly to the Rust runtime + +For the current runtime architecture, see +[Rust MCP Runtime](../architecture/rust-mcp-runtime.md). 
+
+---
+
## 🗄 Selecting a database

Uncomment one service block in `docker-compose.yml` and align `DATABASE_URL`:
diff --git a/docs/docs/development/profiling.md b/docs/docs/development/profiling.md
index 7a125a0ace..0d7c700332 100644
--- a/docs/docs/development/profiling.md
+++ b/docs/docs/development/profiling.md
@@ -16,6 +16,7 @@ This guide covers tools and techniques for profiling ContextForge performance un
| **memray** | Python memory profiling | Find memory leaks and allocation hotspots |
| **docker stats** | Resource monitoring | Track CPU/memory usage |
| **Redis CLI** | Cache analysis | Check hit rates |
+| **perf / cargo flamegraph** | Rust CPU profiling | Inspect Rust MCP runtime hotspots |

---

@@ -237,6 +238,39 @@ py-spy record -o flamegraph.svg -- python -m mcpgateway

---

+## Rust MCP Runtime Profiling
+
+For Rust-local profiling of the MCP runtime crate:
+
+```bash
+make -C tools_rust/mcp_runtime setup-profiling
+make -C tools_rust/mcp_runtime flamegraph-test
+make -C tools_rust/mcp_runtime flamegraph-test-rmcp
+```
+
+These targets generate flamegraphs under:
+
+```text
+tools_rust/mcp_runtime/profiles/
+```
+
+Use them to inspect Rust-internal startup and hot-path behavior in the runtime
+crate itself.
+
+For live profiling of the compose-backed Rust runtime under load:
+
+```bash
+ps -eo pid,cmd | grep contextforge-mcp-runtime
+sudo perf record -F 99 -g -p <pid> -- sleep 20
+sudo perf report --stdio
+```
+
+Use live `perf` during a real benchmark when you want steady-state behavior.
+Use the crate-local flamegraph targets when you want in-process Rust visibility
+without the rest of the stack.
+
+---
+
## Memory Profiling with memray

[memray](https://github.com/bloomberg/memray) is a memory profiler for Python that tracks allocations in Python code, native extension modules, and the Python interpreter itself. It's ideal for finding memory leaks, high-water marks, and allocation hotspots. 
diff --git a/docs/docs/testing/index.md b/docs/docs/testing/index.md index 56ef89fe73..3f8bb1bb24 100644 --- a/docs/docs/testing/index.md +++ b/docs/docs/testing/index.md @@ -10,7 +10,7 @@ This section covers the testing strategy and tools for ContextForge. |-------|------|----------|--------| | **Unit tests** | pytest | `tests/unit/` | Implemented | | **Integration tests** | pytest | `tests/integration/` | Implemented | -| **End-to-end tests** | pytest | `tests/e2e/` | Implemented | +| **End-to-end tests** | pytest | `tests/e2e/`, `tests/e2e_rust/` | Implemented | | **UI automation** | Playwright | `tests/playwright/` | Implemented | | **Security / DAST** | Playwright + OWASP ZAP | `tests/playwright/security/` | Implemented | | **Load testing** | Locust | `tests/loadtest/` | Implemented | @@ -93,6 +93,66 @@ Access the Locust dashboard at `http://localhost:8089` when running with the web --- +## 🦀 Rust MCP Runtime Validation + +For the Rust MCP runtime path, the most important stack-backed checks are: + +```bash +make testing-rebuild-rust-full +make test-mcp-cli +make test-mcp-rbac +make test-mcp-access-matrix +make test-mcp-session-isolation +make test-mcp-session-isolation-load MCP_ISOLATION_LOAD_RUN_TIME=30s +cargo test --release --manifest-path tools_rust/mcp_runtime/Cargo.toml +``` + +For live plugin parity, use the test-specific plugin config and run the same +E2E against both Python mode and Rust full mode: + +```bash +PLUGINS_CONFIG_FILE=plugins/plugin_parity_config.yaml make testing-up +MCP_PLUGIN_PARITY_EXPECTED_RUNTIME=python make test-mcp-plugin-parity + +PLUGINS_CONFIG_FILE=plugins/plugin_parity_config.yaml make testing-rebuild-rust-full +MCP_PLUGIN_PARITY_EXPECTED_RUNTIME=rust make test-mcp-plugin-parity +``` + +This parity gate currently proves live plugin behavior on: +- `resources/read` +- `tools/call` +- `prompts/get` + +For revocation and membership/role-drift validation, shorten the reuse TTL so +the bounded-TTL contract completes quickly: + 
+```bash +MCP_RUST_SESSION_AUTH_REUSE_TTL_SECONDS=2 MCP_RUST_SESSION_AUTH_REUSE_GRACE_SECONDS=1 make testing-rebuild-rust-full +make test-mcp-access-matrix +make test-mcp-session-isolation +make test-mcp-session-isolation-load MCP_ISOLATION_LOAD_RUN_TIME=30s +``` + +Use these mode-specific rebuild targets when validating rollout behavior: + +```bash +make testing-rebuild-rust-shadow +make testing-rebuild-rust +make testing-rebuild-rust-full +``` + +These validate, respectively: + +- `shadow`: Rust sidecar present while public `/mcp` stays on Python +- `edge`: direct Rust public ingress without the full Rust session/runtime cores +- `full`: direct Rust public ingress plus Rust session/event/resume/live-stream + and affinity cores + +For throughput benchmarks and Locust wrappers, see +[Performance Testing](performance.md). + +--- + ## 🌐 Frontend JavaScript Testing Frontend JavaScript unit tests are **not yet implemented**. The codebase uses plain JavaScript (not TypeScript) with: diff --git a/docs/docs/testing/performance.md b/docs/docs/testing/performance.md index feb876258e..993e99aaef 100644 --- a/docs/docs/testing/performance.md +++ b/docs/docs/testing/performance.md @@ -36,6 +36,43 @@ Compare the 95/99th percentile latencies and error rates with and without the ga * Overhead from JSON-RPC wrapping/unwrapping * Improper worker/thread config in Gunicorn +## Rust MCP Benchmark Workflow + +When benchmarking the Rust MCP runtime on the compose-backed test stack, use the +mode-specific rebuild helpers first: + +```bash +make testing-rebuild-rust-shadow +make testing-rebuild-rust +make testing-rebuild-rust-full +``` + +Then use the benchmark wrappers: + +```bash +make benchmark-mcp-mixed +make benchmark-mcp-tools +make benchmark-mcp-mixed-300 +make benchmark-mcp-tools-300 +``` + +These wrappers target the nginx-exposed compose stack on +`http://localhost:8080` and use the MCP protocol Locust file under +`tests/loadtest/locustfile_mcp_protocol.py`. 
+ +Recommended Rust MCP validation sequence: + +```bash +make testing-rebuild-rust-full +make test-mcp-cli +make test-mcp-rbac +make test-mcp-session-isolation +make benchmark-mcp-tools-300 +``` + +If you are comparing performance and rollback behavior, run the same benchmark +suite in `shadow` and `full`. + ## 🚀 Scripted Load Tests: `tests/hey/hey.sh` A wrapper script exists at: diff --git a/infra/nginx/nginx-performance.conf b/infra/nginx/nginx-performance.conf index 94dc58175b..7c268ef994 100644 --- a/infra/nginx/nginx-performance.conf +++ b/infra/nginx/nginx-performance.conf @@ -168,6 +168,15 @@ http { keepalive_timeout 60s; # Connection idle timeout } + upstream mcp_transport_backend { + least_conn; + server gateway:8787 max_fails=0; + server gateway:4444 max_fails=0 backup; + keepalive 512; + keepalive_requests 100000; + keepalive_timeout 60s; + } + # Cache bypass conditions map $request_method $skip_cache { default 0; @@ -469,6 +478,30 @@ http { proxy_read_timeout 1h; } + # MCP Streamable HTTP transport + location ~ ^(/mcp/?|/servers/.*/mcp/?)$ { + proxy_pass http://mcp_transport_backend; + + # MCP GET /mcp can be a long-lived SSE stream; disable buffering. 
+ proxy_http_version 1.1; + proxy_set_header Connection ''; + proxy_request_buffering off; + proxy_buffering off; + proxy_cache off; + add_header X-Accel-Buffering "no" always; + + # Proxy headers + proxy_set_header Host $http_host; + proxy_set_header X-Real-IP $remote_addr; + proxy_set_header X-Forwarded-For $proxy_add_x_forwarded_for; + proxy_set_header X-Forwarded-Proto $scheme; + + # Extended timeouts for long-lived MCP transport streams + proxy_connect_timeout 1h; + proxy_send_timeout 1h; + proxy_read_timeout 1h; + } + # ============================================================ # JSON-RPC Endpoint - No Caching # ============================================================ diff --git a/infra/nginx/nginx-tls.conf b/infra/nginx/nginx-tls.conf index b6d58a3961..a022b62736 100644 --- a/infra/nginx/nginx-tls.conf +++ b/infra/nginx/nginx-tls.conf @@ -549,6 +549,31 @@ http { proxy_read_timeout 1h; } + # MCP Streamable HTTP transport + location ~ ^(/mcp/?|/servers/.*/mcp/?)$ { + proxy_pass https://gateway_backend; + + # MCP GET /mcp can be a long-lived SSE stream; disable buffering. 
+ proxy_http_version 1.1; + proxy_set_header Connection ''; + proxy_request_buffering off; + proxy_buffering off; + proxy_cache off; + add_header X-Accel-Buffering "no" always; + + # Proxy headers + proxy_set_header Host $http_host; + proxy_set_header X-Real-IP $remote_addr; + proxy_set_header X-Forwarded-For $proxy_add_x_forwarded_for; + proxy_set_header X-Forwarded-Proto $forwarded_proto; + proxy_set_header X-Forwarded-Host $http_host; + + # Extended timeouts for long-lived MCP transport streams + proxy_connect_timeout 1h; + proxy_send_timeout 1h; + proxy_read_timeout 1h; + } + # ============================================================ # JSON-RPC Endpoint - No Caching # ============================================================ diff --git a/infra/nginx/nginx.conf b/infra/nginx/nginx.conf index 9a9be05b3e..b44702e757 100644 --- a/infra/nginx/nginx.conf +++ b/infra/nginx/nginx.conf @@ -171,6 +171,15 @@ http { keepalive_timeout 60s; # Connection idle timeout } + upstream mcp_transport_backend { + least_conn; + server gateway:8787 max_fails=0; + server gateway:4444 max_fails=0 backup; + keepalive 512; + keepalive_requests 100000; + keepalive_timeout 60s; + } + # ============================================================ # SSL Backend Configuration (for HTTPS gateway backend) # ============================================================ @@ -558,6 +567,31 @@ http { proxy_read_timeout 1h; } + # MCP Streamable HTTP transport + location ~ ^(/mcp/?|/servers/.*/mcp/?)$ { + proxy_pass http://mcp_transport_backend; + + # MCP GET /mcp can be long-lived SSE, so do not buffer the stream. 
+ proxy_http_version 1.1; + proxy_set_header Connection ''; + proxy_request_buffering off; + proxy_buffering off; + proxy_cache off; + add_header X-Accel-Buffering "no" always; + + # Proxy headers + proxy_set_header Host $http_host; + proxy_set_header X-Real-IP $remote_addr; + proxy_set_header X-Forwarded-For $proxy_add_x_forwarded_for; + proxy_set_header X-Forwarded-Proto $forwarded_proto; + proxy_set_header X-Forwarded-Host $http_host; + + # Extended timeouts for stateful MCP sessions and SSE streams + proxy_connect_timeout 1h; + proxy_send_timeout 1h; + proxy_read_timeout 1h; + } + # ============================================================ # JSON-RPC Endpoint - No Caching # ============================================================ diff --git a/mcpgateway/admin.py b/mcpgateway/admin.py index f4a8bbfd56..ff5ced2144 100644 --- a/mcpgateway/admin.py +++ b/mcpgateway/admin.py @@ -1771,6 +1771,7 @@ async def get_overview_partial( "redis_available": redis_available, "redis_reachable": redis_reachable, "uptime_seconds": uptime_seconds, + "mcp_runtime": version_module.mcp_runtime_status_payload(), } return request.app.state.templates.TemplateResponse(request, "overview_partial.html", context) diff --git a/mcpgateway/config.py b/mcpgateway/config.py index cdc749f402..7badc013c3 100644 --- a/mcpgateway/config.py +++ b/mcpgateway/config.py @@ -235,6 +235,48 @@ class Settings(BaseSettings): # Protocol protocol_version: str = "2025-11-25" + experimental_rust_mcp_runtime_enabled: bool = Field( + default=False, + description="Proxy POST /mcp traffic through the experimental Rust MCP runtime sidecar.", + ) + experimental_rust_mcp_runtime_url: str = Field( + default="http://127.0.0.1:8787", + description="Base URL for the experimental Rust MCP runtime sidecar.", + ) + experimental_rust_mcp_runtime_uds: Optional[str] = Field( + default=None, + description="Optional Unix domain socket path for the experimental Rust MCP runtime sidecar.", + ) + 
experimental_rust_mcp_runtime_timeout_seconds: int = Field( + default=30, + ge=1, + le=300, + description="Timeout in seconds for Python-to-Rust MCP runtime proxy requests.", + ) + experimental_rust_mcp_session_core_enabled: bool = Field( + default=False, + description="Enable the experimental Rust-owned MCP session metadata core while keeping Python as the fallback transport backend.", + ) + experimental_rust_mcp_event_store_enabled: bool = Field( + default=False, + description="Enable the experimental Rust-owned resumable MCP event-store backend for Streamable HTTP sessions.", + ) + experimental_rust_mcp_resume_core_enabled: bool = Field( + default=False, + description="Enable the experimental Rust-owned public MCP replay/resume path for GET /mcp with Last-Event-ID while keeping Python fallback available.", + ) + experimental_rust_mcp_live_stream_core_enabled: bool = Field( + default=False, + description="Enable the experimental Rust-owned public MCP live GET /mcp SSE path while keeping Python as the fallback upstream stream source.", + ) + experimental_rust_mcp_affinity_core_enabled: bool = Field( + default=False, + description="Enable the experimental Rust-owned MCP session-affinity forwarding path while keeping Python worker forwarding as the fallback.", + ) + experimental_rust_mcp_session_auth_reuse_enabled: bool = Field( + default=False, + description="Enable the experimental Rust-owned MCP session-bound auth-context reuse path for direct public /mcp ingress.", + ) # Authentication basic_auth_user: str = "admin" @@ -1830,6 +1872,30 @@ def _auto_enable_security_txt(cls, v: Any, info: ValidationInfo) -> bool: return bool(info.data["well_known_security_txt"].strip()) return bool(v) + @field_validator("experimental_rust_mcp_runtime_uds", mode="after") + @classmethod + def _validate_experimental_rust_mcp_runtime_uds(cls, value: Optional[str]) -> Optional[str]: + """Validate the optional UDS path used for the Rust MCP runtime sidecar. 
+ + Args: + value: Candidate UDS path from configuration. + + Returns: + The normalized absolute UDS path, or ``None`` when unset. + + Raises: + ValueError: If the path is not absolute or its parent directory is missing. + """ + if value in (None, ""): + return None + + uds_path = Path(value).expanduser() + if not uds_path.is_absolute(): + raise ValueError("experimental_rust_mcp_runtime_uds must be an absolute path") + if not uds_path.parent.exists(): + raise ValueError(f"experimental_rust_mcp_runtime_uds parent directory does not exist: {uds_path.parent}") + return str(uds_path) + # ------------------------------- # Flexible list parsing for envs # ------------------------------- diff --git a/mcpgateway/main.py b/mcpgateway/main.py index 160b549307..e650bbd52c 100644 --- a/mcpgateway/main.py +++ b/mcpgateway/main.py @@ -28,10 +28,12 @@ # Standard import asyncio +import base64 from contextlib import asynccontextmanager, suppress from datetime import datetime, timezone from functools import lru_cache import hashlib +import hmac import html import re import sys @@ -64,7 +66,9 @@ from uvicorn.middleware.proxy_headers import ProxyHeadersMiddleware # First-Party +# Import the admin routes from the new module from mcpgateway import __version__ +from mcpgateway import version as version_module from mcpgateway.admin import admin_router, set_logging_service from mcpgateway.auth import _check_token_revoked_sync, _lookup_api_token_sync, _resolve_teams_from_db, get_current_user, get_user_team_roles, normalize_token_teams from mcpgateway.bootstrap_db import main as bootstrap_db @@ -143,8 +147,16 @@ from mcpgateway.services.server_service import ServerError, ServerLockConflictError, ServerNameConflictError, ServerNotFoundError from mcpgateway.services.tag_service import TagService from mcpgateway.services.tool_service import ToolError, ToolLockConflictError, ToolNameConflictError, ToolNotFoundError +from mcpgateway.transports.rust_mcp_runtime_proxy import RustMCPRuntimeProxy 
from mcpgateway.transports.sse_transport import SSETransport -from mcpgateway.transports.streamablehttp_transport import SessionManagerWrapper, set_shared_session_registry, streamable_http_auth +from mcpgateway.transports.streamablehttp_transport import ( + _validate_streamable_session_access, + get_streamable_http_auth_context, + SessionManagerWrapper, + set_shared_session_registry, + streamable_http_auth, + user_context_var, +) from mcpgateway.utils.db_isready import wait_for_db_ready from mcpgateway.utils.error_formatter import ErrorFormatter from mcpgateway.utils.metadata_capture import MetadataCapture @@ -156,8 +168,6 @@ from mcpgateway.utils.token_scoping import validate_server_access from mcpgateway.utils.verify_credentials import extract_websocket_bearer_token, is_proxy_auth_trust_active, require_admin_auth, require_docs_auth_override, verify_jwt_token from mcpgateway.validation.jsonrpc import JSONRPCError - -# Import the admin routes from the new module from mcpgateway.version import router as version_router # Initialize logging service first @@ -299,6 +309,340 @@ def get_user_email(user): return str(user) if user else "unknown" +_INTERNAL_MCP_AUTH_CONTEXT_HEADER = "x-contextforge-auth-context" +_INTERNAL_MCP_RUNTIME_AUTH_HEADER = "x-contextforge-mcp-runtime-auth" +_INTERNAL_MCP_RUNTIME_AUTH_CONTEXT = "contextforge-internal-mcp-runtime-v1" +_INTERNAL_MCP_SESSION_VALIDATED_HEADER = "x-contextforge-session-validated" + + +def _get_internal_mcp_auth_context(request: Request) -> Optional[Dict[str, Any]]: + """Return trusted auth context forwarded from the StreamableHTTP MCP auth layer. + + Args: + request: Incoming request that may carry trusted MCP auth context on state. + + Returns: + The forwarded auth context dictionary when present, otherwise ``None``. 
+ """ + internal_auth_context = getattr(request.state, "_mcp_internal_auth_context", None) + if isinstance(internal_auth_context, dict): + return internal_auth_context + return None + + +def _decode_internal_mcp_auth_context(header_value: str) -> Dict[str, Any]: + """Decode the trusted internal MCP auth header payload. + + Args: + header_value: Base64url-encoded trusted auth context header value. + + Returns: + Decoded auth context dictionary. + + Raises: + ValueError: If the decoded payload is not a JSON object. + """ + padding = "=" * (-len(header_value) % 4) + decoded = base64.urlsafe_b64decode(f"{header_value}{padding}".encode("ascii")) + payload = orjson.loads(decoded) + if not isinstance(payload, dict): + raise ValueError("Decoded internal MCP auth context must be an object") + return payload + + +def _auth_encryption_secret_value() -> str: + """Return the configured auth-encryption secret as a plain string. + + Returns: + The auth-encryption secret, normalized to a regular string. + """ + secret = settings.auth_encryption_secret + if hasattr(secret, "get_secret_value"): + return secret.get_secret_value() + return str(secret) + + +@lru_cache(maxsize=8) +def _expected_internal_mcp_runtime_auth_header_for_secret(secret: str) -> str: + """Return the shared secret-derived trust header for Rust->Python MCP hops. + + Args: + secret: Auth-encryption secret to derive the trust header from. + + Returns: + Hex-encoded SHA-256 digest derived from the provided auth secret. + """ + material = f"{secret}:{_INTERNAL_MCP_RUNTIME_AUTH_CONTEXT}".encode("utf-8") + return hashlib.sha256(material).hexdigest() + + +def _expected_internal_mcp_runtime_auth_header() -> str: + """Return the current shared secret-derived trust header for Rust->Python MCP hops. + + Returns: + Hex-encoded SHA-256 digest derived from the current auth secret. 
+ """ + return _expected_internal_mcp_runtime_auth_header_for_secret(_auth_encryption_secret_value()) + + +def _has_valid_internal_mcp_runtime_auth_header(request: Request) -> bool: + """Validate the shared secret-derived trust header for internal MCP requests. + + Args: + request: Incoming internal MCP request. + + Returns: + ``True`` when the derived trust header matches the expected value. + """ + provided = request.headers.get(_INTERNAL_MCP_RUNTIME_AUTH_HEADER) + if not provided: + return False + return hmac.compare_digest(provided, _expected_internal_mcp_runtime_auth_header()) + + +def _is_trusted_internal_mcp_runtime_request(request: Request) -> bool: + """Return whether the request came from the local Rust runtime sidecar. + + Args: + request: Incoming request to inspect. + + Returns: + ``True`` when the request carries the trusted Rust runtime marker from + loopback, otherwise ``False``. + """ + runtime_marker = request.headers.get("x-contextforge-mcp-runtime") + client_host = getattr(getattr(request, "client", None), "host", None) + return runtime_marker == "rust" and _has_valid_internal_mcp_runtime_auth_header(request) and client_host in ("127.0.0.1", "::1") + + +def _build_internal_mcp_forwarded_user(request: Request) -> Dict[str, Any]: + """Build the authenticated user payload for internal Rust -> Python MCP dispatch. + + Args: + request: Trusted internal request forwarded from the Rust runtime. + + Returns: + Synthetic authenticated user payload used by internal MCP handlers. + + Raises: + HTTPException: If the request is not trusted or the forwarded auth context + is missing or invalid. 
+ """ + if not _is_trusted_internal_mcp_runtime_request(request): + raise HTTPException(status_code=403, detail="Internal MCP dispatch is only available to the local Rust runtime") + + header_value = request.headers.get(_INTERNAL_MCP_AUTH_CONTEXT_HEADER) + if not header_value: + raise HTTPException(status_code=400, detail="Missing trusted MCP auth context") + + try: + auth_context = _decode_internal_mcp_auth_context(header_value) + except Exception as exc: + raise HTTPException(status_code=400, detail=f"Invalid trusted MCP auth context: {exc}") from exc + + setattr(request.state, "_mcp_internal_auth_context", auth_context) + + if "teams" in auth_context and (auth_context["teams"] is None or isinstance(auth_context["teams"], list)): + request.state.token_teams = auth_context["teams"] + + if request.headers.get(_INTERNAL_MCP_SESSION_VALIDATED_HEADER) == "rust": + auth_context["_rust_session_validated"] = True + + return { + "email": auth_context.get("email"), + "full_name": auth_context.get("email") or "MCP Internal Forward", + "is_admin": bool(auth_context.get("permission_is_admin", auth_context.get("is_admin", False))), + "auth_method": "mcp_internal_forward", + "token_use": auth_context.get("token_use"), + } + + +def _enforce_internal_mcp_server_scope(request: Request, server_id: str) -> None: + """Validate trusted internal server scope against any forwarded token server scope. + + Args: + request: Trusted internal MCP request. + server_id: Effective virtual server identifier for the operation. + + Raises: + HTTPException: If the forwarded token scope does not authorize the server. 
+ """ + auth_context = _get_internal_mcp_auth_context(request) + if not isinstance(auth_context, dict): + return + + scoped_server_id = auth_context.get("scoped_server_id") + if isinstance(scoped_server_id, str) and scoped_server_id and not validate_server_access({"server_id": scoped_server_id}, server_id): + raise HTTPException(status_code=403, detail=f"Token not authorized for server: {server_id}") + + +async def _authorize_internal_mcp_request(request: Request, db: Session, *, permission: str, method: str, server_id: Optional[str] = None): + """Authorize trusted Rust-side MCP dispatch while preserving permissive MCP semantics. + + For authenticated callers, this enforces the same token-scope and RBAC rules as + the regular RPC dispatcher. For unauthenticated MCP callers in permissive mode, + StreamableHTTP middleware already downgraded them to public-only scope and + enforced per-server OAuth, so the internal Rust -> Python hop should not re-deny + public-only requests merely because there is no authenticated RBAC identity. + + Args: + request: Trusted internal MCP request. + db: Active database session. + permission: RBAC permission required for the method. + method: MCP method name being authorized. + server_id: Optional virtual server identifier used for additional scope checks. + + Returns: + The forwarded user payload used for downstream authorization and scoping. + """ + user = _build_internal_mcp_forwarded_user(request) + auth_context = _get_internal_mcp_auth_context(request) or {} + + if server_id: + _enforce_internal_mcp_server_scope(request, server_id) + + if auth_context.get("is_authenticated", True) is True: + await _ensure_rpc_permission(user, db, permission, method, request=request) + + return user + + +def _build_internal_mcp_auth_scope( + *, + method: str, + path: str, + query_string: str, + headers: Dict[str, str], + client_ip: Optional[str], +) -> Dict[str, Any]: + """Construct a synthetic ASGI scope for internal Rust -> Python MCP auth. 
+
+ Args:
+ method: HTTP method of the original public MCP request.
+ path: Public MCP path, for example ``/mcp`` or ``/servers/{server_id}/mcp``.
+ query_string: Raw query string without the leading ``?``.
+ headers: Public request headers to replay through auth/token scoping.
+ client_ip: Effective client IP derived by Rust from the public request.
+
+ Returns:
+ ASGI scope dictionary suitable for token scoping and ``streamable_http_auth``.
+ """
+ raw_headers = []
+ for name, value in headers.items():
+ if not isinstance(name, str) or not isinstance(value, str):
+ continue
+ raw_headers.append((name.lower().encode("latin-1"), value.encode("latin-1")))
+
+ return {
+ "type": "http",
+ "method": method.upper(),
+ "path": path,
+ "raw_path": path.encode("latin-1"),
+ "query_string": query_string.encode("latin-1"),
+ "headers": raw_headers,
+ "client": (client_ip or "unknown", 0),
+ "state": {},
+ }
+
+
+async def _run_internal_mcp_authentication(
+ *,
+ method: str,
+ path: str,
+ query_string: str,
+ headers: Dict[str, str],
+ client_ip: Optional[str],
+) -> tuple[Optional[Response], Dict[str, Any]]:
+ """Run token scoping and MCP transport auth for a direct Rust ingress request.
+
+ Args:
+ method: HTTP method of the public request.
+ path: Public request path.
+ query_string: Raw query string without the leading ``?``.
+ headers: Public request headers replayed from Rust.
+ client_ip: Effective client IP for token-scope IP restriction checks.
+
+ Returns:
+ Tuple of ``(error_response, auth_context)``.
+ ``error_response`` is ``None`` on success; otherwise it contains the exact
+ response generated by the existing token-scoping/auth layers.
+ """
+ scope = _build_internal_mcp_auth_scope(
+ method=method,
+ path=path,
+ query_string=query_string,
+ headers=headers,
+ client_ip=client_ip,
+ )
+ request = starletteRequest(scope)
+ sent_messages: list[dict[str, Any]] = []
+
+ async def _receive() -> dict[str, Any]:
+ """Return an empty request body for the synthetic auth probe. 
+ + Returns: + Minimal ASGI ``http.request`` message with no body content. + """ + return {"type": "http.request", "body": b"", "more_body": False} + + async def _send(message: dict[str, Any]) -> None: + """Capture ASGI response messages emitted by auth middleware. + + Args: + message: ASGI response message emitted by the auth stack. + """ + sent_messages.append(message) + + def _captured_response() -> Response: + """Build a concrete response from the captured ASGI messages. + + Returns: + Response reconstructed from the captured auth middleware output. + """ + status_code = 500 + response_headers: Dict[str, str] = {} + body = b"" + for message in sent_messages: + if message.get("type") == "http.response.start": + status_code = int(message.get("status", 500)) + response_headers = { + key.decode("latin-1"): value.decode("latin-1") for key, value in message.get("headers", []) if isinstance(key, (bytes, bytearray)) and isinstance(value, (bytes, bytearray)) + } + elif message.get("type") == "http.response.body": + body += message.get("body", b"") + return Response(content=body, status_code=status_code, headers=response_headers) + + async def _call_next(_request: starletteRequest) -> Response: + """Run the existing Streamable HTTP auth layer for the synthetic request. + + Returns: + Success response when authentication passes, otherwise the captured + failure response emitted by the existing middleware chain. 
+ """ + auth_ok = await streamable_http_auth(scope, _receive, _send) + if auth_ok: + return ORJSONResponse(status_code=200, content={"authenticated": True}) + return _captured_response() + + original_context = user_context_var.get() + user_context_var.set({}) + try: + if settings.email_auth_enabled: + response = await token_scoping_middleware(request, _call_next) + else: + response = await _call_next(request) + + if response is None: + response = _captured_response() + + if response.status_code >= 400: + return response, {} + + return None, get_streamable_http_auth_context() + finally: + user_context_var.set(original_context) + + def _normalize_token_teams(teams: Optional[List]) -> List[str]: """ Normalize token teams to list of team IDs. @@ -371,6 +715,12 @@ def _get_token_teams_from_request(request: Request) -> Optional[List[str]]: >>> main._get_token_teams_from_request(req) [] """ + internal_auth_context = _get_internal_mcp_auth_context(request) + if isinstance(internal_auth_context, dict) and "teams" in internal_auth_context: + internal_teams = internal_auth_context.get("teams") + if internal_teams is None or isinstance(internal_teams, list): + return internal_teams + # SECURITY: First check request.state.token_teams (already normalized by auth.py) # This is the preferred path as auth.py has already applied normalize_token_teams # Use getattr with a sentinel to distinguish "not set" from "set to None" @@ -431,6 +781,15 @@ def _get_rpc_filter_context(request: Request, user) -> tuple: # Check if user is admin - MUST come from token, not DB user # This ensures that tokens with restricted scope (empty teams) don't inherit admin bypass is_admin = False + internal_auth_context = _get_internal_mcp_auth_context(request) + if isinstance(internal_auth_context, dict): + if user_email is None: + user_email = internal_auth_context.get("email") + is_admin = bool(internal_auth_context.get("is_admin", False)) + if token_teams is not None and len(token_teams) == 0: + is_admin = 
False + return user_email, token_teams, is_admin + cached = getattr(request.state, "_jwt_verified_payload", None) if cached and isinstance(cached, tuple) and len(cached) == 2: _, payload = cached @@ -455,6 +814,9 @@ def _has_verified_jwt_payload(request: Request) -> bool: Returns: ``True`` when a verified payload tuple is present, otherwise ``False``. """ + internal_auth_context = _get_internal_mcp_auth_context(request) + if isinstance(internal_auth_context, dict): + return True cached = getattr(request.state, "_jwt_verified_payload", None) return bool(cached and isinstance(cached, tuple) and len(cached) == 2 and cached[1]) @@ -540,6 +902,13 @@ def _extract_scoped_permissions(request: Request) -> set[str] | None: None: no explicit scope cap (empty permissions or no JWT — defer to RBAC) set: explicit permission set (may contain '*' for wildcard) """ + internal_auth_context = _get_internal_mcp_auth_context(request) + if isinstance(internal_auth_context, dict): + permissions = internal_auth_context.get("scoped_permissions") + if not permissions: + return None + return set(permissions) + cached = getattr(request.state, "_jwt_verified_payload", None) if not cached or not isinstance(cached, tuple) or len(cached) != 2: return None @@ -555,6 +924,27 @@ def _extract_scoped_permissions(request: Request) -> set[str] | None: return set(permissions) +def _is_permission_admin_user(user) -> bool: + """Return whether the caller already has permission-layer admin authority. + + This is stricter than token-scope admin semantics. It is used only to skip + redundant RBAC DB lookups after token scope caps have already been enforced. + + Args: + user: Authenticated user object or dict-like payload. + + Returns: + ``True`` when the caller already has permission-layer admin authority. 
+ """ + if hasattr(user, "is_admin"): + return bool(getattr(user, "is_admin", False)) + if isinstance(user, dict): + if "permission_is_admin" in user: + return bool(user.get("permission_is_admin", False)) + return False + return False + + async def _ensure_rpc_permission(user, db: Session, permission: str, method: str, request: Request | None = None) -> None: """Require a specific RPC permission for a method branch. @@ -579,6 +969,9 @@ async def _ensure_rpc_permission(user, db: Session, permission: str, method: str logger.warning("RPC permission denied (token scope): method=%s, required=%s", method, permission) raise JSONRPCError(-32003, _ACCESS_DENIED_MSG, {"method": method}) + if permission == "admin.system_config" and _is_permission_admin_user(user): + return + # Layer 2: RBAC check # Session tokens have no explicit team_id, so check across all team-scoped roles. # Mirrors the @require_permission decorator's check_any_team fallback (rbac.py:562-576). @@ -589,6 +982,72 @@ async def _ensure_rpc_permission(user, db: Session, permission: str, method: str raise JSONRPCError(-32003, _ACCESS_DENIED_MSG, {"method": method}) +def _serialize_mcp_tool_definition(tool: Any) -> Dict[str, Any]: + """Return an MCP-compliant tool definition without API-only metadata fields. + + Args: + tool: Tool ORM object, pydantic model, or dict-like payload. + + Returns: + MCP-compatible tool definition dictionary. 
+ """ + if hasattr(tool, "model_dump"): + data = tool.model_dump(by_alias=True, exclude_none=True) + elif isinstance(tool, dict): + data = dict(tool) + else: + data = {} + + payload: Dict[str, Any] = { + "name": data.get("name", getattr(tool, "name", None)), + "description": data.get("description", getattr(tool, "description", None)), + "inputSchema": data.get("inputSchema", getattr(tool, "input_schema", None)), + } + + output_schema = data.get("outputSchema", getattr(tool, "output_schema", None)) + if output_schema is not None: + payload["outputSchema"] = output_schema + + annotations = data.get("annotations", getattr(tool, "annotations", None)) + if annotations is not None: + payload["annotations"] = annotations + + return {key: value for key, value in payload.items() if value is not None} + + +def _serialize_mcp_tool_definitions(tools: List[Any]) -> List[Dict[str, Any]]: + """Serialize tool records to MCP tool definitions. + + Args: + tools: Iterable of tool-like records to serialize. + + Returns: + List of MCP-compatible tool definitions. + """ + return [_serialize_mcp_tool_definition(tool) for tool in tools] + + +def _serialize_legacy_tool_payloads(tools: List[Any]) -> List[Dict[str, Any]]: + """Serialize tool records using the legacy JSON-RPC shape. + + Args: + tools: Iterable of tool-like records to serialize. + + Returns: + List of legacy tool payload dictionaries. + """ + payloads: List[Dict[str, Any]] = [] + for tool in tools: + if hasattr(tool, "model_dump"): + payload = tool.model_dump(by_alias=True, exclude_none=True) + elif isinstance(tool, dict): + payload = dict(tool) + else: + payload = {} + payloads.append(payload) + return payloads + + def _enforce_scoped_resource_access(request: Request, db: Session, user, resource_path: str) -> None: """Apply token-scope ownership checks for a concrete resource path. 
@@ -685,6 +1144,147 @@ async def _authorize_run_cancellation(request: Request, user, request_id: str, * resource_cache = ResourceCache(max_size=settings.resource_cache_size, ttl=settings.resource_cache_ttl) +def _rust_build_included() -> bool: + """Return whether the current image includes Rust MCP artifacts. + + Returns: + ``True`` when the current image contains the Rust MCP binaries/plugins. + """ + return version_module.rust_build_included() + + +def _rust_runtime_managed() -> bool: + """Return whether the gateway expects to manage the Rust MCP sidecar locally. + + Returns: + ``True`` when the gateway should launch and supervise the Rust sidecar. + """ + return version_module.rust_runtime_managed() + + +def _current_mcp_transport_mount() -> str: + """Return which public /mcp transport is currently mounted. + + Returns: + Runtime label identifying the currently mounted public MCP transport. + """ + return version_module.current_mcp_transport_mount() + + +def _should_mount_public_rust_transport() -> bool: + """Return whether the public ``/mcp`` path should be served directly by Rust. + + Returns: + ``True`` only when the Rust runtime is enabled and the session-auth reuse + path is enabled, allowing Rust to safely own steady-state public MCP + session traffic. Otherwise returns ``False`` and leaves public MCP on + the Python ingress path. + """ + return version_module.should_mount_public_rust_transport() + + +def _should_use_rust_public_session_stack() -> bool: + """Return whether Rust should own the effective public MCP session stack. + + Returns: + ``True`` only when the Rust runtime is enabled and session-auth reuse is + enabled, allowing the public transport, session metadata, replay/resume, + live-stream, and affinity behavior to stay on a consistent Rust-backed + path. Otherwise returns ``False`` so the public MCP session stack falls + back to Python semantics. 
+ """ + return version_module.should_use_rust_public_session_stack() + + +def _current_mcp_runtime_mode() -> str: + """Return a compact runtime-mode label for observability. + + Returns: + Human-readable runtime mode label for health/readiness reporting. + """ + return version_module.current_mcp_runtime_mode() + + +def _current_mcp_session_core_mode() -> str: + """Return which session core currently owns MCP session metadata. + + Returns: + ``"rust"`` when the Rust session core is enabled, otherwise ``"python"``. + """ + return version_module.current_mcp_session_core_mode() + + +def _current_mcp_event_store_mode() -> str: + """Return which runtime currently owns MCP resumable event-store semantics. + + Returns: + ``"rust"`` when the Rust event store is enabled, otherwise ``"python"``. + """ + return version_module.current_mcp_event_store_mode() + + +def _current_mcp_resume_core_mode() -> str: + """Return which runtime currently owns public MCP replay/resume behavior. + + Returns: + ``"rust"`` when Rust owns replay/resume, otherwise ``"python"``. + """ + return version_module.current_mcp_resume_core_mode() + + +def _current_mcp_live_stream_core_mode() -> str: + """Return which runtime currently owns non-resume public GET /mcp SSE behavior. + + Returns: + ``"rust"`` when Rust owns live GET /mcp streaming, otherwise ``"python"``. + """ + return version_module.current_mcp_live_stream_core_mode() + + +def _current_mcp_affinity_core_mode() -> str: + """Return which runtime currently owns MCP multi-worker session-affinity forwarding. + + Returns: + ``"rust"`` when Rust owns session-affinity forwarding, otherwise ``"python"``. + """ + return version_module.current_mcp_affinity_core_mode() + + +def _current_mcp_session_auth_reuse_mode() -> str: + """Return which runtime currently owns MCP session-bound auth-context reuse. + + Returns: + ``"rust"`` when Rust session auth reuse is enabled, otherwise ``"python"``. 
+ """ + return version_module.current_mcp_session_auth_reuse_mode() + + +def _mcp_runtime_status_payload() -> Dict[str, Any]: + """Return MCP runtime diagnostics for health/readiness endpoints. + + Returns: + Diagnostic payload describing the active MCP runtime configuration. + """ + return version_module.mcp_runtime_status_payload() + + +def _apply_runtime_mode_headers(response: Response) -> None: + """Attach MCP runtime mode headers to a response. + + Args: + response: Response object to annotate. + """ + response.headers["x-contextforge-mcp-runtime-mode"] = _current_mcp_runtime_mode() + response.headers["x-contextforge-mcp-transport-mounted"] = _current_mcp_transport_mount() + response.headers["x-contextforge-rust-build-included"] = "true" if _rust_build_included() else "false" + response.headers["x-contextforge-mcp-session-core-mode"] = _current_mcp_session_core_mode() + response.headers["x-contextforge-mcp-event-store-mode"] = _current_mcp_event_store_mode() + response.headers["x-contextforge-mcp-resume-core-mode"] = _current_mcp_resume_core_mode() + response.headers["x-contextforge-mcp-live-stream-core-mode"] = _current_mcp_live_stream_core_mode() + response.headers["x-contextforge-mcp-affinity-core-mode"] = _current_mcp_affinity_core_mode() + response.headers["x-contextforge-mcp-session-auth-reuse-mode"] = _current_mcp_session_auth_reuse_mode() + + @lru_cache(maxsize=512) def _parse_jsonpath(jsonpath: str) -> JSONPath: """Cache parsed JSONPath expression. 
@@ -2424,7 +3024,10 @@ def get_db(): pass # nosec B110 - Best effort cleanup on connection failure raise finally: - db.close() + try: + db.close() + except Exception: + pass # nosec B110 - Best effort cleanup on already-failed prompt bridge sessions async def _read_request_json(request: Request) -> Any: @@ -6028,17 +6631,2241 @@ async def remove_root( @utility_router.post("/rpc/") @utility_router.post("/rpc") async def handle_rpc(request: Request, db: Session = Depends(get_db), user=Depends(get_current_user_with_permissions)): - """Handle RPC requests. + """Handle authenticated public RPC requests. Args: - request (Request): The incoming FastAPI request. - db (Session): Database session. - user: The authenticated user (dict with RBAC context). + request: Incoming public RPC request. + db: Database session provided by dependency injection. + user: Authenticated user payload with permissions. Returns: - Response with the RPC result or error. + JSON-RPC response generated by the shared authenticated RPC dispatcher. + """ + return await _handle_rpc_authenticated(request, db=db, user=user) - Raises: + +@utility_router.post("/_internal/mcp/authenticate/") +@utility_router.post("/_internal/mcp/authenticate") +async def handle_internal_mcp_authenticate(request: Request): + """Authenticate a public MCP request for direct Rust ingress. + + Args: + request: Trusted internal request sent by the local Rust runtime. + + Returns: + Auth context payload that Rust can forward on subsequent internal MCP calls. + + Raises: + HTTPException: If the request is not trusted or the forwarded payload is invalid. 
+ """ + if not _is_trusted_internal_mcp_runtime_request(request): + raise HTTPException(status_code=403, detail="Internal MCP authenticate is only available to the local Rust runtime") + + payload = await request.json() + if not isinstance(payload, dict): + raise HTTPException(status_code=400, detail="Invalid internal MCP authenticate payload") + + method = str(payload.get("method") or "GET").upper() + path = payload.get("path") + query_string = payload.get("queryString", "") + forwarded_headers = payload.get("headers", {}) + client_ip = payload.get("clientIp") + + if not isinstance(path, str) or not path: + raise HTTPException(status_code=400, detail="Internal MCP authenticate payload requires path") + if not isinstance(query_string, str): + raise HTTPException(status_code=400, detail="Internal MCP authenticate payload queryString must be a string") + if not isinstance(forwarded_headers, dict) or not all(isinstance(name, str) and isinstance(value, str) for name, value in forwarded_headers.items()): + raise HTTPException(status_code=400, detail="Internal MCP authenticate payload headers must be a string map") + if client_ip is not None and not isinstance(client_ip, str): + raise HTTPException(status_code=400, detail="Internal MCP authenticate payload clientIp must be a string") + + error_response, auth_context = await _run_internal_mcp_authentication( + method=method, + path=path, + query_string=query_string, + headers=forwarded_headers, + client_ip=client_ip, + ) + if error_response is not None: + return error_response + + return ORJSONResponse(status_code=200, content={"authContext": auth_context}) + + +@utility_router.post("/_internal/mcp/rpc/") +@utility_router.post("/_internal/mcp/rpc") +async def handle_internal_mcp_rpc(request: Request): + """Handle trusted MCP dispatch forwarded from the local Rust runtime. + + Args: + request: Trusted internal MCP request from the Rust runtime. + + Returns: + JSON-RPC response from the shared authenticated RPC dispatcher. 
+ + Raises: + Exception: Propagated after rolling back the local database session. + """ + user = _build_internal_mcp_forwarded_user(request) + db = SessionLocal() + try: + response = await _handle_rpc_authenticated(request, db=db, user=user) + if db.is_active and db.in_transaction() is not None: + db.commit() + return response + except Exception: + try: + db.rollback() + except Exception: + try: + db.invalidate() + except Exception: + pass # nosec B110 - Best effort cleanup on connection failure + raise + finally: + db.close() + + +@utility_router.post("/_internal/mcp/initialize/") +@utility_router.post("/_internal/mcp/initialize") +async def handle_internal_mcp_initialize(request: Request): + """Handle trusted MCP initialize requests forwarded from the local Rust runtime. + + Args: + request: Trusted internal MCP initialize request. + + Returns: + JSON-RPC initialize response payload. + """ + user = _build_internal_mcp_forwarded_user(request) + req_id = None + try: + try: + body = orjson.loads(await request.body()) + except orjson.JSONDecodeError: + return ORJSONResponse( + status_code=400, + content={ + "jsonrpc": "2.0", + "error": {"code": -32700, "message": "Parse error"}, + "id": None, + }, + ) + + req_id = body.get("id") + if req_id is None: + req_id = str(uuid.uuid4()) + + if body.get("method") != "initialize": + return ORJSONResponse( + status_code=400, + content={ + "jsonrpc": "2.0", + "error": {"code": -32600, "message": "Invalid Request"}, + "id": req_id, + }, + ) + + params = body.get("params", {}) + if not isinstance(params, dict): + params = {} + + server_id = request.headers.get("x-contextforge-server-id") if request.headers.get("x-contextforge-mcp-runtime") == "rust" else None + if server_id: + _enforce_internal_mcp_server_scope(request, server_id) + else: + server_id = params.get("server_id") + + result = await _execute_rpc_initialize( + request, + user, + params=params, + server_id=server_id, + mcp_session_id=request.headers.get("mcp-session-id") 
or request.headers.get("x-mcp-session-id"), + ) + return ORJSONResponse(content={"jsonrpc": "2.0", "result": result, "id": req_id}) + except JSONRPCError as exc: + error = exc.to_dict() + return ORJSONResponse(content={"jsonrpc": "2.0", "error": error["error"], "id": req_id}) + except Exception as exc: + logger.error("Internal MCP initialize error: %s", exc) + return ORJSONResponse( + content={ + "jsonrpc": "2.0", + "error": {"code": -32000, "message": "Internal error", "data": str(exc)}, + "id": req_id, + } + ) + + +@utility_router.delete("/_internal/mcp/session/") +@utility_router.delete("/_internal/mcp/session") +async def handle_internal_mcp_session_delete(request: Request): + """Handle trusted MCP session teardown forwarded from the local Rust runtime. + + Args: + request: Trusted internal MCP session-delete request. + + Returns: + Empty HTTP response indicating the session was removed. + """ + _build_internal_mcp_forwarded_user(request) + auth_context = _get_internal_mcp_auth_context(request) or {} + mcp_session_id = request.headers.get("mcp-session-id") or request.headers.get("x-mcp-session-id") + if not mcp_session_id: + return ORJSONResponse(status_code=400, content={"detail": "mcp-session-id header is required"}) + + if auth_context.get("_rust_session_validated") is not True: + session_allowed, deny_status, deny_detail = await _validate_streamable_session_access( + mcp_session_id=mcp_session_id, + user_context=auth_context, + ) + if not session_allowed: + return ORJSONResponse(status_code=deny_status, content={"detail": deny_detail}) + + server_id = request.headers.get("x-contextforge-server-id") if request.headers.get("x-contextforge-mcp-runtime") == "rust" else None + if server_id: + _enforce_internal_mcp_server_scope(request, server_id) + + await session_registry.remove_session(mcp_session_id) + + if settings.mcpgateway_session_affinity_enabled: + try: + # First-Party + from mcpgateway.services.mcp_session_pool import get_mcp_session_pool # pylint: 
disable=import-outside-toplevel + + pool = get_mcp_session_pool() + await pool.cleanup_streamable_http_session_owner(mcp_session_id) + except RuntimeError: + pass + + return Response(status_code=204) + + +@utility_router.post("/_internal/mcp/notifications/initialized/") +@utility_router.post("/_internal/mcp/notifications/initialized") +async def handle_internal_mcp_notifications_initialized(request: Request): + """Handle trusted MCP notifications/initialized requests from the local Rust runtime. + + Args: + request: Trusted internal MCP notification request. + + Returns: + Empty HTTP response acknowledging the notification. + + Raises: + HTTPException: If trusted server-scope validation fails. + """ + _build_internal_mcp_forwarded_user(request) + req_id = None + try: + try: + body = orjson.loads(await request.body()) + except orjson.JSONDecodeError: + return ORJSONResponse( + status_code=400, + content={ + "jsonrpc": "2.0", + "error": {"code": -32700, "message": "Parse error"}, + "id": None, + }, + ) + + req_id = body.get("id") + if body.get("method") != "notifications/initialized": + return ORJSONResponse( + status_code=400, + content={ + "jsonrpc": "2.0", + "error": {"code": -32600, "message": "Invalid Request"}, + "id": req_id, + }, + ) + + server_id = request.headers.get("x-contextforge-server-id") if request.headers.get("x-contextforge-mcp-runtime") == "rust" else None + if server_id: + _enforce_internal_mcp_server_scope(request, server_id) + + logger.info("Client initialized") + await logging_service.notify("Client initialized", LogLevel.INFO) + return Response(status_code=status.HTTP_204_NO_CONTENT) + except HTTPException: + raise + except Exception as exc: + logger.error("Internal MCP notifications/initialized error: %s", exc) + return ORJSONResponse( + content={ + "jsonrpc": "2.0", + "error": {"code": -32000, "message": "Internal error", "data": str(exc)}, + "id": req_id, + } + ) + + +@utility_router.post("/_internal/mcp/notifications/message/") 
@utility_router.post("/_internal/mcp/notifications/message")
async def handle_internal_mcp_notifications_message(request: Request):
    """Handle trusted MCP notifications/message requests from the local Rust runtime.

    Args:
        request: Trusted internal MCP notification request.

    Returns:
        Empty HTTP response acknowledging the notification.

    Raises:
        HTTPException: If trusted server-scope validation fails.
    """
    _build_internal_mcp_forwarded_user(request)
    req_id = None
    try:
        try:
            body = orjson.loads(await request.body())
        except orjson.JSONDecodeError:
            return ORJSONResponse(
                status_code=400,
                content={
                    "jsonrpc": "2.0",
                    "error": {"code": -32700, "message": "Parse error"},
                    "id": None,
                },
            )

        req_id = body.get("id")
        if body.get("method") != "notifications/message":
            return ORJSONResponse(
                status_code=400,
                content={
                    "jsonrpc": "2.0",
                    "error": {"code": -32600, "message": "Invalid Request"},
                    "id": req_id,
                },
            )

        # Server scope is only trusted when the request provably came from the Rust runtime.
        server_id = request.headers.get("x-contextforge-server-id") if request.headers.get("x-contextforge-mcp-runtime") == "rust" else None
        if server_id:
            _enforce_internal_mcp_server_scope(request, server_id)

        params = body.get("params", {})
        if not isinstance(params, dict):
            params = {}

        await logging_service.notify(
            params.get("data"),
            LogLevel(params.get("level", "info")),
            params.get("logger"),
        )
        return Response(status_code=status.HTTP_204_NO_CONTENT)
    except HTTPException:
        raise
    except Exception as exc:
        logger.error("Internal MCP notifications/message error: %s", exc)
        # Consistency fix: every sibling internal MCP handler returns HTTP 500 for
        # unexpected failures; previously this returned HTTP 200 with an error body.
        return ORJSONResponse(
            status_code=500,
            content={
                "jsonrpc": "2.0",
                "error": {"code": -32000, "message": "Internal error", "data": str(exc)},
                "id": req_id,
            },
        )


@utility_router.post("/_internal/mcp/notifications/cancelled/")
@utility_router.post("/_internal/mcp/notifications/cancelled")
async def handle_internal_mcp_notifications_cancelled(request: Request):
    """Handle trusted MCP notifications/cancelled requests from the local Rust runtime.

    Args:
        request: Trusted internal MCP cancellation notification.

    Returns:
        Empty HTTP response acknowledging the cancellation.

    Raises:
        HTTPException: If cancellation authorization or trusted scope validation fails.
    """
    user = _build_internal_mcp_forwarded_user(request)
    req_id = None
    try:
        try:
            body = orjson.loads(await request.body())
        except orjson.JSONDecodeError:
            return ORJSONResponse(
                status_code=400,
                content={
                    "jsonrpc": "2.0",
                    "error": {"code": -32700, "message": "Parse error"},
                    "id": None,
                },
            )

        req_id = body.get("id")
        if body.get("method") != "notifications/cancelled":
            return ORJSONResponse(
                status_code=400,
                content={
                    "jsonrpc": "2.0",
                    "error": {"code": -32600, "message": "Invalid Request"},
                    "id": req_id,
                },
            )

        # Server scope is only trusted when the request provably came from the Rust runtime.
        server_id = request.headers.get("x-contextforge-server-id") if request.headers.get("x-contextforge-mcp-runtime") == "rust" else None
        if server_id:
            _enforce_internal_mcp_server_scope(request, server_id)

        params = body.get("params", {})
        if not isinstance(params, dict):
            params = {}

        raw_request_id = params.get("requestId")
        request_id = str(raw_request_id) if raw_request_id is not None else None
        reason = params.get("reason")
        logger.info("Request cancelled: %s, reason: %s", request_id, reason)
        if request_id is not None:
            # Authorize before cancelling; raises HTTPException (not a JSON-RPC error) on denial.
            await _authorize_run_cancellation(request, user, request_id, as_jsonrpc_error=False)
            await cancellation_service.cancel_run(request_id, reason=reason)
            await logging_service.notify(f"Request cancelled: {request_id}", LogLevel.INFO)
        return Response(status_code=status.HTTP_204_NO_CONTENT)
    except HTTPException:
        raise
    except Exception as exc:
        logger.error("Internal MCP notifications/cancelled error: %s", exc)
        # Consistency fix: every sibling internal MCP handler returns HTTP 500 for
        # unexpected failures; previously this returned HTTP 200 with an error body.
        return ORJSONResponse(
            status_code=500,
            content={
                "jsonrpc": "2.0",
                "error": {"code": -32000, "message": "Internal error", "data": str(exc)},
                "id": req_id,
            },
        )
@utility_router.post("/_internal/mcp/tools/list/")
@utility_router.post("/_internal/mcp/tools/list")
async def handle_internal_mcp_tools_list(request: Request):
    """Handle trusted server-scoped tools/list requests forwarded from the Rust runtime.

    Args:
        request: Trusted internal MCP tools/list request.

    Returns:
        MCP tools/list response payload for the requested virtual server.

    Raises:
        HTTPException: If the trusted server scope is missing or invalid.
    """
    # Unlike sibling handlers this endpoint requires the server-scope header unconditionally.
    server_id = request.headers.get("x-contextforge-server-id")
    if not server_id:
        raise HTTPException(status_code=400, detail="Missing trusted MCP server scope")

    db = SessionLocal()
    try:
        user = await _authorize_internal_mcp_request(
            request,
            db,
            permission="tools.read",
            method="tools/list",
            server_id=server_id,
        )
        user_email, token_teams, is_admin = _get_rpc_filter_context(request, user)
        # Admins without token-scoped teams get an unfiltered listing.
        if is_admin and token_teams is None:
            user_email = None
            token_teams = None
        elif token_teams is None:
            token_teams = []

        tools = await tool_service.list_server_mcp_tool_definitions(
            db,
            server_id,
            user_email=user_email,
            token_teams=token_teams,
        )
        return ORJSONResponse(content={"tools": tools})
    except HTTPException:
        try:
            db.rollback()
        except Exception:
            try:
                db.invalidate()
            except Exception:
                pass  # nosec B110 - Best effort cleanup on connection failure
        raise
    except JSONRPCError as exc:
        return ORJSONResponse(status_code=403, content={"code": exc.code, "message": exc.message, "data": exc.data})
    except Exception as exc:
        try:
            db.rollback()
        except Exception:
            try:
                db.invalidate()
            except Exception:
                pass  # nosec B110 - Best effort cleanup on connection failure
        return ORJSONResponse(status_code=500, content={"code": -32000, "message": "Internal error", "data": str(exc)})
    finally:
        db.close()


@utility_router.post("/_internal/mcp/resources/list/")
@utility_router.post("/_internal/mcp/resources/list")
async def handle_internal_mcp_resources_list(request: Request):
    """Handle trusted resources/list requests forwarded from the Rust runtime.

    Args:
        request: Trusted internal MCP resources/list request.

    Returns:
        MCP resources/list response payload.
    """
    db = SessionLocal()
    req_id = None
    try:
        user = _build_internal_mcp_forwarded_user(request)
        try:
            body = orjson.loads(await request.body())
        except orjson.JSONDecodeError:
            return ORJSONResponse(
                status_code=400,
                content={
                    "jsonrpc": "2.0",
                    "error": {"code": -32700, "message": "Parse error"},
                    "id": None,
                },
            )

        req_id = body.get("id") if isinstance(body, dict) else None
        if not isinstance(body, dict) or body.get("method") != "resources/list":
            return ORJSONResponse(
                status_code=400,
                content={
                    "jsonrpc": "2.0",
                    "error": {"code": -32600, "message": "Invalid Request"},
                    "id": req_id,
                },
            )

        params = body.get("params", {})
        if not isinstance(params, dict):
            params = {}

        # Header-provided scope is trusted only for Rust-runtime requests; otherwise
        # fall back to the server_id carried in the JSON-RPC params.
        server_id = request.headers.get("x-contextforge-server-id") if request.headers.get("x-contextforge-mcp-runtime") == "rust" else None
        if server_id:
            _enforce_internal_mcp_server_scope(request, server_id)
        else:
            server_id = params.get("server_id")
        cursor = params.get("cursor")

        await _authorize_internal_mcp_request(
            request,
            db,
            permission="resources.read",
            method="resources/list",
            server_id=server_id,
        )

        user_email, token_teams, is_admin = _get_rpc_filter_context(request, user)
        if is_admin and token_teams is None:
            user_email = None
            token_teams = None
        elif token_teams is None:
            token_teams = []

        if server_id:
            resources = await resource_service.list_server_resources(
                db,
                server_id,
                user_email=user_email,
                token_teams=token_teams,
            )
            payload = {"resources": [r.model_dump(by_alias=True, exclude_none=True) for r in resources]}
        else:
            resources, next_cursor = await resource_service.list_resources(
                db,
                cursor=cursor,
                limit=0,
                user_email=user_email,
                token_teams=token_teams,
            )
            payload = {"resources": [r.model_dump(by_alias=True, exclude_none=True) for r in resources]}
            if next_cursor:
                payload["nextCursor"] = next_cursor

        # NOTE(review): SQLAlchemy 1.4+ Session.in_transaction() returns a bool, so
        # "is not None" is always true and this guard reduces to db.is_active — confirm intent.
        if db.is_active and db.in_transaction() is not None:
            db.commit()
        return ORJSONResponse(content=payload)
    except JSONRPCError as exc:
        return ORJSONResponse(status_code=403, content=exc.to_dict()["error"])
    except Exception as exc:
        try:
            db.rollback()
        except Exception:
            try:
                db.invalidate()
            except Exception:
                pass  # nosec B110 - Best effort cleanup on connection failure
        return ORJSONResponse(status_code=500, content={"code": -32000, "message": "Internal error", "data": str(exc)})
    finally:
        db.close()


@utility_router.post("/_internal/mcp/resources/read/")
@utility_router.post("/_internal/mcp/resources/read")
async def handle_internal_mcp_resources_read(request: Request):
    """Handle trusted resources/read requests forwarded from the Rust runtime.

    Args:
        request: Trusted internal MCP resources/read request.

    Returns:
        MCP resources/read response payload.
    """
    db = SessionLocal()
    req_id = None
    uri = None
    try:
        user = _build_internal_mcp_forwarded_user(request)
        try:
            body = orjson.loads(await request.body())
        except orjson.JSONDecodeError:
            return ORJSONResponse(
                status_code=400,
                content={
                    "jsonrpc": "2.0",
                    "error": {"code": -32700, "message": "Parse error"},
                    "id": None,
                },
            )

        req_id = body.get("id") if isinstance(body, dict) else None
        if not isinstance(body, dict) or body.get("method") != "resources/read":
            return ORJSONResponse(
                status_code=400,
                content={
                    "jsonrpc": "2.0",
                    "error": {"code": -32600, "message": "Invalid Request"},
                    "id": req_id,
                },
            )

        params = body.get("params", {})
        if not isinstance(params, dict):
            params = {}

        server_id = request.headers.get("x-contextforge-server-id") if request.headers.get("x-contextforge-mcp-runtime") == "rust" else None
        if server_id:
            _enforce_internal_mcp_server_scope(request, server_id)
        else:
            server_id = params.get("server_id")

        await _authorize_internal_mcp_request(
            request,
            db,
            permission="resources.read",
            method="resources/read",
            server_id=server_id,
        )

        uri = params.get("uri")
        request_id = params.get("requestId")
        meta_data = params.get("_meta")
        if not uri:
            return ORJSONResponse(
                status_code=400,
                content={
                    "code": -32602,
                    "message": "Missing resource URI in parameters",
                    "data": params,
                },
            )

        auth_user_email, auth_token_teams, auth_is_admin = _get_rpc_filter_context(request, user)
        if auth_is_admin and auth_token_teams is None:
            auth_user_email = None
        elif auth_token_teams is None:
            auth_token_teams = []

        plugin_context_table = getattr(request.state, "plugin_context_table", None)
        plugin_global_context = getattr(request.state, "plugin_global_context", None)
        result = await resource_service.read_resource(
            db,
            resource_uri=uri,
            request_id=request_id,
            user=auth_user_email,
            server_id=server_id,
            token_teams=auth_token_teams,
            plugin_context_table=plugin_context_table,
            plugin_global_context=plugin_global_context,
            meta_data=meta_data,
        )
        # First-Party
        from mcpgateway.common.models import ResourceContent  # pylint: disable=import-outside-toplevel

        # Normalize the service result into the MCP "contents" wire shape;
        # binary payloads are base64-encoded per the MCP resource contract.
        if isinstance(result, ResourceContent):
            normalized_content = {"uri": result.uri}
            if result.mime_type:
                normalized_content["mimeType"] = result.mime_type
            if result.text is not None:
                normalized_content["text"] = result.text
            elif result.blob is not None:
                normalized_content["blob"] = base64.b64encode(result.blob).decode("ascii")
            payload = {"contents": [normalized_content]}
        elif hasattr(result, "model_dump"):
            payload = {"contents": [result.model_dump(by_alias=True, exclude_none=True)]}
        else:
            payload = {"contents": [result]}

        if db.is_active and db.in_transaction() is not None:
            db.commit()
        return ORJSONResponse(content=payload)
    except ResourceNotFoundError as exc:
        return ORJSONResponse(
            status_code=404,
            content={
                "code": -32002,
                "message": str(exc),
                "data": {"uri": uri} if uri else None,
            },
        )
    except ResourceError as exc:
        return ORJSONResponse(
            status_code=400,
            content={
                "code": -32602,
                "message": str(exc),
                "data": {"uri": uri} if uri else None,
            },
        )
    except JSONRPCError as exc:
        # -32003 is the access-denied code; everything else maps to a client error.
        status_code = 403 if exc.code == -32003 else 400
        return ORJSONResponse(status_code=status_code, content=exc.to_dict()["error"])
    except Exception as exc:
        try:
            db.rollback()
        except Exception:
            try:
                db.invalidate()
            except Exception:
                pass  # nosec B110 - Best effort cleanup on connection failure
        return ORJSONResponse(status_code=500, content={"code": -32000, "message": "Internal error", "data": str(exc)})
    finally:
        db.close()


@utility_router.post("/_internal/mcp/resources/subscribe/")
@utility_router.post("/_internal/mcp/resources/subscribe")
async def handle_internal_mcp_resources_subscribe(request: Request):
    """Handle trusted resources/subscribe requests forwarded from the Rust runtime.

    Args:
        request: Trusted internal MCP resources/subscribe request.

    Returns:
        Empty JSON response confirming the subscription.
    """
    db = SessionLocal()
    req_id = None
    try:
        user = _build_internal_mcp_forwarded_user(request)
        try:
            body = orjson.loads(await request.body())
        except orjson.JSONDecodeError:
            return ORJSONResponse(
                status_code=400,
                content={
                    "jsonrpc": "2.0",
                    "error": {"code": -32700, "message": "Parse error"},
                    "id": None,
                },
            )

        req_id = body.get("id") if isinstance(body, dict) else None
        if not isinstance(body, dict) or body.get("method") != "resources/subscribe":
            return ORJSONResponse(
                status_code=400,
                content={
                    "jsonrpc": "2.0",
                    "error": {"code": -32600, "message": "Invalid Request"},
                    "id": req_id,
                },
            )

        params = body.get("params", {})
        if not isinstance(params, dict):
            params = {}

        # NOTE(review): no params fallback for server_id here, unlike list/read — confirm intentional.
        server_id = request.headers.get("x-contextforge-server-id") if request.headers.get("x-contextforge-mcp-runtime") == "rust" else None
        if server_id:
            _enforce_internal_mcp_server_scope(request, server_id)

        await _authorize_internal_mcp_request(
            request,
            db,
            permission="resources.read",
            method="resources/subscribe",
            server_id=server_id,
        )

        uri = params.get("uri")
        if not uri:
            return ORJSONResponse(
                status_code=400,
                content={
                    "code": -32602,
                    "message": "Missing resource URI in parameters",
                    "data": params,
                },
            )

        access_user_email, access_token_teams = _get_scoped_resource_access_context(request, user)
        user_email = get_user_email(user)
        subscription = ResourceSubscription(uri=uri, subscriber_id=user_email)
        await resource_service.subscribe_resource(
            db,
            subscription,
            user_email=access_user_email,
            token_teams=access_token_teams,
        )
        if db.is_active and db.in_transaction() is not None:
            db.commit()
        return ORJSONResponse(content={})
    except ResourceNotFoundError as exc:
        return ORJSONResponse(
            status_code=404,
            content={"code": -32002, "message": str(exc), "data": None},
        )
    except PermissionError:
        return ORJSONResponse(
            status_code=403,
            content={"code": -32003, "message": _ACCESS_DENIED_MSG, "data": {"method": "resources/subscribe"}},
        )
    except JSONRPCError as exc:
        return ORJSONResponse(status_code=403, content=exc.to_dict()["error"])
    except Exception as exc:
        try:
            db.rollback()
        except Exception:
            try:
                db.invalidate()
            except Exception:
                pass  # nosec B110 - Best effort cleanup on connection failure
        return ORJSONResponse(status_code=500, content={"code": -32000, "message": "Internal error", "data": str(exc)})
    finally:
        db.close()


@utility_router.post("/_internal/mcp/resources/unsubscribe/")
@utility_router.post("/_internal/mcp/resources/unsubscribe")
async def handle_internal_mcp_resources_unsubscribe(request: Request):
    """Handle trusted resources/unsubscribe requests forwarded from the Rust runtime.

    Args:
        request: Trusted internal MCP resources/unsubscribe request.

    Returns:
        Empty JSON response confirming the unsubscription.
    """
    db = SessionLocal()
    req_id = None
    try:
        user = _build_internal_mcp_forwarded_user(request)
        try:
            body = orjson.loads(await request.body())
        except orjson.JSONDecodeError:
            return ORJSONResponse(
                status_code=400,
                content={
                    "jsonrpc": "2.0",
                    "error": {"code": -32700, "message": "Parse error"},
                    "id": None,
                },
            )

        req_id = body.get("id") if isinstance(body, dict) else None
        if not isinstance(body, dict) or body.get("method") != "resources/unsubscribe":
            return ORJSONResponse(
                status_code=400,
                content={
                    "jsonrpc": "2.0",
                    "error": {"code": -32600, "message": "Invalid Request"},
                    "id": req_id,
                },
            )

        params = body.get("params", {})
        if not isinstance(params, dict):
            params = {}

        server_id = request.headers.get("x-contextforge-server-id") if request.headers.get("x-contextforge-mcp-runtime") == "rust" else None
        if server_id:
            _enforce_internal_mcp_server_scope(request, server_id)

        await _authorize_internal_mcp_request(
            request,
            db,
            permission="resources.read",
            method="resources/unsubscribe",
            server_id=server_id,
        )

        uri = params.get("uri")
        if not uri:
            return ORJSONResponse(
                status_code=400,
                content={
                    "code": -32602,
                    "message": "Missing resource URI in parameters",
                    "data": params,
                },
            )

        user_email = get_user_email(user)
        subscription = ResourceSubscription(uri=uri, subscriber_id=user_email)
        await resource_service.unsubscribe_resource(db, subscription)
        if db.is_active and db.in_transaction() is not None:
            db.commit()
        return ORJSONResponse(content={})
    except JSONRPCError as exc:
        return ORJSONResponse(status_code=403, content=exc.to_dict()["error"])
    except Exception as exc:
        try:
            db.rollback()
        except Exception:
            try:
                db.invalidate()
            except Exception:
                pass  # nosec B110 - Best effort cleanup on connection failure
        return ORJSONResponse(status_code=500, content={"code": -32000, "message": "Internal error", "data": str(exc)})
    finally:
        db.close()
@utility_router.post("/_internal/mcp/resources/templates/list/")
@utility_router.post("/_internal/mcp/resources/templates/list")
async def handle_internal_mcp_resource_templates_list(request: Request):
    """Handle trusted resources/templates/list requests forwarded from the Rust runtime.

    Args:
        request: Trusted internal MCP resources/templates/list request.

    Returns:
        MCP resources/templates/list response payload.

    Raises:
        Exception: Propagated after best-effort rollback when unexpected failures occur.
    """
    db = SessionLocal()
    req_id = None
    try:
        user = _build_internal_mcp_forwarded_user(request)
        try:
            body = orjson.loads(await request.body())
        except orjson.JSONDecodeError:
            return ORJSONResponse(
                status_code=400,
                content={
                    "jsonrpc": "2.0",
                    "error": {"code": -32700, "message": "Parse error"},
                    "id": None,
                },
            )

        req_id = body.get("id") if isinstance(body, dict) else None
        if not isinstance(body, dict) or body.get("method") != "resources/templates/list":
            return ORJSONResponse(
                status_code=400,
                content={
                    "jsonrpc": "2.0",
                    "error": {"code": -32600, "message": "Invalid Request"},
                    "id": req_id,
                },
            )

        params = body.get("params", {})
        if not isinstance(params, dict):
            params = {}

        server_id = request.headers.get("x-contextforge-server-id") if request.headers.get("x-contextforge-mcp-runtime") == "rust" else None
        if server_id:
            _enforce_internal_mcp_server_scope(request, server_id)
        else:
            server_id = params.get("server_id")

        await _authorize_internal_mcp_request(
            request,
            db,
            permission="resources.read",
            method="resources/templates/list",
            server_id=server_id,
        )

        user_email, token_teams, is_admin = _get_rpc_filter_context(request, user)
        # NOTE(review): unlike the other list handlers, the admin branch here does not
        # clear user_email (and "token_teams = None" is a no-op) — confirm intentional.
        if is_admin and token_teams is None:
            token_teams = None
        elif token_teams is None:
            token_teams = []

        resource_templates = await resource_service.list_resource_templates(
            db,
            user_email=user_email,
            token_teams=token_teams,
            server_id=server_id,
        )
        payload = {"resourceTemplates": [rt.model_dump(by_alias=True, exclude_none=True) for rt in resource_templates]}

        if db.is_active and db.in_transaction() is not None:
            db.commit()
        return ORJSONResponse(content=payload)
    except JSONRPCError as exc:
        return ORJSONResponse(status_code=403, content=exc.to_dict()["error"])
    except Exception:
        try:
            db.rollback()
        except Exception:
            try:
                db.invalidate()
            except Exception:
                pass  # nosec B110 - Best effort cleanup on connection failure
        raise
    finally:
        db.close()


@utility_router.post("/_internal/mcp/roots/list/")
@utility_router.post("/_internal/mcp/roots/list")
async def handle_internal_mcp_roots_list(request: Request):
    """Handle trusted roots/list requests forwarded from the Rust runtime.

    Args:
        request: Trusted internal MCP roots/list request.

    Returns:
        MCP roots/list response payload.

    Raises:
        Exception: Propagated after best-effort rollback when unexpected failures occur.
    """
    db = SessionLocal()
    req_id = None
    try:
        _build_internal_mcp_forwarded_user(request)
        try:
            body = orjson.loads(await request.body())
        except orjson.JSONDecodeError:
            return ORJSONResponse(
                status_code=400,
                content={
                    "jsonrpc": "2.0",
                    "error": {"code": -32700, "message": "Parse error"},
                    "id": None,
                },
            )

        req_id = body.get("id") if isinstance(body, dict) else None
        if not isinstance(body, dict) or body.get("method") != "roots/list":
            return ORJSONResponse(
                status_code=400,
                content={
                    "jsonrpc": "2.0",
                    "error": {"code": -32600, "message": "Invalid Request"},
                    "id": req_id,
                },
            )

        # roots/list is gated on the admin system-config permission, not a server scope.
        await _authorize_internal_mcp_request(
            request,
            db,
            permission="admin.system_config",
            method="roots/list",
            server_id=None,
        )
        roots = await root_service.list_roots()
        payload = {"roots": [r.model_dump(by_alias=True, exclude_none=True) for r in roots]}
        if db.is_active and db.in_transaction() is not None:
            db.commit()
        return ORJSONResponse(content=payload)
    except JSONRPCError as exc:
        return ORJSONResponse(status_code=403, content=exc.to_dict()["error"])
    except Exception:
        try:
            db.rollback()
        except Exception:
            try:
                db.invalidate()
            except Exception:
                pass  # nosec B110 - Best effort cleanup on connection failure
        raise
    finally:
        db.close()


@utility_router.post("/_internal/mcp/completion/complete/")
@utility_router.post("/_internal/mcp/completion/complete")
async def handle_internal_mcp_completion_complete(request: Request):
    """Handle trusted completion/complete requests forwarded from the Rust runtime.

    Args:
        request: Trusted internal MCP completion/complete request.

    Returns:
        MCP completion response payload.
    """
    db = SessionLocal()
    req_id = None
    try:
        user = _build_internal_mcp_forwarded_user(request)
        try:
            body = orjson.loads(await request.body())
        except orjson.JSONDecodeError:
            return ORJSONResponse(
                status_code=400,
                content={
                    "jsonrpc": "2.0",
                    "error": {"code": -32700, "message": "Parse error"},
                    "id": None,
                },
            )

        req_id = body.get("id") if isinstance(body, dict) else None
        if not isinstance(body, dict) or body.get("method") != "completion/complete":
            return ORJSONResponse(
                status_code=400,
                content={
                    "jsonrpc": "2.0",
                    "error": {"code": -32600, "message": "Invalid Request"},
                    "id": req_id,
                },
            )

        params = body.get("params", {})
        if not isinstance(params, dict):
            params = {}

        server_id = request.headers.get("x-contextforge-server-id") if request.headers.get("x-contextforge-mcp-runtime") == "rust" else None
        if server_id:
            _enforce_internal_mcp_server_scope(request, server_id)
        else:
            server_id = params.get("server_id")

        await _authorize_internal_mcp_request(
            request,
            db,
            permission="tools.read",
            method="completion/complete",
            server_id=server_id,
        )

        user_email, token_teams, is_admin = _get_rpc_filter_context(request, user)
        if is_admin and token_teams is None:
            user_email = None
            token_teams = None
        elif token_teams is None:
            token_teams = []

        payload = await completion_service.handle_completion(
            db,
            params,
            user_email=user_email,
            token_teams=token_teams,
        )
        if db.is_active and db.in_transaction() is not None:
            db.commit()
        return ORJSONResponse(content=payload)
    except JSONRPCError as exc:
        return ORJSONResponse(status_code=403, content=exc.to_dict()["error"])
    except Exception as exc:
        try:
            db.rollback()
        except Exception:
            try:
                db.invalidate()
            except Exception:
                pass  # nosec B110 - Best effort cleanup on connection failure
        return ORJSONResponse(status_code=500, content={"code": -32000, "message": "Internal error", "data": str(exc)})
    finally:
        db.close()
@utility_router.post("/_internal/mcp/sampling/createMessage/")
@utility_router.post("/_internal/mcp/sampling/createMessage")
async def handle_internal_mcp_sampling_create_message(request: Request):
    """Handle trusted sampling/createMessage requests forwarded from the Rust runtime.

    Args:
        request: Trusted internal MCP sampling/createMessage request.

    Returns:
        MCP sampling/createMessage response payload.
    """
    db = SessionLocal()
    req_id = None
    try:
        _build_internal_mcp_forwarded_user(request)
        try:
            body = orjson.loads(await request.body())
        except orjson.JSONDecodeError:
            return ORJSONResponse(
                status_code=400,
                content={
                    "jsonrpc": "2.0",
                    "error": {"code": -32700, "message": "Parse error"},
                    "id": None,
                },
            )

        req_id = body.get("id") if isinstance(body, dict) else None
        if not isinstance(body, dict) or body.get("method") != "sampling/createMessage":
            return ORJSONResponse(
                status_code=400,
                content={
                    "jsonrpc": "2.0",
                    "error": {"code": -32600, "message": "Invalid Request"},
                    "id": req_id,
                },
            )

        # NOTE(review): unlike sibling handlers there is no _authorize_internal_mcp_request
        # call here — confirm sampling authorization happens inside sampling_handler or upstream.
        if request.headers.get("x-contextforge-mcp-runtime") == "rust":
            server_id = request.headers.get("x-contextforge-server-id")
            if server_id:
                _enforce_internal_mcp_server_scope(request, server_id)

        params = body.get("params", {})
        if not isinstance(params, dict):
            params = {}

        payload = await sampling_handler.create_message(db, params)
        if db.is_active and db.in_transaction() is not None:
            db.commit()
        return ORJSONResponse(content=payload)
    except JSONRPCError as exc:
        return ORJSONResponse(status_code=403, content=exc.to_dict()["error"])
    except Exception as exc:
        try:
            db.rollback()
        except Exception:
            try:
                db.invalidate()
            except Exception:
                pass  # nosec B110 - Best effort cleanup on connection failure
        return ORJSONResponse(status_code=500, content={"code": -32000, "message": "Internal error", "data": str(exc)})
    finally:
        db.close()
@utility_router.post("/_internal/mcp/logging/setLevel/")
@utility_router.post("/_internal/mcp/logging/setLevel")
async def handle_internal_mcp_logging_set_level(request: Request):
    """Handle trusted logging/setLevel requests forwarded from the Rust runtime.

    Args:
        request: Trusted internal MCP logging/setLevel request.

    Returns:
        Empty JSON response confirming the new log level.
    """
    db = SessionLocal()
    req_id = None
    try:
        _build_internal_mcp_forwarded_user(request)
        try:
            body = orjson.loads(await request.body())
        except orjson.JSONDecodeError:
            return ORJSONResponse(
                status_code=400,
                content={
                    "jsonrpc": "2.0",
                    "error": {"code": -32700, "message": "Parse error"},
                    "id": None,
                },
            )

        req_id = body.get("id") if isinstance(body, dict) else None
        if not isinstance(body, dict) or body.get("method") != "logging/setLevel":
            return ORJSONResponse(
                status_code=400,
                content={
                    "jsonrpc": "2.0",
                    "error": {"code": -32600, "message": "Invalid Request"},
                    "id": req_id,
                },
            )

        await _authorize_internal_mcp_request(
            request,
            db,
            permission="admin.system_config",
            method="logging/setLevel",
            server_id=None,
        )

        params = body.get("params", {})
        if not isinstance(params, dict):
            params = {}

        # An invalid/missing level raises from the LogLevel constructor and is
        # reported via the generic 500 handler below.
        level = LogLevel(params.get("level"))
        await logging_service.set_level(level)
        if db.is_active and db.in_transaction() is not None:
            db.commit()
        return ORJSONResponse(content={})
    except JSONRPCError as exc:
        return ORJSONResponse(status_code=403, content=exc.to_dict()["error"])
    except Exception as exc:
        try:
            db.rollback()
        except Exception:
            try:
                db.invalidate()
            except Exception:
                pass  # nosec B110 - Best effort cleanup on connection failure
        return ORJSONResponse(status_code=500, content={"code": -32000, "message": "Internal error", "data": str(exc)})
    finally:
        db.close()


@utility_router.post("/_internal/mcp/prompts/list/")
@utility_router.post("/_internal/mcp/prompts/list")
async def handle_internal_mcp_prompts_list(request: Request):
    """Handle trusted prompts/list requests forwarded from the Rust runtime.

    Args:
        request: Trusted internal MCP prompts/list request.

    Returns:
        MCP prompts/list response payload.

    Raises:
        Exception: Propagated after best-effort rollback when unexpected failures occur.
    """
    db = SessionLocal()
    req_id = None
    try:
        user = _build_internal_mcp_forwarded_user(request)
        try:
            body = orjson.loads(await request.body())
        except orjson.JSONDecodeError:
            return ORJSONResponse(
                status_code=400,
                content={
                    "jsonrpc": "2.0",
                    "error": {"code": -32700, "message": "Parse error"},
                    "id": None,
                },
            )

        req_id = body.get("id") if isinstance(body, dict) else None
        if not isinstance(body, dict) or body.get("method") != "prompts/list":
            return ORJSONResponse(
                status_code=400,
                content={
                    "jsonrpc": "2.0",
                    "error": {"code": -32600, "message": "Invalid Request"},
                    "id": req_id,
                },
            )

        params = body.get("params", {})
        if not isinstance(params, dict):
            params = {}

        server_id = request.headers.get("x-contextforge-server-id") if request.headers.get("x-contextforge-mcp-runtime") == "rust" else None
        if server_id:
            _enforce_internal_mcp_server_scope(request, server_id)
        else:
            server_id = params.get("server_id")
        cursor = params.get("cursor")

        await _authorize_internal_mcp_request(
            request,
            db,
            permission="prompts.read",
            method="prompts/list",
            server_id=server_id,
        )

        user_email, token_teams, is_admin = _get_rpc_filter_context(request, user)
        if is_admin and token_teams is None:
            user_email = None
            token_teams = None
        elif token_teams is None:
            token_teams = []

        if server_id:
            prompts = await prompt_service.list_server_prompts(
                db,
                server_id,
                cursor=cursor,
                user_email=user_email,
                token_teams=token_teams,
            )
            payload = {"prompts": [p.model_dump(by_alias=True, exclude_none=True) for p in prompts]}
        else:
            prompts, next_cursor = await prompt_service.list_prompts(
                db,
                cursor=cursor,
                limit=0,
                user_email=user_email,
                token_teams=token_teams,
            )
            payload = {"prompts": [p.model_dump(by_alias=True, exclude_none=True) for p in prompts]}
            if next_cursor:
                payload["nextCursor"] = next_cursor

        if db.is_active and db.in_transaction() is not None:
            db.commit()
        return ORJSONResponse(content=payload)
    except JSONRPCError as exc:
        return ORJSONResponse(status_code=403, content=exc.to_dict()["error"])
    except Exception:
        try:
            db.rollback()
        except Exception:
            try:
                db.invalidate()
            except Exception:
                pass  # nosec B110 - Best effort cleanup on connection failure
        raise
    finally:
        db.close()


@utility_router.post("/_internal/mcp/prompts/get/")
@utility_router.post("/_internal/mcp/prompts/get")
async def handle_internal_mcp_prompts_get(request: Request):
    """Handle trusted prompts/get requests forwarded from the Rust runtime.

    Args:
        request: Trusted internal MCP prompts/get request.

    Returns:
        MCP prompts/get response payload.

    Raises:
        Exception: Propagated after best-effort rollback when unexpected failures occur.
    """
    db = SessionLocal()
    req_id = None
    name = None
    try:
        user = _build_internal_mcp_forwarded_user(request)
        try:
            body = orjson.loads(await request.body())
        except orjson.JSONDecodeError:
            return ORJSONResponse(
                status_code=400,
                content={
                    "jsonrpc": "2.0",
                    "error": {"code": -32700, "message": "Parse error"},
                    "id": None,
                },
            )

        req_id = body.get("id") if isinstance(body, dict) else None
        if not isinstance(body, dict) or body.get("method") != "prompts/get":
            return ORJSONResponse(
                status_code=400,
                content={
                    "jsonrpc": "2.0",
                    "error": {"code": -32600, "message": "Invalid Request"},
                    "id": req_id,
                },
            )

        params = body.get("params", {})
        if not isinstance(params, dict):
            params = {}

        server_id = request.headers.get("x-contextforge-server-id") if request.headers.get("x-contextforge-mcp-runtime") == "rust" else None
        if server_id:
            _enforce_internal_mcp_server_scope(request, server_id)
        else:
            server_id = params.get("server_id")

        await _authorize_internal_mcp_request(
            request,
            db,
            permission="prompts.read",
            method="prompts/get",
            server_id=server_id,
        )

        name = params.get("name")
        arguments = params.get("arguments", {})
        meta_data = params.get("_meta")
        if not name:
            return ORJSONResponse(
                status_code=400,
                content={
                    "code": -32602,
                    "message": "Missing prompt name in parameters",
                    "data": params,
                },
            )

        auth_user_email, auth_token_teams, auth_is_admin = _get_rpc_filter_context(request, user)
        if auth_is_admin and auth_token_teams is None:
            auth_user_email = None
        elif auth_token_teams is None:
            auth_token_teams = []

        plugin_context_table = getattr(request.state, "plugin_context_table", None)
        plugin_global_context = getattr(request.state, "plugin_global_context", None)
        result = await prompt_service.get_prompt(
            db,
            name,
            arguments,
            user=auth_user_email,
            server_id=server_id,
            token_teams=auth_token_teams,
            plugin_context_table=plugin_context_table,
            plugin_global_context=plugin_global_context,
            _meta_data=meta_data,
        )
        payload = result.model_dump(by_alias=True, exclude_none=True) if hasattr(result, "model_dump") else result

        if db.is_active and db.in_transaction() is not None:
            db.commit()
        return ORJSONResponse(content=payload)
    except PromptNotFoundError as exc:
        return ORJSONResponse(
            status_code=404,
            content={
                "code": -32002,
                "message": str(exc),
                "data": {"name": name} if name else None,
            },
        )
    except PromptError as exc:
        try:
            if db.is_active and db.in_transaction() is not None:
                db.rollback()
        except Exception:
            try:
                db.invalidate()
            except Exception:
                pass  # nosec B110 - Best effort cleanup on connection failure
        return ORJSONResponse(
            status_code=422,
            content={
                "code": -32000,
                "message": str(exc),
                "data": {"name": name} if name else None,
            },
        )
    except JSONRPCError as exc:
        # -32003 is the access-denied code; everything else maps to a client error.
        status_code = 403 if exc.code == -32003 else 400
        return ORJSONResponse(status_code=status_code, content=exc.to_dict()["error"])
    except Exception:
        try:
            db.rollback()
        except Exception:
            try:
                db.invalidate()
            except Exception:
                pass  # nosec B110 - Best effort cleanup on connection failure
        raise
    finally:
        db.close()


@utility_router.post("/_internal/mcp/tools/list/authz/")
@utility_router.post("/_internal/mcp/tools/list/authz")
async def handle_internal_mcp_tools_list_authz(request: Request):
    """Authorize trusted server-scoped tools/list requests for the Rust direct-DB path.

    Args:
        request: Trusted internal MCP authz request.

    Returns:
        Empty success response when the request is authorized.
    """
    return await _authorize_internal_mcp_server_scoped_method(
        request,
        permission="tools.read",
        method="tools/list",
    )


async def _authorize_internal_mcp_server_scoped_method(
    request: Request,
    *,
    permission: str,
    method: str,
) -> Response:
    """Authorize a trusted server-scoped MCP method for Rust direct-path execution.

    Args:
        request: Trusted internal MCP authz request.
        permission: Permission required for the target method.
        method: MCP method name being authorized.

    Returns:
        Empty success response when the method is authorized, otherwise a JSON error response.

    Raises:
        HTTPException: If the trusted server scope header is missing.
        Exception: Propagated after best-effort rollback when unexpected failures occur.
    """
    server_id = request.headers.get("x-contextforge-server-id")
    if not server_id:
        raise HTTPException(status_code=400, detail="Missing trusted MCP server scope")

    db = SessionLocal()
    try:
        await _authorize_internal_mcp_request(
            request,
            db,
            permission=permission,
            method=method,
            server_id=server_id,
        )
        if db.is_active and db.in_transaction() is not None:
            db.commit()
        return Response(status_code=status.HTTP_204_NO_CONTENT)
    except JSONRPCError as exc:
        return ORJSONResponse(status_code=403, content={"code": exc.code, "message": exc.message, "data": exc.data})
    except Exception:
        try:
            db.rollback()
        except Exception:
            try:
                db.invalidate()
            except Exception:
                pass  # nosec B110 - Best effort cleanup on connection failure
        raise
    finally:
        db.close()


@utility_router.post("/_internal/mcp/resources/list/authz/")
@utility_router.post("/_internal/mcp/resources/list/authz")
async def handle_internal_mcp_resources_list_authz(request: Request):
    """Authorize trusted server-scoped resources/list requests for Rust direct-path execution.

    Args:
        request: Trusted internal MCP authz request.

    Returns:
        Empty success response when the request is authorized.
    """
    return await _authorize_internal_mcp_server_scoped_method(
        request,
        permission="resources.read",
        method="resources/list",
    )


@utility_router.post("/_internal/mcp/resources/read/authz/")
@utility_router.post("/_internal/mcp/resources/read/authz")
async def handle_internal_mcp_resources_read_authz(request: Request):
    """Authorize trusted server-scoped resources/read requests for Rust direct-path execution.

    Args:
        request: Trusted internal MCP authz request.

    Returns:
        Empty success response when the request is authorized.
    """
    return await _authorize_internal_mcp_server_scoped_method(
        request,
        permission="resources.read",
        method="resources/read",
    )


@utility_router.post("/_internal/mcp/resources/templates/list/authz/")
@utility_router.post("/_internal/mcp/resources/templates/list/authz")
async def handle_internal_mcp_resource_templates_list_authz(request: Request):
    """Authorize trusted server-scoped resources/templates/list requests for Rust direct-path execution.

    Args:
        request: Trusted internal MCP authz request.

    Returns:
        Empty success response when the request is authorized.
    """
    return await _authorize_internal_mcp_server_scoped_method(
        request,
        permission="resources.read",
        method="resources/templates/list",
    )


@utility_router.post("/_internal/mcp/prompts/list/authz/")
@utility_router.post("/_internal/mcp/prompts/list/authz")
async def handle_internal_mcp_prompts_list_authz(request: Request):
    """Authorize trusted server-scoped prompts/list requests for Rust direct-path execution.

    Args:
        request: Trusted internal MCP authz request.

    Returns:
        Empty success response when the request is authorized.
+ """ + return await _authorize_internal_mcp_server_scoped_method( + request, + permission="prompts.read", + method="prompts/list", + ) + + +@utility_router.post("/_internal/mcp/prompts/get/authz/") +@utility_router.post("/_internal/mcp/prompts/get/authz") +async def handle_internal_mcp_prompts_get_authz(request: Request): + """Authorize trusted server-scoped prompts/get requests for Rust direct-path execution. + + Args: + request: Trusted internal MCP authz request. + + Returns: + Empty success response when the request is authorized. + """ + return await _authorize_internal_mcp_server_scoped_method( + request, + permission="prompts.read", + method="prompts/get", + ) + + +async def _maybe_forward_affinitized_rpc_request( + request: Request, + *, + method: str, + params: Dict[str, Any], + req_id: Any, + lowered_request_headers: Dict[str, str], +) -> Optional[Dict[str, Any]]: + """Forward an MCP request to the owning worker when session affinity requires it. + + Args: + request: Incoming RPC request. + method: MCP method name being executed. + params: Parsed JSON-RPC params payload. + req_id: JSON-RPC request identifier. + lowered_request_headers: Lower-cased request headers used for forwarding. + + Returns: + Forwarded JSON-RPC response payload when affinity forwarding handled the + request, otherwise ``None`` so local execution can continue. 
+ """ + request_headers = request.headers + rpc_client_host = getattr(getattr(request, "client", None), "host", None) + rpc_from_loopback = rpc_client_host in ("127.0.0.1", "::1") if rpc_client_host else False + mcp_session_id = request_headers.get("mcp-session-id") or request_headers.get("x-mcp-session-id") + is_internally_forwarded = rpc_from_loopback and request_headers.get("x-forwarded-internally") == "true" + + if settings.mcpgateway_session_affinity_enabled and mcp_session_id and method != "initialize" and not is_internally_forwarded: + # First-Party + from mcpgateway.services.mcp_session_pool import MCPSessionPool, WORKER_ID # pylint: disable=import-outside-toplevel + + if not MCPSessionPool.is_valid_mcp_session_id(mcp_session_id): + logger.debug("Invalid MCP session id for affinity forwarding, executing locally") + return None + + session_short = mcp_session_id[:8] if len(mcp_session_id) >= 8 else mcp_session_id + logger.debug("[AFFINITY] Worker %s | Session %s... | Method: %s | RPC request received, checking affinity", WORKER_ID, session_short, method) + try: + # First-Party + from mcpgateway.services.mcp_session_pool import get_mcp_session_pool # pylint: disable=import-outside-toplevel + + pool = get_mcp_session_pool() + forwarded_response = await pool.forward_request_to_owner( + mcp_session_id, + {"method": method, "params": params, "headers": lowered_request_headers, "req_id": req_id}, + ) + if forwarded_response is not None: + logger.info("[AFFINITY] Worker %s | Session %s... | Method: %s | Forwarded response received", WORKER_ID, session_short, method) + if "error" in forwarded_response: + return {"jsonrpc": "2.0", "error": forwarded_response["error"], "id": req_id} + return {"jsonrpc": "2.0", "result": forwarded_response.get("result", {}), "id": req_id} + except RuntimeError: + logger.debug("[AFFINITY] Worker %s | Session %s... 
| Method: %s | Pool not initialized, executing locally", WORKER_ID, session_short, method) + return None + + if is_internally_forwarded and mcp_session_id: + # First-Party + from mcpgateway.services.mcp_session_pool import WORKER_ID # pylint: disable=import-outside-toplevel + + session_short = mcp_session_id[:8] if len(mcp_session_id) >= 8 else mcp_session_id + logger.debug("[AFFINITY] Worker %s | Session %s... | Method: %s | Internally forwarded request, executing locally", WORKER_ID, session_short, method) + + return None + + +async def _execute_rpc_initialize( + request: Request, + user, + *, + params: Dict[str, Any], + server_id: Optional[str], + mcp_session_id: Optional[str], +): + """Execute the MCP initialize handshake while preserving session ownership semantics. + + Args: + request: Incoming RPC request. + user: Authenticated user payload. + params: Initialize params payload. + server_id: Optional virtual server identifier. + mcp_session_id: Session id from the transport headers, when present. + + Returns: + Serialized initialize result payload. + + Raises: + JSONRPCError: If session ownership cannot be claimed or validated. 
+ """ + init_session_id = params.get("session_id") or params.get("sessionId") or request.query_params.get("session_id") + requester_email, requester_is_admin = _get_request_identity(request, user) + + if init_session_id: + effective_owner = await session_registry.claim_session_owner(init_session_id, requester_email) + if effective_owner is None: + raise JSONRPCError(-32003, _ACCESS_DENIED_MSG, {"method": "initialize"}) + + if effective_owner and not requester_is_admin and requester_email != effective_owner: + raise JSONRPCError(-32003, _ACCESS_DENIED_MSG, {"method": "initialize"}) + + result = await session_registry.handle_initialize_logic(params, session_id=init_session_id, server_id=server_id) + if hasattr(result, "model_dump"): + result = result.model_dump(by_alias=True, exclude_none=True) + + if settings.mcpgateway_session_affinity_enabled and mcp_session_id and mcp_session_id != "not-provided": + try: + # First-Party + from mcpgateway.services.mcp_session_pool import get_mcp_session_pool, WORKER_ID # pylint: disable=import-outside-toplevel + + pool = get_mcp_session_pool() + await pool.register_pool_session_owner(mcp_session_id) + logger.debug("[AFFINITY_INIT] Worker %s | Session %s... | Registered ownership after initialize", WORKER_ID, mcp_session_id[:8]) + except Exception as e: + logger.warning("[AFFINITY_INIT] Failed to register session ownership: %s", e) + + return result + + +async def _execute_rpc_tools_call( + request: Request, + db: Session, + user, + *, + req_id: Any, + params: Dict[str, Any], + lowered_request_headers: Dict[str, str], + server_id: Optional[str], +): + """Execute the hot-path ``tools/call`` branch without the generic RPC method switch. + + Args: + request: Incoming RPC request. + db: Active database session. + user: Authenticated user payload. + req_id: JSON-RPC request identifier. + params: Parsed tools/call params payload. + lowered_request_headers: Lower-cased request headers used for passthrough. 
+ server_id: Optional virtual server identifier. + + Returns: + Serialized MCP tools/call result payload. + + Raises: + JSONRPCError: If the tool name is missing, execution is cancelled, or the + downstream tool branch reports a JSON-RPC-visible failure. + """ + name = params.get("name") + arguments = params.get("arguments", {}) + meta_data = params.get("_meta", None) + if not name: + raise JSONRPCError(-32602, "Missing tool name in parameters", params) + + auth_user_email, auth_token_teams, auth_is_admin = _get_rpc_filter_context(request, user) + run_owner_email = auth_user_email + run_owner_team_ids = [] if auth_token_teams is None else list(auth_token_teams) + if auth_is_admin and auth_token_teams is None: + auth_user_email = None + elif auth_token_teams is None: + auth_token_teams = [] + + oauth_user_email = get_user_email(user) + plugin_context_table = getattr(request.state, "plugin_context_table", None) + plugin_global_context = getattr(request.state, "plugin_global_context", None) + + run_id = str(req_id) if req_id is not None else None + tool_task: Optional[asyncio.Task] = None + + async def cancel_tool_task(reason: Optional[str] = None): + """Cancel the active tool execution task when cancellation is requested. + + Args: + reason: Optional human-readable cancellation reason. 
+ """ + if tool_task and not tool_task.done(): + logger.info("Cancelling tool task for run_id=%s, reason=%s", run_id, reason) + tool_task.cancel() + + if settings.mcpgateway_tool_cancellation_enabled and run_id: + await cancellation_service.register_run( + run_id, + name=f"tool:{name}", + cancel_callback=cancel_tool_task, + owner_email=run_owner_email, + owner_team_ids=run_owner_team_ids, + ) + + try: + if settings.mcpgateway_tool_cancellation_enabled and run_id: + run_status = await cancellation_service.get_status(run_id) + if run_status and run_status.get("cancelled"): + raise JSONRPCError(-32800, f"Tool execution cancelled: {name}", {"requestId": run_id}) + + async def execute_tool(): + """Execute the tool invocation using the existing Python service layer. + + Returns: + Result returned by the Python tool service. + + Raises: + JSONRPCError: If the requested tool cannot be found. + """ + try: + return await tool_service.invoke_tool( + db=db, + name=name, + arguments=arguments, + request_headers=lowered_request_headers, + app_user_email=oauth_user_email, + user_email=auth_user_email, + token_teams=auth_token_teams, + server_id=server_id, + plugin_context_table=plugin_context_table, + plugin_global_context=plugin_global_context, + meta_data=meta_data, + ) + except (ToolNotFoundError, ValueError): + logger.error("Tool not found: %s", name) + raise JSONRPCError(-32601, f"Tool not found: {name}", None) + + tool_task = asyncio.create_task(execute_tool()) + + if settings.mcpgateway_tool_cancellation_enabled and run_id: + run_status = await cancellation_service.get_status(run_id) + if run_status and run_status.get("cancelled"): + tool_task.cancel() + + try: + result = await tool_task + if hasattr(result, "model_dump"): + result = result.model_dump(by_alias=True, exclude_none=True) + return result + except asyncio.CancelledError as exc: + logger.info("Tool execution cancelled for run_id=%s, tool=%s", run_id, name) + raise JSONRPCError(-32800, f"Tool execution cancelled: 
{name}", {"requestId": run_id, "partial": False}) from exc + finally: + if settings.mcpgateway_tool_cancellation_enabled and run_id: + await cancellation_service.unregister_run(run_id) + + +@utility_router.post("/_internal/mcp/tools/call/") +@utility_router.post("/_internal/mcp/tools/call") +async def handle_internal_mcp_tools_call(request: Request): + """Handle trusted tools/call requests forwarded from the local Rust runtime. + + Args: + request: Trusted internal MCP tools/call request. + + Returns: + JSON-RPC response payload for the tools/call request. + + Raises: + PluginError: Re-raised so plugin middleware can preserve existing behavior. + PluginViolationError: Re-raised so plugin middleware can preserve existing behavior. + Exception: Propagated after best-effort rollback when unexpected failures occur. + """ + req_id = None + db = SessionLocal() + try: + user = _build_internal_mcp_forwarded_user(request) + try: + body = orjson.loads(await request.body()) + except orjson.JSONDecodeError: + return ORJSONResponse( + status_code=400, + content={ + "jsonrpc": "2.0", + "error": {"code": -32700, "message": "Parse error"}, + "id": None, + }, + ) + + if not isinstance(body, dict) or body.get("method") != "tools/call": + return ORJSONResponse( + status_code=400, + content={ + "jsonrpc": "2.0", + "error": {"code": -32600, "message": "Invalid Request"}, + "id": body.get("id") if isinstance(body, dict) else None, + }, + ) + + req_id = body.get("id") + if req_id is None: + req_id = str(uuid.uuid4()) + params = body.get("params", {}) + if not isinstance(params, dict): + params = {} + + server_id = request.headers.get("x-contextforge-server-id") or params.get("server_id") + if server_id: + _enforce_internal_mcp_server_scope(request, server_id) + + lowered_request_headers = {k.lower(): v for k, v in request.headers.items()} + forwarded_response = await _maybe_forward_affinitized_rpc_request( + request, + method="tools/call", + params=params, + req_id=req_id, + 
lowered_request_headers=lowered_request_headers, + ) + if forwarded_response is not None: + return forwarded_response + + if (_get_internal_mcp_auth_context(request) or {}).get("is_authenticated", True) is True: + await _ensure_rpc_permission(user, db, "tools.execute", "tools/call", request=request) + + try: + result = await _execute_rpc_tools_call( + request, + db, + user, + req_id=req_id, + params=params, + lowered_request_headers=lowered_request_headers, + server_id=server_id, + ) + finally: + if db.is_active and db.in_transaction() is not None: + db.commit() + db.close() + + return {"jsonrpc": "2.0", "result": result, "id": req_id} + except (PluginError, PluginViolationError): + raise + except JSONRPCError as e: + error = e.to_dict() + return {"jsonrpc": "2.0", "error": error["error"], "id": req_id} + except Exception: + try: + db.rollback() + except Exception: + try: + db.invalidate() + except Exception: + pass # nosec B110 - Best effort cleanup on connection failure + raise + finally: + try: + db.close() + except Exception: + pass # nosec B110 - Best effort cleanup on connection failure + + +@utility_router.post("/_internal/mcp/tools/call/resolve/") +@utility_router.post("/_internal/mcp/tools/call/resolve") +async def handle_internal_mcp_tools_call_resolve(request: Request): + """Resolve a Rust-direct MCP tools/call execution plan without executing the tool. + + Args: + request: Trusted internal MCP tools/call resolve request. + + Returns: + JSON response containing either an execution plan or a JSON-RPC-visible error. + + Raises: + PluginError: Re-raised so plugin middleware can preserve existing behavior. + PluginViolationError: Re-raised so plugin middleware can preserve existing behavior. + Exception: Propagated after best-effort rollback when unexpected failures occur. 
+ """ + db = SessionLocal() + try: + user = _build_internal_mcp_forwarded_user(request) + try: + body = orjson.loads(await request.body()) + except orjson.JSONDecodeError: + return ORJSONResponse( + status_code=400, + content={ + "jsonrpc": "2.0", + "error": {"code": -32700, "message": "Parse error"}, + "id": None, + }, + ) + + if not isinstance(body, dict) or body.get("method") != "tools/call": + return ORJSONResponse( + status_code=400, + content={ + "jsonrpc": "2.0", + "error": {"code": -32600, "message": "Invalid Request"}, + "id": body.get("id") if isinstance(body, dict) else None, + }, + ) + + params = body.get("params", {}) + if not isinstance(params, dict): + params = {} + + name = params.get("name") + if not name: + return ORJSONResponse( + status_code=400, + content={ + "jsonrpc": "2.0", + "error": {"code": -32602, "message": "Missing tool name in parameters"}, + "id": body.get("id"), + }, + ) + + server_id = request.headers.get("x-contextforge-server-id") or params.get("server_id") + if server_id: + _enforce_internal_mcp_server_scope(request, server_id) + + if (_get_internal_mcp_auth_context(request) or {}).get("is_authenticated", True) is True: + await _ensure_rpc_permission(user, db, "tools.execute", "tools/call", request=request) + + auth_user_email, auth_token_teams, auth_is_admin = _get_rpc_filter_context(request, user) + if auth_is_admin and auth_token_teams is None: + auth_user_email = None + elif auth_token_teams is None: + auth_token_teams = [] + + plan = await tool_service.prepare_rust_mcp_tool_execution( + db=db, + name=name, + request_headers={k.lower(): v for k, v in request.headers.items()}, + app_user_email=get_user_email(user), + user_email=auth_user_email, + token_teams=auth_token_teams, + server_id=server_id, + ) + + if db.is_active and db.in_transaction() is not None: + db.commit() + return ORJSONResponse(content=plan) + except ToolNotFoundError as exc: + request_id = body.get("id") if isinstance(body, dict) else None + return 
ORJSONResponse( + status_code=404, + content={ + "jsonrpc": "2.0", + "error": {"code": -32601, "message": str(exc)}, + "id": request_id, + }, + ) + except ToolError as exc: + request_id = body.get("id") if isinstance(body, dict) else None + return ORJSONResponse( + status_code=400, + content={ + "jsonrpc": "2.0", + "error": {"code": -32000, "message": str(exc)}, + "id": request_id, + }, + ) + except (PluginError, PluginViolationError): + raise + except JSONRPCError as exc: + return ORJSONResponse(status_code=403, content=exc.to_dict()["error"]) + except Exception: + try: + db.rollback() + except Exception: + try: + db.invalidate() + except Exception: + pass # nosec B110 - Best effort cleanup on connection failure + raise + finally: + try: + db.close() + except Exception: + pass # nosec B110 - Best effort cleanup on connection failure + + +@utility_router.post("/_internal/mcp/tools/call/metric/") +@utility_router.post("/_internal/mcp/tools/call/metric") +async def handle_internal_mcp_tools_call_metric(request: Request): + """Record buffered tool/server metrics for a Rust-direct `tools/call`. + + Args: + request: Trusted internal metrics writeback request. + + Returns: + ORJSONResponse acknowledging the buffered metric writeback. 
+ """ + _build_internal_mcp_forwarded_user(request) + try: + body = orjson.loads(await request.body()) + except orjson.JSONDecodeError: + return ORJSONResponse(status_code=400, content={"detail": "Invalid JSON body"}) + + if not isinstance(body, dict): + return ORJSONResponse(status_code=400, content={"detail": "Invalid metrics payload"}) + + tool_id = body.get("toolId") + duration_ms = body.get("durationMs") + success = body.get("success") + server_id = body.get("serverId") + error_message = body.get("errorMessage") + + if not isinstance(tool_id, str) or not tool_id.strip(): + return ORJSONResponse(status_code=400, content={"detail": "Missing toolId"}) + if not isinstance(duration_ms, (int, float)) or duration_ms < 0: + return ORJSONResponse(status_code=400, content={"detail": "Invalid durationMs"}) + if not isinstance(success, bool): + return ORJSONResponse(status_code=400, content={"detail": "Invalid success flag"}) + if server_id is not None and (not isinstance(server_id, str) or not server_id.strip()): + return ORJSONResponse(status_code=400, content={"detail": "Invalid serverId"}) + if error_message is not None and not isinstance(error_message, str): + return ORJSONResponse(status_code=400, content={"detail": "Invalid errorMessage"}) + + request_server_id = request.headers.get("x-contextforge-server-id") + if request_server_id: + _enforce_internal_mcp_server_scope(request, request_server_id) + if server_id and server_id != request_server_id: + return ORJSONResponse(status_code=400, content={"detail": "serverId does not match forwarded server scope"}) + server_id = request_server_id + + # First-Party + from mcpgateway.services.metrics_buffer_service import get_metrics_buffer_service # pylint: disable=import-outside-toplevel + + metrics_buffer = get_metrics_buffer_service() + response_time = float(duration_ms) / 1000.0 + metrics_buffer.record_tool_metric_with_duration( + tool_id=tool_id, + response_time=response_time, + success=success, + 
error_message=error_message, + ) + if server_id: + metrics_buffer.record_server_metric_with_duration( + server_id=server_id, + response_time=response_time, + success=success, + error_message=error_message, + ) + + return ORJSONResponse(content={"status": "ok"}) + + +async def _handle_rpc_authenticated(request: Request, db: Session, user): + """Handle RPC requests. + + Args: + request (Request): The incoming FastAPI request. + db (Session): Database session. + user: The authenticated user (dict with RBAC context). + + Returns: + Response with the RPC result or error. + + Raises: PluginError: If encounters issue with plugin PluginViolationError: If plugin violated the request. Example - In case of OPA plugin, if the request is denied by policy. """ @@ -6064,13 +8891,35 @@ async def handle_rpc(request: Request, db: Session = Depends(get_db), user=Depen "id": None, }, ) + request_headers = request.headers + lowered_headers: Optional[Dict[str, str]] = None + + def _lowered_request_headers() -> Dict[str, str]: + """Return a cached lower-cased copy of the incoming request headers. + + Returns: + Dict[str, str]: Lower-cased request headers cached for repeated access. 
+ """ + nonlocal lowered_headers + if lowered_headers is None: + lowered_headers = {k.lower(): v for k, v in request_headers.items()} + return lowered_headers + + _trusted_internal_mcp_dispatch = _get_internal_mcp_auth_context(request) is not None + _internal_runtime_server_id = request_headers.get("x-contextforge-server-id") if request_headers.get("x-contextforge-mcp-runtime") == "rust" else None + method = body["method"] req_id = body.get("id") if req_id is None: req_id = str(uuid.uuid4()) params = body.get("params", {}) + if not isinstance(params, dict): + params = {} + if _internal_runtime_server_id: + params["server_id"] = _internal_runtime_server_id server_id = params.get("server_id", None) cursor = params.get("cursor") # Extract cursor parameter + mcp_session_id = request_headers.get("mcp-session-id") or request_headers.get("x-mcp-session-id") # RBAC: Enforce server_id scoping for server-scoped tokens. # Extract token scopes once, then: @@ -6081,6 +8930,11 @@ async def handle_rpc(request: Request, db: Session = Depends(get_db), user=Depen _cached = getattr(request.state, "_jwt_verified_payload", None) _jwt_payload = _cached[1] if (isinstance(_cached, tuple) and len(_cached) == 2 and isinstance(_cached[1], dict)) else None _token_scopes = _jwt_payload.get("scopes", {}) if _jwt_payload else {} + _internal_auth_context = _get_internal_mcp_auth_context(request) + if (not _token_scopes) and isinstance(_internal_auth_context, dict): + _scoped_server_id = _internal_auth_context.get("scoped_server_id") + if isinstance(_scoped_server_id, str) and _scoped_server_id: + _token_scopes = {"server_id": _scoped_server_id} _token_server_id = _token_scopes.get("server_id") if _token_scopes else None if server_id: @@ -6096,91 +8950,27 @@ async def handle_rpc(request: Request, db: Session = Depends(get_db), user=Depen elif _token_server_id is not None: server_id = _token_server_id - RPCRequest(jsonrpc="2.0", method=method, params=params) # Validate the request body against the 
RPCRequest model - - # Multi-worker session affinity: check if we should forward to another worker - # This applies to ALL methods (except initialize which creates new sessions) - # The x-forwarded-internally header marks requests that have already been forwarded - # to prevent infinite forwarding loops - headers = {k.lower(): v for k, v in request.headers.items()} - # Session ID can come from two sources: - # 1. MCP-Session-Id (mcp-session-id) - MCP protocol header from Streamable HTTP clients - # 2. x-mcp-session-id - our internal header from SSE session_registry calls - mcp_session_id = headers.get("mcp-session-id") or headers.get("x-mcp-session-id") - # Only trust x-forwarded-internally from loopback to prevent external spoofing - _rpc_client_host = request.client.host if request.client else None - _rpc_from_loopback = _rpc_client_host in ("127.0.0.1", "::1") if _rpc_client_host else False - is_internally_forwarded = _rpc_from_loopback and headers.get("x-forwarded-internally") == "true" - - if settings.mcpgateway_session_affinity_enabled and mcp_session_id and method != "initialize" and not is_internally_forwarded: - # First-Party - from mcpgateway.services.mcp_session_pool import MCPSessionPool, WORKER_ID # pylint: disable=import-outside-toplevel - - if not MCPSessionPool.is_valid_mcp_session_id(mcp_session_id): - logger.debug("Invalid MCP session id for affinity forwarding, executing locally") - else: - session_short = mcp_session_id[:8] if len(mcp_session_id) >= 8 else mcp_session_id - logger.debug(f"[AFFINITY] Worker {WORKER_ID} | Session {session_short}... 
| Method: {method} | RPC request received, checking affinity") - try: - # First-Party - from mcpgateway.services.mcp_session_pool import get_mcp_session_pool # pylint: disable=import-outside-toplevel - - pool = get_mcp_session_pool() - forwarded_response = await pool.forward_request_to_owner( - mcp_session_id, - {"method": method, "params": params, "headers": dict(headers), "req_id": req_id}, - ) - if forwarded_response is not None: - # Request was handled by another worker - logger.info(f"[AFFINITY] Worker {WORKER_ID} | Session {session_short}... | Method: {method} | Forwarded response received") - if "error" in forwarded_response: - raise JSONRPCError( - forwarded_response["error"].get("code", -32603), - forwarded_response["error"].get("message", "Forwarded request failed"), - ) - result = forwarded_response.get("result", {}) - return {"jsonrpc": "2.0", "result": result, "id": req_id} - except RuntimeError: - # Pool not initialized - execute locally - logger.debug(f"[AFFINITY] Worker {WORKER_ID} | Session {session_short}... | Method: {method} | Pool not initialized, executing locally") - elif is_internally_forwarded and mcp_session_id: - # First-Party - from mcpgateway.services.mcp_session_pool import WORKER_ID # pylint: disable=import-outside-toplevel + if not _trusted_internal_mcp_dispatch: + RPCRequest(jsonrpc="2.0", method=method, params=params) # Validate the request body against the RPCRequest model - session_short = mcp_session_id[:8] if len(mcp_session_id) >= 8 else mcp_session_id - logger.debug(f"[AFFINITY] Worker {WORKER_ID} | Session {session_short}... 
| Method: {method} | Internally forwarded request, executing locally") + forwarded_response = await _maybe_forward_affinitized_rpc_request( + request, + method=method, + params=params, + req_id=req_id, + lowered_request_headers=_lowered_request_headers(), + ) + if forwarded_response is not None: + return forwarded_response if method == "initialize": - # Extract session_id from params or query string (for capability tracking) - init_session_id = params.get("session_id") or params.get("sessionId") or request.query_params.get("session_id") - requester_email, requester_is_admin = _get_request_identity(request, user) - - if init_session_id: - effective_owner = await session_registry.claim_session_owner(init_session_id, requester_email) - if effective_owner is None: - raise JSONRPCError(-32003, _ACCESS_DENIED_MSG, {"method": method}) - - if effective_owner and not requester_is_admin and requester_email != effective_owner: - raise JSONRPCError(-32003, _ACCESS_DENIED_MSG, {"method": method}) - - # Pass server_id to advertise OAuth capability if configured per RFC 9728 - result = await session_registry.handle_initialize_logic(body.get("params", {}), session_id=init_session_id, server_id=server_id) - if hasattr(result, "model_dump"): - result = result.model_dump(by_alias=True, exclude_none=True) - - # Register session ownership in Redis for multi-worker affinity - # This must happen AFTER initialize succeeds so subsequent requests route to this worker - if settings.mcpgateway_session_affinity_enabled and mcp_session_id and mcp_session_id != "not-provided": - try: - # First-Party - from mcpgateway.services.mcp_session_pool import get_mcp_session_pool, WORKER_ID # pylint: disable=import-outside-toplevel - - pool = get_mcp_session_pool() - # Claim-or-refresh ownership for this session (does not steal). - await pool.register_pool_session_owner(mcp_session_id) - logger.debug(f"[AFFINITY_INIT] Worker {WORKER_ID} | Session {mcp_session_id[:8]}... 
| Registered ownership after initialize") - except Exception as e: - logger.warning(f"[AFFINITY_INIT] Failed to register session ownership: {e}") + result = await _execute_rpc_initialize( + request, + user, + params=params, + server_id=server_id, + mcp_session_id=mcp_session_id, + ) elif method == "tools/list": await _ensure_rpc_permission(user, db, "tools.read", method, request=request) user_email, token_teams, is_admin = _get_rpc_filter_context(request, user) @@ -6206,7 +8996,7 @@ async def handle_rpc(request: Request, db: Session = Depends(get_db), user=Depen # Release DB connection early to prevent idle-in-transaction under load db.commit() db.close() - result = {"tools": [t.model_dump(by_alias=True, exclude_none=True) for t in tools]} + result = {"tools": _serialize_mcp_tool_definitions(tools)} else: tools, next_cursor = await tool_service.list_tools( db, @@ -6221,7 +9011,7 @@ async def handle_rpc(request: Request, db: Session = Depends(get_db), user=Depen # Release DB connection early to prevent idle-in-transaction under load db.commit() db.close() - result = {"tools": [t.model_dump(by_alias=True, exclude_none=True) for t in tools]} + result = {"tools": _serialize_mcp_tool_definitions(tools)} if next_cursor: result["nextCursor"] = next_cursor elif method == "list_tools": # Legacy endpoint @@ -6249,7 +9039,7 @@ async def handle_rpc(request: Request, db: Session = Depends(get_db), user=Depen ) db.commit() db.close() - result = {"tools": [t.model_dump(by_alias=True, exclude_none=True) for t in tools]} + result = {"tools": _serialize_legacy_tool_payloads(tools)} else: tools, next_cursor = await tool_service.list_tools( db, @@ -6263,7 +9053,7 @@ async def handle_rpc(request: Request, db: Session = Depends(get_db), user=Depen ) db.commit() db.close() - result = {"tools": [t.model_dump(by_alias=True, exclude_none=True) for t in tools]} + result = {"tools": _serialize_legacy_tool_payloads(tools)} if next_cursor: result["nextCursor"] = next_cursor elif method == 
"list_gateways": @@ -6345,7 +9135,7 @@ async def handle_rpc(request: Request, db: Session = Depends(get_db), user=Depen result = {"contents": [result]} except (ValueError, ResourceNotFoundError): # Resource not found in the gateway - logger.error(f"Resource not found: {uri}") + logger.error("Resource not found: %s", uri) raise JSONRPCError(-32002, f"Resource not found: {uri}", {"uri": uri}) # Release transaction after resources/read completes db.commit() @@ -6443,109 +9233,17 @@ async def handle_rpc(request: Request, db: Session = Depends(get_db), user=Depen await _ensure_rpc_permission(user, db, "tools.execute", method, request=request) # Note: Multi-worker session affinity forwarding is handled earlier # (before method routing) to apply to ALL methods, not just tools/call - name = params.get("name") - arguments = params.get("arguments", {}) - meta_data = params.get("_meta", None) - if not name: - raise JSONRPCError(-32602, "Missing tool name in parameters", params) - - # Get authorization context (same as tools/list) - auth_user_email, auth_token_teams, auth_is_admin = _get_rpc_filter_context(request, user) - run_owner_email = auth_user_email - run_owner_team_ids = [] if auth_token_teams is None else list(auth_token_teams) - if auth_is_admin and auth_token_teams is None: - auth_user_email = None - # auth_token_teams stays None (unrestricted) - elif auth_token_teams is None: - auth_token_teams = [] # Non-admin without teams = public-only - - # Get user email for OAuth token selection - oauth_user_email = get_user_email(user) - # Get plugin contexts from request.state for cross-hook sharing - plugin_context_table = getattr(request.state, "plugin_context_table", None) - plugin_global_context = getattr(request.state, "plugin_global_context", None) - - # Register the tool execution for cancellation tracking with task reference (if enabled) - # Note: req_id can be 0 which is falsy but valid per JSON-RPC spec, so use 'is not None' - run_id = str(req_id) if req_id is not 
None else None - tool_task: Optional[asyncio.Task] = None - - async def cancel_tool_task(reason: Optional[str] = None): - """Cancel callback that actually cancels the asyncio task. - - Args: - reason: Optional reason for cancellation. - """ - if tool_task and not tool_task.done(): - logger.info(f"Cancelling tool task for run_id={run_id}, reason={reason}") - tool_task.cancel() - - if settings.mcpgateway_tool_cancellation_enabled and run_id: - await cancellation_service.register_run( - run_id, - name=f"tool:{name}", - cancel_callback=cancel_tool_task, - owner_email=run_owner_email, - owner_team_ids=run_owner_team_ids, - ) - try: - # Check if cancelled before execution (only if feature enabled) - if settings.mcpgateway_tool_cancellation_enabled and run_id: - run_status = await cancellation_service.get_status(run_id) - if run_status and run_status.get("cancelled"): - raise JSONRPCError(-32800, f"Tool execution cancelled: {name}", {"requestId": run_id}) - - # Create task for tool execution to enable real cancellation - async def execute_tool(): - """Execute tool invocation with fallback to gateway forwarding. - - Returns: - The tool invocation result or gateway forwarding result. - - Raises: - JSONRPCError: If the tool is not found. 
- """ - try: - return await tool_service.invoke_tool( - db=db, - name=name, - arguments=arguments, - request_headers=headers, - app_user_email=oauth_user_email, - user_email=auth_user_email, - token_teams=auth_token_teams, - server_id=server_id, - plugin_context_table=plugin_context_table, - plugin_global_context=plugin_global_context, - meta_data=meta_data, - ) - except ValueError: - # Tool not found log error and raise JSONRPCError - logger.error(f"Tool not found: {name}") - raise JSONRPCError(-32601, f"Tool not found: {name}", None) - - tool_task = asyncio.create_task(execute_tool()) - - # Re-check cancellation after task creation to handle race condition - # where cancel arrived between pre-check and task creation (callback saw tool_task=None) - if settings.mcpgateway_tool_cancellation_enabled and run_id: - run_status = await cancellation_service.get_status(run_id) - if run_status and run_status.get("cancelled"): - tool_task.cancel() - - try: - result = await tool_task - if hasattr(result, "model_dump"): - result = result.model_dump(by_alias=True, exclude_none=True) - except asyncio.CancelledError: - # Task was cancelled - return partial result or error - logger.info(f"Tool execution cancelled for run_id={run_id}, tool={name}") - raise JSONRPCError(-32800, f"Tool execution cancelled: {name}", {"requestId": run_id, "partial": False}) + result = await _execute_rpc_tools_call( + request, + db, + user, + req_id=req_id, + params=params, + lowered_request_headers=_lowered_request_headers(), + server_id=server_id, + ) finally: - # Unregister the run when done (only if feature enabled) - if settings.mcpgateway_tool_cancellation_enabled and run_id: - await cancellation_service.unregister_run(run_id) # Release transaction after tools/call completes db.commit() db.close() @@ -6590,7 +9288,7 @@ async def execute_tool(): raw_request_id = params.get("requestId") request_id = str(raw_request_id) if raw_request_id is not None else None reason = params.get("reason") - 
logger.info(f"Request cancelled: {request_id}, reason: {reason}") + logger.info("Request cancelled: %s, reason: %s", request_id, reason) # Attempt local cancellation per MCP spec if request_id is not None: await _authorize_run_cancellation(request, user, request_id, as_jsonrpc_error=True) @@ -6640,7 +9338,7 @@ async def execute_tool(): if not capable_sessions: raise JSONRPCError(-32000, "No elicitation-capable clients available", {"message": elicit_params.message}) target_session_id = capable_sessions[0] - logger.debug(f"Selected session {target_session_id} for elicitation") + logger.debug("Selected session %s for elicitation", target_session_id) # Verify session has elicitation capability if not await session_registry.has_elicitation_capability(target_session_id): @@ -6683,7 +9381,7 @@ async def execute_tool(): } await session_registry.broadcast(target_session_id, elicitation_request) - logger.debug(f"Sent elicitation request {pending.request_id} to session {target_session_id}") + logger.debug("Sent elicitation request %s to session %s", pending.request_id, target_session_id) # Wait for response elicit_result = await elicitation_task @@ -6711,9 +9409,7 @@ async def execute_tool(): # Catch-all for other completion/* methods (currently unsupported) result = {} elif method == "logging/setLevel": - # MCP logging/setLevel is a standard MCP capability invoked by clients during - # initialization; servers.use (not admin.system_config) keeps the handshake working. 
- await _ensure_rpc_permission(user, db, "servers.use", method, request=request) + await _ensure_rpc_permission(user, db, "admin.system_config", method, request=request) level = LogLevel(params.get("level")) await logging_service.set_level(level) result = {} @@ -6724,8 +9420,6 @@ async def execute_tool(): # Backward compatibility: Try to invoke as a tool directly # This allows both old format (method=tool_name) and new format (method=tools/call) await _ensure_rpc_permission(user, db, "tools.execute", method, request=request) - # Standard - headers = {k.lower(): v for k, v in request.headers.items()} # Get authorization context (same as tools/call) auth_user_email, auth_token_teams, auth_is_admin = _get_rpc_filter_context(request, user) @@ -6750,7 +9444,7 @@ async def execute_tool(): db=db, name=method, arguments=params, - request_headers=headers, + request_headers=_lowered_request_headers(), app_user_email=oauth_user_email, user_email=auth_user_email, token_teams=auth_token_teams, @@ -6765,7 +9459,7 @@ async def execute_tool(): raise except Exception: # Log error and return invalid method - logger.error(f"Method not found: {method}") + logger.error("Method not found: %s", method) raise JSONRPCError(-32000, "Invalid method", params) return {"jsonrpc": "2.0", "result": result, "id": req_id} @@ -7189,7 +9883,7 @@ async def reset_metrics(entity: Optional[str] = None, entity_id: Optional[int] = # Healthcheck # #################### @app.get("/health") -def healthcheck(): +def healthcheck(response: Response = None): """ Perform a basic health check to verify database connectivity. @@ -7197,6 +9891,9 @@ def healthcheck(): Uses a dedicated session to avoid cross-thread issues and double-commit from get_db dependency. All DB operations happen in the same thread. + Args: + response: Optional response object used to attach runtime-mode headers. + Returns: A dictionary with the health status and optional error message. 
""" @@ -7205,7 +9902,9 @@ def healthcheck(): db.execute(text("SELECT 1")) # Explicitly commit to release PgBouncer backend connection in transaction mode. db.commit() - return {"status": "healthy"} + if response is not None: + _apply_runtime_mode_headers(response) + return {"status": "healthy", "mcp_runtime": _mcp_runtime_status_payload()} except Exception as e: # Rollback, then invalidate if rollback fails (mirrors get_db cleanup). try: @@ -7217,7 +9916,9 @@ def healthcheck(): pass # nosec B110 - Best effort cleanup on connection failure error_message = f"Database connection error: {str(e)}" logger.error(error_message) - return {"status": "unhealthy", "error": error_message} + if response is not None: + _apply_runtime_mode_headers(response) + return {"status": "unhealthy", "error": error_message, "mcp_runtime": _mcp_runtime_status_payload()} finally: db.close() @@ -7266,8 +9967,12 @@ def _check_db() -> str | None: if error: error_message = f"Readiness check failed: {error}" logger.error(error_message) - return ORJSONResponse(content={"status": "not ready", "error": error_message}, status_code=503) - return ORJSONResponse(content={"status": "ready"}, status_code=200) + response = ORJSONResponse(content={"status": "not ready", "error": error_message, "mcp_runtime": _mcp_runtime_status_payload()}, status_code=503) + _apply_runtime_mode_headers(response) + return response + response = ORJSONResponse(content={"status": "ready", "mcp_runtime": _mcp_runtime_status_payload()}, status_code=200) + _apply_runtime_mode_headers(response) + return response @app.get("/health/security", tags=["health"]) @@ -7921,8 +10626,163 @@ async def cleanup_import_statuses(max_age_hours: int = 24, user=Depends(get_curr else: logger.warning("Admin API routes not mounted - Admin API disabled via MCPGATEWAY_ADMIN_API_ENABLED=False") + +class MCPRuntimeHeaderTransportWrapper: + """Annotate Python-owned MCP transport responses with the active runtime marker.""" + + def __init__(self, 
transport_app, *, runtime_name: str) -> None: + """Wrap an MCP transport app and stamp a runtime header on responses. + + Args: + transport_app: Underlying MCP transport app. + runtime_name: Runtime label to expose via response headers. + """ + self.transport_app = transport_app + self.runtime_name = runtime_name.encode("ascii") + + async def handle_streamable_http(self, scope, receive, send): + """Forward an MCP request while ensuring the runtime marker header is present. + + Args: + scope: Incoming ASGI scope. + receive: ASGI receive callable. + send: ASGI send callable. + """ + + async def _send_with_runtime_header(message): + """Attach MCP runtime mode headers before sending the ASGI event downstream. + + Args: + message: Outgoing ASGI message emitted by the wrapped application. + """ + if message.get("type") == "http.response.start": + headers = list(message.get("headers") or []) + if not any(isinstance(item, (tuple, list)) and len(item) == 2 and isinstance(item[0], (bytes, bytearray)) and item[0].lower() == b"x-contextforge-mcp-runtime" for item in headers): + headers.append((b"x-contextforge-mcp-runtime", self.runtime_name)) + if not any( + isinstance(item, (tuple, list)) and len(item) == 2 and isinstance(item[0], (bytes, bytearray)) and item[0].lower() == b"x-contextforge-mcp-session-core" for item in headers + ): + headers.append((b"x-contextforge-mcp-session-core", _current_mcp_session_core_mode().encode("ascii"))) + if not any(isinstance(item, (tuple, list)) and len(item) == 2 and isinstance(item[0], (bytes, bytearray)) and item[0].lower() == b"x-contextforge-mcp-resume-core" for item in headers): + headers.append((b"x-contextforge-mcp-resume-core", _current_mcp_resume_core_mode().encode("ascii"))) + if not any( + isinstance(item, (tuple, list)) and len(item) == 2 and isinstance(item[0], (bytes, bytearray)) and item[0].lower() == b"x-contextforge-mcp-live-stream-core" for item in headers + ): + headers.append((b"x-contextforge-mcp-live-stream-core", 
_current_mcp_live_stream_core_mode().encode("ascii"))) + if not any( + isinstance(item, (tuple, list)) and len(item) == 2 and isinstance(item[0], (bytes, bytearray)) and item[0].lower() == b"x-contextforge-mcp-affinity-core" for item in headers + ): + headers.append((b"x-contextforge-mcp-affinity-core", _current_mcp_affinity_core_mode().encode("ascii"))) + if not any( + isinstance(item, (tuple, list)) and len(item) == 2 and isinstance(item[0], (bytes, bytearray)) and item[0].lower() == b"x-contextforge-mcp-session-auth-reuse" for item in headers + ): + headers.append((b"x-contextforge-mcp-session-auth-reuse", _current_mcp_session_auth_reuse_mode().encode("ascii"))) + message = dict(message) + message["headers"] = headers + await send(message) + + await self.transport_app.handle_streamable_http(scope, receive, _send_with_runtime_header) + + +def _build_mcp_transport_app(): + """Choose the MCP transport app for the mounted /mcp path. + + Returns: + Transport app object that should be mounted at the public ``/mcp`` path. + """ + if _should_mount_public_rust_transport(): + logger.warning( + "MCP runtime mode: %s. GET/POST/DELETE /mcp requests will be proxied to %s. MCP session core mode: %s. MCP replay/resume core mode: %s. MCP live stream core mode: %s. MCP affinity core mode: %s. MCP session auth reuse mode: %s.", + _current_mcp_runtime_mode(), + settings.experimental_rust_mcp_runtime_uds or settings.experimental_rust_mcp_runtime_url, + _current_mcp_session_core_mode(), + _current_mcp_resume_core_mode(), + _current_mcp_live_stream_core_mode(), + _current_mcp_affinity_core_mode(), + _current_mcp_session_auth_reuse_mode(), + ) + return RustMCPRuntimeProxy(streamable_http_session.handle_streamable_http) + + if settings.experimental_rust_mcp_runtime_enabled: + logger.warning( + "MCP runtime mode: %s. Rust sidecar remains enabled, but public /mcp stays on the Python transport because MCP session auth reuse is disabled. MCP session core mode: %s. 
MCP replay/resume core mode: %s. MCP live stream core mode: %s. MCP affinity core mode: %s. MCP session auth reuse mode: %s.", + _current_mcp_runtime_mode(), + _current_mcp_session_core_mode(), + _current_mcp_resume_core_mode(), + _current_mcp_live_stream_core_mode(), + _current_mcp_affinity_core_mode(), + _current_mcp_session_auth_reuse_mode(), + ) + return MCPRuntimeHeaderTransportWrapper(streamable_http_session, runtime_name="python") + + if _rust_build_included(): + logger.warning( + "MCP runtime mode: %s. Rust MCP artifacts are present in this image, but EXPERIMENTAL_RUST_MCP_RUNTIME_ENABLED=false so /mcp remains on the Python transport. Set RUST_MCP_MODE=edge or RUST_MCP_MODE=full to activate the Rust runtime with the simple env flow.", + _current_mcp_runtime_mode(), + ) + else: + logger.info("MCP runtime mode: %s. /mcp is mounted on the Python transport.", _current_mcp_runtime_mode()) + + return MCPRuntimeHeaderTransportWrapper(streamable_http_session, runtime_name="python") + + +class InternalTrustedMCPTransportBridge: + """Trusted internal bridge from Rust MCP transport requests to the Python session manager.""" + + def __init__(self, transport_app) -> None: + """Store the underlying Python transport app used for trusted forwarding. + + Args: + transport_app: Python transport app that ultimately owns session handling. + """ + self.transport_app = transport_app + + async def handle_streamable_http(self, scope, receive, send): + """Translate trusted Rust transport requests into Python session-manager calls. + + Args: + scope: Incoming ASGI scope. + receive: ASGI receive callable. + send: ASGI send callable. 
+ """ + if scope.get("type") != "http": + response = ORJSONResponse(status_code=404, content={"detail": "Not found"}) + await response(scope, receive, send) + return + + method = str(scope.get("method", "GET")).upper() + if method not in {"GET", "POST", "DELETE"}: + response = ORJSONResponse(status_code=405, content={"detail": "Method not allowed"}) + await response(scope, receive, send) + return + + request = Request(scope, receive=receive) + try: + _build_internal_mcp_forwarded_user(request) + except HTTPException as exc: + response = ORJSONResponse(status_code=exc.status_code, content={"detail": exc.detail}) + await response(scope, receive, send) + return + + auth_context = _get_internal_mcp_auth_context(request) or {} + server_id = request.headers.get("x-contextforge-server-id") + forwarded_scope = dict(scope) + forwarded_scope["path"] = "/mcp/" + forwarded_scope["modified_path"] = f"/servers/{server_id}/mcp" if server_id else "/mcp/" + + token = user_context_var.set(auth_context) + try: + await self.transport_app.handle_streamable_http(forwarded_scope, receive, send) + finally: + user_context_var.reset(token) + + +mcp_transport_app = _build_mcp_transport_app() +internal_trusted_mcp_transport = InternalTrustedMCPTransportBridge(streamable_http_session) + # Streamable http Mount -app.mount("/mcp", app=streamable_http_session.handle_streamable_http) +app.mount("/mcp", app=mcp_transport_app.handle_streamable_http) +app.mount("/_internal/mcp/transport", app=internal_trusted_mcp_transport.handle_streamable_http) # Conditional static files mounting and root redirect if UI_ENABLED: diff --git a/mcpgateway/middleware/token_scoping.py b/mcpgateway/middleware/token_scoping.py index 6f57f9c9b7..f8835997d8 100644 --- a/mcpgateway/middleware/token_scoping.py +++ b/mcpgateway/middleware/token_scoping.py @@ -13,6 +13,8 @@ # Standard from datetime import datetime, timedelta, timezone from functools import lru_cache +import hashlib +import hmac import ipaddress import re from 
typing import List, Optional, Pattern, Tuple @@ -59,6 +61,11 @@ (re.compile(r"/gateways/?([a-f0-9\-]+)"), "gateway"), ] _AUTH_COOKIE_NAMES = ("jwt_token", "access_token") +_INTERNAL_MCP_PATH_PREFIX = "/_internal/mcp" +_INTERNAL_MCP_RUNTIME_HEADER = "x-contextforge-mcp-runtime" +_INTERNAL_MCP_AUTH_CONTEXT_HEADER = "x-contextforge-auth-context" +_INTERNAL_MCP_RUNTIME_AUTH_HEADER = "x-contextforge-mcp-runtime-auth" +_INTERNAL_MCP_RUNTIME_AUTH_CONTEXT = "contextforge-internal-mcp-runtime-v1" # Permission map with precompiled patterns # Maps (HTTP method, path pattern) to required permission @@ -1210,6 +1217,13 @@ async def __call__(self, request: Request, call_next): if normalized_path == "/": return await call_next(request) + # Trusted internal Rust -> Python MCP dispatch already carries a + # normalized auth context and is re-authorized by the internal MCP + # handlers. Re-applying token-scoping path checks here would reject + # the private /_internal/mcp/* hop for scoped tokens. + if self._is_trusted_internal_mcp_runtime_request(request, normalized_path): + return await call_next(request) + if any(normalized_path.startswith(path) for path in skip_paths): return await call_next(request) @@ -1328,6 +1342,74 @@ async def __call__(self, request: Request, call_next): content={"detail": exc.detail}, ) + def _is_trusted_internal_mcp_runtime_request(self, request: Request, normalized_path: str) -> bool: + """Return whether the request is a trusted loopback Rust MCP sidecar hop. + + Args: + request: Incoming HTTP request. + normalized_path: Canonicalized request path used for route matching. + + Returns: + ``True`` when the request originated from the local Rust MCP runtime and + includes the expected trusted headers. 
+ """ + if normalized_path != _INTERNAL_MCP_PATH_PREFIX and not normalized_path.startswith(f"{_INTERNAL_MCP_PATH_PREFIX}/"): + return False + + if request.headers.get(_INTERNAL_MCP_RUNTIME_HEADER) != "rust": + return False + + provided_auth = request.headers.get(_INTERNAL_MCP_RUNTIME_AUTH_HEADER) + if not provided_auth: + return False + + expected_auth = self._expected_internal_mcp_runtime_auth_header() + if not hmac.compare_digest(provided_auth, expected_auth): + return False + + if not request.headers.get(_INTERNAL_MCP_AUTH_CONTEXT_HEADER): + return False + + client_host = getattr(getattr(request, "client", None), "host", None) + return client_host in ("127.0.0.1", "::1") + + @staticmethod + def _auth_encryption_secret_value() -> str: + """Return the configured auth-encryption secret as a plain string. + + Returns: + The auth-encryption secret, normalized to a regular string. + """ + secret = settings.auth_encryption_secret + if hasattr(secret, "get_secret_value"): + return secret.get_secret_value() + return str(secret) + + @staticmethod + @lru_cache(maxsize=8) + def _expected_internal_mcp_runtime_auth_header_for_secret(secret: str) -> str: + """Return the expected shared internal-auth header for a specific secret. + + Args: + secret: Auth-encryption secret to derive the trust header from. + + Returns: + Hex-encoded SHA-256 digest derived from the provided auth secret. + """ + material = f"{secret}:{_INTERNAL_MCP_RUNTIME_AUTH_CONTEXT}".encode("utf-8") + return hashlib.sha256(material).hexdigest() + + @staticmethod + def _expected_internal_mcp_runtime_auth_header() -> str: + """Return the expected shared internal-auth header for Rust MCP hops. + + Returns: + Shared secret-derived digest expected on trusted internal Rust MCP calls. 
+ """ + return TokenScopingMiddleware._expected_internal_mcp_runtime_auth_header_for_secret( + TokenScopingMiddleware._auth_encryption_secret_value() + ) + # Create middleware instance token_scoping_middleware = TokenScopingMiddleware() diff --git a/mcpgateway/schemas.py b/mcpgateway/schemas.py index 1c80475ae8..d752dfdd6a 100644 --- a/mcpgateway/schemas.py +++ b/mcpgateway/schemas.py @@ -295,6 +295,14 @@ class MetricsResponse(BaseModelWithConfigDict): @model_serializer(mode="wrap") def _exclude_none_a2a(self, handler): + """Omit the A2A metrics field when that feature is disabled. + + Args: + handler: Pydantic serializer callback for the wrapped model. + + Returns: + Dict[str, Any]: Serialized metrics payload without empty A2A fields. + """ result = handler(self) if self.a2a_agents is None: result.pop("a2aAgents", None) diff --git a/mcpgateway/services/email_auth_service.py b/mcpgateway/services/email_auth_service.py index 00bcb36672..4f2e5579e5 100644 --- a/mcpgateway/services/email_auth_service.py +++ b/mcpgateway/services/email_auth_service.py @@ -70,9 +70,6 @@ logging_service = LoggingService() logger = logging_service.get_logger(__name__) -# Strong references to background tasks to prevent GC before completion -_background_tasks: set[asyncio.Task] = set() - _GET_ALL_USERS_LIMIT = 10000 _DUMMY_ARGON2_HASH = "$argon2id$v=19$m=65536,t=3,p=1$9x/nTs9D0R97+BI7BWP2Tg$V/40qCuaGh4i+94HpGpxJESEVs3IDpLzUqtNqRPuty4" @@ -422,6 +419,33 @@ async def _invalidate_user_auth_cache(self, email: str) -> None: except Exception as cache_error: # nosec B110 logger.debug("Failed to invalidate auth cache for %s: %s", email, cache_error) + async def _invalidate_deleted_user_auth_caches(self, email: str) -> None: + """Invalidate all auth-cache entries affected by permanent user deletion. + + Args: + email: User email for cache invalidation. 
+ """ + try: + # First-Party + from mcpgateway.cache.auth_cache import auth_cache # pylint: disable=import-outside-toplevel + + results = await asyncio.wait_for( + asyncio.gather( + auth_cache.invalidate_user(email), + auth_cache.invalidate_user_teams(email), + auth_cache.invalidate_team_membership(email), + return_exceptions=True, + ), + timeout=5.0, + ) + for result in results: + if isinstance(result, Exception): + logger.debug("Failed to invalidate delete-user auth cache for %s: %s", email, result) + except asyncio.TimeoutError: + logger.warning("Delete-user auth cache invalidation timed out for %s - continuing", email) + except Exception as cache_error: # nosec B110 + logger.debug("Failed to invalidate delete-user auth cache for %s: %s", email, cache_error) + def _log_auth_event( self, event_type: str, @@ -556,14 +580,15 @@ async def create_user( if not skip_password_validation: self.validate_password(password) + # Hash before the first DB read so PgBouncer transaction pooling does not + # hold an idle transaction open across the async hashing call. 
+ password_hash = await self.password_service.hash_password_async(password) + # Check if user already exists existing_user = await self.get_user_by_email(email) if existing_user: raise UserExistsError(f"User with email {email} already exists") - # Hash the password - password_hash = await self.password_service.hash_password_async(password) - # Create new user (record password change timestamp) user = EmailUser( email=email, @@ -1804,17 +1829,7 @@ async def delete_user(self, email: str) -> bool: self.db.delete(user) self.db.commit() - # Invalidate all auth caches for deleted user - try: - # First-Party - from mcpgateway.cache.auth_cache import auth_cache # pylint: disable=import-outside-toplevel - - for coro in [auth_cache.invalidate_user(email), auth_cache.invalidate_user_teams(email), auth_cache.invalidate_team_membership(email)]: - task = asyncio.create_task(coro) - _background_tasks.add(task) - task.add_done_callback(_background_tasks.discard) - except Exception as cache_error: - logger.debug(f"Failed to invalidate cache on user delete: {cache_error}") + await self._invalidate_deleted_user_auth_caches(email) logger.info(f"User {SecurityValidator.sanitize_log_message(email)} deleted permanently") return True diff --git a/mcpgateway/services/mcp_session_pool.py b/mcpgateway/services/mcp_session_pool.py index 7874267d37..a8d1291f59 100644 --- a/mcpgateway/services/mcp_session_pool.py +++ b/mcpgateway/services/mcp_session_pool.py @@ -1266,6 +1266,17 @@ async def _cleanup_pool_session_owner(self, mcp_session_id: str) -> None: # Cleanup failure is non-fatal logger.debug(f"Failed to cleanup pool session owner in Redis: {e}") + async def cleanup_streamable_http_session_owner(self, mcp_session_id: str) -> None: + """Public wrapper for cleaning up Streamable HTTP session ownership. + + This is used by trusted internal MCP session teardown paths that need to + remove affinity ownership without reaching into private helpers. 
+ """ + if not self.is_valid_mcp_session_id(mcp_session_id): + logger.debug("Invalid mcp_session_id for owner cleanup, skipping") + return + await self._cleanup_pool_session_owner(mcp_session_id) + async def close_all(self) -> None: """ Gracefully close all pooled and active sessions. diff --git a/mcpgateway/services/metrics.py b/mcpgateway/services/metrics.py index 931a5e8081..8918218a70 100644 --- a/mcpgateway/services/metrics.py +++ b/mcpgateway/services/metrics.py @@ -98,6 +98,12 @@ def _get_registry_collector(metric_name: str): ["outcome"], ) +mcp_auth_cache_events_counter = Counter( + "mcp_auth_cache_events_total", + "Total number of MCP auth cache events by outcome", + ["outcome"], +) + def setup_metrics(app): """ diff --git a/mcpgateway/services/metrics_buffer_service.py b/mcpgateway/services/metrics_buffer_service.py index 2054d95f45..8364e03197 100644 --- a/mcpgateway/services/metrics_buffer_service.py +++ b/mcpgateway/services/metrics_buffer_service.py @@ -144,11 +144,57 @@ async def start(self) -> None: logger.info("MetricsBufferService disabled, skipping start") return - if self._flush_task is None or self._flush_task.done(): + current_loop = asyncio.get_running_loop() + if not self._flush_task_is_active_for_loop(current_loop): self._shutdown_event.clear() self._flush_task = asyncio.create_task(self._flush_loop()) logger.info("MetricsBufferService flush task started") + def _flush_task_is_active_for_loop(self, loop: asyncio.AbstractEventLoop) -> bool: + """Return whether the current flush task is usable for the active loop. + + Args: + loop: The currently running event loop for this worker process. + + Returns: + True when the cached flush task belongs to the current live loop. 
+ """ + task = self._flush_task + if task is None or task.done() or task.cancelled(): + return False + + try: + task_loop = task.get_loop() + except (AttributeError, RuntimeError): + return False + + return task_loop is loop and task_loop.is_running() + + def _ensure_flush_task_started(self) -> None: + """Best-effort lazy-start for the background flush task. + + In preloaded multi-worker deployments, the singleton may exist in a + worker before the worker's startup hook has started the flush loop. A + first buffered metric should recover from that state instead of sitting + in memory forever. + """ + if not self.recording_enabled or not self.enabled: + return + + try: + loop = asyncio.get_running_loop() + except RuntimeError: + return + + if self._flush_task_is_active_for_loop(loop): + return + + if self._shutdown_event.is_set(): + self._shutdown_event = asyncio.Event() + + self._flush_task = loop.create_task(self._flush_loop()) + logger.info("MetricsBufferService flush task started lazily") + async def shutdown(self) -> None: """Shutdown service with final flush.""" logger.info("MetricsBufferService shutting down...") @@ -199,6 +245,41 @@ def record_tool_metric( error_message=error_message, ) + self._ensure_flush_task_started() + with self._lock: + self._tool_metrics.append(metric) + self._total_buffered += 1 + + def record_tool_metric_with_duration( + self, + tool_id: str, + response_time: float, + success: bool, + error_message: Optional[str] = None, + ) -> None: + """Buffer a tool metric with pre-calculated response time. + + Args: + tool_id: UUID of the tool. + response_time: Pre-calculated response time in seconds. + success: Whether the operation succeeded. + error_message: Optional error message if failed. 
+ """ + if not self.recording_enabled: + return # Execution metrics recording disabled + if not self.enabled: + self._write_tool_metric_with_duration_immediately(tool_id, response_time, success, error_message) + return + + metric = BufferedToolMetric( + tool_id=tool_id, + timestamp=datetime.now(timezone.utc), + response_time=response_time, + is_success=success, + error_message=error_message, + ) + + self._ensure_flush_task_started() with self._lock: self._tool_metrics.append(metric) self._total_buffered += 1 @@ -232,6 +313,7 @@ def record_resource_metric( error_message=error_message, ) + self._ensure_flush_task_started() with self._lock: self._resource_metrics.append(metric) self._total_buffered += 1 @@ -265,6 +347,7 @@ def record_prompt_metric( error_message=error_message, ) + self._ensure_flush_task_started() with self._lock: self._prompt_metrics.append(metric) self._total_buffered += 1 @@ -298,6 +381,41 @@ def record_server_metric( error_message=error_message, ) + self._ensure_flush_task_started() + with self._lock: + self._server_metrics.append(metric) + self._total_buffered += 1 + + def record_server_metric_with_duration( + self, + server_id: str, + response_time: float, + success: bool, + error_message: Optional[str] = None, + ) -> None: + """Buffer a server metric with pre-calculated response time. + + Args: + server_id: UUID of the server. + response_time: Pre-calculated response time in seconds. + success: Whether the operation succeeded. + error_message: Optional error message if failed. 
+ """ + if not self.recording_enabled: + return # Execution metrics recording disabled + if not self.enabled: + self._write_server_metric_with_duration_immediately(server_id, response_time, success, error_message) + return + + metric = BufferedServerMetric( + server_id=server_id, + timestamp=datetime.now(timezone.utc), + response_time=response_time, + is_success=success, + error_message=error_message, + ) + + self._ensure_flush_task_started() with self._lock: self._server_metrics.append(metric) self._total_buffered += 1 @@ -334,6 +452,7 @@ def record_a2a_agent_metric( error_message=error_message, ) + self._ensure_flush_task_started() with self._lock: self._a2a_agent_metrics.append(metric) self._total_buffered += 1 @@ -370,6 +489,7 @@ def record_a2a_agent_metric_with_duration( error_message=error_message, ) + self._ensure_flush_task_started() with self._lock: self._a2a_agent_metrics.append(metric) self._total_buffered += 1 @@ -594,6 +714,35 @@ def _write_tool_metric_immediately( except Exception as e: logger.error(f"Failed to write tool metric: {e}") + def _write_tool_metric_with_duration_immediately( + self, + tool_id: str, + response_time: float, + success: bool, + error_message: Optional[str], + ) -> None: + """Write a single tool metric with pre-calculated duration immediately. + + Args: + tool_id: UUID of the tool. + response_time: Pre-calculated response time in seconds. + success: Whether the operation succeeded. + error_message: Optional error message if failed. 
+ """ + try: + with fresh_db_session() as db: + metric = ToolMetric( + tool_id=tool_id, + timestamp=datetime.now(timezone.utc), + response_time=response_time, + is_success=success, + error_message=error_message, + ) + db.add(metric) + db.commit() + except Exception as e: + logger.error(f"Failed to write tool metric: {e}") + def _write_resource_metric_immediately( self, resource_id: str, @@ -681,6 +830,35 @@ def _write_server_metric_immediately( except Exception as e: logger.error(f"Failed to write server metric: {e}") + def _write_server_metric_with_duration_immediately( + self, + server_id: str, + response_time: float, + success: bool, + error_message: Optional[str], + ) -> None: + """Write a single server metric with pre-calculated duration immediately. + + Args: + server_id: UUID of the server. + response_time: Pre-calculated response time in seconds. + success: Whether the operation succeeded. + error_message: Optional error message if failed. + """ + try: + with fresh_db_session() as db: + metric = ServerMetric( + server_id=server_id, + timestamp=datetime.now(timezone.utc), + response_time=response_time, + is_success=success, + error_message=error_message, + ) + db.add(metric) + db.commit() + except Exception as e: + logger.error(f"Failed to write server metric: {e}") + def _write_a2a_agent_metric_immediately( self, a2a_agent_id: str, diff --git a/mcpgateway/services/prompt_service.py b/mcpgateway/services/prompt_service.py index 49a25f38f8..ec336ea46e 100644 --- a/mcpgateway/services/prompt_service.py +++ b/mcpgateway/services/prompt_service.py @@ -25,6 +25,9 @@ # Third-Party from jinja2 import Environment, meta, select_autoescape, Template +from mcp import ClientSession +from mcp.client.sse import sse_client +from mcp.client.streamable_http import streamablehttp_client import orjson from pydantic import ValidationError from sqlalchemy import and_, delete, desc, not_, or_, select @@ -46,15 +49,19 @@ from mcpgateway.services.base_service import BaseService 
from mcpgateway.services.event_service import EventService from mcpgateway.services.logging_service import LoggingService +from mcpgateway.services.mcp_session_pool import get_mcp_session_pool, TransportType from mcpgateway.services.metrics_buffer_service import get_metrics_buffer_service from mcpgateway.services.metrics_cleanup_service import delete_metrics_in_batches, pause_rollup_during_purge from mcpgateway.services.observability_service import current_trace_id, ObservabilityService from mcpgateway.services.structured_logger import get_structured_logger from mcpgateway.services.team_management_service import TeamManagementService from mcpgateway.utils.create_slug import slugify +from mcpgateway.utils.gateway_access import build_gateway_auth_headers from mcpgateway.utils.metrics_common import build_top_performers from mcpgateway.utils.pagination import unified_paginate +from mcpgateway.utils.services_auth import decode_auth from mcpgateway.utils.sqlalchemy_modifier import json_contains_tag_expr +from mcpgateway.utils.url_auth import apply_query_param_auth, sanitize_exception_message # Cache import (lazy to avoid circular dependencies) _REGISTRY_CACHE = None @@ -244,6 +251,108 @@ def __init__(self) -> None: self._jinja_env = _get_jinja_env() self._plugin_manager: PluginManager | None = get_plugin_manager() + @staticmethod + def _should_fetch_gateway_prompt(prompt: DbPrompt) -> bool: + """Return whether a prompt must be executed against its source gateway. + + Federated prompts are synced into the catalog as metadata via + ``list_prompts()``. Those records often have ``template=""``, which + means the gateway must call the upstream MCP ``prompts/get`` endpoint + instead of trying to render a local template. + + Args: + prompt: Prompt ORM object resolved from the catalog. + + Returns: + ``True`` when the prompt is gateway-backed and has no local template. 
+ """ + return bool(getattr(prompt, "gateway_id", None)) and not bool(getattr(prompt, "template", "")) + + async def _fetch_gateway_prompt_result(self, prompt: DbPrompt, arguments: Optional[Dict[str, str]], user_identity: Optional[str]) -> PromptResult: + """Fetch a rendered prompt from the upstream MCP gateway. + + Args: + prompt: Gateway-backed prompt record from the catalog. + arguments: Optional prompt-rendering arguments. + user_identity: Effective requester email for session-pool isolation. + + Returns: + Prompt result normalized into ContextForge models. + + Raises: + PromptError: If the gateway prompt cannot be fetched. + """ + gateway = getattr(prompt, "gateway", None) + if gateway is None: + raise PromptError(f"Prompt '{prompt.name}' is gateway-backed but missing gateway metadata") + + gateway_url = str(gateway.url) + headers = build_gateway_auth_headers(gateway) + auth_query_params_decrypted: Optional[Dict[str, str]] = None + + if getattr(gateway, "auth_type", None) == "query_param" and getattr(gateway, "auth_query_params", None): + auth_query_params_decrypted = {} + for param_key, encrypted_value in (gateway.auth_query_params or {}).items(): + try: + decoded = decode_auth(encrypted_value) + auth_query_params_decrypted[param_key] = decoded.get(param_key, "") + except Exception as exc: + raise PromptError(f"Failed to decode query-parameter auth for prompt gateway '{gateway.id}'") from exc + if auth_query_params_decrypted: + gateway_url = apply_query_param_auth(gateway_url, auth_query_params_decrypted) + + remote_name = getattr(prompt, "original_name", None) or prompt.name + pool_user_identity = (user_identity or "anonymous").strip() or "anonymous" + gateway_id = str(getattr(gateway, "id", "")) + transport = str(getattr(gateway, "transport", "streamable_http") or "streamable_http").lower() + pool_transport_type = TransportType.SSE if transport == "sse" else TransportType.STREAMABLE_HTTP + prompt_arguments = arguments or None + + try: + if 
settings.mcp_session_pool_enabled: + try: + pool = get_mcp_session_pool() + except RuntimeError: + pool = None + if pool is not None: + async with pool.session( + url=gateway_url, + headers=headers, + transport_type=pool_transport_type, + user_identity=pool_user_identity, + gateway_id=gateway_id, + ) as pooled: + remote_result = await pooled.session.get_prompt(remote_name, arguments=prompt_arguments) + return PromptResult( + messages=[ + Message.model_validate(message.model_dump(by_alias=True, exclude_none=True) if hasattr(message, "model_dump") else message) + for message in getattr(remote_result, "messages", []) or [] + ], + description=getattr(remote_result, "description", None) or prompt.description, + ) + + if transport == "sse": + async with sse_client(url=gateway_url, headers=headers, timeout=settings.health_check_timeout) as streams: + async with ClientSession(*streams) as session: + await session.initialize() + remote_result = await session.get_prompt(remote_name, arguments=prompt_arguments) + else: + async with streamablehttp_client(url=gateway_url, headers=headers, timeout=settings.health_check_timeout) as (read_stream, write_stream, _get_session_id): + async with ClientSession(read_stream, write_stream) as session: + await session.initialize() + remote_result = await session.get_prompt(remote_name, arguments=prompt_arguments) + + return PromptResult( + messages=[ + Message.model_validate(message.model_dump(by_alias=True, exclude_none=True) if hasattr(message, "model_dump") else message) + for message in getattr(remote_result, "messages", []) or [] + ], + description=getattr(remote_result, "description", None) or prompt.description, + ) + except Exception as exc: + sanitized_error = sanitize_exception_message(str(exc), auth_query_params_decrypted) + raise PromptError(f"Failed to fetch prompt '{remote_name}' from gateway: {sanitized_error}") from exc + @staticmethod def validate_arguments_json(args_value: Any, context: str = "") -> List[Dict[str, Any]]: 
"""Validate and parse prompt arguments JSON. @@ -1642,15 +1751,15 @@ async def get_prompt( # Find prompt by ID first, then by name (active prompts only) search_key = str(prompt_id) - prompt = db.execute(select(DbPrompt).where(DbPrompt.id == prompt_id).where(DbPrompt.enabled)).scalar_one_or_none() + prompt = db.execute(select(DbPrompt).options(joinedload(DbPrompt.gateway)).where(DbPrompt.id == prompt_id).where(DbPrompt.enabled)).scalar_one_or_none() if not prompt: - prompt = db.execute(select(DbPrompt).where(DbPrompt.name == prompt_id).where(DbPrompt.enabled)).scalar_one_or_none() + prompt = db.execute(select(DbPrompt).options(joinedload(DbPrompt.gateway)).where(DbPrompt.name == prompt_id).where(DbPrompt.enabled)).scalar_one_or_none() if not prompt: # Check if an inactive prompt exists - inactive_prompt = db.execute(select(DbPrompt).where(DbPrompt.id == prompt_id).where(not_(DbPrompt.enabled))).scalar_one_or_none() + inactive_prompt = db.execute(select(DbPrompt).options(joinedload(DbPrompt.gateway)).where(DbPrompt.id == prompt_id).where(not_(DbPrompt.enabled))).scalar_one_or_none() if not inactive_prompt: - inactive_prompt = db.execute(select(DbPrompt).where(DbPrompt.name == prompt_id).where(not_(DbPrompt.enabled))).scalar_one_or_none() + inactive_prompt = db.execute(select(DbPrompt).options(joinedload(DbPrompt.gateway)).where(DbPrompt.name == prompt_id).where(not_(DbPrompt.enabled))).scalar_one_or_none() if inactive_prompt: raise PromptNotFoundError(f"Prompt '{search_key}' exists but is inactive") @@ -1679,7 +1788,11 @@ async def get_prompt( raise PromptNotFoundError(f"Prompt not found: {search_key}") server_scoped = True - if not arguments: + if self._should_fetch_gateway_prompt(prompt): + # Release the read transaction before any remote network I/O. 
+ db.commit() + result = await self._fetch_gateway_prompt_result(prompt, arguments, user) + elif not arguments: result = PromptResult( messages=[ Message( @@ -1704,7 +1817,7 @@ async def get_prompt( if has_post_fetch: post_result, _ = await self._plugin_manager.invoke_hook( PromptHookType.PROMPT_POST_FETCH, - payload=PromptPosthookPayload(prompt_id=str(prompt.id), result=result), + payload=PromptPosthookPayload(prompt_id=prompt.name, result=result), global_context=global_context, local_contexts=context_table, violations_as_exceptions=True, diff --git a/mcpgateway/services/resource_service.py b/mcpgateway/services/resource_service.py index ec47de6496..b683029cf6 100644 --- a/mcpgateway/services/resource_service.py +++ b/mcpgateway/services/resource_service.py @@ -41,7 +41,7 @@ import parse from pydantic import ValidationError from sqlalchemy import and_, delete, desc, not_, or_, select -from sqlalchemy.exc import IntegrityError, OperationalError +from sqlalchemy.exc import IntegrityError, MultipleResultsFound, OperationalError from sqlalchemy.orm import joinedload, Session # First-Party @@ -2121,10 +2121,27 @@ async def read_resource( # Matches uri (modified value from pluggins if applicable) # with uri from resource DB # if uri is of type resource template then resource is retreived from DB - query = select(DbResource).where(DbResource.uri == str(uri)).where(DbResource.enabled) + query = select(DbResource) + if server_id: + query = query.join( + server_resource_association, + server_resource_association.c.resource_id == DbResource.id, + ).where(server_resource_association.c.server_id == server_id) + query = query.where(DbResource.uri == str(uri)).where(DbResource.enabled) if include_inactive: - query = select(DbResource).where(DbResource.uri == str(uri)) - resource_db = db.execute(query).scalar_one_or_none() + query = select(DbResource) + if server_id: + query = query.join( + server_resource_association, + server_resource_association.c.resource_id == DbResource.id, 
+ ).where(server_resource_association.c.server_id == server_id) + query = query.where(DbResource.uri == str(uri)) + try: + resource_db = db.execute(query).scalar_one_or_none() + except MultipleResultsFound as exc: + if server_id: + raise ResourceError(f"Multiple resources matched URI '{uri}' for server '{server_id}'.") from exc + raise ResourceError(f"Resource URI '{uri}' is ambiguous across multiple servers; use /servers/{{id}}/mcp.") from exc # Check for direct_proxy mode if resource_db and resource_db.gateway and getattr(resource_db.gateway, "gateway_mode", "cache") == "direct_proxy" and settings.mcpgateway_direct_proxy_enabled: @@ -2180,8 +2197,23 @@ async def read_resource( # Normal cache mode - resource found in DB content = resource_db.content else: - # Check the inactivity first - check_inactivity = db.execute(select(DbResource).where(DbResource.uri == str(resource_uri)).where(not_(DbResource.enabled))).scalar_one_or_none() + # Check the inactivity first using the same server scope that + # governed the active lookup. Without this, duplicate URIs + # across different virtual servers/gateways can produce + # ambiguous results even though the current request is + # already scoped to a single server. 
+ inactive_query = select(DbResource) + if server_id: + inactive_query = inactive_query.join( + server_resource_association, + server_resource_association.c.resource_id == DbResource.id, + ).where(server_resource_association.c.server_id == server_id) + try: + check_inactivity = db.execute(inactive_query.where(DbResource.uri == str(resource_uri)).where(not_(DbResource.enabled))).scalar_one_or_none() + except MultipleResultsFound as exc: + if server_id: + raise ResourceError(f"Multiple inactive resources matched URI '{resource_uri}' for server '{server_id}'.") from exc + raise ResourceError(f"Resource URI '{resource_uri}' is ambiguous across multiple servers; use /servers/{{id}}/mcp.") from exc if check_inactivity: raise ResourceNotFoundError(f"Resource '{resource_uri}' exists but is inactive") diff --git a/mcpgateway/services/tool_service.py b/mcpgateway/services/tool_service.py index 89e1f3f9fc..2b07efb3a6 100644 --- a/mcpgateway/services/tool_service.py +++ b/mcpgateway/services/tool_service.py @@ -2152,6 +2152,79 @@ async def list_server_tools( return result + async def list_server_mcp_tool_definitions( + self, + db: Session, + server_id: str, + *, + include_inactive: bool = False, + user_email: Optional[str] = None, + token_teams: Optional[List[str]] = None, + ) -> List[Dict[str, Any]]: + """Return server-scoped MCP tool definitions without building full ToolRead models. + + This is a hot-path helper for the internal Rust -> Python seam. It keeps + auth and visibility semantics aligned with ``list_server_tools`` while + avoiding the heavier ``ToolRead`` conversion that is only needed for the + admin/API surfaces. + + Args: + db: Active database session. + server_id: Virtual server identifier used to scope the tool listing. + include_inactive: Whether disabled tools should be included. + user_email: Requester email for owner-scoped visibility checks. + token_teams: Normalized team scope from the caller token. 
+ + Returns: + A list of MCP-compatible tool definition dictionaries. + """ + name_column = DbTool.__table__.c.name + query = ( + select( + name_column.label("name"), + DbTool.description.label("description"), + DbTool.input_schema.label("input_schema"), + DbTool.output_schema.label("output_schema"), + DbTool.annotations.label("annotations"), + DbTool.owner_email.label("owner_email"), + DbTool.team_id.label("team_id"), + DbTool.visibility.label("visibility"), + ) + .join(server_tool_association, DbTool.id == server_tool_association.c.tool_id) + .where(server_tool_association.c.server_id == server_id) + ) + + if not include_inactive: + query = query.where(DbTool.enabled) + + if user_email is not None or token_teams is not None: + team_ids = token_teams if token_teams is not None else [] + is_public_only_token = token_teams is not None and len(token_teams) == 0 + + access_conditions = [DbTool.visibility == "public"] + if not is_public_only_token and user_email: + access_conditions.append(DbTool.owner_email == user_email) + if team_ids: + access_conditions.append(and_(DbTool.team_id.in_(team_ids), DbTool.visibility.in_(["team", "public"]))) + query = query.where(or_(*access_conditions)) + + rows = db.execute(query).mappings().all() + db.commit() + + result: List[Dict[str, Any]] = [] + for row in rows: + payload: Dict[str, Any] = { + "name": row["name"], + "description": row["description"], + "inputSchema": row["input_schema"] or {"type": "object", "properties": {}}, + "annotations": row["annotations"] or {}, + } + if row["output_schema"] is not None: + payload["outputSchema"] = row["output_schema"] + result.append(payload) + + return result + async def list_tools_for_user( self, db: Session, @@ -2755,6 +2828,319 @@ async def invoke_tool_direct( logger.exception(f"Direct proxy tool invocation failed for {name}: {e}") raise ToolInvocationError(f"Direct proxy tool invocation failed: {str(e)}") + async def prepare_rust_mcp_tool_execution( + self, + db: Session, + name: 
str, + request_headers: Optional[Dict[str, str]] = None, + app_user_email: Optional[str] = None, + user_email: Optional[str] = None, + token_teams: Optional[List[str]] = None, + server_id: Optional[str] = None, + ) -> Dict[str, Any]: + """Build a narrow MCP execution plan for the Rust runtime hot path. + + This reuses Python's existing auth, scoping, and secret-handling logic, + but stops before the actual upstream MCP call. The Rust runtime can then + execute the call directly for the simple streamable HTTP MCP cases that + dominate load tests, while Python remains the authority for policy. + + Args: + db: Active database session. + name: Tool name requested by the caller. + request_headers: Incoming request headers used for passthrough/auth decisions. + app_user_email: OAuth application user email, when present. + user_email: Effective requester email after auth normalization. + token_teams: Normalized team scope from the caller token. + server_id: Optional virtual server identifier restricting tool access. + + Returns: + A Rust execution plan dictionary, or a fallback descriptor when direct + Rust execution is not eligible. + + Raises: + ToolNotFoundError: If the requested tool is not visible or invocable. + ToolInvocationError: If gateway auth preparation fails or the tool name is ambiguous. 
+ """ + if self._plugin_manager and (self._plugin_manager.has_hooks_for(ToolHookType.TOOL_PRE_INVOKE) or self._plugin_manager.has_hooks_for(ToolHookType.TOOL_POST_INVOKE)): + return {"eligible": False, "fallbackReason": "plugin-hooks-configured"} + + if current_trace_id.get(): + return {"eligible": False, "fallbackReason": "observability-trace-active"} + + gateway_id_from_header = extract_gateway_id_from_headers(request_headers) + is_direct_proxy = False + tool = None + gateway = None + tool_selected_from_server_scope = False + tool_payload: Dict[str, Any] = {} + gateway_payload: Optional[Dict[str, Any]] = None + if gateway_id_from_header: + gateway = db.execute(select(DbGateway).where(DbGateway.id == gateway_id_from_header)).scalar_one_or_none() + if gateway and gateway.gateway_mode == "direct_proxy" and settings.mcpgateway_direct_proxy_enabled: + if not await check_gateway_access(db, gateway, user_email, token_teams): + raise ToolNotFoundError(f"Tool not found: {name}") + is_direct_proxy = True + gateway_payload = { + "id": str(gateway.id), + "name": gateway.name, + "url": gateway.url, + "auth_type": gateway.auth_type, + "auth_value": encode_auth(gateway.auth_value) if isinstance(gateway.auth_value, dict) else gateway.auth_value, + "auth_query_params": gateway.auth_query_params, + "oauth_config": gateway.oauth_config, + "ca_certificate": gateway.ca_certificate, + "ca_certificate_sig": gateway.ca_certificate_sig, + "passthrough_headers": gateway.passthrough_headers, + "gateway_mode": gateway.gateway_mode, + } + tool_payload = { + "id": None, + "name": name, + "original_name": name, + "enabled": True, + "reachable": True, + "integration_type": "MCP", + "request_type": "streamablehttp", + "gateway_id": str(gateway.id), + } + + if not is_direct_proxy: + tool_lookup_cache = _get_tool_lookup_cache() + cached_payload = await tool_lookup_cache.get(name) if tool_lookup_cache.enabled else None + + if cached_payload: + status = cached_payload.get("status", "active") + if 
status == "missing": + raise ToolNotFoundError(f"Tool not found: {name}") + if status == "inactive": + raise ToolNotFoundError(f"Tool '{name}' exists but is inactive") + if status == "offline": + raise ToolNotFoundError(f"Tool '{name}' exists but is currently offline. Please verify if it is running.") + tool_payload = cached_payload.get("tool") or {} + gateway_payload = cached_payload.get("gateway") + + if not tool_payload: + tools = self._load_invocable_tools(db, name, server_id=server_id) + tool_selected_from_server_scope = bool(server_id) + + if not tools: + raise ToolNotFoundError(f"Tool not found: {name}") + + multiple_found = len(tools) > 1 + if not multiple_found: + tool = tools[0] + else: + visibility_priority = {"team": 0, "private": 1, "public": 2} + accessible_tools: list[tuple[int, Any]] = [] + for candidate in tools: + tool_dict = {"visibility": candidate.visibility, "team_id": candidate.team_id, "owner_email": candidate.owner_email} + if await self._check_tool_access(db, tool_dict, user_email, token_teams): + priority = visibility_priority.get(candidate.visibility, 99) + accessible_tools.append((priority, candidate)) + + if not accessible_tools: + raise ToolNotFoundError(f"Tool not found: {name}") + + accessible_tools.sort(key=lambda item: item[0]) + best_priority = accessible_tools[0][0] + best_tools = [candidate for priority, candidate in accessible_tools if priority == best_priority] + if len(best_tools) > 1: + raise ToolInvocationError(f"Multiple tools found with name '{name}' at same priority level. Tool name is ambiguous.") + tool = best_tools[0] + + if not tool.enabled: + raise ToolNotFoundError(f"Tool '{name}' exists but is inactive") + + if not tool.reachable: + await tool_lookup_cache.set_negative(name, "offline") + raise ToolNotFoundError(f"Tool '{name}' exists but is currently offline. 
Please verify if it is running.") + + gateway = tool.gateway + cache_payload = self._build_tool_cache_payload(tool, gateway) + tool_payload = cache_payload.get("tool") or {} + gateway_payload = cache_payload.get("gateway") + if not multiple_found: + await tool_lookup_cache.set(name, cache_payload, gateway_id=tool_payload.get("gateway_id")) + + if tool_payload.get("enabled") is False: + raise ToolNotFoundError(f"Tool '{name}' exists but is inactive") + if tool_payload.get("reachable") is False: + raise ToolNotFoundError(f"Tool '{name}' exists but is currently offline. Please verify if it is running.") + + if is_direct_proxy: + return {"eligible": False, "fallbackReason": "direct-proxy"} + + if not await self._check_tool_access(db, tool_payload, user_email, token_teams): + raise ToolNotFoundError(f"Tool not found: {name}") + + if server_id and not tool_selected_from_server_scope: + tool_id_for_check = tool_payload.get("id") + if not tool_id_for_check: + raise ToolNotFoundError(f"Tool not found: {name}") + server_match = db.execute( + select(server_tool_association.c.tool_id).where( + server_tool_association.c.server_id == server_id, + server_tool_association.c.tool_id == tool_id_for_check, + ) + ).first() + if not server_match: + raise ToolNotFoundError(f"Tool not found: {name}") + + tool_integration_type = tool_payload.get("integration_type") + if tool_integration_type != "MCP": + return {"eligible": False, "fallbackReason": f"unsupported-integration:{tool_integration_type or 'unknown'}"} + + tool_request_type = tool_payload.get("request_type") + transport = tool_request_type.lower() if tool_request_type else "sse" + if transport != "streamablehttp": + return {"eligible": False, "fallbackReason": f"unsupported-transport:{transport}"} + + tool_jsonpath_filter = tool_payload.get("jsonpath_filter") + if tool_jsonpath_filter: + return {"eligible": False, "fallbackReason": "jsonpath-filter-configured"} + + passthrough_allowed = 
global_config_cache.get_passthrough_headers(db, settings.default_passthrough_headers) + + if tool is not None: + gateway = tool.gateway + + tool_name_original = tool_payload.get("original_name") or tool_payload.get("name") or name + tool_id = tool_payload.get("id") + tool_gateway_id = tool_payload.get("gateway_id") + tool_timeout_ms = tool_payload.get("timeout_ms") + effective_timeout = (tool_timeout_ms / 1000) if tool_timeout_ms else settings.tool_timeout + + has_gateway = gateway_payload is not None + gateway_url = gateway_payload.get("url") if has_gateway else None + gateway_name = gateway_payload.get("name") if has_gateway else None + gateway_auth_type = gateway_payload.get("auth_type") if has_gateway else None + gateway_auth_value = gateway_payload.get("auth_value") if has_gateway and isinstance(gateway_payload.get("auth_value"), str) else None + gateway_auth_query_params = gateway_payload.get("auth_query_params") if has_gateway and isinstance(gateway_payload.get("auth_query_params"), dict) else None + gateway_oauth_config = gateway_payload.get("oauth_config") if has_gateway and isinstance(gateway_payload.get("oauth_config"), dict) else None + if has_gateway and gateway is not None: + runtime_gateway_auth_value = getattr(gateway, "auth_value", None) + if isinstance(runtime_gateway_auth_value, dict): + gateway_auth_value = encode_auth(runtime_gateway_auth_value) + elif isinstance(runtime_gateway_auth_value, str): + gateway_auth_value = runtime_gateway_auth_value + runtime_gateway_query_params = getattr(gateway, "auth_query_params", None) + if isinstance(runtime_gateway_query_params, dict): + gateway_auth_query_params = runtime_gateway_query_params + runtime_gateway_oauth_config = getattr(gateway, "oauth_config", None) + if isinstance(runtime_gateway_oauth_config, dict): + gateway_oauth_config = runtime_gateway_oauth_config + gateway_ca_cert = gateway_payload.get("ca_certificate") if has_gateway else None + gateway_id_str = gateway_payload.get("id") if 
has_gateway else None + + if tool is None and has_gateway: + requires_gateway_auth_hydration = gateway_auth_type in {"basic", "bearer", "authheaders", "oauth", "query_param"} + if requires_gateway_auth_hydration: + tool_id_for_hydration = tool_payload.get("id") + if tool_id_for_hydration: + tool_auth_row = db.execute(select(DbTool).options(joinedload(DbTool.gateway)).where(DbTool.id == tool_id_for_hydration)).scalar_one_or_none() + if tool_auth_row and tool_auth_row.gateway: + hydrated_gateway_auth_value = getattr(tool_auth_row.gateway, "auth_value", None) + if isinstance(hydrated_gateway_auth_value, dict): + gateway_auth_value = encode_auth(hydrated_gateway_auth_value) + elif isinstance(hydrated_gateway_auth_value, str): + gateway_auth_value = hydrated_gateway_auth_value + hydrated_gateway_query_params = getattr(tool_auth_row.gateway, "auth_query_params", None) + if isinstance(hydrated_gateway_query_params, dict): + gateway_auth_query_params = hydrated_gateway_query_params + hydrated_gateway_oauth_config = getattr(tool_auth_row.gateway, "oauth_config", None) + if isinstance(hydrated_gateway_oauth_config, dict): + gateway_oauth_config = hydrated_gateway_oauth_config + + gateway_auth_query_params_decrypted: Optional[Dict[str, str]] = None + if gateway_auth_type == "query_param" and gateway_auth_query_params: + gateway_auth_query_params_decrypted = {} + for param_key, encrypted_value in gateway_auth_query_params.items(): + if encrypted_value: + try: + decrypted = decode_auth(encrypted_value) + gateway_auth_query_params_decrypted[param_key] = decrypted.get(param_key, "") + except Exception: # noqa: S110 + logger.debug(f"Failed to decrypt query param '{param_key}' for Rust MCP tool execution plan") + if gateway_auth_query_params_decrypted and gateway_url: + gateway_url = apply_query_param_auth(gateway_url, gateway_auth_query_params_decrypted) + + if gateway_ca_cert: + return {"eligible": False, "fallbackReason": "custom-ca-certificate"} + + if not gateway_url: + return 
{"eligible": False, "fallbackReason": "missing-gateway-url"} + + if has_gateway and gateway_auth_type == "oauth" and isinstance(gateway_oauth_config, dict) and gateway_oauth_config: + grant_type = gateway_oauth_config.get("grant_type", "client_credentials") + if grant_type == "authorization_code": + try: + # First-Party + from mcpgateway.services.token_storage_service import TokenStorageService # pylint: disable=import-outside-toplevel + + with fresh_db_session() as token_db: + token_storage = TokenStorageService(token_db) + if not app_user_email: + raise ToolInvocationError(f"User authentication required for OAuth-protected gateway '{gateway_name}'. Please ensure you are authenticated.") + access_token = await token_storage.get_user_token(gateway_id_str, app_user_email) + + if access_token: + headers = {"Authorization": f"Bearer {access_token}"} + else: + raise ToolInvocationError(f"Please authorize {gateway_name} first. Visit /oauth/authorize/{gateway_id_str} to complete OAuth flow.") + except Exception as e: + logger.error(f"Failed to obtain stored OAuth token for gateway {gateway_name}: {e}") + raise ToolInvocationError(f"OAuth token retrieval failed for gateway: {str(e)}") + else: + try: + access_token = await self.oauth_manager.get_access_token(gateway_oauth_config) + headers = {"Authorization": f"Bearer {access_token}"} + except Exception as e: + logger.error(f"Failed to obtain OAuth access token for gateway {gateway_name}: {e}") + raise ToolInvocationError(f"OAuth authentication failed for gateway: {str(e)}") + else: + headers = decode_auth(gateway_auth_value) if gateway_auth_value else {} + + if request_headers: + headers = compute_passthrough_headers_cached( + request_headers, + headers, + passthrough_allowed, + gateway_auth_type=gateway_auth_type, + gateway_passthrough_headers=gateway_payload.get("passthrough_headers") if has_gateway else None, + ) + + runtime_headers = {str(header_name): str(header_value) for header_name, header_value in headers.items() 
if header_name and header_value} + + return { + "eligible": True, + "transport": transport, + "serverUrl": gateway_url, + "remoteToolName": tool_name_original, + "headers": runtime_headers, + "timeoutMs": int(effective_timeout * 1000), + "gatewayId": tool_gateway_id, + "toolName": name, + "toolId": tool_id or None, + "serverId": server_id, + } + + def _load_invocable_tools(self, db: Session, name: str, server_id: Optional[str] = None) -> List[DbTool]: + """Load candidate tools for invocation, narrowing to a virtual server when possible. + + Args: + db: Active database session. + name: Tool name to resolve. + server_id: Optional virtual server identifier used to constrain results. + + Returns: + A list of candidate tool ORM rows matching the request. + """ + query = select(DbTool).options(joinedload(DbTool.gateway)).where(DbTool.name == name) + if server_id: + query = query.join(server_tool_association, DbTool.id == server_tool_association.c.tool_id).where(server_tool_association.c.server_id == server_id) + return db.execute(query).scalars().all() + async def invoke_tool( self, db: Session, @@ -2885,7 +3271,7 @@ async def invoke_tool( # Use a single query to avoid a race between separate enabled/inactive lookups. # Use scalars().all() instead of scalar_one_or_none() to handle duplicate # tool names across teams without crashing on MultipleResultsFound. - tools = db.execute(select(DbTool).options(joinedload(DbTool.gateway)).where(DbTool.name == name)).scalars().all() + tools = self._load_invocable_tools(db, name, server_id=server_id) if not tools: raise ToolNotFoundError(f"Tool not found: {name}") diff --git a/mcpgateway/templates/overview_partial.html b/mcpgateway/templates/overview_partial.html index cf486601a7..4390ef5c5b 100644 --- a/mcpgateway/templates/overview_partial.html +++ b/mcpgateway/templates/overview_partial.html @@ -19,6 +19,103 @@

+
+
+
+ MCP Runtime +
+
+ + {% if mcp_runtime.mounted == 'rust' %}🦀 Rust MCP Core{% else %}🐍 + Python MCP Core{% endif %} + + + {{ mcp_runtime.mode | replace('-', ' ') }} + + {% if mcp_runtime.mode == 'rust-managed' and mcp_runtime.mounted == 'python' %} + + Shadow / safe fallback + + {% elif mcp_runtime.mode == 'python-rust-built-disabled' %} + + Rust build available + + {% endif %} +
+
+ +
+
+
+ Public MCP +
+
+ {% if mcp_runtime.mounted == 'rust' %}🦀 Rust{% else %}🐍 Python{% endif %} +
+
+
+
+ Session +
+
+ {% if mcp_runtime.session_core_mode == 'rust' %}🦀 Rust{% else %}🐍 Python{% endif %} +
+
+
+
+ Replay +
+
+ {% if mcp_runtime.resume_core_mode == 'rust' %}🦀 Rust{% else %}🐍 Python{% endif %} +
+
+
+
+ Live Stream +
+
+ {% if mcp_runtime.live_stream_core_mode == 'rust' %}🦀 Rust{% else %}🐍 Python{% endif %} +
+
+
+
+ Affinity +
+
+ {% if mcp_runtime.affinity_core_mode == 'rust' %}🦀 Rust{% else %}🐍 Python{% endif %} +
+
+
+
+ Auth Reuse +
+
+ {% if mcp_runtime.session_auth_reuse_mode == 'rust' %}🦀 Rust{% else %}🐍 Python{% endif %} +
+
+
+
+ +
diff --git a/mcpgateway/templates/version_info_partial.html b/mcpgateway/templates/version_info_partial.html index 02609502e9..04593d14f0 100644 --- a/mcpgateway/templates/version_info_partial.html +++ b/mcpgateway/templates/version_info_partial.html @@ -2,6 +2,7 @@

@@ -57,7 +58,7 @@

-
+

+ +
+
+
+

+ + MCP Runtime +

+

+ Active MCP transport and core ownership for this gateway instance. +

+
+
+ + {% if payload.mcp_runtime.mounted == 'rust' %}🦀 Rust MCP Core{% else %}🐍 Python MCP Core{% endif %} + + + {{ payload.mcp_runtime.mode | replace('-', ' ') }} + +
+
+ +
+
+
+ Public Transport +
+
+ {% if payload.mcp_runtime.mounted == 'rust' %}🦀 Rust{% else %}🐍 Python{% endif %} +
+
+
+
+ Session Core +
+
+ {% if payload.mcp_runtime.session_core_mode == 'rust' %}🦀 Rust{% else %}🐍 Python{% endif %} +
+
+
+
+ Event Store +
+
+ {% if payload.mcp_runtime.event_store_mode == 'rust' %}🦀 Rust{% else %}🐍 Python{% endif %} +
+
+
+
+ Replay / Resume +
+
+ {% if payload.mcp_runtime.resume_core_mode == 'rust' %}🦀 Rust{% else %}🐍 Python{% endif %} +
+
+
+
+ Live Stream +
+
+ {% if payload.mcp_runtime.live_stream_core_mode == 'rust' %}🦀 Rust{% else %}🐍 Python{% endif %} +
+
+
+
+ Affinity +
+
+ {% if payload.mcp_runtime.affinity_core_mode == 'rust' %}🦀 Rust{% else %}🐍 Python{% endif %} +
+
+
+
+ Session Auth Reuse +
+
+ {% if payload.mcp_runtime.session_auth_reuse_mode == 'rust' %}🦀 Rust{% else %}🐍 Python{% endif %} +
+
+
+
+ Rust Build Included +
+
+ {% if payload.mcp_runtime.rust_build_included %}Yes{% else %}No{% endif %} +
+
+
+ + {% if payload.mcp_runtime.mode == 'rust-managed' and payload.mcp_runtime.mounted == 'python' %} +
+ Public MCP traffic is still on the Python path. The Rust sidecar is present internally for managed rollout or safe fallback operation. +
+ {% elif payload.mcp_runtime.mode == 'python-rust-built-disabled' %} +
+ This image includes Rust MCP artifacts, but the runtime is currently disabled and the public MCP path remains Python-only. +
+ {% endif %} +
+ -
+

-
+

-
+

diff --git a/mcpgateway/transports/rust_mcp_runtime_proxy.py b/mcpgateway/transports/rust_mcp_runtime_proxy.py new file mode 100644 index 0000000000..1da38e8e9c --- /dev/null +++ b/mcpgateway/transports/rust_mcp_runtime_proxy.py @@ -0,0 +1,268 @@ +# -*- coding: utf-8 -*- +"""Location: ./mcpgateway/transports/rust_mcp_runtime_proxy.py +Copyright 2025 +SPDX-License-Identifier: Apache-2.0 + +Experimental MCP transport proxy for the Rust runtime edge. + +This module keeps Python auth/path-rewrite middleware in front of MCP traffic +while proxying MCP transport requests to the optional Rust runtime sidecar. +""" + +# Future +from __future__ import annotations + +# Standard +import asyncio +import base64 +import logging +import re +from urllib.parse import urlsplit, urlunsplit + +# Third-Party +import httpx +import orjson +from starlette.types import Receive, Scope, Send + +# First-Party +from mcpgateway.config import settings +from mcpgateway.services.http_client_service import get_http_client, get_http_limits +from mcpgateway.transports.streamablehttp_transport import get_streamable_http_auth_context +from mcpgateway.utils.orjson_response import ORJSONResponse + +logger = logging.getLogger(__name__) + +_SERVER_ID_RE = re.compile(r"/servers/(?P[a-fA-F0-9\-]+)/mcp/?$") +_CONTEXTFORGE_SERVER_ID_HEADER = "x-contextforge-server-id" +_CONTEXTFORGE_AUTH_CONTEXT_HEADER = "x-contextforge-auth-context" +_CONTEXTFORGE_AFFINITY_FORWARDED_HEADER = "x-contextforge-affinity-forwarded" +_CLIENT_ERROR_DETAIL = "See server logs" +_REQUEST_HOP_BY_HOP_HEADERS = frozenset({"host", "content-length", "connection", "transfer-encoding", "keep-alive"}) +_FORWARDED_CHAIN_HEADERS = frozenset({"forwarded", "x-forwarded-for", "x-forwarded-host", "x-forwarded-port", "x-forwarded-proto"}) +_INTERNAL_ONLY_REQUEST_HEADERS = frozenset( + { + "x-forwarded-internally", + "x-original-worker", + "x-mcp-session-id", + "x-contextforge-mcp-runtime", + _CONTEXTFORGE_SERVER_ID_HEADER, + 
_CONTEXTFORGE_AUTH_CONTEXT_HEADER, + _CONTEXTFORGE_AFFINITY_FORWARDED_HEADER, + } +) +_RESPONSE_HOP_BY_HOP_HEADERS = frozenset({"connection", "transfer-encoding", "keep-alive"}) + + +class RustMCPRuntimeProxy: + """Proxy MCP transport traffic to the experimental Rust runtime.""" + + def __init__(self, python_fallback_app) -> None: + """Initialize the proxy with the existing Python MCP transport fallback. + + Args: + python_fallback_app: Python MCP transport app used when Rust cannot handle + the request. + """ + self.python_fallback_app = python_fallback_app + self._uds_client: httpx.AsyncClient | None = None + self._uds_client_lock = asyncio.Lock() + + async def handle_streamable_http(self, scope: Scope, receive: Receive, send: Send) -> None: + """Route MCP transport requests to the Rust runtime and preserve Python fallback for others. + + Args: + scope: Incoming ASGI scope. + receive: ASGI receive callable. + send: ASGI send callable. + """ + if scope.get("type") != "http": + await self.python_fallback_app(scope, receive, send) + return + + method = str(scope.get("method", "GET")).upper() + if method not in {"GET", "POST", "DELETE"}: + await self.python_fallback_app(scope, receive, send) + return + + target_url = _build_runtime_mcp_url(scope) + headers = _build_forward_headers(scope) + timeout = httpx.Timeout(settings.experimental_rust_mcp_runtime_timeout_seconds) + + try: + client = await self._get_runtime_client() + async with client.stream( + method, + target_url, + content=_stream_request_body(receive) if method == "POST" else b"", + headers=headers, + timeout=timeout, + follow_redirects=False, + ) as response: + await send( + { + "type": "http.response.start", + "status": response.status_code, + "headers": [(name, value) for name, value in response.headers.raw if name.decode("latin-1").lower() not in _RESPONSE_HOP_BY_HOP_HEADERS], + } + ) + async for chunk in response.aiter_bytes(): + if chunk: + await send({"type": "http.response.body", "body": chunk, 
"more_body": True}) + await send({"type": "http.response.body", "body": b"", "more_body": False}) + except httpx.HTTPError as exc: + logger.error("Experimental Rust MCP runtime request failed: %s", exc) + error_response = ORJSONResponse( + status_code=502, + content={ + "jsonrpc": "2.0", + "id": None, + "error": { + "code": -32000, + "message": "Experimental Rust MCP runtime unavailable", + "data": _CLIENT_ERROR_DETAIL, + }, + }, + ) + await error_response(scope, receive, send) + return + + async def _get_runtime_client(self) -> httpx.AsyncClient: + """Return the client used for Python -> Rust runtime proxying. + + Returns: + An async HTTP client configured for either UDS or loopback HTTP. + """ + uds_path = settings.experimental_rust_mcp_runtime_uds + if not uds_path: + return await get_http_client() + + if self._uds_client is not None: + return self._uds_client + + async with self._uds_client_lock: + if self._uds_client is None: + self._uds_client = httpx.AsyncClient( + transport=httpx.AsyncHTTPTransport(uds=uds_path), + limits=get_http_limits(), + timeout=httpx.Timeout(settings.experimental_rust_mcp_runtime_timeout_seconds), + follow_redirects=False, + ) + return self._uds_client + + +async def _stream_request_body(receive: Receive): + """Yield ASGI request body chunks without buffering the full request. + + Args: + receive: ASGI receive callable for the current request. + + Yields: + Raw request body chunks as they arrive from the client. + """ + while True: + message = await receive() + if message["type"] == "http.disconnect": + return + if message["type"] != "http.request": + continue + body = message.get("body", b"") + if body: + yield body + if not message.get("more_body", False): + return + + +def _extract_server_id_from_scope(scope: Scope) -> str | None: + """Extract server_id when the mounted MCP path came from /servers//mcp. + + Args: + scope: Incoming ASGI scope. + + Returns: + The matched server id, or ``None`` when the request is not server-scoped. 
+ """ + modified_path = str(scope.get("modified_path") or scope.get("path") or "") + match = _SERVER_ID_RE.search(modified_path) + return match.group("server_id") if match else None + + +def _build_runtime_mcp_url(scope: Scope) -> str: + """Build the target Rust runtime /mcp URL, preserving the query string. + + Args: + scope: Incoming ASGI scope. + + Returns: + Absolute URL for the Rust sidecar MCP endpoint. + """ + base = urlsplit(settings.experimental_rust_mcp_runtime_url) + query_string = scope.get("query_string", b"") + query = query_string.decode("latin-1") if isinstance(query_string, (bytes, bytearray)) else str(query_string or "") + base_path = base.path.rstrip("/") + if not base_path: + target_path = "/mcp/" + elif base_path.endswith("/mcp"): + target_path = f"{base_path}/" + else: + target_path = f"{base_path}/mcp/" + merged_query = "&".join(part for part in (base.query, query) if part) + return urlunsplit((base.scheme, base.netloc, target_path, merged_query, "")) + + +def _build_forward_headers(scope: Scope) -> list[tuple[str, str]]: + """Forward request headers needed by the Rust runtime while stripping internal-only headers. + + Args: + scope: Incoming ASGI scope. + + Returns: + Header tuples safe to forward to the Rust sidecar. 
+ """ + headers: list[tuple[str, str]] = [] + for item in scope.get("headers") or []: + if not isinstance(item, (tuple, list)) or len(item) != 2: + continue + name, value = item + if not isinstance(name, (bytes, bytearray)) or not isinstance(value, (bytes, bytearray)): + continue + header_name = name.decode("latin-1").lower() + if header_name in _REQUEST_HOP_BY_HOP_HEADERS or header_name in _FORWARDED_CHAIN_HEADERS or header_name in _INTERNAL_ONLY_REQUEST_HEADERS: + continue + headers.append((header_name, value.decode("latin-1"))) + + server_id = _extract_server_id_from_scope(scope) + if server_id: + headers.append((_CONTEXTFORGE_SERVER_ID_HEADER, server_id)) + + auth_context = _build_forwarded_auth_context_header() + if auth_context is not None: + headers.append((_CONTEXTFORGE_AUTH_CONTEXT_HEADER, auth_context)) + + client = scope.get("client") + client_host = client[0] if isinstance(client, (tuple, list)) and client else None + from_loopback = client_host in ("127.0.0.1", "::1") + incoming_headers = { + name.decode("latin-1").lower(): value.decode("latin-1") + for item in scope.get("headers") or [] + if isinstance(item, (tuple, list)) and len(item) == 2 + for name, value in [item] + if isinstance(name, (bytes, bytearray)) and isinstance(value, (bytes, bytearray)) + } + if from_loopback and incoming_headers.get("x-forwarded-internally") == "true": + headers.append((_CONTEXTFORGE_AFFINITY_FORWARDED_HEADER, "rust")) + + return headers + + +def _build_forwarded_auth_context_header() -> str | None: + """Serialize the authenticated MCP context for the trusted internal Python dispatcher. + + Returns: + Base64url-encoded auth context for trusted internal forwarding, or ``None`` + when no MCP auth context is available. 
+ """ + auth_context = get_streamable_http_auth_context() + if not auth_context: + return None + encoded = base64.urlsafe_b64encode(orjson.dumps(auth_context)).decode("ascii") + return encoded.rstrip("=") diff --git a/mcpgateway/transports/streamablehttp_transport.py b/mcpgateway/transports/streamablehttp_transport.py index 0c6a6b3856..d38d4c3a54 100644 --- a/mcpgateway/transports/streamablehttp_transport.py +++ b/mcpgateway/transports/streamablehttp_transport.py @@ -38,6 +38,7 @@ from dataclasses import dataclass import re from typing import Any, AsyncGenerator, Dict, List, Optional, Pattern, Tuple, Union +from urllib.parse import urlsplit, urlunsplit from uuid import uuid4 # Third-Party @@ -64,7 +65,9 @@ from mcpgateway.db import SessionLocal from mcpgateway.middleware.rbac import _ACCESS_DENIED_MSG from mcpgateway.services.completion_service import CompletionService +from mcpgateway.services.http_client_service import get_http_client, get_http_limits from mcpgateway.services.logging_service import LoggingService +from mcpgateway.services.metrics import mcp_auth_cache_events_counter from mcpgateway.services.oauth_manager import OAuthEnforcementUnavailableError, OAuthRequiredError from mcpgateway.services.permission_service import PermissionService from mcpgateway.services.prompt_service import PromptService @@ -79,6 +82,19 @@ logging_service = LoggingService() logger = logging_service.get_logger(__name__) + +def _record_mcp_auth_cache_event(outcome: str) -> None: + """Best-effort Prometheus counter update for MCP auth cache flow. + + Args: + outcome: Cache-flow outcome label to emit. 
+ """ + try: + mcp_auth_cache_events_counter.labels(outcome=outcome).inc() + except Exception: + pass # nosec B110 - Metrics must not break auth flow + + # Precompiled regex for server ID extraction from path _SERVER_ID_RE: Pattern[str] = re.compile(r"/servers/(?P[a-fA-F0-9\-]+)/mcp") @@ -98,6 +114,9 @@ user_context_var: contextvars.ContextVar[dict[str, Any]] = contextvars.ContextVar("user_context", default={}) _oauth_checked_var: contextvars.ContextVar[bool] = contextvars.ContextVar("_oauth_checked", default=False) _shared_session_registry: Optional[Any] = None +_rust_event_store_client: Optional[httpx.AsyncClient] = None +_rust_event_store_client_lock = asyncio.Lock() +_RUST_EVENT_STORE_DEFAULT_KEY_PREFIX = "mcpgw:eventstore" # ------------------------------ Event store ------------------------------ @@ -396,6 +415,128 @@ async def replay_events_after( return last_event.stream_id +class RustEventStore(EventStore): + """Rust-backed event store that delegates resumable stream state to the sidecar.""" + + def __init__(self, max_events_per_stream: int = 100, ttl: int = 3600, key_prefix: str = _RUST_EVENT_STORE_DEFAULT_KEY_PREFIX): + """Initialize the Rust-backed event store wrapper. + + Args: + max_events_per_stream: Maximum number of events retained per stream. + ttl: Event retention time in seconds. + key_prefix: Redis key prefix shared with the Rust sidecar. + """ + self.max_events_per_stream = max_events_per_stream + self.ttl = ttl + self.key_prefix = key_prefix.rstrip(":") + + async def store_event(self, stream_id: StreamId, message: JSONRPCMessage | None) -> EventId: + """Store an event in the Rust-backed resumable event store. + + Args: + stream_id: Stream that owns the event. + message: JSON-RPC payload to persist for replay. + + Returns: + The generated event identifier returned by the Rust sidecar. + + Raises: + RuntimeError: If the Rust sidecar event store is unavailable or returns invalid data. 
+ """ + client = await _get_rust_event_store_client() + message_dict = None if message is None else (message.model_dump() if hasattr(message, "model_dump") else dict(message)) + response = await client.post( + _build_rust_runtime_internal_url("/_internal/event-store/store"), + json={ + "streamId": stream_id, + "message": message_dict, + "keyPrefix": self.key_prefix, + "maxEventsPerStream": self.max_events_per_stream, + "ttlSeconds": self.ttl, + }, + timeout=httpx.Timeout(settings.experimental_rust_mcp_runtime_timeout_seconds), + follow_redirects=False, + ) + response.raise_for_status() + payload = response.json() + event_id = payload.get("eventId") + if not isinstance(event_id, str) or not event_id: + raise RuntimeError("Rust event store returned an invalid eventId") + return event_id + + async def replay_events_after(self, last_event_id: EventId, send_callback: EventCallback) -> Union[StreamId, None]: + """Replay events newer than ``last_event_id`` through the provided callback. + + Args: + last_event_id: Last event acknowledged by the reconnecting client. + send_callback: Callback invoked for each replayed event payload. + + Returns: + The associated stream identifier when replay succeeds, else ``None``. 
+ """ + client = await _get_rust_event_store_client() + response = await client.post( + _build_rust_runtime_internal_url("/_internal/event-store/replay"), + json={ + "lastEventId": last_event_id, + "keyPrefix": self.key_prefix, + }, + timeout=httpx.Timeout(settings.experimental_rust_mcp_runtime_timeout_seconds), + follow_redirects=False, + ) + response.raise_for_status() + payload = response.json() + stream_id = payload.get("streamId") + if not isinstance(stream_id, str) or not stream_id: + return None + for event in payload.get("events", []): + if not isinstance(event, dict): + continue + await send_callback(event.get("message")) + return stream_id + + +async def _get_rust_event_store_client() -> httpx.AsyncClient: + """Return the HTTP client used for Python -> Rust event-store calls. + + Returns: + An async HTTP client configured for Rust event-store access. + """ + global _rust_event_store_client # pylint: disable=global-statement + + uds_path = settings.experimental_rust_mcp_runtime_uds + if not uds_path: + return await get_http_client() + + if _rust_event_store_client is not None: + return _rust_event_store_client + + async with _rust_event_store_client_lock: + if _rust_event_store_client is None: + _rust_event_store_client = httpx.AsyncClient( + transport=httpx.AsyncHTTPTransport(uds=uds_path), + limits=get_http_limits(), + timeout=httpx.Timeout(settings.experimental_rust_mcp_runtime_timeout_seconds), + follow_redirects=False, + ) + return _rust_event_store_client + + +def _build_rust_runtime_internal_url(path: str) -> str: + """Build a Rust sidecar internal URL for UDS or loopback HTTP transport. + + Args: + path: Internal Rust runtime path to append to the configured base URL. + + Returns: + Absolute URL targeting the Rust sidecar over HTTP or UDS-backed transport. 
+ """ + base = urlsplit(settings.experimental_rust_mcp_runtime_url) + base_path = base.path.rstrip("/") + target_path = f"{base_path}{path}" if base_path else path + return urlunsplit((base.scheme, base.netloc, target_path, "", "")) + + # ------------------------------ Streamable HTTP Transport ------------------------------ @@ -655,6 +796,29 @@ def _check_scoped_permission(user_context: dict[str, Any], permission: str) -> b return allowed +def _check_any_team_for_server_scoped_rbac(user_context: dict[str, Any] | None, server_id: str | None) -> bool: + """Return whether Streamable HTTP RBAC should check across team-scoped roles. + + Server-scoped MCP routes (``/servers//mcp``) should authorize team-bound + callers against the specific virtual server context. Session tokens already do + this via ``check_any_team=True`` because they have no single explicit team_id. + Team-scoped API tokens need the same treatment on server-scoped routes; otherwise + they are evaluated only in global scope and incorrectly denied. + + Args: + user_context: Current authenticated MCP user context, if any. + server_id: Effective virtual server identifier for the MCP request. + + Returns: + ``True`` when RBAC should search across the caller's token teams. + """ + if not user_context: + return False + if user_context.get("token_use") == "session": + return True + return bool(server_id) and bool(user_context.get("teams")) + + def set_shared_session_registry(session_registry: Any) -> None: """Set the process-wide session registry used by Streamable HTTP helpers. @@ -723,6 +887,9 @@ async def _validate_streamable_session_access( if not _should_enforce_streamable_rbac(user_context): return True, 200, "" + if isinstance(user_context, dict) and user_context.get("_rust_session_validated") is True: + return True, 200, "" + # Initialize establishes a new session and is authorized separately. 
if (rpc_method or "").strip() == "initialize": return True, 200, "" @@ -996,11 +1163,10 @@ async def call_tool(name: str, arguments: dict) -> Union[ # Layer 2: RBAC check # Session tokens have no explicit team_id; check across all team-scoped roles. # Mirrors the @require_permission decorator's check_any_team fallback (rbac.py:562-576). - _is_session_token = user_context.get("token_use") == "session" has_execute_permission = await _check_streamable_permission( user_context=user_context, permission="tools.execute", - check_any_team=_is_session_token, + check_any_team=_check_any_team_for_server_scoped_rbac(user_context, server_id), ) if not has_execute_permission: raise PermissionError(_ACCESS_DENIED_MSG) @@ -2057,14 +2223,13 @@ async def set_logging_level(level: types.LoggingLevel) -> types.EmptyResult: if _should_enforce_streamable_rbac(user_context): # Layer 1: Token scope cap - # MCP logging/setLevel is a standard MCP capability invoked by clients during - # initialization; servers.use (not admin.system_config) keeps the handshake working. 
- if not _check_scoped_permission(user_context, "servers.use"): + if not _check_scoped_permission(user_context, "admin.system_config"): raise PermissionError(_ACCESS_DENIED_MSG) # Layer 2: RBAC check has_permission = await _check_streamable_permission( user_context=user_context, - permission="servers.use", + permission="admin.system_config", + check_any_team=_check_any_team_for_server_scoped_rbac(user_context, server_id), ) if not has_permission: raise PermissionError(_ACCESS_DENIED_MSG) @@ -2229,8 +2394,14 @@ def __init__(self) -> None: """ if settings.use_stateful_sessions: + if settings.experimental_rust_mcp_runtime_enabled and settings.experimental_rust_mcp_session_auth_reuse_enabled and settings.experimental_rust_mcp_event_store_enabled: + event_store = RustEventStore( + max_events_per_stream=settings.streamable_http_max_events_per_stream, + ttl=settings.streamable_http_event_ttl, + ) + logger.debug("Using RustEventStore for stateful sessions") # Use Redis event store for single-worker stateful deployments - if settings.cache_type == "redis" and settings.redis_url: + elif settings.cache_type == "redis" and settings.redis_url: event_store = RedisEventStore(max_events_per_stream=settings.streamable_http_max_events_per_stream, ttl=settings.streamable_http_event_ttl) logger.debug("Using RedisEventStore for stateful sessions (single-worker)") else: @@ -2361,11 +2532,11 @@ async def handle_streamable_http(self, scope: Scope, receive: Receive, send: Sen # This mirrors /servers/{id}/sse and /servers/{id}/message guards. 
user_context = user_context_var.get() if match and _should_enforce_streamable_rbac(user_context): - _is_session = user_context.get("token_use") == "session" if user_context else False + _server_id = match.group("server_id") has_server_access = await _check_streamable_permission( user_context=user_context, permission="servers.use", - check_any_team=_is_session, + check_any_team=_check_any_team_for_server_scoped_rbac(user_context, _server_id), ) if not has_server_access: response = ORJSONResponse( @@ -2766,10 +2937,47 @@ def _set_proxy_user_context(proxy_user: str) -> None: "teams": [], "is_authenticated": True, "is_admin": False, + "permission_is_admin": False, } ) +def get_streamable_http_auth_context() -> dict[str, Any]: + """Return the current StreamableHTTP auth context for trusted internal forwarding. + + The Rust MCP proxy uses this to carry already-authenticated MCP request context + across the Python -> Rust -> Python seam so the internal dispatcher does not + need to repeat JWT verification and team normalization on the hot path. + + Returns: + A shallow copy of the trusted auth context fields that may be forwarded + across the internal MCP seam. + """ + user_context = user_context_var.get() + if not isinstance(user_context, dict): + return {} + + forwarded: dict[str, Any] = {} + for key in ( + "email", + "teams", + "is_authenticated", + "is_admin", + "token_use", + "permission_is_admin", + "scoped_permissions", + "scoped_server_id", + ): + if key not in user_context: + continue + value = user_context[key] + if isinstance(value, list): + forwarded[key] = list(value) + else: + forwarded[key] = value + return forwarded + + class _StreamableHttpAuthHandler: """Per-request handler that authenticates MCP StreamableHTTP requests. 
@@ -2901,6 +3109,7 @@ async def _auth_no_token(self, *, path: str, bearer_header_supplied: bool) -> bo "teams": [], # Empty list = public-only access "is_authenticated": False, "is_admin": False, + "permission_is_admin": False, } ) return True # Allow request to proceed with public-only access @@ -2920,23 +3129,109 @@ async def _auth_jwt(self, *, token: str) -> bool: if not isinstance(user_payload, dict): return True - jti = user_payload.get("jti") - if jti: - # First-Party - from mcpgateway.auth import _check_token_revoked_sync # pylint: disable=import-outside-toplevel + # First-Party + from mcpgateway.auth import _get_auth_context_batched_sync # pylint: disable=import-outside-toplevel + from mcpgateway.cache.auth_cache import CachedAuthContext, get_auth_cache # pylint: disable=import-outside-toplevel + jti = user_payload.get("jti") + user_email = user_payload.get("sub") or user_payload.get("email") + nested_user = user_payload.get("user", {}) + nested_is_admin = nested_user.get("is_admin", False) if isinstance(nested_user, dict) else False + is_admin = user_payload.get("is_admin", False) or nested_is_admin + token_use = user_payload.get("token_use") + db_user_is_admin = False + user_record = None + auth_cache = get_auth_cache() if settings.auth_cache_enabled else None + cached_ctx: CachedAuthContext | None = None + batched_auth_ctx: dict[str, Any] | None = None + cached_team_ids: list[str] | None = None + platform_admin_email = getattr(settings, "platform_admin_email", "admin@example.com") + + if user_email and auth_cache is not None: try: - is_revoked = await asyncio.to_thread(_check_token_revoked_sync, jti) - except Exception as exc: - logger.warning("MCP token revocation check failed for jti=%s; allowing request (fail-open): %s", jti, exc) - is_revoked = False - if is_revoked: - return await self._send_error(detail="Token has been revoked", headers={"WWW-Authenticate": "Bearer"}) + cached_ctx = await auth_cache.get_auth_context(user_email, jti) + if cached_ctx 
is not None: + _record_mcp_auth_cache_event("auth_context_hit") + if cached_ctx.is_token_revoked: + _record_mcp_auth_cache_event("auth_context_hit_revoked") + return await self._send_error(detail="Token has been revoked", headers={"WWW-Authenticate": "Bearer"}) + + cached_user = cached_ctx.user + if cached_user and not cached_user.get("is_active", True): + _record_mcp_auth_cache_event("auth_context_hit_inactive") + return await self._send_error(detail="Account disabled", headers={"WWW-Authenticate": "Bearer"}) + + if cached_user: + db_user_is_admin = bool(cached_user.get("is_admin", False)) + elif settings.require_user_in_db and user_email != platform_admin_email: + return await self._send_error(detail="User not found in database", headers={"WWW-Authenticate": "Bearer"}) + + if token_use == "session" and not is_admin: # nosec B105 - token_use is a JWT claim type, not a password + cached_team_ids = await auth_cache.get_user_teams(f"{user_email}:True") + if cached_team_ids is not None: + _record_mcp_auth_cache_event("teams_cache_hit") + else: + _record_mcp_auth_cache_event("auth_context_miss") + except HTTPException: + raise + except Exception as cache_error: + _record_mcp_auth_cache_event("auth_context_cache_error") + logger.debug("MCP auth cache lookup failed for %s: %s", user_email, cache_error) + cached_ctx = None + + if user_email and cached_ctx is None and settings.auth_cache_batch_queries: + try: + batched_auth_ctx = await asyncio.to_thread(_get_auth_context_batched_sync, user_email, jti) + _record_mcp_auth_cache_event("auth_context_batch_hit") + if batched_auth_ctx.get("is_token_revoked", False): + _record_mcp_auth_cache_event("auth_context_batch_revoked") + return await self._send_error(detail="Token has been revoked", headers={"WWW-Authenticate": "Bearer"}) + + cached_user = batched_auth_ctx.get("user") + if cached_user and not cached_user.get("is_active", True): + _record_mcp_auth_cache_event("auth_context_batch_inactive") + return await 
self._send_error(detail="Account disabled", headers={"WWW-Authenticate": "Bearer"}) - user_email = user_payload.get("sub") or user_payload.get("email") - if user_email: + if cached_user: + db_user_is_admin = bool(cached_user.get("is_admin", False)) + elif settings.require_user_in_db and user_email != platform_admin_email: + return await self._send_error(detail="User not found in database", headers={"WWW-Authenticate": "Bearer"}) + + if auth_cache is not None: + await auth_cache.set_auth_context( + user_email, + jti, + CachedAuthContext( + user=cached_user, + personal_team_id=batched_auth_ctx.get("personal_team_id"), + is_token_revoked=bool(batched_auth_ctx.get("is_token_revoked", False)), + ), + ) + if token_use == "session" and not is_admin: # nosec B105 - token_use is a JWT claim type, not a password + cached_team_ids = list(batched_auth_ctx.get("team_ids") or []) + await auth_cache.set_user_teams(f"{user_email}:True", cached_team_ids) + _record_mcp_auth_cache_event("teams_batch_hit") + except HTTPException: + raise + except Exception as batch_error: + _record_mcp_auth_cache_event("auth_context_batch_error") + logger.warning("Batched MCP auth lookup failed for user=%s; falling back to individual checks: %s", user_email, batch_error) + batched_auth_ctx = None + + if user_email and cached_ctx is None and batched_auth_ctx is None: + _record_mcp_auth_cache_event("auth_context_fallback") # First-Party - from mcpgateway.auth import _get_user_by_email_sync # pylint: disable=import-outside-toplevel + from mcpgateway.auth import _check_token_revoked_sync, _get_user_by_email_sync # pylint: disable=import-outside-toplevel + + is_revoked = False + if jti: + try: + is_revoked = await asyncio.to_thread(_check_token_revoked_sync, jti) + except Exception as exc: + logger.warning("MCP token revocation check failed for jti=%s; allowing request (fail-open): %s", jti, exc) + is_revoked = False + if is_revoked: + return await self._send_error(detail="Token has been revoked", 
headers={"WWW-Authenticate": "Bearer"}) user_lookup_succeeded = True try: @@ -2949,23 +3244,61 @@ async def _auth_jwt(self, *, token: str) -> bool: if user_lookup_succeeded: if user_record and not getattr(user_record, "is_active", True): return await self._send_error(detail="Account disabled", headers={"WWW-Authenticate": "Bearer"}) - if user_record is None and settings.require_user_in_db and user_email != getattr(settings, "platform_admin_email", "admin@example.com"): + if user_record: + db_user_is_admin = bool(getattr(user_record, "is_admin", False)) + if user_record is None and settings.require_user_in_db and user_email != platform_admin_email: return await self._send_error(detail="User not found in database", headers={"WWW-Authenticate": "Bearer"}) - # Resolve teams based on token_use claim - token_use = user_payload.get("token_use") + if auth_cache is not None: + try: + await auth_cache.set_auth_context( + user_email, + jti, + CachedAuthContext( + user=( + { + "email": user_record.email, + "password_hash": user_record.password_hash, + "full_name": user_record.full_name, + "is_admin": bool(user_record.is_admin), + "is_active": bool(user_record.is_active), + "auth_provider": user_record.auth_provider, + "password_change_required": bool(user_record.password_change_required), + "email_verified_at": user_record.email_verified_at, + "created_at": user_record.created_at, + "updated_at": user_record.updated_at, + } + if user_record is not None + else None + ), + personal_team_id=None, + is_token_revoked=is_revoked, + ), + ) + except Exception as cache_set_error: + logger.debug("Failed to cache MCP auth context for %s: %s", user_email, cache_set_error) + if token_use == "session": # nosec B105 - Not a password; token_use is a JWT claim type # Session token: resolve teams from DB/cache - user_email_for_teams = user_payload.get("sub") or user_payload.get("email") - is_admin_flag = user_payload.get("is_admin", False) or user_payload.get("user", {}).get("is_admin", False) 
- if is_admin_flag: + if is_admin: final_teams = None # Admin bypass - elif user_email_for_teams: - # Resolve teams synchronously with L1 cache (StreamableHTTP uses sync context) - # First-Party - from mcpgateway.auth import _resolve_teams_from_db_sync # pylint: disable=import-outside-toplevel - - final_teams = _resolve_teams_from_db_sync(user_email_for_teams, is_admin=False) + elif user_email: + if cached_team_ids is not None: + final_teams = cached_team_ids + elif batched_auth_ctx is not None: + final_teams = list(batched_auth_ctx.get("team_ids") or []) + else: + _record_mcp_auth_cache_event("teams_db_resolve") + # Resolve teams synchronously with L1 cache (StreamableHTTP uses sync context) + # First-Party + from mcpgateway.auth import _resolve_teams_from_db_sync # pylint: disable=import-outside-toplevel + + final_teams = _resolve_teams_from_db_sync(user_email, is_admin=False) + if auth_cache is not None and final_teams is not None: + try: + await auth_cache.set_user_teams(f"{user_email}:True", final_teams) + except Exception as cache_set_error: + logger.debug("Failed to cache MCP teams list for %s: %s", user_email, cache_set_error) else: final_teams = [] # No email — public-only else: @@ -2979,8 +3312,6 @@ async def _auth_jwt(self, *, token: str) -> bool: # SECURITY: Validate team membership for team-scoped tokens # Users removed from a team should lose MCP access immediately, not at token expiry # ═══════════════════════════════════════════════════════════════════════════ - is_admin = user_payload.get("is_admin", False) or user_payload.get("user", {}).get("is_admin", False) - # Only validate membership for team-scoped tokens (non-empty teams list) # Skip for: public-only tokens ([]), admin unrestricted tokens (None) if final_teams and len(final_teams) > 0 and user_email: @@ -2997,10 +3328,12 @@ async def _auth_jwt(self, *, token: str) -> bool: # Check cache first (60s TTL) cached_result = auth_cache.get_team_membership_valid_sync(user_email, final_teams) if 
cached_result is False: + _record_mcp_auth_cache_event("team_membership_cache_reject") logger.warning("MCP auth rejected: User %s no longer member of teams (cached)", user_email) return await self._send_error(detail="Token invalid: User is no longer a member of the associated team", status_code=HTTP_403_FORBIDDEN) if cached_result is None: + _record_mcp_auth_cache_event("team_membership_cache_miss") # Cache miss - query database with SessionLocal() as db: memberships = ( @@ -3025,12 +3358,15 @@ async def _auth_jwt(self, *, token: str) -> bool: # Cache positive result auth_cache.set_team_membership_valid_sync(user_email, final_teams, True) + else: + _record_mcp_auth_cache_event("team_membership_cache_hit") auth_user_ctx: dict[str, Any] = { "email": user_email, "teams": final_teams, "is_authenticated": True, "is_admin": is_admin, + "permission_is_admin": db_user_is_admin or is_admin, "token_use": token_use, # propagated for downstream RBAC (check_any_team) } # Extract scoped permissions from JWT for per-method enforcement @@ -3038,6 +3374,9 @@ async def _auth_jwt(self, *, token: str) -> bool: jwt_scoped_perms = jwt_scopes.get("permissions") or [] if isinstance(jwt_scopes, dict) else [] if jwt_scoped_perms: auth_user_ctx["scoped_permissions"] = jwt_scoped_perms + scoped_server_id = jwt_scopes.get("server_id") if isinstance(jwt_scopes, dict) else None + if isinstance(scoped_server_id, str) and scoped_server_id: + auth_user_ctx["scoped_server_id"] = scoped_server_id user_context_var.set(auth_user_ctx) except HTTPException: # JWT verification failed (expired, malformed, bad signature, etc.) diff --git a/mcpgateway/version.py b/mcpgateway/version.py index dd6e670bfe..9dee323947 100644 --- a/mcpgateway/version.py +++ b/mcpgateway/version.py @@ -103,6 +103,314 @@ router = APIRouter(tags=["meta"]) +def _env_flag(name: str, default: bool = False) -> bool: + """Read a boolean environment variable using common truthy spellings. + + Args: + name: Environment variable name. 
+ default: Default value used when the variable is unset. + + Returns: + Parsed boolean value. + """ + value = os.getenv(name) + if value is None: + return default + return value.strip().lower() in {"1", "true", "yes", "on"} + + +def _rust_build_included() -> bool: + """Return whether the current image includes Rust MCP artifacts. + + Returns: + ``True`` when the current image contains the Rust MCP binaries/plugins. + """ + return _env_flag("CONTEXTFORGE_ENABLE_RUST_BUILD", default=False) + + +def _rust_runtime_managed() -> bool: + """Return whether the gateway expects to manage the Rust MCP sidecar locally. + + Returns: + ``True`` when the gateway should launch and supervise the Rust sidecar. + """ + return _env_flag("EXPERIMENTAL_RUST_MCP_RUNTIME_MANAGED", default=True) + + +def _current_mcp_transport_mount() -> str: + """Return which public ``/mcp`` transport is currently mounted. + + Returns: + Runtime label identifying the currently mounted public MCP transport. + """ + return "rust" if _should_mount_public_rust_transport() else "python" + + +def _should_mount_public_rust_transport() -> bool: + """Return whether public ``/mcp`` should be served directly by Rust. + + Returns: + ``True`` only when the Rust runtime is enabled and Rust can safely own + steady-state public MCP session traffic. + """ + return bool(settings.experimental_rust_mcp_runtime_enabled and settings.experimental_rust_mcp_session_auth_reuse_enabled) + + +def _should_use_rust_public_session_stack() -> bool: + """Return whether Rust should own the effective public MCP session stack. + + Returns: + ``True`` only when the public MCP transport and session semantics should + stay on the Rust-backed path. + """ + return _should_mount_public_rust_transport() + + +def _current_mcp_runtime_mode() -> str: + """Return the current MCP runtime mode label used for health and UI surfaces. + + Returns: + Human-readable runtime mode label for diagnostics and UI reporting. 
+ """ + if settings.experimental_rust_mcp_runtime_enabled: + return "rust-managed" if _rust_runtime_managed() else "rust-external" + if _rust_build_included(): + return "python-rust-built-disabled" + return "python" + + +def _current_mcp_session_core_mode() -> str: + """Return which runtime currently owns MCP session metadata. + + Returns: + ``"rust"`` when the Rust session core is enabled, otherwise ``"python"``. + """ + if _should_use_rust_public_session_stack() and settings.experimental_rust_mcp_session_core_enabled: + return "rust" + return "python" + + +def _current_mcp_event_store_mode() -> str: + """Return which runtime currently owns MCP resumable event-store semantics. + + Returns: + ``"rust"`` when the Rust event store is enabled, otherwise ``"python"``. + """ + if _should_use_rust_public_session_stack() and settings.experimental_rust_mcp_event_store_enabled: + return "rust" + return "python" + + +def _current_mcp_resume_core_mode() -> str: + """Return which runtime currently owns public MCP replay/resume behavior. + + Returns: + ``"rust"`` when Rust owns replay/resume, otherwise ``"python"``. + """ + if ( + _should_use_rust_public_session_stack() + and settings.experimental_rust_mcp_session_core_enabled + and settings.experimental_rust_mcp_event_store_enabled + and settings.experimental_rust_mcp_resume_core_enabled + ): + return "rust" + return "python" + + +def _current_mcp_live_stream_core_mode() -> str: + """Return which runtime currently owns non-resume public GET ``/mcp`` SSE behavior. + + Returns: + ``"rust"`` when Rust owns live GET ``/mcp`` streaming, otherwise ``"python"``. + """ + if _should_use_rust_public_session_stack() and settings.experimental_rust_mcp_live_stream_core_enabled: + return "rust" + return "python" + + +def _current_mcp_affinity_core_mode() -> str: + """Return which runtime currently owns MCP multi-worker session-affinity forwarding. + + Returns: + ``"rust"`` when Rust owns session-affinity forwarding, otherwise ``"python"``. 
+ """ + if _should_use_rust_public_session_stack() and settings.experimental_rust_mcp_affinity_core_enabled: + return "rust" + return "python" + + +def _current_mcp_session_auth_reuse_mode() -> str: + """Return which runtime currently owns MCP session-bound auth-context reuse. + + Returns: + ``"rust"`` when Rust session auth reuse is enabled, otherwise ``"python"``. + """ + if settings.experimental_rust_mcp_runtime_enabled and settings.experimental_rust_mcp_session_auth_reuse_enabled: + return "rust" + return "python" + + +def _mcp_runtime_status_payload() -> Dict[str, Any]: + """Return MCP runtime diagnostics for health, UI, and version surfaces. + + Returns: + Diagnostic payload describing the active MCP runtime configuration. + """ + payload: Dict[str, Any] = { + "mode": _current_mcp_runtime_mode(), + "mounted": _current_mcp_transport_mount(), + "rust_build_included": _rust_build_included(), + "rust_runtime_enabled": settings.experimental_rust_mcp_runtime_enabled, + "session_core_mode": _current_mcp_session_core_mode(), + "event_store_mode": _current_mcp_event_store_mode(), + "resume_core_mode": _current_mcp_resume_core_mode(), + "live_stream_core_mode": _current_mcp_live_stream_core_mode(), + "affinity_core_mode": _current_mcp_affinity_core_mode(), + "session_auth_reuse_mode": _current_mcp_session_auth_reuse_mode(), + "rust_session_core_enabled": bool(_should_use_rust_public_session_stack() and settings.experimental_rust_mcp_session_core_enabled), + "rust_event_store_enabled": bool(_should_use_rust_public_session_stack() and settings.experimental_rust_mcp_event_store_enabled), + "rust_resume_core_enabled": bool( + _should_use_rust_public_session_stack() + and settings.experimental_rust_mcp_session_core_enabled + and settings.experimental_rust_mcp_event_store_enabled + and settings.experimental_rust_mcp_resume_core_enabled + ), + "rust_live_stream_core_enabled": bool(_should_use_rust_public_session_stack() and 
settings.experimental_rust_mcp_live_stream_core_enabled), + "rust_affinity_core_enabled": bool(_should_use_rust_public_session_stack() and settings.experimental_rust_mcp_affinity_core_enabled), + "rust_session_auth_reuse_enabled": bool(settings.experimental_rust_mcp_runtime_enabled and settings.experimental_rust_mcp_session_auth_reuse_enabled), + } + + if settings.experimental_rust_mcp_runtime_enabled: + payload["rust_runtime_managed"] = _rust_runtime_managed() + if settings.experimental_rust_mcp_runtime_uds: + payload["sidecar_transport"] = "uds" + payload["sidecar_target"] = settings.experimental_rust_mcp_runtime_uds + else: + payload["sidecar_transport"] = "http" + payload["sidecar_target"] = settings.experimental_rust_mcp_runtime_url + + return payload + + +def rust_build_included() -> bool: + """Return whether the current image includes Rust MCP artifacts. + + Returns: + ``True`` when the current image contains the Rust MCP binaries/plugins. + """ + return _rust_build_included() + + +def rust_runtime_managed() -> bool: + """Return whether the gateway expects to manage the Rust MCP sidecar locally. + + Returns: + ``True`` when the gateway should launch and supervise the Rust sidecar. + """ + return _rust_runtime_managed() + + +def current_mcp_transport_mount() -> str: + """Return which public ``/mcp`` transport is currently mounted. + + Returns: + Runtime label identifying the currently mounted public MCP transport. + """ + return _current_mcp_transport_mount() + + +def should_mount_public_rust_transport() -> bool: + """Return whether public ``/mcp`` should be served directly by Rust. + + Returns: + ``True`` only when the Rust runtime is enabled and Rust can safely own + steady-state public MCP session traffic. + """ + return _should_mount_public_rust_transport() + + +def should_use_rust_public_session_stack() -> bool: + """Return whether Rust should own the effective public MCP session stack. 
+ + Returns: + ``True`` only when the public MCP transport and session semantics should + stay on the Rust-backed path. + """ + return _should_use_rust_public_session_stack() + + +def current_mcp_runtime_mode() -> str: + """Return the current MCP runtime mode label used for health and UI surfaces. + + Returns: + Human-readable runtime mode label for diagnostics and UI reporting. + """ + return _current_mcp_runtime_mode() + + +def current_mcp_session_core_mode() -> str: + """Return which runtime currently owns MCP session metadata. + + Returns: + ``"rust"`` when the Rust session core is enabled, otherwise ``"python"``. + """ + return _current_mcp_session_core_mode() + + +def current_mcp_event_store_mode() -> str: + """Return which runtime currently owns MCP resumable event-store semantics. + + Returns: + ``"rust"`` when the Rust event store is enabled, otherwise ``"python"``. + """ + return _current_mcp_event_store_mode() + + +def current_mcp_resume_core_mode() -> str: + """Return which runtime currently owns public MCP replay/resume behavior. + + Returns: + ``"rust"`` when Rust owns replay/resume, otherwise ``"python"``. + """ + return _current_mcp_resume_core_mode() + + +def current_mcp_live_stream_core_mode() -> str: + """Return which runtime currently owns non-resume public GET ``/mcp`` SSE behavior. + + Returns: + ``"rust"`` when Rust owns live GET ``/mcp`` streaming, otherwise ``"python"``. + """ + return _current_mcp_live_stream_core_mode() + + +def current_mcp_affinity_core_mode() -> str: + """Return which runtime currently owns MCP multi-worker session-affinity forwarding. + + Returns: + ``"rust"`` when Rust owns session-affinity forwarding, otherwise ``"python"``. + """ + return _current_mcp_affinity_core_mode() + + +def current_mcp_session_auth_reuse_mode() -> str: + """Return which runtime currently owns MCP session-bound auth-context reuse. + + Returns: + ``"rust"`` when Rust session auth reuse is enabled, otherwise ``"python"``. 
+ """ + return _current_mcp_session_auth_reuse_mode() + + +def mcp_runtime_status_payload() -> Dict[str, Any]: + """Return MCP runtime diagnostics for health, UI, and version surfaces. + + Returns: + Diagnostic payload describing the active MCP runtime configuration. + """ + return _mcp_runtime_status_payload() + + def _is_secret(key: str) -> bool: """Identify if an environment variable key likely represents a secret. @@ -563,6 +871,7 @@ def _build_payload( "metrics_cleanup_enabled": getattr(settings, "metrics_cleanup_enabled", True), "metrics_rollup_enabled": getattr(settings, "metrics_rollup_enabled", True), }, + "mcp_runtime": _mcp_runtime_status_payload(), "env": _public_env(), "system": _system_metrics(), } @@ -629,6 +938,7 @@ def _render_html(payload: Dict[str, Any]) -> str: ... "database": {"dialect": "sqlite", "reachable": True}, ... "redis": {"available": False}, ... "settings": {"cache_type": "memory"}, + ... "mcp_runtime": {"mode": "python", "mounted": "python"}, ... "system": {"cpu_count": 4}, ... "env": {"PATH": "/usr/bin"} ... } @@ -646,6 +956,8 @@ def _render_html(payload: Dict[str, Any]) -> str: True >>> '
<h2>Database</h2>' in html
    True
+    >>> '<h2>MCP Runtime</h2>' in html
+    True
    >>> '