NVIDIA
diff --git a/‎.agents/skills/nemoclaw-user-monitor-sandbox/SKILL.md‎
Lines changed: 32 additions & 0 deletions b/‎.agents/skills/nemoclaw-user-monitor-sandbox/SKILL.md‎
Lines changed: 32 additions & 0 deletions
diff --git a/‎nemoclaw/src/blueprint/runner-metrics.test.ts‎
Lines changed: 165 additions & 0 deletions b/‎nemoclaw/src/blueprint/runner-metrics.test.ts‎
Lines changed: 165 additions & 0 deletions
diff --git a/‎nemoclaw/src/blueprint/runner.test.ts‎
Lines changed: 1 addition & 0 deletions b/‎nemoclaw/src/blueprint/runner.test.ts‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎nemoclaw/src/blueprint/runner.ts‎
Lines changed: 41 additions & 9 deletions b/‎nemoclaw/src/blueprint/runner.ts‎
Lines changed: 41 additions & 9 deletions
diff --git a/‎nemoclaw/src/index.ts‎
Lines changed: 39 additions & 1 deletion b/‎nemoclaw/src/index.ts‎
Lines changed: 39 additions & 1 deletion
@@ -79,6 +79,38 @@ openshell sandbox download <name> /sandbox/.openclaw/agents/main/sessions/<sessi
 Treat exported session logs as sensitive data.
 They can contain prompts, tool inputs, tool outputs, file paths, and cost metadata from the agent run.
 
+## Export Prometheus Metrics
+
+NemoClaw can expose lightweight Prometheus-format metrics for blueprint execution, API validation, and sandbox lifecycle operations.
+Metrics are disabled by default.
+
+Set the following environment variable before starting the OpenClaw process that loads the NemoClaw plugin:
+
+```bash
+export NEMOCLAW_METRICS_ENABLED=true
+```
+
+The metrics endpoint listens on `127.0.0.1:9090` by default:
+
+```bash
+curl http://127.0.0.1:9090/metrics
+```
+
+Warning: the `/metrics` endpoint is unauthenticated.
+If `NEMOCLAW_METRICS_HOST` is set to a non-loopback address, any host or network that can reach that address on `NEMOCLAW_METRICS_PORT` can scrape operational metadata about blueprint execution, API validation, and sandbox lifecycle activity from `/metrics`.
+Prefer scraping over a secured network, restrict access with firewall rules, or keep `NEMOCLAW_METRICS_HOST` bound to loopback and expose `/metrics` through a secured proxy.
+
+Use `NEMOCLAW_METRICS_PORT` to select another port, or `NEMOCLAW_METRICS_HOST` to bind to a different interface when your deployment needs remote scraping.
+The endpoint serves only `/metrics`; other paths return `404`.
+
+Example samples from the exposed metric families:
+
+```text
+blueprint_execution_total{action="apply",status="success"} 1
+api_validation_total{kind="endpoint_url",source="blueprint",status="success"} 1
+sandbox_lifecycle_total{operation="create",status="success"} 1
+```
+
 ## Monitor Network Activity in the TUI
 
 Open the OpenShell terminal UI for a live view of sandbox network activity and egress requests:
 
@@ -0,0 +1,165 @@
+// SPDX-FileCopyrightText: Copyright (c) 2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+// SPDX-License-Identifier: Apache-2.0
+
+import { afterEach, beforeEach, describe, expect, it, vi } from "vitest";
+import type fs from "node:fs";
+
+interface FsEntry {
+  type: "file" | "dir";
+  content?: string;
+}
+
+const store = new Map<string, FsEntry>();
+const mockExeca = vi.fn();
+
+vi.mock("node:os", () => ({
+  homedir: () => "/fakehome",
+}));
+
+vi.mock("node:crypto", () => ({
+  randomUUID: () => "aaaaaaaa-bbbb-cccc-dddd-eeeeeeeeeeee",
+}));
+
+vi.mock("node:fs", async (importOriginal) => {
+  const original = await importOriginal<typeof fs>();
+  return {
+    ...original,
+    existsSync: (p: string) => store.has(p),
+    mkdirSync: vi.fn((p: string) => {
+      store.set(p, { type: "dir" });
+    }),
+    readFileSync: (p: string) => {
+      const entry = store.get(p);
+      if (entry?.type !== "file") {
+        throw new Error(`ENOENT: ${p}`);
+      }
+      return entry.content ?? "";
+    },
+    writeFileSync: vi.fn((p: string, data: string) => {
+      store.set(p, { type: "file", content: data });
+    }),
+    readdirSync: (p: string) => {
+      const prefix = p.endsWith("/") ? p : `${p}/`;
+      const entries = new Set<string>();
+      for (const key of store.keys()) {
+        if (key.startsWith(prefix)) {
+          const [first] = key.slice(prefix.length).split("/");
+          if (first) {
+            entries.add(first);
+          }
+        }
+      }
+      if (entries.size === 0 && !store.has(p)) {
+        throw new Error(`ENOENT: ${p}`);
+      }
+      return [...entries].sort();
+    },
+  };
+});
+
+vi.mock("execa", () => ({
+  execa: (...args: unknown[]) => mockExeca(...args),
+}));
+
+vi.mock("./ssrf.js", () => ({
+  validateEndpointUrl: vi.fn(async (url: string) => ({ url, pinnedUrl: url })),
+}));
+
+const { validateEndpointUrl } = await import("./ssrf.js");
+const mockedValidateEndpoint = vi.mocked(validateEndpointUrl);
+const { metrics } = await import("../observability/metrics.js");
+const { actionApply, actionPlan } = await import("./runner.js");
+
+const stdoutChunks: string[] = [];
+
+function captureStdout(): void {
+  vi.spyOn(process.stdout, "write").mockImplementation((chunk: string | Uint8Array) => {
+    stdoutChunks.push(String(chunk));
+    return true;
+  });
+}
+
+function minimalBlueprint(): Record<string, unknown> {
+  return {
+    version: "1.0",
+    components: {
+      inference: {
+        profiles: {
+          default: {
+            provider_type: "openai",
+            provider_name: "my-provider",
+            endpoint: "https://api.example.com/v1",
+            model: "gpt-4",
+            credential_env: "MY_API_KEY",
+          },
+        },
+      },
+      sandbox: {
+        image: "openclaw",
+        name: "test-sandbox",
+        forward_ports: [18789],
+      },
+      policy: { additions: {} },
+    },
+  };
+}
+
+describe("runner metrics", () => {
+  beforeEach(() => {
+    store.clear();
+    stdoutChunks.length = 0;
+    vi.clearAllMocks();
+    process.env.NEMOCLAW_METRICS_ENABLED = "true";
+    metrics.reset();
+  });
+
+  afterEach(() => {
+    vi.restoreAllMocks();
+    metrics.reset();
+    delete process.env.NEMOCLAW_METRICS_ENABLED;
+  });
+
+  it("records blueprint and endpoint validation metrics for successful plans", async () => {
+    captureStdout();
+    mockExeca.mockResolvedValue({ exitCode: 0 });
+
+    await actionPlan("default", minimalBlueprint());
+
+    const output = metrics.renderPrometheus();
+    expect(output).toContain('blueprint_execution_total{action="plan",status="success"} 1');
+    expect(output).toContain(
+      'blueprint_execution_duration_seconds_count{action="plan",status="success"} 1',
+    );
+    expect(output).toContain(
+      'api_validation_total{kind="endpoint_url",source="blueprint",status="success"} 1',
+    );
+  });
+
+  it("records blueprint and endpoint validation metrics for failed plans", async () => {
+    captureStdout();
+    mockExeca.mockResolvedValue({ exitCode: 0 });
+    mockedValidateEndpoint.mockRejectedValueOnce(new Error("SSRF blocked"));
+
+    await expect(actionPlan("default", minimalBlueprint())).rejects.toThrow("SSRF blocked");
+
+    const output = metrics.renderPrometheus();
+    expect(output).toContain('blueprint_execution_total{action="plan",status="error"} 1');
+    expect(output).toContain(
+      'api_validation_total{kind="endpoint_url",source="blueprint",status="error"} 1',
+    );
+  });
+
+  it("records sandbox lifecycle metrics during apply", async () => {
+    captureStdout();
+    mockExeca.mockResolvedValue({ exitCode: 0, stdout: "", stderr: "" });
+
+    await actionApply("default", minimalBlueprint());
+
+    const output = metrics.renderPrometheus();
+    expect(output).toContain('blueprint_execution_total{action="apply",status="success"} 1');
+    expect(output).toContain('sandbox_lifecycle_total{operation="create",status="success"} 1');
+    expect(output).toContain(
+      'sandbox_lifecycle_duration_seconds_count{operation="create",status="success"} 1',
+    );
+  });
+});
@@ -620,6 +620,7 @@ describe("runner", () => {
       expect(plan.router.enabled).toBe(false);
       expect(plan.router.port).toBe(4000);
     });
+
   });
 
   describe("actionApply", () => {
 
@@ -20,6 +20,7 @@ import { join, sep } from "node:path";
 import { execa } from "execa";
 import YAML from "yaml";
 
+import { metrics } from "../observability/metrics.js";
 import { validateEndpointUrl } from "./ssrf.js";
 import { buildSubprocessEnv } from "../lib/subprocess-env.js";
 import { DASHBOARD_PORT } from "../lib/ports.js";
@@ -409,6 +410,15 @@ async function openshellAvailable(): Promise<boolean> {
   return result.exitCode === 0;
 }
 
+async function validateEndpointForMetrics(
+  endpointUrl: string,
+  source: "override" | "blueprint",
+): ReturnType<typeof validateEndpointUrl> {
+  return await metrics.observeOperation("api_validation", { kind: "endpoint_url", source }, () =>
+    validateEndpointUrl(endpointUrl),
+  );
+}
+
 /**
  * Resolve inference config and sandbox config from a blueprint, applying
  * endpoint URL override and SSRF validation if provided.
@@ -431,7 +441,7 @@ async function resolveRunConfig(
 
   let inferenceCfg = { ...inferenceProfiles[profile] };
   if (endpointUrl) {
-    const validated = await validateEndpointUrl(endpointUrl);
+    const validated = await validateEndpointForMetrics(endpointUrl, "override");
     // Use DNS-pinned URL for HTTP (full SSRF/rebinding protection). For HTTPS,
     // keep the original hostname — TLS certificate validation prevents rebinding
     // since the attacker cannot present a valid cert for the target.
@@ -441,7 +451,7 @@ async function resolveRunConfig(
 
   // Validate the final endpoint (whether from CLI override or blueprint profile)
   if (inferenceCfg.endpoint) {
-    const validated = await validateEndpointUrl(inferenceCfg.endpoint);
+    const validated = await validateEndpointForMetrics(inferenceCfg.endpoint, "blueprint");
     const safe = inferenceCfg.endpoint.startsWith("https:") ? validated.url : validated.pinnedUrl;
     inferenceCfg = { ...inferenceCfg, endpoint: safe };
   }
@@ -655,6 +665,16 @@ export async function actionPlan(
   profile: string,
   blueprint: Blueprint,
   options?: { dryRun?: boolean; endpointUrl?: string },
+): Promise<RunPlan> {
+  return await metrics.observeOperation("blueprint_execution", { action: "plan" }, () =>
+    actionPlanImpl(profile, blueprint, options),
+  );
+}
+
+async function actionPlanImpl(
+  profile: string,
+  blueprint: Blueprint,
+  options?: { dryRun?: boolean; endpointUrl?: string },
 ): Promise<RunPlan> {
   const rid = emitRunId();
   progress(10, "Validating blueprint");
@@ -691,6 +711,16 @@ export async function actionApply(
   profile: string,
   blueprint: Blueprint,
   options?: { planPath?: string; endpointUrl?: string },
+): Promise<void> {
+  await metrics.observeOperation("blueprint_execution", { action: "apply" }, () =>
+    actionApplyImpl(profile, blueprint, options),
+  );
+}
+
+async function actionApplyImpl(
+  profile: string,
+  blueprint: Blueprint,
+  options?: { planPath?: string; endpointUrl?: string },
 ): Promise<void> {
   if (options?.planPath) {
     throw new Error(
@@ -727,14 +757,16 @@ export async function actionApply(
     createArgs.push("--forward", String(port));
   }
 
-  const createResult = await runCmd(createArgs, { reject: false });
-  if (createResult.exitCode !== 0) {
-    if (createResult.stderr.includes("already exists")) {
-      log(`Sandbox '${sandboxName}' already exists, reusing.`);
-    } else {
-      throw new Error(`Failed to create sandbox: ${createResult.stderr}`);
+  await metrics.observeOperation("sandbox_lifecycle", { operation: "create" }, async () => {
+    const createResult = await runCmd(createArgs, { reject: false });
+    if (createResult.exitCode !== 0) {
+      if (createResult.stderr.includes("already exists")) {
+        log(`Sandbox '${sandboxName}' already exists, reusing.`);
+      } else {
+        throw new Error(`Failed to create sandbox: ${createResult.stderr}`);
+      }
     }
-  }
+  });
 
   progress(50, "Configuring inference provider");
   const providerName = inferenceCfg.provider_name ?? "default";
 
@@ -19,6 +19,8 @@ import {
   describeOnboardProvider,
   loadOnboardConfig,
 } from "./onboard/config.js";
+import { isMetricsEnabled, metrics } from "./observability/metrics.js";
+import { startMetricsServer, type MetricsServer } from "./observability/server.js";
 import { registerRuntimeContext } from "./runtime-context.js";
 import { scanForSecrets, isMemoryPath } from "./security/secret-scanner.js";
 import { safeResolvePath } from "./security/safe-resolve-path.js";
@@ -352,7 +354,43 @@ export default function register(api: OpenClawPluginApi): void {
     handler: (ctx) => handleSlashCommand(ctx, api),
   });
 
-  // 2. Register nvidia-nim provider from the active OpenClaw config, falling
+  // 2. Register optional Prometheus-compatible metrics endpoint (#233)
+  if (isMetricsEnabled()) {
+    let metricsServer: MetricsServer | undefined;
+    api.registerService({
+      id: "nemoclaw-metrics",
+      start: async ({ logger }) => {
+        try {
+          metricsServer = await startMetricsServer({ registry: metrics, logger });
+        } catch (error) {
+          logger.warn(
+            `[OBSERVABILITY] Could not start NemoClaw metrics endpoint: ${
+              error instanceof Error ? error.message : String(error)
+            }`,
+          );
+        }
+      },
+      stop: async ({ logger }) => {
+        if (!metricsServer) {
+          return;
+        }
+        try {
+          await metricsServer.close();
+          logger.info("NemoClaw metrics endpoint stopped");
+        } catch (error) {
+          logger.warn(
+            `[OBSERVABILITY] Could not stop NemoClaw metrics endpoint cleanly: ${
+              error instanceof Error ? error.message : String(error)
+            }`,
+          );
+        } finally {
+          metricsServer = undefined;
+        }
+      },
+    });
+  }
+
+  // 3. Register nvidia-nim provider from the active OpenClaw config, falling
   // back to the onboard snapshot and then the NemoClaw default.
   const onboardCfg = loadOnboardConfig();
   const activeModel = readOpenClawPrimaryModel(api.logger) || onboardCfg?.model || "";