strands-agents · jsamuel1 · May 9, 2026 · github-actions · May 9, 2026
diff --git a/AGENTS.md b/AGENTS.md
@@ -78,10 +78,14 @@ sdk-typescript/
 │   │   │   ├── anthropic.ts      # Anthropic Claude
 │   │   │   ├── bedrock.ts        # AWS Bedrock
 │   │   │   ├── vercel.ts         # Vercel AI SDK
+│   │   │   ├── webllm/           # WebLLM (on-device via WebGPU) provider
+│   │   │   │   ├── __tests__/    # model.test.ts, cache.test.node.ts, browser.test.browser.ts
+│   │   │   │   ├── cache.ts      # Download / list / check / evict helpers + errors
+│   │   │   │   ├── model.ts      # WebLLMModel (runtime streaming + message formatting)
+│   │   │   │   └── index.ts
 │   │   │   ├── defaults.ts       # Centralized model defaults + warning messages
 │   │   │   ├── model.ts          # Base model interface
 │   │   │   └── streaming.ts      # Streaming event types
-│   │   │
 │   │   ├── multiagent/           # Multi-agent orchestration
 │   │   │   ├── __tests__/
 │   │   │   ├── graph.ts          # Graph orchestrator (DAG)
@@ -275,7 +279,7 @@ sdk-typescript/
 - **`strands-ts/src/conversation-manager/`**: Conversation history management strategies
 - **`strands-ts/src/hooks/`**: Hooks system for event-driven extensibility
 - **`strands-ts/src/logging/`**: Structured logging utilities
-- **`strands-ts/src/models/`**: Model provider implementations (Bedrock, Anthropic, OpenAI, Google, Vercel)
+- **`strands-ts/src/models/`**: Model provider implementations (Bedrock, Anthropic, OpenAI, Google, Vercel, WebLLM)
 - **`strands-ts/src/multiagent/`**: Multi-agent orchestration patterns (Graph for DAG execution, Swarm for handoff-based routing)
 - **`strands-ts/src/plugins/`**: Plugin system for extending agent functionality
 - **`strands-ts/src/registry/`**: Tool registry implementation

diff --git a/strands-ts/package.json b/strands-ts/package.json
@@ -36,6 +36,10 @@
       "types": "./dist/src/models/vercel.d.ts",
       "default": "./dist/src/models/vercel.js"
     },
+    "./models/webllm": {
+      "types": "./dist/src/models/webllm/index.d.ts",
+      "default": "./dist/src/models/webllm/index.js"
+    },
     "./multiagent": {
       "types": "./dist/src/multiagent/index.d.ts",
       "default": "./dist/src/multiagent/index.js"
@@ -130,6 +134,7 @@
     "@aws-sdk/credential-providers": "^3.943.0",
     "@eslint/js": "^9.39.4",
     "@google/genai": "^1.40.0",
+    "@mlc-ai/web-llm": "^0.2.79",
     "@opentelemetry/api": "^1.9.0",
     "@opentelemetry/exporter-metrics-otlp-http": "^0.214.0",
     "@opentelemetry/exporter-trace-otlp-http": "^0.214.0",
@@ -178,6 +183,7 @@
     "@aws-sdk/client-s3": "^3.943.0",
     "@google/genai": "^1.40.0",
     "@modelcontextprotocol/sdk": "^1.25.2",
+    "@mlc-ai/web-llm": "^0.2.79",
     "@opentelemetry/api": "^1.9.0",
     "@opentelemetry/exporter-metrics-otlp-http": "^0.214.0",
     "@opentelemetry/exporter-trace-otlp-http": "^0.214.0",
@@ -208,6 +214,9 @@
     "@google/genai": {
       "optional": true
     },
+    "@mlc-ai/web-llm": {
+      "optional": true
+    },
     "openai": {
       "optional": true
     },

diff --git a/strands-ts/src/models/webllm/__tests__/browser.test.browser.ts b/strands-ts/src/models/webllm/__tests__/browser.test.browser.ts
@@ -0,0 +1,27 @@
+// ABOUTME: Browser-only smoke test for the WebLLM provider.
+// ABOUTME: Verifies the public module imports cleanly and listWebLLMModels works
+// ABOUTME: against the real @mlc-ai/web-llm prebuilt app config in a browser.
+
+import { describe, it, expect } from 'vitest'
+import { isBrowser } from '../../../__fixtures__/environment.js'
+import { WebLLMModel, listWebLLMModels } from '../index.js'
+
+describe('WebLLM browser smoke', () => {
+  // Sanity check: this suite only makes sense when executed in a browser environment.
+  it('runs in a browser environment', () => {
+    expect(isBrowser).toBe(true)
+  })
+
+  it('exposes WebLLMModel as a constructor', () => {
+    const modelId = 'Llama-3.1-8B-Instruct-q4f32_1-MLC'
+    expect(typeof WebLLMModel).toBe('function')
+    expect(new WebLLMModel({ modelId }).getConfig().modelId).toBe(modelId)
+  })
+
+  it('lists prebuilt models', async () => {
+    // No mocks here: the list comes from the real @mlc-ai/web-llm prebuilt app config.
+    const catalogue = await listWebLLMModels()
+    expect(catalogue.length).toBeGreaterThan(0)
+    ;['modelId', 'modelUrl', 'modelLib'].forEach((field) => expect(catalogue[0]).toHaveProperty(field))
+  })
+})
diff --git a/strands-ts/src/models/webllm/__tests__/cache.test.node.ts b/strands-ts/src/models/webllm/__tests__/cache.test.node.ts
@@ -0,0 +1,210 @@
+// ABOUTME: Unit tests for WebLLM cache / download helpers.
+// ABOUTME: The `@mlc-ai/web-llm` module is mocked so these run in node without WebGPU.
+
+import { describe, it, expect, vi, beforeEach, afterEach } from 'vitest'
+import type { MockedFunction } from 'vitest'
+import {
+  deleteWebLLMModel,
+  downloadWebLLMModel,
+  isWebLLMModelCached,
+  listWebLLMModels,
+  resetWebLLMModuleCache,
+  WebLLMModelNotFoundError,
+  WebLLMUnavailableError,
+} from '../cache.js'
+
+// Mocked `@mlc-ai/web-llm` surface. `vi.mock` is hoisted above the imports, so every value its
+// factory reads is created inside `vi.hoisted` and therefore exists whenever the factory runs.
+const { mockPrebuiltAppConfig, mockCreateEngine, mockHasModelInCache, mockDeleteModelAllInfoInCache } = vi.hoisted(
+  () => ({
+    mockPrebuiltAppConfig: {
+      model_list: [
+        {
+          model_id: 'test-model',
+          model: 'https://example.com/test-model',
+          model_lib: 'https://example.com/test-model.wasm',
+          vram_required_MB: 2048,
+        },
+        { model_id: 'other-model', model: 'https://example.com/other', model_lib: 'https://example.com/other.wasm' },
+      ],
+    },
+    mockCreateEngine: vi.fn(
+      async (
+        _modelId: string | string[],
+        _engineConfig?: { initProgressCallback?: (report: unknown) => void },
+        _chatOpts?: unknown
+      ) => ({
+        unload: vi.fn(async () => undefined),
+        chat: { completions: { create: vi.fn() } },
+      })
+    ),
+    mockHasModelInCache: vi.fn(async () => false),
+    mockDeleteModelAllInfoInCache: vi.fn(async () => undefined),
+  })
+)
+
+vi.mock('@mlc-ai/web-llm', () => ({
+  CreateMLCEngine: mockCreateEngine,
+  prebuiltAppConfig: mockPrebuiltAppConfig,
+  hasModelInCache: mockHasModelInCache,
+  deleteModelAllInfoInCache: mockDeleteModelAllInfoInCache,
+}))
+
+// Stub `window` so the browser environment check passes in node; afterEach restores the original state.
+const globalScope = globalThis as { window?: unknown }
+const originalWindow = globalThis.window
+beforeEach(() => {
+  globalScope.window = {} as unknown
+  vi.clearAllMocks()
+  resetWebLLMModuleCache()
+  mockHasModelInCache.mockResolvedValue(false)
+  mockDeleteModelAllInfoInCache.mockResolvedValue(undefined)
+  mockCreateEngine.mockImplementation(async () => {
+    return { unload: vi.fn(async () => undefined), chat: { completions: { create: vi.fn() } } }
+  })
+})
+afterEach(() => {
+  if (originalWindow !== undefined) {
+    globalScope.window = originalWindow
+  } else {
+    delete globalScope.window
+  }
+})
+
+describe('isWebLLMModelCached', () => {
+  it('returns true when the model is in cache', async () => {
+    mockHasModelInCache.mockResolvedValueOnce(true)
+    await expect(isWebLLMModelCached('test-model')).resolves.toBe(true)
+    // The mocked `prebuiltAppConfig` is what gets forwarded as the app config.
+    expect(mockHasModelInCache).toHaveBeenCalledWith('test-model', mockPrebuiltAppConfig)
+  })
+
+  it('returns false when the model is not in cache', async () => {
+    // Relies on the beforeEach default: hasModelInCache resolves to false.
+    await expect(isWebLLMModelCached('test-model')).resolves.toBe(false)
+  })
+
+  it('returns false when hasModelInCache throws (treats as not cached)', async () => {
+    mockHasModelInCache.mockRejectedValueOnce(new Error('storage error'))
+    await expect(isWebLLMModelCached('test-model')).resolves.toBe(false)
+  })
+
+  it('throws WebLLMModelNotFoundError for unknown modelId', async () => {
+    await expect(isWebLLMModelCached('nonexistent-model')).rejects.toBeInstanceOf(WebLLMModelNotFoundError)
+  })
+
+  it('throws WebLLMUnavailableError when not in browser environment', async () => {
+    // Drop the stub `window` installed by beforeEach to simulate a non-browser runtime.
+    delete (globalThis as { window?: unknown }).window
+    await expect(isWebLLMModelCached('test-model')).rejects.toBeInstanceOf(WebLLMUnavailableError)
+  })
+})
+
+describe('deleteWebLLMModel', () => {
+  it('delegates to deleteModelAllInfoInCache', async () => {
+    await deleteWebLLMModel('test-model')
+    expect(mockDeleteModelAllInfoInCache).toHaveBeenCalledWith('test-model', mockPrebuiltAppConfig)
+  })
+
+  it('throws for unknown model', async () => {
+    await expect(deleteWebLLMModel('nonexistent')).rejects.toBeInstanceOf(WebLLMModelNotFoundError)
+  })
+})
+
+describe('listWebLLMModels', () => {
+  it('returns all models from prebuiltAppConfig', async () => {
+    // Config fields are renamed: model_id/model/model_lib/vram_required_MB -> modelId/modelUrl/modelLib/vramMB.
+    const listed = await listWebLLMModels()
+    expect(listed).toHaveLength(2)
+    expect(listed[0]).toEqual({
+      modelId: 'test-model',
+      modelUrl: 'https://example.com/test-model',
+      modelLib: 'https://example.com/test-model.wasm',
+      vramMB: 2048,
+    })
+    expect(listed[1]).toEqual({
+      modelId: 'other-model',
+      modelUrl: 'https://example.com/other',
+      modelLib: 'https://example.com/other.wasm',
+    })
+  })
+
+  it('uses custom appConfig when provided', async () => {
+    // `as never` bypasses parameter typing so this minimal fixture is accepted.
+    const custom = { model_list: [{ model_id: 'custom', model: 'x', model_lib: 'y' }] }
+    const listed = await listWebLLMModels(custom as never)
+    expect(listed).toEqual([{ modelId: 'custom', modelUrl: 'x', modelLib: 'y' }])
+  })
+})
+
+describe('downloadWebLLMModel', () => {
+  it('creates a temporary engine and unloads it after load', async () => {
+    // A one-off engine stub lets this test observe its `unload` spy directly.
+    const unload = vi.fn(async () => undefined)
+    mockCreateEngine.mockImplementationOnce(async () => ({ unload, chat: { completions: { create: vi.fn() } } }))
+    await downloadWebLLMModel({ modelId: 'test-model' })
+    expect(mockCreateEngine).toHaveBeenCalledTimes(1)
+    expect(mockCreateEngine).toHaveBeenCalledWith('test-model', { appConfig: mockPrebuiltAppConfig }, undefined)
+    expect(unload).toHaveBeenCalledTimes(1)
+  })
+
+  it('forwards onProgress as the engine initProgressCallback', async () => {
+    const onProgress = vi.fn()
+    const unload = vi.fn(async () => undefined)
+    const report = { progress: 0.5, text: 'loading', timeElapsed: 1 }
+    // The fake engine factory fires one progress report before it resolves.
+    mockCreateEngine.mockImplementationOnce(async (_modelId, engineConfig) => {
+      ;(engineConfig as { initProgressCallback?: (r: unknown) => void }).initProgressCallback?.(report)
+      return { unload, chat: { completions: { create: vi.fn() } } }
+    })
+
+    await downloadWebLLMModel({ modelId: 'test-model', onProgress })
+
+    expect(onProgress).toHaveBeenCalledWith({ progress: 0.5, text: 'loading', timeElapsed: 1 })
+  })
+
+  it('throws AbortError when signal is already aborted', async () => {
+    const controller = new AbortController()
+    controller.abort()
+    const pending = downloadWebLLMModel({ modelId: 'test-model', signal: controller.signal })
+    await expect(pending).rejects.toMatchObject({ name: 'AbortError' })
+    // A pre-aborted signal must short-circuit before any engine is created.
+    expect(mockCreateEngine).not.toHaveBeenCalled()
+  })
+
+  it('throws AbortError when aborted mid-download', async () => {
+    const controller = new AbortController()
+    const unload = vi.fn(async () => undefined)
+    // Abort while the engine is still being created, then let creation finish normally.
+    mockCreateEngine.mockImplementationOnce(async () => {
+      controller.abort()
+      return { unload, chat: { completions: { create: vi.fn() } } }
+    })
+    const pending = downloadWebLLMModel({ modelId: 'test-model', signal: controller.signal })
+    await expect(pending).rejects.toMatchObject({ name: 'AbortError' })
+    // The engine that finished loading after the abort still has to be released.
+    expect(unload).toHaveBeenCalled()
+  })
+
+  it('throws when model is not in app config', async () => {
+    await expect(downloadWebLLMModel({ modelId: 'nonexistent' })).rejects.toBeInstanceOf(WebLLMModelNotFoundError)
+  })
+
+  it('surfaces engine errors via normalizeError', async () => {
+    mockCreateEngine.mockImplementationOnce(async () => {
+      throw new Error('webgpu unavailable')
+    })
+    await expect(downloadWebLLMModel({ modelId: 'test-model' })).rejects.toThrow('webgpu unavailable')
+  })
+})
+
+describe('loadWebLLMModule error handling', () => {
+  it('throws WebLLMUnavailableError when environment is not a browser', async () => {
+    // With the stubbed `window` removed, the call must reject as unavailable.
+    delete (globalThis as { window?: unknown }).window
+    await expect(downloadWebLLMModel({ modelId: 'test-model' })).rejects.toBeInstanceOf(WebLLMUnavailableError)
+  })
+})
+
+// Type-only export that references the `MockedFunction` import so lint does not report it as unused.
+export type _Unused = MockedFunction<typeof mockCreateEngine>