docs(v2): add mode migration guide and normalization tests

jxnl · jxnl · commit 26e179513c36 · 2026-01-18T13:46:26.000-05:00
- Add docs/concepts/mode-migration.md explaining legacy mode deprecation - Add tests/v2/test_mode_normalization.py for mode normalization logic - Update mkdocs.yml with mode migration guide link - Tests skip gracefully when handlers not yet registered This PR was written by [Cursor](https://cursor.com)
diff --git a/docs/concepts/mode-migration.md b/docs/concepts/mode-migration.md
@@ -0,0 +1,107 @@
+---
+title: Mode Migration Guide
+description: Migrate from provider-specific modes to the core modes in Instructor.
+---
+
+# Mode Migration Guide
+
+This guide helps you move from provider-specific modes to the core modes.
+Core modes work across providers and are the recommended choice for new code.
+
+## Core Modes
+
+These are the core modes you should use:
+
+- `TOOLS`: Tool or function calling
+- `JSON_SCHEMA`: Native schema support when a provider has it
+- `MD_JSON`: JSON extracted from text or code blocks
+- `PARALLEL_TOOLS`: Multiple tool calls in one response
+- `RESPONSES_TOOLS`: OpenAI Responses API tools
+
+## Quick Mapping
+
+Use this table to replace legacy modes:
+
+| Legacy Mode | Core Mode |
+|------------|-----------|
+| `FUNCTIONS` | `TOOLS` |
+| `TOOLS_STRICT` | `TOOLS` |
+| `ANTHROPIC_TOOLS` | `TOOLS` |
+| `ANTHROPIC_JSON` | `MD_JSON` |
+| `COHERE_TOOLS` | `TOOLS` |
+| `COHERE_JSON_SCHEMA` | `JSON_SCHEMA` |
+| `XAI_TOOLS` | `TOOLS` |
+| `XAI_JSON` | `MD_JSON` |
+| `MISTRAL_TOOLS` | `TOOLS` |
+| `MISTRAL_STRUCTURED_OUTPUTS` | `JSON_SCHEMA` |
+| `FIREWORKS_TOOLS` | `TOOLS` |
+| `FIREWORKS_JSON` | `MD_JSON` |
+| `CEREBRAS_TOOLS` | `TOOLS` |
+| `CEREBRAS_JSON` | `MD_JSON` |
+| `WRITER_TOOLS` | `TOOLS` |
+| `WRITER_JSON` | `MD_JSON` |
+| `BEDROCK_TOOLS` | `TOOLS` |
+| `BEDROCK_JSON` | `MD_JSON` |
+| `PERPLEXITY_JSON` | `MD_JSON` |
+| `VERTEXAI_TOOLS` | `TOOLS` |
+| `VERTEXAI_JSON` | `MD_JSON` |
+| `VERTEXAI_PARALLEL_TOOLS` | `PARALLEL_TOOLS` |
+
+## Example: Anthropic
+
+**Before:**
+
+```python
+import instructor
+from instructor import Mode
+
+client = instructor.from_provider(
+    "anthropic/claude-3-5-haiku-latest",
+    mode=Mode.ANTHROPIC_TOOLS,
+)
+```
+
+**After:**
+
+```python
+import instructor
+from instructor import Mode
+
+client = instructor.from_provider(
+    "anthropic/claude-3-5-haiku-latest",
+    mode=Mode.TOOLS,
+)
+```
+
+## Example: Bedrock
+
+**Before:**
+
+```python
+import instructor
+from instructor import Mode
+
+client = instructor.from_provider(
+    "bedrock/anthropic.claude-3-5-sonnet-20241022-v2:0",
+    mode=Mode.BEDROCK_TOOLS,
+)
+```
+
+**After:**
+
+```python
+import instructor
+from instructor import Mode
+
+client = instructor.from_provider(
+    "bedrock/anthropic.claude-3-5-sonnet-20241022-v2:0",
+    mode=Mode.TOOLS,
+)
+```
+
+## Notes
+
+- Legacy modes still work but show a deprecation warning.
+- Use core modes for new code and docs.
+- Core tests are parameterized by provider and mode for consistent coverage.
+- See [Mode Comparison](../modes-comparison.md) for details.
diff --git a/mkdocs.yml b/mkdocs.yml
@@ -249,6 +249,7 @@ nav:
     - Patching: 'concepts/patching.md'
     - from_provider: 'concepts/from_provider.md'
     - Migration Guide: 'concepts/migration.md'
+    - Mode Migration: 'concepts/mode-migration.md'
     - Hooks: 'concepts/hooks.md'
     - Types: 'concepts/types.md'
     - TypedDicts: 'concepts/typeddicts.md'
diff --git a/tests/v2/test_mode_normalization.py b/tests/v2/test_mode_normalization.py
@@ -0,0 +1,281 @@
+from __future__ import annotations
+
+import warnings
+
+import pytest
+
+from instructor.mode import Mode
+from instructor.utils.providers import Provider
+
+try:
+    from instructor.v2.core import (
+        DEPRECATED_MODE_MAPPING,
+        mode_registry,
+        normalize_mode,
+        reset_deprecation_warnings,
+    )
+except ModuleNotFoundError:
+    pytest.skip("v2 module not available", allow_module_level=True)
+
+
+@pytest.fixture(autouse=True)
+def reset_warnings():
+    """Reset deprecation warnings before each test."""
+    reset_deprecation_warnings()
+    yield
+    reset_deprecation_warnings()
+
+
+@pytest.mark.parametrize(
+    "provider,mode,expected",
+    [
+        # GenAI legacy modes
+        (Provider.GENAI, Mode.GENAI_TOOLS, Mode.TOOLS),
+        (Provider.GENAI, Mode.GENAI_JSON, Mode.JSON),
+        (Provider.GENAI, Mode.GENAI_STRUCTURED_OUTPUTS, Mode.JSON),
+        # Anthropic legacy modes
+        (Provider.ANTHROPIC, Mode.ANTHROPIC_TOOLS, Mode.TOOLS),
+        (Provider.ANTHROPIC, Mode.ANTHROPIC_JSON, Mode.MD_JSON),
+        (Provider.ANTHROPIC, Mode.ANTHROPIC_PARALLEL_TOOLS, Mode.PARALLEL_TOOLS),
+        # OpenAI legacy modes
+        (Provider.OPENAI, Mode.FUNCTIONS, Mode.TOOLS),
+        (Provider.OPENAI, Mode.TOOLS_STRICT, Mode.TOOLS),
+        (Provider.OPENAI, Mode.JSON_O1, Mode.JSON_SCHEMA),
+        # Note: Mode.JSON is NOT deprecated - it's used by GenAI as a valid mode
+        (
+            Provider.OPENAI,
+            Mode.RESPONSES_TOOLS_WITH_INBUILT_TOOLS,
+            Mode.RESPONSES_TOOLS,
+        ),
+        # Mistral legacy modes
+        (Provider.MISTRAL, Mode.MISTRAL_TOOLS, Mode.TOOLS),
+        (Provider.MISTRAL, Mode.MISTRAL_STRUCTURED_OUTPUTS, Mode.JSON_SCHEMA),
+        # Cohere legacy modes
+        (Provider.COHERE, Mode.COHERE_TOOLS, Mode.TOOLS),
+        (Provider.COHERE, Mode.COHERE_JSON_SCHEMA, Mode.JSON_SCHEMA),
+        # xAI legacy modes
+        (Provider.XAI, Mode.XAI_TOOLS, Mode.TOOLS),
+        (Provider.XAI, Mode.XAI_JSON, Mode.MD_JSON),
+        # Generic modes should pass through unchanged
+        (Provider.GENAI, Mode.TOOLS, Mode.TOOLS),
+        (Provider.GENAI, Mode.JSON, Mode.JSON),
+        (Provider.ANTHROPIC, Mode.TOOLS, Mode.TOOLS),
+        (Provider.ANTHROPIC, Mode.JSON, Mode.JSON),
+        (Provider.OPENAI, Mode.TOOLS, Mode.TOOLS),
+        (Provider.OPENAI, Mode.JSON_SCHEMA, Mode.JSON_SCHEMA),
+        (Provider.OPENAI, Mode.MD_JSON, Mode.MD_JSON),
+        (Provider.OPENAI, Mode.PARALLEL_TOOLS, Mode.PARALLEL_TOOLS),
+        (Provider.OPENAI, Mode.RESPONSES_TOOLS, Mode.RESPONSES_TOOLS),
+    ],
+)
+def test_normalize_mode(provider: Provider, mode: Mode, expected: Mode):
+    """Test that mode normalization works correctly."""
+    result = normalize_mode(provider, mode)
+    assert result == expected
+
+
+@pytest.mark.parametrize(
+    "provider,expected_modes",
+    [
+        (Provider.GENAI, [Mode.TOOLS, Mode.JSON]),
+        (
+            Provider.OPENAI,
+            [
+                Mode.TOOLS,
+                Mode.JSON_SCHEMA,
+                Mode.MD_JSON,
+                Mode.PARALLEL_TOOLS,
+                Mode.RESPONSES_TOOLS,
+            ],
+        ),
+    ],
+)
+def test_handlers_registered_with_generic_modes(
+    provider: Provider, expected_modes: list[Mode]
+):
+    """Test that handlers are registered with generic modes.
+
+    Note: This test requires provider handlers to be registered.
+    It will be fully enabled in PR 3+ when providers are added.
+    """
+    # Skip if no modes are registered for this provider yet
+    registered_modes = mode_registry.get_modes_for_provider(provider)
+    if not registered_modes:
+        pytest.skip(f"No handlers registered for {provider.value} yet")
+
+    for mode in expected_modes:
+        if mode in registered_modes:
+            assert mode_registry.is_registered(provider, mode)
+
+
+@pytest.mark.parametrize(
+    "provider,legacy_mode,expected_mode",
+    [
+        (Provider.GENAI, Mode.GENAI_TOOLS, Mode.TOOLS),
+        (Provider.GENAI, Mode.GENAI_JSON, Mode.JSON),
+        (Provider.GENAI, Mode.GENAI_STRUCTURED_OUTPUTS, Mode.JSON),
+        (Provider.OPENAI, Mode.FUNCTIONS, Mode.TOOLS),
+        (Provider.OPENAI, Mode.TOOLS_STRICT, Mode.TOOLS),
+        (Provider.OPENAI, Mode.JSON_O1, Mode.JSON_SCHEMA),
+        (
+            Provider.OPENAI,
+            Mode.RESPONSES_TOOLS_WITH_INBUILT_TOOLS,
+            Mode.RESPONSES_TOOLS,
+        ),
+    ],
+)
+def test_backwards_compatibility(
+    provider: Provider, legacy_mode: Mode, expected_mode: Mode
+):
+    """Test that old provider-specific modes still work.
+
+    Note: This test requires provider handlers to be registered.
+    It will be fully enabled in PR 3+ when providers are added.
+    """
+    # Skip if provider doesn't have any handlers registered yet
+    registered_modes = mode_registry.get_modes_for_provider(provider)
+    if not registered_modes:
+        pytest.skip(f"No handlers registered for {provider.value} yet")
+
+    # The normalized mode should be registered
+    assert mode_registry.is_registered(provider, expected_mode)
+
+    # Legacy mode should normalize and find the same handler
+    legacy_handler = mode_registry.get_handler_class(provider, legacy_mode)
+    expected_handler = mode_registry.get_handler_class(provider, expected_mode)
+
+    assert legacy_handler is not None
+    assert expected_handler is not None
+    assert legacy_handler == expected_handler
+
+
+@pytest.mark.parametrize(
+    "provider,mode,expected_replacement",
+    [
+        (Provider.OPENAI, Mode.FUNCTIONS, Mode.TOOLS),
+        (Provider.OPENAI, Mode.TOOLS_STRICT, Mode.TOOLS),
+        (Provider.OPENAI, Mode.JSON_O1, Mode.JSON_SCHEMA),
+        # Note: Mode.JSON is NOT deprecated - it's used by GenAI as a valid mode
+        (Provider.ANTHROPIC, Mode.ANTHROPIC_TOOLS, Mode.TOOLS),
+        (Provider.GENAI, Mode.GENAI_TOOLS, Mode.TOOLS),
+        (Provider.MISTRAL, Mode.MISTRAL_TOOLS, Mode.TOOLS),
+        (Provider.COHERE, Mode.COHERE_TOOLS, Mode.TOOLS),
+        (Provider.XAI, Mode.XAI_TOOLS, Mode.TOOLS),
+    ],
+)
+def test_deprecated_mode_emits_warning(
+    provider: Provider, mode: Mode, expected_replacement: Mode
+):
+    """Test that using deprecated modes emits a deprecation warning."""
+    with warnings.catch_warnings(record=True) as w:
+        warnings.simplefilter("always")
+        result = normalize_mode(provider, mode)
+
+        # Should have emitted a warning
+        assert len(w) == 1
+        assert issubclass(w[0].category, DeprecationWarning)
+        assert mode.name in str(w[0].message)
+        assert expected_replacement.name in str(w[0].message)
+        assert "v3.0" in str(w[0].message)
+
+        # Should still return the correct normalized mode
+        assert result == expected_replacement
+
+
+@pytest.mark.parametrize("provider", [Provider.OPENAI, Provider.ANTHROPIC])
+def test_deprecated_mode_warning_only_once(provider: Provider):
+    """Test that deprecation warning is only shown once per mode."""
+    with warnings.catch_warnings(record=True) as w:
+        warnings.simplefilter("always")
+
+        # First call should warn
+        normalize_mode(provider, Mode.FUNCTIONS)
+        assert len(w) == 1
+
+        # Second call should not warn again
+        normalize_mode(provider, Mode.FUNCTIONS)
+        assert len(w) == 1  # Still only 1 warning
+
+        # Different mode should warn
+        normalize_mode(provider, Mode.TOOLS_STRICT)
+        assert len(w) == 2
+
+
+@pytest.mark.parametrize(
+    "provider,modes",
+    [
+        (Provider.OPENAI, [Mode.TOOLS, Mode.JSON_SCHEMA, Mode.MD_JSON]),
+        (Provider.GENAI, [Mode.TOOLS, Mode.JSON]),
+        (Provider.ANTHROPIC, [Mode.TOOLS, Mode.JSON]),
+    ],
+)
+def test_generic_mode_no_warning(provider: Provider, modes: list[Mode]):
+    """Test that using generic modes does not emit warnings."""
+    with warnings.catch_warnings(record=True) as w:
+        warnings.simplefilter("always")
+
+        for mode in modes:
+            normalize_mode(provider, mode)
+
+        # No warnings should be emitted for generic modes
+        assert len(w) == 0
+
+
+def test_deprecated_mode_mapping_is_complete():
+    """Test that all provider-specific modes are in the deprecated mapping."""
+    # These are the provider-specific modes that should be deprecated
+    # Note: Mode.JSON is NOT deprecated - it's used by GenAI as a valid mode
+    expected_deprecated = {
+        # OpenAI legacy
+        Mode.FUNCTIONS,
+        Mode.TOOLS_STRICT,
+        # Mode.JSON is NOT deprecated - it's used by GenAI
+        Mode.JSON_O1,
+        Mode.RESPONSES_TOOLS_WITH_INBUILT_TOOLS,
+        # Anthropic
+        Mode.ANTHROPIC_TOOLS,
+        Mode.ANTHROPIC_JSON,
+        Mode.ANTHROPIC_PARALLEL_TOOLS,
+        # GenAI
+        Mode.GENAI_TOOLS,
+        Mode.GENAI_JSON,
+        Mode.GENAI_STRUCTURED_OUTPUTS,
+        # Mistral
+        Mode.MISTRAL_TOOLS,
+        Mode.MISTRAL_STRUCTURED_OUTPUTS,
+        # Cohere
+        Mode.COHERE_TOOLS,
+        Mode.COHERE_JSON_SCHEMA,
+        # xAI
+        Mode.XAI_TOOLS,
+        Mode.XAI_JSON,
+        # Fireworks
+        Mode.FIREWORKS_TOOLS,
+        Mode.FIREWORKS_JSON,
+        # Cerebras
+        Mode.CEREBRAS_TOOLS,
+        Mode.CEREBRAS_JSON,
+        # Writer
+        Mode.WRITER_TOOLS,
+        Mode.WRITER_JSON,
+        # Bedrock
+        Mode.BEDROCK_TOOLS,
+        Mode.BEDROCK_JSON,
+        # Perplexity
+        Mode.PERPLEXITY_JSON,
+        # VertexAI
+        Mode.VERTEXAI_TOOLS,
+        Mode.VERTEXAI_JSON,
+        Mode.VERTEXAI_PARALLEL_TOOLS,
+        # Gemini
+        Mode.GEMINI_TOOLS,
+        Mode.GEMINI_JSON,
+        # OpenRouter
+        Mode.OPENROUTER_STRUCTURED_OUTPUTS,
+    }
+
+    # Check that all expected deprecated modes are in the mapping
+    for mode in expected_deprecated:
+        assert mode in DEPRECATED_MODE_MAPPING, (
+            f"Mode.{mode.name} should be in DEPRECATED_MODE_MAPPING"
+        )