14 changes: 12 additions & 2 deletions docetl/operations/filter.py
@@ -5,18 +5,28 @@
from pydantic import model_validator

from docetl.operations.map import MapOperation
from docetl.operations.utils.validation import (
convert_schema_to_dict_format,
is_pydantic_model,
)


class FilterOperation(MapOperation):
class schema(MapOperation.schema):
type: str = "filter"
prompt: str
output: dict[str, Any]
output: dict[str, Any] | Any

@model_validator(mode="after")
def validate_filter_output_schema(self):
# Check that schema exists and has the right structure for filtering
schema_dict = self.output["schema"]
raw_schema = self.output["schema"]

# Convert Pydantic schema to dict format for validation
if is_pydantic_model(raw_schema):
schema_dict = convert_schema_to_dict_format(raw_schema)
else:
schema_dict = raw_schema

# Filter out _short_explanation for validation
schema = {k: v for k, v in schema_dict.items() if k != "_short_explanation"}
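For context: with this change a filter's output schema can be declared either in the existing dict form or as a Pydantic model. A minimal sketch of the two equivalent configurations, assuming only the type/prompt/output/schema keys that appear in this diff (the model name and the "bool" type spelling are illustrative):

from pydantic import BaseModel

# Hypothetical output model, for illustration only
class KeepDecision(BaseModel):
    keep: bool

# Existing dict-style schema
filter_config_dict = {
    "type": "filter",
    "prompt": "Should this document be kept? Answer with a boolean.",
    "output": {"schema": {"keep": "bool"}},
}

# Pydantic-style schema enabled by this PR
filter_config_pydantic = {
    "type": "filter",
    "prompt": "Should this document be kept? Answer with a boolean.",
    "output": {"schema": KeepDecision},
}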
16 changes: 14 additions & 2 deletions docetl/operations/map.py
@@ -17,12 +17,16 @@
from docetl.operations.base import BaseOperation
from docetl.operations.utils import RichLoopBar, strict_render, validate_output_types
from docetl.operations.utils.api import OutputMode
from docetl.operations.utils.validation import (
convert_schema_to_dict_format,
is_pydantic_model,
)


class MapOperation(BaseOperation):
class schema(BaseOperation.schema):
type: str = "map"
output: dict[str, Any] | None = None
output: dict[str, Any] | Any | None = None
prompt: str | None = None
model: str | None = None
optimize: bool | None = None
@@ -610,7 +614,15 @@ def execute(self, input_data: list[dict]) -> tuple[list[dict], float]:
"""
results = {}
total_cost = 0
output_schema = self.config.get("output", {}).get("schema", {})
# Handle both dict and Pydantic schemas
output_config = self.config.get("output", {})
raw_schema = output_config.get("schema", {})

# Convert Pydantic schema to dict format if needed
if is_pydantic_model(raw_schema):
output_schema = convert_schema_to_dict_format(raw_schema)
else:
output_schema = raw_schema

# Check if there's no prompt and only drop_keys
if "prompts" not in self.config and "drop_keys" in self.config:
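The helpers imported from docetl.operations.utils.validation are not shown in this diff. A rough sketch of what they presumably do, under the assumption that a "Pydantic schema" means a BaseModel subclass (the real implementations may differ; convert_schema_to_dict_format also appears to take a model parameter, per a review comment further down):

import inspect
from typing import Any
from pydantic import BaseModel

def is_pydantic_model(schema: Any) -> bool:
    # A schema counts as "Pydantic" when it is a BaseModel subclass rather than a plain dict
    return inspect.isclass(schema) and issubclass(schema, BaseModel)

def convert_schema_to_dict_format(schema: type[BaseModel]) -> dict[str, Any]:
    # Translate each field annotation into the string type names used by dict schemas
    type_names = {str: "string", int: "integer", float: "number", bool: "boolean"}
    return {
        name: type_names.get(field.annotation, "string")
        for name, field in schema.model_fields.items()
    }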
15 changes: 14 additions & 1 deletion docetl/operations/reduce.py
@@ -32,6 +32,10 @@

# Import OutputMode enum for structured output checks
from docetl.operations.utils.api import OutputMode
from docetl.operations.utils.validation import (
convert_schema_to_dict_format,
is_pydantic_model,
)
from docetl.utils import completion_cost


@@ -46,7 +50,7 @@ class ReduceOperation(BaseOperation):
class schema(BaseOperation.schema):
type: str = "reduce"
reduce_key: str | list[str]
output: dict[str, Any]
output: dict[str, Any] | Any
prompt: str
optimize: bool | None = None
synthesize_resolve: bool | None = None
@@ -200,6 +204,15 @@ def execute(self, input_data: list[dict]) -> tuple[list[dict], float]:
f"Using gleaning with validation prompt: {self.config.get('gleaning', {}).get('validation_prompt', '')}"
)

# Handle both dict and Pydantic schemas
if self.config.get("output") and "schema" in self.config["output"]:
raw_schema = self.config["output"]["schema"]
if is_pydantic_model(raw_schema):
# Convert Pydantic schema to dict format for internal processing
self.config["output"]["schema"] = convert_schema_to_dict_format(
raw_schema
)

Bug: Schema Mutation Causes Inconsistent Behavior

The ReduceOperation and ResolveOperation classes mutate self.config["output"]["schema"] in place. When a Pydantic model is provided for the output schema, it's converted to a dictionary and directly overwrites the original Pydantic model in the configuration. This can lead to inconsistent behavior or break functionality if the operation instance is reused, as subsequent executions will operate on the converted dictionary schema.
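A minimal sketch of one way to avoid the in-place mutation, mirroring how MapOperation above keeps the converted schema in a local variable instead of overwriting the config entry:

# Inside execute(): read the schema without mutating self.config
raw_schema = self.config.get("output", {}).get("schema", {})
if is_pydantic_model(raw_schema):
    # Convert for internal processing only; the original Pydantic model stays in the config
    output_schema = convert_schema_to_dict_format(raw_schema)
else:
    output_schema = raw_schema
# ...use output_schema for the rest of execute()...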


reduce_keys = self.config["reduce_key"]
if isinstance(reduce_keys, str):
reduce_keys = [reduce_keys]
24 changes: 20 additions & 4 deletions docetl/operations/resolve.py
@@ -14,6 +14,10 @@

from docetl.operations.base import BaseOperation
from docetl.operations.utils import RichLoopBar, rich_as_completed, strict_render
from docetl.operations.utils.validation import (
convert_schema_to_dict_format,
is_pydantic_model,
)
from docetl.utils import completion_cost, extract_jinja_variables


@@ -29,7 +33,7 @@ class schema(BaseOperation.schema):
type: str = "resolve"
comparison_prompt: str
resolution_prompt: str | None = None
output: dict[str, Any] | None = None
output: dict[str, Any] | Any | None = None
embedding_model: str | None = None
resolution_model: str | None = None
comparison_model: str | None = None
@@ -113,12 +117,15 @@ def validate_output_schema(self, info: ValidationInfo):
if "schema" not in self.output:
raise ValueError("Missing 'schema' in 'output' configuration")

if not isinstance(self.output["schema"], dict):
# Accept both dict schemas and Pydantic models
schema = self.output["schema"]
if not isinstance(schema, dict) and not is_pydantic_model(schema):
raise TypeError(
"'schema' in 'output' configuration must be a dictionary"
"'schema' in 'output' configuration must be a dictionary or Pydantic BaseModel"
)

if not self.output["schema"]:
# Check if schema is empty (only applies to dict schemas)
if isinstance(schema, dict) and not schema:
raise ValueError("'schema' in 'output' configuration cannot be empty")

return self
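For reference, a sketch of how the updated validator treats the main cases (the model and field names are made up; the error messages are the ones in the diff):

from pydantic import BaseModel

class Canonical(BaseModel):
    canonical_name: str

ok_dict = {"schema": {"canonical_name": "string"}}  # accepted: non-empty dict schema
ok_model = {"schema": Canonical}                    # accepted after this PR: a BaseModel subclass
# {"schema": 42} -> TypeError: "'schema' in 'output' configuration must be a dictionary or Pydantic BaseModel"
# {"schema": {}} -> ValueError: "'schema' in 'output' configuration cannot be empty" (dict schemas only)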
@@ -208,6 +215,15 @@ def execute(self, input_data: list[dict]) -> tuple[list[dict], float]:
if len(input_data) == 0:
return [], 0

# Handle both dict and Pydantic schemas
if self.config.get("output") and "schema" in self.config["output"]:
raw_schema = self.config["output"]["schema"]
if is_pydantic_model(raw_schema):
# Convert Pydantic schema to dict format for internal processing
self.config["output"]["schema"] = convert_schema_to_dict_format(
raw_schema
)

# Initialize observability data for all items at the start
if self.config.get("enable_observability", False):
observability_key = f"_observability_{self.config['name']}"
79 changes: 67 additions & 12 deletions docetl/operations/utils/api.py
@@ -34,8 +34,10 @@
)
from .validation import (
convert_dict_schema_to_list_schema,
convert_schema_to_dict_format,
convert_val,
get_user_input_for_schema,
is_pydantic_model,
safe_eval,
strict_render,
)
@@ -130,16 +132,32 @@ def call_llm_batch(
model: str,
op_type: str,
messages: list[dict[str, str]],
output_schema: dict[str, str],
output_schema: dict[str, str] | Any,
verbose: bool = False,
timeout_seconds: int = 120,
max_retries_per_timeout: int = 2,
bypass_cache: bool = False,
litellm_completion_kwargs: dict[str, Any] = {},
op_config: dict[str, Any] = {},
) -> LLMResult:
# Turn the output schema into a list of schemas
output_schema = convert_dict_schema_to_list_schema(output_schema)
# Handle Pydantic schemas
if is_pydantic_model(output_schema):
# Auto-enable structured output for Pydantic schemas
op_config = op_config.copy()
if "output" not in op_config:
op_config["output"] = {}
if "mode" not in op_config["output"]:
op_config["output"]["mode"] = OutputMode.STRUCTURED_OUTPUT.value

# For structured output mode, pass the Pydantic model directly
# The LLM API will handle the OpenAPI conversion internally
op_config["_pydantic_schema"] = output_schema
# Convert to dict format only for the list schema wrapper
dict_schema = convert_schema_to_dict_format(output_schema, model)
Bug: Schema Conversion Function Parameter Mismatch

The convert_schema_to_dict_format function is called with the LLM model name as its second argument. The function's model parameter, which defaults to 'gpt-4o-mini', seems intended for schema conversion logic rather than the LLM model name. This semantic mismatch could lead to incorrect schema conversion behavior.
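If the review comment is right that this model parameter is unrelated to the LLM model name, the likely fix is simply to drop the second argument here (and in the matching call in call_llm below), as the map and filter operations already do. A sketch of that suggestion, not a confirmed API:

# Convert the Pydantic model without passing the LLM model name through
dict_schema = convert_schema_to_dict_format(output_schema)
output_schema = convert_dict_schema_to_list_schema(dict_schema)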


output_schema = convert_dict_schema_to_list_schema(dict_schema)
else:
# Regular dict schema processing
output_schema = convert_dict_schema_to_list_schema(output_schema)

# Invoke the LLM call
return self.call_llm(
@@ -442,7 +460,7 @@ def call_llm(
model: str,
op_type: str,
messages: list[dict[str, str]],
output_schema: dict[str, str],
output_schema: dict[str, str] | Any,
tools: list[dict[str, str]] | None = None,
scratchpad: str | None = None,
timeout_seconds: int = 120,
@@ -479,6 +497,20 @@ def call_llm(
Raises:
TimeoutError: If the call times out after retrying.
"""
# Handle Pydantic schemas
if is_pydantic_model(output_schema):
# Auto-enable structured output for Pydantic schemas
op_config = op_config.copy()
if "output" not in op_config:
op_config["output"] = {}
if "mode" not in op_config["output"]:
op_config["output"]["mode"] = OutputMode.STRUCTURED_OUTPUT.value

# Store the Pydantic schema for structured output
op_config["_pydantic_schema"] = output_schema
# Convert to dict format for internal processing
output_schema = convert_schema_to_dict_format(output_schema, model)

# Determine output mode using central enum
output_mode_str = op_config.get("output", {}).get(
"mode", OutputMode.TOOLS.value
@@ -674,15 +706,38 @@ def _call_llm_with_cache(
# Prepare structured output schema if using structured output mode
response_format = None
if use_structured_output:
if scratchpad is not None:
props["updated_scratchpad"] = {"type": "string"}
# Check if we have a Pydantic schema to use directly
pydantic_schema = op_config.get("_pydantic_schema")
if pydantic_schema and is_pydantic_model(pydantic_schema):
# Use the OpenAPI schema from Pydantic directly
from .validation import pydantic_to_openapi_schema

openapi_schema = pydantic_to_openapi_schema(pydantic_schema)

if scratchpad is not None:
# Add scratchpad to the schema properties
openapi_schema = openapi_schema.copy()
openapi_schema["properties"] = openapi_schema["properties"].copy()
openapi_schema["properties"]["updated_scratchpad"] = {
"type": "string"
}
if "required" in openapi_schema:
openapi_schema["required"] = list(
openapi_schema["required"]
) + ["updated_scratchpad"]

schema = {
"type": "object",
"properties": props,
"required": list(props.keys()),
"additionalProperties": False,
}
schema = openapi_schema
else:
# Use the converted dict schema
if scratchpad is not None:
props["updated_scratchpad"] = {"type": "string"}

schema = {
"type": "object",
"properties": props,
"required": list(props.keys()),
"additionalProperties": False,
}

response_format = {
"type": "json_schema",
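To make the structured-output branch concrete, here is a rough sketch of the response_format this code ends up building for a small Pydantic model. Pydantic's built-in model_json_schema() stands in for the repo's pydantic_to_openapi_schema helper (not shown here and possibly different), and the final wrapper keys are the usual OpenAI-style json_schema format that the truncated lines above appear to construct:

from pydantic import BaseModel

class Extraction(BaseModel):
    name: str
    score: float

# Stand-in for pydantic_to_openapi_schema
openapi_schema = Extraction.model_json_schema()

# Mirror the scratchpad handling added in this hunk
schema = dict(openapi_schema)
schema["properties"] = dict(openapi_schema["properties"])
schema["properties"]["updated_scratchpad"] = {"type": "string"}
if "required" in schema:
    schema["required"] = list(schema["required"]) + ["updated_scratchpad"]

# Assumed shape of the final wrapper (the diff is truncated after "type": "json_schema")
response_format = {
    "type": "json_schema",
    "json_schema": {"name": "output", "strict": True, "schema": schema},
}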