Do a better job of inferring OpenAI strict mode (#1511)

dmontagu · web-flow · commit babdf8254985 · 2025-04-16T23:36:24.000Z
diff --git a/pydantic_ai_slim/pydantic_ai/models/openai.py b/pydantic_ai_slim/pydantic_ai/models/openai.py
@@ -1,6 +1,7 @@
 from __future__ import annotations as _annotations
 
 import base64
+import re
 import warnings
 from collections.abc import AsyncIterable, AsyncIterator, Sequence
 from contextlib import asynccontextmanager
@@ -932,6 +933,31 @@ def _map_usage(response: chat.ChatCompletion | ChatCompletionChunk | responses.R
         )
 
 
+_STRICT_INCOMPATIBLE_KEYS = [
+    'minLength',
+    'maxLength',
+    'pattern',
+    'format',
+    'minimum',
+    'maximum',
+    'multipleOf',
+    'patternProperties',
+    'unevaluatedProperties',
+    'propertyNames',
+    'minProperties',
+    'maxProperties',
+    'unevaluatedItems',
+    'contains',
+    'minContains',
+    'maxContains',
+    'minItems',
+    'maxItems',
+    'uniqueItems',
+]
+
+_sentinel = object()
+
+
 @dataclass
 class _OpenAIJsonSchema(WalkJsonSchema):
     """Recursively handle the schema to make it compatible with OpenAI strict mode.
@@ -946,28 +972,64 @@ def __init__(self, schema: JsonSchema, strict: bool | None):
         super().__init__(schema)
         self.strict = strict
         self.is_strict_compatible = True
+        self.root_ref = schema.get('$ref')
+
+    def walk(self) -> JsonSchema:
+        # Note: OpenAI does not support anyOf at the root in strict mode
+        # However, we don't need to check for it here because we ensure in pydantic_ai._utils.check_object_json_schema
+        # that the root schema either has type 'object' or is recursive.
+        result = super().walk()
+
+        # For recursive models, we need to tweak the schema to make it compatible with strict mode.
+        # Because the following should never change the semantics of the schema we apply it unconditionally.
+        if self.root_ref is not None:
+            result.pop('$ref', None)  # We replace references to the self.root_ref with just '#' in the transform method
+            root_key = re.sub(r'^#/\$defs/', '', self.root_ref)
+            result.update(self.defs.get(root_key) or {})
+
+        return result
 
-    def transform(self, schema: JsonSchema) -> JsonSchema:
+    def transform(self, schema: JsonSchema) -> JsonSchema:  # noqa C901
         # Remove unnecessary keys
         schema.pop('title', None)
         schema.pop('default', None)
         schema.pop('$schema', None)
         schema.pop('discriminator', None)
 
-        # Remove incompatible keys, but note their impact in the description provided to the LLM
+        if schema_ref := schema.get('$ref'):
+            if schema_ref == self.root_ref:
+                schema['$ref'] = '#'
+            if len(schema) > 1:
+                # OpenAI Strict mode doesn't support siblings to "$ref", but _does_ allow siblings to "anyOf".
+                # So if there is a "description" field or any other extra info, we move the "$ref" into an "anyOf":
+                schema['anyOf'] = [{'$ref': schema.pop('$ref')}]
+
+        # Track strict-incompatible keys
+        incompatible_values: dict[str, Any] = {}
+        for key in _STRICT_INCOMPATIBLE_KEYS:
+            value = schema.get(key, _sentinel)
+            if value is not _sentinel:
+                incompatible_values[key] = value
         description = schema.get('description')
-        min_length = schema.pop('minLength', None)
-        max_length = schema.pop('maxLength', None)
-        if description is not None:
-            notes = list[str]()
-            if min_length is not None:  # pragma: no cover
-                notes.append(f'min_length={min_length}')
-            if max_length is not None:  # pragma: no cover
-                notes.append(f'max_length={max_length}')
-            if notes:  # pragma: no cover
-                schema['description'] = f'{description} ({", ".join(notes)})'
+        if incompatible_values:
+            if self.strict is True:
+                notes: list[str] = []
+                for key, value in incompatible_values.items():
+                    schema.pop(key)
+                    notes.append(f'{key}={value}')
+                notes_string = ', '.join(notes)
+                schema['description'] = notes_string if not description else f'{description} ({notes_string})'
+            elif self.strict is None:
+                self.is_strict_compatible = False
 
         schema_type = schema.get('type')
+        if 'oneOf' in schema:
+            # OpenAI does not support oneOf in strict mode
+            if self.strict is True:
+                schema['anyOf'] = schema.pop('oneOf')
+            else:
+                self.is_strict_compatible = False
+
         if schema_type == 'object':
             if self.strict is True:
                 # additional properties are disallowed
diff --git a/tests/models/test_openai.py b/tests/models/test_openai.py
@@ -4,6 +4,7 @@
 from collections.abc import Sequence
 from dataclasses import dataclass, field
 from datetime import datetime, timezone
+from enum import Enum
 from functools import cached_property
 from typing import Annotated, Any, Callable, Literal, Union, cast
 
@@ -730,9 +731,15 @@ class MyDefaultDc:
     x: int = 1
 
 
+class MyEnum(Enum):
+    a = 'a'
+    b = 'b'
+
+
 @dataclass
 class MyRecursiveDc:
     field: MyRecursiveDc | None
+    my_enum: MyEnum = Field(description='my enum')
 
 
 @dataclass
@@ -826,9 +833,13 @@ def tool_with_tuples(x: tuple[int], y: tuple[str] = ('abc',)) -> str:
                             },
                             'type': 'object',
                         },
+                        'MyEnum': {'enum': ['a', 'b'], 'type': 'string'},
                         'MyRecursiveDc': {
-                            'properties': {'field': {'anyOf': [{'$ref': '#/$defs/MyRecursiveDc'}, {'type': 'null'}]}},
-                            'required': ['field'],
+                            'properties': {
+                                'field': {'anyOf': [{'$ref': '#/$defs/MyRecursiveDc'}, {'type': 'null'}]},
+                                'my_enum': {'description': 'my enum', 'anyOf': [{'$ref': '#/$defs/MyEnum'}]},
+                            },
+                            'required': ['field', 'my_enum'],
                             'type': 'object',
                         },
                     },
@@ -857,11 +868,15 @@ def tool_with_tuples(x: tuple[int], y: tuple[str] = ('abc',)) -> str:
                             'additionalProperties': False,
                             'required': ['field'],
                         },
+                        'MyEnum': {'enum': ['a', 'b'], 'type': 'string'},
                         'MyRecursiveDc': {
-                            'properties': {'field': {'anyOf': [{'$ref': '#/$defs/MyRecursiveDc'}, {'type': 'null'}]}},
+                            'properties': {
+                                'field': {'anyOf': [{'$ref': '#/$defs/MyRecursiveDc'}, {'type': 'null'}]},
+                                'my_enum': {'description': 'my enum', 'anyOf': [{'$ref': '#/$defs/MyEnum'}]},
+                            },
                             'type': 'object',
                             'additionalProperties': False,
-                            'required': ['field'],
+                            'required': ['field', 'my_enum'],
                         },
                     },
                     'additionalProperties': False,
@@ -998,7 +1013,7 @@ def tool_with_tuples(x: tuple[int], y: tuple[str] = ('abc',)) -> str:
                         }
                     },
                     'additionalProperties': False,
-                    'properties': {'x': {'oneOf': [{'type': 'integer'}, {'$ref': '#/$defs/MyDefaultDc'}]}},
+                    'properties': {'x': {'anyOf': [{'type': 'integer'}, {'$ref': '#/$defs/MyDefaultDc'}]}},
                     'required': ['x'],
                     'type': 'object',
                 }
@@ -1079,12 +1094,15 @@ def tool_with_tuples(x: tuple[int], y: tuple[str] = ('abc',)) -> str:
                 {
                     'additionalProperties': False,
                     'properties': {
-                        'x': {'maxItems': 1, 'minItems': 1, 'prefixItems': [{'type': 'integer'}], 'type': 'array'},
+                        'x': {
+                            'prefixItems': [{'type': 'integer'}],
+                            'type': 'array',
+                            'description': 'minItems=1, maxItems=1',
+                        },
                         'y': {
-                            'maxItems': 1,
-                            'minItems': 1,
                             'prefixItems': [{'type': 'string'}],
                             'type': 'array',
+                            'description': 'minItems=1, maxItems=1',
                         },
                     },
                     'required': ['x', 'y'],
@@ -1160,28 +1178,46 @@ class MyModel(BaseModel):
                 'MyModel': {
                     'additionalProperties': False,
                     'properties': {
-                        'my_discriminated_union': {'oneOf': [{'$ref': '#/$defs/Apple'}, {'$ref': '#/$defs/Banana'}]},
+                        'my_discriminated_union': {'anyOf': [{'$ref': '#/$defs/Apple'}, {'$ref': '#/$defs/Banana'}]},
                         'my_list': {'items': {'type': 'number'}, 'type': 'array'},
                         'my_patterns': {
                             'additionalProperties': False,
-                            'patternProperties': {'^my-pattern$': {'type': 'string'}},
+                            'description': "patternProperties={'^my-pattern$': {'type': 'string'}}",
                             'type': 'object',
                             'properties': {},
                             'required': [],
                         },
-                        'my_recursive': {'anyOf': [{'$ref': '#/$defs/MyModel'}, {'type': 'null'}]},
+                        'my_recursive': {'anyOf': [{'$ref': '#'}, {'type': 'null'}]},
                         'my_tuple': {
-                            'maxItems': 1,
-                            'minItems': 1,
                             'prefixItems': [{'type': 'integer'}],
                             'type': 'array',
+                            'description': 'minItems=1, maxItems=1',
                         },
                     },
                     'required': ['my_recursive', 'my_patterns', 'my_tuple', 'my_list', 'my_discriminated_union'],
                     'type': 'object',
                 },
             },
-            '$ref': '#/$defs/MyModel',
+            'properties': {
+                'my_recursive': {'anyOf': [{'$ref': '#'}, {'type': 'null'}]},
+                'my_patterns': {
+                    'type': 'object',
+                    'description': "patternProperties={'^my-pattern$': {'type': 'string'}}",
+                    'additionalProperties': False,
+                    'properties': {},
+                    'required': [],
+                },
+                'my_tuple': {
+                    'prefixItems': [{'type': 'integer'}],
+                    'type': 'array',
+                    'description': 'minItems=1, maxItems=1',
+                },
+                'my_list': {'items': {'type': 'number'}, 'type': 'array'},
+                'my_discriminated_union': {'anyOf': [{'$ref': '#/$defs/Apple'}, {'$ref': '#/$defs/Banana'}]},
+            },
+            'required': ['my_recursive', 'my_patterns', 'my_tuple', 'my_list', 'my_discriminated_union'],
+            'type': 'object',
+            'additionalProperties': False,
         }
     )