Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
20 changes: 19 additions & 1 deletion README.rst
Original file line number Diff line number Diff line change
Expand Up @@ -54,7 +54,14 @@ Usage

.. code-block:: python

validate(instance, schema, cls=OAS32Validator, allow_remote_references=False, **kwargs)
validate(
instance,
schema,
cls=OAS32Validator,
allow_remote_references=False,
check_schema=True,
**kwargs,
)

The first argument is always the value you want to validate.
The second argument is always the OpenAPI schema object.
Expand Down Expand Up @@ -83,6 +90,17 @@ remote ``$ref`` retrieval. To resolve external references, pass an explicit
``registry``. Set ``allow_remote_references=True`` only if you explicitly
accept jsonschema's default remote retrieval behavior.

``check_schema`` defaults to ``True`` and validates the schema before
validating an instance. For trusted pre-validated schemas in hot paths, set
``check_schema=False`` to skip schema checking.

The ``validate`` helper keeps an internal compiled-validator cache. You can
control cache size using the
``OPENAPI_SCHEMA_VALIDATOR_COMPILED_VALIDATOR_CACHE_MAX_SIZE`` environment variable
(default: ``128``).
The value is loaded once at first use and reused for the lifetime of the
process.

To validate an OpenAPI schema:

.. code-block:: python
Expand Down
Empty file added benchmarks/__init__.py
Empty file.
171 changes: 171 additions & 0 deletions benchmarks/cases.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,171 @@
from dataclasses import dataclass
from typing import Any

from referencing import Registry
from referencing import Resource
from referencing.jsonschema import DRAFT202012

from openapi_schema_validator import OAS30Validator
from openapi_schema_validator import OAS31Validator
from openapi_schema_validator import OAS32Validator
from openapi_schema_validator import oas30_format_checker
from openapi_schema_validator import oas31_format_checker
from openapi_schema_validator import oas32_format_checker


@dataclass(frozen=True)
class BenchmarkCase:
    """One benchmark scenario: a validator class plus a schema/instance pair."""

    # Stable identifier used to match cases across benchmark reports.
    name: str
    # Validator class to benchmark (e.g. OAS30Validator / OAS31Validator / OAS32Validator).
    validator_class: Any
    # OpenAPI schema object the instance is validated against.
    schema: dict[str, Any]
    # Value to validate; any JSON-compatible type (including None).
    instance: Any
    # Extra keyword arguments passed to the validator (format_checker, registry, ...).
    validator_kwargs: dict[str, Any]


def build_cases() -> list[BenchmarkCase]:
    """Build the fixed set of benchmark scenarios.

    Covers each supported OAS validator (3.0, 3.1, 3.2) plus a case that
    resolves ``$ref`` targets through an explicit ``referencing.Registry``.
    """
    name_resource = Resource.from_contents(
        {
            "$schema": "https://json-schema.org/draft/2020-12/schema",
            "type": "string",
        }
    )
    age_resource = DRAFT202012.create_resource(
        {
            "type": "integer",
            "format": "int32",
            "minimum": 0,
            "maximum": 120,
        }
    )
    # Registry exposing the two resources above under stable URNs.
    ref_registry = Registry().with_resources(
        [
            ("urn:name-schema", name_resource),
            ("urn:age-schema", age_resource),
        ]
    )

    # Component schemas for the OAS 3.0 discriminator case, assembled
    # separately to keep the BenchmarkCase construction below readable.
    mountain_hiking = {
        "type": "object",
        "properties": {
            "discipline": {
                "type": "string",
                "enum": ["mountain_hiking", "MountainHiking"],
            },
            "length": {"type": "integer"},
        },
        "required": ["discipline", "length"],
    }
    alpine_climbing = {
        "type": "object",
        "properties": {
            "discipline": {"type": "string", "enum": ["alpine_climbing"]},
            "height": {"type": "integer"},
        },
        "required": ["discipline", "height"],
    }
    route = {
        "oneOf": [
            {"$ref": "#/components/schemas/MountainHiking"},
            {"$ref": "#/components/schemas/AlpineClimbing"},
        ],
        "discriminator": {
            "propertyName": "discipline",
            "mapping": {
                "mountain_hiking": "#/components/schemas/MountainHiking",
                "alpine_climbing": "#/components/schemas/AlpineClimbing",
            },
        },
    }

    cases = [
        BenchmarkCase(
            name="oas32_simple_object",
            validator_class=OAS32Validator,
            schema={
                "type": "object",
                "required": ["name"],
                "properties": {
                    "name": {"type": "string"},
                    "enabled": {"type": "boolean"},
                },
                "additionalProperties": False,
            },
            instance={"name": "svc", "enabled": True},
            validator_kwargs={"format_checker": oas32_format_checker},
        ),
        BenchmarkCase(
            name="oas31_prefix_items",
            validator_class=OAS31Validator,
            schema={
                "type": "array",
                "prefixItems": [
                    {"type": "number"},
                    {"type": "string"},
                    {"enum": ["Street", "Avenue", "Boulevard"]},
                    {"enum": ["NW", "NE", "SW", "SE"]},
                ],
                "items": False,
            },
            instance=[1600, "Pennsylvania", "Avenue", "NW"],
            validator_kwargs={"format_checker": oas31_format_checker},
        ),
        BenchmarkCase(
            name="oas30_nullable",
            validator_class=OAS30Validator,
            schema={"type": "string", "nullable": True},
            instance=None,
            validator_kwargs={"format_checker": oas30_format_checker},
        ),
        BenchmarkCase(
            name="oas30_discriminator",
            validator_class=OAS30Validator,
            schema={
                "$ref": "#/components/schemas/Route",
                "components": {
                    "schemas": {
                        "MountainHiking": mountain_hiking,
                        "AlpineClimbing": alpine_climbing,
                        "Route": route,
                    }
                },
            },
            instance={"discipline": "mountain_hiking", "length": 10},
            validator_kwargs={"format_checker": oas30_format_checker},
        ),
        BenchmarkCase(
            name="oas32_registry_refs",
            validator_class=OAS32Validator,
            schema={
                "type": "object",
                "required": ["name"],
                "properties": {
                    "name": {"$ref": "urn:name-schema"},
                    "age": {"$ref": "urn:age-schema"},
                },
                "additionalProperties": False,
            },
            instance={"name": "John", "age": 23},
            validator_kwargs={
                "format_checker": oas32_format_checker,
                "registry": ref_registry,
            },
        ),
    ]
    return cases
169 changes: 169 additions & 0 deletions benchmarks/compare.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,169 @@
from __future__ import annotations

import argparse
import json
from pathlib import Path
from typing import Any

# Metrics where a smaller value is better (latencies and memory footprint).
LOWER_IS_BETTER_METRICS = {
    "compile_ms",
    "first_validate_ms",
    "compiled_peak_memory_kib",
}
# Metrics where a larger value is better (throughput figures).
HIGHER_IS_BETTER_METRICS = {
    "compiled_validations_per_second",
    "helper_validations_per_second",
    "helper_trusted_validations_per_second",
}
# Every metric compared per case, in the order the report prints them.
ALL_METRICS = [
    "compile_ms",
    "first_validate_ms",
    "compiled_validations_per_second",
    "helper_validations_per_second",
    "helper_trusted_validations_per_second",
    "compiled_peak_memory_kib",
]


def _parse_args() -> argparse.Namespace:
parser = argparse.ArgumentParser(
description="Compare two benchmark JSON reports.",
)
parser.add_argument(
"--baseline",
type=Path,
required=True,
help="Path to baseline benchmark JSON.",
)
parser.add_argument(
"--candidate",
type=Path,
required=True,
help="Path to candidate benchmark JSON.",
)
parser.add_argument(
"--regression-threshold",
type=float,
default=0.0,
help=(
"Percent threshold for regressions. "
"Example: 5 means fail only when regression exceeds 5%%."
),
)
parser.add_argument(
"--fail-on-regression",
action="store_true",
help="Exit with status 1 if regressions exceed threshold.",
)
return parser.parse_args()


def _load_report(path: Path) -> dict[str, Any]:
return json.loads(path.read_text(encoding="utf-8"))


def _cases_by_name(report: dict[str, Any]) -> dict[str, dict[str, Any]]:
return {case["name"]: case for case in report["cases"]}


def _percent_change(baseline_value: float, candidate_value: float) -> float:
if baseline_value == 0:
if candidate_value == 0:
return 0.0
return float("inf")
return ((candidate_value - baseline_value) / baseline_value) * 100.0


def _is_regression(metric: str, percent_change: float) -> bool:
    """Return True when *percent_change* moves *metric* in the worse direction.

    Metrics not listed in ``LOWER_IS_BETTER_METRICS`` are treated as
    higher-is-better.
    """
    lower_is_better = metric in LOWER_IS_BETTER_METRICS
    return percent_change > 0 if lower_is_better else percent_change < 0


def _format_status(is_regression: bool, percent_change: float) -> str:
if abs(percent_change) < 1e-12:
return "no change (0.00%)"

direction = "regression" if is_regression else "improvement"
sign = "+" if percent_change >= 0 else ""
return f"{direction} ({sign}{percent_change:.2f}%)"


def _compare_reports(
    baseline: dict[str, Any],
    candidate: dict[str, Any],
    regression_threshold: float,
) -> tuple[list[str], list[str]]:
    """Compare every metric of every baseline case against the candidate.

    Returns a pair of (human-readable report lines, regression messages for
    changes whose magnitude exceeds *regression_threshold* percent).
    """
    baseline_by_name = _cases_by_name(baseline)
    candidate_by_name = _cases_by_name(candidate)

    lines: list[str] = []
    failures: list[str] = []

    for name in sorted(baseline_by_name):
        baseline_case = baseline_by_name[name]
        candidate_case = candidate_by_name.get(name)
        # A case dropped from the candidate report always counts as a failure.
        if candidate_case is None:
            failures.append(
                f"Missing case in candidate report: {name}"
            )
            continue

        lines.append(f"Case: {name}")
        for metric in ALL_METRICS:
            old_value = float(baseline_case[metric])
            new_value = float(candidate_case[metric])
            delta = _percent_change(old_value, new_value)
            worse = _is_regression(metric, delta)
            verdict = _format_status(worse, delta)

            lines.append(
                f" {metric}: baseline={old_value:.6f} "
                f"candidate={new_value:.6f} -> {verdict}"
            )

            if worse and abs(delta) > regression_threshold:
                failures.append(
                    f"{name} {metric} regressed by {abs(delta):.2f}%"
                )

    # Extra candidate-only cases are informational, never failures.
    for name in sorted(set(candidate_by_name).difference(baseline_by_name)):
        lines.append(f"Case present only in candidate: {name}")

    return lines, failures


def main() -> int:
    """Entry point: load both reports, print the comparison, return exit status.

    Returns 1 only when ``--fail-on-regression`` is set and at least one
    regression exceeded the threshold; otherwise 0.
    """
    options = _parse_args()
    comparison_lines, regressions = _compare_reports(
        _load_report(options.baseline),
        _load_report(options.candidate),
        options.regression_threshold,
    )

    print(
        f"Comparing candidate {options.candidate} "
        f"against baseline {options.baseline}"
    )
    print("")
    print("\n".join(comparison_lines))

    if not regressions:
        return 0

    print("")
    print("Regressions above threshold:")
    for message in regressions:
        print(f"- {message}")

    return 1 if options.fail_on_regression else 0


# Propagate main()'s status code as the process exit code when run as a script.
if __name__ == "__main__":
    raise SystemExit(main())
Loading
Loading