feat: deterministic JSON schema inference (genson wrapper)
This commit is contained in:
@@ -0,0 +1,24 @@
|
|||||||
|
from __future__ import annotations
|
||||||
|
|
||||||
|
from typing import Any
|
||||||
|
|
||||||
|
from genson import SchemaBuilder
|
||||||
|
|
||||||
|
|
||||||
|
class SchemaAccumulator:
|
||||||
|
"""Accumulate JSON samples into a widening JSON Schema (genson-backed)."""
|
||||||
|
|
||||||
|
def __init__(self) -> None:
|
||||||
|
self._builder = SchemaBuilder()
|
||||||
|
self._count = 0
|
||||||
|
|
||||||
|
def add(self, value: Any) -> None:
|
||||||
|
self._builder.add_object(value)
|
||||||
|
self._count += 1
|
||||||
|
|
||||||
|
def schema(self) -> dict[str, Any] | None:
|
||||||
|
if self._count == 0:
|
||||||
|
return None
|
||||||
|
result: dict[str, Any] = self._builder.to_schema()
|
||||||
|
result.pop("$schema", None)
|
||||||
|
return result
|
||||||
@@ -0,0 +1,30 @@
|
|||||||
|
from auto_reverse.doc.schema import SchemaAccumulator
|
||||||
|
|
||||||
|
|
||||||
|
def test_single_object_schema():
|
||||||
|
acc = SchemaAccumulator()
|
||||||
|
acc.add({"id": 1, "name": "Ada"})
|
||||||
|
schema = acc.schema()
|
||||||
|
assert schema["type"] == "object"
|
||||||
|
assert set(schema["properties"]) == {"id", "name"}
|
||||||
|
|
||||||
|
|
||||||
|
def test_merge_widens_optional_fields():
|
||||||
|
acc = SchemaAccumulator()
|
||||||
|
acc.add({"id": 1, "name": "Ada"})
|
||||||
|
acc.add({"id": 2}) # name missing -> becomes optional
|
||||||
|
schema = acc.schema()
|
||||||
|
assert "id" in schema.get("required", [])
|
||||||
|
assert "name" not in schema.get("required", [])
|
||||||
|
|
||||||
|
|
||||||
|
def test_array_schema():
|
||||||
|
acc = SchemaAccumulator()
|
||||||
|
acc.add([{"id": 1}, {"id": 2}])
|
||||||
|
schema = acc.schema()
|
||||||
|
assert schema["type"] == "array"
|
||||||
|
assert schema["items"]["type"] == "object"
|
||||||
|
|
||||||
|
|
||||||
|
def test_empty_accumulator_returns_none():
|
||||||
|
assert SchemaAccumulator().schema() is None
|
||||||
Reference in New Issue
Block a user