toon-format · alesanfra · May 20, 2026 · Nov 28, 2025 · May 19, 2026 · May 20, 2026
@@ -120,6 +120,47 @@ tokens = count_tokens(toon_str)  # Uses tiktoken (gpt5/gpt5-mini)
 
 **Type Normalization:** `Infinity/NaN/Functions` → `null` • `Decimal` → `float` • `datetime` → ISO 8601 • `-0` → `0`
 
+## Pydantic Integration – (Structured TOON for LLM Outputs)
+
+Adds a **completely optional** Pydantic integration via the `[pydantic]` extra.
+
+```bash
+pip install "toon-python[pydantic]"
+```
+
+### Features
+
+- Schema: 50–60 % smaller than model_json_schema()
+- Zero JSON parsing errors
+- Works with `Instructor`, `Outlines`, `Marvin`, `LangChain agents`, etc.
+- Full Pydantic validation preserved
+
+## Usage After Release
+
+```python
+from toon_format.pydantic import ToonPydanticModel
+
+class User(ToonPydanticModel):
+    name: str
+    age: int
+    email: str | None = None
+
+# Convert schema to TOON for LLM system prompts
+schema_toon = User.schema_to_toon()
+# name:str,age:int,email:str|None
+
+# Parse LLM TOON output into validated Pydantic model
+toon_output = "name:Ansar,age:25,email:ansar@example.com"
+user = User.model_validate_toon(toon_output)
+
+# user.name → "Ansar"
+# user.age → 25
+# user.email → "ansar@example.com"
+
+# Serialize a model instance back to TOON
+toon_str = user.model_dump_toon()
+```
+
 ## Development
 
 ```bash

@@ -36,13 +36,17 @@ Documentation = "https://github.com/toon-format/spec"
 [project.scripts]
 toon = "toon_format.cli:main"
 
+[project.optional-dependencies]
+pydantic = ["pydantic>=2.0.0"]
+
 [dependency-groups]
 benchmark = ["tiktoken>=0.4.0"]
 dev = [
     "pytest>=8.0.0",
     "pytest-cov>=4.1.0",
     "ruff>=0.8.0",
     "mypy>=1.8.0",
+    "pydantic>=2.0.0",
 ]
 
 [tool.pytest.ini_options]
@@ -94,4 +98,4 @@ requires = ["hatchling"]
 build-backend = "hatchling.build"
 
 [tool.hatch.build.targets.wheel]
-packages = ["src/toon_format"]
+packages = ["src/toon_format"]
@@ -0,0 +1,3 @@
+from .serializer import ToonPydanticModel
+
+__all__ = ["ToonPydanticModel"]
@@ -0,0 +1,61 @@
+from __future__ import annotations
+
+from typing import TypeVar
+
+from pydantic import BaseModel, ValidationError
+
+from toon_format import decode, encode
+
+T = TypeVar("T", bound="ToonPydanticModel")
+
+
+class ToonPydanticModel(BaseModel):
+    """
+    Pydantic mixin that adds TOON superpowers.
+
+    • schema_to_toon()        → TOON schema string (for LLM few-shot / system prompts)
+    • model_dump_toon()       → Serialize this model instance to a TOON string
+    • model_validate_toon()   → Parse TOON output directly into a validated model
+    """
+
+    @classmethod
+    def schema_to_toon(cls) -> str:
+        """
+        Convert the model's JSON schema into compact TOON format.
+        Use this in your LLM prompt to save 40–60% tokens vs JSON schema.
+        """
+        schema = cls.model_json_schema()
+        # Pydantic gives us full JSON schema
+        return encode(schema)
+
+    def model_dump_toon(self, **kwargs) -> str:
+        """
+        Serialize this model instance into a compact TOON string.
+
+        Mirrors pydantic's ``model_dump_json()``. Extra keyword arguments are
+        forwarded to ``model_dump()`` (e.g. ``exclude_none=True``).
+        """
+        data = self.model_dump(mode="json", **kwargs)
+        return encode(data)
+
+    @classmethod
+    def model_validate_toon(cls: type[T], text: str) -> T:
+        """
+        Parse a raw TOON string (from an LLM) into a fully validated model.
+
+        Mirrors pydantic's ``model_validate_json()``.
+
+        Raises:
+            ValueError – If TOON parsing fails or the input is empty
+            ValidationError – If data doesn't match the model
+        """
+        if not text.strip():
+            raise ValueError("Empty string cannot be parsed as TOON")
+
+        try:
+            data = decode(text.strip())
+            return cls.model_validate(data)
+        except ValidationError as e:
+            raise e  # Let Pydantic's rich error surface (best UX)
+        except Exception as e:
+            raise ValueError(f"Failed to parse TOON into {cls.__name__}: {e}") from e
@@ -0,0 +1,52 @@
+from typing import Optional
+
+import pytest
+from pydantic import ValidationError
+
+from toon_format.pydantic import ToonPydanticModel
+
+
+class User(ToonPydanticModel):
+    name: str
+    age: int
+    email: Optional[str] = None
+
+
+def test_schema_to_toon():
+    schema = User.schema_to_toon()
+    assert "name:" in schema
+    assert "age:" in schema
+    assert "email:" in schema  # optional field
+    assert "type: object" in schema
+
+
+def test_model_validate_toon_success():
+    toon = "name:Ansar\nage:25\nemail:null"
+    user = User.model_validate_toon(toon)
+    assert user.name == "Ansar"
+    assert user.age == 25
+    assert user.email is None
+
+
+def test_model_validate_toon_validation_error():
+    toon = "name:Ansar\nage:twenty-five"  # wrong type
+    with pytest.raises(ValidationError):
+        User.model_validate_toon(toon)
+
+
+def test_model_validate_toon_empty_string():
+    with pytest.raises(ValueError, match="Empty string"):
+        User.model_validate_toon("")
+
+
+def test_model_dump_toon():
+    user = User(name="Ansar", age=25)
+    toon = user.model_dump_toon()
+    assert "name: Ansar" in toon
+    assert "age: 25" in toon
+
+
+def test_model_dump_toon_roundtrip():
+    user = User(name="Ansar", age=25, email="a@b.com")
+    restored = User.model_validate_toon(user.model_dump_toon())
+    assert restored == user
Original file line number	Diff line number	Diff line change
		@@ -0,0 +1,3 @@
		from .serializer import ToonPydanticModel

		__all__ = ["ToonPydanticModel"]