Forked from imankulov/sqlalchemy_with_pydantic.py
Last active: November 8, 2025 14:43
Using pydantic models as SQLAlchemy JSON fields (convert between JSON and pydantic.BaseModel subclasses) with modern syntax
import datetime
from typing import TYPE_CHECKING, Any, Optional, final

import sqlalchemy as sa
from pydantic import BaseModel, Field
from sqlalchemy.dialects.postgresql import JSONB
from sqlalchemy.orm import Mapped, declarative_base, mapped_column, sessionmaker
from typing_extensions import override

if TYPE_CHECKING:
    from sqlalchemy import Dialect
    from sqlalchemy.sql.type_api import TypeEngine


# --------------------------------------------------------------------------------------
# Define pydantic-alchemy specific types (once per application)
# --------------------------------------------------------------------------------------
@final
class PydanticType(sa.types.TypeDecorator["BaseModel"]):
    """Pydantic type.

    SAVING:
    - Uses SQLAlchemy JSON type under the hood.
    - Accepts the pydantic model and converts it to a dict on save.
    - SQLAlchemy engine JSON-encodes the dict to a string.

    RETRIEVING:
    - Pulls the string from the database.
    - SQLAlchemy engine JSON-decodes the string to a dict.
    - Uses the dict to create a pydantic model.
    """

    # If you intend to use this class with one dialect only,
    # you could pick a type from that specific dialect as `impl`
    # for simplicity's sake.
    #
    # E.g., if you work with PostgreSQL, you can consider using
    # sqlalchemy.dialects.postgresql.JSONB instead of the
    # generic sa.types.JSON.
    # Ref: https://www.postgresql.org/docs/13/datatype-json.html
    #
    # Otherwise, you should implement the `load_dialect_impl`
    # method to handle different dialects. In this case, the
    # impl variable can reference TypeEngine as a placeholder.
    impl = sa.types.JSON

    def __init__(self, pydantic_type: type["BaseModel"]) -> None:
        super().__init__()
        self.pydantic_type = pydantic_type

    @override
    def load_dialect_impl(self, dialect: "Dialect") -> "TypeEngine[JSONB | sa.JSON]":
        # You should implement this method to handle different dialects
        # if you intend to use this class with more than one.
        # E.g., use JSONB for PostgreSQL and the generic JSON type for
        # other databases.
        if dialect.name == "postgresql":
            return dialect.type_descriptor(JSONB())
        else:
            return dialect.type_descriptor(sa.JSON())

    @override
    def process_bind_param(
        self,
        value: "BaseModel | None",
        dialect: "Dialect",
    ) -> "dict[str, Any] | None":
        if value is None:
            return None
        if not isinstance(value, BaseModel):  # dynamic typing.
            raise TypeError(f'The value "{value!r}" is not a pydantic model')
        # Method .dict() is deprecated as of pydantic V2.
        #
        # Think before setting exclude_unset to True. It can reduce the size
        # of the dump, but unset values might mean something depending on your context.
        #
        # Setting mode to "json" means you won't need to define a custom JSON
        # serializer for the engine.
        return value.model_dump(mode="json", exclude_unset=True)

    @override
    def process_result_value(
        self,
        value: "dict[str, Any] | None",
        dialect: "Dialect",
    ) -> "BaseModel | None":
        # `parse_obj_as` is deprecated as of pydantic V2.
        # We're assuming that the value will be a dictionary here.
        return self.pydantic_type(**value) if value else None


# --------------------------------------------------------------------------------------
# Configure SQLAlchemy engine, session and declarative base (once per application)
# --------------------------------------------------------------------------------------
engine = sa.create_engine("sqlite:///:memory:")
Session = sessionmaker(bind=engine, expire_on_commit=False)
Base = declarative_base()


# --------------------------------------------------------------------------------------
# Define your Pydantic and SQLAlchemy models (as many as needed)
# --------------------------------------------------------------------------------------
class UserSettings(BaseModel):
    notify_at: datetime.datetime = Field(default_factory=datetime.datetime.now)


@final
class User(Base):
    __tablename__ = "users"

    # Using Annotated Declarative Table.
    # docs.sqlalchemy.org/en/20/orm/declarative_tables.html#using-annotated-declarative-table-type-annotated-forms-for-mapped-column
    id: Mapped[int] = mapped_column(primary_key=True)
    name: Mapped[str] = mapped_column(doc="User name", comment="User name")
    settings: Mapped[Optional[UserSettings]] = mapped_column(
        PydanticType(UserSettings), nullable=True
    )


# --------------------------------------------------------------------------------------
# Create tables (once per application)
# --------------------------------------------------------------------------------------
Base.metadata.create_all(engine)

# --------------------------------------------------------------------------------------
# Usage example (we use 2.0 querying style with selects)
# Ref: https://docs.sqlalchemy.org/en/20/orm/session_basics.html
# --------------------------------------------------------------------------------------
session = Session()
user = User(name="user", settings=UserSettings())
session.add(user)
session.commit()
same_user = session.execute(sa.select(User)).scalars().first()
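As a quick sanity check of the round trip, a sketch assuming the snippet above has just run:

# The JSON column comes back as a UserSettings instance, rebuilt by PydanticType.
assert same_user is not None
assert isinstance(same_user.settings, UserSettings)
print(same_user.settings.notify_at)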
Author: Thank you very much for the clarification! :)
Great snippet, thank you.
Some suggestions to be a bit more idiomatic and improve typing DX:
- use `from __future__ import annotations` to avoid quoted typing
- return `self.pydantic_type.model_construct(**value) if value else None` in `process_result_value` if you don't want to revalidate on load, or `return self.pydantic_type.model_validate(value) if value else None` if you do want revalidation on load (a quick sketch of the difference follows this list)
- use `MappedAsDataclass`
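A quick sketch of that revalidation trade-off, using a throwaway model that is not part of the gist: `model_validate` checks and coerces the loaded dict, while `model_construct` skips validation entirely and trusts whatever was stored.

from pydantic import BaseModel, ValidationError


class Example(BaseModel):  # hypothetical model, for illustration only
    count: int


row = {"count": "3"}  # the kind of dict a JSON column might hand back

validated = Example.model_validate(row)      # coerces "3" -> 3; raises on bad data
unchecked = Example.model_construct(**row)   # no validation; count stays the str "3"

print(type(validated.count))  # <class 'int'>
print(type(unchecked.count))  # <class 'str'>

try:
    Example.model_validate({"count": "not a number"})
except ValidationError:
    print("model_validate rejects invalid data")

The full improved version applying these suggestions: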
from __future__ import annotations

import datetime
from typing import TYPE_CHECKING, Any, final, override

import sqlalchemy as sa
from pydantic import BaseModel, Field, TypeAdapter
from sqlalchemy.dialects.postgresql import JSONB
from sqlalchemy.orm import DeclarativeBase, Mapped, MappedAsDataclass, mapped_column, sessionmaker

if TYPE_CHECKING:
    from sqlalchemy import Dialect
    from sqlalchemy.sql.type_api import TypeEngine


# --------------------------------------------------------------------------------------
# Define pydantic-alchemy specific types (once per application)
# --------------------------------------------------------------------------------------
@final
class PydanticType(sa.types.TypeDecorator[BaseModel]):
    """Pydantic type.

    SAVING:
    - Uses SQLAlchemy JSON type under the hood.
    - Accepts the pydantic model and converts it to a dict on save.
    - SQLAlchemy engine JSON-encodes the dict to a string.

    RETRIEVING:
    - Pulls the string from the database.
    - SQLAlchemy engine JSON-decodes the string to a dict.
    - Uses the dict to create a pydantic model.
    """

    # If you intend to use this class with one dialect only,
    # you could pick a type from that specific dialect as `impl`
    # for simplicity's sake.
    #
    # E.g., if you work with PostgreSQL, you can consider using
    # sqlalchemy.dialects.postgresql.JSONB instead of the
    # generic sa.types.JSON.
    # Ref: https://www.postgresql.org/docs/13/datatype-json.html
    #
    # Otherwise, you should implement the `load_dialect_impl`
    # method to handle different dialects. In this case, the
    # impl variable can reference TypeEngine as a placeholder.
    impl = sa.types.JSON

    def __init__(self, pydantic_type: type[BaseModel]) -> None:
        super().__init__()
        self.pydantic_type = pydantic_type

    @override
    def load_dialect_impl(self, dialect: Dialect) -> TypeEngine[JSONB | sa.JSON]:
        # You should implement this method to handle different dialects
        # if you intend to use this class with more than one.
        # E.g., use JSONB for PostgreSQL and the generic JSON type for
        # other databases.
        if dialect.name == "postgresql":
            return dialect.type_descriptor(JSONB())
        else:
            return dialect.type_descriptor(sa.JSON())

    @override
    def process_bind_param(
        self,
        value: BaseModel | None,
        dialect: Dialect,
    ) -> dict[str, Any] | None:
        if value is None:
            return None
        if not isinstance(value, BaseModel):  # dynamic typing.
            raise TypeError(f'The value "{value!r}" is not a pydantic model')
        # Method .dict() is deprecated as of pydantic V2.
        #
        # Think before setting exclude_unset to True. It can reduce the size
        # of the dump, but unset values might mean something depending on your context.
        #
        # Setting mode to "json" means you won't need to define a custom JSON
        # serializer for the engine.
        return value.model_dump(mode="json")

    @override
    def process_result_value(
        self,
        value: dict[str, Any] | None,
        dialect: Dialect,
    ) -> BaseModel | None:
        # We're assuming that the value will be a dictionary here.
        validate_on_load = True
        if validate_on_load:
            return self.pydantic_type.model_validate(value) if value else None
        else:
            return self.pydantic_type.model_construct(**value) if value else None


# --------------------------------------------------------------------------------------
# Configure SQLAlchemy engine, session and declarative base (once per application)
# --------------------------------------------------------------------------------------
engine = sa.create_engine("sqlite:///:memory:")
Session = sessionmaker(bind=engine, expire_on_commit=False)


# --------------------------------------------------------------------------------------
# Define your Pydantic and SQLAlchemy models (as many as needed)
# --------------------------------------------------------------------------------------
class UserSettings(BaseModel):
    notify_at: datetime.datetime = Field(default_factory=datetime.datetime.now)


class Base(MappedAsDataclass, DeclarativeBase):
    """Subclasses will be converted to dataclasses, offering better type hints and IDE support.

    See: https://docs.sqlalchemy.org/en/20/orm/dataclasses.html
    """


@final
class User(Base):
    __tablename__ = "users"

    # Using Annotated Declarative Table.
    # docs.sqlalchemy.org/en/20/orm/declarative_tables.html#using-annotated-declarative-table-type-annotated-forms-for-mapped-column
    id: Mapped[int] = mapped_column(init=False, primary_key=True)
    name: Mapped[str] = mapped_column(doc="User name", comment="User name")
    settings: Mapped[UserSettings] = mapped_column(PydanticType(UserSettings))


type_adapter = TypeAdapter(User)

# --------------------------------------------------------------------------------------
# Create tables (once per application)
# --------------------------------------------------------------------------------------
Base.metadata.create_all(engine)

# --------------------------------------------------------------------------------------
# Usage example (we use 2.0 querying style with selects)
# Ref: https://docs.sqlalchemy.org/en/20/orm/session_basics.html
# --------------------------------------------------------------------------------------
session = Session()
user = User(name="user", settings=UserSettings())
session.add(user)
session.commit()
same_user = session.execute(sa.select(User)).scalars().first()
if same_user:
    print(type_adapter.dump_json(same_user, indent=2).decode("utf-8"))
No, you aren't misinterpreting.
Method `load_dialect_impl` is useful only if you intend to use the class with more than one dialect. If you'll be using it with only one dialect, you could pick a type from that specific dialect as the value of `impl` for simplicity's sake.
Anyway, `impl` is a required attribute, so it should always be defined. If you're defining the `load_dialect_impl` method, "the impl variable can reference TypeEngine as a placeholder", as stated by the docs.
I'll edit the code to improve clarity.
Thanks for the feedback!
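To illustrate the single-dialect case described above, a minimal sketch (the `PostgresPydanticType` name and the trimmed-down hooks are illustrative, not part of the gist): with only PostgreSQL in play, `impl` can point directly at `JSONB` and `load_dialect_impl` can be omitted.

import sqlalchemy as sa
from pydantic import BaseModel
from sqlalchemy.dialects.postgresql import JSONB


class PostgresPydanticType(sa.types.TypeDecorator[BaseModel]):
    """PostgreSQL-only variant: the dialect-specific type is used directly as impl."""

    impl = JSONB

    def __init__(self, pydantic_type: type[BaseModel]) -> None:
        super().__init__()
        self.pydantic_type = pydantic_type

    def process_bind_param(self, value, dialect):
        # Dump the pydantic model to a JSON-compatible dict for the JSONB column.
        return value.model_dump(mode="json") if value is not None else None

    def process_result_value(self, value, dialect):
        # Rebuild (and revalidate) the pydantic model from the stored dict.
        return self.pydantic_type.model_validate(value) if value else None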