lsst-felis 26.2024.900-py3-none-any.whl → 29.2025.4500-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (39)
  1. felis/__init__.py +10 -24
  2. felis/cli.py +437 -341
  3. felis/config/tap_schema/columns.csv +33 -0
  4. felis/config/tap_schema/key_columns.csv +8 -0
  5. felis/config/tap_schema/keys.csv +8 -0
  6. felis/config/tap_schema/schemas.csv +2 -0
  7. felis/config/tap_schema/tables.csv +6 -0
  8. felis/config/tap_schema/tap_schema_std.yaml +273 -0
  9. felis/datamodel.py +1386 -193
  10. felis/db/dialects.py +116 -0
  11. felis/db/schema.py +62 -0
  12. felis/db/sqltypes.py +275 -48
  13. felis/db/utils.py +409 -0
  14. felis/db/variants.py +159 -0
  15. felis/diff.py +234 -0
  16. felis/metadata.py +385 -0
  17. felis/tap_schema.py +767 -0
  18. felis/tests/__init__.py +0 -0
  19. felis/tests/postgresql.py +134 -0
  20. felis/tests/run_cli.py +79 -0
  21. felis/types.py +57 -9
  22. lsst_felis-29.2025.4500.dist-info/METADATA +38 -0
  23. lsst_felis-29.2025.4500.dist-info/RECORD +31 -0
  24. {lsst_felis-26.2024.900.dist-info → lsst_felis-29.2025.4500.dist-info}/WHEEL +1 -1
  25. {lsst_felis-26.2024.900.dist-info → lsst_felis-29.2025.4500.dist-info/licenses}/COPYRIGHT +1 -1
  26. felis/check.py +0 -381
  27. felis/simple.py +0 -424
  28. felis/sql.py +0 -275
  29. felis/tap.py +0 -433
  30. felis/utils.py +0 -100
  31. felis/validation.py +0 -103
  32. felis/version.py +0 -2
  33. felis/visitor.py +0 -180
  34. lsst_felis-26.2024.900.dist-info/METADATA +0 -28
  35. lsst_felis-26.2024.900.dist-info/RECORD +0 -23
  36. {lsst_felis-26.2024.900.dist-info → lsst_felis-29.2025.4500.dist-info}/entry_points.txt +0 -0
  37. {lsst_felis-26.2024.900.dist-info → lsst_felis-29.2025.4500.dist-info/licenses}/LICENSE +0 -0
  38. {lsst_felis-26.2024.900.dist-info → lsst_felis-29.2025.4500.dist-info}/top_level.txt +0 -0
  39. {lsst_felis-26.2024.900.dist-info → lsst_felis-29.2025.4500.dist-info}/zip-safe +0 -0
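The headline change visible in the datamodel.py diff below is that schema-wide validation options moved from class-level flags (the removed Schema.require_description) into the Pydantic validation context, which the new validators read via ValidationInfo.context. A minimal sketch of driving the new entry point, assuming a local schema file (the file name is hypothetical; the context keys are the ones the validators in the diff actually read):

    import yaml
    from felis.datamodel import Schema

    # Load the YAML schema document (file name is hypothetical).
    with open("my_schema.yaml") as f:
        data = yaml.safe_load(f)

    # Context keys such as "check_description" and "id_generation" are read
    # by the model validators through ValidationInfo.context.
    schema = Schema.model_validate(
        data, context={"check_description": True, "id_generation": True}
    )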
felis/datamodel.py CHANGED
@@ -1,3 +1,5 @@
+ """Define Pydantic data models for Felis."""
+
  # This file is part of felis.
  #
  # Developed for the LSST Data Management System.
@@ -21,24 +23,43 @@
 
  from __future__ import annotations
 
+ import json
  import logging
- from collections.abc import Mapping, Sequence
- from enum import Enum
- from typing import Annotated, Any, Literal, TypeAlias
+ import sys
+ from collections.abc import Sequence
+ from enum import StrEnum, auto
+ from typing import IO, Annotated, Any, Generic, Literal, TypeAlias, TypeVar
 
+ import yaml
  from astropy import units as units  # type: ignore
  from astropy.io.votable import ucd  # type: ignore
- from pydantic import BaseModel, ConfigDict, Field, field_validator, model_validator
+ from lsst.resources import ResourcePath, ResourcePathExpression
+ from pydantic import (
+     BaseModel,
+     ConfigDict,
+     Field,
+     PrivateAttr,
+     ValidationError,
+     ValidationInfo,
+     field_serializer,
+     field_validator,
+     model_validator,
+ )
+ from pydantic_core import InitErrorDetails
+
+ from .db.dialects import get_supported_dialects
+ from .db.sqltypes import get_type_func
+ from .db.utils import string_to_typeengine
+ from .types import Boolean, Byte, Char, Double, FelisType, Float, Int, Long, Short, String, Text, Unicode
 
  logger = logging.getLogger(__name__)
- # logger.setLevel(logging.DEBUG)
 
  __all__ = (
      "BaseObject",
-     "Column",
      "CheckConstraint",
+     "Column",
      "Constraint",
-     "DescriptionStr",
+     "DataType",
      "ForeignKeyConstraint",
      "Index",
      "Schema",
@@ -50,9 +71,8 @@ __all__ = (
  CONFIG = ConfigDict(
      populate_by_name=True,  # Populate attributes by name.
      extra="forbid",  # Do not allow extra fields.
-     use_enum_values=True,  # Use enum values instead of names.
-     validate_assignment=True,  # Validate assignments after model is created.
      str_strip_whitespace=True,  # Strip whitespace from string fields.
+     use_enum_values=False,  # Do not use enum values during serialization.
  )
  """Pydantic model configuration as described in:
  https://docs.pydantic.dev/2.0/api/config/#pydantic.config.ConfigDict
@@ -62,132 +82,220 @@ DESCR_MIN_LENGTH = 3
  """Minimum length for a description field."""
 
  DescriptionStr: TypeAlias = Annotated[str, Field(min_length=DESCR_MIN_LENGTH)]
- """Define a type for a description string, which must be three or more
- characters long. Stripping of whitespace is done globally on all str fields."""
+ """Type for a description, which must be three or more characters long."""
 
 
  class BaseObject(BaseModel):
-     """Base class for all Felis objects."""
+     """Base model.
+
+     All classes representing objects in the Felis data model should inherit
+     from this class.
+     """
 
      model_config = CONFIG
      """Pydantic model configuration."""
 
      name: str
-     """The name of the database object.
-
-     All Felis database objects must have a name.
-     """
+     """Name of the database object."""
 
      id: str = Field(alias="@id")
-     """The unique identifier of the database object.
-
-     All Felis database objects must have a unique identifier.
-     """
+     """Unique identifier of the database object."""
 
      description: DescriptionStr | None = None
-     """A description of the database object.
+     """Description of the database object."""
 
-     By default, the description is optional but will be required if
-     `BaseObject.Config.require_description` is set to `True` by the user.
-     """
-
-     @model_validator(mode="before")
-     @classmethod
-     def check_description(cls, values: dict[str, Any]) -> dict[str, Any]:
-         """Check that the description is present if required."""
-         if Schema.is_description_required():
-             if "description" not in values or not values["description"]:
-                 raise ValueError("Description is required and must be non-empty")
-             if len(values["description"].strip()) < DESCR_MIN_LENGTH:
-                 raise ValueError(f"Description must be at least {DESCR_MIN_LENGTH} characters long")
-         return values
+     votable_utype: str | None = Field(None, alias="votable:utype")
+     """VOTable utype (usage-specific or unique type) of the object."""
 
+     @model_validator(mode="after")
+     def check_description(self, info: ValidationInfo) -> BaseObject:
+         """Check that the description is present if required.
+
+         Parameters
+         ----------
+         info
+             Validation context used to determine if the check is enabled.
+
+         Returns
+         -------
+         `BaseObject`
+             The object being validated.
+         """
+         context = info.context
+         if not context or not context.get("check_description", False):
+             return self
+         if self.description is None or self.description == "":
+             raise ValueError("Description is required and must be non-empty")
+         if len(self.description) < DESCR_MIN_LENGTH:
+             raise ValueError(f"Description must be at least {DESCR_MIN_LENGTH} characters long")
+         return self
 
- class DataType(Enum):
-     """`Enum` representing the data types supported by Felis."""
 
-     BOOLEAN = "boolean"
-     BYTE = "byte"
-     SHORT = "short"
-     INT = "int"
-     LONG = "long"
-     FLOAT = "float"
-     DOUBLE = "double"
-     CHAR = "char"
-     STRING = "string"
-     UNICODE = "unicode"
-     TEXT = "text"
-     BINARY = "binary"
-     TIMESTAMP = "timestamp"
+ class DataType(StrEnum):
+     """``Enum`` representing the data types supported by Felis."""
+
+     boolean = auto()
+     byte = auto()
+     short = auto()
+     int = auto()
+     long = auto()
+     float = auto()
+     double = auto()
+     char = auto()
+     string = auto()
+     unicode = auto()
+     text = auto()
+     binary = auto()
+     timestamp = auto()
+
+
+ def validate_ivoa_ucd(ivoa_ucd: str) -> str:
+     """Validate IVOA UCD values.
+
+     Parameters
+     ----------
+     ivoa_ucd
+         IVOA UCD value to check.
+
+     Returns
+     -------
+     `str`
+         The IVOA UCD value if it is valid.
+
+     Raises
+     ------
+     ValueError
+         If the IVOA UCD value is invalid.
+     """
+     if ivoa_ucd is not None:
+         try:
+             ucd.parse_ucd(ivoa_ucd, check_controlled_vocabulary=True, has_colon=";" in ivoa_ucd)
+         except ValueError as e:
+             raise ValueError(f"Invalid IVOA UCD: {e}")
+     return ivoa_ucd
 
 
  class Column(BaseObject):
-     """A column in a table."""
+     """Column model."""
 
      datatype: DataType
-     """The datatype of the column."""
+     """Datatype of the column."""
 
-     length: int | None = None
-     """The length of the column."""
+     length: int | None = Field(None, gt=0)
+     """Length of the column."""
+
+     precision: int | None = Field(None, ge=0)
+     """The numerical precision of the column.
+
+     For timestamps, this is the number of fractional digits retained in the
+     seconds field.
+     """
 
      nullable: bool = True
-     """Whether the column can be `NULL`."""
+     """Whether the column can be ``NULL``."""
 
-     value: Any = None
-     """The default value of the column."""
+     value: str | int | float | bool | None = None
+     """Default value of the column."""
 
      autoincrement: bool | None = None
      """Whether the column is autoincremented."""
 
-     mysql_datatype: str | None = Field(None, alias="mysql:datatype")
-     """The MySQL datatype of the column."""
-
      ivoa_ucd: str | None = Field(None, alias="ivoa:ucd")
-     """The IVOA UCD of the column."""
+     """IVOA UCD of the column."""
 
      fits_tunit: str | None = Field(None, alias="fits:tunit")
-     """The FITS TUNIT of the column."""
+     """FITS TUNIT of the column."""
 
      ivoa_unit: str | None = Field(None, alias="ivoa:unit")
-     """The IVOA unit of the column."""
+     """IVOA unit of the column."""
 
      tap_column_index: int | None = Field(None, alias="tap:column_index")
-     """The TAP_SCHEMA column index of the column."""
+     """TAP_SCHEMA column index of the column."""
 
      tap_principal: int | None = Field(0, alias="tap:principal", ge=0, le=1)
-     """Whether this is a TAP_SCHEMA principal column; can be either 0 or 1.
-     """
+     """Whether this is a TAP_SCHEMA principal column."""
 
-     votable_arraysize: int | Literal["*"] | None = Field(None, alias="votable:arraysize")
-     """The VOTable arraysize of the column."""
+     votable_arraysize: int | str | None = Field(None, alias="votable:arraysize")
+     """VOTable arraysize of the column."""
 
      tap_std: int | None = Field(0, alias="tap:std", ge=0, le=1)
      """TAP_SCHEMA indication that this column is defined by an IVOA standard.
      """
 
-     votable_utype: str | None = Field(None, alias="votable:utype")
-     """The VOTable utype (usage-specific or unique type) of the column."""
-
      votable_xtype: str | None = Field(None, alias="votable:xtype")
-     """The VOTable xtype (extended type) of the column."""
+     """VOTable xtype (extended type) of the column."""
+
+     votable_datatype: str | None = Field(None, alias="votable:datatype")
+     """VOTable datatype of the column."""
+
+     mysql_datatype: str | None = Field(None, alias="mysql:datatype")
+     """MySQL datatype override on the column."""
+
+     postgresql_datatype: str | None = Field(None, alias="postgresql:datatype")
+     """PostgreSQL datatype override on the column."""
+
+     @model_validator(mode="after")
+     def check_value(self) -> Column:
+         """Check that the default value is valid.
+
+         Returns
+         -------
+         `Column`
+             The column being validated.
+         """
+         if (value := self.value) is not None:
+             if value is not None and self.autoincrement is True:
+                 raise ValueError("Column cannot have both a default value and be autoincremented")
+             felis_type = FelisType.felis_type(self.datatype)
+             if felis_type.is_numeric:
+                 if felis_type in (Byte, Short, Int, Long) and not isinstance(value, int):
+                     raise ValueError("Default value must be an int for integer type columns")
+                 elif felis_type in (Float, Double) and not isinstance(value, float):
+                     raise ValueError("Default value must be a decimal number for float and double columns")
+             elif felis_type in (String, Char, Unicode, Text):
+                 if not isinstance(value, str):
+                     raise ValueError("Default value must be a string for string columns")
+                 if not len(value):
+                     raise ValueError("Default value must be a non-empty string for string columns")
+             elif felis_type is Boolean and not isinstance(value, bool):
+                 raise ValueError("Default value must be a boolean for boolean columns")
+         return self
 
      @field_validator("ivoa_ucd")
      @classmethod
      def check_ivoa_ucd(cls, ivoa_ucd: str) -> str:
-         """Check that IVOA UCD values are valid."""
-         if ivoa_ucd is not None:
-             try:
-                 ucd.parse_ucd(ivoa_ucd, check_controlled_vocabulary=True, has_colon=";" in ivoa_ucd)
-             except ValueError as e:
-                 raise ValueError(f"Invalid IVOA UCD: {e}")
-         return ivoa_ucd
+         """Check that IVOA UCD values are valid.
 
-     @model_validator(mode="before")
-     @classmethod
-     def check_units(cls, values: dict[str, Any]) -> dict[str, Any]:
-         """Check that units are valid."""
-         fits_unit = values.get("fits:tunit")
-         ivoa_unit = values.get("ivoa:unit")
+         Parameters
+         ----------
+         ivoa_ucd
+             IVOA UCD value to check.
+
+         Returns
+         -------
+         `str`
+             The IVOA UCD value if it is valid.
+         """
+         return validate_ivoa_ucd(ivoa_ucd)
+
+     @model_validator(mode="after")
+     def check_units(self) -> Column:
+         """Check that the ``fits:tunit`` or ``ivoa:unit`` field has valid
+         units according to astropy. Only one may be provided.
+
+         Returns
+         -------
+         `Column`
+             The column being validated.
+
+         Raises
+         ------
+         ValueError
+             Raised if both FITS and IVOA units are provided, or if the unit is
+             invalid.
+         """
+         fits_unit = self.fits_tunit
+         ivoa_unit = self.ivoa_unit
 
          if fits_unit and ivoa_unit:
              raise ValueError("Column cannot have both FITS and IVOA units")
@@ -199,55 +307,420 @@ class Column(BaseObject):
              except ValueError as e:
                  raise ValueError(f"Invalid unit: {e}")
 
+         return self
+
+     @model_validator(mode="before")
+     @classmethod
+     def check_length(cls, values: dict[str, Any]) -> dict[str, Any]:
+         """Check that a valid length is provided for sized types.
+
+         Parameters
+         ----------
+         values
+             Values of the column.
+
+         Returns
+         -------
+         `dict` [ `str`, `Any` ]
+             The values of the column.
+
+         Raises
+         ------
+         ValueError
+             Raised if a length is not provided for a sized type.
+         """
+         datatype = values.get("datatype")
+         if datatype is None:
+             # Skip this validation if datatype is not provided
+             return values
+         length = values.get("length")
+         felis_type = FelisType.felis_type(datatype)
+         if felis_type.is_sized and length is None:
+             raise ValueError(
+                 f"Length must be provided for type '{datatype}'"
+                 + (f" in column '{values['@id']}'" if "@id" in values else "")
+             )
+         elif not felis_type.is_sized and length is not None:
+             logger.warning(
+                 f"The datatype '{datatype}' does not support a specified length"
+                 + (f" in column '{values['@id']}'" if "@id" in values else "")
+             )
+         return values
+
+     @model_validator(mode="after")
+     def check_redundant_datatypes(self, info: ValidationInfo) -> Column:
+         """Check for redundant datatypes on columns.
+
+         Parameters
+         ----------
+         info
+             Validation context used to determine if the check is enabled.
+
+         Returns
+         -------
+         `Column`
+             The column being validated.
+
+         Raises
+         ------
+         ValueError
+             Raised if a datatype override is redundant.
+         """
+         context = info.context
+         if not context or not context.get("check_redundant_datatypes", False):
+             return self
+         if all(
+             getattr(self, f"{dialect}:datatype", None) is not None
+             for dialect in get_supported_dialects().keys()
+         ):
+             return self
+
+         datatype = self.datatype
+         length: int | None = self.length or None
+
+         datatype_func = get_type_func(datatype)
+         felis_type = FelisType.felis_type(datatype)
+         if felis_type.is_sized:
+             datatype_obj = datatype_func(length)
+         else:
+             datatype_obj = datatype_func()
+
+         for dialect_name, dialect in get_supported_dialects().items():
+             db_annotation = f"{dialect_name}_datatype"
+             if datatype_string := self.model_dump().get(db_annotation):
+                 db_datatype_obj = string_to_typeengine(datatype_string, dialect, length)
+                 if datatype_obj.compile(dialect) == db_datatype_obj.compile(dialect):
+                     raise ValueError(
+                         "'{}: {}' is a redundant override of 'datatype: {}' in column '{}'{}".format(
+                             db_annotation,
+                             datatype_string,
+                             self.datatype,
+                             self.id,
+                             "" if length is None else f" with length {length}",
+                         )
+                     )
+                 else:
+                     logger.debug(
+                         f"Type override of 'datatype: {self.datatype}' "
+                         f"with '{db_annotation}: {datatype_string}' in column '{self.id}' "
+                         f"compiled to '{datatype_obj.compile(dialect)}' and "
+                         f"'{db_datatype_obj.compile(dialect)}'"
+                     )
+         return self
+
+     @model_validator(mode="after")
+     def check_precision(self) -> Column:
+         """Check that precision is only valid for timestamp columns.
+
+         Returns
+         -------
+         `Column`
+             The column being validated.
+         """
+         if self.precision is not None and self.datatype != "timestamp":
+             raise ValueError("Precision is only valid for timestamp columns")
+         return self
+
+     @model_validator(mode="before")
+     @classmethod
+     def check_votable_arraysize(cls, values: dict[str, Any], info: ValidationInfo) -> dict[str, Any]:
+         """Set the default value for the ``votable_arraysize`` field, which
+         corresponds to ``arraysize`` in the IVOA VOTable standard.
+
+         Parameters
+         ----------
+         values
+             Values of the column.
+         info
+             Validation context used to determine if the check is enabled.
+
+         Returns
+         -------
+         `dict` [ `str`, `Any` ]
+             The values of the column.
+
+         Notes
+         -----
+         Following the IVOA VOTable standard, an ``arraysize`` of 1 should not
+         be used.
+         """
+         if values.get("name", None) is None or values.get("datatype", None) is None:
+             # Skip bad column data that will not validate
+             return values
+         context = info.context if info.context else {}
+         arraysize = values.get("votable:arraysize", None)
+         if arraysize is None:
+             length = values.get("length", None)
+             datatype = values.get("datatype")
+             if length is not None and length > 1:
+                 # Following the IVOA standard, arraysize of 1 is disallowed
+                 if datatype == "char":
+                     arraysize = str(length)
+                 elif datatype in ("string", "unicode", "binary"):
+                     if context.get("force_unbounded_arraysize", False):
+                         arraysize = "*"
+                         logger.debug(
+                             f"Forced VOTable's 'arraysize' to '*' on column '{values['name']}' with datatype "
+                             + f"'{values['datatype']}' and length '{length}'"
+                         )
+                     else:
+                         arraysize = f"{length}*"
+             elif datatype in ("timestamp", "text"):
+                 arraysize = "*"
+             if arraysize is not None:
+                 values["votable:arraysize"] = arraysize
+                 logger.debug(
+                     f"Set default 'votable:arraysize' to '{arraysize}' on column '{values['name']}'"
+                     + f" with datatype '{values['datatype']}' and length '{values.get('length', None)}'"
+                 )
+         else:
+             logger.debug(f"Using existing 'votable:arraysize' of '{arraysize}' on column '{values['name']}'")
+             if isinstance(values["votable:arraysize"], int):
+                 logger.warning(
+                     f"Usage of an integer value for 'votable:arraysize' in column '{values['name']}' is "
+                     + "deprecated"
+                 )
+                 values["votable:arraysize"] = str(arraysize)
          return values
 
+     @field_serializer("datatype")
+     def serialize_datatype(self, value: DataType) -> str:
+         """Convert `DataType` to string when serializing to JSON/YAML.
+
+         Parameters
+         ----------
+         value
+             The `DataType` value to serialize.
+
+         Returns
+         -------
+         `str`
+             The serialized `DataType` value.
+         """
+         return str(value)
+
+     @field_validator("datatype", mode="before")
+     @classmethod
+     def deserialize_datatype(cls, value: str) -> DataType:
+         """Convert string back into `DataType` when loading from JSON/YAML.
+
+         Parameters
+         ----------
+         value
+             The string value to deserialize.
+
+         Returns
+         -------
+         `DataType`
+             The deserialized `DataType` value.
+         """
+         return DataType(value)
+
+     @model_validator(mode="after")
+     def check_votable_xtype(self) -> Column:
+         """Set the default value for the ``votable_xtype`` field, which
+         corresponds to an Extended Datatype or ``xtype`` in the IVOA VOTable
+         standard.
+
+         Returns
+         -------
+         `Column`
+             The column being validated.
+
+         Notes
+         -----
+         This is currently only set automatically for the Felis ``timestamp``
+         datatype.
+         """
+         if self.datatype == DataType.timestamp and self.votable_xtype is None:
+             self.votable_xtype = "timestamp"
+         return self
+
 
  class Constraint(BaseObject):
-     """A database table constraint."""
+     """Table constraint model."""
 
      deferrable: bool = False
-     """If `True` then this constraint will be declared as deferrable."""
+     """Whether this constraint will be declared as deferrable."""
 
-     initially: str | None = None
-     """Value for ``INITIALLY`` clause, only used if ``deferrable`` is True."""
+     initially: Literal["IMMEDIATE", "DEFERRED"] | None = None
+     """Value for ``INITIALLY`` clause; only used if `deferrable` is
+     `True`."""
 
-     annotations: Mapping[str, Any] = Field(default_factory=dict)
-     """Additional annotations for this constraint."""
-
-     type: str | None = Field(None, alias="@type")
-     """The type of the constraint."""
+     @model_validator(mode="after")
+     def check_deferrable(self) -> Constraint:
+         """Check that the ``INITIALLY`` clause is only used if `deferrable` is
+         `True`.
+
+         Returns
+         -------
+         `Constraint`
+             The constraint being validated.
+         """
+         if self.initially is not None and not self.deferrable:
+             raise ValueError("INITIALLY clause can only be used if deferrable is True")
+         return self
 
 
  class CheckConstraint(Constraint):
-     """A check constraint on a table."""
+     """Table check constraint model."""
+
+     type: Literal["Check"] = Field("Check", alias="@type")
+     """Type of the constraint."""
 
      expression: str
-     """The expression for the check constraint."""
+     """Expression for the check constraint."""
+
+     @field_serializer("type")
+     def serialize_type(self, value: str) -> str:
+         """Ensure '@type' is included in serialized output.
+
+         Parameters
+         ----------
+         value
+             The value to serialize.
+
+         Returns
+         -------
+         `str`
+             The serialized value.
+         """
+         return value
 
 
  class UniqueConstraint(Constraint):
-     """A unique constraint on a table."""
+     """Table unique constraint model."""
+
+     type: Literal["Unique"] = Field("Unique", alias="@type")
+     """Type of the constraint."""
 
      columns: list[str]
-     """The columns in the unique constraint."""
+     """Columns in the unique constraint."""
+
+     @field_serializer("type")
+     def serialize_type(self, value: str) -> str:
+         """Ensure '@type' is included in serialized output.
+
+         Parameters
+         ----------
+         value
+             The value to serialize.
+
+         Returns
+         -------
+         `str`
+             The serialized value.
+         """
+         return value
+
+
+ class ForeignKeyConstraint(Constraint):
+     """Table foreign key constraint model.
+
+     This constraint is used to define a foreign key relationship between two
+     tables in the schema. There must be at least one column in the
+     `columns` list, and at least one column in the `referenced_columns` list
+     or a validation error will be raised.
+
+     Notes
+     -----
+     These relationships will be reflected in the TAP_SCHEMA ``keys`` and
+     ``key_columns`` data.
+     """
+
+     type: Literal["ForeignKey"] = Field("ForeignKey", alias="@type")
+     """Type of the constraint."""
+
+     columns: list[str] = Field(min_length=1)
+     """The columns comprising the foreign key."""
+
+     referenced_columns: list[str] = Field(alias="referencedColumns", min_length=1)
+     """The columns referenced by the foreign key."""
+
+     on_delete: Literal["CASCADE", "SET NULL", "SET DEFAULT", "RESTRICT", "NO ACTION"] | None = None
+     """Action to take when the referenced row is deleted."""
+
+     on_update: Literal["CASCADE", "SET NULL", "SET DEFAULT", "RESTRICT", "NO ACTION"] | None = None
+     """Action to take when the referenced row is updated."""
+
+     @field_serializer("type")
+     def serialize_type(self, value: str) -> str:
+         """Ensure '@type' is included in serialized output.
+
+         Parameters
+         ----------
+         value
+             The value to serialize.
+
+         Returns
+         -------
+         `str`
+             The serialized value.
+         """
+         return value
+
+     @model_validator(mode="after")
+     def check_column_lengths(self) -> ForeignKeyConstraint:
+         """Check that the `columns` and `referenced_columns` lists have the
+         same length.
+
+         Returns
+         -------
+         `ForeignKeyConstraint`
+             The foreign key constraint being validated.
+
+         Raises
+         ------
+         ValueError
+             Raised if the `columns` and `referenced_columns` lists do not have
+             the same length.
+         """
+         if len(self.columns) != len(self.referenced_columns):
+             raise ValueError(
+                 "Columns and referencedColumns must have the same length for a ForeignKey constraint"
+             )
+         return self
+
+
+ _ConstraintType = Annotated[
+     CheckConstraint | ForeignKeyConstraint | UniqueConstraint, Field(discriminator="type")
+ ]
+ """Type alias for a constraint type."""
 
 
  class Index(BaseObject):
-     """A database table index.
+     """Table index model.
 
      An index can be defined on either columns or expressions, but not both.
      """
 
      columns: list[str] | None = None
-     """The columns in the index."""
+     """Columns in the index."""
 
      expressions: list[str] | None = None
-     """The expressions in the index."""
+     """Expressions in the index."""
 
      @model_validator(mode="before")
      @classmethod
      def check_columns_or_expressions(cls, values: dict[str, Any]) -> dict[str, Any]:
-         """Check that columns or expressions are specified, but not both."""
+         """Check that columns or expressions are specified, but not both.
+
+         Parameters
+         ----------
+         values
+             Values of the index.
+
+         Returns
+         -------
+         `dict` [ `str`, `Any` ]
+             The values of the index.
+
+         Raises
+         ------
+         ValueError
+             Raised if both columns and expressions are specified, or if neither
+             are specified.
+         """
          if "columns" in values and "expressions" in values:
              raise ValueError("Defining columns and expressions is not valid")
          elif "columns" not in values and "expressions" not in values:
@@ -255,80 +728,234 @@ class Index(BaseObject):
          return values
 
 
- class ForeignKeyConstraint(Constraint):
-     """A foreign key constraint on a table.
+ ColumnRef: TypeAlias = str
+ """Type alias for a column reference."""
 
-     These will be reflected in the TAP_SCHEMA keys and key_columns data.
-     """
 
-     columns: list[str]
-     """The columns comprising the foreign key."""
+ class ColumnGroup(BaseObject):
+     """Column group model."""
 
-     referenced_columns: list[str] = Field(alias="referencedColumns")
-     """The columns referenced by the foreign key."""
+     columns: list[ColumnRef | Column] = Field(..., min_length=1)
+     """Columns in the group."""
 
+     ivoa_ucd: str | None = Field(None, alias="ivoa:ucd")
+     """IVOA UCD of the column."""
 
- class Table(BaseObject):
-     """A database table."""
+     table: Table | None = Field(None, exclude=True)
+     """Reference to the parent table."""
 
-     columns: Sequence[Column]
-     """The columns in the table."""
+     @field_validator("ivoa_ucd")
+     @classmethod
+     def check_ivoa_ucd(cls, ivoa_ucd: str) -> str:
+         """Check that IVOA UCD values are valid.
 
-     constraints: list[Constraint] = Field(default_factory=list)
-     """The constraints on the table."""
+         Parameters
+         ----------
+         ivoa_ucd
+             IVOA UCD value to check.
 
-     indexes: list[Index] = Field(default_factory=list)
-     """The indexes on the table."""
+         Returns
+         -------
+         `str`
+             The IVOA UCD value if it is valid.
+         """
+         return validate_ivoa_ucd(ivoa_ucd)
+
+     @model_validator(mode="after")
+     def check_unique_columns(self) -> ColumnGroup:
+         """Check that the columns list contains unique items.
 
-     primaryKey: str | list[str] | None = None
-     """The primary key of the table."""
+         Returns
+         -------
+         `ColumnGroup`
+             The column group being validated.
+         """
+         column_ids = [col if isinstance(col, str) else col.id for col in self.columns]
+         if len(column_ids) != len(set(column_ids)):
+             raise ValueError("Columns in the group must be unique")
+         return self
 
-     tap_table_index: int | None = Field(None, alias="tap:table_index")
-     """The IVOA TAP_SCHEMA table index of the table."""
+     def _dereference_columns(self) -> None:
+         """Dereference ColumnRef to Column objects."""
+         if self.table is None:
+             raise ValueError("ColumnGroup must have a reference to its parent table")
+
+         dereferenced_columns: list[ColumnRef | Column] = []
+         for col in self.columns:
+             if isinstance(col, str):
+                 # Dereference ColumnRef to Column object
+                 try:
+                     col_obj = self.table._find_column_by_id(col)
+                 except KeyError as e:
+                     raise ValueError(f"Column '{col}' not found in table '{self.table.name}'") from e
+                 dereferenced_columns.append(col_obj)
+             else:
+                 dereferenced_columns.append(col)
+
+         self.columns = dereferenced_columns
+
+     @field_serializer("columns")
+     def serialize_columns(self, columns: list[ColumnRef | Column]) -> list[str]:
+         """Serialize columns as their IDs.
+
+         Parameters
+         ----------
+         columns
+             The columns to serialize.
+
+         Returns
+         -------
+         `list` [ `str` ]
+             The serialized column IDs.
+         """
+         return [col if isinstance(col, str) else col.id for col in columns]
 
-     mysql_engine: str | None = Field(None, alias="mysql:engine")
-     """The mysql engine to use for the table.
 
-     For now this is a freeform string but it could be constrained to a list of
-     known engines in the future.
-     """
+ class Table(BaseObject):
+     """Table model."""
+
+     primary_key: str | list[str] | None = Field(None, alias="primaryKey")
+     """Primary key of the table."""
+
+     tap_table_index: int | None = Field(None, alias="tap:table_index")
+     """IVOA TAP_SCHEMA table index of the table."""
+
+     mysql_engine: str | None = Field("MyISAM", alias="mysql:engine")
+     """MySQL engine to use for the table."""
 
      mysql_charset: str | None = Field(None, alias="mysql:charset")
-     """The mysql charset to use for the table.
+     """MySQL charset to use for the table."""
 
-     For now this is a freeform string but it could be constrained to a list of
-     known charsets in the future.
-     """
+     columns: Sequence[Column]
+     """Columns in the table."""
 
-     @model_validator(mode="before")
-     @classmethod
-     def create_constraints(cls, values: dict[str, Any]) -> dict[str, Any]:
-         """Create constraints from the ``constraints`` field."""
-         if "constraints" in values:
-             new_constraints: list[Constraint] = []
-             for item in values["constraints"]:
-                 if item["@type"] == "ForeignKey":
-                     new_constraints.append(ForeignKeyConstraint(**item))
-                 elif item["@type"] == "Unique":
-                     new_constraints.append(UniqueConstraint(**item))
-                 elif item["@type"] == "Check":
-                     new_constraints.append(CheckConstraint(**item))
-                 else:
-                     raise ValueError(f"Unknown constraint type: {item['@type']}")
-             values["constraints"] = new_constraints
-         return values
+     column_groups: list[ColumnGroup] = Field(default_factory=list, alias="columnGroups")
+     """Column groups in the table."""
+
+     constraints: list[_ConstraintType] = Field(default_factory=list)
+     """Constraints on the table."""
+
+     indexes: list[Index] = Field(default_factory=list)
+     """Indexes on the table."""
 
      @field_validator("columns", mode="after")
      @classmethod
      def check_unique_column_names(cls, columns: list[Column]) -> list[Column]:
-         """Check that column names are unique."""
+         """Check that column names are unique.
+
+         Parameters
+         ----------
+         columns
+             The columns to check.
+
+         Returns
+         -------
+         `list` [ `Column` ]
+             The columns if they are unique.
+
+         Raises
+         ------
+         ValueError
+             Raised if column names are not unique.
+         """
          if len(columns) != len(set(column.name for column in columns)):
              raise ValueError("Column names must be unique")
          return columns
 
+     @model_validator(mode="after")
+     def check_tap_table_index(self, info: ValidationInfo) -> Table:
+         """Check that the table has a TAP table index.
+
+         Parameters
+         ----------
+         info
+             Validation context used to determine if the check is enabled.
+
+         Returns
+         -------
+         `Table`
+             The table being validated.
+
+         Raises
+         ------
+         ValueError
+             Raised If the table is missing a TAP table index.
+         """
+         context = info.context
+         if not context or not context.get("check_tap_table_indexes", False):
+             return self
+         if self.tap_table_index is None:
+             raise ValueError("Table is missing a TAP table index")
+         return self
+
+     @model_validator(mode="after")
+     def check_tap_principal(self, info: ValidationInfo) -> Table:
+         """Check that at least one column is flagged as 'principal' for TAP
+         purposes.
+
+         Parameters
+         ----------
+         info
+             Validation context used to determine if the check is enabled.
+
+         Returns
+         -------
+         `Table`
+             The table being validated.
+
+         Raises
+         ------
+         ValueError
+             Raised if the table is missing a column flagged as 'principal'.
+         """
+         context = info.context
+         if not context or not context.get("check_tap_principal", False):
+             return self
+         for col in self.columns:
+             if col.tap_principal == 1:
+                 return self
+         raise ValueError(f"Table '{self.name}' is missing at least one column designated as 'tap:principal'")
+
+     def _find_column_by_id(self, id: str) -> Column:
+         """Find a column by ID.
+
+         Parameters
+         ----------
+         id
+             The ID of the column to find.
+
+         Returns
+         -------
+         `Column`
+             The column with the given ID.
+
+         Raises
+         ------
+         ValueError
+             Raised if the column is not found.
+         """
+         for column in self.columns:
+             if column.id == id:
+                 return column
+         raise KeyError(f"Column '{id}' not found in table '{self.name}'")
+
+     @model_validator(mode="after")
+     def dereference_column_groups(self: Table) -> Table:
+         """Dereference columns in column groups.
+
+         Returns
+         -------
+         `Table`
+             The table with dereferenced column groups.
+         """
+         for group in self.column_groups:
+             group.table = self
+             group._dereference_columns()
+         return self
+
 
  class SchemaVersion(BaseModel):
-     """The version of the schema."""
+     """Schema version model."""
 
      current: str
      """The current version of the schema."""
@@ -341,35 +968,49 @@ class SchemaVersion(BaseModel):
 
 
  class SchemaIdVisitor:
-     """Visitor to build a Schema object's map of IDs to objects.
+     """Visit a schema and build the map of IDs to objects.
 
+     Notes
+     -----
      Duplicates are added to a set when they are encountered, which can be
-     accessed via the `duplicates` attribute. The presence of duplicates will
+     accessed via the ``duplicates`` attribute. The presence of duplicates will
      not throw an error. Only the first object with a given ID will be added to
-     the map, but this should not matter, since a ValidationError will be thrown
-     by the `model_validator` method if any duplicates are found in the schema.
-
-     This class is intended for internal use only.
+     the map, but this should not matter, since a ``ValidationError`` will be
+     thrown by the ``model_validator`` method if any duplicates are found in the
+     schema.
      """
 
      def __init__(self) -> None:
          """Create a new SchemaVisitor."""
-         self.schema: "Schema" | None = None
+         self.schema: Schema | None = None
          self.duplicates: set[str] = set()
 
      def add(self, obj: BaseObject) -> None:
-         """Add an object to the ID map."""
+         """Add an object to the ID map.
+
+         Parameters
+         ----------
+         obj
+             The object to add to the ID map.
+         """
          if hasattr(obj, "id"):
              obj_id = getattr(obj, "id")
              if self.schema is not None:
-                 if obj_id in self.schema.id_map:
+                 if obj_id in self.schema._id_map:
                      self.duplicates.add(obj_id)
                  else:
-                     self.schema.id_map[obj_id] = obj
+                     self.schema._id_map[obj_id] = obj
 
-     def visit_schema(self, schema: "Schema") -> None:
-         """Visit the schema object that was added during initialization.
+     def visit_schema(self, schema: Schema) -> None:
+         """Visit the objects in a schema and build the ID map.
 
+         Parameters
+         ----------
+         schema
+             The schema object to visit.
+
+         Notes
+         -----
          This will set an internal variable pointing to the schema object.
          """
          self.schema = schema
@@ -379,7 +1020,13 @@ class SchemaIdVisitor:
              self.visit_table(table)
 
      def visit_table(self, table: Table) -> None:
-         """Visit a table object."""
+         """Visit a table object.
+
+         Parameters
+         ----------
+         table
+             The table object to visit.
+         """
          self.add(table)
          for column in table.columns:
              self.visit_column(column)
@@ -387,25 +1034,84 @@ class SchemaIdVisitor:
              self.visit_constraint(constraint)
 
      def visit_column(self, column: Column) -> None:
-         """Visit a column object."""
+         """Visit a column object.
+
+         Parameters
+         ----------
+         column
+             The column object to visit.
+         """
          self.add(column)
 
      def visit_constraint(self, constraint: Constraint) -> None:
-         """Visit a constraint object."""
+         """Visit a constraint object.
+
+         Parameters
+         ----------
+         constraint
+             The constraint object to visit.
+         """
          self.add(constraint)
 
 
- class Schema(BaseObject):
-     """The database schema containing the tables."""
+ T = TypeVar("T", bound=BaseObject)
 
-     class ValidationConfig:
-         """Validation configuration which is specific to Felis."""
 
-         _require_description = False
-         """Flag to require a description for all objects.
+ def _strip_ids(data: Any) -> Any:
+     """Recursively strip '@id' fields from a dictionary or list.
+
+     Parameters
+     ----------
+     data
+         The data to strip IDs from, which can be a dictionary, list, or any
+         other type. Other types will be returned unchanged.
+     """
+     if isinstance(data, dict):
+         data.pop("@id", None)
+         for k, v in data.items():
+             data[k] = _strip_ids(v)
+         return data
+     elif isinstance(data, list):
+         return [_strip_ids(item) for item in data]
+     else:
+         return data
+
+
+ def _append_error(
+     errors: list[InitErrorDetails],
+     loc: tuple,
+     input_value: Any,
+     error_message: str,
+     error_type: str = "value_error",
+ ) -> None:
+     """Append an error to the errors list.
+
+     Parameters
+     ----------
+     errors : list[InitErrorDetails]
+         The list of errors to append to.
+     loc : tuple
+         The location of the error in the schema.
+     input_value : Any
+         The input value that caused the error.
+     error_message : str
+         The error message to include in the context.
+     """
+     errors.append(
+         {
+             "type": error_type,
+             "loc": loc,
+             "input": input_value,
+             "ctx": {"error": error_message},
+         }
+     )
 
-     This is set by the `require_description` class method.
-     """
+
+ class Schema(BaseObject, Generic[T]):
+     """Database schema model.
+
+     This represents a database schema, which contains one or more tables.
+     """
 
      version: SchemaVersion | str | None = None
      """The version of the schema."""
@@ -413,52 +1119,539 @@ class Schema(BaseObject):
      tables: Sequence[Table]
      """The tables in the schema."""
 
-     id_map: dict[str, Any] = Field(default_factory=dict, exclude=True)
+     _id_map: dict[str, Any] = PrivateAttr(default_factory=dict)
      """Map of IDs to objects."""
 
+     @model_validator(mode="before")
+     @classmethod
+     def generate_ids(cls, values: dict[str, Any], info: ValidationInfo) -> dict[str, Any]:
+         """Generate IDs for objects that do not have them.
+
+         Parameters
+         ----------
+         values
+             The values of the schema.
+         info
+             Validation context used to determine if ID generation is enabled.
+
+         Returns
+         -------
+         `dict` [ `str`, `Any` ]
+             The values of the schema with generated IDs.
+         """
+         context = info.context
+         if not context or not context.get("id_generation", False):
+             logger.debug("Skipping ID generation")
+             return values
+         schema_name = values["name"]
+         if "@id" not in values:
+             values["@id"] = f"#{schema_name}"
+             logger.debug(f"Generated ID '{values['@id']}' for schema '{schema_name}'")
+         if "tables" in values:
+             for table in values["tables"]:
+                 if "@id" not in table:
+                     table["@id"] = f"#{table['name']}"
+                     logger.debug(f"Generated ID '{table['@id']}' for table '{table['name']}'")
+                 if "columns" in table:
+                     for column in table["columns"]:
+                         if "@id" not in column:
+                             column["@id"] = f"#{table['name']}.{column['name']}"
+                             logger.debug(f"Generated ID '{column['@id']}' for column '{column['name']}'")
+                 if "columnGroups" in table:
+                     for column_group in table["columnGroups"]:
+                         if "@id" not in column_group:
+                             column_group["@id"] = f"#{table['name']}.{column_group['name']}"
+                             logger.debug(
+                                 f"Generated ID '{column_group['@id']}' for column group "
+                                 f"'{column_group['name']}'"
+                             )
+                 if "constraints" in table:
+                     for constraint in table["constraints"]:
+                         if "@id" not in constraint:
+                             constraint["@id"] = f"#{constraint['name']}"
+                             logger.debug(
+                                 f"Generated ID '{constraint['@id']}' for constraint '{constraint['name']}'"
+                             )
+                 if "indexes" in table:
+                     for index in table["indexes"]:
+                         if "@id" not in index:
+                             index["@id"] = f"#{index['name']}"
+                             logger.debug(f"Generated ID '{index['@id']}' for index '{index['name']}'")
+         return values
+
      @field_validator("tables", mode="after")
      @classmethod
      def check_unique_table_names(cls, tables: list[Table]) -> list[Table]:
-         """Check that table names are unique."""
+         """Check that table names are unique.
+
+         Parameters
+         ----------
+         tables
+             The tables to check.
+
+         Returns
+         -------
+         `list` [ `Table` ]
+             The tables if they are unique.
+
+         Raises
+         ------
+         ValueError
+             Raised if table names are not unique.
+         """
          if len(tables) != len(set(table.name for table in tables)):
              raise ValueError("Table names must be unique")
          return tables
 
+     @model_validator(mode="after")
+     def check_tap_table_indexes(self, info: ValidationInfo) -> Schema:
+         """Check that the TAP table indexes are unique.
+
+         Parameters
+         ----------
+         info
+             The validation context used to determine if the check is enabled.
+
+         Returns
+         -------
+         `Schema`
+             The schema being validated.
+         """
+         context = info.context
+         if not context or not context.get("check_tap_table_indexes", False):
+             return self
+         table_indicies = set()
+         for table in self.tables:
+             table_index = table.tap_table_index
+             if table_index is not None:
+                 if table_index in table_indicies:
+                     raise ValueError(f"Duplicate 'tap:table_index' value {table_index} found in schema")
+                 table_indicies.add(table_index)
+         return self
+
+     @model_validator(mode="after")
+     def check_unique_constraint_names(self: Schema) -> Schema:
+         """Check for duplicate constraint names in the schema.
+
+         Returns
+         -------
+         `Schema`
+             The schema being validated.
+
+         Raises
+         ------
+         ValueError
+             Raised if duplicate constraint names are found in the schema.
+         """
+         constraint_names = set()
+         duplicate_names = []
+
+         for table in self.tables:
+             for constraint in table.constraints:
+                 constraint_name = constraint.name
+                 if constraint_name in constraint_names:
+                     duplicate_names.append(constraint_name)
+                 else:
+                     constraint_names.add(constraint_name)
+
+         if duplicate_names:
+             raise ValueError(f"Duplicate constraint names found in schema: {duplicate_names}")
+
+         return self
+
+     @model_validator(mode="after")
+     def check_unique_index_names(self: Schema) -> Schema:
+         """Check for duplicate index names in the schema.
+
+         Returns
+         -------
+         `Schema`
+             The schema being validated.
+
+         Raises
+         ------
+         ValueError
+             Raised if duplicate index names are found in the schema.
+         """
+         index_names = set()
+         duplicate_names = []
+
+         for table in self.tables:
+             for index in table.indexes:
+                 index_name = index.name
+                 if index_name in index_names:
+                     duplicate_names.append(index_name)
+                 else:
+                     index_names.add(index_name)
+
+         if duplicate_names:
+             raise ValueError(f"Duplicate index names found in schema: {duplicate_names}")
+
+         return self
+
      @model_validator(mode="after")
      def create_id_map(self: Schema) -> Schema:
-         """Create a map of IDs to objects."""
+         """Create a map of IDs to objects.
+
+         Returns
+         -------
+         `Schema`
+             The schema with the ID map created.
+
+         Raises
+         ------
+         ValueError
+             Raised if duplicate identifiers are found in the schema.
+         """
+         if self._id_map:
+             logger.debug("Ignoring call to create_id_map() - ID map was already populated")
+             return self
          visitor: SchemaIdVisitor = SchemaIdVisitor()
          visitor.visit_schema(self)
-         logger.debug(f"ID map contains {len(self.id_map.keys())} objects")
          if len(visitor.duplicates):
              raise ValueError(
                  "Duplicate IDs found in schema:\n " + "\n ".join(visitor.duplicates) + "\n"
              )
+         logger.debug("Created ID map with %d entries", len(self._id_map))
+         return self
+
+     def _validate_column_id(
+         self: Schema,
+         column_id: str,
+         loc: tuple,
+         errors: list[InitErrorDetails],
+     ) -> None:
+         """Validate a column ID from a constraint and append errors if invalid.
+
+         Parameters
+         ----------
+         schema : Schema
+             The schema being validated.
+         column_id : str
+             The column ID to validate.
+         loc : tuple
+             The location of the error in the schema.
+         errors : list[InitErrorDetails]
+             The list of errors to append to.
+         """
+         if column_id not in self:
+             _append_error(
+                 errors,
+                 loc,
+                 column_id,
+                 f"Column ID '{column_id}' not found in schema",
+             )
+         elif not isinstance(self[column_id], Column):
+             _append_error(
+                 errors,
+                 loc,
+                 column_id,
+                 f"ID '{column_id}' does not refer to a Column object",
+             )
+
+     def _validate_foreign_key_column(
+         self: Schema,
+         column_id: str,
+         table: Table,
+         loc: tuple,
+         errors: list[InitErrorDetails],
+     ) -> None:
+         """Validate a foreign key column ID from a constraint and append errors
+         if invalid.
+
+         Parameters
+         ----------
+         schema : Schema
+             The schema being validated.
+         column_id : str
+             The foreign key column ID to validate.
+         loc : tuple
+             The location of the error in the schema.
+         errors : list[InitErrorDetails]
+             The list of errors to append to.
+         """
+         try:
+             table._find_column_by_id(column_id)
+         except KeyError:
+             _append_error(
+                 errors,
+                 loc,
+                 column_id,
+                 f"Column '{column_id}' not found in table '{table.name}'",
+             )
+
+     @model_validator(mode="after")
+     def check_constraints(self: Schema) -> Schema:
+         """Check constraint objects for validity. This needs to be deferred
+         until after the schema is fully loaded and the ID map is created.
+
+         Raises
+         ------
+         pydantic.ValidationError
+             Raised if any constraints are invalid.
+
+         Returns
+         -------
+         `Schema`
+             The schema being validated.
+         """
+         errors: list[InitErrorDetails] = []
+
+         for table_index, table in enumerate(self.tables):
+             for constraint_index, constraint in enumerate(table.constraints):
+                 column_ids: list[str] = []
+                 referenced_column_ids: list[str] = []
+
+                 if isinstance(constraint, ForeignKeyConstraint):
+                     column_ids += constraint.columns
+                     referenced_column_ids += constraint.referenced_columns
+                 elif isinstance(constraint, UniqueConstraint):
+                     column_ids += constraint.columns
+                 # No extra checks are required on CheckConstraint objects.
+
+                 # Validate the foreign key columns
+                 for column_id in column_ids:
+                     self._validate_column_id(
+                         column_id,
+                         (
+                             "tables",
+                             table_index,
+                             "constraints",
+                             constraint_index,
+                             "columns",
+                             column_id,
+                         ),
+                         errors,
+                     )
+                     # Check that the foreign key column is within the source
+                     # table.
+                     self._validate_foreign_key_column(
+                         column_id,
+                         table,
+                         (
+                             "tables",
+                             table_index,
+                             "constraints",
+                             constraint_index,
+                             "columns",
+                             column_id,
+                         ),
+                         errors,
+                     )
+
+                 # Validate the primary key (reference) columns
+                 for referenced_column_id in referenced_column_ids:
+                     self._validate_column_id(
+                         referenced_column_id,
+                         (
+                             "tables",
+                             table_index,
+                             "constraints",
+                             constraint_index,
+                             "referenced_columns",
+                             referenced_column_id,
+                         ),
+                         errors,
+                     )
+
+         if errors:
+             raise ValidationError.from_exception_data("Schema validation failed", errors)
+
          return self
 
      def __getitem__(self, id: str) -> BaseObject:
-         """Get an object by its ID."""
+         """Get an object by its ID.
+
+         Parameters
+         ----------
+         id
+             The ID of the object to get.
+
+         Raises
+         ------
+         KeyError
+             Raised if the object with the given ID is not found in the schema.
+         """
          if id not in self:
              raise KeyError(f"Object with ID '{id}' not found in schema")
-         return self.id_map[id]
+         return self._id_map[id]
 
      def __contains__(self, id: str) -> bool:
-         """Check if an object with the given ID is in the schema."""
-         return id in self.id_map
+         """Check if an object with the given ID is in the schema.
 
-     @classmethod
-     def require_description(cls, rd: bool = True) -> None:
-         """Set whether a description is required for all objects.
-
-         This includes the schema, tables, columns, and constraints.
+         Parameters
+         ----------
+         id
+             The ID of the object to check.
+         """
+         return id in self._id_map
+
+     def find_object_by_id(self, id: str, obj_type: type[T]) -> T:
+         """Find an object with the given type by its ID.
+
+         Parameters
+         ----------
+         id
+             The ID of the object to find.
+         obj_type
+             The type of the object to find.
+
+         Returns
+         -------
+         BaseObject
+             The object with the given ID and type.
+
+         Raises
+         ------
+         KeyError
+             If the object with the given ID is not found in the schema.
+         TypeError
+             If the object that is found does not have the right type.
+
+         Notes
+         -----
+         The actual return type is the user-specified argument ``T``, which is
+         expected to be a subclass of `BaseObject`.
+         """
+         obj = self[id]
+         if not isinstance(obj, obj_type):
+             raise TypeError(f"Object with ID '{id}' is not of type '{obj_type.__name__}'")
+         return obj
+
+     def get_table_by_column(self, column: Column) -> Table:
+         """Find the table that contains a column.
+
+         Parameters
+         ----------
+         column
+             The column to find.
+
+         Returns
+         -------
+         `Table`
+             The table that contains the column.
+
+         Raises
+         ------
+         ValueError
+             If the column is not found in any table.
+         """
+         for table in self.tables:
+             if column in table.columns:
+                 return table
+         raise ValueError(f"Column '{column.name}' not found in any table")
 
-         Users should call this method to set the requirement for a description
-         when validating schemas, rather than change the flag value directly.
+     @classmethod
+     def from_uri(cls, resource_path: ResourcePathExpression, context: dict[str, Any] = {}) -> Schema:
+         """Load a `Schema` from a string representing a ``ResourcePath``.
+
+         Parameters
+         ----------
+         resource_path
+             The ``ResourcePath`` pointing to a YAML file.
+         context
+             Pydantic context to be used in validation.
+
+         Returns
+         -------
+         `str`
+             The ID of the object.
+
+         Raises
+         ------
+         yaml.YAMLError
+             Raised if there is an error loading the YAML data.
+         ValueError
+             Raised if there is an error reading the resource.
+         pydantic.ValidationError
+             Raised if the schema fails validation.
          """
-         logger.debug(f"Setting description requirement to '{rd}'")
-         cls.ValidationConfig._require_description = rd
+         logger.debug(f"Loading schema from: '{resource_path}'")
+         try:
+             rp_stream = ResourcePath(resource_path).read()
+         except Exception as e:
+             raise ValueError(f"Error reading resource from '{resource_path}' : {e}") from e
+         yaml_data = yaml.safe_load(rp_stream)
+         return Schema.model_validate(yaml_data, context=context)
 
      @classmethod
-     def is_description_required(cls) -> bool:
-         """Return whether a description is required for all objects."""
-         return cls.ValidationConfig._require_description
+     def from_stream(cls, source: IO[str], context: dict[str, Any] = {}) -> Schema:
+         """Load a `Schema` from a file stream which should contain YAML data.
+
+         Parameters
+         ----------
+         source
+             The file stream to read from.
+         context
+             Pydantic context to be used in validation.
+
+         Returns
+         -------
+         `Schema`
+             The Felis schema loaded from the stream.
+
+         Raises
+         ------
+         yaml.YAMLError
+             Raised if there is an error loading the YAML file.
+         pydantic.ValidationError
+             Raised if the schema fails validation.
+         """
+         logger.debug("Loading schema from: '%s'", source)
+         yaml_data = yaml.safe_load(source)
+         return Schema.model_validate(yaml_data, context=context)
+
+     def _model_dump(self, strip_ids: bool = False) -> dict[str, Any]:
+         """Dump the schema as a dictionary with some default arguments
+         applied.
+
+         Parameters
+         ----------
+         strip_ids
+             Whether to strip the IDs from the dumped data. Defaults to `False`.
+
+         Returns
+         -------
+         `dict` [ `str`, `Any` ]
+             The dumped schema data as a dictionary.
+         """
+         data = self.model_dump(by_alias=True, exclude_none=True, exclude_defaults=True)
+         if strip_ids:
+             data = _strip_ids(data)
+         return data
+
+     def dump_yaml(self, stream: IO[str] = sys.stdout, strip_ids: bool = False) -> None:
+         """Pretty print the schema as YAML.
+
+         Parameters
+         ----------
+         stream
+             The stream to write the YAML data to.
+         strip_ids
+             Whether to strip the IDs from the dumped data. Defaults to `False`.
+         """
+         data = self._model_dump(strip_ids=strip_ids)
+         yaml.safe_dump(
+             data,
+             stream,
+             default_flow_style=False,
+             sort_keys=False,
+         )
+
+     def dump_json(self, stream: IO[str] = sys.stdout, strip_ids: bool = False) -> None:
+         """Pretty print the schema as JSON.
+
+         Parameters
+         ----------
+         stream
+             The stream to write the JSON data to.
+         strip_ids
+             Whether to strip the IDs from the dumped data. Defaults to `False`.
+         """
+         data = self._model_dump(strip_ids=strip_ids)
+         json.dump(
+             data,
+             stream,
+             indent=4,
+             sort_keys=False,
+         )