lsst-felis 28.2024.4500__py3-none-any.whl → 29.2025.4500__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
felis/db/dialects.py CHANGED
@@ -32,7 +32,7 @@ from sqlalchemy.engine.mock import create_mock_engine
32
32
 
33
33
  from .sqltypes import MYSQL, POSTGRES, SQLITE
34
34
 
35
- __all__ = ["get_supported_dialects", "get_dialect_module"]
35
+ __all__ = ["get_dialect_module", "get_supported_dialects"]
36
36
 
37
37
  _DIALECT_NAMES = (MYSQL, POSTGRES, SQLITE)
38
38
  """List of supported dialect names.
felis/db/schema.py ADDED
@@ -0,0 +1,62 @@
1
+ """Database utilities for Felis schemas."""
2
+
3
+ # This file is part of felis.
4
+ #
5
+ # Developed for the LSST Data Management System.
6
+ # This product includes software developed by the LSST Project
7
+ # (https://www.lsst.org).
8
+ # See the COPYRIGHT file at the top-level directory of this distribution
9
+ # for details of code ownership.
10
+ #
11
+ # This program is free software: you can redistribute it and/or modify
12
+ # it under the terms of the GNU General Public License as published by
13
+ # the Free Software Foundation, either version 3 of the License, or
14
+ # (at your option) any later version.
15
+ #
16
+ # This program is distributed in the hope that it will be useful,
17
+ # but WITHOUT ANY WARRANTY; without even the implied warranty of
18
+ # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
19
+ # GNU General Public License for more details.
20
+ #
21
+ # You should have received a copy of the GNU General Public License
22
+ # along with this program. If not, see <https://www.gnu.org/licenses/>.
23
+
24
+ from sqlalchemy import Engine, create_engine
25
+
26
+ from ..datamodel import Schema
27
+ from ..metadata import MetaDataBuilder
28
+ from .utils import DatabaseContext
29
+
30
+ __all__ = ["create_database"]
31
+
32
+
33
def create_database(schema: Schema, engine_or_url_str: Engine | str | None = None) -> DatabaseContext:
    """
    Create a database from the specified `Schema`.

    Parameters
    ----------
    schema
        The schema to create.
    engine_or_url_str
        The SQLAlchemy engine or URL to use for database creation.
        If None, an in-memory SQLite database will be created.

    Returns
    -------
    `DatabaseContext`
        The database context object, after it has been initialized and all
        of the objects in the schema metadata have been created.
    """
    if engine_or_url_str is None:
        engine = create_engine("sqlite:///:memory:")
    elif isinstance(engine_or_url_str, Engine):
        engine = engine_or_url_str
    else:
        engine = create_engine(engine_or_url_str)

    # The schema name is not applied to the metadata for SQLite. Compare the
    # backend name rather than the full driver name so that driver-qualified
    # URLs such as ``sqlite+pysqlite://`` are recognized as SQLite too.
    is_sqlite = engine.url.get_backend_name() == "sqlite"
    metadata = MetaDataBuilder(schema, apply_schema_to_metadata=not is_sqlite).build()

    ctx = DatabaseContext(metadata, engine)
    ctx.initialize()
    ctx.create_all()
    return ctx
felis/db/sqltypes.py CHANGED
@@ -32,20 +32,20 @@ from sqlalchemy.dialects import mysql, postgresql
32
32
  from sqlalchemy.ext.compiler import compiles
33
33
 
34
34
  __all__ = [
35
+ "binary",
35
36
  "boolean",
36
37
  "byte",
37
- "short",
38
+ "char",
39
+ "double",
40
+ "float",
41
+ "get_type_func",
38
42
  "int",
39
43
  "long",
40
- "float",
41
- "double",
42
- "char",
44
+ "short",
43
45
  "string",
44
- "unicode",
45
46
  "text",
46
- "binary",
47
47
  "timestamp",
48
- "get_type_func",
48
+ "unicode",
49
49
  ]
50
50
 
51
51
  MYSQL = "mysql"
felis/db/utils.py CHANGED
@@ -38,7 +38,7 @@ from sqlalchemy.types import TypeEngine
38
38
 
39
39
  from .dialects import get_dialect_module
40
40
 
41
- __all__ = ["string_to_typeengine", "SQLWriter", "ConnectionWrapper", "DatabaseContext"]
41
+ __all__ = ["ConnectionWrapper", "DatabaseContext", "SQLWriter", "string_to_typeengine"]
42
42
 
43
43
  logger = logging.getLogger("felis")
44
44
 
felis/diff.py ADDED
@@ -0,0 +1,234 @@
1
+ """Compare schemas and print the differences."""
2
+
3
+ # This file is part of felis.
4
+ #
5
+ # Developed for the LSST Data Management System.
6
+ # This product includes software developed by the LSST Project
7
+ # (https://www.lsst.org).
8
+ # See the COPYRIGHT file at the top-level directory of this distribution
9
+ # for details of code ownership.
10
+ #
11
+ # This program is free software: you can redistribute it and/or modify
12
+ # it under the terms of the GNU General Public License as published by
13
+ # the Free Software Foundation, either version 3 of the License, or
14
+ # (at your option) any later version.
15
+ #
16
+ # This program is distributed in the hope that it will be useful,
17
+ # but WITHOUT ANY WARRANTY; without even the implied warranty of
18
+ # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
19
+ # GNU General Public License for more details.
20
+ #
21
+ # You should have received a copy of the GNU General Public License
22
+ # along with this program. If not, see <https://www.gnu.org/licenses/>.
23
+
24
+ import logging
25
+ import pprint
26
+ import re
27
+ from collections.abc import Callable
28
+ from typing import Any
29
+
30
+ from alembic.autogenerate import compare_metadata
31
+ from alembic.migration import MigrationContext
32
+ from deepdiff.diff import DeepDiff
33
+ from sqlalchemy import Engine, MetaData
34
+
35
+ from .datamodel import Schema
36
+ from .metadata import MetaDataBuilder
37
+
38
# FormattedSchemaDiff is a public (non-underscore) class defined in this
# module, so it is exported together with the other diff classes.
__all__ = ["DatabaseDiff", "FormattedSchemaDiff", "SchemaDiff"]

logger = logging.getLogger(__name__)

# Change alembic log level to avoid unnecessary output
logging.getLogger("alembic").setLevel(logging.WARNING)
44
+
45
+
46
class SchemaDiff:
    """
    Compute the DeepDiff between two schemas and print the result.

    Both schemas are dumped to plain dictionaries (omitting ``None`` values)
    and compared with list order ignored.

    Parameters
    ----------
    schema1
        The first schema to compare.
    schema2
        The second schema to compare.
    """

    def __init__(self, schema1: Schema, schema2: Schema):
        dumped = [s.model_dump(exclude_none=True) for s in (schema1, schema2)]
        self.dict1, self.dict2 = dumped
        self.diff = DeepDiff(self.dict1, self.dict2, ignore_order=True)

    def print(self) -> None:
        """
        Pretty-print the raw difference object.
        """
        pprint.pprint(self.diff)

    @property
    def has_changes(self) -> bool:
        """
        Report whether the comparison found any differences.

        Returns
        -------
        bool
            True if the difference object is non-empty, False otherwise.
        """
        return len(self.diff) != 0
80
+
81
+
82
class FormattedSchemaDiff(SchemaDiff):
    """
    Compare two schemas using DeepDiff and print the differences using a
    customized output format.

    Each change is printed as a header line giving the dotted location of
    the change, followed by ``- <old>`` and/or ``+ <new>`` lines.

    Parameters
    ----------
    schema1
        The first schema to compare.
    schema2
        The second schema to compare.
    """

    # One component of a DeepDiff path: a single-quoted string key such as
    # ``['tables']`` (group 1) or an integer list index such as ``[0]``
    # (group 2). Compiled once instead of on every call.
    _PATH_COMPONENT = re.compile(r"\['([^']+)'\]|\[(\d+)\]")

    def print(self) -> None:
        """
        Print the differences between the two schemas using a custom format.
        """
        # Change types are reported in this fixed order; change types that
        # have no handler here are not printed.
        handlers: dict[str, Callable[[dict[str, Any]], None]] = {
            "values_changed": self._handle_values_changed,
            "iterable_item_added": self._handle_iterable_item_added,
            "iterable_item_removed": self._handle_iterable_item_removed,
            "dictionary_item_added": self._handle_dictionary_item_added,
            "dictionary_item_removed": self._handle_dictionary_item_removed,
        }

        for change_type, handler in handlers.items():
            if change_type in self.diff:
                handler(self.diff[change_type])

    def _print_header(self, id_dict: dict[str, Any], keys: list[int | str]) -> None:
        """Print the dotted location of a change.

        ``id_dict`` is accepted but not used at present.
        """
        # Don't display ID here for now; it is always just the schema ID.
        print(self._get_key_display(keys))

    def _handle_values_changed(self, changes: dict[str, Any]) -> None:
        """Print the old and new value for every changed value."""
        for path, change in changes.items():
            keys = self._parse_deepdiff_path(path)
            self._print_header(self.dict1, keys)
            print(f"- {change['old_value']}")
            print(f"+ {change['new_value']}")

    def _handle_iterable_item_added(self, changes: dict[str, Any]) -> None:
        """Print every item that was added to a list."""
        for path, value in changes.items():
            keys = self._parse_deepdiff_path(path)
            self._print_header(self.dict2, keys)
            print(f"+ {value}")

    def _handle_iterable_item_removed(self, changes: dict[str, Any]) -> None:
        """Print every item that was removed from a list."""
        for path, value in changes.items():
            keys = self._parse_deepdiff_path(path)
            self._print_header(self.dict1, keys)
            print(f"- {value}")

    def _handle_dictionary_item_added(self, changes: dict[str, Any]) -> None:
        """Print the name of every key that was added to a dictionary."""
        for path in changes:
            keys = self._parse_deepdiff_path(path)
            # The last path component is the added key itself; the header
            # shows the location of the dictionary that contains it.
            added_key = keys.pop()
            self._print_header(self.dict2, keys)
            print(f"+ {added_key}")

    def _handle_dictionary_item_removed(self, changes: dict[str, Any]) -> None:
        """Print the name of every key that was removed from a dictionary."""
        for path in changes:
            keys = self._parse_deepdiff_path(path)
            # The last path component is the removed key itself; the header
            # shows the location of the dictionary that contained it.
            removed_key = keys.pop()
            self._print_header(self.dict1, keys)
            print(f"- {removed_key}")

    @staticmethod
    def _get_id(values: dict, keys: list[str | int]) -> str:
        """Return the innermost ``id`` found while following ``keys``.

        Parameters
        ----------
        values
            The nested dictionary/list structure to walk.
        keys
            The path to follow, as dictionary keys and list indices.

        Returns
        -------
        str
            The ``id`` of the deepest dictionary on the path that has one.

        Raises
        ------
        ValueError
            If an integer index is outside the bounds of a list on the
            path, or if no dictionary on the path contains an ``id``.
        """
        # Unused for now, pending updates to diff tool in DM-49446.
        value: list | dict = values
        last_id = None

        for key in keys:
            logger.debug("Processing key <%s> with type %s", key, type(key))
            logger.debug("Type of value: %s", type(value))
            if isinstance(value, dict) and "id" in value:
                last_id = value["id"]
            elif isinstance(value, list) and isinstance(key, int) and not 0 <= key < len(value):
                raise ValueError(f"Index '{key}' is out of range for list of length {len(value)}")
            # Descend exactly one level per key. Indexing here only (and not
            # also inside the list branch) avoids applying the same key
            # twice when the current value is a list.
            value = value[key]

        # The object at the end of the path may itself carry an ID.
        if isinstance(value, dict) and "id" in value:
            last_id = value["id"]

        if last_id is None:
            raise ValueError("No 'id' found in the specified path")
        return last_id

    @staticmethod
    def _get_key_display(keys: list[str | int]) -> str:
        """Join path components with dots, e.g. ``tables.0.name``."""
        return ".".join(str(k) for k in keys)

    @staticmethod
    def _parse_deepdiff_path(path: str) -> list[str | int]:
        """Split a DeepDiff path string into its components.

        For example ``root['tables'][0]['name']`` becomes
        ``['tables', 0, 'name']``. A leading ``root`` is ignored, and any
        text that is not a single-quoted key or an integer index is skipped.
        """
        keys: list[str | int] = []
        components = FormattedSchemaDiff._PATH_COMPONENT.findall(path.removeprefix("root"))
        for name, index in components:
            if name:  # String key
                keys.append(name)
            elif index:  # Integer index
                keys.append(int(index))
        return keys
205
+
206
+
207
class DatabaseDiff(SchemaDiff):
    """
    Report how a live database differs from a schema definition.

    The database is reflected into SQLAlchemy metadata, which is then
    compared with the metadata built from the schema using alembic.

    Parameters
    ----------
    schema
        The schema to compare.
    engine
        The database engine to compare with.
    """

    def __init__(self, schema: Schema, engine: Engine):
        # SchemaDiff.__init__ is not invoked here, so ``dict1`` and ``dict2``
        # are not set on this object; only ``diff`` is populated.
        reflected = MetaData()
        with engine.connect() as conn:
            reflected.reflect(bind=conn)
            migration_opts = {"compare_type": True, "target_metadata": reflected}
            migration_context = MigrationContext.configure(conn, opts=migration_opts)
            builder = MetaDataBuilder(schema, apply_schema_to_metadata=False)
            # The comparison runs while the connection is still open.
            self.diff = compare_metadata(migration_context, builder.build())

    def print(self) -> None:
        """
        Pretty-print the differences, or print nothing when there are none.
        """
        if not self.has_changes:
            return
        pprint.pprint(self.diff)
felis/metadata.py CHANGED
@@ -125,29 +125,27 @@ class MetaDataBuilder:
125
125
  The schema object from which to build the SQLAlchemy metadata.
126
126
  apply_schema_to_metadata
127
127
  Whether to apply the schema name to the metadata object.
128
- apply_schema_to_tables
129
- Whether to apply the schema name to the tables.
130
128
  ignore_constraints
131
129
  Whether to ignore constraints when building the metadata.
130
+ table_name_postfix
131
+ A string to append to the table names when building the metadata.
132
132
  """
133
133
 
134
134
  def __init__(
135
135
  self,
136
136
  schema: Schema,
137
137
  apply_schema_to_metadata: bool = True,
138
- apply_schema_to_tables: bool = True,
139
138
  ignore_constraints: bool = False,
139
+ table_name_postfix: str = "",
140
140
  ) -> None:
141
141
  """Initialize the metadata builder."""
142
142
  self.schema = schema
143
143
  if not apply_schema_to_metadata:
144
144
  logger.debug("Schema name will not be applied to metadata")
145
- if not apply_schema_to_tables:
146
- logger.debug("Schema name will not be applied to tables")
147
145
  self.metadata = MetaData(schema=schema.name if apply_schema_to_metadata else None)
148
146
  self._objects: dict[str, Any] = {}
149
- self.apply_schema_to_tables = apply_schema_to_tables
150
147
  self.ignore_constraints = ignore_constraints
148
+ self.table_name_postfix = table_name_postfix
151
149
 
152
150
  def build(self) -> MetaData:
153
151
  """Build the SQLAlchemy tables and constraints from the schema.
@@ -231,11 +229,10 @@ class MetaDataBuilder:
231
229
  description = table_obj.description
232
230
  columns = [self.build_column(column) for column in table_obj.columns]
233
231
  table = Table(
234
- name,
232
+ name + self.table_name_postfix,
235
233
  self.metadata,
236
234
  *columns,
237
235
  comment=description,
238
- schema=self.schema.name if self.apply_schema_to_tables else None,
239
236
  **optargs, # type: ignore[arg-type]
240
237
  )
241
238
 
@@ -341,12 +338,17 @@ class MetaDataBuilder:
341
338
  "deferrable": constraint_obj.deferrable or None,
342
339
  "initially": constraint_obj.initially or None,
343
340
  }
341
+
344
342
  constraint: Constraint
345
343
 
346
344
  if isinstance(constraint_obj, datamodel.ForeignKeyConstraint):
347
345
  fk_obj: datamodel.ForeignKeyConstraint = constraint_obj
348
346
  columns = [self._objects[column_id] for column_id in fk_obj.columns]
349
347
  refcolumns = [self._objects[column_id] for column_id in fk_obj.referenced_columns]
348
+ if constraint_obj.on_delete is not None:
349
+ args["ondelete"] = constraint_obj.on_delete
350
+ if constraint_obj.on_update is not None:
351
+ args["onupdate"] = constraint_obj.on_update
350
352
  constraint = ForeignKeyConstraint(columns, refcolumns, **args)
351
353
  elif isinstance(constraint_obj, datamodel.CheckConstraint):
352
354
  check_obj: datamodel.CheckConstraint = constraint_obj