PyPI - sqlspec - Versions diffs - 0.21.0__py3-none-any.whl → 0.22.0__py3-none-any.whl - Mend

sqlspec 0.21.0__py3-none-any.whl → 0.22.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of sqlspec might be problematic. Click here for more details.

Files changed (21) hide show

sqlspec/base.py +4 -4
sqlspec/driver/mixins/_result_tools.py +41 -6
sqlspec/loader.py +65 -68
sqlspec/protocols.py +3 -5
sqlspec/storage/__init__.py +2 -12
sqlspec/storage/backends/__init__.py +1 -0
sqlspec/storage/backends/fsspec.py +87 -147
sqlspec/storage/backends/local.py +310 -0
sqlspec/storage/backends/obstore.py +210 -192
sqlspec/storage/registry.py +101 -70
sqlspec/utils/data_transformation.py +120 -0
sqlspec/utils/sync_tools.py +8 -5
sqlspec/utils/text.py +27 -19
sqlspec/utils/type_guards.py +74 -0
{sqlspec-0.21.0.dist-info → sqlspec-0.22.0.dist-info}/METADATA +1 -1
{sqlspec-0.21.0.dist-info → sqlspec-0.22.0.dist-info}/RECORD +20 -19
sqlspec/storage/capabilities.py +0 -102
{sqlspec-0.21.0.dist-info → sqlspec-0.22.0.dist-info}/WHEEL +0 -0
{sqlspec-0.21.0.dist-info → sqlspec-0.22.0.dist-info}/entry_points.txt +0 -0
{sqlspec-0.21.0.dist-info → sqlspec-0.22.0.dist-info}/licenses/LICENSE +0 -0
{sqlspec-0.21.0.dist-info → sqlspec-0.22.0.dist-info}/licenses/NOTICE +0 -0

sqlspec/base.py CHANGED Viewed

@@ -64,7 +64,7 @@ class SQLSpec:
                     config.close_pool()
                     cleaned_count += 1
                 except Exception as e:
-                    logger.warning("Failed to clean up sync pool for config %s: %s", config_type.__name__, e)
+                    logger.debug("Failed to clean up sync pool for config %s: %s", config_type.__name__, e)
         if cleaned_count > 0:
             logger.debug("Sync pool cleanup completed. Cleaned %d pools.", cleaned_count)
@@ -87,14 +87,14 @@ class SQLSpec:
                     else:
                         sync_configs.append((config_type, config))
                 except Exception as e:
-                    logger.warning("Failed to prepare cleanup for config %s: %s", config_type.__name__, e)
+                    logger.debug("Failed to prepare cleanup for config %s: %s", config_type.__name__, e)
         if cleanup_tasks:
             try:
                 await asyncio.gather(*cleanup_tasks, return_exceptions=True)
                 logger.debug("Async pool cleanup completed. Cleaned %d pools.", len(cleanup_tasks))
             except Exception as e:
-                logger.warning("Failed to complete async pool cleanup: %s", e)
+                logger.debug("Failed to complete async pool cleanup: %s", e)
         for _config_type, config in sync_configs:
             config.close_pool()
@@ -129,7 +129,7 @@ class SQLSpec:
         """
         config_type = type(config)
         if config_type in self._configs:
-            logger.warning("Configuration for %s already exists. Overwriting.", config_type.__name__)
+            logger.debug("Configuration for %s already exists. Overwriting.", config_type.__name__)
         self._configs[config_type] = config
         return config_type

sqlspec/driver/mixins/_result_tools.py CHANGED Viewed

@@ -1,3 +1,4 @@
+# ruff: noqa: C901
 """Result handling and schema conversion mixins for database drivers."""
 import datetime
@@ -22,7 +23,16 @@ from sqlspec.typing import (
     convert,
     get_type_adapter,
 )
-from sqlspec.utils.type_guards import is_attrs_schema, is_dataclass, is_msgspec_struct, is_pydantic_model
+from sqlspec.utils.data_transformation import transform_dict_keys
+from sqlspec.utils.text import camelize, kebabize, pascalize
+from sqlspec.utils.type_guards import (
+    get_msgspec_rename_config,
+    is_attrs_schema,
+    is_dataclass,
+    is_dict,
+    is_msgspec_struct,
+    is_pydantic_model,
+)
 __all__ = ("_DEFAULT_TYPE_DECODERS", "_default_msgspec_deserializer")
@@ -143,21 +153,46 @@ class ToSchemaMixin:
             if isinstance(data, list):
                 result: list[Any] = []
                 for item in data:
-                    if hasattr(item, "keys"):
+                    if is_dict(item):
                         result.append(schema_type(**dict(item)))  # type: ignore[operator]
                     else:
                         result.append(item)
                 return result
-            if hasattr(data, "keys"):
+            if is_dict(data):
                 return schema_type(**dict(data))  # type: ignore[operator]
             if isinstance(data, dict):
                 return schema_type(**data)  # type: ignore[operator]
             return data
         if is_msgspec_struct(schema_type):
+            rename_config = get_msgspec_rename_config(schema_type)  # type: ignore[arg-type]
             deserializer = partial(_default_msgspec_deserializer, type_decoders=_DEFAULT_TYPE_DECODERS)
-            if not isinstance(data, Sequence):
-                return convert(obj=data, type=schema_type, from_attributes=True, dec_hook=deserializer)
-            return convert(obj=data, type=list[schema_type], from_attributes=True, dec_hook=deserializer)  # type: ignore[valid-type]
+            # Transform field names if rename configuration exists
+            transformed_data = data
+            if (rename_config and is_dict(data)) or (isinstance(data, Sequence) and data and is_dict(data[0])):
+                try:
+                    converter = None
+                    if rename_config == "camel":
+                        converter = camelize
+                    elif rename_config == "kebab":
+                        converter = kebabize
+                    elif rename_config == "pascal":
+                        converter = pascalize
+                    if converter is not None:
+                        if isinstance(data, Sequence):
+                            transformed_data = [
+                                transform_dict_keys(item, converter) if is_dict(item) else item for item in data
+                            ]
+                        else:
+                            transformed_data = transform_dict_keys(data, converter) if is_dict(data) else data
+                except Exception as e:
+                    logger.debug("Field name transformation failed for msgspec schema: %s", e)
+                    transformed_data = data
+            if not isinstance(transformed_data, Sequence):
+                return convert(obj=transformed_data, type=schema_type, from_attributes=True, dec_hook=deserializer)
+            return convert(obj=transformed_data, type=list[schema_type], from_attributes=True, dec_hook=deserializer)  # type: ignore[valid-type]
         if is_pydantic_model(schema_type):
             if not isinstance(data, Sequence):
                 adapter = get_type_adapter(schema_type)

sqlspec/loader.py CHANGED Viewed

@@ -10,18 +10,15 @@ import time
 from datetime import datetime, timezone
 from pathlib import Path
 from typing import TYPE_CHECKING, Any, Final, Optional, Union
+from urllib.parse import unquote, urlparse
 from sqlspec.core.cache import CacheKey, get_cache_config, get_default_cache
 from sqlspec.core.statement import SQL
-from sqlspec.exceptions import (
-    MissingDependencyError,
-    SQLFileNotFoundError,
-    SQLFileParseError,
-    StorageOperationFailedError,
-)
+from sqlspec.exceptions import SQLFileNotFoundError, SQLFileParseError, StorageOperationFailedError
 from sqlspec.storage.registry import storage_registry as default_storage_registry
 from sqlspec.utils.correlation import CorrelationContext
 from sqlspec.utils.logging import get_logger
+from sqlspec.utils.text import slugify
 if TYPE_CHECKING:
     from sqlspec.storage.registry import StorageRegistry
@@ -54,13 +51,25 @@ MIN_QUERY_PARTS: Final = 3
 def _normalize_query_name(name: str) -> str:
     """Normalize query name to be a valid Python identifier.
+    Convert hyphens to underscores, preserve dots for namespacing,
+    and remove invalid characters.
     Args:
         name: Raw query name from SQL file.
     Returns:
         Normalized query name suitable as Python identifier.
     """
-    return TRIM_SPECIAL_CHARS.sub("", name).replace("-", "_")
+    # Handle namespace parts separately to preserve dots
+    parts = name.split(".")
+    normalized_parts = []
+    for part in parts:
+        # Use slugify with underscore separator and remove any remaining invalid chars
+        normalized_part = slugify(part, separator="_")
+        normalized_parts.append(normalized_part)
+    return ".".join(normalized_parts)
 def _normalize_dialect(dialect: str) -> str:
@@ -76,19 +85,6 @@ def _normalize_dialect(dialect: str) -> str:
     return DIALECT_ALIASES.get(normalized, normalized)
-def _normalize_dialect_for_sqlglot(dialect: str) -> str:
-    """Normalize dialect name for SQLGlot compatibility.
-    Args:
-        dialect: Dialect name from SQL file or parameter.
-    Returns:
-        SQLGlot-compatible dialect name.
-    """
-    normalized = dialect.lower().strip()
-    return DIALECT_ALIASES.get(normalized, normalized)
 class NamedStatement:
     """Represents a parsed SQL statement with metadata.
@@ -218,8 +214,7 @@ class SQLFileLoader:
             SQLFileParseError: If file cannot be read.
         """
         try:
-            content = self._read_file_content(path)
-            return hashlib.md5(content.encode(), usedforsecurity=False).hexdigest()
+            return hashlib.md5(self._read_file_content(path).encode(), usedforsecurity=False).hexdigest()
         except Exception as e:
             raise SQLFileParseError(str(path), str(path), e) from e
@@ -253,19 +248,22 @@ class SQLFileLoader:
             SQLFileNotFoundError: If file does not exist.
             SQLFileParseError: If file cannot be read or parsed.
         """
         path_str = str(path)
         try:
             backend = self.storage_registry.get(path)
+            # For file:// URIs, extract just the filename for the backend call
+            if path_str.startswith("file://"):
+                parsed = urlparse(path_str)
+                file_path = unquote(parsed.path)
+                # Handle Windows paths (file:///C:/path)
+                if file_path and len(file_path) > 2 and file_path[2] == ":":  # noqa: PLR2004
+                    file_path = file_path[1:]  # Remove leading slash for Windows
+                filename = Path(file_path).name
+                return backend.read_text(filename, encoding=self.encoding)
             return backend.read_text(path_str, encoding=self.encoding)
         except KeyError as e:
             raise SQLFileNotFoundError(path_str) from e
-        except MissingDependencyError:
-            try:
-                return path.read_text(encoding=self.encoding)  # type: ignore[union-attr]
-            except FileNotFoundError as e:
-                raise SQLFileNotFoundError(path_str) from e
         except StorageOperationFailedError as e:
             if "not found" in str(e).lower() or "no such file" in str(e).lower():
                 raise SQLFileNotFoundError(path_str) from e
@@ -419,8 +417,7 @@ class SQLFileLoader:
         for file_path in sql_files:
             relative_path = file_path.relative_to(dir_path)
             namespace_parts = relative_path.parent.parts
-            namespace = ".".join(namespace_parts) if namespace_parts else None
-            self._load_single_file(file_path, namespace)
+            self._load_single_file(file_path, ".".join(namespace_parts) if namespace_parts else None)
         return len(sql_files)
     def _load_single_file(self, file_path: Union[str, Path], namespace: Optional[str]) -> None:
@@ -533,44 +530,6 @@ class SQLFileLoader:
         self._queries[normalized_name] = statement
         self._query_to_file[normalized_name] = "<directly added>"
-    def get_sql(self, name: str) -> "SQL":
-        """Get a SQL object by statement name.
-        Args:
-            name: Name of the statement (from -- name: in SQL file).
-                  Hyphens in names are converted to underscores.
-        Returns:
-            SQL object ready for execution.
-        Raises:
-            SQLFileNotFoundError: If statement name not found.
-        """
-        correlation_id = CorrelationContext.get()
-        safe_name = _normalize_query_name(name)
-        if safe_name not in self._queries:
-            available = ", ".join(sorted(self._queries.keys())) if self._queries else "none"
-            logger.error(
-                "Statement not found: %s",
-                name,
-                extra={
-                    "statement_name": name,
-                    "safe_name": safe_name,
-                    "available_statements": len(self._queries),
-                    "correlation_id": correlation_id,
-                },
-            )
-            raise SQLFileNotFoundError(name, path=f"Statement '{name}' not found. Available statements: {available}")
-        parsed_statement = self._queries[safe_name]
-        sqlglot_dialect = None
-        if parsed_statement.dialect:
-            sqlglot_dialect = _normalize_dialect_for_sqlglot(parsed_statement.dialect)
-        return SQL(parsed_statement.sql, dialect=sqlglot_dialect)
     def get_file(self, path: Union[str, Path]) -> "Optional[SQLFile]":
         """Get a loaded SQLFile object by path.
@@ -659,3 +618,41 @@ class SQLFileLoader:
         if safe_name not in self._queries:
             raise SQLFileNotFoundError(name)
         return self._queries[safe_name].sql
+    def get_sql(self, name: str) -> "SQL":
+        """Get a SQL object by statement name.
+        Args:
+            name: Name of the statement (from -- name: in SQL file).
+                  Hyphens in names are converted to underscores.
+        Returns:
+            SQL object ready for execution.
+        Raises:
+            SQLFileNotFoundError: If statement name not found.
+        """
+        correlation_id = CorrelationContext.get()
+        safe_name = _normalize_query_name(name)
+        if safe_name not in self._queries:
+            available = ", ".join(sorted(self._queries.keys())) if self._queries else "none"
+            logger.error(
+                "Statement not found: %s",
+                name,
+                extra={
+                    "statement_name": name,
+                    "safe_name": safe_name,
+                    "available_statements": len(self._queries),
+                    "correlation_id": correlation_id,
+                },
+            )
+            raise SQLFileNotFoundError(name, path=f"Statement '{name}' not found. Available statements: {available}")
+        parsed_statement = self._queries[safe_name]
+        sqlglot_dialect = None
+        if parsed_statement.dialect:
+            sqlglot_dialect = _normalize_dialect(parsed_statement.dialect)
+        return SQL(parsed_statement.sql, dialect=sqlglot_dialect)

sqlspec/protocols.py CHANGED Viewed

@@ -4,7 +4,7 @@ This module provides protocols that can be used for static type checking
 and runtime isinstance() checks.
 """
-from typing import TYPE_CHECKING, Any, ClassVar, Optional, Protocol, Union, runtime_checkable
+from typing import TYPE_CHECKING, Any, Optional, Protocol, Union, runtime_checkable
 from typing_extensions import Self
@@ -14,7 +14,6 @@ if TYPE_CHECKING:
     from sqlglot import exp
-    from sqlspec.storage.capabilities import StorageCapabilities
     from sqlspec.typing import ArrowRecordBatch, ArrowTable
 __all__ = (
@@ -194,9 +193,8 @@ class ObjectStoreItemProtocol(Protocol):
 class ObjectStoreProtocol(Protocol):
     """Protocol for object storage operations."""
-    capabilities: ClassVar["StorageCapabilities"]
     protocol: str
+    backend_type: str
     def __init__(self, uri: str, **kwargs: Any) -> None:
         return
@@ -330,7 +328,7 @@ class ObjectStoreProtocol(Protocol):
         msg = "Async arrow writing not implemented"
         raise NotImplementedError(msg)
-    async def stream_arrow_async(self, pattern: str, **kwargs: Any) -> "AsyncIterator[ArrowRecordBatch]":
+    def stream_arrow_async(self, pattern: str, **kwargs: Any) -> "AsyncIterator[ArrowRecordBatch]":
         """Async stream Arrow record batches from matching objects."""
         msg = "Async arrow streaming not implemented"
         raise NotImplementedError(msg)

sqlspec/storage/__init__.py CHANGED Viewed

@@ -8,16 +8,6 @@ Provides a storage system with:
 - Capability-based backend selection
 """
-from sqlspec.protocols import ObjectStoreProtocol
-from sqlspec.storage.capabilities import HasStorageCapabilities, StorageCapabilities
-from sqlspec.storage.registry import StorageRegistry
+from sqlspec.storage.registry import StorageRegistry, storage_registry
-storage_registry = StorageRegistry()
-__all__ = (
-    "HasStorageCapabilities",
-    "ObjectStoreProtocol",
-    "StorageCapabilities",
-    "StorageRegistry",
-    "storage_registry",
-)
+__all__ = ("StorageRegistry", "storage_registry")

sqlspec/storage/backends/__init__.py CHANGED Viewed

@@ -0,0 +1 @@
+"""Storage backends."""

sqlspec 0.21.0__py3-none-any.whl → 0.22.0__py3-none-any.whl

Potentially problematic release.

sqlspec 0.21.0__py3-none-any.whl → 0.22.0__py3-none-any.whl