PyPI - sqlalchemy-jdbcapi - Versions diffs - 2.0.0.post2__py3-none-any.whl - Mend

sqlalchemy-jdbcapi 2.0.0.post2__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (36) hide show

sqlalchemy_jdbcapi/__init__.py +128 -0
sqlalchemy_jdbcapi/_version.py +34 -0
sqlalchemy_jdbcapi/dialects/__init__.py +30 -0
sqlalchemy_jdbcapi/dialects/base.py +879 -0
sqlalchemy_jdbcapi/dialects/db2.py +134 -0
sqlalchemy_jdbcapi/dialects/mssql.py +117 -0
sqlalchemy_jdbcapi/dialects/mysql.py +152 -0
sqlalchemy_jdbcapi/dialects/oceanbase.py +218 -0
sqlalchemy_jdbcapi/dialects/odbc_base.py +389 -0
sqlalchemy_jdbcapi/dialects/odbc_mssql.py +69 -0
sqlalchemy_jdbcapi/dialects/odbc_mysql.py +101 -0
sqlalchemy_jdbcapi/dialects/odbc_oracle.py +80 -0
sqlalchemy_jdbcapi/dialects/odbc_postgresql.py +63 -0
sqlalchemy_jdbcapi/dialects/oracle.py +180 -0
sqlalchemy_jdbcapi/dialects/postgresql.py +110 -0
sqlalchemy_jdbcapi/dialects/sqlite.py +141 -0
sqlalchemy_jdbcapi/jdbc/__init__.py +98 -0
sqlalchemy_jdbcapi/jdbc/connection.py +244 -0
sqlalchemy_jdbcapi/jdbc/cursor.py +329 -0
sqlalchemy_jdbcapi/jdbc/dataframe.py +198 -0
sqlalchemy_jdbcapi/jdbc/driver_manager.py +353 -0
sqlalchemy_jdbcapi/jdbc/exceptions.py +53 -0
sqlalchemy_jdbcapi/jdbc/jvm.py +176 -0
sqlalchemy_jdbcapi/jdbc/type_converter.py +292 -0
sqlalchemy_jdbcapi/jdbc/types.py +72 -0
sqlalchemy_jdbcapi/odbc/__init__.py +46 -0
sqlalchemy_jdbcapi/odbc/connection.py +136 -0
sqlalchemy_jdbcapi/odbc/exceptions.py +48 -0
sqlalchemy_jdbcapi/py.typed +2 -0
sqlalchemy_jdbcapi-2.0.0.post2.dist-info/METADATA +825 -0
sqlalchemy_jdbcapi-2.0.0.post2.dist-info/RECORD +36 -0
sqlalchemy_jdbcapi-2.0.0.post2.dist-info/WHEEL +5 -0
sqlalchemy_jdbcapi-2.0.0.post2.dist-info/entry_points.txt +20 -0
sqlalchemy_jdbcapi-2.0.0.post2.dist-info/licenses/AUTHORS +7 -0
sqlalchemy_jdbcapi-2.0.0.post2.dist-info/licenses/LICENSE +13 -0
sqlalchemy_jdbcapi-2.0.0.post2.dist-info/top_level.txt +1 -0

sqlalchemy_jdbcapi/jdbc/dataframe.py ADDED Viewed

@@ -0,0 +1,198 @@
+"""
+DataFrame integration for pandas, polars, and Apache Arrow.
+This module provides utilities to convert JDBC query results directly
+into DataFrames for data science and ML workflows.
+"""
+from __future__ import annotations
+import logging
+from typing import TYPE_CHECKING, Any
+if TYPE_CHECKING:
+    from .cursor import Cursor
+logger = logging.getLogger(__name__)
def cursor_to_pandas(cursor: Cursor) -> Any:
    """
    Materialise the cursor's pending result set as a pandas DataFrame.

    Column labels are taken from the first element of every entry in
    ``cursor.description``; the data comes from ``cursor.fetchall()``.

    Args:
        cursor: Cursor on which a query has already been executed.

    Returns:
        pandas.DataFrame holding all fetched rows.

    Raises:
        ImportError: If pandas is not installed.
        ValueError: If ``cursor.description`` is None (no result set).

    Example:
        >>> cursor.execute("SELECT * FROM users")
        >>> df = cursor_to_pandas(cursor)
        >>> print(df.head())
    """
    # pandas is optional, so it is imported lazily and a missing install is
    # reported with an actionable message.
    try:
        import pandas as pd
    except ImportError as e:
        raise ImportError(
            "pandas is not installed. Install with: pip install pandas"
        ) from e

    description = cursor.description
    if description is None:
        raise ValueError("Cursor has no result set")

    # Resolve the labels before draining the cursor, as the original did.
    column_names = [entry[0] for entry in description]
    fetched = cursor.fetchall()

    df = pd.DataFrame(fetched, columns=column_names)
    logger.debug(f"Created pandas DataFrame with shape {df.shape}")
    return df
def cursor_to_polars(cursor: Cursor) -> Any:
    """
    Materialise the cursor's pending result set as a polars DataFrame.

    The fetched rows are transposed into a ``{column name: list of values}``
    mapping, which is then handed to ``polars.DataFrame``.

    Args:
        cursor: Cursor on which a query has already been executed.

    Returns:
        polars.DataFrame holding all fetched rows.

    Raises:
        ImportError: If polars is not installed.
        ValueError: If ``cursor.description`` is None (no result set).

    Example:
        >>> cursor.execute("SELECT * FROM users")
        >>> df = cursor_to_polars(cursor)
        >>> print(df.head())
    """
    # polars is optional, so it is imported lazily.
    try:
        import polars as pl
    except ImportError as e:
        raise ImportError(
            "polars is not installed. Install with: pip install polars"
        ) from e

    description = cursor.description
    if description is None:
        raise ValueError("Cursor has no result set")

    column_names = [entry[0] for entry in description]
    fetched = cursor.fetchall()

    # Row-major -> column-major. A repeated column name overwrites the earlier
    # entry in the mapping, exactly as a dict comprehension would.
    data = {}
    for position, name in enumerate(column_names):
        data[name] = [record[position] for record in fetched]

    df = pl.DataFrame(data)
    logger.debug(f"Created polars DataFrame with shape {df.shape}")
    return df
def cursor_to_arrow(cursor: Cursor) -> Any:
    """
    Materialise the cursor's pending result set as an Apache Arrow Table.

    Args:
        cursor: Cursor on which a query has already been executed.

    Returns:
        pyarrow.Table with one array per result column.

    Raises:
        ImportError: If pyarrow is not installed.
        ValueError: If ``cursor.description`` is None (no result set).

    Example:
        >>> cursor.execute("SELECT * FROM users")
        >>> table = cursor_to_arrow(cursor)
        >>> print(table.schema)
    """
    # pyarrow is optional, so it is imported lazily.
    try:
        import pyarrow as pa
    except ImportError as e:
        raise ImportError(
            "pyarrow is not installed. Install with: pip install pyarrow"
        ) from e

    description = cursor.description
    if description is None:
        raise ValueError("Cursor has no result set")

    column_names = [entry[0] for entry in description]
    fetched = cursor.fetchall()

    # Transpose rows into per-column value lists. With no rows every list is
    # empty, so each column becomes ``pa.array([])`` -- the same arrays the
    # dedicated empty-result branch used to build.
    arrays = [
        pa.array([record[position] for record in fetched])
        for position in range(len(column_names))
    ]

    table = pa.Table.from_arrays(arrays, names=column_names)
    logger.debug(f"Created Arrow Table with {table.num_rows} rows")
    return table
def cursor_to_dict(cursor: Cursor) -> list[dict[str, Any]]:
    """
    Return every remaining row of the cursor as a ``{column: value}`` dict.

    Args:
        cursor: Cursor on which a query has already been executed.

    Returns:
        List with one dictionary per fetched row, keyed by column name.

    Raises:
        ValueError: If ``cursor.description`` is None (no result set).

    Example:
        >>> cursor.execute("SELECT * FROM users")
        >>> rows = cursor_to_dict(cursor)
        >>> print(rows[0])
        {'id': 1, 'name': 'Alice', 'email': 'alice@example.com'}
    """
    description = cursor.description
    if description is None:
        raise ValueError("Cursor has no result set")

    column_names = [entry[0] for entry in description]

    records = []
    for record in cursor.fetchall():
        # zip() pairs names with values positionally and stops at the shorter
        # of the two sequences.
        records.append({name: value for name, value in zip(column_names, record)})
    return records
# Convenience methods are attached to the Cursor class at import time.
def _add_dataframe_methods() -> None:
    """Attach ``to_pandas``/``to_polars``/``to_arrow``/``to_dict`` to Cursor."""
    # Imported here rather than at module level; at module level the name is
    # only imported under TYPE_CHECKING.
    from .cursor import Cursor

    # Each wrapper looks the converter up at call time and forwards ``self``.
    wrappers = {
        "to_pandas": lambda self: cursor_to_pandas(self),
        "to_polars": lambda self: cursor_to_polars(self),
        "to_arrow": lambda self: cursor_to_arrow(self),
        "to_dict": lambda self: cursor_to_dict(self),
    }
    for method_name, wrapper in wrappers.items():
        setattr(Cursor, method_name, wrapper)

    logger.debug("Added DataFrame methods to Cursor class")


# Registration is best-effort: any failure is logged at debug level and the
# module import still succeeds.
try:
    _add_dataframe_methods()
except Exception as e:
    logger.debug(f"Could not add DataFrame methods: {e}")

sqlalchemy_jdbcapi/jdbc/driver_manager.py ADDED Viewed

@@ -0,0 +1,353 @@
+"""
+JDBC driver auto-download and management.
+This module handles automatic downloading of JDBC drivers from Maven Central
+and provides fallback to manual driver configuration via CLASSPATH.
+"""
+from __future__ import annotations
+import logging
+import os
+import shutil
+import urllib.request
+from pathlib import Path
+from typing import NamedTuple
+logger = logging.getLogger(__name__)
# Fallback location for cached driver JARs: ~/.sqlalchemy-jdbcapi/drivers
DEFAULT_DRIVER_CACHE = Path.home().joinpath(".sqlalchemy-jdbcapi", "drivers")
class JDBCDriver(NamedTuple):
    """Maven coordinates of a JDBC driver JAR, used to locate and download it."""

    # Maven groupId, dot-separated (e.g. "org.postgresql").
    group_id: str
    # Maven artifactId.
    artifact_id: str
    # Artifact version string.
    version: str
    # Optional Maven classifier; when falsy it is left out of the file name.
    classifier: str | None = None

    @property
    def filename(self) -> str:
        """Return the JAR file name: ``<artifact>-<version>[-<classifier>].jar``."""
        classifier_part = f"-{self.classifier}" if self.classifier else ""
        return f"{self.artifact_id}-{self.version}{classifier_part}.jar"

    @property
    def maven_url(self) -> str:
        """Return the download URL of the JAR on Maven Central."""
        base_url = "https://repo1.maven.org/maven2"
        # The group id maps to a directory path: dots become slashes.
        group_path = self.group_id.replace(".", "/")
        artifact_dir = f"{base_url}/{group_path}/{self.artifact_id}/{self.version}"
        return f"{artifact_dir}/{self.filename}"
# Recommended JDBC drivers for auto-download from Maven Central, keyed by the
# lower-case database name used for lookups.
# These versions are tested and known to work well
# TODO: Consider checking for newer versions periodically
RECOMMENDED_JDBC_DRIVERS = {
    database: JDBCDriver(group_id=group, artifact_id=artifact, version=release)
    for database, (group, artifact, release) in {
        # Latest stable as of 2024
        "postgresql": ("org.postgresql", "postgresql", "42.7.1"),
        # Note: Oracle renamed this from mysql-connector-java
        "mysql": ("com.mysql", "mysql-connector-j", "8.3.0"),
        "mariadb": ("org.mariadb.jdbc", "mariadb-java-client", "3.3.2"),
        # JRE11 version for Java 11+ compatibility
        "mssql": ("com.microsoft.sqlserver", "mssql-jdbc", "12.6.0.jre11"),
        "oracle": ("com.oracle.database.jdbc", "ojdbc11", "23.3.0.23.09"),
        "db2": ("com.ibm.db2", "jcc", "11.5.9.0"),
        "sqlite": ("org.xerial", "sqlite-jdbc", "3.45.0.0"),
        "oceanbase": ("com.oceanbase", "oceanbase-client", "2.4.9"),
    }.items()
}
def get_driver_cache_dir() -> Path:
    """
    Resolve the directory in which downloaded driver JARs are cached.

    The ``SQLALCHEMY_JDBCAPI_DRIVER_CACHE`` environment variable wins when it
    is set to a non-empty value; otherwise ``DEFAULT_DRIVER_CACHE`` is used.

    Returns:
        Path to the driver cache directory.
    """
    override = os.environ.get("SQLALCHEMY_JDBCAPI_DRIVER_CACHE")
    # An unset variable and an empty string both fall back to the default.
    return Path(override) if override else DEFAULT_DRIVER_CACHE
def download_driver(
    driver: JDBCDriver,
    cache_dir: Path | None = None,
    force: bool = False,
    timeout: float | None = 60.0,
) -> Path:
    """
    Download a JDBC driver from Maven Central into the cache directory.

    The payload is streamed to a sibling ``.tmp`` file first and only moved to
    its final name once the transfer has completed, so an interrupted download
    never leaves a truncated ``.jar`` behind. If anything fails, the temporary
    file is removed as well.

    Args:
        driver: JDBC driver metadata (provides ``filename`` and ``maven_url``).
        cache_dir: Directory to cache downloaded drivers. If None, uses the
            directory returned by ``get_driver_cache_dir()``.
        force: Force re-download even if the driver already exists.
        timeout: Timeout in seconds passed to ``urllib.request.urlopen`` for
            blocking network operations. ``None`` disables the timeout.

    Returns:
        Path to the downloaded (or already cached) driver JAR file.

    Raises:
        RuntimeError: If the download fails for any reason.
    """
    if cache_dir is None:
        cache_dir = get_driver_cache_dir()

    # Create cache directory if it doesn't exist
    cache_dir.mkdir(parents=True, exist_ok=True)

    target_path = cache_dir / driver.filename

    # A cached copy is reused unless the caller explicitly asks for a refresh.
    if target_path.exists() and not force:
        logger.debug(f"Driver already cached: {target_path}")
        return target_path

    logger.info(f"Downloading JDBC driver: {driver.filename}")
    logger.debug(f"URL: {driver.maven_url}")

    temp_path = target_path.with_suffix(".tmp")
    try:
        # Without a timeout a stalled connection would block forever.
        with urllib.request.urlopen(driver.maven_url, timeout=timeout) as response:
            with open(temp_path, "wb") as f:
                shutil.copyfileobj(response, f)
        # Publish the complete file under its final name in one step.
        temp_path.replace(target_path)
    except Exception as e:
        # Do not leave a partial download lying around in the cache.
        try:
            temp_path.unlink()
        except OSError:
            pass
        error_msg = f"Failed to download driver from {driver.maven_url}: {e}"
        logger.error(error_msg)
        raise RuntimeError(error_msg) from e

    logger.info(f"Driver downloaded successfully: {target_path}")
    return target_path
def get_driver_path(
    database: str,
    driver: JDBCDriver | None = None,
    auto_download: bool = True,
    cache_dir: Path | None = None,
) -> Path:
    """
    Locate the JAR for a database's JDBC driver, downloading it if allowed.

    Args:
        database: Database name (e.g., 'postgresql', 'mysql'). Only consulted,
            case-insensitively, when ``driver`` is None.
        driver: Custom driver metadata. If None, the entry for ``database`` in
            ``RECOMMENDED_JDBC_DRIVERS`` is used.
        auto_download: Whether to download the driver when it is not cached.
        cache_dir: Directory holding cached drivers. If None, uses the
            directory returned by ``get_driver_cache_dir()``.

    Returns:
        Path to the JDBC driver JAR file.

    Raises:
        ValueError: If ``driver`` is None and no recommended driver exists for
            ``database``.
        RuntimeError: If the driver is not cached and auto-download is disabled.
    """
    selected = driver
    if selected is None:
        lookup_key = database.lower()
        if lookup_key not in RECOMMENDED_JDBC_DRIVERS:
            raise ValueError(f"No recommended driver for database: {database}")
        selected = RECOMMENDED_JDBC_DRIVERS[lookup_key]

    jar_dir = get_driver_cache_dir() if cache_dir is None else cache_dir
    target_path = jar_dir / selected.filename

    # Cache hit: nothing else to do.
    if target_path.exists():
        return target_path

    if not auto_download:
        raise RuntimeError(
            f"JDBC driver not found: {target_path}. "
            f"Enable auto_download or set CLASSPATH environment variable."
        )

    return download_driver(selected, jar_dir)
def get_all_driver_paths(
    databases: list[str] | None = None,
    auto_download: bool = True,
    cache_dir: Path | None = None,
) -> list[Path]:
    """
    Resolve driver JAR paths for several databases, skipping any that fail.

    Args:
        databases: List of database names. If None, every key of
            ``RECOMMENDED_JDBC_DRIVERS`` is used.
        auto_download: Whether to auto-download drivers that are not cached.
        cache_dir: Directory to cache downloaded drivers.

    Returns:
        Paths of the drivers that could be resolved, in request order. A
        database whose lookup raises is logged as a warning and omitted.
    """
    requested = list(RECOMMENDED_JDBC_DRIVERS.keys()) if databases is None else databases

    resolved = []
    for database in requested:
        try:
            jar_path = get_driver_path(
                database, auto_download=auto_download, cache_dir=cache_dir
            )
        except Exception as e:
            # Best effort: one unavailable driver must not block the others.
            logger.warning(f"Failed to get driver for {database}: {e}")
        else:
            resolved.append(jar_path)
    return resolved
def get_classpath_with_drivers(
    databases: list[str] | None = None,
    auto_download: bool = True,
    manual_classpath: list[Path] | None = None,
    cache_dir: Path | None = None,
) -> list[Path]:
    """
    Build a classpath from manual entries plus auto-downloaded drivers.

    Args:
        databases: List of database names for auto-download. If None, all
            recommended drivers are requested.
        auto_download: Whether to auto-download drivers. When False only the
            manual entries are returned.
        manual_classpath: Additional manual classpath entries. They are placed
            first (higher priority) and the list itself is not modified.
        cache_dir: Directory to cache downloaded drivers; forwarded to
            ``get_all_driver_paths``. If None, that helper's default applies.

    Returns:
        All classpath entries, de-duplicated with first-occurrence order kept.
    """
    # Copy so the caller's list is never mutated.
    classpath = list(manual_classpath or [])

    if auto_download:
        try:
            classpath.extend(
                get_all_driver_paths(
                    databases, auto_download=True, cache_dir=cache_dir
                )
            )
        except Exception as e:
            # Best effort: fall back to whatever was collected so far.
            logger.warning(f"Failed to auto-download some drivers: {e}")

    # dict keys keep insertion order, which gives order-preserving de-duplication.
    return list(dict.fromkeys(classpath))
def verify_driver(driver_path: Path) -> bool:
    """
    Run cheap sanity checks on a JDBC driver JAR file.

    Args:
        driver_path: Path to the driver JAR file.

    Returns:
        True if the path exists, is a regular file, has the ``.jar`` suffix
        and is not empty; False otherwise.
    """
    # The checks short-circuit in order, so stat() is only reached for an
    # existing regular ``.jar`` file.
    # Could add more validation (e.g., ZIP file structure)
    return (
        driver_path.exists()
        and driver_path.is_file()
        and driver_path.suffix == ".jar"
        and driver_path.stat().st_size != 0
    )
+def list_cached_drivers(cache_dir: Path | None = None) -> list[Path]:
+    """
+    List all cached JDBC drivers.
+    Args:
+        cache_dir: Directory to check. If None, uses default.
+    Returns:
+        List of paths to cached driver JAR files.
+    """
+    if cache_dir is None:
+        cache_dir = get_driver_cache_dir()
+    if not cache_dir.exists():
+        return []
+    return [path for path in cache_dir.glob("*.jar") if verify_driver(path)]
def clear_driver_cache(cache_dir: Path | None = None) -> int:
    """
    Delete every ``*.jar`` file directly inside the driver cache directory.

    Args:
        cache_dir: Directory to clear. If None, uses the directory returned by
            ``get_driver_cache_dir()``.

    Returns:
        Number of files deleted. A file that cannot be removed is logged as a
        warning and not counted.
    """
    directory = get_driver_cache_dir() if cache_dir is None else cache_dir
    if not directory.exists():
        return 0

    count = 0
    for path in directory.glob("*.jar"):
        try:
            path.unlink()
            count = count + 1
            logger.debug(f"Deleted cached driver: {path}")
        except Exception as e:
            # Keep going: one undeletable file should not abort the sweep.
            logger.warning(f"Failed to delete {path}: {e}")
    return count

sqlalchemy_jdbcapi/jdbc/exceptions.py ADDED Viewed

@@ -0,0 +1,53 @@
+"""
+JDBC Exception hierarchy following DB-API 2.0 specification.
+"""
+from __future__ import annotations
class Error(Exception):
    """Root of the JDBC error hierarchy; every error below derives from it."""


class Warning(Exception):  # noqa: A001 - DB-API 2.0 requires Warning exception class
    """Raised for important warnings; deliberately not a subclass of Error."""


class InterfaceError(Error):
    """Raised for problems with the database interface itself."""


class DatabaseError(Error):
    """Raised for problems that relate to the database."""


class InternalError(DatabaseError):
    """Raised when the database reports an internal error."""


class OperationalError(DatabaseError):
    """Raised for operational database errors."""


class ProgrammingError(DatabaseError):
    """Raised for programming errors."""


class IntegrityError(DatabaseError):
    """Raised when database integrity is violated."""


class DataError(DatabaseError):
    """Raised for problems with the processed data."""


class NotSupportedError(DatabaseError):
    """Raised when a method or database API is not supported."""


class JDBCDriverNotFoundError(InterfaceError):
    """Raised when the JDBC driver cannot be found."""


class JVMNotStartedError(InterfaceError):
    """Raised when the JVM is not started."""