PyPI - moltres - Versions diffs - 0.18.0__tar.gz - Mend

moltres 0.18.0__tar.gz

This diff shows the content of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (93) hide show

moltres-0.18.0/PKG-INFO +378 -0
moltres-0.18.0/README.md +306 -0
moltres-0.18.0/pyproject.toml +181 -0
moltres-0.18.0/setup.cfg +4 -0
moltres-0.18.0/src/moltres/__init__.py +312 -0
moltres-0.18.0/src/moltres/config.py +202 -0
moltres-0.18.0/src/moltres/dataframe/__init__.py +0 -0
moltres-0.18.0/src/moltres/dataframe/async_dataframe.py +1867 -0
moltres-0.18.0/src/moltres/dataframe/async_groupby.py +422 -0
moltres-0.18.0/src/moltres/dataframe/async_pandas_dataframe.py +1422 -0
moltres-0.18.0/src/moltres/dataframe/async_pandas_groupby.py +408 -0
moltres-0.18.0/src/moltres/dataframe/async_pandas_indexers.py +117 -0
moltres-0.18.0/src/moltres/dataframe/async_polars_dataframe.py +1582 -0
moltres-0.18.0/src/moltres/dataframe/async_polars_groupby.py +385 -0
moltres-0.18.0/src/moltres/dataframe/async_reader.py +557 -0
moltres-0.18.0/src/moltres/dataframe/async_writer.py +996 -0
moltres-0.18.0/src/moltres/dataframe/create_dataframe.py +620 -0
moltres-0.18.0/src/moltres/dataframe/dataframe.py +2715 -0
moltres-0.18.0/src/moltres/dataframe/groupby.py +429 -0
moltres-0.18.0/src/moltres/dataframe/pandas_column.py +142 -0
moltres-0.18.0/src/moltres/dataframe/pandas_dataframe.py +1446 -0
moltres-0.18.0/src/moltres/dataframe/pandas_groupby.py +341 -0
moltres-0.18.0/src/moltres/dataframe/pandas_string_accessor.py +208 -0
moltres-0.18.0/src/moltres/dataframe/polars_column.py +151 -0
moltres-0.18.0/src/moltres/dataframe/polars_dataframe.py +1650 -0
moltres-0.18.0/src/moltres/dataframe/polars_datetime_accessor.py +144 -0
moltres-0.18.0/src/moltres/dataframe/polars_groupby.py +295 -0
moltres-0.18.0/src/moltres/dataframe/polars_string_accessor.py +195 -0
moltres-0.18.0/src/moltres/dataframe/reader.py +656 -0
moltres-0.18.0/src/moltres/dataframe/readers/__init__.py +24 -0
moltres-0.18.0/src/moltres/dataframe/readers/async_csv_reader.py +491 -0
moltres-0.18.0/src/moltres/dataframe/readers/async_json_reader.py +392 -0
moltres-0.18.0/src/moltres/dataframe/readers/async_parquet_reader.py +192 -0
moltres-0.18.0/src/moltres/dataframe/readers/async_readers_init.py +8 -0
moltres-0.18.0/src/moltres/dataframe/readers/async_text_reader.py +176 -0
moltres-0.18.0/src/moltres/dataframe/readers/compression.py +132 -0
moltres-0.18.0/src/moltres/dataframe/readers/csv_reader.py +489 -0
moltres-0.18.0/src/moltres/dataframe/readers/json_reader.py +643 -0
moltres-0.18.0/src/moltres/dataframe/readers/parquet_reader.py +181 -0
moltres-0.18.0/src/moltres/dataframe/readers/schema_inference.py +195 -0
moltres-0.18.0/src/moltres/dataframe/readers/text_reader.py +175 -0
moltres-0.18.0/src/moltres/dataframe/writer.py +1190 -0
moltres-0.18.0/src/moltres/engine/__init__.py +22 -0
moltres-0.18.0/src/moltres/engine/async_connection.py +253 -0
moltres-0.18.0/src/moltres/engine/async_execution.py +332 -0
moltres-0.18.0/src/moltres/engine/connection.py +117 -0
moltres-0.18.0/src/moltres/engine/dialects.py +30 -0
moltres-0.18.0/src/moltres/engine/execution.py +304 -0
moltres-0.18.0/src/moltres/expressions/__init__.py +273 -0
moltres-0.18.0/src/moltres/expressions/column.py +311 -0
moltres-0.18.0/src/moltres/expressions/expr.py +46 -0
moltres-0.18.0/src/moltres/expressions/functions.py +3726 -0
moltres-0.18.0/src/moltres/expressions/sql_parser.py +451 -0
moltres-0.18.0/src/moltres/expressions/when.py +64 -0
moltres-0.18.0/src/moltres/expressions/window.py +203 -0
moltres-0.18.0/src/moltres/io/__init__.py +0 -0
moltres-0.18.0/src/moltres/io/read.py +49 -0
moltres-0.18.0/src/moltres/io/records.py +1367 -0
moltres-0.18.0/src/moltres/io/write.py +33 -0
moltres-0.18.0/src/moltres/logical/__init__.py +0 -0
moltres-0.18.0/src/moltres/logical/operators.py +438 -0
moltres-0.18.0/src/moltres/logical/plan.py +299 -0
moltres-0.18.0/src/moltres/py.typed +0 -0
moltres-0.18.0/src/moltres/sql/__init__.py +0 -0
moltres-0.18.0/src/moltres/sql/builders.py +59 -0
moltres-0.18.0/src/moltres/sql/compiler.py +3154 -0
moltres-0.18.0/src/moltres/sql/ddl.py +726 -0
moltres-0.18.0/src/moltres/table/__init__.py +0 -0
moltres-0.18.0/src/moltres/table/actions.py +393 -0
moltres-0.18.0/src/moltres/table/async_actions.py +425 -0
moltres-0.18.0/src/moltres/table/async_mutations.py +306 -0
moltres-0.18.0/src/moltres/table/async_table.py +1358 -0
moltres-0.18.0/src/moltres/table/batch.py +95 -0
moltres-0.18.0/src/moltres/table/mutations.py +309 -0
moltres-0.18.0/src/moltres/table/schema.py +328 -0
moltres-0.18.0/src/moltres/table/sqlalchemy_integration.py +530 -0
moltres-0.18.0/src/moltres/table/table.py +1485 -0
moltres-0.18.0/src/moltres/utils/__init__.py +0 -0
moltres-0.18.0/src/moltres/utils/exceptions.py +322 -0
moltres-0.18.0/src/moltres/utils/health.py +280 -0
moltres-0.18.0/src/moltres/utils/inspector.py +613 -0
moltres-0.18.0/src/moltres/utils/optional_deps.py +219 -0
moltres-0.18.0/src/moltres/utils/retry.py +241 -0
moltres-0.18.0/src/moltres/utils/telemetry.py +255 -0
moltres-0.18.0/src/moltres/utils/typing.py +10 -0
moltres-0.18.0/src/moltres/utils/validation.py +43 -0
moltres-0.18.0/src/moltres.egg-info/PKG-INFO +378 -0
moltres-0.18.0/src/moltres.egg-info/SOURCES.txt +91 -0
moltres-0.18.0/src/moltres.egg-info/dependency_links.txt +1 -0
moltres-0.18.0/src/moltres.egg-info/requires.txt +52 -0
moltres-0.18.0/src/moltres.egg-info/top_level.txt +1 -0
moltres-0.18.0/tests/test_connection_validation.py +75 -0
moltres-0.18.0/tests/test_imports.py +5 -0

moltres-0.18.0/PKG-INFO ADDED Viewed

@@ -0,0 +1,378 @@
+Metadata-Version: 2.4
+Name: moltres
+Version: 0.18.0
+Summary: DataFrame API with SQL pushdown execution and real SQL CRUD - the missing layer for SQL in Python
+Author-email: Odos Matthews <odosmatthews@gmail.com>
+License-Expression: MIT
+Project-URL: Homepage, https://github.com/eddiethedean/moltres
+Project-URL: Repository, https://github.com/eddiethedean/moltres
+Project-URL: Issues, https://github.com/eddiethedean/moltres/issues
+Keywords: dataframe,sql,crud,pushdown,etl,data-engineering,sqlalchemy,pandas,polars,spark,database,query-builder
+Classifier: Development Status :: 4 - Beta
+Classifier: Intended Audience :: Developers
+Classifier: Programming Language :: Python
+Classifier: Programming Language :: Python :: 3
+Classifier: Programming Language :: Python :: 3 :: Only
+Classifier: Programming Language :: Python :: 3.9
+Classifier: Programming Language :: Python :: 3.10
+Classifier: Programming Language :: Python :: 3.11
+Classifier: Programming Language :: Python :: 3.12
+Classifier: Operating System :: MacOS :: MacOS X
+Classifier: Operating System :: Microsoft :: Windows
+Classifier: Operating System :: POSIX :: Linux
+Classifier: Topic :: Database
+Classifier: Topic :: Software Development :: Libraries
+Requires-Python: >=3.9
+Description-Content-Type: text/markdown
+Requires-Dist: SQLAlchemy>=2.0
+Requires-Dist: typing-extensions>=4.5
+Provides-Extra: polars
+Requires-Dist: polars>=1.0; extra == "polars"
+Provides-Extra: pandas
+Requires-Dist: pandas>=2.1; extra == "pandas"
+Provides-Extra: async
+Requires-Dist: aiofiles>=23.0; extra == "async"
+Requires-Dist: greenlet>=3.0.0; extra == "async"
+Provides-Extra: async-postgresql
+Requires-Dist: aiofiles>=23.0; extra == "async-postgresql"
+Requires-Dist: asyncpg>=0.29.0; extra == "async-postgresql"
+Requires-Dist: greenlet>=3.0.0; extra == "async-postgresql"
+Provides-Extra: async-mysql
+Requires-Dist: aiofiles>=23.0; extra == "async-mysql"
+Requires-Dist: aiomysql>=0.2.0; extra == "async-mysql"
+Requires-Dist: greenlet>=3.0.0; extra == "async-mysql"
+Provides-Extra: async-sqlite
+Requires-Dist: aiofiles>=23.0; extra == "async-sqlite"
+Requires-Dist: aiosqlite>=0.19.0; extra == "async-sqlite"
+Requires-Dist: greenlet>=3.0.0; extra == "async-sqlite"
+Provides-Extra: dev
+Requires-Dist: pytest>=8.0; extra == "dev"
+Requires-Dist: pytest-asyncio>=0.21.0; extra == "dev"
+Requires-Dist: pytest-cov>=4.1; extra == "dev"
+Requires-Dist: pytest-green-light>=0.2.0; extra == "dev"
+Requires-Dist: pytest-xdist>=3.5; extra == "dev"
+Requires-Dist: mypy>=1.8; extra == "dev"
+Requires-Dist: sphinx>=7.0; extra == "dev"
+Requires-Dist: sphinx-rtd-theme>=2.0; extra == "dev"
+Requires-Dist: ruff>=0.6; extra == "dev"
+Requires-Dist: pre-commit>=3.5; extra == "dev"
+Requires-Dist: pandas>=2.1; extra == "dev"
+Requires-Dist: pandas-stubs>=2.1; extra == "dev"
+Requires-Dist: polars>=1.0; extra == "dev"
+Requires-Dist: pyarrow>=10.0; extra == "dev"
+Requires-Dist: aiofiles>=23.0; extra == "dev"
+Requires-Dist: aiosqlite>=0.19.0; extra == "dev"
+Requires-Dist: asyncpg>=0.29.0; extra == "dev"
+Requires-Dist: greenlet>=3.0.0; extra == "dev"
+Requires-Dist: testing.postgresql>=1.3.0; extra == "dev"
+Requires-Dist: testing.mysqld>=1.4.0; extra == "dev"
+Requires-Dist: psycopg2-binary>=2.9.0; extra == "dev"
+Requires-Dist: pymysql>=1.0.0; extra == "dev"
+Requires-Dist: duckdb-engine>=0.9.0; extra == "dev"
+# Moltres
+<div align="center">
+[![CI](https://github.com/eddiethedean/moltres/actions/workflows/ci.yml/badge.svg)](https://github.com/eddiethedean/moltres/actions/workflows/ci.yml)
+[![Python 3.9+](https://img.shields.io/badge/python-3.9+-blue.svg)](https://github.com/eddiethedean/moltres)
+[![License: MIT](https://img.shields.io/badge/License-MIT-yellow.svg)](https://github.com/eddiethedean/moltres/blob/main/LICENSE)
+[![Code style: ruff](https://img.shields.io/endpoint?url=https://raw.githubusercontent.com/astral-sh/ruff/main/assets/badge/v2.json)](https://github.com/astral-sh/ruff)
+**The Missing DataFrame Layer for SQL in Python**
+**MOLTRES**: **M**odern **O**perations **L**ayer for **T**ransformations, **R**elational **E**xecution, and **S**QL
+[Installation](#-installation) • [Quick Start](#-quick-start) • [Documentation](#-documentation) • [Examples](#-examples)
+</div>
+---
+**Moltres** combines a DataFrame API (like Pandas/Polars), SQL pushdown execution (no data loading into memory), and real SQL CRUD operations (INSERT, UPDATE, DELETE) in one unified interface.
+Transform millions of rows using familiar DataFrame operations—all executed directly in SQL without materializing data. Update, insert, and delete with column-aware, type-safe operations.
+## ✨ Features
+- 🚀 **PySpark-Style DataFrame API** - Primary API with familiar operations (select, filter, join, groupBy, etc.) for seamless migration from PySpark
+- 🐼 **Optional Pandas-Style Interface** - Comprehensive Pandas-like API with string accessor, query(), dtypes, shape, pivot, sample, concat, and more
+- 🦀 **Optional Polars-Style Interface** - Polars LazyFrame-like API with expression-based operations, set operations, file I/O, CTEs, and more
+- 🎯 **98% PySpark API Compatibility** - Near-complete compatibility for seamless migration
+- 🗄️ **SQL Pushdown Execution** - All operations compile to SQL and run on your database—no data loading into memory
+- ✏️ **Real SQL CRUD** - INSERT, UPDATE, DELETE operations with DataFrame-style syntax
+- 📊 **Multiple Formats** - Read/write CSV, JSON, JSONL, Parquet, and more
+- 🐼 **Pandas & Polars Integration** - Pass pandas/polars DataFrames directly to moltres operations
+- 🌊 **Streaming Support** - Handle datasets larger than memory with chunked processing
+- ⚡ **Async Support** - Full async/await support for all operations
+- 🔒 **Security First** - Built-in SQL injection prevention and validation
+## 📦 Installation
+```bash
+pip install moltres
+# Optional: For async support
+pip install "moltres[async-postgresql]"  # PostgreSQL
+pip install "moltres[async-mysql]"       # MySQL
+pip install "moltres[async-sqlite]"      # SQLite
+# Optional: For pandas/polars result formats
+pip install "moltres[pandas,polars]"
+```
+## 🚀 Quick Start
+### Basic DataFrame Operations
+```python
+from moltres import col, connect
+from moltres.expressions import functions as F
+# Connect to your database
+db = connect("sqlite:///example.db")
+# DataFrame operations with SQL pushdown (no data loading into memory)
+df = (
+    db.table("orders")
+    .select()
+    .join(db.table("customers").select(), on=[col("orders.customer_id") == col("customers.id")])
+    .where(col("active") == True)
+    .group_by("country")
+    .agg(F.sum(col("amount")).alias("total_amount"))
+)
+# Execute and get results (SQL is compiled and executed here)
+results = df.collect()  # Returns list of dicts by default
+```
+### Pandas-Style Interface
+```python
+df = db.table("users").pandas()
+# Pandas-style operations
+df[['id', 'name']]  # Select columns
+df.query('age > 25 and country == "USA"')  # Query with AND/OR
+df['name'].str.upper()  # String accessor
+df.groupby('country').agg(age='mean')  # GroupBy
+```
+📚 **[See the Pandas Interface Guide →](guides/09-pandas-interface.md)**
+### Polars-Style Interface
+```python
+df = db.table("users").polars()
+# Polars-style operations
+df.select("id", "name", (col("age") * 2).alias("double_age"))
+df.filter((col("age") > 25) & (col("country") == "USA"))
+df.group_by("country").agg(F.sum(col("age")))
+```
+📚 **[See the Polars Interface Guide →](guides/10-polars-interface.md)**
+### CRUD Operations
+```python
+from moltres.io.records import Records
+# Insert rows
+Records.from_list([
+    {"id": 1, "name": "Alice", "email": "alice@example.com"},
+    {"id": 2, "name": "Bob", "email": "bob@example.com"},
+], database=db).insert_into("users")
+# Update rows
+db.update("users", where=col("active") == 0, set={"active": 1})
+# Delete rows
+db.delete("users", where=col("email").is_null())
+```
+📚 **[See CRUD Operations Guide →](guides/05-common-patterns.md#data-mutations)**
+## 📖 Documentation
+### Getting Started
+- **[Getting Started Guide](guides/01-getting-started.md)** - Step-by-step introduction
+- **[Examples Directory](examples/)** - 19 comprehensive example files
+- **[Examples Guide](docs/EXAMPLES.md)** - Common patterns and use cases
+### Interface Guides
+- **[Pandas Interface](guides/09-pandas-interface.md)** - Complete pandas-style API reference
+- **[Polars Interface](guides/10-polars-interface.md)** - Complete Polars-style API reference
+- **[PySpark Migration](guides/03-migrating-from-pyspark.md)** - Migrating from PySpark
+### Core Topics
+- **[Reading Data](guides/01-getting-started.md#reading-data)** - Tables, SQL, files
+- **[Writing Data](guides/01-getting-started.md#writing-data)** - Tables, files, formats
+- **[Table Management](guides/01-getting-started.md#table-management)** - Create, drop, constraints
+- **[Schema Inspection](guides/01-getting-started.md#schema-inspection)** - Reflection and inspection
+- **[Streaming](guides/04-performance-optimization.md#streaming)** - Large dataset handling
+- **[Async Operations](guides/07-advanced-topics.md#async-support)** - Async/await support
+### Advanced Topics
+- **[Performance Optimization](guides/04-performance-optimization.md)** - Query optimization and best practices
+- **[Error Handling](guides/06-error-handling.md)** - Exception handling and debugging
+- **[Best Practices](guides/08-best-practices.md)** - Production-ready patterns
+- **[Advanced Topics](guides/07-advanced-topics.md)** - Window functions, CTEs, transactions
+### Reference
+- **[Why Moltres?](docs/WHY_MOLTRES.md)** - Understanding the gap Moltres fills
+- **[Security Guide](docs/SECURITY.md)** - Security best practices
+- **[Troubleshooting](docs/TROUBLESHOOTING.md)** - Common issues and solutions
+- **[API Reference](docs/api/)** - Complete API documentation
+## 📚 Examples
+Comprehensive examples demonstrating all Moltres features:
+- **[01_connecting.py](examples/01_connecting.py)** - Database connections (sync and async)
+- **[02_dataframe_basics.py](examples/02_dataframe_basics.py)** - Basic DataFrame operations
+- **[03_async_dataframe.py](examples/03_async_dataframe.py)** - Asynchronous operations
+- **[04_joins.py](examples/04_joins.py)** - Join operations
+- **[05_groupby.py](examples/05_groupby.py)** - GroupBy and aggregation
+- **[06_expressions.py](examples/06_expressions.py)** - Column expressions and functions
+- **[07_file_reading.py](examples/07_file_reading.py)** - Reading files (CSV, JSON, Parquet)
+- **[08_file_writing.py](examples/08_file_writing.py)** - Writing DataFrames to files
+- **[09_table_operations.py](examples/09_table_operations.py)** - Table operations and mutations
+- **[10_create_dataframe.py](examples/10_create_dataframe.py)** - Creating DataFrames from Python data
+- **[11_window_functions.py](examples/11_window_functions.py)** - Window functions
+- **[12_sql_operations.py](examples/12_sql_operations.py)** - Raw SQL and SQL operations
+- **[13_transactions.py](examples/13_transactions.py)** - Transaction management
+- **[14_reflection.py](examples/14_reflection.py)** - Schema inspection and reflection
+- **[15_pandas_polars_dataframes.py](examples/15_pandas_polars_dataframes.py)** - Pandas/Polars integration
+- **[16_ux_features.py](examples/16_ux_features.py)** - UX improvements
+- **[17_sqlalchemy_models.py](examples/17_sqlalchemy_models.py)** - SQLAlchemy ORM integration
+- **[18_pandas_interface.py](examples/18_pandas_interface.py)** - Pandas-style interface examples
+- **[19_polars_interface.py](examples/19_polars_interface.py)** - Polars-style interface examples
+See the [examples directory](examples/) for all example files.
+## 🛠️ Supported Operations
+### DataFrame Operations
+- `select()` / `selectExpr()` - Project columns or SQL expressions
+- `where()` / `filter()` - Filter rows
+- `join()` - Join with other DataFrames
+- `group_by()` / `groupBy()` - Group rows
+- `agg()` - Aggregate functions
+- `order_by()` / `orderBy()` / `sort()` - Sort rows
+- `limit()` - Limit number of rows
+- `distinct()` - Remove duplicate rows
+- `withColumn()` - Add or replace columns
+- `pivot()` - Pivot operations
+- `explode()` - Explode array/JSON columns
+### Column Expressions
+- **Arithmetic**: `+`, `-`, `*`, `/`, `%`
+- **Comparisons**: `==`, `!=`, `<`, `>`, `<=`, `>=`
+- **Boolean**: `&`, `|`, `~`
+- **Functions**: 130+ functions including mathematical, string, date/time, aggregate, window, array, JSON, and utility functions
+- **Window Functions**: `over()`, `partition_by()`, `order_by()` - Full PySpark compatibility
+📚 **[See Expressions Guide →](examples/06_expressions.py)**
+### Supported SQL Dialects
+- ✅ **SQLite** - Full support
+- ✅ **PostgreSQL** - Full support with dialect-specific optimizations
+- ✅ **MySQL** - Full support with dialect-specific optimizations
+- ✅ **DuckDB** - Full support with PostgreSQL-compatible optimizations
+- ✅ **Other SQLAlchemy-supported databases** - ANSI SQL fallback
+## 🧪 Development
+### Setup
+```bash
+# Clone the repository
+git clone https://github.com/eddiethedean/moltres.git
+cd moltres
+# Install in development mode
+pip install -e ".[dev]"
+# Install pre-commit hooks
+pre-commit install
+```
+### Running Tests
+```bash
+# Run all tests
+pytest
+# Run tests in parallel
+pytest -n 9
+# Run with coverage
+pytest --cov=src/moltres --cov-report=html
+```
+### Code Quality
+```bash
+# Linting
+ruff check .
+# Formatting
+ruff format .
+# Type checking (strict mode enabled)
+mypy src
+```
+### Pre-Commit CI Checks
+```bash
+# Run all CI checks (linting, type checking, tests)
+make ci-check
+# Quick linting check only
+make ci-check-lint
+```
+## 🤝 Contributing
+Contributions are welcome! Please see [`CONTRIBUTING.md`](CONTRIBUTING.md) for guidelines.
+**Quick Start:**
+1. Fork the repository
+2. Create a feature branch (`git checkout -b feature/amazing-feature`)
+3. Commit your changes (`git commit -m 'Add some amazing feature'`)
+4. Push to the branch (`git push origin feature/amazing-feature`)
+5. Open a Pull Request
+**Before submitting:**
+- Run tests: `pytest`
+- Check code quality: `ruff check . && mypy src`
+- Update documentation if needed
+## 👤 Author
+**Odos Matthews**
+- GitHub: [@eddiethedean](https://github.com/eddiethedean)
+- Email: odosmatthews@gmail.com
+## 🙏 Acknowledgments
+- Inspired by PySpark's DataFrame API style, but focused on SQL feature support rather than PySpark feature parity
+- Built on SQLAlchemy for database connectivity and SQL compilation
+- Thanks to all contributors and users
+## 📄 License
+MIT License - see [LICENSE](LICENSE) file for details.
+---
+<div align="center">
+**Made with ❤️ for the Python data community**
+[⬆ Back to Top](#moltres)
+</div>

moltres-0.18.0/README.md ADDED Viewed

@@ -0,0 +1,306 @@
+# Moltres
+<div align="center">
+[![CI](https://github.com/eddiethedean/moltres/actions/workflows/ci.yml/badge.svg)](https://github.com/eddiethedean/moltres/actions/workflows/ci.yml)
+[![Python 3.9+](https://img.shields.io/badge/python-3.9+-blue.svg)](https://github.com/eddiethedean/moltres)
+[![License: MIT](https://img.shields.io/badge/License-MIT-yellow.svg)](https://github.com/eddiethedean/moltres/blob/main/LICENSE)
+[![Code style: ruff](https://img.shields.io/endpoint?url=https://raw.githubusercontent.com/astral-sh/ruff/main/assets/badge/v2.json)](https://github.com/astral-sh/ruff)
+**The Missing DataFrame Layer for SQL in Python**
+**MOLTRES**: **M**odern **O**perations **L**ayer for **T**ransformations, **R**elational **E**xecution, and **S**QL
+[Installation](#-installation) • [Quick Start](#-quick-start) • [Documentation](#-documentation) • [Examples](#-examples)
+</div>
+---
+**Moltres** combines a DataFrame API (like Pandas/Polars), SQL pushdown execution (no data loading into memory), and real SQL CRUD operations (INSERT, UPDATE, DELETE) in one unified interface.
+Transform millions of rows using familiar DataFrame operations—all executed directly in SQL without materializing data. Update, insert, and delete with column-aware, type-safe operations.
+## ✨ Features
+- 🚀 **PySpark-Style DataFrame API** - Primary API with familiar operations (select, filter, join, groupBy, etc.) for seamless migration from PySpark
+- 🐼 **Optional Pandas-Style Interface** - Comprehensive Pandas-like API with string accessor, query(), dtypes, shape, pivot, sample, concat, and more
+- 🦀 **Optional Polars-Style Interface** - Polars LazyFrame-like API with expression-based operations, set operations, file I/O, CTEs, and more
+- 🎯 **98% PySpark API Compatibility** - Near-complete compatibility for seamless migration
+- 🗄️ **SQL Pushdown Execution** - All operations compile to SQL and run on your database—no data loading into memory
+- ✏️ **Real SQL CRUD** - INSERT, UPDATE, DELETE operations with DataFrame-style syntax
+- 📊 **Multiple Formats** - Read/write CSV, JSON, JSONL, Parquet, and more
+- 🐼 **Pandas & Polars Integration** - Pass pandas/polars DataFrames directly to moltres operations
+- 🌊 **Streaming Support** - Handle datasets larger than memory with chunked processing
+- ⚡ **Async Support** - Full async/await support for all operations
+- 🔒 **Security First** - Built-in SQL injection prevention and validation
+## 📦 Installation
+```bash
+pip install moltres
+# Optional: For async support
+pip install "moltres[async-postgresql]"  # PostgreSQL
+pip install "moltres[async-mysql]"       # MySQL
+pip install "moltres[async-sqlite]"      # SQLite
+# Optional: For pandas/polars result formats
+pip install "moltres[pandas,polars]"
+```
+## 🚀 Quick Start
+### Basic DataFrame Operations
+```python
+from moltres import col, connect
+from moltres.expressions import functions as F
+# Connect to your database
+db = connect("sqlite:///example.db")
+# DataFrame operations with SQL pushdown (no data loading into memory)
+df = (
+    db.table("orders")
+    .select()
+    .join(db.table("customers").select(), on=[col("orders.customer_id") == col("customers.id")])
+    .where(col("active") == True)
+    .group_by("country")
+    .agg(F.sum(col("amount")).alias("total_amount"))
+)
+# Execute and get results (SQL is compiled and executed here)
+results = df.collect()  # Returns list of dicts by default
+```
+### Pandas-Style Interface
+```python
+df = db.table("users").pandas()
+# Pandas-style operations
+df[['id', 'name']]  # Select columns
+df.query('age > 25 and country == "USA"')  # Query with AND/OR
+df['name'].str.upper()  # String accessor
+df.groupby('country').agg(age='mean')  # GroupBy
+```
+📚 **[See the Pandas Interface Guide →](guides/09-pandas-interface.md)**
+### Polars-Style Interface
+```python
+df = db.table("users").polars()
+# Polars-style operations
+df.select("id", "name", (col("age") * 2).alias("double_age"))
+df.filter((col("age") > 25) & (col("country") == "USA"))
+df.group_by("country").agg(F.sum(col("age")))
+```
+📚 **[See the Polars Interface Guide →](guides/10-polars-interface.md)**
+### CRUD Operations
+```python
+from moltres.io.records import Records
+# Insert rows
+Records.from_list([
+    {"id": 1, "name": "Alice", "email": "alice@example.com"},
+    {"id": 2, "name": "Bob", "email": "bob@example.com"},
+], database=db).insert_into("users")
+# Update rows
+db.update("users", where=col("active") == 0, set={"active": 1})
+# Delete rows
+db.delete("users", where=col("email").is_null())
+```
+📚 **[See CRUD Operations Guide →](guides/05-common-patterns.md#data-mutations)**
+## 📖 Documentation
+### Getting Started
+- **[Getting Started Guide](guides/01-getting-started.md)** - Step-by-step introduction
+- **[Examples Directory](examples/)** - 19 comprehensive example files
+- **[Examples Guide](docs/EXAMPLES.md)** - Common patterns and use cases
+### Interface Guides
+- **[Pandas Interface](guides/09-pandas-interface.md)** - Complete pandas-style API reference
+- **[Polars Interface](guides/10-polars-interface.md)** - Complete Polars-style API reference
+- **[PySpark Migration](guides/03-migrating-from-pyspark.md)** - Migrating from PySpark
+### Core Topics
+- **[Reading Data](guides/01-getting-started.md#reading-data)** - Tables, SQL, files
+- **[Writing Data](guides/01-getting-started.md#writing-data)** - Tables, files, formats
+- **[Table Management](guides/01-getting-started.md#table-management)** - Create, drop, constraints
+- **[Schema Inspection](guides/01-getting-started.md#schema-inspection)** - Reflection and inspection
+- **[Streaming](guides/04-performance-optimization.md#streaming)** - Large dataset handling
+- **[Async Operations](guides/07-advanced-topics.md#async-support)** - Async/await support
+### Advanced Topics
+- **[Performance Optimization](guides/04-performance-optimization.md)** - Query optimization and best practices
+- **[Error Handling](guides/06-error-handling.md)** - Exception handling and debugging
+- **[Best Practices](guides/08-best-practices.md)** - Production-ready patterns
+- **[Advanced Topics](guides/07-advanced-topics.md)** - Window functions, CTEs, transactions
+### Reference
+- **[Why Moltres?](docs/WHY_MOLTRES.md)** - Understanding the gap Moltres fills
+- **[Security Guide](docs/SECURITY.md)** - Security best practices
+- **[Troubleshooting](docs/TROUBLESHOOTING.md)** - Common issues and solutions
+- **[API Reference](docs/api/)** - Complete API documentation
+## 📚 Examples
+Comprehensive examples demonstrating all Moltres features:
+- **[01_connecting.py](examples/01_connecting.py)** - Database connections (sync and async)
+- **[02_dataframe_basics.py](examples/02_dataframe_basics.py)** - Basic DataFrame operations
+- **[03_async_dataframe.py](examples/03_async_dataframe.py)** - Asynchronous operations
+- **[04_joins.py](examples/04_joins.py)** - Join operations
+- **[05_groupby.py](examples/05_groupby.py)** - GroupBy and aggregation
+- **[06_expressions.py](examples/06_expressions.py)** - Column expressions and functions
+- **[07_file_reading.py](examples/07_file_reading.py)** - Reading files (CSV, JSON, Parquet)
+- **[08_file_writing.py](examples/08_file_writing.py)** - Writing DataFrames to files
+- **[09_table_operations.py](examples/09_table_operations.py)** - Table operations and mutations
+- **[10_create_dataframe.py](examples/10_create_dataframe.py)** - Creating DataFrames from Python data
+- **[11_window_functions.py](examples/11_window_functions.py)** - Window functions
+- **[12_sql_operations.py](examples/12_sql_operations.py)** - Raw SQL and SQL operations
+- **[13_transactions.py](examples/13_transactions.py)** - Transaction management
+- **[14_reflection.py](examples/14_reflection.py)** - Schema inspection and reflection
+- **[15_pandas_polars_dataframes.py](examples/15_pandas_polars_dataframes.py)** - Pandas/Polars integration
+- **[16_ux_features.py](examples/16_ux_features.py)** - UX improvements
+- **[17_sqlalchemy_models.py](examples/17_sqlalchemy_models.py)** - SQLAlchemy ORM integration
+- **[18_pandas_interface.py](examples/18_pandas_interface.py)** - Pandas-style interface examples
+- **[19_polars_interface.py](examples/19_polars_interface.py)** - Polars-style interface examples
+See the [examples directory](examples/) for all example files.
+## 🛠️ Supported Operations
+### DataFrame Operations
+- `select()` / `selectExpr()` - Project columns or SQL expressions
+- `where()` / `filter()` - Filter rows
+- `join()` - Join with other DataFrames
+- `group_by()` / `groupBy()` - Group rows
+- `agg()` - Aggregate functions
+- `order_by()` / `orderBy()` / `sort()` - Sort rows
+- `limit()` - Limit number of rows
+- `distinct()` - Remove duplicate rows
+- `withColumn()` - Add or replace columns
+- `pivot()` - Pivot operations
+- `explode()` - Explode array/JSON columns
+### Column Expressions
+- **Arithmetic**: `+`, `-`, `*`, `/`, `%`
+- **Comparisons**: `==`, `!=`, `<`, `>`, `<=`, `>=`
+- **Boolean**: `&`, `|`, `~`
+- **Functions**: 130+ functions including mathematical, string, date/time, aggregate, window, array, JSON, and utility functions
+- **Window Functions**: `over()`, `partition_by()`, `order_by()` - Full PySpark compatibility
+📚 **[See Expressions Guide →](examples/06_expressions.py)**
+### Supported SQL Dialects
+- ✅ **SQLite** - Full support
+- ✅ **PostgreSQL** - Full support with dialect-specific optimizations
+- ✅ **MySQL** - Full support with dialect-specific optimizations
+- ✅ **DuckDB** - Full support with PostgreSQL-compatible optimizations
+- ✅ **Other SQLAlchemy-supported databases** - ANSI SQL fallback
+## 🧪 Development
+### Setup
+```bash
+# Clone the repository
+git clone https://github.com/eddiethedean/moltres.git
+cd moltres
+# Install in development mode
+pip install -e ".[dev]"
+# Install pre-commit hooks
+pre-commit install
+```
+### Running Tests
+```bash
+# Run all tests
+pytest
+# Run tests in parallel
+pytest -n 9
+# Run with coverage
+pytest --cov=src/moltres --cov-report=html
+```
+### Code Quality
+```bash
+# Linting
+ruff check .
+# Formatting
+ruff format .
+# Type checking (strict mode enabled)
+mypy src
+```
+### Pre-Commit CI Checks
+```bash
+# Run all CI checks (linting, type checking, tests)
+make ci-check
+# Quick linting check only
+make ci-check-lint
+```
+## 🤝 Contributing
+Contributions are welcome! Please see [`CONTRIBUTING.md`](CONTRIBUTING.md) for guidelines.
+**Quick Start:**
+1. Fork the repository
+2. Create a feature branch (`git checkout -b feature/amazing-feature`)
+3. Commit your changes (`git commit -m 'Add some amazing feature'`)
+4. Push to the branch (`git push origin feature/amazing-feature`)
+5. Open a Pull Request
+**Before submitting:**
+- Run tests: `pytest`
+- Check code quality: `ruff check . && mypy src`
+- Update documentation if needed
+## 👤 Author
+**Odos Matthews**
+- GitHub: [@eddiethedean](https://github.com/eddiethedean)
+- Email: odosmatthews@gmail.com
+## 🙏 Acknowledgments
+- Inspired by PySpark's DataFrame API style, but focused on SQL feature support rather than PySpark feature parity
+- Built on SQLAlchemy for database connectivity and SQL compilation
+- Thanks to all contributors and users
+## 📄 License
+MIT License - see [LICENSE](LICENSE) file for details.
+---
+<div align="center">
+**Made with ❤️ for the Python data community**
+[⬆ Back to Top](#moltres)
+</div>