PyPI - collie-mlops - Versions diffs - 0.1.1b0__py3-none-any.whl - Mend

collie-mlops 0.1.1b0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (45) hide show

collie/__init__.py +69 -0
collie/_common/__init__.py +0 -0
collie/_common/decorator.py +53 -0
collie/_common/exceptions.py +104 -0
collie/_common/mlflow_model_io/__init__.py +0 -0
collie/_common/mlflow_model_io/base_flavor_handler.py +26 -0
collie/_common/mlflow_model_io/flavor_registry.py +72 -0
collie/_common/mlflow_model_io/model_flavors.py +259 -0
collie/_common/mlflow_model_io/model_io.py +65 -0
collie/_common/utils.py +13 -0
collie/contracts/__init__.py +0 -0
collie/contracts/event.py +79 -0
collie/contracts/mlflow.py +444 -0
collie/contracts/orchestrator.py +79 -0
collie/core/__init__.py +41 -0
collie/core/enums/__init__.py +0 -0
collie/core/enums/components.py +26 -0
collie/core/enums/ml_models.py +20 -0
collie/core/evaluator/__init__.py +0 -0
collie/core/evaluator/evaluator.py +147 -0
collie/core/models.py +125 -0
collie/core/orchestrator/__init__.py +0 -0
collie/core/orchestrator/orchestrator.py +47 -0
collie/core/pusher/__init__.py +0 -0
collie/core/pusher/pusher.py +98 -0
collie/core/trainer/__init__.py +0 -0
collie/core/trainer/trainer.py +78 -0
collie/core/transform/__init__.py +0 -0
collie/core/transform/transform.py +87 -0
collie/core/tuner/__init__.py +0 -0
collie/core/tuner/tuner.py +84 -0
collie/helper/__init__.py +0 -0
collie/helper/pytorch/__init__.py +0 -0
collie/helper/pytorch/callback/__init__.py +0 -0
collie/helper/pytorch/callback/callback.py +155 -0
collie/helper/pytorch/callback/earlystop.py +54 -0
collie/helper/pytorch/callback/model_checkpoint.py +100 -0
collie/helper/pytorch/model/__init__.py +0 -0
collie/helper/pytorch/model/loader.py +55 -0
collie/helper/pytorch/trainer.py +304 -0
collie_mlops-0.1.1b0.dist-info/LICENSE +21 -0
collie_mlops-0.1.1b0.dist-info/METADATA +259 -0
collie_mlops-0.1.1b0.dist-info/RECORD +45 -0
collie_mlops-0.1.1b0.dist-info/WHEEL +5 -0
collie_mlops-0.1.1b0.dist-info/top_level.txt +1 -0

collie_mlops-0.1.1b0.dist-info/METADATA ADDED Viewed

@@ -0,0 +1,259 @@
+Metadata-Version: 2.1
+Name: collie-mlops
+Version: 0.1.1b0
+Summary: A Lightweight MLOps Framework for Machine Learning Workflows
+Home-page: https://github.com/ChingHuanChiu/collie
+Author: ChingHuanChiu
+Author-email: ChingHuanChiu <stevenchiou8@gmail.com>
+Maintainer-email: ChingHuanChiu <stevenchiou8@gmail.com>
+License: MIT
+Project-URL: Homepage, https://github.com/ChingHuanChiu/collie
+Project-URL: Documentation, https://github.com/ChingHuanChiu/collie/blob/main/README.md
+Project-URL: Repository, https://github.com/ChingHuanChiu/collie
+Project-URL: Bug Tracker, https://github.com/ChingHuanChiu/collie/issues
+Project-URL: Changelog, https://github.com/ChingHuanChiu/collie/blob/main/CHANGELOG.md
+Keywords: mlops,machine-learning,mlflow,pipeline,orchestration,deep-learning,experiment-tracking
+Classifier: Development Status :: 4 - Beta
+Classifier: Intended Audience :: Developers
+Classifier: Intended Audience :: Science/Research
+Classifier: License :: OSI Approved :: MIT License
+Classifier: Operating System :: OS Independent
+Classifier: Programming Language :: Python :: 3
+Classifier: Programming Language :: Python :: 3.10
+Classifier: Programming Language :: Python :: 3.11
+Classifier: Programming Language :: Python :: 3.12
+Classifier: Programming Language :: Python :: 3.13
+Classifier: Programming Language :: Python :: 3 :: Only
+Classifier: Topic :: Scientific/Engineering :: Artificial Intelligence
+Classifier: Topic :: Software Development :: Libraries :: Python Modules
+Classifier: Typing :: Typed
+Requires-Python: >=3.10
+Description-Content-Type: text/markdown
+License-File: LICENSE
+Requires-Dist: mlflow >=2.0.0
+Requires-Dist: pydantic >=2.0.0
+Requires-Dist: pandas >=1.3.0
+Requires-Dist: numpy <2.0.0,>=1.20.0
+Requires-Dist: scikit-learn >=1.0.0
+Requires-Dist: xgboost >=1.5.0
+Requires-Dist: torch >=1.9.0
+Requires-Dist: pytorch-lightning >=2.0.0
+Requires-Dist: lightgbm >=3.0.0
+Requires-Dist: transformers >=4.0.0
+Requires-Dist: sentence-transformers >=2.0.0
+Provides-Extra: all
+Requires-Dist: scikit-learn >=1.0.0 ; extra == 'all'
+Requires-Dist: xgboost >=1.5.0 ; extra == 'all'
+Requires-Dist: torch >=1.9.0 ; extra == 'all'
+Requires-Dist: pytorch-lightning >=2.0.0 ; extra == 'all'
+Requires-Dist: lightgbm >=3.0.0 ; extra == 'all'
+Requires-Dist: transformers >=4.0.0 ; extra == 'all'
+Requires-Dist: sentence-transformers >=2.0.0 ; extra == 'all'
+Requires-Dist: PyYAML >=5.4.0 ; extra == 'all'
+Requires-Dist: toml >=0.10.0 ; extra == 'all'
+Provides-Extra: config
+Requires-Dist: PyYAML >=5.4.0 ; extra == 'config'
+Requires-Dist: toml >=0.10.0 ; extra == 'config'
+Provides-Extra: dev
+Requires-Dist: pytest >=6.0.0 ; extra == 'dev'
+Requires-Dist: pytest-cov >=3.0.0 ; extra == 'dev'
+Requires-Dist: pytest-mock >=3.6.0 ; extra == 'dev'
+Requires-Dist: black >=22.0.0 ; extra == 'dev'
+Requires-Dist: isort >=5.10.0 ; extra == 'dev'
+Requires-Dist: flake8 >=4.0.0 ; extra == 'dev'
+Requires-Dist: mypy >=0.950 ; extra == 'dev'
+Requires-Dist: pre-commit >=2.15.0 ; extra == 'dev'
+Requires-Dist: twine >=4.0.0 ; extra == 'dev'
+Requires-Dist: build >=0.7.0 ; extra == 'dev'
+Provides-Extra: docs
+Requires-Dist: sphinx >=4.0.0 ; extra == 'docs'
+Requires-Dist: sphinx-rtd-theme >=1.0.0 ; extra == 'docs'
+Requires-Dist: sphinx-autodoc-typehints >=1.12.0 ; extra == 'docs'
+Requires-Dist: myst-parser >=0.18.0 ; extra == 'docs'
+Provides-Extra: lightgbm
+Requires-Dist: lightgbm >=3.0.0 ; extra == 'lightgbm'
+Provides-Extra: pytorch
+Requires-Dist: torch >=1.9.0 ; extra == 'pytorch'
+Requires-Dist: pytorch-lightning >=2.0.0 ; extra == 'pytorch'
+Provides-Extra: sklearn
+Requires-Dist: scikit-learn >=1.0.0 ; extra == 'sklearn'
+Provides-Extra: test
+Requires-Dist: pytest >=6.0.0 ; extra == 'test'
+Requires-Dist: pytest-cov >=3.0.0 ; extra == 'test'
+Requires-Dist: pytest-mock >=3.6.0 ; extra == 'test'
+Provides-Extra: transformers
+Requires-Dist: transformers >=4.0.0 ; extra == 'transformers'
+Requires-Dist: sentence-transformers >=2.0.0 ; extra == 'transformers'
+Provides-Extra: xgboost
+Requires-Dist: xgboost >=1.5.0 ; extra == 'xgboost'
+# Collie
+[![PyPI version](https://badge.fury.io/py/collie-mlops.svg)](https://badge.fury.io/py/collie-mlops)
+[![Python 3.10+](https://img.shields.io/badge/python-3.10+-blue.svg)](https://www.python.org/downloads/)
+[![License: MIT](https://img.shields.io/badge/License-MIT-yellow.svg)](https://opensource.org/licenses/MIT)
+[![Documentation](https://img.shields.io/badge/docs-sphinx-blue.svg)](https://collie-mlops.readthedocs.io/en/latest/getting_started.html)
+[![codecov](https://codecov.io/gh/ChingHuanChiu/collie/branch/main/graph/badge.svg)](https://codecov.io/gh/ChingHuanChiu/collie)
+A Lightweight MLOps Framework for Machine Learning Workflows
+## Overview
+Collie is a modern MLOps framework designed to streamline machine learning workflows by providing a component-based architecture integrated with MLflow. It enables data scientists and ML engineers to build, deploy, and manage ML pipelines with ease through modular components that handle different stages of the ML lifecycle.
+## Features
+- **Component-Based Architecture**: Modular design with specialized components for each ML workflow stage
+- **MLflow Integration**: Built-in experiment tracking, model registration, and deployment capabilities
+- **Pipeline Orchestration**: Seamless workflow management with event-driven architecture
+- **Model Management**: Automated model versioning, staging, and promotion
+- **Framework Agnostic**: Supports multiple ML frameworks (PyTorch, scikit-learn, XGBoost, LightGBM, Transformers)
+## Architecture
+Collie follows an event-driven architecture with the following core components:
+- **Transformer**: Data preprocessing and feature engineering
+- **Tuner**: Hyperparameter optimization
+- **Trainer**: Model training and validation
+- **Evaluator**: Model evaluation and comparison
+- **Pusher**: Model deployment and registration
+- **Orchestrator**: Workflow coordination and execution
+## Quick Start
+### Installation
+```bash
+pip install collie-mlops
+```
+This will install Collie with all supported ML frameworks, including:
+- scikit-learn
+- PyTorch
+- XGBoost
+- LightGBM
+- Transformers (with Sentence Transformers)
+### Prerequisites
+- Python >= 3.10
+- MLflow tracking server (can be local or remote)
+## Components
+### Transformer
+Handles data preprocessing, feature engineering, and data validation.
+```python
+class CustomTransformer(Transformer):
+    def handle(self, event) -> Event:
+        # Process your data
+        processed_data = ...
+        return Event(payload=TransformerPayload(train_data=processed_data))
+```
+### Tuner
+Performs hyperparameter optimization using various strategies.
+```python
+class CustomTuner(Tuner):
+    def handle(self, event) -> Event:
+        # Optimize hyperparameters
+        best_params = ...
+        return Event(payload=TunerPayload(hyperparameters=best_params))
+```
+### Trainer
+Trains machine learning models with automatic experiment tracking.
+```python
+class CustomTrainer(Trainer):
+    def handle(self, event) -> Event:
+        # Train your model
+        model = ...
+        return Event(payload=TrainerPayload(model=model))
+```
+### Evaluator
+Evaluates model performance and decides on deployment.
+```python
+class CustomEvaluator(Evaluator):
+    def handle(self, event) -> Event:
+        # Evaluate model performance
+        metrics = ...
+        is_better: bool = ...
+        return Event(payload=EvaluatorPayload(
+            metrics=metrics,
+            is_better_than_production=is_better
+        ))
+```
+### Pusher
+Handles model deployment and registration.
+```python
+class CustomPusher(Pusher):
+    def handle(self, event) -> Event:
+        # Deploy model to production
+        model_uri = ...
+        return Event(payload=PusherPayload(model_uri=model_uri))
+```
+## Configuration
+### MLflow Setup
+Start MLflow tracking server:
+```bash
+mlflow server \
+    --backend-store-uri sqlite:///mlflow.db \
+    --default-artifact-root ./mlruns \
+    --host 0.0.0.0 \
+    --port 5000
+```
+## Supported Frameworks
+Collie currently supports the following ML frameworks through its model flavor system:
+-  **PyTorch**
+-  **scikit-learn**
+-  **XGBoost**
+-  **LightGBM**
+-  **Transformers**
+## Documentation
+See the [Getting Started guide](https://collie-mlops.readthedocs.io/en/latest/getting_started.html) for the full documentation.
+## Roadmap
+- [ ] TensorFlow/Keras support
+- [ ] Model monitoring and drift detection
+- [ ] Integrate an LLM training/fine-tuning framework
+## License
+This project is licensed under the MIT License - see the [LICENSE](LICENSE) file for details.
+## Citation
+If you use Collie in your research, please cite:
+```bibtex
+@software{collie2025,
+  author = {ChingHuanChiu},
+  title = {Collie: A Lightweight MLOps Framework},
+  year = {2025},
+  url = {https://github.com/ChingHuanChiu/collie}
+}
+```
+---

collie_mlops-0.1.1b0.dist-info/RECORD ADDED Viewed

@@ -0,0 +1,45 @@
+collie/__init__.py,sha256=2WdIuiEzRvQWcfVcwu0jEk-72R-T2oQVlNnRQePeL1g,1834
+collie/_common/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
+collie/_common/decorator.py,sha256=9Kj6bSM6q38h7-Z32VYsHDeUAtHqWKmtLE7oLrkWGqg,1636
+collie/_common/exceptions.py,sha256=cjctM4jEcD5lRxm4gtKiSJ3c8r8tIcyOL_raVJMxQAY,3836
+collie/_common/utils.py,sha256=9vBstA9cUyhKQkxaggrNg-nYrdub-aVYYIsSVhssKWk,339
+collie/_common/mlflow_model_io/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
+collie/_common/mlflow_model_io/base_flavor_handler.py,sha256=sSYfigwwwy8fSo8G_0laW91tftVhPDWPUiUyGBYw6mE,535
+collie/_common/mlflow_model_io/flavor_registry.py,sha256=Cw_Og7Ewl2coCaf-Phw1LF5Zp_LxAG6OAyrm7MT8iZ8,2607
+collie/_common/mlflow_model_io/model_flavors.py,sha256=LCW53SAvB_bcR62XnPak_M97SWCf-QgwBJDzmzlrva0,9171
+collie/_common/mlflow_model_io/model_io.py,sha256=y5NcOEItkH0pC3bpqWmc_js9GvfAcqNnIv4oN7LN4pg,1879
+collie/contracts/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
+collie/contracts/event.py,sha256=vQWZbT5V_3qsU78TCwkrq2gYiq8isxbL8dOEXSKUgic,2207
+collie/contracts/mlflow.py,sha256=dhCTDvKMo3bxW9AjEBp50G_s13uc0RjhieHHs9stTBM,14496
+collie/contracts/orchestrator.py,sha256=eXFQHmzPJ1By3rrQ0_FA-khD0oDyzLqSVaoqlNbZM_w,2136
+collie/core/__init__.py,sha256=RugxaCy6wiyHp4lYQxP9_RGypXQKGOqjbE9ut9HgIC4,956
+collie/core/models.py,sha256=4FhAzXJjQs4712SppniRgydaig4XeA7K5WQWXRpUFzM,3258
+collie/core/enums/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
+collie/core/enums/components.py,sha256=6ENOAugVAuUzU_jBT-eopeVlkHoSjbjnlT4smhPMJBE,545
+collie/core/enums/ml_models.py,sha256=xoD7aO038wWpryNw35qkMLfkO6dRyKcD_aTlYCIpmwM,386
+collie/core/evaluator/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
+collie/core/evaluator/evaluator.py,sha256=K5n2Wma0BMVN6EqMK7ObRCxRWgJn7wTXP8W_u735Hjg,4559
+collie/core/orchestrator/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
+collie/core/orchestrator/orchestrator.py,sha256=9CTuTsysbohKN0cGWyVWxwJdFVT1OpkhDROOiWjko5c,1538
+collie/core/pusher/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
+collie/core/pusher/pusher.py,sha256=57nINSau_2xHKCa0P9DzdoEFmueY7-gX44JY7chu5Ss,4008
+collie/core/trainer/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
+collie/core/trainer/trainer.py,sha256=De0t3UHU2205sO9vLhvL1mJISr2HPfO9TbzTj-C1HeM,2421
+collie/core/transform/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
+collie/core/transform/transform.py,sha256=Xso4DZRVDE6P8YtCYrOKkI_GuMD_ygUDc5OOn-B7I-A,2858
+collie/core/tuner/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
+collie/core/tuner/tuner.py,sha256=knB7pkB_D-dhM6qKvSwoHTPKnLdP_47sZAMj5GvarHg,2560
+collie/helper/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
+collie/helper/pytorch/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
+collie/helper/pytorch/trainer.py,sha256=TJb-ISRh3PMCeqY_rEbtqRGlSGGY0VuRZmayj4OFOhE,10921
+collie/helper/pytorch/callback/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
+collie/helper/pytorch/callback/callback.py,sha256=NHfhUBen8odZp9XJKkRU-NbLeKjEZbKtrimejpWiGf4,3539
+collie/helper/pytorch/callback/earlystop.py,sha256=8smHSn23Dl_jo2omJJiB9rCO-SgOYY2AvcEwh6Fgr1I,1498
+collie/helper/pytorch/callback/model_checkpoint.py,sha256=ZYQ0EjG1p-A9s8igr9ck0FA-AF-9ISz8QbpwPkTz_uc,3680
+collie/helper/pytorch/model/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
+collie/helper/pytorch/model/loader.py,sha256=ocGXKelpjSXDfG_ZHKl1-1xi7NyoF6BPoVs3TCqJs9k,2239
+collie_mlops-0.1.1b0.dist-info/LICENSE,sha256=10_zh6gMsjITzBc30M8T7A2Kv5xPNJ5x4Y0gYmk-Zvs,1070
+collie_mlops-0.1.1b0.dist-info/METADATA,sha256=mFHHGUbz2A1S5NkordLv1MMla4i-WQorHHf3xMWlIe8,8763
+collie_mlops-0.1.1b0.dist-info/WHEEL,sha256=oiQVh_5PnQM0E3gPdiz09WCNmwiHDMaGer_elqB3coM,92
+collie_mlops-0.1.1b0.dist-info/top_level.txt,sha256=7Br75OZSTintD5Mvq6h42yDMf0oR_5n1Ec2u6FuTxAY,7
+collie_mlops-0.1.1b0.dist-info/RECORD,,

collie_mlops-0.1.1b0.dist-info/WHEEL ADDED Viewed

@@ -0,0 +1,5 @@
+Wheel-Version: 1.0
+Generator: bdist_wheel (0.42.0)
+Root-Is-Purelib: true
+Tag: py3-none-any

collie_mlops-0.1.1b0.dist-info/top_level.txt ADDED Viewed

@@ -0,0 +1 @@
+collie