lasagnastack 0.1.0__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- lasagnastack-0.1.0/PKG-INFO +205 -0
- lasagnastack-0.1.0/README.md +184 -0
- lasagnastack-0.1.0/pyproject.toml +106 -0
- lasagnastack-0.1.0/setup.cfg +4 -0
- lasagnastack-0.1.0/src/lasagnastack/__init__.py +0 -0
- lasagnastack-0.1.0/src/lasagnastack/__main__.py +3 -0
- lasagnastack-0.1.0/src/lasagnastack/base.py +205 -0
- lasagnastack-0.1.0/src/lasagnastack/cache.py +30 -0
- lasagnastack-0.1.0/src/lasagnastack/cli.py +73 -0
- lasagnastack-0.1.0/src/lasagnastack/io.py +85 -0
- lasagnastack-0.1.0/src/lasagnastack/llm/__init__.py +0 -0
- lasagnastack-0.1.0/src/lasagnastack/llm/base.py +29 -0
- lasagnastack-0.1.0/src/lasagnastack/llm/gemini.py +394 -0
- lasagnastack-0.1.0/src/lasagnastack/logging_config.py +20 -0
- lasagnastack-0.1.0/src/lasagnastack/models/__init__.py +0 -0
- lasagnastack-0.1.0/src/lasagnastack/models/critique.py +14 -0
- lasagnastack-0.1.0/src/lasagnastack/models/cut_list.py +123 -0
- lasagnastack-0.1.0/src/lasagnastack/models/enhance.py +62 -0
- lasagnastack-0.1.0/src/lasagnastack/models/inventory.py +85 -0
- lasagnastack-0.1.0/src/lasagnastack/models/post_caption.py +8 -0
- lasagnastack-0.1.0/src/lasagnastack/pipeline.py +172 -0
- lasagnastack-0.1.0/src/lasagnastack/stages/__init__.py +0 -0
- lasagnastack-0.1.0/src/lasagnastack/stages/analyse.py +144 -0
- lasagnastack-0.1.0/src/lasagnastack/stages/critique.py +149 -0
- lasagnastack-0.1.0/src/lasagnastack/stages/direct.py +94 -0
- lasagnastack-0.1.0/src/lasagnastack/stages/enhance.py +120 -0
- lasagnastack-0.1.0/src/lasagnastack/stages/ingest.py +183 -0
- lasagnastack-0.1.0/src/lasagnastack/stages/post_caption.py +136 -0
- lasagnastack-0.1.0/src/lasagnastack/stages/render.py +172 -0
- lasagnastack-0.1.0/src/lasagnastack/video_editors/__init__.py +3 -0
- lasagnastack-0.1.0/src/lasagnastack/video_editors/base.py +53 -0
- lasagnastack-0.1.0/src/lasagnastack/video_editors/pycapcut.py +579 -0
- lasagnastack-0.1.0/src/lasagnastack.egg-info/PKG-INFO +205 -0
- lasagnastack-0.1.0/src/lasagnastack.egg-info/SOURCES.txt +40 -0
- lasagnastack-0.1.0/src/lasagnastack.egg-info/dependency_links.txt +1 -0
- lasagnastack-0.1.0/src/lasagnastack.egg-info/requires.txt +13 -0
- lasagnastack-0.1.0/src/lasagnastack.egg-info/top_level.txt +1 -0
- lasagnastack-0.1.0/tests/test_analyse.py +109 -0
- lasagnastack-0.1.0/tests/test_critique.py +278 -0
- lasagnastack-0.1.0/tests/test_direct.py +55 -0
- lasagnastack-0.1.0/tests/test_ingest.py +233 -0
- lasagnastack-0.1.0/tests/test_render.py +320 -0
|
@@ -0,0 +1,205 @@
|
|
|
1
|
+
Metadata-Version: 2.4
|
|
2
|
+
Name: lasagnastack
|
|
3
|
+
Version: 0.1.0
|
|
4
|
+
Summary: An AI pipeline that turns raw video clips into an editable CapCut project for short-form reel editing.
|
|
5
|
+
Author-email: Julian Wong <julianwong2000@gmail.com>
|
|
6
|
+
Requires-Python: <3.13,>=3.12
|
|
7
|
+
Description-Content-Type: text/markdown
|
|
8
|
+
Requires-Dist: av>=14.0.0
|
|
9
|
+
Requires-Dist: ffmpeg-python>=0.2.0
|
|
10
|
+
Requires-Dist: google-genai>=1.0.0
|
|
11
|
+
Requires-Dist: mlflow>=2.19.0
|
|
12
|
+
Requires-Dist: opencv-python-headless>=4.0.0
|
|
13
|
+
Requires-Dist: pycapcut>=0.0.3
|
|
14
|
+
Requires-Dist: pydantic>=2.0.0
|
|
15
|
+
Requires-Dist: python-dotenv>=1.0.0
|
|
16
|
+
Requires-Dist: python-semantic-release>=10.5.3
|
|
17
|
+
Requires-Dist: scenedetect>=0.6.4
|
|
18
|
+
Requires-Dist: setuptools>=80.9.0
|
|
19
|
+
Requires-Dist: structlog>=25.0.0
|
|
20
|
+
Requires-Dist: tenacity>=9.0.0
|
|
21
|
+
|
|
22
|
+
# LasagnaStack
|
|
23
|
+
|
|
24
|
+
<img src="docs/lasagna.png" alt="LasagnaStack" width="180" />
|
|
25
|
+
|
|
26
|
+
An AI pipeline that turns raw video clips into an editable CapCut project for short-form reel editing.
|
|
27
|
+
|
|
28
|
+
It is as simple as:
|
|
29
|
+
|
|
30
|
+
```bash
|
|
31
|
+
python -m lasagnastack make ./my_clips/ --out ./my_capcut_draft/
|
|
32
|
+
```
|
|
33
|
+
|
|
34
|
+
where...
|
|
35
|
+
|
|
36
|
+
`./my_clips/`: a folder of raw video clips in MP4/MOV format + one `.txt` creator brief.
|
|
37
|
+
`./my_capcut_draft/`: a CapCut draft folder, ready to open in CapCut Desktop.
|
|
38
|
+
|
|
39
|
+
The pipeline runs in six sequential stages: **ingest** (uses ffmpeg) → **analyse** (uses LLM) → **direct** (uses LLM) → **critique loop** (uses LLM) → **enhance** (uses LLM) → **render** (uses pyCapCut).
|
|
40
|
+
|
|
41
|
+
Each stage is a subclass of the `Stage` abstract base class (`base.py`). Adding, removing, or reordering stages requires only editing the `stages` list in `ReelPipeline`. See [`ARCHITECTURE.md`](ARCHITECTURE.md) for the full architecture guide.
|
|
42
|
+
|
|
43
|
+
## Get started with development
|
|
44
|
+
|
|
45
|
+
1. Clone the repository.
|
|
46
|
+
|
|
47
|
+
```bash
|
|
48
|
+
git clone https://github.com/jyjulianwong/LasagnaStack.git
|
|
49
|
+
```
|
|
50
|
+
|
|
51
|
+
2. Verify that you have a compatible Python version installed on your machine.
|
|
52
|
+
|
|
53
|
+
```bash
|
|
54
|
+
python --version
|
|
55
|
+
```
|
|
56
|
+
|
|
57
|
+
3. Install [uv](https://github.com/astral-sh/uv) (used as the package manager for this project).
|
|
58
|
+
|
|
59
|
+
4. Install the development dependencies.
|
|
60
|
+
|
|
61
|
+
```bash
|
|
62
|
+
cd LasagnaStack/
|
|
63
|
+
uv sync --all-groups
|
|
64
|
+
uv run pre-commit install
|
|
65
|
+
```
|
|
66
|
+
|
|
67
|
+
## Set up environment
|
|
68
|
+
|
|
69
|
+
Copy `.env.sample` to `.env` and fill in your values:
|
|
70
|
+
|
|
71
|
+
```bash
|
|
72
|
+
cp .env.sample .env
|
|
73
|
+
```
|
|
74
|
+
|
|
75
|
+
`.env` is gitignored. Values set in the shell environment take precedence over `.env`.
|
|
76
|
+
|
|
77
|
+
## Authentication
|
|
78
|
+
|
|
79
|
+
Get a Gemini API key at [aistudio.google.com/apikey](https://aistudio.google.com/apikey) and add it to your `.env`:
|
|
80
|
+
|
|
81
|
+
```
|
|
82
|
+
LSNSTK_LLM_GEMINI_API_KEY=your-key-here
|
|
83
|
+
```
|
|
84
|
+
|
|
85
|
+
## Run the pipeline
|
|
86
|
+
|
|
87
|
+
Prepare an input folder containing your MP4/MOV clips and exactly one `.txt` brief file, then run:
|
|
88
|
+
|
|
89
|
+
```bash
|
|
90
|
+
uv run python -m lasagnastack make ./my_clips/ --out ./drafts/reel_2025_05_05
|
|
91
|
+
```
|
|
92
|
+
|
|
93
|
+
The pipeline pauses for confirmation between each stage. To skip all prompts:
|
|
94
|
+
|
|
95
|
+
```bash
|
|
96
|
+
uv run python -m lasagnastack make ./my_clips/ --out ./drafts/reel_2025_05_05 --yes
|
|
97
|
+
```
|
|
98
|
+
|
|
99
|
+
Full CLI reference:
|
|
100
|
+
|
|
101
|
+
```
|
|
102
|
+
usage: lasagnastack make [-h] --out OUTPUT_DIR [--skill SKILL_FILE] [--yes]
|
|
103
|
+
[--critique-max-retries N] [--ingest-max-workers N]
|
|
104
|
+
[--analyse-max-workers N] INPUT_DIR
|
|
105
|
+
|
|
106
|
+
positional arguments:
|
|
107
|
+
INPUT_DIR Folder containing clips and brief .txt
|
|
108
|
+
|
|
109
|
+
options:
|
|
110
|
+
--out OUTPUT_DIR Destination for the CapCut draft and working files
|
|
111
|
+
--skill SKILL_FILE Path to Markdown skill file injected into the direct,
|
|
112
|
+
critique, and enhance prompt templates (optional)
|
|
113
|
+
--yes, -y Auto-confirm all stage prompts
|
|
114
|
+
--critique-max-retries N Maximum # of critique loop retries (default: 2)
|
|
115
|
+
--ingest-max-workers N Maximum # of parallel worker processes for `ingest` stage (default: 2)
|
|
116
|
+
--analyse-max-workers N Maximum # of concurrent LLM calls for `analyse` stage (default: 4)
|
|
117
|
+
```
|
|
118
|
+
|
|
119
|
+
## Open the draft in CapCut Desktop (macOS)
|
|
120
|
+
|
|
121
|
+
If CapCut Desktop is installed, the pipeline automatically:
|
|
122
|
+
|
|
123
|
+
1. Detects `~/Movies/CapCut/User Data/`
|
|
124
|
+
2. Copies **all** `.mp4`/`.mov` files from your input folder into the CapCut draft folder — including clips not used on the timeline — so they are immediately available in CapCut's import panel
|
|
125
|
+
3. Rewrites the timeline clip paths in `draft_info.json` to point to the copied files
|
|
126
|
+
4. Registers the draft in `root_meta_info.json` so it appears on the CapCut home screen straight away
|
|
127
|
+
|
|
128
|
+
Open CapCut Desktop after the pipeline finishes — the draft will appear on the home screen under your local projects with all media already linked. Drafts are named **LasagnaStack - Reel Name** and use that same string as the folder name so they are easy to identify among existing projects.
|
|
129
|
+
|
|
130
|
+
If CapCut is not installed, the draft is written to `<output_dir>/draft/LasagnaStack - {reel_name}/` and you can copy it manually.
|
|
131
|
+
|
|
132
|
+
> This has been tested with CapCut Desktop 8.5.0 on macOS Sequoia 15.6.1. There may be issues with older versions or other operating systems.
|
|
133
|
+
|
|
134
|
+
## Track LLM costs with MLflow
|
|
135
|
+
|
|
136
|
+
Every pipeline run is automatically traced with [MLflow](https://mlflow.org). Each Gemini API call is recorded as a span (prompt, response, token counts, latency, and estimated USD cost). Session-level totals are written to the run when the pipeline finishes.
|
|
137
|
+
|
|
138
|
+
**1. Start the MLflow server** (in a separate terminal, before running the pipeline):
|
|
139
|
+
|
|
140
|
+
```bash
|
|
141
|
+
mlflow server --host 127.0.0.1 --port 5001
|
|
142
|
+
```
|
|
143
|
+
|
|
144
|
+
> **macOS note:** port 5000 is reserved by AirPlay Receiver. Use 5001 or higher.
|
|
145
|
+
|
|
146
|
+
**2. Add the tracking variables to `.env`:**
|
|
147
|
+
|
|
148
|
+
```
|
|
149
|
+
MLFLOW_TRACKING_URI=http://localhost:5001
|
|
150
|
+
MLFLOW_EXPERIMENT_NAME=lasagnastack
|
|
151
|
+
```
|
|
152
|
+
|
|
153
|
+
**3. Run the pipeline as normal.** Open `http://localhost:5001` in your browser to watch live.
|
|
154
|
+
|
|
155
|
+
In **Experiments -> lasagnastack -> Traces**, spans appear in real time as stages progress. Each trace has three levels: the top-level pipeline span (`ReelPipeline.run`), a per-stage span (e.g. `AnalyseStage.run`), and individual LLM call spans (`GeminiClient._call_api`) nested inside.
|
|
156
|
+
|
|
157
|
+
Runs are named `lasagnastack-{brief_stem}-{4-char-id}` and tagged with the model, reel name, and `critique_max_retries`.
|
|
158
|
+
|
|
159
|
+
> **No server?** Set `MLFLOW_TRACKING_URI=mlruns` to write results to a local folder instead, then view them with `mlflow ui`.
|
|
160
|
+
|
|
161
|
+
## Configuration
|
|
162
|
+
|
|
163
|
+
| Parameter | How to set | Default |
|
|
164
|
+
|---|---|---|
|
|
165
|
+
| LLM model | `LSNSTK_LLM_MODEL` env. var. | `gemini/gemini-2.5-flash` |
|
|
166
|
+
| Gemini API key | `LSNSTK_LLM_GEMINI_API_KEY` env. var. (required) | — |
|
|
167
|
+
| Path to skill file | `--skill` CLI flag | — |
|
|
168
|
+
| `critique` stage maximum # of retries | `--critique-max-retries` CLI flag | `2` |
|
|
169
|
+
| `ingest` stage maximum # of worker processes | `--ingest-max-workers` CLI flag | `2` |
|
|
170
|
+
| `analyse` stage maximum # of concurrent LLM calls | `--analyse-max-workers` CLI flag | `4` |
|
|
171
|
+
|
|
172
|
+
## Architecture
|
|
173
|
+
|
|
174
|
+
See [`ARCHITECTURE.md`](ARCHITECTURE.md) for four annotated diagrams covering the pipeline data flow, the Stage 4 critique loop, the Stage 6 render + CapCut export, and the extensibility model.
|
|
175
|
+
|
|
176
|
+
## Get started with Jupyter notebooks
|
|
177
|
+
|
|
178
|
+
1. Once the above setup is complete, set up a Python kernel.
|
|
179
|
+
|
|
180
|
+
```bash
|
|
181
|
+
source .venv/bin/activate
|
|
182
|
+
python -m ipykernel install --user --name=lasagnastack
|
|
183
|
+
```
|
|
184
|
+
|
|
185
|
+
2. Refer to the following common commands.
|
|
186
|
+
|
|
187
|
+
```bash
|
|
188
|
+
jupyter kernelspec list
|
|
189
|
+
jupyter kernelspec uninstall lasagnastack
|
|
190
|
+
```
|
|
191
|
+
|
|
192
|
+
3. Start the Jupyter server.
|
|
193
|
+
|
|
194
|
+
```bash
|
|
195
|
+
jupyter lab
|
|
196
|
+
```
|
|
197
|
+
|
|
198
|
+
## This repo is cool because...
|
|
199
|
+
|
|
200
|
+
- The pipeline is modularised into stages, with each stage being responsible for transforming the global state of the pipeline run (similar to LangGraph). It is easy to add, remove, or reorder stages.
|
|
201
|
+
- The pipeline supports "skills" -- each user can write their own skill `.md` file to customise the pipeline to their own accounts' styles and branding, or use pre-written skills from marketplaces to cater for different types of reel content.
|
|
202
|
+
- Chain-of-thought reasoning is enabled via Gemini.
|
|
203
|
+
- Human-in-the-loop is deeply integrated in the design, with each stage prompting the user for confirmation before proceeding to the next stage.
|
|
204
|
+
- Prompt caching is enabled to avoid unnecessary LLM calls to reduce latency and cost.
|
|
205
|
+
- The tool is deeply integrated with its host machine. It auto-detects CapCut Desktop, copies all source media (timeline clips and unused footage) so the project opens in CapCut with no missing-media errors, no manual steps, all your raw clips already in the import panel, and the timeline editor populated and ready to go.
|
|
@@ -0,0 +1,184 @@
|
|
|
1
|
+
# LasagnaStack
|
|
2
|
+
|
|
3
|
+
<img src="docs/lasagna.png" alt="LasagnaStack" width="180" />
|
|
4
|
+
|
|
5
|
+
An AI pipeline that turns raw video clips into an editable CapCut project for short-form reel editing.
|
|
6
|
+
|
|
7
|
+
It is as simple as:
|
|
8
|
+
|
|
9
|
+
```bash
|
|
10
|
+
python -m lasagnastack make ./my_clips/ --out ./my_capcut_draft/
|
|
11
|
+
```
|
|
12
|
+
|
|
13
|
+
where...
|
|
14
|
+
|
|
15
|
+
`./my_clips/`: a folder of raw video clips in MP4/MOV format + one `.txt` creator brief.
|
|
16
|
+
`./my_capcut_draft/`: a CapCut draft folder, ready to open in CapCut Desktop.
|
|
17
|
+
|
|
18
|
+
The pipeline runs in six sequential stages: **ingest** (uses ffmpeg) → **analyse** (uses LLM) → **direct** (uses LLM) → **critique loop** (uses LLM) → **enhance** (uses LLM) → **render** (uses pyCapCut).
|
|
19
|
+
|
|
20
|
+
Each stage is a subclass of the `Stage` abstract base class (`base.py`). Adding, removing, or reordering stages requires only editing the `stages` list in `ReelPipeline`. See [`ARCHITECTURE.md`](ARCHITECTURE.md) for the full architecture guide.
|
|
21
|
+
|
|
22
|
+
## Get started with development
|
|
23
|
+
|
|
24
|
+
1. Clone the repository.
|
|
25
|
+
|
|
26
|
+
```bash
|
|
27
|
+
git clone https://github.com/jyjulianwong/LasagnaStack.git
|
|
28
|
+
```
|
|
29
|
+
|
|
30
|
+
2. Verify that you have a compatible Python version installed on your machine.
|
|
31
|
+
|
|
32
|
+
```bash
|
|
33
|
+
python --version
|
|
34
|
+
```
|
|
35
|
+
|
|
36
|
+
3. Install [uv](https://github.com/astral-sh/uv) (used as the package manager for this project).
|
|
37
|
+
|
|
38
|
+
4. Install the development dependencies.
|
|
39
|
+
|
|
40
|
+
```bash
|
|
41
|
+
cd LasagnaStack/
|
|
42
|
+
uv sync --all-groups
|
|
43
|
+
uv run pre-commit install
|
|
44
|
+
```
|
|
45
|
+
|
|
46
|
+
## Set up environment
|
|
47
|
+
|
|
48
|
+
Copy `.env.sample` to `.env` and fill in your values:
|
|
49
|
+
|
|
50
|
+
```bash
|
|
51
|
+
cp .env.sample .env
|
|
52
|
+
```
|
|
53
|
+
|
|
54
|
+
`.env` is gitignored. Values set in the shell environment take precedence over `.env`.
|
|
55
|
+
|
|
56
|
+
## Authentication
|
|
57
|
+
|
|
58
|
+
Get a Gemini API key at [aistudio.google.com/apikey](https://aistudio.google.com/apikey) and add it to your `.env`:
|
|
59
|
+
|
|
60
|
+
```
|
|
61
|
+
LSNSTK_LLM_GEMINI_API_KEY=your-key-here
|
|
62
|
+
```
|
|
63
|
+
|
|
64
|
+
## Run the pipeline
|
|
65
|
+
|
|
66
|
+
Prepare an input folder containing your MP4/MOV clips and exactly one `.txt` brief file, then run:
|
|
67
|
+
|
|
68
|
+
```bash
|
|
69
|
+
uv run python -m lasagnastack make ./my_clips/ --out ./drafts/reel_2025_05_05
|
|
70
|
+
```
|
|
71
|
+
|
|
72
|
+
The pipeline pauses for confirmation between each stage. To skip all prompts:
|
|
73
|
+
|
|
74
|
+
```bash
|
|
75
|
+
uv run python -m lasagnastack make ./my_clips/ --out ./drafts/reel_2025_05_05 --yes
|
|
76
|
+
```
|
|
77
|
+
|
|
78
|
+
Full CLI reference:
|
|
79
|
+
|
|
80
|
+
```
|
|
81
|
+
usage: lasagnastack make [-h] --out OUTPUT_DIR [--skill SKILL_FILE] [--yes]
|
|
82
|
+
[--critique-max-retries N] [--ingest-max-workers N]
|
|
83
|
+
[--analyse-max-workers N] INPUT_DIR
|
|
84
|
+
|
|
85
|
+
positional arguments:
|
|
86
|
+
INPUT_DIR Folder containing clips and brief .txt
|
|
87
|
+
|
|
88
|
+
options:
|
|
89
|
+
--out OUTPUT_DIR Destination for the CapCut draft and working files
|
|
90
|
+
--skill SKILL_FILE Path to Markdown skill file injected into the direct,
|
|
91
|
+
critique, and enhance prompt templates (optional)
|
|
92
|
+
--yes, -y Auto-confirm all stage prompts
|
|
93
|
+
--critique-max-retries N Maximum # of critique loop retries (default: 2)
|
|
94
|
+
--ingest-max-workers N Maximum # of parallel worker processes for `ingest` stage (default: 2)
|
|
95
|
+
--analyse-max-workers N Maximum # of concurrent LLM calls for `analyse` stage (default: 4)
|
|
96
|
+
```
|
|
97
|
+
|
|
98
|
+
## Open the draft in CapCut Desktop (macOS)
|
|
99
|
+
|
|
100
|
+
If CapCut Desktop is installed, the pipeline automatically:
|
|
101
|
+
|
|
102
|
+
1. Detects `~/Movies/CapCut/User Data/`
|
|
103
|
+
2. Copies **all** `.mp4`/`.mov` files from your input folder into the CapCut draft folder — including clips not used on the timeline — so they are immediately available in CapCut's import panel
|
|
104
|
+
3. Rewrites the timeline clip paths in `draft_info.json` to point to the copied files
|
|
105
|
+
4. Registers the draft in `root_meta_info.json` so it appears on the CapCut home screen straight away
|
|
106
|
+
|
|
107
|
+
Open CapCut Desktop after the pipeline finishes — the draft will appear on the home screen under your local projects with all media already linked. Drafts are named **LasagnaStack - Reel Name** and use that same string as the folder name so they are easy to identify among existing projects.
|
|
108
|
+
|
|
109
|
+
If CapCut is not installed, the draft is written to `<output_dir>/draft/LasagnaStack - {reel_name}/` and you can copy it manually.
|
|
110
|
+
|
|
111
|
+
> This has been tested with CapCut Desktop 8.5.0 on macOS Sequoia 15.6.1. There may be issues with older versions or other operating systems.
|
|
112
|
+
|
|
113
|
+
## Track LLM costs with MLflow
|
|
114
|
+
|
|
115
|
+
Every pipeline run is automatically traced with [MLflow](https://mlflow.org). Each Gemini API call is recorded as a span (prompt, response, token counts, latency, and estimated USD cost). Session-level totals are written to the run when the pipeline finishes.
|
|
116
|
+
|
|
117
|
+
**1. Start the MLflow server** (in a separate terminal, before running the pipeline):
|
|
118
|
+
|
|
119
|
+
```bash
|
|
120
|
+
mlflow server --host 127.0.0.1 --port 5001
|
|
121
|
+
```
|
|
122
|
+
|
|
123
|
+
> **macOS note:** port 5000 is reserved by AirPlay Receiver. Use 5001 or higher.
|
|
124
|
+
|
|
125
|
+
**2. Add the tracking variables to `.env`:**
|
|
126
|
+
|
|
127
|
+
```
|
|
128
|
+
MLFLOW_TRACKING_URI=http://localhost:5001
|
|
129
|
+
MLFLOW_EXPERIMENT_NAME=lasagnastack
|
|
130
|
+
```
|
|
131
|
+
|
|
132
|
+
**3. Run the pipeline as normal.** Open `http://localhost:5001` in your browser to watch live.
|
|
133
|
+
|
|
134
|
+
In **Experiments -> lasagnastack -> Traces**, spans appear in real time as stages progress. Each trace has three levels: the top-level pipeline span (`ReelPipeline.run`), a per-stage span (e.g. `AnalyseStage.run`), and individual LLM call spans (`GeminiClient._call_api`) nested inside.
|
|
135
|
+
|
|
136
|
+
Runs are named `lasagnastack-{brief_stem}-{4-char-id}` and tagged with the model, reel name, and `critique_max_retries`.
|
|
137
|
+
|
|
138
|
+
> **No server?** Set `MLFLOW_TRACKING_URI=mlruns` to write results to a local folder instead, then view them with `mlflow ui`.
|
|
139
|
+
|
|
140
|
+
## Configuration
|
|
141
|
+
|
|
142
|
+
| Parameter | How to set | Default |
|
|
143
|
+
|---|---|---|
|
|
144
|
+
| LLM model | `LSNSTK_LLM_MODEL` env. var. | `gemini/gemini-2.5-flash` |
|
|
145
|
+
| Gemini API key | `LSNSTK_LLM_GEMINI_API_KEY` env. var. (required) | — |
|
|
146
|
+
| Path to skill file | `--skill` CLI flag | — |
|
|
147
|
+
| `critique` stage maximum # of retries | `--critique-max-retries` CLI flag | `2` |
|
|
148
|
+
| `ingest` stage maximum # of worker processes | `--ingest-max-workers` CLI flag | `2` |
|
|
149
|
+
| `analyse` stage maximum # of concurrent LLM calls | `--analyse-max-workers` CLI flag | `4` |
|
|
150
|
+
|
|
151
|
+
## Architecture
|
|
152
|
+
|
|
153
|
+
See [`ARCHITECTURE.md`](ARCHITECTURE.md) for four annotated diagrams covering the pipeline data flow, the Stage 4 critique loop, the Stage 6 render + CapCut export, and the extensibility model.
|
|
154
|
+
|
|
155
|
+
## Get started with Jupyter notebooks
|
|
156
|
+
|
|
157
|
+
1. Once the above setup is complete, set up a Python kernel.
|
|
158
|
+
|
|
159
|
+
```bash
|
|
160
|
+
source .venv/bin/activate
|
|
161
|
+
python -m ipykernel install --user --name=lasagnastack
|
|
162
|
+
```
|
|
163
|
+
|
|
164
|
+
2. Refer to the following common commands.
|
|
165
|
+
|
|
166
|
+
```bash
|
|
167
|
+
jupyter kernelspec list
|
|
168
|
+
jupyter kernelspec uninstall lasagnastack
|
|
169
|
+
```
|
|
170
|
+
|
|
171
|
+
3. Start the Jupyter server.
|
|
172
|
+
|
|
173
|
+
```bash
|
|
174
|
+
jupyter lab
|
|
175
|
+
```
|
|
176
|
+
|
|
177
|
+
## This repo is cool because...
|
|
178
|
+
|
|
179
|
+
- The pipeline is modularised into stages, with each stage being responsible for transforming the global state of the pipeline run (similar to LangGraph). It is easy to add, remove, or reorder stages.
|
|
180
|
+
- The pipeline supports "skills" -- each user can write their own skill `.md` file to customise the pipeline to their own accounts' styles and branding, or use pre-written skills from marketplaces to cater for different types of reel content.
|
|
181
|
+
- Chain-of-thought reasoning is enabled via Gemini.
|
|
182
|
+
- Human-in-the-loop is deeply integrated in the design, with each stage prompting the user for confirmation before proceeding to the next stage.
|
|
183
|
+
- Prompt caching is enabled to avoid unnecessary LLM calls to reduce latency and cost.
|
|
184
|
+
- The tool is deeply integrated with its host machine. It auto-detects CapCut Desktop, copies all source media (timeline clips and unused footage) so the project opens in CapCut with no missing-media errors, no manual steps, all your raw clips already in the import panel, and the timeline editor populated and ready to go.
|
|
@@ -0,0 +1,106 @@
|
|
|
1
|
+
[build-system]
|
|
2
|
+
requires = ["setuptools", "wheel"]
|
|
3
|
+
build-backend = "setuptools.build_meta"
|
|
4
|
+
|
|
5
|
+
[project]
|
|
6
|
+
name = "lasagnastack"
|
|
7
|
+
version = "0.1.0"
|
|
8
|
+
description = "An AI pipeline that turns raw video clips into an editable CapCut project for short-form reel editing."
|
|
9
|
+
authors = [
|
|
10
|
+
{ name = "Julian Wong", email = "julianwong2000@gmail.com" }
|
|
11
|
+
]
|
|
12
|
+
readme = "README.md"
|
|
13
|
+
requires-python = ">=3.12,<3.13"
|
|
14
|
+
dependencies = [
|
|
15
|
+
"av>=14.0.0",
|
|
16
|
+
"ffmpeg-python>=0.2.0",
|
|
17
|
+
"google-genai>=1.0.0",
|
|
18
|
+
"mlflow>=2.19.0",
|
|
19
|
+
"opencv-python-headless>=4.0.0",
|
|
20
|
+
"pycapcut>=0.0.3",
|
|
21
|
+
"pydantic>=2.0.0",
|
|
22
|
+
"python-dotenv>=1.0.0",
|
|
23
|
+
"python-semantic-release>=10.5.3",
|
|
24
|
+
"scenedetect>=0.6.4",
|
|
25
|
+
"setuptools>=80.9.0",
|
|
26
|
+
"structlog>=25.0.0",
|
|
27
|
+
"tenacity>=9.0.0",
|
|
28
|
+
]
|
|
29
|
+
|
|
30
|
+
[dependency-groups]
|
|
31
|
+
dev = [
|
|
32
|
+
"pre-commit>=4.2.0",
|
|
33
|
+
"pyrefly>=0.26.0",
|
|
34
|
+
"pytest>=7.2.0",
|
|
35
|
+
"ruff>=0.11.1",
|
|
36
|
+
"uv-sort==0.6.0",
|
|
37
|
+
]
|
|
38
|
+
docs = [
|
|
39
|
+
"pdoc>=15.0.4",
|
|
40
|
+
]
|
|
41
|
+
notebook = [
|
|
42
|
+
"ipykernel>=6.30.0",
|
|
43
|
+
"ipython>=9.4.0",
|
|
44
|
+
"jupyterlab>=4.4.5",
|
|
45
|
+
"matplotlib>=3.10.3",
|
|
46
|
+
"nbconvert>=7.16.6",
|
|
47
|
+
"notebook>=7.4.4",
|
|
48
|
+
"plotly>=6.2.0",
|
|
49
|
+
"seaborn>=0.13.2",
|
|
50
|
+
"voila>=0.5.8",
|
|
51
|
+
]
|
|
52
|
+
|
|
53
|
+
[tool.setuptools.packages.find]
|
|
54
|
+
where = ["src"]
|
|
55
|
+
|
|
56
|
+
[tool.ruff]
|
|
57
|
+
line-length = 88
|
|
58
|
+
indent-width = 4
|
|
59
|
+
exclude = [
|
|
60
|
+
"build",
|
|
61
|
+
"dist",
|
|
62
|
+
"__pycache__",
|
|
63
|
+
"*.ipynb"
|
|
64
|
+
]
|
|
65
|
+
fix = true
|
|
66
|
+
|
|
67
|
+
[tool.ruff.lint.pycodestyle]
|
|
68
|
+
ignore-overlong-task-comments = true
|
|
69
|
+
|
|
70
|
+
[tool.ruff.lint]
|
|
71
|
+
# Enable Pyflakes (`F`) and a subset of the pycodestyle (`E`) codes by default.
|
|
72
|
+
# Unlike Flake8, Ruff doesn't enable pycodestyle warnings (`W`) or
|
|
73
|
+
# McCabe complexity (`C901`) by default.
|
|
74
|
+
select = ["E4", "E7", "E9", "F", "I"]
|
|
75
|
+
ignore = []
|
|
76
|
+
|
|
77
|
+
# Allow fix for all enabled rules (when `--fix`) is provided.
|
|
78
|
+
fixable = ["ALL"]
|
|
79
|
+
unfixable = []
|
|
80
|
+
|
|
81
|
+
task-tags = ["HACK", "TODO"]
|
|
82
|
+
|
|
83
|
+
[tool.pydocstyle]
|
|
84
|
+
convention = "google"
|
|
85
|
+
add-ignore = "D104,D418"
|
|
86
|
+
|
|
87
|
+
[tool.pyrefly]
|
|
88
|
+
# Set the directory Pyrefly will search for files to type check
|
|
89
|
+
project-includes = ["src/lasagnastack/*"]
|
|
90
|
+
project-excludes = ["**/*venv/**/*"]
|
|
91
|
+
|
|
92
|
+
# Manually set the `sys.platform` Pyrefly will assume when type checking
|
|
93
|
+
python-platform = "darwin"
|
|
94
|
+
|
|
95
|
+
# Return an import error when `<library>-stubs` can be imported, but no non-stubs version of that library can be found
|
|
96
|
+
ignore-missing-source = false
|
|
97
|
+
|
|
98
|
+
# A table mapping error codes to an `is-enabled` boolean
|
|
99
|
+
[tool.pyrefly.errors]
|
|
100
|
+
# Disable `bad-assignment` errors
|
|
101
|
+
bad-assignment = false
|
|
102
|
+
# Disable `bad-return` errors
|
|
103
|
+
bad-return = false
|
|
104
|
+
|
|
105
|
+
[tool.semantic_release]
|
|
106
|
+
version_toml = ["pyproject.toml:project.version"]
|
|
File without changes
|