PyPI - karaoke-gen - Versions diffs - 0.75.54__py3-none-any.whl - Mend

karaoke-gen 0.75.54__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of karaoke-gen might be problematic. Click here for more details.

Files changed (287) hide show

karaoke_gen/__init__.py +38 -0
karaoke_gen/audio_fetcher.py +1614 -0
karaoke_gen/audio_processor.py +790 -0
karaoke_gen/config.py +83 -0
karaoke_gen/file_handler.py +387 -0
karaoke_gen/instrumental_review/__init__.py +45 -0
karaoke_gen/instrumental_review/analyzer.py +408 -0
karaoke_gen/instrumental_review/editor.py +322 -0
karaoke_gen/instrumental_review/models.py +171 -0
karaoke_gen/instrumental_review/server.py +475 -0
karaoke_gen/instrumental_review/static/index.html +1529 -0
karaoke_gen/instrumental_review/waveform.py +409 -0
karaoke_gen/karaoke_finalise/__init__.py +1 -0
karaoke_gen/karaoke_finalise/karaoke_finalise.py +1833 -0
karaoke_gen/karaoke_gen.py +1026 -0
karaoke_gen/lyrics_processor.py +474 -0
karaoke_gen/metadata.py +160 -0
karaoke_gen/pipeline/__init__.py +87 -0
karaoke_gen/pipeline/base.py +215 -0
karaoke_gen/pipeline/context.py +230 -0
karaoke_gen/pipeline/executors/__init__.py +21 -0
karaoke_gen/pipeline/executors/local.py +159 -0
karaoke_gen/pipeline/executors/remote.py +257 -0
karaoke_gen/pipeline/stages/__init__.py +27 -0
karaoke_gen/pipeline/stages/finalize.py +202 -0
karaoke_gen/pipeline/stages/render.py +165 -0
karaoke_gen/pipeline/stages/screens.py +139 -0
karaoke_gen/pipeline/stages/separation.py +191 -0
karaoke_gen/pipeline/stages/transcription.py +191 -0
karaoke_gen/resources/AvenirNext-Bold.ttf +0 -0
karaoke_gen/resources/Montserrat-Bold.ttf +0 -0
karaoke_gen/resources/Oswald-Bold.ttf +0 -0
karaoke_gen/resources/Oswald-SemiBold.ttf +0 -0
karaoke_gen/resources/Zurich_Cn_BT_Bold.ttf +0 -0
karaoke_gen/style_loader.py +531 -0
karaoke_gen/utils/__init__.py +18 -0
karaoke_gen/utils/bulk_cli.py +492 -0
karaoke_gen/utils/cli_args.py +432 -0
karaoke_gen/utils/gen_cli.py +978 -0
karaoke_gen/utils/remote_cli.py +3268 -0
karaoke_gen/video_background_processor.py +351 -0
karaoke_gen/video_generator.py +424 -0
karaoke_gen-0.75.54.dist-info/METADATA +718 -0
karaoke_gen-0.75.54.dist-info/RECORD +287 -0
karaoke_gen-0.75.54.dist-info/WHEEL +4 -0
karaoke_gen-0.75.54.dist-info/entry_points.txt +5 -0
karaoke_gen-0.75.54.dist-info/licenses/LICENSE +21 -0
lyrics_transcriber/__init__.py +10 -0
lyrics_transcriber/cli/__init__.py +0 -0
lyrics_transcriber/cli/cli_main.py +285 -0
lyrics_transcriber/core/__init__.py +0 -0
lyrics_transcriber/core/config.py +50 -0
lyrics_transcriber/core/controller.py +594 -0
lyrics_transcriber/correction/__init__.py +0 -0
lyrics_transcriber/correction/agentic/__init__.py +9 -0
lyrics_transcriber/correction/agentic/adapter.py +71 -0
lyrics_transcriber/correction/agentic/agent.py +313 -0
lyrics_transcriber/correction/agentic/feedback/aggregator.py +12 -0
lyrics_transcriber/correction/agentic/feedback/collector.py +17 -0
lyrics_transcriber/correction/agentic/feedback/retention.py +24 -0
lyrics_transcriber/correction/agentic/feedback/store.py +76 -0
lyrics_transcriber/correction/agentic/handlers/__init__.py +24 -0
lyrics_transcriber/correction/agentic/handlers/ambiguous.py +44 -0
lyrics_transcriber/correction/agentic/handlers/background_vocals.py +68 -0
lyrics_transcriber/correction/agentic/handlers/base.py +51 -0
lyrics_transcriber/correction/agentic/handlers/complex_multi_error.py +46 -0
lyrics_transcriber/correction/agentic/handlers/extra_words.py +74 -0
lyrics_transcriber/correction/agentic/handlers/no_error.py +42 -0
lyrics_transcriber/correction/agentic/handlers/punctuation.py +44 -0
lyrics_transcriber/correction/agentic/handlers/registry.py +60 -0
lyrics_transcriber/correction/agentic/handlers/repeated_section.py +44 -0
lyrics_transcriber/correction/agentic/handlers/sound_alike.py +126 -0
lyrics_transcriber/correction/agentic/models/__init__.py +5 -0
lyrics_transcriber/correction/agentic/models/ai_correction.py +31 -0
lyrics_transcriber/correction/agentic/models/correction_session.py +30 -0
lyrics_transcriber/correction/agentic/models/enums.py +38 -0
lyrics_transcriber/correction/agentic/models/human_feedback.py +30 -0
lyrics_transcriber/correction/agentic/models/learning_data.py +26 -0
lyrics_transcriber/correction/agentic/models/observability_metrics.py +28 -0
lyrics_transcriber/correction/agentic/models/schemas.py +46 -0
lyrics_transcriber/correction/agentic/models/utils.py +19 -0
lyrics_transcriber/correction/agentic/observability/__init__.py +5 -0
lyrics_transcriber/correction/agentic/observability/langfuse_integration.py +35 -0
lyrics_transcriber/correction/agentic/observability/metrics.py +46 -0
lyrics_transcriber/correction/agentic/observability/performance.py +19 -0
lyrics_transcriber/correction/agentic/prompts/__init__.py +2 -0
lyrics_transcriber/correction/agentic/prompts/classifier.py +227 -0
lyrics_transcriber/correction/agentic/providers/__init__.py +6 -0
lyrics_transcriber/correction/agentic/providers/base.py +36 -0
lyrics_transcriber/correction/agentic/providers/circuit_breaker.py +145 -0
lyrics_transcriber/correction/agentic/providers/config.py +73 -0
lyrics_transcriber/correction/agentic/providers/constants.py +24 -0
lyrics_transcriber/correction/agentic/providers/health.py +28 -0
lyrics_transcriber/correction/agentic/providers/langchain_bridge.py +212 -0
lyrics_transcriber/correction/agentic/providers/model_factory.py +209 -0
lyrics_transcriber/correction/agentic/providers/response_cache.py +218 -0
lyrics_transcriber/correction/agentic/providers/response_parser.py +111 -0
lyrics_transcriber/correction/agentic/providers/retry_executor.py +127 -0
lyrics_transcriber/correction/agentic/router.py +35 -0
lyrics_transcriber/correction/agentic/workflows/__init__.py +5 -0
lyrics_transcriber/correction/agentic/workflows/consensus_workflow.py +24 -0
lyrics_transcriber/correction/agentic/workflows/correction_graph.py +59 -0
lyrics_transcriber/correction/agentic/workflows/feedback_workflow.py +24 -0
lyrics_transcriber/correction/anchor_sequence.py +919 -0
lyrics_transcriber/correction/corrector.py +760 -0
lyrics_transcriber/correction/feedback/__init__.py +2 -0
lyrics_transcriber/correction/feedback/schemas.py +107 -0
lyrics_transcriber/correction/feedback/store.py +236 -0
lyrics_transcriber/correction/handlers/__init__.py +0 -0
lyrics_transcriber/correction/handlers/base.py +52 -0
lyrics_transcriber/correction/handlers/extend_anchor.py +149 -0
lyrics_transcriber/correction/handlers/levenshtein.py +189 -0
lyrics_transcriber/correction/handlers/llm.py +293 -0
lyrics_transcriber/correction/handlers/llm_providers.py +60 -0
lyrics_transcriber/correction/handlers/no_space_punct_match.py +154 -0
lyrics_transcriber/correction/handlers/relaxed_word_count_match.py +85 -0
lyrics_transcriber/correction/handlers/repeat.py +88 -0
lyrics_transcriber/correction/handlers/sound_alike.py +259 -0
lyrics_transcriber/correction/handlers/syllables_match.py +252 -0
lyrics_transcriber/correction/handlers/word_count_match.py +80 -0
lyrics_transcriber/correction/handlers/word_operations.py +187 -0
lyrics_transcriber/correction/operations.py +352 -0
lyrics_transcriber/correction/phrase_analyzer.py +435 -0
lyrics_transcriber/correction/text_utils.py +30 -0
lyrics_transcriber/frontend/.gitignore +23 -0
lyrics_transcriber/frontend/.yarn/releases/yarn-4.7.0.cjs +935 -0
lyrics_transcriber/frontend/.yarnrc.yml +3 -0
lyrics_transcriber/frontend/README.md +50 -0
lyrics_transcriber/frontend/REPLACE_ALL_FUNCTIONALITY.md +210 -0
lyrics_transcriber/frontend/__init__.py +25 -0
lyrics_transcriber/frontend/eslint.config.js +28 -0
lyrics_transcriber/frontend/index.html +18 -0
lyrics_transcriber/frontend/package.json +42 -0
lyrics_transcriber/frontend/public/android-chrome-192x192.png +0 -0
lyrics_transcriber/frontend/public/android-chrome-512x512.png +0 -0
lyrics_transcriber/frontend/public/apple-touch-icon.png +0 -0
lyrics_transcriber/frontend/public/favicon-16x16.png +0 -0
lyrics_transcriber/frontend/public/favicon-32x32.png +0 -0
lyrics_transcriber/frontend/public/favicon.ico +0 -0
lyrics_transcriber/frontend/public/nomad-karaoke-logo.png +0 -0
lyrics_transcriber/frontend/src/App.tsx +214 -0
lyrics_transcriber/frontend/src/api.ts +254 -0
lyrics_transcriber/frontend/src/components/AIFeedbackModal.tsx +77 -0
lyrics_transcriber/frontend/src/components/AddLyricsModal.tsx +114 -0
lyrics_transcriber/frontend/src/components/AgenticCorrectionMetrics.tsx +204 -0
lyrics_transcriber/frontend/src/components/AudioPlayer.tsx +180 -0
lyrics_transcriber/frontend/src/components/CorrectedWordWithActions.tsx +167 -0
lyrics_transcriber/frontend/src/components/CorrectionAnnotationModal.tsx +359 -0
lyrics_transcriber/frontend/src/components/CorrectionDetailCard.tsx +281 -0
lyrics_transcriber/frontend/src/components/CorrectionMetrics.tsx +162 -0
lyrics_transcriber/frontend/src/components/DurationTimelineView.tsx +257 -0
lyrics_transcriber/frontend/src/components/EditActionBar.tsx +68 -0
lyrics_transcriber/frontend/src/components/EditModal.tsx +702 -0
lyrics_transcriber/frontend/src/components/EditTimelineSection.tsx +496 -0
lyrics_transcriber/frontend/src/components/EditWordList.tsx +379 -0
lyrics_transcriber/frontend/src/components/FileUpload.tsx +77 -0
lyrics_transcriber/frontend/src/components/FindReplaceModal.tsx +467 -0
lyrics_transcriber/frontend/src/components/Header.tsx +413 -0
lyrics_transcriber/frontend/src/components/LyricsAnalyzer.tsx +1387 -0
lyrics_transcriber/frontend/src/components/LyricsSynchronizer/SyncControls.tsx +185 -0
lyrics_transcriber/frontend/src/components/LyricsSynchronizer/TimelineCanvas.tsx +704 -0
lyrics_transcriber/frontend/src/components/LyricsSynchronizer/UpcomingWordsBar.tsx +80 -0
lyrics_transcriber/frontend/src/components/LyricsSynchronizer/index.tsx +905 -0
lyrics_transcriber/frontend/src/components/MetricsDashboard.tsx +51 -0
lyrics_transcriber/frontend/src/components/ModeSelectionModal.tsx +127 -0
lyrics_transcriber/frontend/src/components/ModeSelector.tsx +67 -0
lyrics_transcriber/frontend/src/components/ModelSelector.tsx +23 -0
lyrics_transcriber/frontend/src/components/PreviewVideoSection.tsx +144 -0
lyrics_transcriber/frontend/src/components/ReferenceView.tsx +268 -0
lyrics_transcriber/frontend/src/components/ReplaceAllLyricsModal.tsx +336 -0
lyrics_transcriber/frontend/src/components/ReviewChangesModal.tsx +354 -0
lyrics_transcriber/frontend/src/components/SegmentDetailsModal.tsx +64 -0
lyrics_transcriber/frontend/src/components/TimelineEditor.tsx +376 -0
lyrics_transcriber/frontend/src/components/TimingOffsetModal.tsx +131 -0
lyrics_transcriber/frontend/src/components/TranscriptionView.tsx +256 -0
lyrics_transcriber/frontend/src/components/WordDivider.tsx +187 -0
lyrics_transcriber/frontend/src/components/shared/components/HighlightedText.tsx +379 -0
lyrics_transcriber/frontend/src/components/shared/components/SourceSelector.tsx +56 -0
lyrics_transcriber/frontend/src/components/shared/components/Word.tsx +87 -0
lyrics_transcriber/frontend/src/components/shared/constants.ts +20 -0
lyrics_transcriber/frontend/src/components/shared/hooks/useWordClick.ts +180 -0
lyrics_transcriber/frontend/src/components/shared/styles.ts +13 -0
lyrics_transcriber/frontend/src/components/shared/types.js +2 -0
lyrics_transcriber/frontend/src/components/shared/types.ts +129 -0
lyrics_transcriber/frontend/src/components/shared/utils/keyboardHandlers.ts +177 -0
lyrics_transcriber/frontend/src/components/shared/utils/localStorage.ts +78 -0
lyrics_transcriber/frontend/src/components/shared/utils/referenceLineCalculator.ts +75 -0
lyrics_transcriber/frontend/src/components/shared/utils/segmentOperations.ts +360 -0
lyrics_transcriber/frontend/src/components/shared/utils/timingUtils.ts +110 -0
lyrics_transcriber/frontend/src/components/shared/utils/wordUtils.ts +22 -0
lyrics_transcriber/frontend/src/hooks/useManualSync.ts +435 -0
lyrics_transcriber/frontend/src/main.tsx +17 -0
lyrics_transcriber/frontend/src/theme.ts +177 -0
lyrics_transcriber/frontend/src/types/global.d.ts +9 -0
lyrics_transcriber/frontend/src/types.js +2 -0
lyrics_transcriber/frontend/src/types.ts +199 -0
lyrics_transcriber/frontend/src/validation.ts +132 -0
lyrics_transcriber/frontend/src/vite-env.d.ts +1 -0
lyrics_transcriber/frontend/tsconfig.app.json +26 -0
lyrics_transcriber/frontend/tsconfig.json +25 -0
lyrics_transcriber/frontend/tsconfig.node.json +23 -0
lyrics_transcriber/frontend/tsconfig.tsbuildinfo +1 -0
lyrics_transcriber/frontend/update_version.js +11 -0
lyrics_transcriber/frontend/vite.config.d.ts +2 -0
lyrics_transcriber/frontend/vite.config.js +10 -0
lyrics_transcriber/frontend/vite.config.ts +11 -0
lyrics_transcriber/frontend/web_assets/android-chrome-192x192.png +0 -0
lyrics_transcriber/frontend/web_assets/android-chrome-512x512.png +0 -0
lyrics_transcriber/frontend/web_assets/apple-touch-icon.png +0 -0
lyrics_transcriber/frontend/web_assets/assets/index-BECn1o8Q.js +43288 -0
lyrics_transcriber/frontend/web_assets/assets/index-BECn1o8Q.js.map +1 -0
lyrics_transcriber/frontend/web_assets/favicon-16x16.png +0 -0
lyrics_transcriber/frontend/web_assets/favicon-32x32.png +0 -0
lyrics_transcriber/frontend/web_assets/favicon.ico +0 -0
lyrics_transcriber/frontend/web_assets/index.html +18 -0
lyrics_transcriber/frontend/web_assets/nomad-karaoke-logo.png +0 -0
lyrics_transcriber/frontend/yarn.lock +3752 -0
lyrics_transcriber/lyrics/__init__.py +0 -0
lyrics_transcriber/lyrics/base_lyrics_provider.py +211 -0
lyrics_transcriber/lyrics/file_provider.py +95 -0
lyrics_transcriber/lyrics/genius.py +384 -0
lyrics_transcriber/lyrics/lrclib.py +231 -0
lyrics_transcriber/lyrics/musixmatch.py +156 -0
lyrics_transcriber/lyrics/spotify.py +290 -0
lyrics_transcriber/lyrics/user_input_provider.py +44 -0
lyrics_transcriber/output/__init__.py +0 -0
lyrics_transcriber/output/ass/__init__.py +21 -0
lyrics_transcriber/output/ass/ass.py +2088 -0
lyrics_transcriber/output/ass/ass_specs.txt +732 -0
lyrics_transcriber/output/ass/config.py +180 -0
lyrics_transcriber/output/ass/constants.py +23 -0
lyrics_transcriber/output/ass/event.py +94 -0
lyrics_transcriber/output/ass/formatters.py +132 -0
lyrics_transcriber/output/ass/lyrics_line.py +265 -0
lyrics_transcriber/output/ass/lyrics_screen.py +252 -0
lyrics_transcriber/output/ass/section_detector.py +89 -0
lyrics_transcriber/output/ass/section_screen.py +106 -0
lyrics_transcriber/output/ass/style.py +187 -0
lyrics_transcriber/output/cdg.py +619 -0
lyrics_transcriber/output/cdgmaker/__init__.py +0 -0
lyrics_transcriber/output/cdgmaker/cdg.py +262 -0
lyrics_transcriber/output/cdgmaker/composer.py +2260 -0
lyrics_transcriber/output/cdgmaker/config.py +151 -0
lyrics_transcriber/output/cdgmaker/images/instrumental.png +0 -0
lyrics_transcriber/output/cdgmaker/images/intro.png +0 -0
lyrics_transcriber/output/cdgmaker/pack.py +507 -0
lyrics_transcriber/output/cdgmaker/render.py +346 -0
lyrics_transcriber/output/cdgmaker/transitions/centertexttoplogobottomtext.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/circlein.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/circleout.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/fizzle.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/largecentertexttoplogo.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/rectangle.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/spiral.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/topleftmusicalnotes.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/wipein.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/wipeleft.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/wipeout.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/wiperight.png +0 -0
lyrics_transcriber/output/cdgmaker/utils.py +132 -0
lyrics_transcriber/output/countdown_processor.py +306 -0
lyrics_transcriber/output/fonts/AvenirNext-Bold.ttf +0 -0
lyrics_transcriber/output/fonts/DMSans-VariableFont_opsz,wght.ttf +0 -0
lyrics_transcriber/output/fonts/DMSerifDisplay-Regular.ttf +0 -0
lyrics_transcriber/output/fonts/Oswald-SemiBold.ttf +0 -0
lyrics_transcriber/output/fonts/Zurich_Cn_BT_Bold.ttf +0 -0
lyrics_transcriber/output/fonts/arial.ttf +0 -0
lyrics_transcriber/output/fonts/georgia.ttf +0 -0
lyrics_transcriber/output/fonts/verdana.ttf +0 -0
lyrics_transcriber/output/generator.py +257 -0
lyrics_transcriber/output/lrc_to_cdg.py +61 -0
lyrics_transcriber/output/lyrics_file.py +102 -0
lyrics_transcriber/output/plain_text.py +96 -0
lyrics_transcriber/output/segment_resizer.py +431 -0
lyrics_transcriber/output/subtitles.py +397 -0
lyrics_transcriber/output/video.py +544 -0
lyrics_transcriber/review/__init__.py +0 -0
lyrics_transcriber/review/server.py +676 -0
lyrics_transcriber/storage/__init__.py +0 -0
lyrics_transcriber/storage/dropbox.py +225 -0
lyrics_transcriber/transcribers/__init__.py +0 -0
lyrics_transcriber/transcribers/audioshake.py +379 -0
lyrics_transcriber/transcribers/base_transcriber.py +157 -0
lyrics_transcriber/transcribers/whisper.py +330 -0
lyrics_transcriber/types.py +650 -0
lyrics_transcriber/utils/__init__.py +0 -0
lyrics_transcriber/utils/word_utils.py +27 -0

karaoke_gen/instrumental_review/server.py ADDED Viewed

@@ -0,0 +1,475 @@
+"""
+Local FastAPI server for instrumental review.
+This module provides a local HTTP server that serves the instrumental review
+UI for local CLI usage. It provides the same API endpoints as the cloud backend
+to enable UI reuse.
+Similar pattern to LyricsTranscriber's ReviewServer.
+"""
+import logging
+import os
+from pathlib import Path
+import socket
+import threading
+import webbrowser
+from typing import List, Optional
+from fastapi import FastAPI, HTTPException, UploadFile, File
+from fastapi.middleware.cors import CORSMiddleware
+from fastapi.responses import FileResponse, HTMLResponse
+from pydantic import BaseModel
+import shutil
+import tempfile
+import uvicorn
+from pydub import AudioSegment
+from karaoke_gen.instrumental_review import (
+    AnalysisResult,
+    AudioAnalyzer,
+    AudioEditor,
+    MuteRegion,
+    WaveformGenerator,
+)
+logger = logging.getLogger(__name__)
+# Request/Response Models
+class MuteRegionRequest(BaseModel):
+    """Request payload for one time span to mute, with bounds given in seconds."""
+    start_seconds: float
+    end_seconds: float
+class CreateCustomRequest(BaseModel):
+    """Request body carrying the list of regions to mute when building a custom instrumental."""
+    mute_regions: List[MuteRegionRequest]
+class SelectionRequest(BaseModel):
+    """Request body carrying the name of the instrumental option the user selected."""
+    selection: str
+class InstrumentalReviewServer:
+    """
+    Local FastAPI server for instrumental review UI.
+    This server provides a web interface for reviewing and selecting
+    instrumental tracks in the local CLI workflow. It serves the same
+    API endpoints as the cloud backend to enable UI reuse.
+    """
+    def __init__(
+        self,
+        output_dir: str,
+        base_name: str,
+        analysis: AnalysisResult,
+        waveform_path: str,
+        backing_vocals_path: str,
+        clean_instrumental_path: str,
+        with_backing_path: Optional[str] = None,
+        original_audio_path: Optional[str] = None,
+    ):
+        """
+        Initialize the review server.
+        Args:
+            output_dir: Directory containing the audio files
+            base_name: Base name for output files (e.g., "Artist - Title")
+            analysis: Analysis result from AudioAnalyzer
+            waveform_path: Path to the waveform image
+            backing_vocals_path: Path to the backing vocals audio file
+            clean_instrumental_path: Path to the clean instrumental audio file
+            with_backing_path: Path to the instrumental with backing vocals
+            original_audio_path: Path to the original audio file (with vocals)
+        """
+        self.output_dir = output_dir
+        self.base_name = base_name
+        self.analysis = analysis
+        self.waveform_path = waveform_path
+        self.backing_vocals_path = backing_vocals_path
+        self.clean_instrumental_path = clean_instrumental_path
+        self.with_backing_path = with_backing_path
+        self.original_audio_path = original_audio_path
+        self.custom_instrumental_path: Optional[str] = None
+        self.uploaded_instrumental_path: Optional[str] = None
+        self.selection: Optional[str] = None
+        self._app: Optional[FastAPI] = None
+        self._server_thread: Optional[threading.Thread] = None
+        self._selection_event = threading.Event()
+        self._shutdown_event = threading.Event()
+    def _create_app(self) -> FastAPI:
+        """Create and configure the FastAPI application."""
+        app = FastAPI(title="Instrumental Review", docs_url=None, redoc_url=None)
+        # Configure CORS
+        app.add_middleware(
+            CORSMiddleware,
+            allow_origins=["*"],
+            allow_credentials=True,
+            allow_methods=["*"],
+            allow_headers=["*"],
+        )
+        # Register routes
+        self._register_routes(app)
+        return app
+    def _register_routes(self, app: FastAPI) -> None:
+        """Register API routes."""
+        @app.get("/")
+        async def serve_frontend():
+            """Serve the frontend HTML."""
+            return HTMLResponse(content=self._get_frontend_html())
+        @app.get("/api/jobs/local/instrumental-analysis")
+        async def get_analysis():
+            """Get analysis data for the instrumental review."""
+            return {
+                "job_id": "local",
+                "artist": self.base_name.split(" - ")[0] if " - " in self.base_name else "",
+                "title": self.base_name.split(" - ")[1] if " - " in self.base_name else self.base_name,
+                "status": "awaiting_instrumental_selection",
+                "analysis": {
+                    "has_audible_content": self.analysis.has_audible_content,
+                    "total_duration_seconds": self.analysis.total_duration_seconds,
+                    "audible_segments": [
+                        {
+                            "start_seconds": seg.start_seconds,
+                            "end_seconds": seg.end_seconds,
+                            "duration_seconds": seg.duration_seconds,
+                            "avg_amplitude_db": seg.avg_amplitude_db,
+                            "peak_amplitude_db": seg.peak_amplitude_db,
+                        }
+                        for seg in self.analysis.audible_segments
+                    ],
+                    "recommended_selection": self.analysis.recommended_selection.value,
+                    "total_audible_duration_seconds": self.analysis.total_audible_duration_seconds,
+                    "audible_percentage": self.analysis.audible_percentage,
+                    "silence_threshold_db": self.analysis.silence_threshold_db,
+                },
+                "audio_urls": {
+                    "clean_instrumental": "/api/audio/clean_instrumental" if self.clean_instrumental_path else None,
+                    "backing_vocals": "/api/audio/backing_vocals" if self.backing_vocals_path else None,
+                    "with_backing": "/api/audio/with_backing" if self.with_backing_path else None,
+                    "custom_instrumental": "/api/audio/custom_instrumental" if self.custom_instrumental_path else None,
+                    "uploaded_instrumental": "/api/audio/uploaded_instrumental" if self.uploaded_instrumental_path else None,
+                    "original": "/api/audio/original" if self.original_audio_path else None,
+                },
+                "waveform_url": "/api/waveform" if self.waveform_path else None,
+                "has_custom_instrumental": self.custom_instrumental_path is not None,
+                "has_uploaded_instrumental": self.uploaded_instrumental_path is not None,
+                "has_original": self.original_audio_path is not None,
+            }
+        @app.get("/api/jobs/local/waveform-data")
+        async def get_waveform_data(num_points: int = 600):
+            """Get waveform amplitude data for client-side rendering."""
+            # Validate num_points parameter
+            if num_points <= 0 or num_points > 10000:
+                raise HTTPException(
+                    status_code=400,
+                    detail="num_points must be between 1 and 10000"
+                )
+            if not self.backing_vocals_path or not os.path.exists(self.backing_vocals_path):
+                raise HTTPException(status_code=404, detail="Backing vocals file not found")
+            try:
+                generator = WaveformGenerator()
+                amplitudes, duration = generator.generate_data_only(self.backing_vocals_path, num_points)
+                return {"amplitudes": amplitudes, "duration": duration}
+            except Exception as e:
+                logger.exception(f"Error generating waveform data: {e}")
+                raise HTTPException(status_code=500, detail=str(e)) from e
+        @app.get("/api/audio/{stem_type}")
+        async def stream_audio(stem_type: str):
+            """Stream audio file."""
+            path_map = {
+                "clean_instrumental": self.clean_instrumental_path,
+                "backing_vocals": self.backing_vocals_path,
+                "with_backing": self.with_backing_path,
+                "custom_instrumental": self.custom_instrumental_path,
+                "uploaded_instrumental": self.uploaded_instrumental_path,
+                "original": self.original_audio_path,
+            }
+            audio_path = path_map.get(stem_type)
+            if not audio_path or not os.path.exists(audio_path):
+                raise HTTPException(status_code=404, detail=f"Audio file not found: {stem_type}")
+            # Determine content type
+            ext = os.path.splitext(audio_path)[1].lower()
+            content_types = {
+                ".flac": "audio/flac",
+                ".mp3": "audio/mpeg",
+                ".wav": "audio/wav",
+            }
+            content_type = content_types.get(ext, "application/octet-stream")
+            return FileResponse(audio_path, media_type=content_type)
+        @app.get("/api/waveform")
+        async def get_waveform_image():
+            """Serve waveform image."""
+            if not self.waveform_path or not os.path.exists(self.waveform_path):
+                raise HTTPException(status_code=404, detail="Waveform image not found")
+            return FileResponse(self.waveform_path, media_type="image/png")
+        @app.post("/api/jobs/local/create-custom-instrumental")
+        async def create_custom_instrumental(request: CreateCustomRequest):
+            """Create a custom instrumental with muted regions."""
+            if not request.mute_regions:
+                raise HTTPException(status_code=400, detail="No mute regions provided")
+            try:
+                mute_regions = [
+                    MuteRegion(
+                        start_seconds=r.start_seconds,
+                        end_seconds=r.end_seconds,
+                    )
+                    for r in request.mute_regions
+                ]
+                editor = AudioEditor()
+                output_path = os.path.join(
+                    self.output_dir,
+                    f"{self.base_name} (Instrumental Custom).flac"
+                )
+                result = editor.create_custom_instrumental(
+                    clean_instrumental_path=self.clean_instrumental_path,
+                    backing_vocals_path=self.backing_vocals_path,
+                    mute_regions=mute_regions,
+                    output_path=output_path,
+                )
+                self.custom_instrumental_path = result.output_path
+                return {
+                    "status": "success",
+                    "custom_instrumental_url": "/api/audio/custom_instrumental",
+                    "statistics": {
+                        "mute_regions_applied": len(result.mute_regions_applied),
+                        "total_muted_duration_seconds": result.total_muted_duration_seconds,
+                        "output_duration_seconds": result.output_duration_seconds,
+                    },
+                }
+            except Exception as e:
+                logger.exception(f"Error creating custom instrumental: {e}")
+                raise HTTPException(status_code=500, detail=str(e)) from e
+        @app.post("/api/jobs/local/upload-instrumental")
+        async def upload_instrumental(file: UploadFile = File(...)):
+            """Upload a custom instrumental audio file."""
+            # Validate file type
+            allowed_extensions = {".flac", ".mp3", ".wav", ".m4a", ".ogg"}
+            ext = os.path.splitext(file.filename or "")[1].lower()
+            if ext not in allowed_extensions:
+                raise HTTPException(
+                    status_code=400,
+                    detail=f"Invalid file type. Allowed: {', '.join(allowed_extensions)}"
+                )
+            tmp_path = None
+            file_moved = False
+            try:
+                # Save to temp file first to validate
+                with tempfile.NamedTemporaryFile(delete=False, suffix=ext) as tmp:
+                    shutil.copyfileobj(file.file, tmp)
+                    tmp_path = tmp.name
+                # Load and check duration
+                uploaded_audio = AudioSegment.from_file(tmp_path)
+                uploaded_duration = len(uploaded_audio) / 1000.0  # ms to seconds
+                expected_duration = self.analysis.total_duration_seconds
+                duration_diff = abs(uploaded_duration - expected_duration)
+                if duration_diff > 0.5:
+                    raise HTTPException(
+                        status_code=400,
+                        detail=f"Duration mismatch: uploaded file is {uploaded_duration:.2f}s, "
+                               f"expected {expected_duration:.2f}s (±0.5s allowed)"
+                    )
+                # Move to final location
+                output_path = os.path.join(
+                    self.output_dir,
+                    f"{self.base_name} (Instrumental Uploaded){ext}"
+                )
+                shutil.move(tmp_path, output_path)
+                file_moved = True
+                self.uploaded_instrumental_path = output_path
+                return {
+                    "status": "success",
+                    "uploaded_instrumental_url": "/api/audio/uploaded_instrumental",
+                    "duration_seconds": uploaded_duration,
+                    "filename": file.filename,
+                }
+            except HTTPException:
+                raise
+            except Exception as e:
+                logger.exception(f"Error uploading instrumental: {e}")
+                raise HTTPException(status_code=500, detail=str(e)) from e
+            finally:
+                # Clean up temp file if it wasn't moved
+                if tmp_path and not file_moved and os.path.exists(tmp_path):
+                    try:
+                        os.unlink(tmp_path)
+                    except OSError:
+                        pass  # Best effort cleanup
+        @app.post("/api/jobs/local/select-instrumental")
+        async def select_instrumental(request: SelectionRequest):
+            """Submit instrumental selection."""
+            if request.selection not in ("clean", "with_backing", "custom", "uploaded", "original"):
+                raise HTTPException(status_code=400, detail=f"Invalid selection: {request.selection}")
+            self.selection = request.selection
+            self._selection_event.set()
+            return {"status": "success", "selection": request.selection}
+    @staticmethod
+    def _get_static_dir() -> Path:
+        """Return the ``static`` directory located next to this module file."""
+        module_dir = Path(__file__).parent
+        return module_dir.joinpath("static")
+    def _get_frontend_html(self) -> str:
+        """Load the frontend page from static/index.html, or return an error page."""
+        index_path = self._get_static_dir() / "index.html"
+        if not index_path.exists():
+            # The asset is missing: serve a minimal page that says so.
+            return """<!DOCTYPE html>
+<html>
+<head><title>Error</title></head>
+<body style="background:#1a1a1a;color:#fff;font-family:sans-serif;padding:2rem;">
+<h1>Frontend assets not found</h1>
+<p>The static/index.html file is missing from the instrumental_review module.</p>
+</body>
+</html>"""
+        return index_path.read_text(encoding="utf-8")
+    @staticmethod
+    def _is_port_available(host: str, port: int) -> bool:
+        """
+        Check if a port is available for binding.
+        Args:
+            host: Address to test the bind against
+            port: TCP port number to probe
+        Returns:
+            True if a fresh IPv4 TCP socket could bind to (host, port),
+            False if the bind failed or the port number is out of range
+        """
+        try:
+            with socket.socket(socket.AF_INET, socket.SOCK_STREAM) as sock:
+                # SO_REUSEADDR lets the probe ignore lingering TIME_WAIT sockets on
+                # POSIX. On Windows the same option allows binding to a port that
+                # another socket is actively using, which would make a busy port
+                # look free, so it is skipped there (the same rule that
+                # socket.create_server applies).
+                if os.name not in ("nt", "cygwin"):
+                    sock.setsockopt(socket.SOL_SOCKET, socket.SO_REUSEADDR, 1)
+                sock.bind((host, port))
+                return True
+        except (OSError, OverflowError):
+            # OverflowError is what bind() raises for a port outside 0-65535;
+            # such a port is simply not available.
+            return False
+    @staticmethod
+    def _find_available_port(host: str, preferred_port: int, max_attempts: int = 100) -> int:
+        """
+        Find an available port, starting with the preferred port.
+        Args:
+            host: Host to bind to
+            preferred_port: The preferred port to try first
+            max_attempts: Maximum number of consecutive ports to try,
+                counting the preferred port itself
+        Returns:
+            An available port number
+        Raises:
+            RuntimeError: If no available port could be found
+        """
+        # Try the preferred port first
+        if InstrumentalReviewServer._is_port_available(host, preferred_port):
+            return preferred_port
+        # Try subsequent ports, never going past the top of the valid port range
+        upper_bound = min(preferred_port + max_attempts, 65536)
+        for port in range(preferred_port + 1, upper_bound):
+            if InstrumentalReviewServer._is_port_available(host, port):
+                return port
+        # Last resort: let the OS assign a port. The probe socket is closed before
+        # returning, so the port is only known to have been free at that moment.
+        try:
+            with socket.socket(socket.AF_INET, socket.SOCK_STREAM) as sock:
+                sock.bind((host, 0))
+                return sock.getsockname()[1]
+        except OSError as e:
+            # Surface the failure as the documented exception type
+            raise RuntimeError(f"Could not find an available port on {host}") from e
+    def start_and_open_browser(self, port: int = 8765) -> str:
+        """
+        Start server, open browser, and block until selection is submitted.
+        Args:
+            port: Preferred port to run the server on. If unavailable, will
+                  automatically find an available port.
+        Returns:
+            The user's selection ("clean", "with_backing", "custom",
+            "uploaded", or "original")
+        Raises:
+            RuntimeError: If the server thread exits before it starts serving
+        """
+        import time
+        self._app = self._create_app()
+        # Find an available port (handles concurrent CLI instances)
+        host = "127.0.0.1"
+        actual_port = self._find_available_port(host, port)
+        if actual_port != port:
+            logger.info(f"Port {port} in use, using port {actual_port} instead")
+        # Run uvicorn in a separate thread
+        config = uvicorn.Config(
+            self._app,
+            host=host,
+            port=actual_port,
+            log_level="warning",
+        )
+        server = uvicorn.Server(config)
+        self._server_thread = threading.Thread(target=server.run, daemon=True)
+        self._server_thread.start()
+        # Wait until uvicorn reports that it is serving instead of sleeping for a
+        # fixed interval, so the browser is not pointed at a port nobody listens on.
+        deadline = time.monotonic() + 5.0
+        while not server.started:
+            if not self._server_thread.is_alive():
+                # The server thread ended without ever serving (for example the
+                # port was taken in the meantime); waiting for a selection would
+                # block forever.
+                raise RuntimeError(
+                    f"Instrumental review server failed to start on port {actual_port}"
+                )
+            if time.monotonic() >= deadline:
+                logger.warning("Instrumental review server is slow to start; continuing anyway")
+                break
+            time.sleep(0.05)
+        url = f"http://localhost:{actual_port}/"
+        logger.info(f"Instrumental review server started at {url}")
+        # Open browser
+        webbrowser.open(url)
+        # Wait for selection
+        logger.info("Waiting for instrumental selection...")
+        self._selection_event.wait()
+        # Give a moment for response to be sent
+        time.sleep(0.5)
+        return self.get_selection()
+    def stop(self) -> None:
+        """Signal shutdown by setting the internal shutdown event."""
+        shutdown_flag = self._shutdown_event
+        shutdown_flag.set()
+    def get_selection(self) -> str:
+        """Return the stored selection; raise ValueError if none was submitted."""
+        chosen = self.selection
+        if chosen is not None:
+            return chosen
+        raise ValueError("No selection has been made")
+    def get_custom_instrumental_path(self) -> Optional[str]:
+        """Return the stored custom instrumental path, or None when there is none."""
+        custom_path = self.custom_instrumental_path
+        return custom_path
+    def get_uploaded_instrumental_path(self) -> Optional[str]:
+        """Return the stored uploaded instrumental path, or None when there is none."""
+        uploaded_path = self.uploaded_instrumental_path
+        return uploaded_path