PyPI - karaoke-gen - Versions diffs - 0.75.54__py3-none-any.whl - Mend

karaoke-gen 0.75.54__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of karaoke-gen might be problematic. Click here for more details.

Files changed (287) hide show

karaoke_gen/__init__.py +38 -0
karaoke_gen/audio_fetcher.py +1614 -0
karaoke_gen/audio_processor.py +790 -0
karaoke_gen/config.py +83 -0
karaoke_gen/file_handler.py +387 -0
karaoke_gen/instrumental_review/__init__.py +45 -0
karaoke_gen/instrumental_review/analyzer.py +408 -0
karaoke_gen/instrumental_review/editor.py +322 -0
karaoke_gen/instrumental_review/models.py +171 -0
karaoke_gen/instrumental_review/server.py +475 -0
karaoke_gen/instrumental_review/static/index.html +1529 -0
karaoke_gen/instrumental_review/waveform.py +409 -0
karaoke_gen/karaoke_finalise/__init__.py +1 -0
karaoke_gen/karaoke_finalise/karaoke_finalise.py +1833 -0
karaoke_gen/karaoke_gen.py +1026 -0
karaoke_gen/lyrics_processor.py +474 -0
karaoke_gen/metadata.py +160 -0
karaoke_gen/pipeline/__init__.py +87 -0
karaoke_gen/pipeline/base.py +215 -0
karaoke_gen/pipeline/context.py +230 -0
karaoke_gen/pipeline/executors/__init__.py +21 -0
karaoke_gen/pipeline/executors/local.py +159 -0
karaoke_gen/pipeline/executors/remote.py +257 -0
karaoke_gen/pipeline/stages/__init__.py +27 -0
karaoke_gen/pipeline/stages/finalize.py +202 -0
karaoke_gen/pipeline/stages/render.py +165 -0
karaoke_gen/pipeline/stages/screens.py +139 -0
karaoke_gen/pipeline/stages/separation.py +191 -0
karaoke_gen/pipeline/stages/transcription.py +191 -0
karaoke_gen/resources/AvenirNext-Bold.ttf +0 -0
karaoke_gen/resources/Montserrat-Bold.ttf +0 -0
karaoke_gen/resources/Oswald-Bold.ttf +0 -0
karaoke_gen/resources/Oswald-SemiBold.ttf +0 -0
karaoke_gen/resources/Zurich_Cn_BT_Bold.ttf +0 -0
karaoke_gen/style_loader.py +531 -0
karaoke_gen/utils/__init__.py +18 -0
karaoke_gen/utils/bulk_cli.py +492 -0
karaoke_gen/utils/cli_args.py +432 -0
karaoke_gen/utils/gen_cli.py +978 -0
karaoke_gen/utils/remote_cli.py +3268 -0
karaoke_gen/video_background_processor.py +351 -0
karaoke_gen/video_generator.py +424 -0
karaoke_gen-0.75.54.dist-info/METADATA +718 -0
karaoke_gen-0.75.54.dist-info/RECORD +287 -0
karaoke_gen-0.75.54.dist-info/WHEEL +4 -0
karaoke_gen-0.75.54.dist-info/entry_points.txt +5 -0
karaoke_gen-0.75.54.dist-info/licenses/LICENSE +21 -0
lyrics_transcriber/__init__.py +10 -0
lyrics_transcriber/cli/__init__.py +0 -0
lyrics_transcriber/cli/cli_main.py +285 -0
lyrics_transcriber/core/__init__.py +0 -0
lyrics_transcriber/core/config.py +50 -0
lyrics_transcriber/core/controller.py +594 -0
lyrics_transcriber/correction/__init__.py +0 -0
lyrics_transcriber/correction/agentic/__init__.py +9 -0
lyrics_transcriber/correction/agentic/adapter.py +71 -0
lyrics_transcriber/correction/agentic/agent.py +313 -0
lyrics_transcriber/correction/agentic/feedback/aggregator.py +12 -0
lyrics_transcriber/correction/agentic/feedback/collector.py +17 -0
lyrics_transcriber/correction/agentic/feedback/retention.py +24 -0
lyrics_transcriber/correction/agentic/feedback/store.py +76 -0
lyrics_transcriber/correction/agentic/handlers/__init__.py +24 -0
lyrics_transcriber/correction/agentic/handlers/ambiguous.py +44 -0
lyrics_transcriber/correction/agentic/handlers/background_vocals.py +68 -0
lyrics_transcriber/correction/agentic/handlers/base.py +51 -0
lyrics_transcriber/correction/agentic/handlers/complex_multi_error.py +46 -0
lyrics_transcriber/correction/agentic/handlers/extra_words.py +74 -0
lyrics_transcriber/correction/agentic/handlers/no_error.py +42 -0
lyrics_transcriber/correction/agentic/handlers/punctuation.py +44 -0
lyrics_transcriber/correction/agentic/handlers/registry.py +60 -0
lyrics_transcriber/correction/agentic/handlers/repeated_section.py +44 -0
lyrics_transcriber/correction/agentic/handlers/sound_alike.py +126 -0
lyrics_transcriber/correction/agentic/models/__init__.py +5 -0
lyrics_transcriber/correction/agentic/models/ai_correction.py +31 -0
lyrics_transcriber/correction/agentic/models/correction_session.py +30 -0
lyrics_transcriber/correction/agentic/models/enums.py +38 -0
lyrics_transcriber/correction/agentic/models/human_feedback.py +30 -0
lyrics_transcriber/correction/agentic/models/learning_data.py +26 -0
lyrics_transcriber/correction/agentic/models/observability_metrics.py +28 -0
lyrics_transcriber/correction/agentic/models/schemas.py +46 -0
lyrics_transcriber/correction/agentic/models/utils.py +19 -0
lyrics_transcriber/correction/agentic/observability/__init__.py +5 -0
lyrics_transcriber/correction/agentic/observability/langfuse_integration.py +35 -0
lyrics_transcriber/correction/agentic/observability/metrics.py +46 -0
lyrics_transcriber/correction/agentic/observability/performance.py +19 -0
lyrics_transcriber/correction/agentic/prompts/__init__.py +2 -0
lyrics_transcriber/correction/agentic/prompts/classifier.py +227 -0
lyrics_transcriber/correction/agentic/providers/__init__.py +6 -0
lyrics_transcriber/correction/agentic/providers/base.py +36 -0
lyrics_transcriber/correction/agentic/providers/circuit_breaker.py +145 -0
lyrics_transcriber/correction/agentic/providers/config.py +73 -0
lyrics_transcriber/correction/agentic/providers/constants.py +24 -0
lyrics_transcriber/correction/agentic/providers/health.py +28 -0
lyrics_transcriber/correction/agentic/providers/langchain_bridge.py +212 -0
lyrics_transcriber/correction/agentic/providers/model_factory.py +209 -0
lyrics_transcriber/correction/agentic/providers/response_cache.py +218 -0
lyrics_transcriber/correction/agentic/providers/response_parser.py +111 -0
lyrics_transcriber/correction/agentic/providers/retry_executor.py +127 -0
lyrics_transcriber/correction/agentic/router.py +35 -0
lyrics_transcriber/correction/agentic/workflows/__init__.py +5 -0
lyrics_transcriber/correction/agentic/workflows/consensus_workflow.py +24 -0
lyrics_transcriber/correction/agentic/workflows/correction_graph.py +59 -0
lyrics_transcriber/correction/agentic/workflows/feedback_workflow.py +24 -0
lyrics_transcriber/correction/anchor_sequence.py +919 -0
lyrics_transcriber/correction/corrector.py +760 -0
lyrics_transcriber/correction/feedback/__init__.py +2 -0
lyrics_transcriber/correction/feedback/schemas.py +107 -0
lyrics_transcriber/correction/feedback/store.py +236 -0
lyrics_transcriber/correction/handlers/__init__.py +0 -0
lyrics_transcriber/correction/handlers/base.py +52 -0
lyrics_transcriber/correction/handlers/extend_anchor.py +149 -0
lyrics_transcriber/correction/handlers/levenshtein.py +189 -0
lyrics_transcriber/correction/handlers/llm.py +293 -0
lyrics_transcriber/correction/handlers/llm_providers.py +60 -0
lyrics_transcriber/correction/handlers/no_space_punct_match.py +154 -0
lyrics_transcriber/correction/handlers/relaxed_word_count_match.py +85 -0
lyrics_transcriber/correction/handlers/repeat.py +88 -0
lyrics_transcriber/correction/handlers/sound_alike.py +259 -0
lyrics_transcriber/correction/handlers/syllables_match.py +252 -0
lyrics_transcriber/correction/handlers/word_count_match.py +80 -0
lyrics_transcriber/correction/handlers/word_operations.py +187 -0
lyrics_transcriber/correction/operations.py +352 -0
lyrics_transcriber/correction/phrase_analyzer.py +435 -0
lyrics_transcriber/correction/text_utils.py +30 -0
lyrics_transcriber/frontend/.gitignore +23 -0
lyrics_transcriber/frontend/.yarn/releases/yarn-4.7.0.cjs +935 -0
lyrics_transcriber/frontend/.yarnrc.yml +3 -0
lyrics_transcriber/frontend/README.md +50 -0
lyrics_transcriber/frontend/REPLACE_ALL_FUNCTIONALITY.md +210 -0
lyrics_transcriber/frontend/__init__.py +25 -0
lyrics_transcriber/frontend/eslint.config.js +28 -0
lyrics_transcriber/frontend/index.html +18 -0
lyrics_transcriber/frontend/package.json +42 -0
lyrics_transcriber/frontend/public/android-chrome-192x192.png +0 -0
lyrics_transcriber/frontend/public/android-chrome-512x512.png +0 -0
lyrics_transcriber/frontend/public/apple-touch-icon.png +0 -0
lyrics_transcriber/frontend/public/favicon-16x16.png +0 -0
lyrics_transcriber/frontend/public/favicon-32x32.png +0 -0
lyrics_transcriber/frontend/public/favicon.ico +0 -0
lyrics_transcriber/frontend/public/nomad-karaoke-logo.png +0 -0
lyrics_transcriber/frontend/src/App.tsx +214 -0
lyrics_transcriber/frontend/src/api.ts +254 -0
lyrics_transcriber/frontend/src/components/AIFeedbackModal.tsx +77 -0
lyrics_transcriber/frontend/src/components/AddLyricsModal.tsx +114 -0
lyrics_transcriber/frontend/src/components/AgenticCorrectionMetrics.tsx +204 -0
lyrics_transcriber/frontend/src/components/AudioPlayer.tsx +180 -0
lyrics_transcriber/frontend/src/components/CorrectedWordWithActions.tsx +167 -0
lyrics_transcriber/frontend/src/components/CorrectionAnnotationModal.tsx +359 -0
lyrics_transcriber/frontend/src/components/CorrectionDetailCard.tsx +281 -0
lyrics_transcriber/frontend/src/components/CorrectionMetrics.tsx +162 -0
lyrics_transcriber/frontend/src/components/DurationTimelineView.tsx +257 -0
lyrics_transcriber/frontend/src/components/EditActionBar.tsx +68 -0
lyrics_transcriber/frontend/src/components/EditModal.tsx +702 -0
lyrics_transcriber/frontend/src/components/EditTimelineSection.tsx +496 -0
lyrics_transcriber/frontend/src/components/EditWordList.tsx +379 -0
lyrics_transcriber/frontend/src/components/FileUpload.tsx +77 -0
lyrics_transcriber/frontend/src/components/FindReplaceModal.tsx +467 -0
lyrics_transcriber/frontend/src/components/Header.tsx +413 -0
lyrics_transcriber/frontend/src/components/LyricsAnalyzer.tsx +1387 -0
lyrics_transcriber/frontend/src/components/LyricsSynchronizer/SyncControls.tsx +185 -0
lyrics_transcriber/frontend/src/components/LyricsSynchronizer/TimelineCanvas.tsx +704 -0
lyrics_transcriber/frontend/src/components/LyricsSynchronizer/UpcomingWordsBar.tsx +80 -0
lyrics_transcriber/frontend/src/components/LyricsSynchronizer/index.tsx +905 -0
lyrics_transcriber/frontend/src/components/MetricsDashboard.tsx +51 -0
lyrics_transcriber/frontend/src/components/ModeSelectionModal.tsx +127 -0
lyrics_transcriber/frontend/src/components/ModeSelector.tsx +67 -0
lyrics_transcriber/frontend/src/components/ModelSelector.tsx +23 -0
lyrics_transcriber/frontend/src/components/PreviewVideoSection.tsx +144 -0
lyrics_transcriber/frontend/src/components/ReferenceView.tsx +268 -0
lyrics_transcriber/frontend/src/components/ReplaceAllLyricsModal.tsx +336 -0
lyrics_transcriber/frontend/src/components/ReviewChangesModal.tsx +354 -0
lyrics_transcriber/frontend/src/components/SegmentDetailsModal.tsx +64 -0
lyrics_transcriber/frontend/src/components/TimelineEditor.tsx +376 -0
lyrics_transcriber/frontend/src/components/TimingOffsetModal.tsx +131 -0
lyrics_transcriber/frontend/src/components/TranscriptionView.tsx +256 -0
lyrics_transcriber/frontend/src/components/WordDivider.tsx +187 -0
lyrics_transcriber/frontend/src/components/shared/components/HighlightedText.tsx +379 -0
lyrics_transcriber/frontend/src/components/shared/components/SourceSelector.tsx +56 -0
lyrics_transcriber/frontend/src/components/shared/components/Word.tsx +87 -0
lyrics_transcriber/frontend/src/components/shared/constants.ts +20 -0
lyrics_transcriber/frontend/src/components/shared/hooks/useWordClick.ts +180 -0
lyrics_transcriber/frontend/src/components/shared/styles.ts +13 -0
lyrics_transcriber/frontend/src/components/shared/types.js +2 -0
lyrics_transcriber/frontend/src/components/shared/types.ts +129 -0
lyrics_transcriber/frontend/src/components/shared/utils/keyboardHandlers.ts +177 -0
lyrics_transcriber/frontend/src/components/shared/utils/localStorage.ts +78 -0
lyrics_transcriber/frontend/src/components/shared/utils/referenceLineCalculator.ts +75 -0
lyrics_transcriber/frontend/src/components/shared/utils/segmentOperations.ts +360 -0
lyrics_transcriber/frontend/src/components/shared/utils/timingUtils.ts +110 -0
lyrics_transcriber/frontend/src/components/shared/utils/wordUtils.ts +22 -0
lyrics_transcriber/frontend/src/hooks/useManualSync.ts +435 -0
lyrics_transcriber/frontend/src/main.tsx +17 -0
lyrics_transcriber/frontend/src/theme.ts +177 -0
lyrics_transcriber/frontend/src/types/global.d.ts +9 -0
lyrics_transcriber/frontend/src/types.js +2 -0
lyrics_transcriber/frontend/src/types.ts +199 -0
lyrics_transcriber/frontend/src/validation.ts +132 -0
lyrics_transcriber/frontend/src/vite-env.d.ts +1 -0
lyrics_transcriber/frontend/tsconfig.app.json +26 -0
lyrics_transcriber/frontend/tsconfig.json +25 -0
lyrics_transcriber/frontend/tsconfig.node.json +23 -0
lyrics_transcriber/frontend/tsconfig.tsbuildinfo +1 -0
lyrics_transcriber/frontend/update_version.js +11 -0
lyrics_transcriber/frontend/vite.config.d.ts +2 -0
lyrics_transcriber/frontend/vite.config.js +10 -0
lyrics_transcriber/frontend/vite.config.ts +11 -0
lyrics_transcriber/frontend/web_assets/android-chrome-192x192.png +0 -0
lyrics_transcriber/frontend/web_assets/android-chrome-512x512.png +0 -0
lyrics_transcriber/frontend/web_assets/apple-touch-icon.png +0 -0
lyrics_transcriber/frontend/web_assets/assets/index-BECn1o8Q.js +43288 -0
lyrics_transcriber/frontend/web_assets/assets/index-BECn1o8Q.js.map +1 -0
lyrics_transcriber/frontend/web_assets/favicon-16x16.png +0 -0
lyrics_transcriber/frontend/web_assets/favicon-32x32.png +0 -0
lyrics_transcriber/frontend/web_assets/favicon.ico +0 -0
lyrics_transcriber/frontend/web_assets/index.html +18 -0
lyrics_transcriber/frontend/web_assets/nomad-karaoke-logo.png +0 -0
lyrics_transcriber/frontend/yarn.lock +3752 -0
lyrics_transcriber/lyrics/__init__.py +0 -0
lyrics_transcriber/lyrics/base_lyrics_provider.py +211 -0
lyrics_transcriber/lyrics/file_provider.py +95 -0
lyrics_transcriber/lyrics/genius.py +384 -0
lyrics_transcriber/lyrics/lrclib.py +231 -0
lyrics_transcriber/lyrics/musixmatch.py +156 -0
lyrics_transcriber/lyrics/spotify.py +290 -0
lyrics_transcriber/lyrics/user_input_provider.py +44 -0
lyrics_transcriber/output/__init__.py +0 -0
lyrics_transcriber/output/ass/__init__.py +21 -0
lyrics_transcriber/output/ass/ass.py +2088 -0
lyrics_transcriber/output/ass/ass_specs.txt +732 -0
lyrics_transcriber/output/ass/config.py +180 -0
lyrics_transcriber/output/ass/constants.py +23 -0
lyrics_transcriber/output/ass/event.py +94 -0
lyrics_transcriber/output/ass/formatters.py +132 -0
lyrics_transcriber/output/ass/lyrics_line.py +265 -0
lyrics_transcriber/output/ass/lyrics_screen.py +252 -0
lyrics_transcriber/output/ass/section_detector.py +89 -0
lyrics_transcriber/output/ass/section_screen.py +106 -0
lyrics_transcriber/output/ass/style.py +187 -0
lyrics_transcriber/output/cdg.py +619 -0
lyrics_transcriber/output/cdgmaker/__init__.py +0 -0
lyrics_transcriber/output/cdgmaker/cdg.py +262 -0
lyrics_transcriber/output/cdgmaker/composer.py +2260 -0
lyrics_transcriber/output/cdgmaker/config.py +151 -0
lyrics_transcriber/output/cdgmaker/images/instrumental.png +0 -0
lyrics_transcriber/output/cdgmaker/images/intro.png +0 -0
lyrics_transcriber/output/cdgmaker/pack.py +507 -0
lyrics_transcriber/output/cdgmaker/render.py +346 -0
lyrics_transcriber/output/cdgmaker/transitions/centertexttoplogobottomtext.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/circlein.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/circleout.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/fizzle.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/largecentertexttoplogo.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/rectangle.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/spiral.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/topleftmusicalnotes.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/wipein.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/wipeleft.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/wipeout.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/wiperight.png +0 -0
lyrics_transcriber/output/cdgmaker/utils.py +132 -0
lyrics_transcriber/output/countdown_processor.py +306 -0
lyrics_transcriber/output/fonts/AvenirNext-Bold.ttf +0 -0
lyrics_transcriber/output/fonts/DMSans-VariableFont_opsz,wght.ttf +0 -0
lyrics_transcriber/output/fonts/DMSerifDisplay-Regular.ttf +0 -0
lyrics_transcriber/output/fonts/Oswald-SemiBold.ttf +0 -0
lyrics_transcriber/output/fonts/Zurich_Cn_BT_Bold.ttf +0 -0
lyrics_transcriber/output/fonts/arial.ttf +0 -0
lyrics_transcriber/output/fonts/georgia.ttf +0 -0
lyrics_transcriber/output/fonts/verdana.ttf +0 -0
lyrics_transcriber/output/generator.py +257 -0
lyrics_transcriber/output/lrc_to_cdg.py +61 -0
lyrics_transcriber/output/lyrics_file.py +102 -0
lyrics_transcriber/output/plain_text.py +96 -0
lyrics_transcriber/output/segment_resizer.py +431 -0
lyrics_transcriber/output/subtitles.py +397 -0
lyrics_transcriber/output/video.py +544 -0
lyrics_transcriber/review/__init__.py +0 -0
lyrics_transcriber/review/server.py +676 -0
lyrics_transcriber/storage/__init__.py +0 -0
lyrics_transcriber/storage/dropbox.py +225 -0
lyrics_transcriber/transcribers/__init__.py +0 -0
lyrics_transcriber/transcribers/audioshake.py +379 -0
lyrics_transcriber/transcribers/base_transcriber.py +157 -0
lyrics_transcriber/transcribers/whisper.py +330 -0
lyrics_transcriber/types.py +650 -0
lyrics_transcriber/utils/__init__.py +0 -0
lyrics_transcriber/utils/word_utils.py +27 -0

karaoke_gen/config.py ADDED Viewed

@@ -0,0 +1,83 @@
+"""
+Configuration utilities for karaoke generation.
+This module provides configuration loading and setup functions.
+Style loading is delegated to the unified style_loader module.
+"""
+import os
+import sys
+import logging
+# Import from the unified style loader module
+from .style_loader import (
+    # Re-export defaults for backwards compatibility
+    DEFAULT_STYLE_PARAMS,
+    DEFAULT_INTRO_STYLE as _DEFAULT_INTRO,
+    DEFAULT_END_STYLE as _DEFAULT_END,
+    # Functions
+    load_style_params_from_file,
+    apply_style_overrides,
+    get_intro_format as _get_intro_format,
+    get_end_format as _get_end_format,
+    get_video_durations,
+    get_existing_images,
+)
+def load_style_params(style_params_json, style_overrides, logger):
+    """
+    Build the style parameter dictionary used by the local CLI.
+    The base parameters come from load_style_params_from_file(), called with
+    exit_on_error=True; overrides, when given, are then applied on top with
+    apply_style_overrides().
+    Args:
+        style_params_json: Path to style JSON file, or None for defaults.
+        style_overrides: Dict of "section.key" -> value overrides; skipped when falsy.
+        logger: Logger handed to the style loader helpers.
+    Returns:
+        Dictionary of style parameters.
+    """
+    params = load_style_params_from_file(style_params_json, logger=logger, exit_on_error=True)
+    if not style_overrides:
+        return params
+    apply_style_overrides(params, style_overrides, logger)
+    return params
+def setup_title_format(style_params):
+    """
+    Return the title (intro) format dictionary for the given style parameters.
+    Retained for backwards compatibility; the work is delegated to
+    style_loader.get_intro_format().
+    """
+    intro_format = _get_intro_format(style_params)
+    return intro_format
+def setup_end_format(style_params):
+    """
+    Return the end-screen format dictionary for the given style parameters.
+    Retained for backwards compatibility; the work is delegated to
+    style_loader.get_end_format().
+    """
+    end_format = _get_end_format(style_params)
+    return end_format
+def setup_ffmpeg_command(log_level):
+    """Return the base ffmpeg command string for the given logging level."""
+    # A frozen (PyInstaller) build uses the ffmpeg.exe bundled under
+    # sys._MEIPASS; otherwise the plain "ffmpeg" command name is used.
+    if getattr(sys, "frozen", False):
+        ffmpeg_path = os.path.join(sys._MEIPASS, "ffmpeg.exe")
+    else:
+        ffmpeg_path = "ffmpeg"
+    # Only DEBUG logging gets ffmpeg's verbose output; everything else is silenced to fatal
+    ffmpeg_loglevel = "verbose" if log_level == logging.DEBUG else "fatal"
+    return f"{ffmpeg_path} -hide_banner -nostats -loglevel {ffmpeg_loglevel}"

karaoke_gen/file_handler.py ADDED Viewed

@@ -0,0 +1,387 @@
+import os
+import glob
+import logging
+import shutil
+import tempfile
+from .utils import sanitize_filename
+try:
+    import yt_dlp
+    YT_DLP_AVAILABLE = True
+except ImportError:
+    YT_DLP_AVAILABLE = False
+# File operations for karaoke generation: copying, downloading and converting input media
+class FileHandler:
+    def __init__(self, logger, ffmpeg_base_command, create_track_subfolders, dry_run):
+        """
+        Store the collaborators and flags used by the file operations.
+        Args:
+            logger: Logger used for all messages emitted by this handler.
+            ffmpeg_base_command: Command prefix placed in front of ffmpeg arguments.
+            create_track_subfolders: Whether setup_output_paths() nests output in a per-track folder.
+            dry_run: When true, convert_to_wav() skips running ffmpeg.
+        """
+        self.dry_run = dry_run
+        self.create_track_subfolders = create_track_subfolders
+        self.ffmpeg_base_command = ffmpeg_base_command
+        self.logger = logger
+    def _file_exists(self, file_path):
+        """Return True when file_path is an existing regular file, logging that creation is skipped."""
+        if not os.path.isfile(file_path):
+            return False
+        self.logger.info(f"File already exists, skipping creation: {file_path}")
+        return True
+    # Media acquisition: copy local files or download them from a URL
+    def copy_input_media(self, input_media, output_filename_no_extension):
+        """
+        Copy a local media file to the output name, keeping its extension.
+        Args:
+            input_media: Path to the source media file.
+            output_filename_no_extension: Destination path without extension.
+        Returns:
+            The destination path, or input_media unchanged when source and
+            destination resolve to the same absolute path.
+        """
+        self.logger.debug(f"Copying media from local path {input_media} to filename {output_filename_no_extension} + existing extension")
+        _, extension = os.path.splitext(input_media)
+        copied_file_name = output_filename_no_extension + extension
+        self.logger.debug(f"Target filename: {copied_file_name}")
+        same_file = os.path.abspath(input_media) == os.path.abspath(copied_file_name)
+        if same_file:
+            # Nothing to copy: the input already sits at the destination
+            self.logger.info("Source and destination are the same file, skipping copy")
+            return input_media
+        self.logger.debug(f"Copying {input_media} to {copied_file_name}")
+        shutil.copy2(input_media, copied_file_name)
+        return copied_file_name
+    def download_audio_from_fetcher_result(self, filepath, output_filename_no_extension):
+        """
+        Place an AudioFetcher download at the expected output location.
+        The file is copied so that it follows the output naming convention
+        while keeping the extension of the downloaded file.
+        Args:
+            filepath: Path to the downloaded audio file from AudioFetcher
+            output_filename_no_extension: Desired output filename without extension
+        Returns:
+            Path to the audio file at the target location, or None when
+            filepath is not an existing file
+        """
+        if os.path.isfile(filepath):
+            # Keep whatever extension the downloaded file has
+            extension = os.path.splitext(filepath)[1]
+            target_path = f"{output_filename_no_extension}{extension}"
+            already_in_place = os.path.abspath(filepath) == os.path.abspath(target_path)
+            if already_in_place:
+                self.logger.debug(f"Downloaded file already at target location: {target_path}")
+            else:
+                self.logger.debug(f"Copying downloaded file from {filepath} to {target_path}")
+                shutil.copy2(filepath, target_path)
+            return target_path
+        self.logger.error(f"Downloaded file not found: {filepath}")
+        return None
+    def download_video(self, url, output_filename_no_extension, cookies_str=None):
+        """
+        Download audio from a URL (YouTube, etc.) using yt-dlp.
+        Requests the best available audio, runs yt-dlp's FFmpegExtractAudio
+        post-processor, then locates the resulting file next to
+        output_filename_no_extension.
+        Args:
+            url: URL to download from (YouTube, Vimeo, etc.)
+            output_filename_no_extension: Output filename without extension
+            cookies_str: Optional cookies string for authenticated downloads;
+                it is written to a temporary file that is removed before returning
+        Returns:
+            Path to downloaded audio file, or None if failed
+        """
+        if not YT_DLP_AVAILABLE:
+            self.logger.error("yt-dlp is not installed. Install with: pip install yt-dlp")
+            return None
+        self.logger.info(f"Downloading audio from URL: {url}")
+        # Extensions the finished download is looked up under, in order of preference
+        audio_extensions = ('.m4a', '.opus', '.webm', '.mp3', '.flac', '.wav', '.ogg', '.aac')
+        # Configure yt-dlp options
+        ydl_opts = {
+            'format': 'bestaudio/best',
+            'outtmpl': output_filename_no_extension + '.%(ext)s',
+            'postprocessors': [{
+                'key': 'FFmpegExtractAudio',
+                'preferredcodec': 'best',
+                'preferredquality': '0',  # Best quality
+            }],
+            'quiet': True,
+            'no_warnings': True,
+            'extract_flat': False,
+            # Anti-detection options
+            'user_agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/120.0.0.0 Safari/537.36',
+            'retries': 3,
+            'fragment_retries': 3,
+            'http_headers': {
+                'Accept-Language': 'en-US,en;q=0.9',
+                'Accept': 'text/html,application/xhtml+xml,application/xml;q=0.9,*/*;q=0.8',
+            },
+        }
+        # Handle cookies if provided - use safe tempfile pattern to avoid leaks
+        cookie_file_path = None
+        if cookies_str:
+            try:
+                # delete=False keeps the file on disk after the with-block so yt-dlp can read it;
+                # it is removed in the finally clause below
+                with tempfile.NamedTemporaryFile(mode='w', suffix='.txt', delete=False) as cookie_file:
+                    cookie_file.write(cookies_str)
+                    cookie_file_path = cookie_file.name
+                ydl_opts['cookiefile'] = cookie_file_path
+            except Exception as e:
+                # Best effort: continue the download without cookies
+                self.logger.warning(f"Failed to write cookies file: {e}")
+                cookie_file_path = None
+        try:
+            with yt_dlp.YoutubeDL(ydl_opts) as ydl:
+                # Extract info and download in one call
+                info = ydl.extract_info(url, download=True)
+                if info is None:
+                    self.logger.error("Failed to extract info from URL")
+                    return None
+                # Find the downloaded file
+                # The actual filename might differ from template due to post-processing
+                downloaded_file = None
+                # Check the exact "<name><ext>" path for each known extension first
+                for ext in audio_extensions:
+                    candidate = f"{output_filename_no_extension}{ext}"
+                    if os.path.exists(candidate):
+                        downloaded_file = candidate
+                        break
+                if downloaded_file is None:
+                    # Fall back to any audio file sharing the prefix. The prefix is escaped
+                    # because names such as "Artist - Title [Live]" contain glob metacharacters
+                    # that would otherwise prevent the file from ever matching.
+                    pattern = glob.escape(output_filename_no_extension) + ".*"
+                    downloaded_file = next(
+                        (match for match in glob.glob(pattern) if match.endswith(audio_extensions)),
+                        None,
+                    )
+                if downloaded_file and os.path.exists(downloaded_file):
+                    self.logger.info(f"Successfully downloaded: {downloaded_file}")
+                    return downloaded_file
+                else:
+                    self.logger.error("Downloaded file not found after yt-dlp completed")
+                    return None
+        except yt_dlp.DownloadError as e:
+            self.logger.error(f"yt-dlp download error: {e}")
+            return None
+        except Exception as e:
+            self.logger.error(f"Failed to download from URL: {e}")
+            return None
+        finally:
+            # Clean up cookie file if we created one; a cleanup failure must not mask the result
+            if cookie_file_path is not None:
+                try:
+                    os.unlink(cookie_file_path)
+                except OSError as e:
+                    self.logger.debug(f"Could not remove temporary cookies file {cookie_file_path}: {e}")
+    def extract_metadata_from_url(self, url):
+        """
+        Look up artist/title metadata for a URL via yt-dlp, without downloading media.
+        When the video title contains " - " it is split on the first occurrence
+        into artist and title; otherwise (or when that artist part is empty) the
+        uploader, channel or artist field is used as the artist. The title is
+        then truncated at each known marker such as "(official video)".
+        Args:
+            url: URL to extract metadata from
+        Returns:
+            Dict with 'artist', 'title', 'duration', and 'raw_info', or None if failed
+        """
+        if not YT_DLP_AVAILABLE:
+            self.logger.error("yt-dlp is not installed. Install with: pip install yt-dlp")
+            return None
+        self.logger.info(f"Extracting metadata from URL: {url}")
+        # Markers are matched against the lower-cased title, in this order
+        title_markers = (
+            '(official video)', '(official music video)', '(official audio)',
+            '(lyric video)', '(lyrics)', '(visualizer)', '(music video)',
+            '[official video]', '[official music video]', '[official audio]',
+            '(hd)', '(4k)', '(remastered)', '| official video', '| official audio',
+        )
+        metadata_opts = {
+            'quiet': True,
+            'no_warnings': True,
+            'extract_flat': False,
+            'skip_download': True,
+        }
+        try:
+            with yt_dlp.YoutubeDL(metadata_opts) as ydl:
+                info = ydl.extract_info(url, download=False)
+                if info is None:
+                    self.logger.error("Failed to extract metadata from URL")
+                    return None
+                raw_title = info.get('title', '')
+                # First non-empty of uploader / channel / artist
+                uploader = (
+                    info.get('uploader', '')
+                    or info.get('channel', '')
+                    or info.get('artist', '')
+                )
+                duration = info.get('duration', 0)
+                # Attempt to parse "Artist - Title" format from title
+                artist, title = None, raw_title
+                if ' - ' in raw_title:
+                    head, _, tail = raw_title.partition(' - ')
+                    artist, title = head.strip(), tail.strip()
+                # Fall back to uploader as artist if not found in title
+                artist = artist if artist else uploader
+                # Cut the title at each marker that is still present
+                lowered = title.lower()
+                for marker in title_markers:
+                    position = lowered.find(marker)
+                    if position == -1:
+                        continue
+                    title = title[:position].strip()
+                    lowered = title.lower()
+                return {
+                    'artist': artist,
+                    'title': title,
+                    'duration': duration,
+                    'raw_info': info,
+                }
+        except Exception as e:
+            self.logger.error(f"Failed to extract metadata from URL: {e}")
+            return None
+    def extract_still_image_from_video(self, input_filename, output_filename_no_extension):
+        """
+        Grab a single frame at the 30 second mark of the input and save it as PNG.
+        Args:
+            input_filename: Path to the input media file.
+            output_filename_no_extension: Output path without the ".png" suffix.
+        Returns:
+            The PNG output path; the ffmpeg exit status is not checked.
+        """
+        still_image_path = output_filename_no_extension + ".png"
+        self.logger.info("Extracting still image from position 30s input media")
+        # -ss 00:00:30 seeks to 30 seconds, -vframes 1 writes exactly one frame
+        command = f'{self.ffmpeg_base_command} -i "{input_filename}" -ss 00:00:30 -vframes 1 "{still_image_path}"'
+        self.logger.debug(f"Running command: {command}")
+        os.system(command)
+        return still_image_path
+    def convert_to_wav(self, input_filename, output_filename_no_extension):
+        """
+        Convert input audio to WAV format, with input validation.
+        The input is validated (exists, non-empty, ffprobe reports an audio
+        stream) even in dry-run mode; only the ffmpeg conversion itself is
+        skipped when self.dry_run is set.
+        Args:
+            input_filename: Path to the source media file.
+            output_filename_no_extension: Output path without the ".wav" suffix.
+        Returns:
+            The output WAV path, whether or not ffmpeg was actually run.
+        Raises:
+            Exception: If the input file is missing, empty, or has no audio stream.
+        """
+        # Validate input file exists and is readable
+        if not os.path.isfile(input_filename):
+            raise Exception(f"Input audio file not found: {input_filename}")
+        if os.path.getsize(input_filename) == 0:
+            raise Exception(f"Input audio file is empty: {input_filename}")
+        # Validate input file format using ffprobe
+        probe_command = f'ffprobe -v error -show_entries stream=codec_type -of default=noprint_wrappers=1 "{input_filename}"'
+        # Read inside a with-block so the pipe is closed deterministically instead of being left to garbage collection
+        with os.popen(probe_command) as probe_pipe:
+            probe_output = probe_pipe.read()
+        if "codec_type=audio" not in probe_output:
+            raise Exception(f"No valid audio stream found in file: {input_filename}")
+        output_filename = output_filename_no_extension + ".wav"
+        self.logger.info("Converting input media to audio WAV file")
+        # -n makes ffmpeg refuse to overwrite an existing output file
+        ffmpeg_command = f'{self.ffmpeg_base_command} -n -i "{input_filename}" "{output_filename}"'
+        self.logger.debug(f"Running command: {ffmpeg_command}")
+        if not self.dry_run:
+            os.system(ffmpeg_command)
+        return output_filename
+    def setup_output_paths(self, output_dir, artist, title):
+        if title is None and artist is None:
+            raise ValueError("Error: At least title or artist must be provided")
+        # If only title is provided, use it for both artist and title portions of paths
+        if artist is None:
+            sanitized_title = sanitize_filename(title)
+            artist_title = sanitized_title
+        else:
+            sanitized_artist = sanitize_filename(artist)
+            sanitized_title = sanitize_filename(title)
+            artist_title = f"{sanitized_artist} - {sanitized_title}"
+        track_output_dir = output_dir
+        if self.create_track_subfolders:
+            track_output_dir = os.path.join(output_dir, f"{artist_title}")
+        if not os.path.exists(track_output_dir):
+            self.logger.debug(f"Output dir {track_output_dir} did not exist, creating")
+            os.makedirs(track_output_dir)
+        return track_output_dir, artist_title
+    def backup_existing_outputs(self, track_output_dir, artist, title):
+        """
+        Backup existing outputs to a versioned folder.
+        Args:
+            track_output_dir: The directory containing the track outputs
+            artist: The artist name
+            title: The track title
+        Returns:
+            The path to the original input audio file
+        """
+        self.logger.info(f"Backing up existing outputs for {artist} - {title}")
+        # Sanitize artist and title for filenames
+        sanitized_artist = sanitize_filename(artist)
+        sanitized_title = sanitize_filename(title)
+        base_name = f"{sanitized_artist} - {sanitized_title}"
+        # Find the next available version number
+        version_num = 1
+        while os.path.exists(os.path.join(track_output_dir, f"version-{version_num}")):
+            version_num += 1
+        version_dir = os.path.join(track_output_dir, f"version-{version_num}")
+        self.logger.info(f"Creating backup directory: {version_dir}")
+        os.makedirs(version_dir, exist_ok=True)
+        # Find the input audio file (we'll need this for re-running the transcription)
+        input_audio_wav = os.path.join(track_output_dir, f"{base_name}.wav")
+        if not os.path.exists(input_audio_wav):
+            self.logger.warning(f"Input audio file not found: {input_audio_wav}")
+            # Try to find any WAV file
+            wav_files = glob.glob(os.path.join(track_output_dir, "*.wav"))
+            if wav_files:
+                input_audio_wav = wav_files[0]
+                self.logger.info(f"Using alternative input audio file: {input_audio_wav}")
+            else:
+                raise Exception(f"No input audio file found in {track_output_dir}")
+        # List of file patterns to move
+        file_patterns = [
+            f"{base_name} (With Vocals).*",
+            f"{base_name} (Karaoke).*",
+            f"{base_name} (Final Karaoke*).*",
+        ]
+        # Move files matching patterns to version directory
+        for pattern in file_patterns:
+            for file_path in glob.glob(os.path.join(track_output_dir, pattern)):
+                if os.path.isfile(file_path):
+                    dest_path = os.path.join(version_dir, os.path.basename(file_path))
+                    self.logger.info(f"Moving {file_path} to {dest_path}")
+                    if not self.dry_run:
+                        shutil.move(file_path, dest_path)
+        # Also backup the lyrics directory
+        lyrics_dir = os.path.join(track_output_dir, "lyrics")
+        if os.path.exists(lyrics_dir):
+            lyrics_backup_dir = os.path.join(version_dir, "lyrics")
+            self.logger.info(f"Backing up lyrics directory to {lyrics_backup_dir}")
+            if not self.dry_run:
+                shutil.copytree(lyrics_dir, lyrics_backup_dir)
+                # Remove the original lyrics directory
+                shutil.rmtree(lyrics_dir)
+        return input_audio_wav

karaoke_gen/instrumental_review/__init__.py ADDED Viewed

@@ -0,0 +1,45 @@
+"""
+Instrumental Review Module - Shared core for both local and remote CLI.
+This module provides audio analysis and editing functionality for instrumental
+selection in karaoke generation. It's designed to be:
+- Pure Python with no cloud dependencies (GCS, etc.)
+- Reusable by both local CLI (karaoke-gen) and remote backend (Cloud Run)
+- Easy to test without mocking cloud services
+Classes:
+    AudioAnalyzer: Analyzes backing vocals audio for audible content
+    AudioEditor: Creates custom instrumentals by muting regions
+    WaveformGenerator: Generates waveform visualization images
+    InstrumentalReviewServer: Local HTTP server for browser-based review
+Models:
+    AnalysisResult: Result of audio analysis
+    AudibleSegment: A detected segment of audible content
+    MuteRegion: A region to mute in the backing vocals
+    RecommendedSelection: Enum of selection recommendations
+"""
+from .models import (
+    AnalysisResult,
+    AudibleSegment,
+    MuteRegion,
+    RecommendedSelection,
+)
+from .analyzer import AudioAnalyzer
+from .editor import AudioEditor
+from .waveform import WaveformGenerator
+from .server import InstrumentalReviewServer
+# Public API of the instrumental_review package: exactly the names imported above.
+__all__ = [
+    # Models (imported from .models)
+    "AnalysisResult",
+    "AudibleSegment",
+    "MuteRegion",
+    "RecommendedSelection",
+    # Classes (imported from .analyzer, .editor, .waveform and .server)
+    "AudioAnalyzer",
+    "AudioEditor",
+    "WaveformGenerator",
+    "InstrumentalReviewServer",
+]