PyPI - karaoke-gen - Versions diffs - 0.57.0__py3-none-any.whl → 0.71.27__py3-none-any.whl - Mend

karaoke-gen 0.57.0-py3-none-any.whl → 0.71.27-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (268) hide show

karaoke_gen/audio_fetcher.py +461 -0
karaoke_gen/audio_processor.py +407 -30
karaoke_gen/config.py +62 -113
karaoke_gen/file_handler.py +32 -59
karaoke_gen/karaoke_finalise/karaoke_finalise.py +148 -67
karaoke_gen/karaoke_gen.py +270 -61
karaoke_gen/lyrics_processor.py +13 -1
karaoke_gen/metadata.py +78 -73
karaoke_gen/pipeline/__init__.py +87 -0
karaoke_gen/pipeline/base.py +215 -0
karaoke_gen/pipeline/context.py +230 -0
karaoke_gen/pipeline/executors/__init__.py +21 -0
karaoke_gen/pipeline/executors/local.py +159 -0
karaoke_gen/pipeline/executors/remote.py +257 -0
karaoke_gen/pipeline/stages/__init__.py +27 -0
karaoke_gen/pipeline/stages/finalize.py +202 -0
karaoke_gen/pipeline/stages/render.py +165 -0
karaoke_gen/pipeline/stages/screens.py +139 -0
karaoke_gen/pipeline/stages/separation.py +191 -0
karaoke_gen/pipeline/stages/transcription.py +191 -0
karaoke_gen/style_loader.py +531 -0
karaoke_gen/utils/bulk_cli.py +6 -0
karaoke_gen/utils/cli_args.py +424 -0
karaoke_gen/utils/gen_cli.py +26 -261
karaoke_gen/utils/remote_cli.py +1965 -0
karaoke_gen/video_background_processor.py +351 -0
karaoke_gen-0.71.27.dist-info/METADATA +610 -0
karaoke_gen-0.71.27.dist-info/RECORD +275 -0
{karaoke_gen-0.57.0.dist-info → karaoke_gen-0.71.27.dist-info}/WHEEL +1 -1
{karaoke_gen-0.57.0.dist-info → karaoke_gen-0.71.27.dist-info}/entry_points.txt +1 -0
lyrics_transcriber/__init__.py +10 -0
lyrics_transcriber/cli/__init__.py +0 -0
lyrics_transcriber/cli/cli_main.py +285 -0
lyrics_transcriber/core/__init__.py +0 -0
lyrics_transcriber/core/config.py +50 -0
lyrics_transcriber/core/controller.py +520 -0
lyrics_transcriber/correction/__init__.py +0 -0
lyrics_transcriber/correction/agentic/__init__.py +9 -0
lyrics_transcriber/correction/agentic/adapter.py +71 -0
lyrics_transcriber/correction/agentic/agent.py +313 -0
lyrics_transcriber/correction/agentic/feedback/aggregator.py +12 -0
lyrics_transcriber/correction/agentic/feedback/collector.py +17 -0
lyrics_transcriber/correction/agentic/feedback/retention.py +24 -0
lyrics_transcriber/correction/agentic/feedback/store.py +76 -0
lyrics_transcriber/correction/agentic/handlers/__init__.py +24 -0
lyrics_transcriber/correction/agentic/handlers/ambiguous.py +44 -0
lyrics_transcriber/correction/agentic/handlers/background_vocals.py +68 -0
lyrics_transcriber/correction/agentic/handlers/base.py +51 -0
lyrics_transcriber/correction/agentic/handlers/complex_multi_error.py +46 -0
lyrics_transcriber/correction/agentic/handlers/extra_words.py +74 -0
lyrics_transcriber/correction/agentic/handlers/no_error.py +42 -0
lyrics_transcriber/correction/agentic/handlers/punctuation.py +44 -0
lyrics_transcriber/correction/agentic/handlers/registry.py +60 -0
lyrics_transcriber/correction/agentic/handlers/repeated_section.py +44 -0
lyrics_transcriber/correction/agentic/handlers/sound_alike.py +126 -0
lyrics_transcriber/correction/agentic/models/__init__.py +5 -0
lyrics_transcriber/correction/agentic/models/ai_correction.py +31 -0
lyrics_transcriber/correction/agentic/models/correction_session.py +30 -0
lyrics_transcriber/correction/agentic/models/enums.py +38 -0
lyrics_transcriber/correction/agentic/models/human_feedback.py +30 -0
lyrics_transcriber/correction/agentic/models/learning_data.py +26 -0
lyrics_transcriber/correction/agentic/models/observability_metrics.py +28 -0
lyrics_transcriber/correction/agentic/models/schemas.py +46 -0
lyrics_transcriber/correction/agentic/models/utils.py +19 -0
lyrics_transcriber/correction/agentic/observability/__init__.py +5 -0
lyrics_transcriber/correction/agentic/observability/langfuse_integration.py +35 -0
lyrics_transcriber/correction/agentic/observability/metrics.py +46 -0
lyrics_transcriber/correction/agentic/observability/performance.py +19 -0
lyrics_transcriber/correction/agentic/prompts/__init__.py +2 -0
lyrics_transcriber/correction/agentic/prompts/classifier.py +227 -0
lyrics_transcriber/correction/agentic/providers/__init__.py +6 -0
lyrics_transcriber/correction/agentic/providers/base.py +36 -0
lyrics_transcriber/correction/agentic/providers/circuit_breaker.py +145 -0
lyrics_transcriber/correction/agentic/providers/config.py +73 -0
lyrics_transcriber/correction/agentic/providers/constants.py +24 -0
lyrics_transcriber/correction/agentic/providers/health.py +28 -0
lyrics_transcriber/correction/agentic/providers/langchain_bridge.py +212 -0
lyrics_transcriber/correction/agentic/providers/model_factory.py +209 -0
lyrics_transcriber/correction/agentic/providers/response_cache.py +218 -0
lyrics_transcriber/correction/agentic/providers/response_parser.py +111 -0
lyrics_transcriber/correction/agentic/providers/retry_executor.py +127 -0
lyrics_transcriber/correction/agentic/router.py +35 -0
lyrics_transcriber/correction/agentic/workflows/__init__.py +5 -0
lyrics_transcriber/correction/agentic/workflows/consensus_workflow.py +24 -0
lyrics_transcriber/correction/agentic/workflows/correction_graph.py +59 -0
lyrics_transcriber/correction/agentic/workflows/feedback_workflow.py +24 -0
lyrics_transcriber/correction/anchor_sequence.py +1043 -0
lyrics_transcriber/correction/corrector.py +760 -0
lyrics_transcriber/correction/feedback/__init__.py +2 -0
lyrics_transcriber/correction/feedback/schemas.py +107 -0
lyrics_transcriber/correction/feedback/store.py +236 -0
lyrics_transcriber/correction/handlers/__init__.py +0 -0
lyrics_transcriber/correction/handlers/base.py +52 -0
lyrics_transcriber/correction/handlers/extend_anchor.py +149 -0
lyrics_transcriber/correction/handlers/levenshtein.py +189 -0
lyrics_transcriber/correction/handlers/llm.py +293 -0
lyrics_transcriber/correction/handlers/llm_providers.py +60 -0
lyrics_transcriber/correction/handlers/no_space_punct_match.py +154 -0
lyrics_transcriber/correction/handlers/relaxed_word_count_match.py +85 -0
lyrics_transcriber/correction/handlers/repeat.py +88 -0
lyrics_transcriber/correction/handlers/sound_alike.py +259 -0
lyrics_transcriber/correction/handlers/syllables_match.py +252 -0
lyrics_transcriber/correction/handlers/word_count_match.py +80 -0
lyrics_transcriber/correction/handlers/word_operations.py +187 -0
lyrics_transcriber/correction/operations.py +352 -0
lyrics_transcriber/correction/phrase_analyzer.py +435 -0
lyrics_transcriber/correction/text_utils.py +30 -0
lyrics_transcriber/frontend/.gitignore +23 -0
lyrics_transcriber/frontend/.yarn/releases/yarn-4.7.0.cjs +935 -0
lyrics_transcriber/frontend/.yarnrc.yml +3 -0
lyrics_transcriber/frontend/README.md +50 -0
lyrics_transcriber/frontend/REPLACE_ALL_FUNCTIONALITY.md +210 -0
lyrics_transcriber/frontend/__init__.py +25 -0
lyrics_transcriber/frontend/eslint.config.js +28 -0
lyrics_transcriber/frontend/index.html +18 -0
lyrics_transcriber/frontend/package.json +42 -0
lyrics_transcriber/frontend/public/android-chrome-192x192.png +0 -0
lyrics_transcriber/frontend/public/android-chrome-512x512.png +0 -0
lyrics_transcriber/frontend/public/apple-touch-icon.png +0 -0
lyrics_transcriber/frontend/public/favicon-16x16.png +0 -0
lyrics_transcriber/frontend/public/favicon-32x32.png +0 -0
lyrics_transcriber/frontend/public/favicon.ico +0 -0
lyrics_transcriber/frontend/public/nomad-karaoke-logo.png +0 -0
lyrics_transcriber/frontend/src/App.tsx +212 -0
lyrics_transcriber/frontend/src/api.ts +239 -0
lyrics_transcriber/frontend/src/components/AIFeedbackModal.tsx +77 -0
lyrics_transcriber/frontend/src/components/AddLyricsModal.tsx +114 -0
lyrics_transcriber/frontend/src/components/AgenticCorrectionMetrics.tsx +204 -0
lyrics_transcriber/frontend/src/components/AudioPlayer.tsx +180 -0
lyrics_transcriber/frontend/src/components/CorrectedWordWithActions.tsx +167 -0
lyrics_transcriber/frontend/src/components/CorrectionAnnotationModal.tsx +359 -0
lyrics_transcriber/frontend/src/components/CorrectionDetailCard.tsx +281 -0
lyrics_transcriber/frontend/src/components/CorrectionMetrics.tsx +162 -0
lyrics_transcriber/frontend/src/components/DurationTimelineView.tsx +257 -0
lyrics_transcriber/frontend/src/components/EditActionBar.tsx +68 -0
lyrics_transcriber/frontend/src/components/EditModal.tsx +702 -0
lyrics_transcriber/frontend/src/components/EditTimelineSection.tsx +496 -0
lyrics_transcriber/frontend/src/components/EditWordList.tsx +379 -0
lyrics_transcriber/frontend/src/components/FileUpload.tsx +77 -0
lyrics_transcriber/frontend/src/components/FindReplaceModal.tsx +467 -0
lyrics_transcriber/frontend/src/components/Header.tsx +387 -0
lyrics_transcriber/frontend/src/components/LyricsAnalyzer.tsx +1373 -0
lyrics_transcriber/frontend/src/components/MetricsDashboard.tsx +51 -0
lyrics_transcriber/frontend/src/components/ModeSelector.tsx +67 -0
lyrics_transcriber/frontend/src/components/ModelSelector.tsx +23 -0
lyrics_transcriber/frontend/src/components/PreviewVideoSection.tsx +144 -0
lyrics_transcriber/frontend/src/components/ReferenceView.tsx +268 -0
lyrics_transcriber/frontend/src/components/ReplaceAllLyricsModal.tsx +688 -0
lyrics_transcriber/frontend/src/components/ReviewChangesModal.tsx +354 -0
lyrics_transcriber/frontend/src/components/SegmentDetailsModal.tsx +64 -0
lyrics_transcriber/frontend/src/components/TimelineEditor.tsx +376 -0
lyrics_transcriber/frontend/src/components/TimingOffsetModal.tsx +131 -0
lyrics_transcriber/frontend/src/components/TranscriptionView.tsx +256 -0
lyrics_transcriber/frontend/src/components/WordDivider.tsx +187 -0
lyrics_transcriber/frontend/src/components/shared/components/HighlightedText.tsx +379 -0
lyrics_transcriber/frontend/src/components/shared/components/SourceSelector.tsx +56 -0
lyrics_transcriber/frontend/src/components/shared/components/Word.tsx +87 -0
lyrics_transcriber/frontend/src/components/shared/constants.ts +20 -0
lyrics_transcriber/frontend/src/components/shared/hooks/useWordClick.ts +180 -0
lyrics_transcriber/frontend/src/components/shared/styles.ts +13 -0
lyrics_transcriber/frontend/src/components/shared/types.js +2 -0
lyrics_transcriber/frontend/src/components/shared/types.ts +129 -0
lyrics_transcriber/frontend/src/components/shared/utils/keyboardHandlers.ts +177 -0
lyrics_transcriber/frontend/src/components/shared/utils/localStorage.ts +78 -0
lyrics_transcriber/frontend/src/components/shared/utils/referenceLineCalculator.ts +75 -0
lyrics_transcriber/frontend/src/components/shared/utils/segmentOperations.ts +360 -0
lyrics_transcriber/frontend/src/components/shared/utils/timingUtils.ts +110 -0
lyrics_transcriber/frontend/src/components/shared/utils/wordUtils.ts +22 -0
lyrics_transcriber/frontend/src/hooks/useManualSync.ts +435 -0
lyrics_transcriber/frontend/src/main.tsx +17 -0
lyrics_transcriber/frontend/src/theme.ts +177 -0
lyrics_transcriber/frontend/src/types/global.d.ts +9 -0
lyrics_transcriber/frontend/src/types.js +2 -0
lyrics_transcriber/frontend/src/types.ts +199 -0
lyrics_transcriber/frontend/src/validation.ts +132 -0
lyrics_transcriber/frontend/src/vite-env.d.ts +1 -0
lyrics_transcriber/frontend/tsconfig.app.json +26 -0
lyrics_transcriber/frontend/tsconfig.json +25 -0
lyrics_transcriber/frontend/tsconfig.node.json +23 -0
lyrics_transcriber/frontend/tsconfig.tsbuildinfo +1 -0
lyrics_transcriber/frontend/update_version.js +11 -0
lyrics_transcriber/frontend/vite.config.d.ts +2 -0
lyrics_transcriber/frontend/vite.config.js +10 -0
lyrics_transcriber/frontend/vite.config.ts +11 -0
lyrics_transcriber/frontend/web_assets/android-chrome-192x192.png +0 -0
lyrics_transcriber/frontend/web_assets/android-chrome-512x512.png +0 -0
lyrics_transcriber/frontend/web_assets/apple-touch-icon.png +0 -0
lyrics_transcriber/frontend/web_assets/assets/index-DdJTDWH3.js +42039 -0
lyrics_transcriber/frontend/web_assets/assets/index-DdJTDWH3.js.map +1 -0
lyrics_transcriber/frontend/web_assets/favicon-16x16.png +0 -0
lyrics_transcriber/frontend/web_assets/favicon-32x32.png +0 -0
lyrics_transcriber/frontend/web_assets/favicon.ico +0 -0
lyrics_transcriber/frontend/web_assets/index.html +18 -0
lyrics_transcriber/frontend/web_assets/nomad-karaoke-logo.png +0 -0
lyrics_transcriber/frontend/yarn.lock +3752 -0
lyrics_transcriber/lyrics/__init__.py +0 -0
lyrics_transcriber/lyrics/base_lyrics_provider.py +211 -0
lyrics_transcriber/lyrics/file_provider.py +95 -0
lyrics_transcriber/lyrics/genius.py +384 -0
lyrics_transcriber/lyrics/lrclib.py +231 -0
lyrics_transcriber/lyrics/musixmatch.py +156 -0
lyrics_transcriber/lyrics/spotify.py +290 -0
lyrics_transcriber/lyrics/user_input_provider.py +44 -0
lyrics_transcriber/output/__init__.py +0 -0
lyrics_transcriber/output/ass/__init__.py +21 -0
lyrics_transcriber/output/ass/ass.py +2088 -0
lyrics_transcriber/output/ass/ass_specs.txt +732 -0
lyrics_transcriber/output/ass/config.py +180 -0
lyrics_transcriber/output/ass/constants.py +23 -0
lyrics_transcriber/output/ass/event.py +94 -0
lyrics_transcriber/output/ass/formatters.py +132 -0
lyrics_transcriber/output/ass/lyrics_line.py +265 -0
lyrics_transcriber/output/ass/lyrics_screen.py +252 -0
lyrics_transcriber/output/ass/section_detector.py +89 -0
lyrics_transcriber/output/ass/section_screen.py +106 -0
lyrics_transcriber/output/ass/style.py +187 -0
lyrics_transcriber/output/cdg.py +619 -0
lyrics_transcriber/output/cdgmaker/__init__.py +0 -0
lyrics_transcriber/output/cdgmaker/cdg.py +262 -0
lyrics_transcriber/output/cdgmaker/composer.py +2260 -0
lyrics_transcriber/output/cdgmaker/config.py +151 -0
lyrics_transcriber/output/cdgmaker/images/instrumental.png +0 -0
lyrics_transcriber/output/cdgmaker/images/intro.png +0 -0
lyrics_transcriber/output/cdgmaker/pack.py +507 -0
lyrics_transcriber/output/cdgmaker/render.py +346 -0
lyrics_transcriber/output/cdgmaker/transitions/centertexttoplogobottomtext.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/circlein.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/circleout.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/fizzle.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/largecentertexttoplogo.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/rectangle.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/spiral.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/topleftmusicalnotes.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/wipein.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/wipeleft.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/wipeout.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/wiperight.png +0 -0
lyrics_transcriber/output/cdgmaker/utils.py +132 -0
lyrics_transcriber/output/countdown_processor.py +267 -0
lyrics_transcriber/output/fonts/AvenirNext-Bold.ttf +0 -0
lyrics_transcriber/output/fonts/DMSans-VariableFont_opsz,wght.ttf +0 -0
lyrics_transcriber/output/fonts/DMSerifDisplay-Regular.ttf +0 -0
lyrics_transcriber/output/fonts/Oswald-SemiBold.ttf +0 -0
lyrics_transcriber/output/fonts/Zurich_Cn_BT_Bold.ttf +0 -0
lyrics_transcriber/output/fonts/arial.ttf +0 -0
lyrics_transcriber/output/fonts/georgia.ttf +0 -0
lyrics_transcriber/output/fonts/verdana.ttf +0 -0
lyrics_transcriber/output/generator.py +257 -0
lyrics_transcriber/output/lrc_to_cdg.py +61 -0
lyrics_transcriber/output/lyrics_file.py +102 -0
lyrics_transcriber/output/plain_text.py +96 -0
lyrics_transcriber/output/segment_resizer.py +431 -0
lyrics_transcriber/output/subtitles.py +397 -0
lyrics_transcriber/output/video.py +544 -0
lyrics_transcriber/review/__init__.py +0 -0
lyrics_transcriber/review/server.py +676 -0
lyrics_transcriber/storage/__init__.py +0 -0
lyrics_transcriber/storage/dropbox.py +225 -0
lyrics_transcriber/transcribers/__init__.py +0 -0
lyrics_transcriber/transcribers/audioshake.py +290 -0
lyrics_transcriber/transcribers/base_transcriber.py +157 -0
lyrics_transcriber/transcribers/whisper.py +330 -0
lyrics_transcriber/types.py +648 -0
lyrics_transcriber/utils/__init__.py +0 -0
lyrics_transcriber/utils/word_utils.py +27 -0
karaoke_gen-0.57.0.dist-info/METADATA +0 -167
karaoke_gen-0.57.0.dist-info/RECORD +0 -23
{karaoke_gen-0.57.0.dist-info → karaoke_gen-0.71.27.dist-info/licenses}/LICENSE +0 -0

lyrics_transcriber/output/cdg.py ADDED Viewed

@@ -0,0 +1,619 @@
+import logging
+from typing import List, Optional, Tuple
+import logging
+import re
+import toml
+from pathlib import Path
+from PIL import ImageFont
+import os
+import zipfile
+import shutil
+from lyrics_transcriber.output.cdgmaker.cdg import CDG_VISIBLE_WIDTH
+from lyrics_transcriber.output.cdgmaker.composer import KaraokeComposer
+from lyrics_transcriber.output.cdgmaker.render import get_wrapped_text
+from lyrics_transcriber.types import LyricsSegment
+class CDGGenerator:
+    """Generates CD+G (CD Graphics) format karaoke files."""
+    def __init__(self, output_dir: str, logger: Optional[logging.Logger] = None):
+        """Initialize CDGGenerator.
+        Args:
+            output_dir: Directory where output files will be written
+            logger: Optional logger instance
+        """
+        self.output_dir = output_dir
+        self.logger = logger or logging.getLogger(__name__)
+        self.cdg_visible_width = 280
+    def _sanitize_filename(self, filename: str) -> str:
+        """Replace or remove characters that are unsafe for filenames."""
+        if not filename:
+            return ""
+        # Replace problematic characters with underscores
+        for char in ["\\", "/", ":", "*", "?", '"', "<", ">", "|"]:
+            filename = filename.replace(char, "_")
+        # Remove any trailing spaces
+        filename = filename.rstrip(" ")
+        return filename
+    def _get_safe_filename(self, artist: str, title: str, suffix: str = "", ext: str = "") -> str:
+        """Create a safe filename from artist and title."""
+        safe_artist = self._sanitize_filename(artist)
+        safe_title = self._sanitize_filename(title)
+        base = f"{safe_artist} - {safe_title}"
+        if suffix:
+            base += f" ({suffix})"
+        if ext:
+            base += f".{ext}"
+        return base
+    def generate_cdg(
+        self,
+        segments: List[LyricsSegment],
+        audio_file: str,
+        title: str,
+        artist: str,
+        cdg_styles: dict,
+    ) -> Tuple[str, str, str]:
+        """Generate a CDG file from lyrics segments and audio file.
+        Args:
+            segments: List of LyricsSegment objects containing timing and text
+            audio_file: Path to the audio file
+            title: Title of the song
+            artist: Artist name
+            cdg_styles: Dictionary containing CDG style parameters
+        Returns:
+            Tuple containing paths to (cdg_file, mp3_file, zip_file)
+        """
+        self._validate_and_setup_font(cdg_styles)
+        # Convert segments to the format expected by the rest of the code
+        lyrics_data = self._convert_segments_to_lyrics_data(segments)
+        toml_file = self._create_toml_file(
+            audio_file=audio_file,
+            title=title,
+            artist=artist,
+            lyrics_data=lyrics_data,
+            cdg_styles=cdg_styles,
+        )
+        try:
+            self._compose_cdg(toml_file)
+            output_zip = self._find_cdg_zip(artist, title)
+            self._extract_cdg_files(output_zip)
+            cdg_file = self._get_cdg_path(artist, title)
+            mp3_file = self._get_mp3_path(artist, title)
+            self._verify_output_files(cdg_file, mp3_file)
+            self.logger.info("CDG file generated successfully")
+            return cdg_file, mp3_file, output_zip
+        except Exception as e:
+            self.logger.error(f"Error composing CDG: {e}")
+            raise
+    def _convert_segments_to_lyrics_data(self, segments: List[LyricsSegment]) -> List[dict]:
+        """Convert LyricsSegment objects to the format needed for CDG generation."""
+        lyrics_data = []
+        for segment in segments:
+            # Convert each word to a lyric entry
+            for word in segment.words:
+                # Convert time from seconds to centiseconds
+                timestamp = int(word.start_time * 100)
+                lyrics_data.append({"timestamp": timestamp, "text": word.text.upper()})  # CDG format expects uppercase text
+                self.logger.debug(f"Added lyric: timestamp {timestamp}, text '{word.text}'")
+        # Sort by timestamp to ensure correct order
+        lyrics_data.sort(key=lambda x: x["timestamp"])
+        return lyrics_data
+    def _create_toml_file(
+        self,
+        audio_file: str,
+        title: str,
+        artist: str,
+        lyrics_data: List[dict],
+        cdg_styles: dict,
+    ) -> str:
+        """Create TOML configuration file for CDG generation."""
+        safe_filename = self._get_safe_filename(artist, title, "Karaoke", "toml")
+        toml_file = os.path.join(self.output_dir, safe_filename)
+        self.logger.debug(f"Generating TOML file: {toml_file}")
+        self.generate_toml(
+            audio_file=audio_file,
+            title=title,
+            artist=artist,
+            lyrics_data=lyrics_data,
+            output_file=toml_file,
+            cdg_styles=cdg_styles,
+        )
+        return toml_file
+    def generate_toml(
+        self,
+        audio_file: str,
+        title: str,
+        artist: str,
+        lyrics_data: List[dict],
+        output_file: str,
+        cdg_styles: dict,
+    ) -> None:
+        """Generate a TOML configuration file for CDG creation."""
+        audio_file = os.path.abspath(audio_file)
+        self.logger.debug(f"Using absolute audio file path: {audio_file}")
+        self._validate_cdg_styles(cdg_styles)
+        instrumentals = self._detect_instrumentals(lyrics_data, cdg_styles)
+        sync_times, formatted_lyrics = self._format_lyrics_data(lyrics_data, instrumentals, cdg_styles)
+        toml_data = self._create_toml_data(
+            title=title,
+            artist=artist,
+            audio_file=audio_file,
+            output_name=f"{artist} - {title} (Karaoke)",
+            sync_times=sync_times,
+            instrumentals=instrumentals,
+            formatted_lyrics=formatted_lyrics,
+            cdg_styles=cdg_styles,
+        )
+        self._write_toml_file(toml_data, output_file)
+    def _validate_and_setup_font(self, cdg_styles: dict) -> None:
+        """Validate and set up font path in CDG styles."""
+        if not cdg_styles.get("font_path"):
+            return
+        if not os.path.isabs(cdg_styles["font_path"]) and not os.path.exists(cdg_styles["font_path"]):
+            package_font_path = os.path.join(os.path.dirname(__file__), "fonts", cdg_styles["font_path"])
+            if os.path.exists(package_font_path):
+                cdg_styles["font_path"] = package_font_path
+                self.logger.debug(f"Found font in package fonts directory: {cdg_styles['font_path']}")
+            else:
+                self.logger.warning(
+                    f"Font file {cdg_styles['font_path']} not found in package fonts directory {package_font_path}, will use default font"
+                )
+                cdg_styles["font_path"] = None
+    def _compose_cdg(self, toml_file: str) -> None:
+        """Compose CDG using KaraokeComposer."""
+        kc = KaraokeComposer.from_file(toml_file, logger=self.logger)
+        kc.compose()
+        # kc.create_mp4(height=1080, fps=30)
+    def _find_cdg_zip(self, artist: str, title: str) -> str:
+        """Find the generated CDG ZIP file."""
+        safe_filename = self._get_safe_filename(artist, title, "Karaoke", "zip")
+        output_zip = os.path.join(self.output_dir, safe_filename)
+        self.logger.info(f"Looking for CDG ZIP file in output directory: {output_zip}")
+        if os.path.isfile(output_zip):
+            self.logger.info(f"Found CDG ZIP file: {output_zip}")
+            return output_zip
+        self.logger.error("Failed to find CDG ZIP file. Output directory contents:")
+        for file in os.listdir(self.output_dir):
+            self.logger.error(f" - {file}")
+        raise FileNotFoundError(f"CDG ZIP file not found: {output_zip}")
+    def _extract_cdg_files(self, zip_path: str) -> None:
+        """Extract files from the CDG ZIP."""
+        self.logger.info(f"Extracting CDG ZIP file: {zip_path}")
+        with zipfile.ZipFile(zip_path, "r") as zip_ref:
+            zip_ref.extractall(self.output_dir)
+    def _get_cdg_path(self, artist: str, title: str) -> str:
+        """Get the path to the CDG file."""
+        safe_filename = self._get_safe_filename(artist, title, "Karaoke", "cdg")
+        return os.path.join(self.output_dir, safe_filename)
+    def _get_mp3_path(self, artist: str, title: str) -> str:
+        """Get the path to the MP3 file."""
+        safe_filename = self._get_safe_filename(artist, title, "Karaoke", "mp3")
+        return os.path.join(self.output_dir, safe_filename)
+    def _verify_output_files(self, cdg_file: str, mp3_file: str) -> None:
+        """Verify that the required output files exist."""
+        if not os.path.isfile(cdg_file):
+            raise FileNotFoundError(f"CDG file not found after extraction: {cdg_file}")
+        if not os.path.isfile(mp3_file):
+            raise FileNotFoundError(f"MP3 file not found after extraction: {mp3_file}")
+    def detect_instrumentals(
+        self,
+        lyrics_data,
+        line_tile_height,
+        instrumental_font_color,
+        instrumental_background,
+        instrumental_transition,
+        instrumental_gap_threshold,
+        instrumental_text,
+    ):
+        instrumentals = []
+        for i in range(len(lyrics_data) - 1):
+            current_end = lyrics_data[i]["timestamp"]
+            next_start = lyrics_data[i + 1]["timestamp"]
+            gap = next_start - current_end
+            if gap >= instrumental_gap_threshold:
+                instrumental_start = current_end + 200  # Add 2 seconds (200 centiseconds) delay
+                instrumental_duration = (gap - 200) // 100  # Convert to seconds
+                instrumentals.append(
+                    {
+                        "sync": instrumental_start,
+                        "wait": True,
+                        "text": f"{instrumental_text}\n{instrumental_duration} seconds\n",
+                        "text_align": "center",
+                        "text_placement": "bottom middle",
+                        "line_tile_height": line_tile_height,
+                        "fill": instrumental_font_color,
+                        "stroke": "",
+                        "image": instrumental_background,
+                        "transition": instrumental_transition,
+                    }
+                )
+                self.logger.info(
+                    f"Detected instrumental: Gap of {gap} cs, starting at {instrumental_start} cs, duration {instrumental_duration} seconds"
+                )
+        self.logger.info(f"Total instrumentals detected: {len(instrumentals)}")
+        return instrumentals
+    def _validate_cdg_styles(self, cdg_styles: dict) -> None:
+        """Validate required style parameters are present."""
+        required_styles = {
+            "title_color",
+            "artist_color",
+            "background_color",
+            "border_color",
+            "font_path",
+            "font_size",
+            "stroke_width",
+            "stroke_style",
+            "active_fill",
+            "active_stroke",
+            "inactive_fill",
+            "inactive_stroke",
+            "title_screen_background",
+            "instrumental_background",
+            "instrumental_transition",
+            "instrumental_font_color",
+            "title_screen_transition",
+            "row",
+            "line_tile_height",
+            "lines_per_page",
+            "clear_mode",
+            "sync_offset",
+            "instrumental_gap_threshold",
+            "instrumental_text",
+            "lead_in_threshold",
+            "lead_in_symbols",
+            "lead_in_duration",
+            "lead_in_total",
+            "title_artist_gap",
+            "title_top_padding",
+            "intro_duration_seconds",
+            "first_syllable_buffer_seconds",
+            "outro_background",
+            "outro_transition",
+            "outro_text_line1",
+            "outro_text_line2",
+            "outro_line1_color",
+            "outro_line2_color",
+            "outro_line1_line2_gap",
+        }
+        optional_styles_with_defaults = {
+            "title_top_padding": 0,
+            # Any other optional parameters with their default values
+        }
+        # Add any missing optional parameters with their default values
+        for key, default_value in optional_styles_with_defaults.items():
+            if key not in cdg_styles:
+                cdg_styles[key] = default_value
+        missing_styles = required_styles - set(cdg_styles.keys())
+        if missing_styles:
+            raise ValueError(f"Missing required style parameters: {', '.join(missing_styles)}")
+    def _detect_instrumentals(self, lyrics_data: List[dict], cdg_styles: dict) -> List[dict]:
+        """Detect instrumental sections in lyrics."""
+        return self.detect_instrumentals(
+            lyrics_data=lyrics_data,
+            line_tile_height=cdg_styles["line_tile_height"],
+            instrumental_font_color=cdg_styles["instrumental_font_color"],
+            instrumental_background=cdg_styles["instrumental_background"],
+            instrumental_transition=cdg_styles["instrumental_transition"],
+            instrumental_gap_threshold=cdg_styles["instrumental_gap_threshold"],
+            instrumental_text=cdg_styles["instrumental_text"],
+        )
+    def _format_lyrics_data(self, lyrics_data: List[dict], instrumentals: List[dict], cdg_styles: dict) -> tuple[List[int], List[str]]:
+        """Format lyrics data with lead-in symbols and handle line wrapping.
+        Returns:
+            tuple: (sync_times, formatted_lyrics) where sync_times includes lead-in timings
+        """
+        sync_times = []
+        formatted_lyrics = []
+        for i, lyric in enumerate(lyrics_data):
+            self.logger.debug(f"Processing lyric {i}: timestamp {lyric['timestamp']}, text '{lyric['text']}'")
+            if i == 0 or lyric["timestamp"] - lyrics_data[i - 1]["timestamp"] >= cdg_styles["lead_in_threshold"]:
+                lead_in_start = lyric["timestamp"] - cdg_styles["lead_in_total"]
+                self.logger.debug(f"Adding lead-in before lyric {i} at timestamp {lead_in_start}")
+                for j, symbol in enumerate(cdg_styles["lead_in_symbols"]):
+                    sync_time = lead_in_start + j * cdg_styles["lead_in_duration"]
+                    sync_times.append(sync_time)
+                    formatted_lyrics.append(symbol)
+                    self.logger.debug(f"  Added lead-in symbol {j+1}: '{symbol}' at {sync_time}")
+            sync_times.append(lyric["timestamp"])
+            formatted_lyrics.append(lyric["text"])
+            self.logger.debug(f"Added lyric: '{lyric['text']}' at {lyric['timestamp']}")
+        formatted_text = self.format_lyrics(
+            formatted_lyrics,
+            instrumentals,
+            sync_times,
+            font_path=cdg_styles["font_path"],
+            font_size=cdg_styles["font_size"],
+        )
+        return sync_times, formatted_text
+    def _create_toml_data(
+        self,
+        title: str,
+        artist: str,
+        audio_file: str,
+        output_name: str,
+        sync_times: List[int],
+        instrumentals: List[dict],
+        formatted_lyrics: List[str],
+        cdg_styles: dict,
+    ) -> dict:
+        """Create TOML data structure."""
+        safe_output_name = self._get_safe_filename(artist, title, "Karaoke")
+        return {
+            "title": title,
+            "artist": artist,
+            "file": audio_file,
+            "outname": safe_output_name,
+            "clear_mode": cdg_styles["clear_mode"],
+            "sync_offset": cdg_styles["sync_offset"],
+            "background": cdg_styles["background_color"],
+            "border": cdg_styles["border_color"],
+            "font": cdg_styles["font_path"],
+            "font_size": cdg_styles["font_size"],
+            "stroke_width": cdg_styles["stroke_width"],
+            "stroke_style": cdg_styles["stroke_style"],
+            "singers": [
+                {
+                    "active_fill": cdg_styles["active_fill"],
+                    "active_stroke": cdg_styles["active_stroke"],
+                    "inactive_fill": cdg_styles["inactive_fill"],
+                    "inactive_stroke": cdg_styles["inactive_stroke"],
+                }
+            ],
+            "lyrics": [
+                {
+                    "singer": 1,
+                    "sync": sync_times,
+                    "row": cdg_styles["row"],
+                    "line_tile_height": cdg_styles["line_tile_height"],
+                    "lines_per_page": cdg_styles["lines_per_page"],
+                    "text": formatted_lyrics,
+                }
+            ],
+            "title_color": cdg_styles["title_color"],
+            "artist_color": cdg_styles["artist_color"],
+            "title_screen_background": cdg_styles["title_screen_background"],
+            "title_screen_transition": cdg_styles["title_screen_transition"],
+            "instrumentals": instrumentals,
+            "intro_duration_seconds": cdg_styles["intro_duration_seconds"],
+            "title_top_padding": cdg_styles["title_top_padding"],
+            "title_artist_gap": cdg_styles["title_artist_gap"],
+            "first_syllable_buffer_seconds": cdg_styles["first_syllable_buffer_seconds"],
+            "outro_background": cdg_styles["outro_background"],
+            "outro_transition": cdg_styles["outro_transition"],
+            "outro_text_line1": cdg_styles["outro_text_line1"],
+            "outro_text_line2": cdg_styles["outro_text_line2"],
+            "outro_line1_color": cdg_styles["outro_line1_color"],
+            "outro_line2_color": cdg_styles["outro_line2_color"],
+            "outro_line1_line2_gap": cdg_styles["outro_line1_line2_gap"],
+        }
+    def _write_toml_file(self, toml_data: dict, output_file: str) -> None:
+        """Write TOML data to file."""
+        with open(output_file, "w", encoding="utf-8") as f:
+            toml.dump(toml_data, f)
+        self.logger.info(f"TOML file generated: {output_file}")
+    def get_font(self, font_path=None, font_size=18):
+        try:
+            return ImageFont.truetype(font_path, font_size) if font_path else ImageFont.load_default()
+        except IOError:
+            self.logger.warning(f"Font file {font_path} not found. Using default font.")
+            return ImageFont.load_default()
+    def get_text_width(self, text, font):
+        return font.getmask(text).getbbox()[2]
+    def wrap_text(self, text, max_width, font):
+        words = text.split()
+        lines = []
+        current_line = []
+        current_width = 0
+        for word in words:
+            word_width = self.get_text_width(word, font)
+            if current_width + word_width <= max_width:
+                current_line.append(word)
+                current_width += word_width + self.get_text_width(" ", font)
+            else:
+                if current_line:
+                    lines.append(" ".join(current_line))
+                    self.logger.debug(f"Wrapped line: {' '.join(current_line)}")
+                current_line = [word]
+                current_width = word_width
+        if current_line:
+            lines.append(" ".join(current_line))
+            self.logger.debug(f"Wrapped line: {' '.join(current_line)}")
+        return lines
+    def format_lyrics(self, lyrics_data, instrumentals, sync_times, font_path=None, font_size=18):
+        """Merge lyric fragments into wrapped display lines and return them newline-joined.
+        Fragments are accumulated into a pending line. A fragment that starts with
+        "/" begins a new line: the pending line is wrapped with ``get_wrapped_text``
+        to ``CDG_VISIBLE_WIDTH`` and emitted first, then the slash is dropped.
+        A "~" line is emitted after a wrapped line ending in "!", "?" or ".".
+        When a fragment is the last one before an instrumental, the pending line is
+        emitted and "~" lines are added until the line count is a multiple of 4.
+        Args:
+            lyrics_data: Text fragments (strings), indexed in parallel with ``sync_times``.
+            instrumentals: Dicts with a "sync" key giving the instrumental's sync time.
+            sync_times: Sync time of each fragment; ``sync_times[i]`` belongs to ``lyrics_data[i]``.
+            font_path: Font file forwarded to ``get_font``.
+            font_size: Font size forwarded to ``get_font``.
+        Returns:
+            All emitted lines joined with "\\n" as a single string.
+        """
+        formatted_lyrics = []
+        font = self.get_font(font_path, font_size)
+        self.logger.debug(f"Using font: {font}")
+        current_line = ""
+        # lines_on_page / page_number track a page of 4 lines. page_number is only
+        # ever used in debug messages.
+        # NOTE(review): the page size 4 is hard-coded here although the caller's
+        # styles carry a "lines_per_page" setting - confirm they are meant to agree.
+        lines_on_page = 0
+        page_number = 1
+        for i, text in enumerate(lyrics_data):
+            self.logger.debug(f"format_lyrics: Processing text {i}: '{text}' (sync time: {sync_times[i]})")
+            # A leading "/" marks the start of a new line: flush what was accumulated so far.
+            if text.startswith("/"):
+                if current_line:
+                    wrapped_lines = get_wrapped_text(current_line.strip(), font, CDG_VISIBLE_WIDTH).split("\n")
+                    for wrapped_line in wrapped_lines:
+                        formatted_lyrics.append(wrapped_line)
+                        lines_on_page += 1
+                        self.logger.debug(f"format_lyrics: Added wrapped line: '{wrapped_line}'. Lines on page: {lines_on_page}")
+                        # Add empty line after punctuation immediately
+                        # (the `not wrapped_line == "~"` guard cannot be False here,
+                        # since "~" does not end with any of the three characters).
+                        if wrapped_line.endswith(("!", "?", ".")) and not wrapped_line == "~":
+                            formatted_lyrics.append("~")
+                            lines_on_page += 1
+                            self.logger.debug(f"format_lyrics: Added empty line after punctuation. Lines on page now: {lines_on_page}")
+                        # NOTE(review): if the "~" above takes the count from 3 to 5, this
+                        # equality check never fires and the counter keeps growing; the
+                        # padding below uses `% 4`, so only the logged numbers are affected.
+                        if lines_on_page == 4:
+                            lines_on_page = 0
+                            page_number += 1
+                            self.logger.debug(f"format_lyrics: Page full. New page number: {page_number}")
+                    current_line = ""
+                # Drop the "/" marker before appending the fragment.
+                text = text[1:]
+            current_line += text + " "
+            # self.logger.debug(f"format_lyrics: Current line: '{current_line}'")
+            # True when some instrumental starts after this fragment and before the
+            # next fragment's sync time (or after it, if this is the last sync time).
+            is_last_before_instrumental = any(
+                inst["sync"] > sync_times[i] and (i == len(sync_times) - 1 or sync_times[i + 1] > inst["sync"]) for inst in instrumentals
+            )
+            if is_last_before_instrumental or i == len(lyrics_data) - 1:
+                # End of a section or of the song: flush the pending line.
+                # Unlike the "/" branch, no "~" line is added after punctuation here.
+                if current_line:
+                    wrapped_lines = get_wrapped_text(current_line.strip(), font, CDG_VISIBLE_WIDTH).split("\n")
+                    for wrapped_line in wrapped_lines:
+                        formatted_lyrics.append(wrapped_line)
+                        lines_on_page += 1
+                        self.logger.debug(
+                            f"format_lyrics: Added wrapped line at end of section: '{wrapped_line}'. Lines on page: {lines_on_page}"
+                        )
+                        if lines_on_page == 4:
+                            lines_on_page = 0
+                            page_number += 1
+                            self.logger.debug(f"format_lyrics: Page full. New page number: {page_number}")
+                    current_line = ""
+                if is_last_before_instrumental:
+                    self.logger.debug(f"format_lyrics: is_last_before_instrumental: True lines_on_page: {lines_on_page}")
+                    # Calculate remaining lines needed to reach next full page
+                    remaining_lines = 4 - (lines_on_page % 4) if lines_on_page % 4 != 0 else 0
+                    if remaining_lines > 0:
+                        formatted_lyrics.extend(["~"] * remaining_lines)
+                        self.logger.debug(f"format_lyrics: Added {remaining_lines} empty lines to complete current page")
+                    # Reset the counter and increment page
+                    lines_on_page = 0
+                    page_number += 1
+                    self.logger.debug(f"format_lyrics: Reset lines_on_page to 0. New page number: {page_number}")
+        return "\n".join(formatted_lyrics)
+    def generate_cdg_from_lrc(
+        self,
+        lrc_file: str,
+        audio_file: str,
+        title: str,
+        artist: str,
+        cdg_styles: dict,
+    ) -> Tuple[str, str, str]:
+        """Generate a CDG file from an LRC file and audio file.
+        Args:
+            lrc_file: Path to the LRC file
+            audio_file: Path to the audio file
+            title: Title of the song
+            artist: Artist name
+            cdg_styles: Dictionary containing CDG style parameters
+        Returns:
+            Tuple containing paths to (cdg_file, mp3_file, zip_file)
+        """
+        self._validate_and_setup_font(cdg_styles)
+        # Parse LRC file and convert to lyrics_data format
+        lyrics_data = self._parse_lrc(lrc_file)
+        toml_file = self._create_toml_file(
+            audio_file=audio_file,
+            title=title,
+            artist=artist,
+            lyrics_data=lyrics_data,
+            cdg_styles=cdg_styles,
+        )
+        try:
+            self._compose_cdg(toml_file)
+            output_zip = self._find_cdg_zip(artist, title)
+            self._extract_cdg_files(output_zip)
+            cdg_file = self._get_cdg_path(artist, title)
+            mp3_file = self._get_mp3_path(artist, title)
+            self._verify_output_files(cdg_file, mp3_file)
+            self.logger.info("CDG file generated successfully")
+            return cdg_file, mp3_file, output_zip
+        except Exception as e:
+            self.logger.error(f"Error composing CDG: {e}")
+            raise
+    def _parse_lrc(self, lrc_file: str) -> List[dict]:
+        """Parse LRC file and extract timestamps and lyrics."""
+        with open(lrc_file, "r", encoding="utf-8") as f:
+            content = f.read()
+        # Extract timestamps and lyrics
+        pattern = r"\[(\d{2}):(\d{2})\.(\d{3})\](\d+:)?(/?.*)"
+        matches = re.findall(pattern, content)
+        if not matches:
+            raise ValueError(f"No valid lyrics found in the LRC file: {lrc_file}")
+        lyrics = []
+        for match in matches:
+            minutes, seconds, milliseconds = map(int, match[:3])
+            timestamp = (minutes * 60 + seconds) * 100 + int(milliseconds / 10)  # Convert to centiseconds
+            text = match[4].strip().upper()
+            if text:  # Only add non-empty lyrics
+                lyrics.append({"timestamp": timestamp, "text": text})
+        self.logger.info(f"Found {len(lyrics)} lyric lines")
+        return lyrics

lyrics_transcriber/output/cdgmaker/__init__.py ADDED Viewed

File without changes

karaoke-gen 0.57.0__py3-none-any.whl → 0.71.27__py3-none-any.whl

karaoke-gen 0.57.0py3-none-any.whl → 0.71.27py3-none-any.whl