PyPI - karaoke-gen - Versions diffs - 0.57.0__py3-none-any.whl → 0.71.27__py3-none-any.whl - Mend

karaoke-gen 0.57.0-py3-none-any.whl → 0.71.27-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (268) hide show

karaoke_gen/audio_fetcher.py +461 -0
karaoke_gen/audio_processor.py +407 -30
karaoke_gen/config.py +62 -113
karaoke_gen/file_handler.py +32 -59
karaoke_gen/karaoke_finalise/karaoke_finalise.py +148 -67
karaoke_gen/karaoke_gen.py +270 -61
karaoke_gen/lyrics_processor.py +13 -1
karaoke_gen/metadata.py +78 -73
karaoke_gen/pipeline/__init__.py +87 -0
karaoke_gen/pipeline/base.py +215 -0
karaoke_gen/pipeline/context.py +230 -0
karaoke_gen/pipeline/executors/__init__.py +21 -0
karaoke_gen/pipeline/executors/local.py +159 -0
karaoke_gen/pipeline/executors/remote.py +257 -0
karaoke_gen/pipeline/stages/__init__.py +27 -0
karaoke_gen/pipeline/stages/finalize.py +202 -0
karaoke_gen/pipeline/stages/render.py +165 -0
karaoke_gen/pipeline/stages/screens.py +139 -0
karaoke_gen/pipeline/stages/separation.py +191 -0
karaoke_gen/pipeline/stages/transcription.py +191 -0
karaoke_gen/style_loader.py +531 -0
karaoke_gen/utils/bulk_cli.py +6 -0
karaoke_gen/utils/cli_args.py +424 -0
karaoke_gen/utils/gen_cli.py +26 -261
karaoke_gen/utils/remote_cli.py +1965 -0
karaoke_gen/video_background_processor.py +351 -0
karaoke_gen-0.71.27.dist-info/METADATA +610 -0
karaoke_gen-0.71.27.dist-info/RECORD +275 -0
{karaoke_gen-0.57.0.dist-info → karaoke_gen-0.71.27.dist-info}/WHEEL +1 -1
{karaoke_gen-0.57.0.dist-info → karaoke_gen-0.71.27.dist-info}/entry_points.txt +1 -0
lyrics_transcriber/__init__.py +10 -0
lyrics_transcriber/cli/__init__.py +0 -0
lyrics_transcriber/cli/cli_main.py +285 -0
lyrics_transcriber/core/__init__.py +0 -0
lyrics_transcriber/core/config.py +50 -0
lyrics_transcriber/core/controller.py +520 -0
lyrics_transcriber/correction/__init__.py +0 -0
lyrics_transcriber/correction/agentic/__init__.py +9 -0
lyrics_transcriber/correction/agentic/adapter.py +71 -0
lyrics_transcriber/correction/agentic/agent.py +313 -0
lyrics_transcriber/correction/agentic/feedback/aggregator.py +12 -0
lyrics_transcriber/correction/agentic/feedback/collector.py +17 -0
lyrics_transcriber/correction/agentic/feedback/retention.py +24 -0
lyrics_transcriber/correction/agentic/feedback/store.py +76 -0
lyrics_transcriber/correction/agentic/handlers/__init__.py +24 -0
lyrics_transcriber/correction/agentic/handlers/ambiguous.py +44 -0
lyrics_transcriber/correction/agentic/handlers/background_vocals.py +68 -0
lyrics_transcriber/correction/agentic/handlers/base.py +51 -0
lyrics_transcriber/correction/agentic/handlers/complex_multi_error.py +46 -0
lyrics_transcriber/correction/agentic/handlers/extra_words.py +74 -0
lyrics_transcriber/correction/agentic/handlers/no_error.py +42 -0
lyrics_transcriber/correction/agentic/handlers/punctuation.py +44 -0
lyrics_transcriber/correction/agentic/handlers/registry.py +60 -0
lyrics_transcriber/correction/agentic/handlers/repeated_section.py +44 -0
lyrics_transcriber/correction/agentic/handlers/sound_alike.py +126 -0
lyrics_transcriber/correction/agentic/models/__init__.py +5 -0
lyrics_transcriber/correction/agentic/models/ai_correction.py +31 -0
lyrics_transcriber/correction/agentic/models/correction_session.py +30 -0
lyrics_transcriber/correction/agentic/models/enums.py +38 -0
lyrics_transcriber/correction/agentic/models/human_feedback.py +30 -0
lyrics_transcriber/correction/agentic/models/learning_data.py +26 -0
lyrics_transcriber/correction/agentic/models/observability_metrics.py +28 -0
lyrics_transcriber/correction/agentic/models/schemas.py +46 -0
lyrics_transcriber/correction/agentic/models/utils.py +19 -0
lyrics_transcriber/correction/agentic/observability/__init__.py +5 -0
lyrics_transcriber/correction/agentic/observability/langfuse_integration.py +35 -0
lyrics_transcriber/correction/agentic/observability/metrics.py +46 -0
lyrics_transcriber/correction/agentic/observability/performance.py +19 -0
lyrics_transcriber/correction/agentic/prompts/__init__.py +2 -0
lyrics_transcriber/correction/agentic/prompts/classifier.py +227 -0
lyrics_transcriber/correction/agentic/providers/__init__.py +6 -0
lyrics_transcriber/correction/agentic/providers/base.py +36 -0
lyrics_transcriber/correction/agentic/providers/circuit_breaker.py +145 -0
lyrics_transcriber/correction/agentic/providers/config.py +73 -0
lyrics_transcriber/correction/agentic/providers/constants.py +24 -0
lyrics_transcriber/correction/agentic/providers/health.py +28 -0
lyrics_transcriber/correction/agentic/providers/langchain_bridge.py +212 -0
lyrics_transcriber/correction/agentic/providers/model_factory.py +209 -0
lyrics_transcriber/correction/agentic/providers/response_cache.py +218 -0
lyrics_transcriber/correction/agentic/providers/response_parser.py +111 -0
lyrics_transcriber/correction/agentic/providers/retry_executor.py +127 -0
lyrics_transcriber/correction/agentic/router.py +35 -0
lyrics_transcriber/correction/agentic/workflows/__init__.py +5 -0
lyrics_transcriber/correction/agentic/workflows/consensus_workflow.py +24 -0
lyrics_transcriber/correction/agentic/workflows/correction_graph.py +59 -0
lyrics_transcriber/correction/agentic/workflows/feedback_workflow.py +24 -0
lyrics_transcriber/correction/anchor_sequence.py +1043 -0
lyrics_transcriber/correction/corrector.py +760 -0
lyrics_transcriber/correction/feedback/__init__.py +2 -0
lyrics_transcriber/correction/feedback/schemas.py +107 -0
lyrics_transcriber/correction/feedback/store.py +236 -0
lyrics_transcriber/correction/handlers/__init__.py +0 -0
lyrics_transcriber/correction/handlers/base.py +52 -0
lyrics_transcriber/correction/handlers/extend_anchor.py +149 -0
lyrics_transcriber/correction/handlers/levenshtein.py +189 -0
lyrics_transcriber/correction/handlers/llm.py +293 -0
lyrics_transcriber/correction/handlers/llm_providers.py +60 -0
lyrics_transcriber/correction/handlers/no_space_punct_match.py +154 -0
lyrics_transcriber/correction/handlers/relaxed_word_count_match.py +85 -0
lyrics_transcriber/correction/handlers/repeat.py +88 -0
lyrics_transcriber/correction/handlers/sound_alike.py +259 -0
lyrics_transcriber/correction/handlers/syllables_match.py +252 -0
lyrics_transcriber/correction/handlers/word_count_match.py +80 -0
lyrics_transcriber/correction/handlers/word_operations.py +187 -0
lyrics_transcriber/correction/operations.py +352 -0
lyrics_transcriber/correction/phrase_analyzer.py +435 -0
lyrics_transcriber/correction/text_utils.py +30 -0
lyrics_transcriber/frontend/.gitignore +23 -0
lyrics_transcriber/frontend/.yarn/releases/yarn-4.7.0.cjs +935 -0
lyrics_transcriber/frontend/.yarnrc.yml +3 -0
lyrics_transcriber/frontend/README.md +50 -0
lyrics_transcriber/frontend/REPLACE_ALL_FUNCTIONALITY.md +210 -0
lyrics_transcriber/frontend/__init__.py +25 -0
lyrics_transcriber/frontend/eslint.config.js +28 -0
lyrics_transcriber/frontend/index.html +18 -0
lyrics_transcriber/frontend/package.json +42 -0
lyrics_transcriber/frontend/public/android-chrome-192x192.png +0 -0
lyrics_transcriber/frontend/public/android-chrome-512x512.png +0 -0
lyrics_transcriber/frontend/public/apple-touch-icon.png +0 -0
lyrics_transcriber/frontend/public/favicon-16x16.png +0 -0
lyrics_transcriber/frontend/public/favicon-32x32.png +0 -0
lyrics_transcriber/frontend/public/favicon.ico +0 -0
lyrics_transcriber/frontend/public/nomad-karaoke-logo.png +0 -0
lyrics_transcriber/frontend/src/App.tsx +212 -0
lyrics_transcriber/frontend/src/api.ts +239 -0
lyrics_transcriber/frontend/src/components/AIFeedbackModal.tsx +77 -0
lyrics_transcriber/frontend/src/components/AddLyricsModal.tsx +114 -0
lyrics_transcriber/frontend/src/components/AgenticCorrectionMetrics.tsx +204 -0
lyrics_transcriber/frontend/src/components/AudioPlayer.tsx +180 -0
lyrics_transcriber/frontend/src/components/CorrectedWordWithActions.tsx +167 -0
lyrics_transcriber/frontend/src/components/CorrectionAnnotationModal.tsx +359 -0
lyrics_transcriber/frontend/src/components/CorrectionDetailCard.tsx +281 -0
lyrics_transcriber/frontend/src/components/CorrectionMetrics.tsx +162 -0
lyrics_transcriber/frontend/src/components/DurationTimelineView.tsx +257 -0
lyrics_transcriber/frontend/src/components/EditActionBar.tsx +68 -0
lyrics_transcriber/frontend/src/components/EditModal.tsx +702 -0
lyrics_transcriber/frontend/src/components/EditTimelineSection.tsx +496 -0
lyrics_transcriber/frontend/src/components/EditWordList.tsx +379 -0
lyrics_transcriber/frontend/src/components/FileUpload.tsx +77 -0
lyrics_transcriber/frontend/src/components/FindReplaceModal.tsx +467 -0
lyrics_transcriber/frontend/src/components/Header.tsx +387 -0
lyrics_transcriber/frontend/src/components/LyricsAnalyzer.tsx +1373 -0
lyrics_transcriber/frontend/src/components/MetricsDashboard.tsx +51 -0
lyrics_transcriber/frontend/src/components/ModeSelector.tsx +67 -0
lyrics_transcriber/frontend/src/components/ModelSelector.tsx +23 -0
lyrics_transcriber/frontend/src/components/PreviewVideoSection.tsx +144 -0
lyrics_transcriber/frontend/src/components/ReferenceView.tsx +268 -0
lyrics_transcriber/frontend/src/components/ReplaceAllLyricsModal.tsx +688 -0
lyrics_transcriber/frontend/src/components/ReviewChangesModal.tsx +354 -0
lyrics_transcriber/frontend/src/components/SegmentDetailsModal.tsx +64 -0
lyrics_transcriber/frontend/src/components/TimelineEditor.tsx +376 -0
lyrics_transcriber/frontend/src/components/TimingOffsetModal.tsx +131 -0
lyrics_transcriber/frontend/src/components/TranscriptionView.tsx +256 -0
lyrics_transcriber/frontend/src/components/WordDivider.tsx +187 -0
lyrics_transcriber/frontend/src/components/shared/components/HighlightedText.tsx +379 -0
lyrics_transcriber/frontend/src/components/shared/components/SourceSelector.tsx +56 -0
lyrics_transcriber/frontend/src/components/shared/components/Word.tsx +87 -0
lyrics_transcriber/frontend/src/components/shared/constants.ts +20 -0
lyrics_transcriber/frontend/src/components/shared/hooks/useWordClick.ts +180 -0
lyrics_transcriber/frontend/src/components/shared/styles.ts +13 -0
lyrics_transcriber/frontend/src/components/shared/types.js +2 -0
lyrics_transcriber/frontend/src/components/shared/types.ts +129 -0
lyrics_transcriber/frontend/src/components/shared/utils/keyboardHandlers.ts +177 -0
lyrics_transcriber/frontend/src/components/shared/utils/localStorage.ts +78 -0
lyrics_transcriber/frontend/src/components/shared/utils/referenceLineCalculator.ts +75 -0
lyrics_transcriber/frontend/src/components/shared/utils/segmentOperations.ts +360 -0
lyrics_transcriber/frontend/src/components/shared/utils/timingUtils.ts +110 -0
lyrics_transcriber/frontend/src/components/shared/utils/wordUtils.ts +22 -0
lyrics_transcriber/frontend/src/hooks/useManualSync.ts +435 -0
lyrics_transcriber/frontend/src/main.tsx +17 -0
lyrics_transcriber/frontend/src/theme.ts +177 -0
lyrics_transcriber/frontend/src/types/global.d.ts +9 -0
lyrics_transcriber/frontend/src/types.js +2 -0
lyrics_transcriber/frontend/src/types.ts +199 -0
lyrics_transcriber/frontend/src/validation.ts +132 -0
lyrics_transcriber/frontend/src/vite-env.d.ts +1 -0
lyrics_transcriber/frontend/tsconfig.app.json +26 -0
lyrics_transcriber/frontend/tsconfig.json +25 -0
lyrics_transcriber/frontend/tsconfig.node.json +23 -0
lyrics_transcriber/frontend/tsconfig.tsbuildinfo +1 -0
lyrics_transcriber/frontend/update_version.js +11 -0
lyrics_transcriber/frontend/vite.config.d.ts +2 -0
lyrics_transcriber/frontend/vite.config.js +10 -0
lyrics_transcriber/frontend/vite.config.ts +11 -0
lyrics_transcriber/frontend/web_assets/android-chrome-192x192.png +0 -0
lyrics_transcriber/frontend/web_assets/android-chrome-512x512.png +0 -0
lyrics_transcriber/frontend/web_assets/apple-touch-icon.png +0 -0
lyrics_transcriber/frontend/web_assets/assets/index-DdJTDWH3.js +42039 -0
lyrics_transcriber/frontend/web_assets/assets/index-DdJTDWH3.js.map +1 -0
lyrics_transcriber/frontend/web_assets/favicon-16x16.png +0 -0
lyrics_transcriber/frontend/web_assets/favicon-32x32.png +0 -0
lyrics_transcriber/frontend/web_assets/favicon.ico +0 -0
lyrics_transcriber/frontend/web_assets/index.html +18 -0
lyrics_transcriber/frontend/web_assets/nomad-karaoke-logo.png +0 -0
lyrics_transcriber/frontend/yarn.lock +3752 -0
lyrics_transcriber/lyrics/__init__.py +0 -0
lyrics_transcriber/lyrics/base_lyrics_provider.py +211 -0
lyrics_transcriber/lyrics/file_provider.py +95 -0
lyrics_transcriber/lyrics/genius.py +384 -0
lyrics_transcriber/lyrics/lrclib.py +231 -0
lyrics_transcriber/lyrics/musixmatch.py +156 -0
lyrics_transcriber/lyrics/spotify.py +290 -0
lyrics_transcriber/lyrics/user_input_provider.py +44 -0
lyrics_transcriber/output/__init__.py +0 -0
lyrics_transcriber/output/ass/__init__.py +21 -0
lyrics_transcriber/output/ass/ass.py +2088 -0
lyrics_transcriber/output/ass/ass_specs.txt +732 -0
lyrics_transcriber/output/ass/config.py +180 -0
lyrics_transcriber/output/ass/constants.py +23 -0
lyrics_transcriber/output/ass/event.py +94 -0
lyrics_transcriber/output/ass/formatters.py +132 -0
lyrics_transcriber/output/ass/lyrics_line.py +265 -0
lyrics_transcriber/output/ass/lyrics_screen.py +252 -0
lyrics_transcriber/output/ass/section_detector.py +89 -0
lyrics_transcriber/output/ass/section_screen.py +106 -0
lyrics_transcriber/output/ass/style.py +187 -0
lyrics_transcriber/output/cdg.py +619 -0
lyrics_transcriber/output/cdgmaker/__init__.py +0 -0
lyrics_transcriber/output/cdgmaker/cdg.py +262 -0
lyrics_transcriber/output/cdgmaker/composer.py +2260 -0
lyrics_transcriber/output/cdgmaker/config.py +151 -0
lyrics_transcriber/output/cdgmaker/images/instrumental.png +0 -0
lyrics_transcriber/output/cdgmaker/images/intro.png +0 -0
lyrics_transcriber/output/cdgmaker/pack.py +507 -0
lyrics_transcriber/output/cdgmaker/render.py +346 -0
lyrics_transcriber/output/cdgmaker/transitions/centertexttoplogobottomtext.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/circlein.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/circleout.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/fizzle.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/largecentertexttoplogo.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/rectangle.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/spiral.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/topleftmusicalnotes.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/wipein.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/wipeleft.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/wipeout.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/wiperight.png +0 -0
lyrics_transcriber/output/cdgmaker/utils.py +132 -0
lyrics_transcriber/output/countdown_processor.py +267 -0
lyrics_transcriber/output/fonts/AvenirNext-Bold.ttf +0 -0
lyrics_transcriber/output/fonts/DMSans-VariableFont_opsz,wght.ttf +0 -0
lyrics_transcriber/output/fonts/DMSerifDisplay-Regular.ttf +0 -0
lyrics_transcriber/output/fonts/Oswald-SemiBold.ttf +0 -0
lyrics_transcriber/output/fonts/Zurich_Cn_BT_Bold.ttf +0 -0
lyrics_transcriber/output/fonts/arial.ttf +0 -0
lyrics_transcriber/output/fonts/georgia.ttf +0 -0
lyrics_transcriber/output/fonts/verdana.ttf +0 -0
lyrics_transcriber/output/generator.py +257 -0
lyrics_transcriber/output/lrc_to_cdg.py +61 -0
lyrics_transcriber/output/lyrics_file.py +102 -0
lyrics_transcriber/output/plain_text.py +96 -0
lyrics_transcriber/output/segment_resizer.py +431 -0
lyrics_transcriber/output/subtitles.py +397 -0
lyrics_transcriber/output/video.py +544 -0
lyrics_transcriber/review/__init__.py +0 -0
lyrics_transcriber/review/server.py +676 -0
lyrics_transcriber/storage/__init__.py +0 -0
lyrics_transcriber/storage/dropbox.py +225 -0
lyrics_transcriber/transcribers/__init__.py +0 -0
lyrics_transcriber/transcribers/audioshake.py +290 -0
lyrics_transcriber/transcribers/base_transcriber.py +157 -0
lyrics_transcriber/transcribers/whisper.py +330 -0
lyrics_transcriber/types.py +648 -0
lyrics_transcriber/utils/__init__.py +0 -0
lyrics_transcriber/utils/word_utils.py +27 -0
karaoke_gen-0.57.0.dist-info/METADATA +0 -167
karaoke_gen-0.57.0.dist-info/RECORD +0 -23
{karaoke_gen-0.57.0.dist-info → karaoke_gen-0.71.27.dist-info/licenses}/LICENSE +0 -0

lyrics_transcriber/output/lyrics_file.py ADDED Viewed

@@ -0,0 +1,102 @@
+import logging
+import os
+from typing import List, Optional
+from lyrics_transcriber.types import LyricsSegment, Word
+class LyricsFileGenerator:
+    """Writes lyrics files (currently only MidiCo-style LRC) into one output directory."""
+    def __init__(self, output_dir: str, logger: Optional[logging.Logger] = None):
+        """Remember where files go and which logger to report through.
+        Args:
+            output_dir: Directory that generated files are written into
+            logger: Logger to use; falls back to this module's logger when not given
+        """
+        if not logger:
+            logger = logging.getLogger(__name__)
+        self.logger = logger
+        self.output_dir = output_dir
+    def _get_output_path(self, output_prefix: str, extension: str) -> str:
+        """Return `<output_dir>/<output_prefix>.<extension>`."""
+        filename = f"{output_prefix}.{extension}"
+        return os.path.join(self.output_dir, filename)
+    def generate_lrc(self, segments: List[LyricsSegment], output_prefix: str) -> str:
+        """Write the segments to "<output_prefix> (Karaoke).lrc" and return its path.
+        Args:
+            segments: Segments whose words carry `text` and `start_time`
+            output_prefix: Base name of the file, without suffix or extension
+        Returns:
+            Path of the LRC file that was written
+        Raises:
+            Exception: Any error from writing the file is logged and re-raised unchanged
+        """
+        self.logger.info("Generating LRC format lyrics")
+        lrc_path = self._get_output_path(f"{output_prefix} (Karaoke)", "lrc")
+        try:
+            self._write_lrc_file(lrc_path, segments)
+            self.logger.info(f"LRC file generated: {lrc_path}")
+        except Exception as e:
+            self.logger.error(f"Failed to generate LRC file: {e!s}")
+            raise
+        return lrc_path
+    def _write_lrc_file(self, output_path: str, segments: List[LyricsSegment]) -> None:
+        """Emit one `[MM:SS.mmm]1:<text>` line per word, preceded by the MidiCo header.
+        Args:
+            output_path: File to create (overwritten if it exists), written as UTF-8
+            segments: Segments to serialise, in order
+        """
+        with open(output_path, "w", encoding="utf-8") as lrc_file:
+            lrc_file.write("[re:MidiCo]\n")
+            for segment in segments:
+                last_index = len(segment.words) - 1
+                for index, word in enumerate(segment.words):
+                    stamp = self._format_lrc_timestamp(word.start_time)
+                    # "/" marks the first word of a segment (start of a new line)
+                    marker = "" if index else "/"
+                    # Every word but the last one in the segment carries a trailing space
+                    text = word.text if index == last_index else word.text + " "
+                    lrc_file.write(f"[{stamp}]1:{marker}{text}\n")
+    def _format_lrc_timestamp(self, seconds: float) -> str:
+        """Render a time in seconds as MM:SS.mmm, rounded to the nearest millisecond.
+        Args:
+            seconds: Time offset in seconds
+        Returns:
+            Zero-padded timestamp string, e.g. 61.5 -> "01:01.500"
+        """
+        whole_minutes = int(seconds // 60)
+        # Round only the sub-minute remainder, then split it into seconds and milliseconds
+        secs, millis = divmod(round((seconds % 60) * 1000), 1000)
+        if secs == 60:
+            # Rounding pushed 59.9995+ up to a full minute: carry it over
+            secs = 0
+            whole_minutes += 1
+        return f"{whole_minutes:02d}:{secs:02d}.{millis:03d}"
+    # Future methods for other lyrics file formats can be added here
+    # def generate_txt(self, segments: List[LyricsSegment], output_prefix: str) -> str:
+    #     """Generate Power Karaoke TXT format lyrics file."""
+    #     pass

lyrics_transcriber/output/plain_text.py ADDED Viewed

@@ -0,0 +1,96 @@
+import logging
+import os
+from typing import List, Optional
+from lyrics_transcriber.types import LyricsData, LyricsSegment
+from lyrics_transcriber.correction.corrector import CorrectionResult
+class PlainTextGenerator:
+    """Writes plain-text (.txt) versions of provider lyrics, corrected lyrics and raw transcriptions."""
+    def __init__(self, output_dir: str, logger: Optional[logging.Logger] = None):
+        """Remember where files go and which logger to report through.
+        Args:
+            output_dir: Directory that generated files are written into
+            logger: Logger to use; falls back to this module's logger when not given
+        """
+        if not logger:
+            logger = logging.getLogger(__name__)
+        self.logger = logger
+        self.output_dir = output_dir
+    def _get_output_path(self, output_prefix: str, extension: str) -> str:
+        """Return `<output_dir>/<output_prefix>.<extension>`."""
+        filename = f"{output_prefix}.{extension}"
+        return os.path.join(self.output_dir, filename)
+    def write_lyrics(self, lyrics_data: LyricsData, output_prefix: str) -> str:
+        """Write provider lyrics to "<output_prefix> (Lyrics <Provider>).txt".
+        The provider name is `lyrics_data.metadata.source` in title case. Segment
+        texts are joined with newlines, with no trailing newline.
+        Args:
+            lyrics_data: Lyrics as returned by a provider
+            output_prefix: Base name of the file, without suffix or extension
+        Returns:
+            Path of the file that was written
+        Raises:
+            Exception: Any error while writing is logged and re-raised unchanged
+        """
+        self.logger.info("Writing plain lyrics file")
+        source_label = lyrics_data.metadata.source.title()
+        txt_path = self._get_output_path(f"{output_prefix} (Lyrics {source_label})", "txt")
+        try:
+            with open(txt_path, "w", encoding="utf-8") as out:
+                out.write("\n".join(seg.text for seg in lyrics_data.segments))
+            self.logger.info(f"Plain lyrics file generated: {txt_path}")
+        except Exception as e:
+            self.logger.error(f"Failed to write plain lyrics file: {e!s}")
+            raise
+        return txt_path
+    def write_corrected_lyrics(self, segments: List[LyricsSegment], output_prefix: str) -> str:
+        """Write corrected lyrics to "<output_prefix> (Lyrics Corrected).txt", one segment per line.
+        Args:
+            segments: Corrected segments; each segment's `text` becomes one line
+            output_prefix: Base name of the file, without suffix or extension
+        Returns:
+            Path of the file that was written
+        Raises:
+            Exception: Any error while writing is logged and re-raised unchanged
+        """
+        self.logger.info("Writing corrected lyrics file")
+        txt_path = self._get_output_path(f"{output_prefix} (Lyrics Corrected)", "txt")
+        try:
+            with open(txt_path, "w", encoding="utf-8") as out:
+                # Unlike write_lyrics, every line (including the last) ends with a newline
+                out.writelines(f"{seg.text}\n" for seg in segments)
+            self.logger.info(f"Corrected lyrics file generated: {txt_path}")
+        except Exception as e:
+            self.logger.error(f"Failed to write corrected lyrics file: {e!s}")
+            raise
+        return txt_path
+    def write_original_transcription(self, correction_result: CorrectionResult, output_prefix: str) -> str:
+        """Write the uncorrected transcription to "<output_prefix> (Lyrics Uncorrected).txt".
+        All words of all original segments are joined with single spaces, so the
+        file contains one line with no segment breaks.
+        Args:
+            correction_result: Result object whose `original_segments` hold the raw words
+            output_prefix: Base name of the file, without suffix or extension
+        Returns:
+            Path of the file that was written
+        Raises:
+            Exception: Any error while writing is logged and re-raised unchanged
+        """
+        self.logger.info("Writing original transcription file")
+        txt_path = self._get_output_path(f"{output_prefix} (Lyrics Uncorrected)", "txt")
+        per_segment = (" ".join(w.text for w in seg.words) for seg in correction_result.original_segments)
+        flat_text = " ".join(per_segment)
+        try:
+            with open(txt_path, "w", encoding="utf-8") as out:
+                out.write(flat_text)
+            self.logger.info(f"Original transcription file generated: {txt_path}")
+        except Exception as e:
+            self.logger.error(f"Failed to write original transcription file: {e!s}")
+            raise
+        return txt_path

lyrics_transcriber/output/segment_resizer.py ADDED Viewed

@@ -0,0 +1,431 @@
+import logging
+import re
+from typing import List, Optional
+from lyrics_transcriber.types import LyricsSegment, Word
+from lyrics_transcriber.utils.word_utils import WordUtils
+class SegmentResizer:
+    """Handles resizing of lyrics segments to ensure proper line lengths and natural breaks.
+    This class processes lyrics segments and splits them into smaller segments when they exceed
+    a maximum line length. It attempts to split at natural break points like sentence endings,
+    commas, or conjunctions to maintain readability.
+    Example:
+        resizer = SegmentResizer(max_line_length=36)
+        segments = [
+            LyricsSegment(
+                text="This is a very long sentence that needs to be split into multiple lines for better readability",
+                words=[...],  # List of Word objects with timing information
+                start_time=0.0,
+                end_time=5.0
+            )
+        ]
+        resized = resizer.resize_segments(segments)
+        # Results in:
+        # [
+        #     LyricsSegment(text="This is a very long sentence", ...),
+        #     LyricsSegment(text="that needs to be split", ...),
+        #     LyricsSegment(text="into multiple lines", ...),
+        #     LyricsSegment(text="for better readability", ...)
+        # ]
+    """
+    def __init__(self, max_line_length: int = 36, logger: Optional[logging.Logger] = None):
+        """Set the line-length limit and the logger used for diagnostics.
+        Args:
+            max_line_length: Longest cleaned segment text (in characters) that is kept unsplit
+            logger: Logger to use; falls back to this module's logger when not given
+        """
+        if not logger:
+            logger = logging.getLogger(__name__)
+        self.logger = logger
+        self.max_line_length = max_line_length
+    def resize_segments(self, segments: List[LyricsSegment]) -> List[LyricsSegment]:
+        """Return the segments with every over-long one split into shorter segments.
+        A segment whose whitespace-normalised text fits within `max_line_length`
+        is kept as a cleaned copy; any longer segment is replaced by the pieces
+        produced by `_split_oversized_segment`. Input order is preserved.
+        Example:
+            Input segment: "Hello world, this is a test. And here's another sentence."
+            Output segments: [
+                "Hello world, this is a test.",
+                "And here's another sentence."
+            ]
+        Args:
+            segments: List of LyricsSegment objects to process
+        Returns:
+            List of resized LyricsSegment objects
+        """
+        self._log_input_segments(segments)
+        result: List[LyricsSegment] = []
+        for index, original in enumerate(segments):
+            cleaned = self._create_cleaned_segment(original)
+            if len(cleaned.text) > self.max_line_length:
+                # Too long: the splitter cleans the original segment's text itself
+                result.extend(self._split_oversized_segment(index, original))
+            else:
+                result.append(cleaned)
+        self._log_output_segments(result)
+        return result
+    def _clean_text(self, text: str) -> str:
+        """Collapse every run of whitespace (newlines included) into a single space.
+        Leading and trailing whitespace is dropped as well.
+        Example:
+            Input: "Hello\n  World  \n!"
+            Output: "Hello World !"
+        Args:
+            text: String to clean
+        Returns:
+            The words of `text` joined by single spaces
+        """
+        # str.split() with no separator already treats "\n" as whitespace
+        tokens = text.split()
+        return " ".join(tokens)
+    def _create_cleaned_segment(self, segment: LyricsSegment) -> LyricsSegment:
+        """Return a copy of `segment` whose text has normalised whitespace.
+        The id, the word list (same list object) and both timestamps are carried over unchanged.
+        Example:
+            Input: LyricsSegment(text="Hello\n  World\n", words=[...])
+            Output: LyricsSegment(text="Hello World", words=[...])
+        """
+        return LyricsSegment(
+            id=segment.id,  # keep the original segment's identity
+            text=self._clean_text(segment.text),
+            words=segment.words,
+            start_time=segment.start_time,
+            end_time=segment.end_time,
+        )
+    def _create_cleaned_word(self, word: Word) -> Word:
+        """Return a copy of `word` whose text has normalised whitespace.
+        The id and timestamps are carried over; `confidence` is copied when the
+        word has that attribute and is None otherwise.
+        """
+        return Word(
+            id=word.id,  # keep the original word's identity
+            text=self._clean_text(word.text),
+            start_time=word.start_time,
+            end_time=word.end_time,
+            confidence=getattr(word, "confidence", None),
+        )
+    def _split_oversized_segment(self, segment_idx: int, segment: LyricsSegment) -> List[LyricsSegment]:
+        """Break one over-long segment into several segments.
+        The segment text is whitespace-normalised, split into lines by
+        `_process_segment_text`, and the segment's words are then distributed
+        over those lines by `_create_segments_from_lines`.
+        Example:
+            Input: "This is a long sentence. Here's another one."
+            Output: [
+                LyricsSegment(text="This is a long sentence.", ...),
+                LyricsSegment(text="Here's another one.", ...)
+            ]
+        Args:
+            segment_idx: Position of the segment in the input list (used for logging only)
+            segment: The segment to split
+        Returns:
+            The segments that replace `segment`
+        """
+        cleaned = self._clean_text(segment.text)
+        self.logger.info(f"Processing oversized segment {segment_idx}: '{cleaned}'")
+        lines = self._process_segment_text(cleaned)
+        self.logger.debug(f"Split into {len(lines)} lines: {lines}")
+        return self._create_segments_from_lines(cleaned, lines, segment.words)
+    def _create_segments_from_lines(self, segment_text: str, split_lines: List[str], words: List[Word]) -> List[LyricsSegment]:
+        """Create segments from split lines while preserving word timing.
+        Words are consumed strictly in order. For each line, the next word is
+        assigned to it as long as its cleaned text occurs somewhere in the part
+        of the line not yet matched; the first word that does not occur ends the
+        line. Lines that receive no words produce no segment. Words left over
+        after the last line are gathered into one final segment.
+        Example:
+            segment_text: "Hello world, how are you"
+            split_lines: ["Hello world,", "how are you"]
+            words: [Word("Hello", 0.0, 1.0), Word("world", 1.0, 2.0), ...]
+        Args:
+            segment_text: Full cleaned text of the original segment (not used by the matching itself)
+            split_lines: Lines the segment text was split into, in order
+            words: Words of the original segment, in order; the list is not modified
+        Returns:
+            Segments with words assigned to each line.
+        """
+        segments: List[LyricsSegment] = []
+        # Index of the next unassigned word; avoids repeated O(n) pops from the list front
+        cursor = 0
+        total_words = len(words)
+        for line in split_lines:
+            line_words: List[Word] = []
+            remaining_line = line.strip()
+            # Keep taking words until the line is used up or the next word does not match
+            while cursor < total_words and remaining_line:
+                word = words[cursor]
+                word_clean = self._clean_text(word.text)
+                word_pos = remaining_line.find(word_clean)
+                if word_pos == -1:
+                    # Next word is not in what is left of this line: the line is done
+                    break
+                line_words.append(word)
+                cursor += 1
+                # Drop everything up to and including the word, plus surrounding spaces
+                remaining_line = remaining_line[word_pos + len(word_clean) :].strip()
+            if line_words:
+                segments.append(self._create_segment_from_words(line, line_words))
+        # If we have any remaining words, create a final segment with them
+        leftover_words = words[cursor:]
+        if leftover_words:
+            remaining_text = " ".join(self._clean_text(w.text) for w in leftover_words)
+            segments.append(self._create_segment_from_words(remaining_text, leftover_words))
+        return segments
+    def _create_line_segment(
+        self, line_idx: int, line: str, segment_text: str, available_words: List[Word], current_pos: int
+    ) -> Optional[LyricsSegment]:
+        """Build the segment for one line, or return None when that is not possible.
+        Args:
+            line_idx: Index of the line (not used in the body)
+            line: Text of the line to build a segment for
+            segment_text: Full segment text in which `line` is searched
+            available_words: Candidate words that may belong to the line
+            current_pos: Offset in `segment_text` from which the search for `line` starts
+        Returns:
+            A segment built from the line's words, or None when the line is not
+            found in `segment_text` or none of the words match it
+        """
+        found_at = segment_text.find(line, current_pos)
+        if found_at == -1:
+            self.logger.error(f"Failed to find line '{line}' in segment text '{segment_text}' " f"starting from position {current_pos}")
+            return None
+        matched = self._find_words_for_line(line, found_at, len(line), segment_text, available_words, current_pos)
+        if not matched:
+            self.logger.warning(f"No words found for line '{line}'")
+            return None
+        return self._create_segment_from_words(line, matched)
+    def _find_words_for_line(
+        self, line: str, line_pos: int, line_length: int, segment_text: str, available_words: List[Word], current_pos: int
+    ) -> List[Word]:
+        """Collect, in order, the words from ``available_words`` that appear in ``line``.
+        Matching is a plain substring search of each word's raw ``text`` against
+        the part of the (stripped) line that has not been consumed yet. Each hit
+        consumes the line up to and including the matched word. Words that do
+        not occur in the unconsumed text are skipped, and the scan stops as soon
+        as the line has been fully consumed.
+        ``line_pos``, ``line_length``, ``segment_text`` and ``current_pos`` are
+        accepted but not used by this implementation.
+        """
+        picked: List[Word] = []
+        pending = line.strip()
+        for candidate in available_words:
+            token = candidate.text
+            hit = pending.find(token)
+            if hit == -1:
+                # Word is not part of what is left of this line
+                continue
+            picked.append(candidate)
+            # Drop everything up to and including the matched word
+            pending = pending[hit + len(token) :].strip()
+            if not pending:
+                break
+        return picked
+    def _create_segment_from_words(self, line: str, words: List[Word]) -> LyricsSegment:
+        """Wrap ``words`` in a new LyricsSegment whose text is the cleaned ``line``.
+        The segment receives a freshly generated id, and its start and end times
+        come from the first and last word respectively. ``words`` must be
+        non-empty, because the first and last elements are indexed directly.
+        """
+        segment_text = self._clean_text(line)
+        # Split segments never reuse the id of the segment they came from
+        segment_id = WordUtils.generate_id()
+        starts_at = words[0].start_time
+        ends_at = words[-1].end_time
+        return LyricsSegment(
+            id=segment_id,
+            text=segment_text,
+            words=words,
+            start_time=starts_at,
+            end_time=ends_at,
+        )
+    def _process_segment_text(self, text: str) -> List[str]:
+        """Break ``text`` into a list of lines no longer than ``self.max_line_length`` where possible.
+        The stripped text is consumed from the front: while the remainder is too
+        long, a split index is requested from ``_find_best_split_point`` and the
+        part before it becomes the next line. If the proposed split is unusable
+        (index at the end of the text, an empty half, or a first half that is
+        still too long), the whole remainder is emitted as one line, even if it
+        exceeds the limit. Empty or whitespace-only input yields an empty list.
+        """
+        self.logger.debug(f"Processing segment text: '{text}'")
+        lines_out: List[str] = []
+        remaining_text = text.strip()
+        while remaining_text:
+            self.logger.debug(f"Remaining text to process: '{remaining_text}'")
+            if len(remaining_text) > self.max_line_length:
+                cut = self._find_best_split_point(remaining_text)
+                head = remaining_text[:cut].strip()
+                tail = remaining_text[cut:].strip()
+                # Accept the split only if it is a real one: inside the text,
+                # both halves non-empty, and the first half within the limit.
+                if cut < len(remaining_text) and head and tail and len(head) <= self.max_line_length:
+                    lines_out.append(head)
+                    remaining_text = tail
+                    continue
+            # Either the remainder already fits or it cannot be split sensibly:
+            # keep it whole and stop.
+            lines_out.append(remaining_text)
+            break
+        return lines_out
+    def _find_best_split_point(self, line: str) -> int:
+        """Return the index at which ``line`` should be split.
+        A line that already fits within ``self.max_line_length`` returns
+        ``len(line)``, meaning "do not split". Otherwise every candidate from
+        ``_find_break_points`` that lies strictly inside the line and leaves a
+        first part within the limit is rated by ``_score_break_point``. The
+        highest rating wins; on a tie the candidate seen first (higher priority
+        group, then smaller index) is kept.
+        When no candidate qualifies, the result is the index of the last space
+        found before position ``max_line_length``, or ``max_line_length`` itself
+        if there is no such space.
+        """
+        self.logger.debug(f"Finding best split point for line: '{line}' (length: {len(line)})")
+        total = len(line)
+        if total <= self.max_line_length:
+            return total
+        winner = None
+        top_rating = float("-inf")
+        for rank, group in enumerate(self._find_break_points(line)):
+            # Ascending order so that, within one priority, earlier points win ties
+            for cut in sorted(group):
+                if not 0 < cut < total:
+                    continue
+                if len(line[:cut].strip()) > self.max_line_length:
+                    # First part would still be too long
+                    continue
+                rating = self._score_break_point(line, cut, rank)
+                if rating > top_rating:
+                    winner, top_rating = cut, rating
+        if winner is not None:
+            return winner
+        # No usable break point: fall back to the last space before the limit,
+        # and to a hard cut at the limit when there is no space at all.
+        fallback = line.rfind(" ", 0, self.max_line_length)
+        return self.max_line_length if fallback == -1 else fallback
+    def _score_break_point(self, line: str, point: int, priority: int) -> float:
+        """Score a potential break point; a higher score means a better split.
+        The score is the sum of three components:
+        - Base score ``100 - 20 * priority``: 100 for priority 0, 80 for 1, etc.
+        - Balance bonus (0-10): ratio of the shorter to the longer trimmed part,
+          times 10. If both parts are empty the bonus is 0.
+        - Target length bonus (at most 5): largest when the trimmed first part
+          is 70% of ``self.max_line_length`` long, decreasing linearly with the
+          distance from that target.
+        Example:
+            line: "This is a sentence. And more text."
+            point: 19 (right after "sentence.")
+            priority: 0 (sentence break)
+        Assumes ``self.max_line_length`` is non-zero (it is used as a divisor).
+        """
+        first_len = len(line[:point].strip())
+        second_len = len(line[point:].strip())
+        # Base score starts with priority
+        score = 100 - (priority * 20)  # Priorities 0-4 give scores 100,80,60,40,20
+        # Balance bonus. When both halves are empty (e.g. a whitespace-only
+        # line) there is nothing to balance; use 0 rather than dividing by zero.
+        longer = max(first_len, second_len)
+        length_ratio = min(first_len, second_len) / longer if longer else 0.0
+        score += length_ratio * 10
+        # Target length bonus
+        target_length = self.max_line_length * 0.7
+        first_length_score = 1 - abs(first_len - target_length) / self.max_line_length
+        score += first_length_score * 5
+        return score
+    def _find_break_points(self, line: str) -> List[List[int]]:
+        """Collect candidate split indices in ``line``, grouped by preference.
+        Returns five lists, most preferred first. Each index is where the second
+        part of the split would start:
+        1. Sentence endings: index right after ".", "!" or "?" when followed by whitespace
+        2. Major clause breaks: index of ";" or of the space that opens " - "
+        3. Commas: index right after a "," that is followed by whitespace
+        4. Coordinating conjunctions: index of the space before " and ", " but ", " or "
+        5. Prepositions/articles: index of the space before " in ", " at ", " the ", " a "
+        Within a list, indices are grouped per token in the order listed above,
+        so a list is not necessarily sorted.
+        Example:
+            Input: "Hello, world. This is a test"
+            Output: [
+                [13],  # right after "world."
+                [],    # no semicolons or dashes
+                [6],   # right after "Hello,"
+                [],    # no conjunctions
+                [21],  # the space before "a"
+            ]
+        """
+        # Priority 1: sentence endings (split after the punctuation mark)
+        after_sentence = [found.start() + 1 for punct in (".", "!", "?") for found in re.finditer(rf"\{punct}\s+", line)]
+        # Priority 2: semicolons and spaced dashes (split before the token)
+        before_major = [found.start() for token in (";", " - ") for found in re.finditer(re.escape(token), line)]
+        # Priority 3: commas (split after the comma)
+        after_comma = [found.start() + 1 for found in re.finditer(r",\s+", line)]
+        # Priority 4: coordinating conjunctions (split before the conjunction)
+        before_conjunction = [found.start() for token in (" and ", " but ", " or ") for found in re.finditer(re.escape(token), line)]
+        # Priority 5: prepositions/articles, the last resort (split before the word)
+        before_minor = [found.start() for token in (" in ", " at ", " the ", " a ") for found in re.finditer(re.escape(token), line)]
+        return [after_sentence, before_major, after_comma, before_conjunction, before_minor]
+    def _log_input_segments(self, segments: List[LyricsSegment]) -> None:
+        """Log the number of incoming segments (info) and one summary line per segment (debug).
+        Each summary shows the segment's index, text, word count and
+        start/end times formatted to two decimals.
+        """
+        log = self.logger
+        log.info(f"Starting segment resize. Input: {len(segments)} segments")
+        for idx, segment in enumerate(segments):
+            summary = (
+                f"Input segment {idx}: text='{segment.text}', "
+                f"words={len(segment.words)} words, "
+                f"time={segment.start_time:.2f}-{segment.end_time:.2f}"
+            )
+            log.debug(summary)
+    def _log_output_segments(self, segments: List[LyricsSegment]) -> None:
+        """Log the number of resulting segments (info) and one summary line per segment (debug).
+        Each summary shows the segment's index, text, word count and
+        start/end times formatted to two decimals.
+        """
+        log = self.logger
+        log.info(f"Finished resizing. Output: {len(segments)} segments")
+        for idx, segment in enumerate(segments):
+            summary = (
+                f"Output segment {idx}: text='{segment.text}', "
+                f"words={len(segment.words)} words, "
+                f"time={segment.start_time:.2f}-{segment.end_time:.2f}"
+            )
+            log.debug(summary)

karaoke-gen 0.57.0__py3-none-any.whl → 0.71.27__py3-none-any.whl

karaoke-gen 0.57.0py3-none-any.whl → 0.71.27py3-none-any.whl