PyPI - lyrics-transcriber - Versions diffs - 0.30.1__py3-none-any.whl → 0.32.2__py3-none-any.whl - Mend

lyrics-transcriber 0.30.1py3-none-any.whl → 0.32.2py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (84) hide show

lyrics_transcriber/__init__.py +2 -1
lyrics_transcriber/cli/cli_main.py +33 -12
lyrics_transcriber/core/config.py +35 -0
lyrics_transcriber/core/controller.py +85 -121
lyrics_transcriber/correction/anchor_sequence.py +471 -0
lyrics_transcriber/correction/corrector.py +237 -33
lyrics_transcriber/correction/handlers/__init__.py +0 -0
lyrics_transcriber/correction/handlers/base.py +30 -0
lyrics_transcriber/correction/handlers/extend_anchor.py +91 -0
lyrics_transcriber/correction/handlers/levenshtein.py +147 -0
lyrics_transcriber/correction/handlers/no_space_punct_match.py +98 -0
lyrics_transcriber/correction/handlers/relaxed_word_count_match.py +55 -0
lyrics_transcriber/correction/handlers/repeat.py +71 -0
lyrics_transcriber/correction/handlers/sound_alike.py +223 -0
lyrics_transcriber/correction/handlers/syllables_match.py +182 -0
lyrics_transcriber/correction/handlers/word_count_match.py +54 -0
lyrics_transcriber/correction/handlers/word_operations.py +135 -0
lyrics_transcriber/correction/phrase_analyzer.py +426 -0
lyrics_transcriber/correction/text_utils.py +30 -0
lyrics_transcriber/lyrics/base_lyrics_provider.py +5 -81
lyrics_transcriber/lyrics/genius.py +5 -2
lyrics_transcriber/lyrics/spotify.py +3 -3
lyrics_transcriber/output/ass/__init__.py +21 -0
lyrics_transcriber/output/{ass.py → ass/ass.py} +150 -690
lyrics_transcriber/output/ass/ass_specs.txt +732 -0
lyrics_transcriber/output/ass/config.py +37 -0
lyrics_transcriber/output/ass/constants.py +23 -0
lyrics_transcriber/output/ass/event.py +94 -0
lyrics_transcriber/output/ass/formatters.py +132 -0
lyrics_transcriber/output/ass/lyrics_line.py +219 -0
lyrics_transcriber/output/ass/lyrics_screen.py +252 -0
lyrics_transcriber/output/ass/section_detector.py +89 -0
lyrics_transcriber/output/ass/section_screen.py +106 -0
lyrics_transcriber/output/ass/style.py +187 -0
lyrics_transcriber/output/cdg.py +503 -0
lyrics_transcriber/output/cdgmaker/__init__.py +0 -0
lyrics_transcriber/output/cdgmaker/cdg.py +262 -0
lyrics_transcriber/output/cdgmaker/composer.py +1919 -0
lyrics_transcriber/output/cdgmaker/config.py +151 -0
lyrics_transcriber/output/cdgmaker/images/instrumental.png +0 -0
lyrics_transcriber/output/cdgmaker/images/intro.png +0 -0
lyrics_transcriber/output/cdgmaker/pack.py +507 -0
lyrics_transcriber/output/cdgmaker/render.py +346 -0
lyrics_transcriber/output/cdgmaker/transitions/centertexttoplogobottomtext.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/circlein.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/circleout.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/fizzle.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/largecentertexttoplogo.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/rectangle.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/spiral.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/topleftmusicalnotes.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/wipein.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/wipeleft.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/wipeout.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/wiperight.png +0 -0
lyrics_transcriber/output/cdgmaker/utils.py +132 -0
lyrics_transcriber/output/fonts/AvenirNext-Bold.ttf +0 -0
lyrics_transcriber/output/fonts/DMSans-VariableFont_opsz,wght.ttf +0 -0
lyrics_transcriber/output/fonts/DMSerifDisplay-Regular.ttf +0 -0
lyrics_transcriber/output/fonts/Oswald-SemiBold.ttf +0 -0
lyrics_transcriber/output/fonts/Zurich_Cn_BT_Bold.ttf +0 -0
lyrics_transcriber/output/fonts/arial.ttf +0 -0
lyrics_transcriber/output/fonts/georgia.ttf +0 -0
lyrics_transcriber/output/fonts/verdana.ttf +0 -0
lyrics_transcriber/output/generator.py +101 -193
lyrics_transcriber/output/lyrics_file.py +102 -0
lyrics_transcriber/output/plain_text.py +91 -0
lyrics_transcriber/output/segment_resizer.py +416 -0
lyrics_transcriber/output/subtitles.py +328 -302
lyrics_transcriber/output/video.py +219 -0
lyrics_transcriber/review/__init__.py +1 -0
lyrics_transcriber/review/server.py +138 -0
lyrics_transcriber/transcribers/audioshake.py +3 -2
lyrics_transcriber/transcribers/base_transcriber.py +5 -42
lyrics_transcriber/transcribers/whisper.py +3 -4
lyrics_transcriber/types.py +454 -0
{lyrics_transcriber-0.30.1.dist-info → lyrics_transcriber-0.32.2.dist-info}/METADATA +14 -3
lyrics_transcriber-0.32.2.dist-info/RECORD +86 -0
{lyrics_transcriber-0.30.1.dist-info → lyrics_transcriber-0.32.2.dist-info}/WHEEL +1 -1
{lyrics_transcriber-0.30.1.dist-info → lyrics_transcriber-0.32.2.dist-info}/entry_points.txt +1 -0
lyrics_transcriber/correction/base_strategy.py +0 -29
lyrics_transcriber/correction/strategy_diff.py +0 -263
lyrics_transcriber-0.30.1.dist-info/RECORD +0 -25
{lyrics_transcriber-0.30.1.dist-info → lyrics_transcriber-0.32.2.dist-info}/LICENSE +0 -0

lyrics_transcriber/output/segment_resizer.py ADDED Viewed

@@ -0,0 +1,416 @@
+import logging
+import re
+from typing import List, Optional, Tuple
+from lyrics_transcriber.types import LyricsSegment, Word
+class SegmentResizer:
+    """Handles resizing of lyrics segments to ensure proper line lengths and natural breaks.
+    This class processes lyrics segments and splits them into smaller segments when they exceed
+    a maximum line length. It attempts to split at natural break points like sentence endings,
+    commas, or conjunctions to maintain readability.
+    Example:
+        resizer = SegmentResizer(max_line_length=36)
+        segments = [
+            LyricsSegment(
+                text="This is a very long sentence that needs to be split into multiple lines for better readability",
+                words=[...],  # List of Word objects with timing information
+                start_time=0.0,
+                end_time=5.0
+            )
+        ]
+        resized = resizer.resize_segments(segments)
+        # Results in:
+        # [
+        #     LyricsSegment(text="This is a very long sentence", ...),
+        #     LyricsSegment(text="that needs to be split", ...),
+        #     LyricsSegment(text="into multiple lines", ...),
+        #     LyricsSegment(text="for better readability", ...)
+        # ]
+    """
+    def __init__(self, max_line_length: int = 36, logger: Optional[logging.Logger] = None):
+        """Initialize the SegmentResizer.
+        Args:
+            max_line_length: Maximum allowed length for a single line of text
+            logger: Optional logger for debugging information
+        """
+        self.max_line_length = max_line_length
+        self.logger = logger or logging.getLogger(__name__)
+    def resize_segments(self, segments: List[LyricsSegment]) -> List[LyricsSegment]:
+        """Main entry point for resizing segments.
+        Takes a list of potentially long segments and splits them into smaller ones
+        while preserving word timing information.
+        Example:
+            Input segment: "Hello world, this is a test. And here's another sentence."
+            Output segments: [
+                "Hello world, this is a test.",
+                "And here's another sentence."
+            ]
+        Args:
+            segments: List of LyricsSegment objects to process
+        Returns:
+            List of resized LyricsSegment objects
+        """
+        self._log_input_segments(segments)
+        resized_segments: List[LyricsSegment] = []
+        for segment_idx, segment in enumerate(segments):
+            cleaned_segment = self._create_cleaned_segment(segment)
+            # Only split if the segment is longer than max_line_length
+            if len(cleaned_segment.text) <= self.max_line_length:
+                resized_segments.append(cleaned_segment)
+                continue
+            # Process oversized segments
+            resized_segments.extend(self._split_oversized_segment(segment_idx, segment))
+        self._log_output_segments(resized_segments)
+        return resized_segments
+    def _clean_text(self, text: str) -> str:
+        """Clean text by removing newlines and extra whitespace.
+        Example:
+            Input: "Hello\n  World  \n!"
+            Output: "Hello World !"
+        Args:
+            text: String to clean
+        Returns:
+            Cleaned string with normalized whitespace
+        """
+        return " ".join(text.replace("\n", " ").split())
+    def _create_cleaned_segment(self, segment: LyricsSegment) -> LyricsSegment:
+        """Create a new segment with cleaned text while preserving timing info.
+        Example:
+            Input: LyricsSegment(text="Hello\n  World\n", words=[...])
+            Output: LyricsSegment(text="Hello World", words=[...])
+        """
+        cleaned_text = self._clean_text(segment.text)
+        return LyricsSegment(text=cleaned_text, words=segment.words, start_time=segment.start_time, end_time=segment.end_time)
+    def _create_cleaned_word(self, word: Word) -> Word:
+        """Create a new word with cleaned text."""
+        cleaned_text = self._clean_text(word.text)
+        return Word(
+            text=cleaned_text,
+            start_time=word.start_time,
+            end_time=word.end_time,
+            confidence=word.confidence if hasattr(word, "confidence") else None,
+        )
+    def _split_oversized_segment(self, segment_idx: int, segment: LyricsSegment) -> List[LyricsSegment]:
+        """Split an oversized segment into multiple segments at natural break points.
+        Example:
+            Input: "This is a long sentence. Here's another one."
+            Output: [
+                LyricsSegment(text="This is a long sentence.", ...),
+                LyricsSegment(text="Here's another one.", ...)
+            ]
+        """
+        self.logger.info(f"Processing oversized segment {segment_idx}: '{segment.text}'")
+        segment_text = self._clean_text(segment.text)
+        split_lines = self._process_segment_text(segment_text)
+        self.logger.debug(f"Split into {len(split_lines)} lines: {split_lines}")
+        return self._create_segments_from_lines(segment_text, split_lines, segment.words)
+    def _create_segments_from_lines(self, segment_text: str, split_lines: List[str], words: List[Word]) -> List[LyricsSegment]:
+        """Create segments from split lines while preserving word timing.
+        Matches words to their corresponding lines based on text position and
+        creates new segments with the correct timing information.
+        Example:
+            segment_text: "Hello world, how are you"
+            split_lines: ["Hello world,", "how are you"]
+            words: [Word("Hello", 0.0, 1.0), Word("world", 1.0, 2.0), ...]
+        Returns segments with words properly assigned to each line.
+        """
+        segments: List[LyricsSegment] = []
+        words_to_process = words.copy()
+        current_pos = 0
+        for line in split_lines:
+            line_words = []
+            line_text = line.strip()
+            remaining_line = line_text
+            # Keep processing words until we've found all words for this line
+            while words_to_process and remaining_line:
+                word = words_to_process[0]
+                word_clean = self._clean_text(word.text)
+                # Check if the cleaned word appears in the remaining line text
+                if word_clean in remaining_line:
+                    word_pos = remaining_line.find(word_clean)
+                    if word_pos != -1:
+                        line_words.append(words_to_process.pop(0))
+                        # Remove the word and any following spaces from remaining line
+                        remaining_line = remaining_line[word_pos + len(word_clean):].strip()
+                        continue
+                # If we can't find the word in the remaining line, we're done with this line
+                break
+            if line_words:
+                segments.append(self._create_segment_from_words(line, line_words))
+                current_pos += len(line) + 1  # +1 for the space between lines
+        # If we have any remaining words, create a final segment with them
+        if words_to_process:
+            remaining_text = " ".join(self._clean_text(w.text) for w in words_to_process)
+            segments.append(self._create_segment_from_words(remaining_text, words_to_process))
+        return segments
+    def _create_line_segment(
+        self, line_idx: int, line: str, segment_text: str, available_words: List[Word], current_pos: int
+    ) -> Optional[LyricsSegment]:
+        """Create a single segment from a line of text."""
+        line_pos = segment_text.find(line, current_pos)
+        if line_pos == -1:
+            self.logger.error(f"Failed to find line '{line}' in segment text '{segment_text}' " f"starting from position {current_pos}")
+            return None
+        line_words = self._find_words_for_line(line, line_pos, len(line), segment_text, available_words, current_pos)
+        if line_words:
+            return self._create_segment_from_words(line, line_words)
+        else:
+            self.logger.warning(f"No words found for line '{line}'")
+            return None
+    def _find_words_for_line(
+        self, line: str, line_pos: int, line_length: int, segment_text: str, available_words: List[Word], current_pos: int
+    ) -> List[Word]:
+        """Find words that belong to a specific line."""
+        line_words = []
+        line_text = line.strip()
+        remaining_text = line_text
+        for word in available_words:
+            # Skip if word isn't in remaining text
+            if word.text not in remaining_text:
+                continue
+            # Find position of word in line
+            word_pos = remaining_text.find(word.text)
+            if word_pos != -1:
+                line_words.append(word)
+                # Remove processed text up to and including this word
+                remaining_text = remaining_text[word_pos + len(word.text) :].strip()
+            if not remaining_text:  # All words found
+                break
+        return line_words
+    def _create_segment_from_words(self, line: str, words: List[Word]) -> LyricsSegment:
+        """Create a new segment from a list of words."""
+        cleaned_text = self._clean_text(line)
+        return LyricsSegment(text=cleaned_text, words=words, start_time=words[0].start_time, end_time=words[-1].end_time)
+    def _process_segment_text(self, text: str) -> List[str]:
+        """Process segment text to determine optimal split points."""
+        self.logger.debug(f"Processing segment text: '{text}'")
+        processed_lines: List[str] = []
+        remaining_text = text.strip()
+        while remaining_text:
+            self.logger.debug(f"Remaining text to process: '{remaining_text}'")
+            # If remaining text is within limit, add it and we're done
+            if len(remaining_text) <= self.max_line_length:
+                processed_lines.append(remaining_text)
+                break
+            # Find best split point
+            split_point = self._find_best_split_point(remaining_text)
+            first_part = remaining_text[:split_point].strip()
+            second_part = remaining_text[split_point:].strip()
+            # Only split if:
+            # 1. We found a valid split point
+            # 2. First part isn't too long
+            # 3. Both parts are non-empty
+            if split_point < len(remaining_text) and len(first_part) <= self.max_line_length and first_part and second_part:
+                processed_lines.append(first_part)
+                remaining_text = second_part
+            else:
+                # If we can't find a good split, keep the whole text
+                processed_lines.append(remaining_text)
+                break
+        return processed_lines
+    def _find_best_split_point(self, line: str) -> int:
+        """Find the best split point that creates natural, well-balanced segments."""
+        self.logger.debug(f"Finding best split point for line: '{line}' (length: {len(line)})")
+        # If line is within max length, don't split
+        if len(line) <= self.max_line_length:
+            return len(line)
+        break_points = self._find_break_points(line)
+        best_point = None
+        best_score = float("-inf")
+        # Try each break point and score it
+        for priority, points in enumerate(break_points):
+            for point in sorted(points):  # Sort points to prefer earlier ones in same priority
+                if point <= 0 or point >= len(line):
+                    continue
+                first_part = line[:point].strip()
+                # Skip if first part is too long
+                if len(first_part) > self.max_line_length:
+                    continue
+                # Score this break point
+                score = self._score_break_point(line, point, priority)
+                if score > best_score:
+                    best_score = score
+                    best_point = point
+        # If no good break points found, fall back to last space before max_length
+        if best_point is None:
+            last_space = line.rfind(" ", 0, self.max_line_length)
+            if last_space != -1:
+                return last_space
+        return best_point if best_point is not None else self.max_line_length
+    def _score_break_point(self, line: str, point: int, priority: int) -> float:
+        """Score a potential break point based on multiple factors.
+        Factors considered:
+        1. Priority of the break point type (sentence > clause > comma, etc.)
+        2. Balance of segment lengths
+        3. Proximity to target length
+        Example:
+            line: "This is a sentence. And more text."
+            point: 18 (after "sentence.")
+            priority: 0 (sentence break)
+        Returns a score where higher is better. Score components:
+        - Base score (100-20*priority): 100 for priority 0
+        - Length ratio bonus (0-10): Based on segment balance
+        - Target length bonus (0-5): Based on proximity to ideal length
+        """
+        first_segment = line[:point].strip()
+        second_segment = line[point:].strip()
+        # Base score starts with priority
+        score = 100 - (priority * 20)  # Priorities 0-4 give scores 100,80,60,40,20
+        # Length ratio bonus
+        length_ratio = min(len(first_segment), len(second_segment)) / max(len(first_segment), len(second_segment))
+        score += length_ratio * 10
+        # Target length bonus
+        target_length = self.max_line_length * 0.7
+        first_length_score = 1 - abs(len(first_segment) - target_length) / self.max_line_length
+        score += first_length_score * 5
+        return score
+    def _find_break_points(self, line: str) -> List[List[int]]:
+        """Find potential break points in order of preference.
+        Returns a list of lists, where each inner list contains break points
+        of the same priority. Break points are indices where text should be split.
+        Priority order:
+        1. Sentence endings (., !, ?)
+        2. Major clause breaks (;, -)
+        3. Comma breaks
+        4. Coordinating conjunctions (and, but, or)
+        5. Prepositions/articles (in, at, the, a)
+        Example:
+            Input: "Hello, world. This is a test"
+            Output: [
+                [12],  # sentence break after "world."
+                [],   # no semicolons or dashes
+                [5],  # comma after "Hello,"
+                [],   # no conjunctions
+                [15]  # preposition "is"
+            ]
+        """
+        break_points = []
+        # Priority 1: Sentence endings
+        sentence_breaks = []
+        for punct in [".", "!", "?"]:
+            for match in re.finditer(rf"\{punct}\s+", line):
+                sentence_breaks.append(match.start() + 1)
+        break_points.append(sentence_breaks)
+        # Priority 2: Major clause breaks (semicolons, dashes)
+        major_breaks = []
+        for punct in [";", " - "]:
+            for match in re.finditer(re.escape(punct), line):
+                major_breaks.append(match.start())  # Position before the punctuation
+        break_points.append(major_breaks)
+        # Priority 3: Comma breaks, typically marking natural pauses
+        comma_breaks = []
+        for match in re.finditer(r",\s+", line):
+            comma_breaks.append(match.start() + 1)  # Position after the comma
+        break_points.append(comma_breaks)
+        # Priority 4: Coordinating conjunctions with surrounding spaces
+        conjunction_breaks = []
+        for conj in [" and ", " but ", " or "]:
+            for match in re.finditer(re.escape(conj), line):
+                conjunction_breaks.append(match.start())  # Position before the conjunction
+        break_points.append(conjunction_breaks)
+        # Priority 5: Prepositions or articles with surrounding spaces (last resort)
+        minor_breaks = []
+        for prep in [" in ", " at ", " the ", " a "]:
+            for match in re.finditer(re.escape(prep), line):
+                minor_breaks.append(match.start())  # Position before the preposition
+        break_points.append(minor_breaks)
+        return break_points
+    def _log_input_segments(self, segments: List[LyricsSegment]) -> None:
+        """Log input segment information."""
+        self.logger.info(f"Starting segment resize. Input: {len(segments)} segments")
+        for idx, segment in enumerate(segments):
+            self.logger.debug(
+                f"Input segment {idx}: text='{segment.text}', "
+                f"words={len(segment.words)} words, "
+                f"time={segment.start_time:.2f}-{segment.end_time:.2f}"
+            )
+    def _log_output_segments(self, segments: List[LyricsSegment]) -> None:
+        """Log output segment information."""
+        self.logger.info(f"Finished resizing. Output: {len(segments)} segments")
+        for idx, segment in enumerate(segments):
+            self.logger.debug(
+                f"Output segment {idx}: text='{segment.text}', "
+                f"words={len(segment.words)} words, "
+                f"time={segment.start_time:.2f}-{segment.end_time:.2f}"
+            )

lyrics-transcriber 0.30.1__py3-none-any.whl → 0.32.2__py3-none-any.whl

lyrics-transcriber 0.30.1py3-none-any.whl → 0.32.2py3-none-any.whl