PyPI - karaoke-gen - Versions diffs - 0.75.54__py3-none-any.whl - Mend

karaoke-gen 0.75.54__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of karaoke-gen might be problematic. Click here for more details.

Files changed (287) hide show

karaoke_gen/__init__.py +38 -0
karaoke_gen/audio_fetcher.py +1614 -0
karaoke_gen/audio_processor.py +790 -0
karaoke_gen/config.py +83 -0
karaoke_gen/file_handler.py +387 -0
karaoke_gen/instrumental_review/__init__.py +45 -0
karaoke_gen/instrumental_review/analyzer.py +408 -0
karaoke_gen/instrumental_review/editor.py +322 -0
karaoke_gen/instrumental_review/models.py +171 -0
karaoke_gen/instrumental_review/server.py +475 -0
karaoke_gen/instrumental_review/static/index.html +1529 -0
karaoke_gen/instrumental_review/waveform.py +409 -0
karaoke_gen/karaoke_finalise/__init__.py +1 -0
karaoke_gen/karaoke_finalise/karaoke_finalise.py +1833 -0
karaoke_gen/karaoke_gen.py +1026 -0
karaoke_gen/lyrics_processor.py +474 -0
karaoke_gen/metadata.py +160 -0
karaoke_gen/pipeline/__init__.py +87 -0
karaoke_gen/pipeline/base.py +215 -0
karaoke_gen/pipeline/context.py +230 -0
karaoke_gen/pipeline/executors/__init__.py +21 -0
karaoke_gen/pipeline/executors/local.py +159 -0
karaoke_gen/pipeline/executors/remote.py +257 -0
karaoke_gen/pipeline/stages/__init__.py +27 -0
karaoke_gen/pipeline/stages/finalize.py +202 -0
karaoke_gen/pipeline/stages/render.py +165 -0
karaoke_gen/pipeline/stages/screens.py +139 -0
karaoke_gen/pipeline/stages/separation.py +191 -0
karaoke_gen/pipeline/stages/transcription.py +191 -0
karaoke_gen/resources/AvenirNext-Bold.ttf +0 -0
karaoke_gen/resources/Montserrat-Bold.ttf +0 -0
karaoke_gen/resources/Oswald-Bold.ttf +0 -0
karaoke_gen/resources/Oswald-SemiBold.ttf +0 -0
karaoke_gen/resources/Zurich_Cn_BT_Bold.ttf +0 -0
karaoke_gen/style_loader.py +531 -0
karaoke_gen/utils/__init__.py +18 -0
karaoke_gen/utils/bulk_cli.py +492 -0
karaoke_gen/utils/cli_args.py +432 -0
karaoke_gen/utils/gen_cli.py +978 -0
karaoke_gen/utils/remote_cli.py +3268 -0
karaoke_gen/video_background_processor.py +351 -0
karaoke_gen/video_generator.py +424 -0
karaoke_gen-0.75.54.dist-info/METADATA +718 -0
karaoke_gen-0.75.54.dist-info/RECORD +287 -0
karaoke_gen-0.75.54.dist-info/WHEEL +4 -0
karaoke_gen-0.75.54.dist-info/entry_points.txt +5 -0
karaoke_gen-0.75.54.dist-info/licenses/LICENSE +21 -0
lyrics_transcriber/__init__.py +10 -0
lyrics_transcriber/cli/__init__.py +0 -0
lyrics_transcriber/cli/cli_main.py +285 -0
lyrics_transcriber/core/__init__.py +0 -0
lyrics_transcriber/core/config.py +50 -0
lyrics_transcriber/core/controller.py +594 -0
lyrics_transcriber/correction/__init__.py +0 -0
lyrics_transcriber/correction/agentic/__init__.py +9 -0
lyrics_transcriber/correction/agentic/adapter.py +71 -0
lyrics_transcriber/correction/agentic/agent.py +313 -0
lyrics_transcriber/correction/agentic/feedback/aggregator.py +12 -0
lyrics_transcriber/correction/agentic/feedback/collector.py +17 -0
lyrics_transcriber/correction/agentic/feedback/retention.py +24 -0
lyrics_transcriber/correction/agentic/feedback/store.py +76 -0
lyrics_transcriber/correction/agentic/handlers/__init__.py +24 -0
lyrics_transcriber/correction/agentic/handlers/ambiguous.py +44 -0
lyrics_transcriber/correction/agentic/handlers/background_vocals.py +68 -0
lyrics_transcriber/correction/agentic/handlers/base.py +51 -0
lyrics_transcriber/correction/agentic/handlers/complex_multi_error.py +46 -0
lyrics_transcriber/correction/agentic/handlers/extra_words.py +74 -0
lyrics_transcriber/correction/agentic/handlers/no_error.py +42 -0
lyrics_transcriber/correction/agentic/handlers/punctuation.py +44 -0
lyrics_transcriber/correction/agentic/handlers/registry.py +60 -0
lyrics_transcriber/correction/agentic/handlers/repeated_section.py +44 -0
lyrics_transcriber/correction/agentic/handlers/sound_alike.py +126 -0
lyrics_transcriber/correction/agentic/models/__init__.py +5 -0
lyrics_transcriber/correction/agentic/models/ai_correction.py +31 -0
lyrics_transcriber/correction/agentic/models/correction_session.py +30 -0
lyrics_transcriber/correction/agentic/models/enums.py +38 -0
lyrics_transcriber/correction/agentic/models/human_feedback.py +30 -0
lyrics_transcriber/correction/agentic/models/learning_data.py +26 -0
lyrics_transcriber/correction/agentic/models/observability_metrics.py +28 -0
lyrics_transcriber/correction/agentic/models/schemas.py +46 -0
lyrics_transcriber/correction/agentic/models/utils.py +19 -0
lyrics_transcriber/correction/agentic/observability/__init__.py +5 -0
lyrics_transcriber/correction/agentic/observability/langfuse_integration.py +35 -0
lyrics_transcriber/correction/agentic/observability/metrics.py +46 -0
lyrics_transcriber/correction/agentic/observability/performance.py +19 -0
lyrics_transcriber/correction/agentic/prompts/__init__.py +2 -0
lyrics_transcriber/correction/agentic/prompts/classifier.py +227 -0
lyrics_transcriber/correction/agentic/providers/__init__.py +6 -0
lyrics_transcriber/correction/agentic/providers/base.py +36 -0
lyrics_transcriber/correction/agentic/providers/circuit_breaker.py +145 -0
lyrics_transcriber/correction/agentic/providers/config.py +73 -0
lyrics_transcriber/correction/agentic/providers/constants.py +24 -0
lyrics_transcriber/correction/agentic/providers/health.py +28 -0
lyrics_transcriber/correction/agentic/providers/langchain_bridge.py +212 -0
lyrics_transcriber/correction/agentic/providers/model_factory.py +209 -0
lyrics_transcriber/correction/agentic/providers/response_cache.py +218 -0
lyrics_transcriber/correction/agentic/providers/response_parser.py +111 -0
lyrics_transcriber/correction/agentic/providers/retry_executor.py +127 -0
lyrics_transcriber/correction/agentic/router.py +35 -0
lyrics_transcriber/correction/agentic/workflows/__init__.py +5 -0
lyrics_transcriber/correction/agentic/workflows/consensus_workflow.py +24 -0
lyrics_transcriber/correction/agentic/workflows/correction_graph.py +59 -0
lyrics_transcriber/correction/agentic/workflows/feedback_workflow.py +24 -0
lyrics_transcriber/correction/anchor_sequence.py +919 -0
lyrics_transcriber/correction/corrector.py +760 -0
lyrics_transcriber/correction/feedback/__init__.py +2 -0
lyrics_transcriber/correction/feedback/schemas.py +107 -0
lyrics_transcriber/correction/feedback/store.py +236 -0
lyrics_transcriber/correction/handlers/__init__.py +0 -0
lyrics_transcriber/correction/handlers/base.py +52 -0
lyrics_transcriber/correction/handlers/extend_anchor.py +149 -0
lyrics_transcriber/correction/handlers/levenshtein.py +189 -0
lyrics_transcriber/correction/handlers/llm.py +293 -0
lyrics_transcriber/correction/handlers/llm_providers.py +60 -0
lyrics_transcriber/correction/handlers/no_space_punct_match.py +154 -0
lyrics_transcriber/correction/handlers/relaxed_word_count_match.py +85 -0
lyrics_transcriber/correction/handlers/repeat.py +88 -0
lyrics_transcriber/correction/handlers/sound_alike.py +259 -0
lyrics_transcriber/correction/handlers/syllables_match.py +252 -0
lyrics_transcriber/correction/handlers/word_count_match.py +80 -0
lyrics_transcriber/correction/handlers/word_operations.py +187 -0
lyrics_transcriber/correction/operations.py +352 -0
lyrics_transcriber/correction/phrase_analyzer.py +435 -0
lyrics_transcriber/correction/text_utils.py +30 -0
lyrics_transcriber/frontend/.gitignore +23 -0
lyrics_transcriber/frontend/.yarn/releases/yarn-4.7.0.cjs +935 -0
lyrics_transcriber/frontend/.yarnrc.yml +3 -0
lyrics_transcriber/frontend/README.md +50 -0
lyrics_transcriber/frontend/REPLACE_ALL_FUNCTIONALITY.md +210 -0
lyrics_transcriber/frontend/__init__.py +25 -0
lyrics_transcriber/frontend/eslint.config.js +28 -0
lyrics_transcriber/frontend/index.html +18 -0
lyrics_transcriber/frontend/package.json +42 -0
lyrics_transcriber/frontend/public/android-chrome-192x192.png +0 -0
lyrics_transcriber/frontend/public/android-chrome-512x512.png +0 -0
lyrics_transcriber/frontend/public/apple-touch-icon.png +0 -0
lyrics_transcriber/frontend/public/favicon-16x16.png +0 -0
lyrics_transcriber/frontend/public/favicon-32x32.png +0 -0
lyrics_transcriber/frontend/public/favicon.ico +0 -0
lyrics_transcriber/frontend/public/nomad-karaoke-logo.png +0 -0
lyrics_transcriber/frontend/src/App.tsx +214 -0
lyrics_transcriber/frontend/src/api.ts +254 -0
lyrics_transcriber/frontend/src/components/AIFeedbackModal.tsx +77 -0
lyrics_transcriber/frontend/src/components/AddLyricsModal.tsx +114 -0
lyrics_transcriber/frontend/src/components/AgenticCorrectionMetrics.tsx +204 -0
lyrics_transcriber/frontend/src/components/AudioPlayer.tsx +180 -0
lyrics_transcriber/frontend/src/components/CorrectedWordWithActions.tsx +167 -0
lyrics_transcriber/frontend/src/components/CorrectionAnnotationModal.tsx +359 -0
lyrics_transcriber/frontend/src/components/CorrectionDetailCard.tsx +281 -0
lyrics_transcriber/frontend/src/components/CorrectionMetrics.tsx +162 -0
lyrics_transcriber/frontend/src/components/DurationTimelineView.tsx +257 -0
lyrics_transcriber/frontend/src/components/EditActionBar.tsx +68 -0
lyrics_transcriber/frontend/src/components/EditModal.tsx +702 -0
lyrics_transcriber/frontend/src/components/EditTimelineSection.tsx +496 -0
lyrics_transcriber/frontend/src/components/EditWordList.tsx +379 -0
lyrics_transcriber/frontend/src/components/FileUpload.tsx +77 -0
lyrics_transcriber/frontend/src/components/FindReplaceModal.tsx +467 -0
lyrics_transcriber/frontend/src/components/Header.tsx +413 -0
lyrics_transcriber/frontend/src/components/LyricsAnalyzer.tsx +1387 -0
lyrics_transcriber/frontend/src/components/LyricsSynchronizer/SyncControls.tsx +185 -0
lyrics_transcriber/frontend/src/components/LyricsSynchronizer/TimelineCanvas.tsx +704 -0
lyrics_transcriber/frontend/src/components/LyricsSynchronizer/UpcomingWordsBar.tsx +80 -0
lyrics_transcriber/frontend/src/components/LyricsSynchronizer/index.tsx +905 -0
lyrics_transcriber/frontend/src/components/MetricsDashboard.tsx +51 -0
lyrics_transcriber/frontend/src/components/ModeSelectionModal.tsx +127 -0
lyrics_transcriber/frontend/src/components/ModeSelector.tsx +67 -0
lyrics_transcriber/frontend/src/components/ModelSelector.tsx +23 -0
lyrics_transcriber/frontend/src/components/PreviewVideoSection.tsx +144 -0
lyrics_transcriber/frontend/src/components/ReferenceView.tsx +268 -0
lyrics_transcriber/frontend/src/components/ReplaceAllLyricsModal.tsx +336 -0
lyrics_transcriber/frontend/src/components/ReviewChangesModal.tsx +354 -0
lyrics_transcriber/frontend/src/components/SegmentDetailsModal.tsx +64 -0
lyrics_transcriber/frontend/src/components/TimelineEditor.tsx +376 -0
lyrics_transcriber/frontend/src/components/TimingOffsetModal.tsx +131 -0
lyrics_transcriber/frontend/src/components/TranscriptionView.tsx +256 -0
lyrics_transcriber/frontend/src/components/WordDivider.tsx +187 -0
lyrics_transcriber/frontend/src/components/shared/components/HighlightedText.tsx +379 -0
lyrics_transcriber/frontend/src/components/shared/components/SourceSelector.tsx +56 -0
lyrics_transcriber/frontend/src/components/shared/components/Word.tsx +87 -0
lyrics_transcriber/frontend/src/components/shared/constants.ts +20 -0
lyrics_transcriber/frontend/src/components/shared/hooks/useWordClick.ts +180 -0
lyrics_transcriber/frontend/src/components/shared/styles.ts +13 -0
lyrics_transcriber/frontend/src/components/shared/types.js +2 -0
lyrics_transcriber/frontend/src/components/shared/types.ts +129 -0
lyrics_transcriber/frontend/src/components/shared/utils/keyboardHandlers.ts +177 -0
lyrics_transcriber/frontend/src/components/shared/utils/localStorage.ts +78 -0
lyrics_transcriber/frontend/src/components/shared/utils/referenceLineCalculator.ts +75 -0
lyrics_transcriber/frontend/src/components/shared/utils/segmentOperations.ts +360 -0
lyrics_transcriber/frontend/src/components/shared/utils/timingUtils.ts +110 -0
lyrics_transcriber/frontend/src/components/shared/utils/wordUtils.ts +22 -0
lyrics_transcriber/frontend/src/hooks/useManualSync.ts +435 -0
lyrics_transcriber/frontend/src/main.tsx +17 -0
lyrics_transcriber/frontend/src/theme.ts +177 -0
lyrics_transcriber/frontend/src/types/global.d.ts +9 -0
lyrics_transcriber/frontend/src/types.js +2 -0
lyrics_transcriber/frontend/src/types.ts +199 -0
lyrics_transcriber/frontend/src/validation.ts +132 -0
lyrics_transcriber/frontend/src/vite-env.d.ts +1 -0
lyrics_transcriber/frontend/tsconfig.app.json +26 -0
lyrics_transcriber/frontend/tsconfig.json +25 -0
lyrics_transcriber/frontend/tsconfig.node.json +23 -0
lyrics_transcriber/frontend/tsconfig.tsbuildinfo +1 -0
lyrics_transcriber/frontend/update_version.js +11 -0
lyrics_transcriber/frontend/vite.config.d.ts +2 -0
lyrics_transcriber/frontend/vite.config.js +10 -0
lyrics_transcriber/frontend/vite.config.ts +11 -0
lyrics_transcriber/frontend/web_assets/android-chrome-192x192.png +0 -0
lyrics_transcriber/frontend/web_assets/android-chrome-512x512.png +0 -0
lyrics_transcriber/frontend/web_assets/apple-touch-icon.png +0 -0
lyrics_transcriber/frontend/web_assets/assets/index-BECn1o8Q.js +43288 -0
lyrics_transcriber/frontend/web_assets/assets/index-BECn1o8Q.js.map +1 -0
lyrics_transcriber/frontend/web_assets/favicon-16x16.png +0 -0
lyrics_transcriber/frontend/web_assets/favicon-32x32.png +0 -0
lyrics_transcriber/frontend/web_assets/favicon.ico +0 -0
lyrics_transcriber/frontend/web_assets/index.html +18 -0
lyrics_transcriber/frontend/web_assets/nomad-karaoke-logo.png +0 -0
lyrics_transcriber/frontend/yarn.lock +3752 -0
lyrics_transcriber/lyrics/__init__.py +0 -0
lyrics_transcriber/lyrics/base_lyrics_provider.py +211 -0
lyrics_transcriber/lyrics/file_provider.py +95 -0
lyrics_transcriber/lyrics/genius.py +384 -0
lyrics_transcriber/lyrics/lrclib.py +231 -0
lyrics_transcriber/lyrics/musixmatch.py +156 -0
lyrics_transcriber/lyrics/spotify.py +290 -0
lyrics_transcriber/lyrics/user_input_provider.py +44 -0
lyrics_transcriber/output/__init__.py +0 -0
lyrics_transcriber/output/ass/__init__.py +21 -0
lyrics_transcriber/output/ass/ass.py +2088 -0
lyrics_transcriber/output/ass/ass_specs.txt +732 -0
lyrics_transcriber/output/ass/config.py +180 -0
lyrics_transcriber/output/ass/constants.py +23 -0
lyrics_transcriber/output/ass/event.py +94 -0
lyrics_transcriber/output/ass/formatters.py +132 -0
lyrics_transcriber/output/ass/lyrics_line.py +265 -0
lyrics_transcriber/output/ass/lyrics_screen.py +252 -0
lyrics_transcriber/output/ass/section_detector.py +89 -0
lyrics_transcriber/output/ass/section_screen.py +106 -0
lyrics_transcriber/output/ass/style.py +187 -0
lyrics_transcriber/output/cdg.py +619 -0
lyrics_transcriber/output/cdgmaker/__init__.py +0 -0
lyrics_transcriber/output/cdgmaker/cdg.py +262 -0
lyrics_transcriber/output/cdgmaker/composer.py +2260 -0
lyrics_transcriber/output/cdgmaker/config.py +151 -0
lyrics_transcriber/output/cdgmaker/images/instrumental.png +0 -0
lyrics_transcriber/output/cdgmaker/images/intro.png +0 -0
lyrics_transcriber/output/cdgmaker/pack.py +507 -0
lyrics_transcriber/output/cdgmaker/render.py +346 -0
lyrics_transcriber/output/cdgmaker/transitions/centertexttoplogobottomtext.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/circlein.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/circleout.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/fizzle.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/largecentertexttoplogo.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/rectangle.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/spiral.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/topleftmusicalnotes.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/wipein.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/wipeleft.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/wipeout.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/wiperight.png +0 -0
lyrics_transcriber/output/cdgmaker/utils.py +132 -0
lyrics_transcriber/output/countdown_processor.py +306 -0
lyrics_transcriber/output/fonts/AvenirNext-Bold.ttf +0 -0
lyrics_transcriber/output/fonts/DMSans-VariableFont_opsz,wght.ttf +0 -0
lyrics_transcriber/output/fonts/DMSerifDisplay-Regular.ttf +0 -0
lyrics_transcriber/output/fonts/Oswald-SemiBold.ttf +0 -0
lyrics_transcriber/output/fonts/Zurich_Cn_BT_Bold.ttf +0 -0
lyrics_transcriber/output/fonts/arial.ttf +0 -0
lyrics_transcriber/output/fonts/georgia.ttf +0 -0
lyrics_transcriber/output/fonts/verdana.ttf +0 -0
lyrics_transcriber/output/generator.py +257 -0
lyrics_transcriber/output/lrc_to_cdg.py +61 -0
lyrics_transcriber/output/lyrics_file.py +102 -0
lyrics_transcriber/output/plain_text.py +96 -0
lyrics_transcriber/output/segment_resizer.py +431 -0
lyrics_transcriber/output/subtitles.py +397 -0
lyrics_transcriber/output/video.py +544 -0
lyrics_transcriber/review/__init__.py +0 -0
lyrics_transcriber/review/server.py +676 -0
lyrics_transcriber/storage/__init__.py +0 -0
lyrics_transcriber/storage/dropbox.py +225 -0
lyrics_transcriber/transcribers/__init__.py +0 -0
lyrics_transcriber/transcribers/audioshake.py +379 -0
lyrics_transcriber/transcribers/base_transcriber.py +157 -0
lyrics_transcriber/transcribers/whisper.py +330 -0
lyrics_transcriber/types.py +650 -0
lyrics_transcriber/utils/__init__.py +0 -0
lyrics_transcriber/utils/word_utils.py +27 -0

lyrics_transcriber/correction/agentic/handlers/base.py ADDED Viewed

@@ -0,0 +1,51 @@
+"""Base handler interface for gap correction."""
+from abc import ABC, abstractmethod
+from typing import List, Dict, Any
+from ..models.schemas import CorrectionProposal, GapCategory
+class BaseHandler(ABC):
+    """Base class for category-specific correction handlers."""
+    def __init__(self, artist: str = None, title: str = None):
+        """Initialize handler with song metadata.
+        Args:
+            artist: Song artist name
+            title: Song title
+        """
+        self.artist = artist
+        self.title = title
+    @abstractmethod
+    def handle(
+        self,
+        gap_id: str,
+        gap_words: List[Dict[str, Any]],
+        preceding_words: str,
+        following_words: str,
+        reference_contexts: Dict[str, str],
+        classification_reasoning: str = ""
+    ) -> List[CorrectionProposal]:
+        """Process a gap and return correction proposals.
+        Args:
+            gap_id: Unique identifier for the gap
+            gap_words: List of word dictionaries with id, text, start_time, end_time
+            preceding_words: Context before the gap
+            following_words: Context after the gap
+            reference_contexts: Dictionary of reference lyrics by source
+            classification_reasoning: Reasoning from the classifier
+        Returns:
+            List of CorrectionProposal objects
+        """
+        raise NotImplementedError
+    @property
+    @abstractmethod
+    def category(self) -> GapCategory:
+        """Return the gap category this handler processes."""
+        raise NotImplementedError

lyrics_transcriber/correction/agentic/handlers/complex_multi_error.py ADDED Viewed

@@ -0,0 +1,46 @@
+"""Handler for complex gaps with multiple error types."""
+from typing import List, Dict, Any
+from .base import BaseHandler
+from ..models.schemas import CorrectionProposal, GapCategory
+class ComplexMultiErrorHandler(BaseHandler):
+    """Handles large, complex gaps with multiple types of errors."""
+    @property
+    def category(self) -> GapCategory:
+        return GapCategory.COMPLEX_MULTI_ERROR
+    def handle(
+        self,
+        gap_id: str,
+        gap_words: List[Dict[str, Any]],
+        preceding_words: str,
+        following_words: str,
+        reference_contexts: Dict[str, str],
+        classification_reasoning: str = ""
+    ) -> List[CorrectionProposal]:
+        """Flag complex gaps for human review."""
+        if not gap_words:
+            return []
+        # Complex multi-error gaps are too difficult for automatic correction
+        # Always flag for human review
+        gap_text = ' '.join(w.get('text', '') for w in gap_words)
+        word_count = len(gap_words)
+        proposal = CorrectionProposal(
+            word_ids=[w['id'] for w in gap_words],
+            action="Flag",
+            confidence=0.3,
+            reason=f"Complex gap with {word_count} words and multiple error types: '{gap_text[:100]}...'. Too complex for automatic correction. {classification_reasoning}",
+            gap_category=self.category,
+            requires_human_review=True,
+            artist=self.artist,
+            title=self.title
+        )
+        return [proposal]

lyrics_transcriber/correction/agentic/handlers/extra_words.py ADDED Viewed

@@ -0,0 +1,74 @@
+"""Handler for extra filler words at sentence starts."""
+from typing import List, Dict, Any
+from .base import BaseHandler
+from ..models.schemas import CorrectionProposal, GapCategory
+class ExtraWordsHandler(BaseHandler):
+    """Handles gaps with extra filler words like 'And', 'But', 'Well'."""
+    # Common filler words that are often incorrectly added by transcription
+    FILLER_WORDS = {'and', 'but', 'well', 'so', 'or', 'then', 'now'}
+    @property
+    def category(self) -> GapCategory:
+        return GapCategory.EXTRA_WORDS
+    def handle(
+        self,
+        gap_id: str,
+        gap_words: List[Dict[str, Any]],
+        preceding_words: str,
+        following_words: str,
+        reference_contexts: Dict[str, str],
+        classification_reasoning: str = ""
+    ) -> List[CorrectionProposal]:
+        """Propose deletion of filler words."""
+        if not gap_words:
+            return []
+        proposals = []
+        # Look for filler words at the start of the gap
+        for i, word in enumerate(gap_words):
+            text = word.get('text', '').strip().lower().rstrip(',.!?;:')
+            if text in self.FILLER_WORDS:
+                # Check if this is likely at a sentence/line start
+                # (either it's the first word or preceded by punctuation)
+                is_sentence_start = (
+                    i == 0 or
+                    gap_words[i-1].get('text', '').strip()[-1:] in '.!?'
+                )
+                if is_sentence_start:
+                    proposal = CorrectionProposal(
+                        word_id=word['id'],
+                        action="DeleteWord",
+                        confidence=0.80,
+                        reason=f"Extra filler word '{word.get('text')}' at sentence start not in reference. {classification_reasoning}",
+                        gap_category=self.category,
+                        requires_human_review=False,
+                        artist=self.artist,
+                        title=self.title
+                    )
+                    proposals.append(proposal)
+        # If no filler words found, flag for review
+        if not proposals:
+            proposal = CorrectionProposal(
+                word_ids=[w['id'] for w in gap_words],
+                action="Flag",
+                confidence=0.5,
+                reason=f"Classified as extra words but no obvious fillers found. {classification_reasoning}",
+                gap_category=self.category,
+                requires_human_review=True,
+                artist=self.artist,
+                title=self.title
+            )
+            proposals.append(proposal)
+        return proposals

lyrics_transcriber/correction/agentic/handlers/no_error.py ADDED Viewed

@@ -0,0 +1,42 @@
+"""Handler for gaps where transcription matches at least one reference source."""
+from typing import List, Dict, Any
+from .base import BaseHandler
+from ..models.schemas import CorrectionProposal, GapCategory
+class NoErrorHandler(BaseHandler):
+    """Handles gaps where the transcription is correct (matches a reference source)."""
+    @property
+    def category(self) -> GapCategory:
+        return GapCategory.NO_ERROR
+    def handle(
+        self,
+        gap_id: str,
+        gap_words: List[Dict[str, Any]],
+        preceding_words: str,
+        following_words: str,
+        reference_contexts: Dict[str, str],
+        classification_reasoning: str = ""
+    ) -> List[CorrectionProposal]:
+        """Return NO_ACTION since transcription is correct."""
+        if not gap_words:
+            return []
+        # Create a single NO_ACTION proposal
+        proposal = CorrectionProposal(
+            word_ids=[w['id'] for w in gap_words],
+            action="NoAction",
+            confidence=0.99,
+            reason=f"Transcription matches at least one reference source. {classification_reasoning}",
+            gap_category=self.category,
+            requires_human_review=False,
+            artist=self.artist,
+            title=self.title
+        )
+        return [proposal]

lyrics_transcriber/correction/agentic/handlers/punctuation.py ADDED Viewed

@@ -0,0 +1,44 @@
+"""Handler for punctuation-only differences."""
+from typing import List, Dict, Any
+from .base import BaseHandler
+from ..models.schemas import CorrectionProposal, GapCategory
+class PunctuationHandler(BaseHandler):
+    """Handles gaps where only punctuation/capitalization differs."""
+    @property
+    def category(self) -> GapCategory:
+        return GapCategory.PUNCTUATION_ONLY
+    def handle(
+        self,
+        gap_id: str,
+        gap_words: List[Dict[str, Any]],
+        preceding_words: str,
+        following_words: str,
+        reference_contexts: Dict[str, str],
+        classification_reasoning: str = ""
+    ) -> List[CorrectionProposal]:
+        """Return NO_ACTION for punctuation-only differences."""
+        # For punctuation differences, we don't need to make any changes
+        # The transcription is correct, just styled differently
+        if not gap_words:
+            return []
+        # Create a single NO_ACTION proposal for the entire gap
+        proposal = CorrectionProposal(
+            word_ids=[w['id'] for w in gap_words],
+            action="NoAction",
+            confidence=0.95,
+            reason=f"Punctuation/style difference only. {classification_reasoning}",
+            gap_category=self.category,
+            requires_human_review=False,
+            artist=self.artist,
+            title=self.title
+        )
+        return [proposal]

lyrics_transcriber/correction/agentic/handlers/registry.py ADDED Viewed

@@ -0,0 +1,60 @@
+"""Registry for mapping gap categories to handlers."""
+from typing import Dict, Type
+from .base import BaseHandler
+from .punctuation import PunctuationHandler
+from .sound_alike import SoundAlikeHandler
+from .background_vocals import BackgroundVocalsHandler
+from .extra_words import ExtraWordsHandler
+from .repeated_section import RepeatedSectionHandler
+from .complex_multi_error import ComplexMultiErrorHandler
+from .ambiguous import AmbiguousHandler
+from .no_error import NoErrorHandler
+from ..models.schemas import GapCategory
+class HandlerRegistry:
+    """Registry for mapping gap categories to their handler classes."""
+    _handlers: Dict[GapCategory, Type[BaseHandler]] = {
+        GapCategory.PUNCTUATION_ONLY: PunctuationHandler,
+        GapCategory.SOUND_ALIKE: SoundAlikeHandler,
+        GapCategory.BACKGROUND_VOCALS: BackgroundVocalsHandler,
+        GapCategory.EXTRA_WORDS: ExtraWordsHandler,
+        GapCategory.REPEATED_SECTION: RepeatedSectionHandler,
+        GapCategory.COMPLEX_MULTI_ERROR: ComplexMultiErrorHandler,
+        GapCategory.AMBIGUOUS: AmbiguousHandler,
+        GapCategory.NO_ERROR: NoErrorHandler,
+    }
+    @classmethod
+    def get_handler(cls, category: GapCategory, artist: str = None, title: str = None) -> BaseHandler:
+        """Get a handler instance for the given category.
+        Args:
+            category: Gap category
+            artist: Song artist name
+            title: Song title
+        Returns:
+            Handler instance for the category
+        Raises:
+            ValueError: If category is not registered
+        """
+        handler_class = cls._handlers.get(category)
+        if not handler_class:
+            raise ValueError(f"No handler registered for category: {category}")
+        return handler_class(artist=artist, title=title)
+    @classmethod
+    def register_handler(cls, category: GapCategory, handler_class: Type[BaseHandler]):
+        """Register a custom handler for a category.
+        Args:
+            category: Gap category
+            handler_class: Handler class to register
+        """
+        cls._handlers[category] = handler_class

lyrics_transcriber/correction/agentic/handlers/repeated_section.py ADDED Viewed

@@ -0,0 +1,44 @@
+"""Handler for repeated sections (chorus, verse repetitions)."""
+from typing import List, Dict, Any
+from .base import BaseHandler
+from ..models.schemas import CorrectionProposal, GapCategory
+class RepeatedSectionHandler(BaseHandler):
+    """Handles gaps where transcription includes repeated sections not in condensed references."""
+    @property
+    def category(self) -> GapCategory:
+        return GapCategory.REPEATED_SECTION
+    def handle(
+        self,
+        gap_id: str,
+        gap_words: List[Dict[str, Any]],
+        preceding_words: str,
+        following_words: str,
+        reference_contexts: Dict[str, str],
+        classification_reasoning: str = ""
+    ) -> List[CorrectionProposal]:
+        """Flag repeated sections for human review."""
+        if not gap_words:
+            return []
+        # Repeated sections need audio verification - always flag for review
+        gap_text = ' '.join(w.get('text', '') for w in gap_words)
+        proposal = CorrectionProposal(
+            word_ids=[w['id'] for w in gap_words],
+            action="Flag",
+            confidence=0.5,
+            reason=f"Repeated section detected: '{gap_text[:100]}...'. Reference lyrics may be condensed. Requires audio verification. {classification_reasoning}",
+            gap_category=self.category,
+            requires_human_review=True,
+            artist=self.artist,
+            title=self.title
+        )
+        return [proposal]

lyrics_transcriber/correction/agentic/handlers/sound_alike.py ADDED Viewed

@@ -0,0 +1,126 @@
+"""Handler for sound-alike transcription errors."""
+from typing import List, Dict, Any, Optional
+from .base import BaseHandler
+from ..models.schemas import CorrectionProposal, GapCategory
+import re
+class SoundAlikeHandler(BaseHandler):
+    """Handles gaps with sound-alike errors (homophones, similar-sounding phrases)."""
+    @property
+    def category(self) -> GapCategory:
+        return GapCategory.SOUND_ALIKE
+    def _extract_replacement_from_references(
+        self,
+        gap_words: List[Dict[str, Any]],
+        reference_contexts: Dict[str, str],
+        preceding_words: str,
+        following_words: str
+    ) -> Optional[str]:
+        """Try to extract the correct text from reference lyrics.
+        Args:
+            gap_words: Words in the gap
+            reference_contexts: Reference lyrics from each source
+            preceding_words: Words before gap
+            following_words: Words after gap
+        Returns:
+            Replacement text if found, None otherwise
+        """
+        if not reference_contexts:
+            return None
+        # Normalize preceding and following for matching
+        preceding_norm = self._normalize_text(preceding_words)
+        following_norm = self._normalize_text(following_words)
+        # Take last few words of preceding and first few words of following
+        preceding_tokens = preceding_norm.split()[-5:] if preceding_norm else []
+        following_tokens = following_norm.split()[:5] if following_norm else []
+        # Try to find the context in each reference
+        for source, ref_text in reference_contexts.items():
+            ref_norm = self._normalize_text(ref_text)
+            # Try to find the preceding context
+            if preceding_tokens:
+                preceding_pattern = ' '.join(preceding_tokens)
+                if preceding_pattern in ref_norm:
+                    # Found the context, now extract what comes after
+                    start_idx = ref_norm.index(preceding_pattern) + len(preceding_pattern)
+                    remaining = ref_norm[start_idx:].strip()
+                    # Find where following context starts
+                    if following_tokens:
+                        following_pattern = ' '.join(following_tokens)
+                        if following_pattern in remaining:
+                            end_idx = remaining.index(following_pattern)
+                            replacement = remaining[:end_idx].strip()
+                            if replacement:
+                                return replacement
+        return None
+    def _normalize_text(self, text: str) -> str:
+        """Normalize text for comparison (lowercase, remove punctuation)."""
+        # Remove punctuation except apostrophes in contractions
+        text = re.sub(r'[^\w\s\']', ' ', text.lower())
+        # Normalize whitespace
+        text = ' '.join(text.split())
+        return text
+    def handle(
+        self,
+        gap_id: str,
+        gap_words: List[Dict[str, Any]],
+        preceding_words: str,
+        following_words: str,
+        reference_contexts: Dict[str, str],
+        classification_reasoning: str = ""
+    ) -> List[CorrectionProposal]:
+        """Propose replacement based on reference lyrics."""
+        if not gap_words:
+            return []
+        # Try to extract the correct replacement from references
+        replacement_text = self._extract_replacement_from_references(
+            gap_words,
+            reference_contexts,
+            preceding_words,
+            following_words
+        )
+        if replacement_text:
+            # Found a replacement in reference lyrics
+            proposal = CorrectionProposal(
+                word_ids=[w['id'] for w in gap_words],
+                action="ReplaceWord",
+                replacement_text=replacement_text,
+                confidence=0.75,
+                reason=f"Sound-alike error. Reference suggests: '{replacement_text}'. {classification_reasoning}",
+                gap_category=self.category,
+                requires_human_review=False,
+                artist=self.artist,
+                title=self.title
+            )
+            return [proposal]
+        else:
+            # Could not extract replacement, flag for human review
+            gap_text = ' '.join(w.get('text', '') for w in gap_words)
+            proposal = CorrectionProposal(
+                word_ids=[w['id'] for w in gap_words],
+                action="Flag",
+                confidence=0.6,
+                reason=f"Sound-alike error detected for '{gap_text}' but could not extract replacement from references. {classification_reasoning}",
+                gap_category=self.category,
+                requires_human_review=True,
+                artist=self.artist,
+                title=self.title
+            )
+            return [proposal]

lyrics_transcriber/correction/agentic/models/__init__.py ADDED Viewed

@@ -0,0 +1,5 @@
+"""Models and schemas for agentic correction (to be implemented via TDD)."""
+__all__ = []

lyrics_transcriber/correction/agentic/models/ai_correction.py ADDED Viewed

@@ -0,0 +1,31 @@
+from dataclasses import dataclass
+from datetime import datetime
+from typing import Optional
+from .enums import CorrectionType
+@dataclass
+class AICorrection:
+    id: str
+    original_text: str
+    corrected_text: str
+    confidence_score: float
+    reasoning: str
+    model_used: str
+    correction_type: CorrectionType
+    processing_time_ms: int
+    tokens_used: int
+    created_at: datetime
+    word_position: int
+    session_id: str
+    def validate(self) -> None:
+        if not (0.0 <= self.confidence_score <= 1.0):
+            raise ValueError("confidence_score must be between 0.0 and 1.0")
+        if self.original_text == self.corrected_text:
+            raise ValueError("original_text and corrected_text must differ")
+        if self.processing_time_ms <= 0:
+            raise ValueError("processing_time_ms must be positive")

lyrics_transcriber/correction/agentic/models/correction_session.py ADDED Viewed

@@ -0,0 +1,30 @@
+from dataclasses import dataclass
+from datetime import datetime
+from typing import Optional, Dict
+from .enums import SessionType, SessionStatus
+@dataclass
+class CorrectionSession:
+    id: str
+    audio_file_hash: str
+    session_type: SessionType
+    ai_model_config: Dict[str, object]
+    total_corrections: int
+    accepted_corrections: int
+    human_modifications: int
+    session_duration_ms: int
+    accuracy_improvement: float
+    started_at: datetime
+    completed_at: Optional[datetime]
+    status: SessionStatus
+    def validate(self) -> None:
+        # Basic validations per data-model
+        if any(v < 0 for v in (self.total_corrections, self.accepted_corrections, self.human_modifications)):
+            raise ValueError("correction counts must be non-negative")
+        if self.completed_at is not None and self.completed_at < self.started_at:
+            raise ValueError("completed_at must be after started_at")

lyrics_transcriber/correction/agentic/models/enums.py ADDED Viewed

@@ -0,0 +1,38 @@
+from enum import Enum
+class CorrectionType(str, Enum):
+    """Kinds of correction; the annotated type of AICorrection.correction_type.
+    Members are also str instances whose value equals the member name, so they
+    compare equal to the plain string (e.g. "PUNCTUATION").
+    """
+    WORD_SUBSTITUTION = "WORD_SUBSTITUTION"
+    WORD_INSERTION = "WORD_INSERTION"
+    WORD_DELETION = "WORD_DELETION"
+    PUNCTUATION = "PUNCTUATION"
+    TIMING_ADJUSTMENT = "TIMING_ADJUSTMENT"
+    LINGUISTIC_IMPROVEMENT = "LINGUISTIC_IMPROVEMENT"
+class ReviewerAction(str, Enum):
+    """Reviewer decisions; the annotated type of HumanFeedback.reviewer_action.
+    Members are also str instances whose value equals the member name.
+    """
+    ACCEPT = "ACCEPT"
+    REJECT = "REJECT"
+    # HumanFeedback.validate() requires a non-empty final_text for this action
+    MODIFY = "MODIFY"
+class FeedbackCategory(str, Enum):
+    """Feedback reason categories; the annotated type of HumanFeedback.reason_category.
+    Members are also str instances whose value equals the member name.
+    """
+    AI_CORRECT = "AI_CORRECT"
+    AI_INCORRECT = "AI_INCORRECT"
+    AI_SUBOPTIMAL = "AI_SUBOPTIMAL"
+    CONTEXT_NEEDED = "CONTEXT_NEEDED"
+    SUBJECTIVE_PREFERENCE = "SUBJECTIVE_PREFERENCE"
+class SessionType(str, Enum):
+    """Session kinds; the annotated type of CorrectionSession.session_type.
+    Members are also str instances whose value equals the member name.
+    """
+    FULL_CORRECTION = "FULL_CORRECTION"
+    PARTIAL_REVIEW = "PARTIAL_REVIEW"
+    REPROCESSING = "REPROCESSING"
+class SessionStatus(str, Enum):
+    """Session states; the annotated type of CorrectionSession.status.
+    Members are also str instances whose value equals the member name.
+    """
+    IN_PROGRESS = "IN_PROGRESS"
+    COMPLETED = "COMPLETED"
+    FAILED = "FAILED"

lyrics_transcriber/correction/agentic/models/human_feedback.py ADDED Viewed

@@ -0,0 +1,30 @@
+from dataclasses import dataclass
+from datetime import datetime
+from typing import Optional
+from .enums import ReviewerAction, FeedbackCategory
+@dataclass
+class HumanFeedback:
+    id: str
+    ai_correction_id: str
+    reviewer_action: ReviewerAction
+    final_text: Optional[str]
+    reason_category: FeedbackCategory
+    reason_detail: Optional[str]
+    reviewer_confidence: float
+    review_time_ms: int
+    reviewer_id: Optional[str]
+    created_at: datetime
+    session_id: str
+    def validate(self) -> None:
+        if self.reviewer_action == ReviewerAction.MODIFY and not self.final_text:
+            raise ValueError("final_text required when action is MODIFY")
+        if self.reviewer_confidence is not None and not (0.0 <= self.reviewer_confidence <= 1.0):
+            raise ValueError("reviewer_confidence must be between 0.0 and 1.0")
+        if self.review_time_ms <= 0:
+            raise ValueError("review_time_ms must be positive")

lyrics_transcriber/correction/agentic/models/learning_data.py ADDED Viewed

@@ -0,0 +1,26 @@
+from dataclasses import dataclass
+from datetime import datetime, timedelta
+from typing import Dict
+@dataclass
+class LearningData:
+    id: str
+    session_id: str
+    error_patterns: Dict[str, int]
+    correction_strategies: Dict[str, int]
+    model_performance: Dict[str, float]
+    feedback_trends: Dict[str, int]
+    improvement_metrics: Dict[str, float]
+    data_quality_score: float
+    created_at: datetime
+    expires_at: datetime
+    def validate(self) -> None:
+        if not (0.0 <= self.data_quality_score <= 1.0):
+            raise ValueError("data_quality_score must be between 0.0 and 1.0")
+        # Note: exact 3-year check depends on business rule; enforce >= 3 years
+        if (self.expires_at - self.created_at).days < 365 * 3:
+            raise ValueError("expires_at must be at least 3 years from created_at")