PyPI - karaoke-gen - Versions diffs - 0.75.54__py3-none-any.whl - Mend

karaoke-gen 0.75.54__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of karaoke-gen might be problematic. Click here for more details.

Files changed (287) hide show

karaoke_gen/__init__.py +38 -0
karaoke_gen/audio_fetcher.py +1614 -0
karaoke_gen/audio_processor.py +790 -0
karaoke_gen/config.py +83 -0
karaoke_gen/file_handler.py +387 -0
karaoke_gen/instrumental_review/__init__.py +45 -0
karaoke_gen/instrumental_review/analyzer.py +408 -0
karaoke_gen/instrumental_review/editor.py +322 -0
karaoke_gen/instrumental_review/models.py +171 -0
karaoke_gen/instrumental_review/server.py +475 -0
karaoke_gen/instrumental_review/static/index.html +1529 -0
karaoke_gen/instrumental_review/waveform.py +409 -0
karaoke_gen/karaoke_finalise/__init__.py +1 -0
karaoke_gen/karaoke_finalise/karaoke_finalise.py +1833 -0
karaoke_gen/karaoke_gen.py +1026 -0
karaoke_gen/lyrics_processor.py +474 -0
karaoke_gen/metadata.py +160 -0
karaoke_gen/pipeline/__init__.py +87 -0
karaoke_gen/pipeline/base.py +215 -0
karaoke_gen/pipeline/context.py +230 -0
karaoke_gen/pipeline/executors/__init__.py +21 -0
karaoke_gen/pipeline/executors/local.py +159 -0
karaoke_gen/pipeline/executors/remote.py +257 -0
karaoke_gen/pipeline/stages/__init__.py +27 -0
karaoke_gen/pipeline/stages/finalize.py +202 -0
karaoke_gen/pipeline/stages/render.py +165 -0
karaoke_gen/pipeline/stages/screens.py +139 -0
karaoke_gen/pipeline/stages/separation.py +191 -0
karaoke_gen/pipeline/stages/transcription.py +191 -0
karaoke_gen/resources/AvenirNext-Bold.ttf +0 -0
karaoke_gen/resources/Montserrat-Bold.ttf +0 -0
karaoke_gen/resources/Oswald-Bold.ttf +0 -0
karaoke_gen/resources/Oswald-SemiBold.ttf +0 -0
karaoke_gen/resources/Zurich_Cn_BT_Bold.ttf +0 -0
karaoke_gen/style_loader.py +531 -0
karaoke_gen/utils/__init__.py +18 -0
karaoke_gen/utils/bulk_cli.py +492 -0
karaoke_gen/utils/cli_args.py +432 -0
karaoke_gen/utils/gen_cli.py +978 -0
karaoke_gen/utils/remote_cli.py +3268 -0
karaoke_gen/video_background_processor.py +351 -0
karaoke_gen/video_generator.py +424 -0
karaoke_gen-0.75.54.dist-info/METADATA +718 -0
karaoke_gen-0.75.54.dist-info/RECORD +287 -0
karaoke_gen-0.75.54.dist-info/WHEEL +4 -0
karaoke_gen-0.75.54.dist-info/entry_points.txt +5 -0
karaoke_gen-0.75.54.dist-info/licenses/LICENSE +21 -0
lyrics_transcriber/__init__.py +10 -0
lyrics_transcriber/cli/__init__.py +0 -0
lyrics_transcriber/cli/cli_main.py +285 -0
lyrics_transcriber/core/__init__.py +0 -0
lyrics_transcriber/core/config.py +50 -0
lyrics_transcriber/core/controller.py +594 -0
lyrics_transcriber/correction/__init__.py +0 -0
lyrics_transcriber/correction/agentic/__init__.py +9 -0
lyrics_transcriber/correction/agentic/adapter.py +71 -0
lyrics_transcriber/correction/agentic/agent.py +313 -0
lyrics_transcriber/correction/agentic/feedback/aggregator.py +12 -0
lyrics_transcriber/correction/agentic/feedback/collector.py +17 -0
lyrics_transcriber/correction/agentic/feedback/retention.py +24 -0
lyrics_transcriber/correction/agentic/feedback/store.py +76 -0
lyrics_transcriber/correction/agentic/handlers/__init__.py +24 -0
lyrics_transcriber/correction/agentic/handlers/ambiguous.py +44 -0
lyrics_transcriber/correction/agentic/handlers/background_vocals.py +68 -0
lyrics_transcriber/correction/agentic/handlers/base.py +51 -0
lyrics_transcriber/correction/agentic/handlers/complex_multi_error.py +46 -0
lyrics_transcriber/correction/agentic/handlers/extra_words.py +74 -0
lyrics_transcriber/correction/agentic/handlers/no_error.py +42 -0
lyrics_transcriber/correction/agentic/handlers/punctuation.py +44 -0
lyrics_transcriber/correction/agentic/handlers/registry.py +60 -0
lyrics_transcriber/correction/agentic/handlers/repeated_section.py +44 -0
lyrics_transcriber/correction/agentic/handlers/sound_alike.py +126 -0
lyrics_transcriber/correction/agentic/models/__init__.py +5 -0
lyrics_transcriber/correction/agentic/models/ai_correction.py +31 -0
lyrics_transcriber/correction/agentic/models/correction_session.py +30 -0
lyrics_transcriber/correction/agentic/models/enums.py +38 -0
lyrics_transcriber/correction/agentic/models/human_feedback.py +30 -0
lyrics_transcriber/correction/agentic/models/learning_data.py +26 -0
lyrics_transcriber/correction/agentic/models/observability_metrics.py +28 -0
lyrics_transcriber/correction/agentic/models/schemas.py +46 -0
lyrics_transcriber/correction/agentic/models/utils.py +19 -0
lyrics_transcriber/correction/agentic/observability/__init__.py +5 -0
lyrics_transcriber/correction/agentic/observability/langfuse_integration.py +35 -0
lyrics_transcriber/correction/agentic/observability/metrics.py +46 -0
lyrics_transcriber/correction/agentic/observability/performance.py +19 -0
lyrics_transcriber/correction/agentic/prompts/__init__.py +2 -0
lyrics_transcriber/correction/agentic/prompts/classifier.py +227 -0
lyrics_transcriber/correction/agentic/providers/__init__.py +6 -0
lyrics_transcriber/correction/agentic/providers/base.py +36 -0
lyrics_transcriber/correction/agentic/providers/circuit_breaker.py +145 -0
lyrics_transcriber/correction/agentic/providers/config.py +73 -0
lyrics_transcriber/correction/agentic/providers/constants.py +24 -0
lyrics_transcriber/correction/agentic/providers/health.py +28 -0
lyrics_transcriber/correction/agentic/providers/langchain_bridge.py +212 -0
lyrics_transcriber/correction/agentic/providers/model_factory.py +209 -0
lyrics_transcriber/correction/agentic/providers/response_cache.py +218 -0
lyrics_transcriber/correction/agentic/providers/response_parser.py +111 -0
lyrics_transcriber/correction/agentic/providers/retry_executor.py +127 -0
lyrics_transcriber/correction/agentic/router.py +35 -0
lyrics_transcriber/correction/agentic/workflows/__init__.py +5 -0
lyrics_transcriber/correction/agentic/workflows/consensus_workflow.py +24 -0
lyrics_transcriber/correction/agentic/workflows/correction_graph.py +59 -0
lyrics_transcriber/correction/agentic/workflows/feedback_workflow.py +24 -0
lyrics_transcriber/correction/anchor_sequence.py +919 -0
lyrics_transcriber/correction/corrector.py +760 -0
lyrics_transcriber/correction/feedback/__init__.py +2 -0
lyrics_transcriber/correction/feedback/schemas.py +107 -0
lyrics_transcriber/correction/feedback/store.py +236 -0
lyrics_transcriber/correction/handlers/__init__.py +0 -0
lyrics_transcriber/correction/handlers/base.py +52 -0
lyrics_transcriber/correction/handlers/extend_anchor.py +149 -0
lyrics_transcriber/correction/handlers/levenshtein.py +189 -0
lyrics_transcriber/correction/handlers/llm.py +293 -0
lyrics_transcriber/correction/handlers/llm_providers.py +60 -0
lyrics_transcriber/correction/handlers/no_space_punct_match.py +154 -0
lyrics_transcriber/correction/handlers/relaxed_word_count_match.py +85 -0
lyrics_transcriber/correction/handlers/repeat.py +88 -0
lyrics_transcriber/correction/handlers/sound_alike.py +259 -0
lyrics_transcriber/correction/handlers/syllables_match.py +252 -0
lyrics_transcriber/correction/handlers/word_count_match.py +80 -0
lyrics_transcriber/correction/handlers/word_operations.py +187 -0
lyrics_transcriber/correction/operations.py +352 -0
lyrics_transcriber/correction/phrase_analyzer.py +435 -0
lyrics_transcriber/correction/text_utils.py +30 -0
lyrics_transcriber/frontend/.gitignore +23 -0
lyrics_transcriber/frontend/.yarn/releases/yarn-4.7.0.cjs +935 -0
lyrics_transcriber/frontend/.yarnrc.yml +3 -0
lyrics_transcriber/frontend/README.md +50 -0
lyrics_transcriber/frontend/REPLACE_ALL_FUNCTIONALITY.md +210 -0
lyrics_transcriber/frontend/__init__.py +25 -0
lyrics_transcriber/frontend/eslint.config.js +28 -0
lyrics_transcriber/frontend/index.html +18 -0
lyrics_transcriber/frontend/package.json +42 -0
lyrics_transcriber/frontend/public/android-chrome-192x192.png +0 -0
lyrics_transcriber/frontend/public/android-chrome-512x512.png +0 -0
lyrics_transcriber/frontend/public/apple-touch-icon.png +0 -0
lyrics_transcriber/frontend/public/favicon-16x16.png +0 -0
lyrics_transcriber/frontend/public/favicon-32x32.png +0 -0
lyrics_transcriber/frontend/public/favicon.ico +0 -0
lyrics_transcriber/frontend/public/nomad-karaoke-logo.png +0 -0
lyrics_transcriber/frontend/src/App.tsx +214 -0
lyrics_transcriber/frontend/src/api.ts +254 -0
lyrics_transcriber/frontend/src/components/AIFeedbackModal.tsx +77 -0
lyrics_transcriber/frontend/src/components/AddLyricsModal.tsx +114 -0
lyrics_transcriber/frontend/src/components/AgenticCorrectionMetrics.tsx +204 -0
lyrics_transcriber/frontend/src/components/AudioPlayer.tsx +180 -0
lyrics_transcriber/frontend/src/components/CorrectedWordWithActions.tsx +167 -0
lyrics_transcriber/frontend/src/components/CorrectionAnnotationModal.tsx +359 -0
lyrics_transcriber/frontend/src/components/CorrectionDetailCard.tsx +281 -0
lyrics_transcriber/frontend/src/components/CorrectionMetrics.tsx +162 -0
lyrics_transcriber/frontend/src/components/DurationTimelineView.tsx +257 -0
lyrics_transcriber/frontend/src/components/EditActionBar.tsx +68 -0
lyrics_transcriber/frontend/src/components/EditModal.tsx +702 -0
lyrics_transcriber/frontend/src/components/EditTimelineSection.tsx +496 -0
lyrics_transcriber/frontend/src/components/EditWordList.tsx +379 -0
lyrics_transcriber/frontend/src/components/FileUpload.tsx +77 -0
lyrics_transcriber/frontend/src/components/FindReplaceModal.tsx +467 -0
lyrics_transcriber/frontend/src/components/Header.tsx +413 -0
lyrics_transcriber/frontend/src/components/LyricsAnalyzer.tsx +1387 -0
lyrics_transcriber/frontend/src/components/LyricsSynchronizer/SyncControls.tsx +185 -0
lyrics_transcriber/frontend/src/components/LyricsSynchronizer/TimelineCanvas.tsx +704 -0
lyrics_transcriber/frontend/src/components/LyricsSynchronizer/UpcomingWordsBar.tsx +80 -0
lyrics_transcriber/frontend/src/components/LyricsSynchronizer/index.tsx +905 -0
lyrics_transcriber/frontend/src/components/MetricsDashboard.tsx +51 -0
lyrics_transcriber/frontend/src/components/ModeSelectionModal.tsx +127 -0
lyrics_transcriber/frontend/src/components/ModeSelector.tsx +67 -0
lyrics_transcriber/frontend/src/components/ModelSelector.tsx +23 -0
lyrics_transcriber/frontend/src/components/PreviewVideoSection.tsx +144 -0
lyrics_transcriber/frontend/src/components/ReferenceView.tsx +268 -0
lyrics_transcriber/frontend/src/components/ReplaceAllLyricsModal.tsx +336 -0
lyrics_transcriber/frontend/src/components/ReviewChangesModal.tsx +354 -0
lyrics_transcriber/frontend/src/components/SegmentDetailsModal.tsx +64 -0
lyrics_transcriber/frontend/src/components/TimelineEditor.tsx +376 -0
lyrics_transcriber/frontend/src/components/TimingOffsetModal.tsx +131 -0
lyrics_transcriber/frontend/src/components/TranscriptionView.tsx +256 -0
lyrics_transcriber/frontend/src/components/WordDivider.tsx +187 -0
lyrics_transcriber/frontend/src/components/shared/components/HighlightedText.tsx +379 -0
lyrics_transcriber/frontend/src/components/shared/components/SourceSelector.tsx +56 -0
lyrics_transcriber/frontend/src/components/shared/components/Word.tsx +87 -0
lyrics_transcriber/frontend/src/components/shared/constants.ts +20 -0
lyrics_transcriber/frontend/src/components/shared/hooks/useWordClick.ts +180 -0
lyrics_transcriber/frontend/src/components/shared/styles.ts +13 -0
lyrics_transcriber/frontend/src/components/shared/types.js +2 -0
lyrics_transcriber/frontend/src/components/shared/types.ts +129 -0
lyrics_transcriber/frontend/src/components/shared/utils/keyboardHandlers.ts +177 -0
lyrics_transcriber/frontend/src/components/shared/utils/localStorage.ts +78 -0
lyrics_transcriber/frontend/src/components/shared/utils/referenceLineCalculator.ts +75 -0
lyrics_transcriber/frontend/src/components/shared/utils/segmentOperations.ts +360 -0
lyrics_transcriber/frontend/src/components/shared/utils/timingUtils.ts +110 -0
lyrics_transcriber/frontend/src/components/shared/utils/wordUtils.ts +22 -0
lyrics_transcriber/frontend/src/hooks/useManualSync.ts +435 -0
lyrics_transcriber/frontend/src/main.tsx +17 -0
lyrics_transcriber/frontend/src/theme.ts +177 -0
lyrics_transcriber/frontend/src/types/global.d.ts +9 -0
lyrics_transcriber/frontend/src/types.js +2 -0
lyrics_transcriber/frontend/src/types.ts +199 -0
lyrics_transcriber/frontend/src/validation.ts +132 -0
lyrics_transcriber/frontend/src/vite-env.d.ts +1 -0
lyrics_transcriber/frontend/tsconfig.app.json +26 -0
lyrics_transcriber/frontend/tsconfig.json +25 -0
lyrics_transcriber/frontend/tsconfig.node.json +23 -0
lyrics_transcriber/frontend/tsconfig.tsbuildinfo +1 -0
lyrics_transcriber/frontend/update_version.js +11 -0
lyrics_transcriber/frontend/vite.config.d.ts +2 -0
lyrics_transcriber/frontend/vite.config.js +10 -0
lyrics_transcriber/frontend/vite.config.ts +11 -0
lyrics_transcriber/frontend/web_assets/android-chrome-192x192.png +0 -0
lyrics_transcriber/frontend/web_assets/android-chrome-512x512.png +0 -0
lyrics_transcriber/frontend/web_assets/apple-touch-icon.png +0 -0
lyrics_transcriber/frontend/web_assets/assets/index-BECn1o8Q.js +43288 -0
lyrics_transcriber/frontend/web_assets/assets/index-BECn1o8Q.js.map +1 -0
lyrics_transcriber/frontend/web_assets/favicon-16x16.png +0 -0
lyrics_transcriber/frontend/web_assets/favicon-32x32.png +0 -0
lyrics_transcriber/frontend/web_assets/favicon.ico +0 -0
lyrics_transcriber/frontend/web_assets/index.html +18 -0
lyrics_transcriber/frontend/web_assets/nomad-karaoke-logo.png +0 -0
lyrics_transcriber/frontend/yarn.lock +3752 -0
lyrics_transcriber/lyrics/__init__.py +0 -0
lyrics_transcriber/lyrics/base_lyrics_provider.py +211 -0
lyrics_transcriber/lyrics/file_provider.py +95 -0
lyrics_transcriber/lyrics/genius.py +384 -0
lyrics_transcriber/lyrics/lrclib.py +231 -0
lyrics_transcriber/lyrics/musixmatch.py +156 -0
lyrics_transcriber/lyrics/spotify.py +290 -0
lyrics_transcriber/lyrics/user_input_provider.py +44 -0
lyrics_transcriber/output/__init__.py +0 -0
lyrics_transcriber/output/ass/__init__.py +21 -0
lyrics_transcriber/output/ass/ass.py +2088 -0
lyrics_transcriber/output/ass/ass_specs.txt +732 -0
lyrics_transcriber/output/ass/config.py +180 -0
lyrics_transcriber/output/ass/constants.py +23 -0
lyrics_transcriber/output/ass/event.py +94 -0
lyrics_transcriber/output/ass/formatters.py +132 -0
lyrics_transcriber/output/ass/lyrics_line.py +265 -0
lyrics_transcriber/output/ass/lyrics_screen.py +252 -0
lyrics_transcriber/output/ass/section_detector.py +89 -0
lyrics_transcriber/output/ass/section_screen.py +106 -0
lyrics_transcriber/output/ass/style.py +187 -0
lyrics_transcriber/output/cdg.py +619 -0
lyrics_transcriber/output/cdgmaker/__init__.py +0 -0
lyrics_transcriber/output/cdgmaker/cdg.py +262 -0
lyrics_transcriber/output/cdgmaker/composer.py +2260 -0
lyrics_transcriber/output/cdgmaker/config.py +151 -0
lyrics_transcriber/output/cdgmaker/images/instrumental.png +0 -0
lyrics_transcriber/output/cdgmaker/images/intro.png +0 -0
lyrics_transcriber/output/cdgmaker/pack.py +507 -0
lyrics_transcriber/output/cdgmaker/render.py +346 -0
lyrics_transcriber/output/cdgmaker/transitions/centertexttoplogobottomtext.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/circlein.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/circleout.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/fizzle.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/largecentertexttoplogo.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/rectangle.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/spiral.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/topleftmusicalnotes.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/wipein.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/wipeleft.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/wipeout.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/wiperight.png +0 -0
lyrics_transcriber/output/cdgmaker/utils.py +132 -0
lyrics_transcriber/output/countdown_processor.py +306 -0
lyrics_transcriber/output/fonts/AvenirNext-Bold.ttf +0 -0
lyrics_transcriber/output/fonts/DMSans-VariableFont_opsz,wght.ttf +0 -0
lyrics_transcriber/output/fonts/DMSerifDisplay-Regular.ttf +0 -0
lyrics_transcriber/output/fonts/Oswald-SemiBold.ttf +0 -0
lyrics_transcriber/output/fonts/Zurich_Cn_BT_Bold.ttf +0 -0
lyrics_transcriber/output/fonts/arial.ttf +0 -0
lyrics_transcriber/output/fonts/georgia.ttf +0 -0
lyrics_transcriber/output/fonts/verdana.ttf +0 -0
lyrics_transcriber/output/generator.py +257 -0
lyrics_transcriber/output/lrc_to_cdg.py +61 -0
lyrics_transcriber/output/lyrics_file.py +102 -0
lyrics_transcriber/output/plain_text.py +96 -0
lyrics_transcriber/output/segment_resizer.py +431 -0
lyrics_transcriber/output/subtitles.py +397 -0
lyrics_transcriber/output/video.py +544 -0
lyrics_transcriber/review/__init__.py +0 -0
lyrics_transcriber/review/server.py +676 -0
lyrics_transcriber/storage/__init__.py +0 -0
lyrics_transcriber/storage/dropbox.py +225 -0
lyrics_transcriber/transcribers/__init__.py +0 -0
lyrics_transcriber/transcribers/audioshake.py +379 -0
lyrics_transcriber/transcribers/base_transcriber.py +157 -0
lyrics_transcriber/transcribers/whisper.py +330 -0
lyrics_transcriber/types.py +650 -0
lyrics_transcriber/utils/__init__.py +0 -0
lyrics_transcriber/utils/word_utils.py +27 -0

lyrics_transcriber/correction/agentic/providers/response_cache.py ADDED Viewed

@@ -0,0 +1,218 @@
+"""Response caching for LLM calls to avoid redundant API requests."""
+from __future__ import annotations
+import json
+import hashlib
+import logging
+from pathlib import Path
+from typing import Optional, Dict, Any
+from datetime import datetime
+logger = logging.getLogger(__name__)
+class ResponseCache:
+    """Caches LLM responses on disk, keyed by a hash of model + prompt.
+    This allows reusing responses when iterating on frontend/UI changes
+    without re-running expensive LLM inference calls.
+    Cache Structure:
+        {
+            "prompt_hash": {
+                "prompt": "prompt text (truncated to 500 characters)",
+                "response": "llm response",
+                "timestamp": "iso datetime (naive UTC)",
+                "model": "model identifier",
+                "metadata": {...}
+            }
+        }
+    """
+    def __init__(self, cache_dir: str = "cache", enabled: bool = True):
+        """Initialize response cache and load any existing cache file.
+        Args:
+            cache_dir: Directory to store cache file (created if missing)
+            enabled: Whether get()/set() use the cache; when False, get()
+                always returns None and set() does nothing
+        """
+        self.cache_dir = Path(cache_dir)
+        self.cache_dir.mkdir(parents=True, exist_ok=True)
+        self.cache_file = self.cache_dir / "llm_response_cache.json"
+        self.enabled = enabled
+        self._cache: Dict[str, Dict[str, Any]] = {}
+        self._load_cache()
+    def _load_cache(self) -> None:
+        """Load cache from disk, falling back to an empty cache on any problem.
+        A file that is unreadable, is not valid JSON, or does not contain a
+        JSON object is ignored with a warning. Entries whose value is not an
+        object are dropped so later lookups can rely on dict entries.
+        """
+        if not self.cache_file.exists():
+            self._cache = {}
+            return
+        try:
+            with open(self.cache_file, 'r', encoding='utf-8') as f:
+                loaded = json.load(f)
+        except Exception as e:
+            logger.warning(f"Failed to load cache: {e}")
+            self._cache = {}
+            return
+        if not isinstance(loaded, dict):
+            # Valid JSON of the wrong shape (e.g. a list) would otherwise make
+            # set() fail later with a TypeError on item assignment.
+            logger.warning(
+                f"Failed to load cache: expected a JSON object, got {type(loaded).__name__}"
+            )
+            self._cache = {}
+            return
+        self._cache = {
+            key: entry for key, entry in loaded.items() if isinstance(entry, dict)
+        }
+        logger.debug(f"📦 Loaded {len(self._cache)} cached responses")
+    def _save_cache(self) -> None:
+        """Save cache to disk without ever leaving a half-written cache file.
+        The JSON is written to a sibling temporary file which then replaces
+        the real cache file. If serialization or writing fails, the previous
+        cache file is left untouched and a warning is logged.
+        """
+        tmp_file = self.cache_file.with_name(self.cache_file.name + ".tmp")
+        try:
+            with open(tmp_file, 'w', encoding='utf-8') as f:
+                json.dump(self._cache, f, indent=2, ensure_ascii=False)
+            tmp_file.replace(self.cache_file)
+            logger.debug(f"💾 Saved {len(self._cache)} cached responses")
+        except Exception as e:
+            logger.warning(f"Failed to save cache: {e}")
+            # Best-effort cleanup of the partial temporary file; nothing more
+            # can be done if it is already gone or cannot be removed.
+            try:
+                tmp_file.unlink()
+            except OSError:
+                pass
+    def _compute_hash(self, prompt: str, model: str) -> str:
+        """Compute hash for prompt + model combination.
+        Args:
+            prompt: The full prompt text
+            model: Model identifier
+        Returns:
+            SHA256 hash as hex string
+        """
+        # Include both prompt and model in hash
+        combined = f"{model}::{prompt}"
+        return hashlib.sha256(combined.encode('utf-8')).hexdigest()
+    @staticmethod
+    def _parse_timestamp(entry: Dict[str, Any]) -> Optional[datetime]:
+        """Return the entry's timestamp as a naive UTC datetime, or None.
+        None is returned when the timestamp is missing, is not a string, or
+        is not ISO formatted. Timezone-aware values are converted to naive
+        UTC so they compare safely with the naive values this class writes.
+        """
+        raw = entry.get('timestamp')
+        if not isinstance(raw, str):
+            return None
+        try:
+            parsed = datetime.fromisoformat(raw)
+        except ValueError:
+            return None
+        offset = parsed.utcoffset()
+        if offset is not None:
+            parsed = parsed.replace(tzinfo=None) - offset
+        return parsed
+    def get(self, prompt: str, model: str) -> Optional[str]:
+        """Get cached response for prompt if available.
+        Args:
+            prompt: The prompt text
+            model: Model identifier
+        Returns:
+            Cached response string or None if not found (or cache disabled)
+        """
+        if not self.enabled:
+            return None
+        prompt_hash = self._compute_hash(prompt, model)
+        if prompt_hash in self._cache:
+            cached = self._cache[prompt_hash]
+            logger.info(f"🎯 Cache HIT for {model} (hash: {prompt_hash[:8]}...)")
+            logger.debug(f"   Cached at: {cached.get('timestamp')}")
+            return cached.get('response')
+        logger.debug(f"📭 Cache MISS for {model} (hash: {prompt_hash[:8]}...)")
+        return None
+    def set(
+        self,
+        prompt: str,
+        model: str,
+        response: str,
+        metadata: Optional[Dict[str, Any]] = None
+    ) -> None:
+        """Store response in cache and persist the cache to disk.
+        Does nothing when the cache is disabled.
+        Args:
+            prompt: The prompt text
+            model: Model identifier
+            response: The LLM response
+            metadata: Optional metadata to store with cache entry
+        """
+        if not self.enabled:
+            return
+        prompt_hash = self._compute_hash(prompt, model)
+        self._cache[prompt_hash] = {
+            "prompt": prompt[:500] + "..." if len(prompt) > 500 else prompt,  # Truncate for readability
+            "response": response,
+            "timestamp": datetime.utcnow().isoformat(),
+            "model": model,
+            "metadata": metadata or {}
+        }
+        # Save to disk immediately (for persistence across runs)
+        self._save_cache()
+        logger.debug(f"💾 Cached response for {model} (hash: {prompt_hash[:8]}...)")
+    def clear(self) -> int:
+        """Clear all cached responses, in memory and on disk.
+        Returns:
+            Number of entries cleared
+        """
+        count = len(self._cache)
+        self._cache = {}
+        self._save_cache()
+        logger.info(f"🗑️ Cleared {count} cached responses")
+        return count
+    def get_stats(self) -> Dict[str, Any]:
+        """Get cache statistics.
+        The same keys are returned whether or not the cache is empty.
+        Entries with a missing or unparseable timestamp are counted but are
+        ignored when computing "oldest" and "newest".
+        Returns:
+            Dictionary with keys "total_entries", "by_model", "oldest",
+            "newest", "cache_file" and "enabled"
+        """
+        by_model: Dict[str, int] = {}
+        timestamps = []
+        for entry in self._cache.values():
+            model = entry.get('model', 'unknown')
+            by_model[model] = by_model.get(model, 0) + 1
+            entry_time = self._parse_timestamp(entry)
+            if entry_time is not None:
+                timestamps.append(entry_time)
+        return {
+            "total_entries": len(self._cache),
+            "by_model": by_model,
+            "oldest": min(timestamps).isoformat() if timestamps else None,
+            "newest": max(timestamps).isoformat() if timestamps else None,
+            "cache_file": str(self.cache_file),
+            "enabled": self.enabled
+        }
+    def prune_old_entries(self, days: int = 30) -> int:
+        """Remove cache entries older than specified days.
+        Entries with a missing or unparseable timestamp are kept.
+        Args:
+            days: Remove entries older than this many days
+        Returns:
+            Number of entries removed
+        """
+        from datetime import timedelta
+        cutoff = datetime.utcnow() - timedelta(days=days)
+        to_remove = []
+        for prompt_hash, entry in self._cache.items():
+            entry_time = self._parse_timestamp(entry)
+            if entry_time is not None and entry_time < cutoff:
+                to_remove.append(prompt_hash)
+        for prompt_hash in to_remove:
+            del self._cache[prompt_hash]
+        if to_remove:
+            self._save_cache()
+            logger.info(f"🗑️ Pruned {len(to_remove)} old cache entries (older than {days} days)")
+        return len(to_remove)

lyrics_transcriber/correction/agentic/providers/response_parser.py ADDED Viewed

@@ -0,0 +1,111 @@
+"""Parser for LLM responses into structured correction proposals."""
+from __future__ import annotations
+import json
+import logging
+from typing import List, Dict, Any
+logger = logging.getLogger(__name__)
+class ResponseParser:
+    """Parses LLM responses into structured proposal dictionaries.
+    Handles both JSON and raw text responses, providing consistent
+    output format for downstream processing: every element of the
+    returned list is a dictionary.
+    Single Responsibility: Response parsing only, no model invocation.
+    """
+    def parse(self, content: str) -> List[Dict[str, Any]]:
+        """Parse response content into proposal dictionaries.
+        Attempts to parse as JSON first. If that fails, tries to fix
+        common JSON issues and retries. Falls back to raw content.
+        Args:
+            content: Raw response content from LLM
+        Returns:
+            List of proposal dictionaries. On parse failure, returns
+            [{"raw": content}] to preserve the response.
+        """
+        # Try JSON parsing first
+        try:
+            data = json.loads(content)
+            return self._normalize_json_response(data)
+        except json.JSONDecodeError as e:
+            logger.debug(f"🤖 Response is not valid JSON: {e}")
+            # Try to fix common issues
+            fixed_content = self._attempt_json_fix(content)
+            if fixed_content != content:
+                try:
+                    data = json.loads(fixed_content)
+                    logger.debug("🤖 Successfully parsed after JSON fix")
+                    return self._normalize_json_response(data)
+                except json.JSONDecodeError:
+                    pass  # Fall through to raw handling
+            return self._handle_raw_response(content)
+    def _attempt_json_fix(self, content: str) -> str:
+        """Attempt to fix common JSON formatting issues.
+        Only called after strict parsing has failed, so the fixes are
+        best-effort text rewrites rather than a real JSON repair. The
+        trailing-comma fix does not distinguish commas inside string values.
+        Args:
+            content: Raw JSON string
+        Returns:
+            Fixed JSON string (or original if no fixes applied)
+        """
+        import re
+        fixed = content
+        # Fix 1: Unwrap a Markdown code fence (```json ... ```), keeping only
+        # the fenced payload and dropping any prose around it
+        fenced = re.search(r"```[A-Za-z0-9_-]*[ \t]*\r?\n(.*?)```", fixed, re.DOTALL)
+        if fenced:
+            fixed = fenced.group(1).strip()
+        # Fix 2: Replace invalid escape sequences like \' with '
+        # (JSON only allows \", \\, \/, \b, \f, \n, \r, \t)
+        fixed = fixed.replace("\\'", "'")
+        # Fix 3: Remove any trailing commas before } or ]
+        fixed = re.sub(r',\s*}', '}', fixed)
+        fixed = re.sub(r',\s*]', ']', fixed)
+        return fixed
+    def _normalize_json_response(self, data: Any) -> List[Dict[str, Any]]:
+        """Normalize JSON data into a list of dictionaries.
+        Handles both single dict and list responses. Any value that is not
+        a dict (at top level or as a list item) is replaced by an
+        {"error": "unexpected_type", "data": str(value)} dictionary so
+        callers never receive a non-dict element.
+        Args:
+            data: Parsed JSON data
+        Returns:
+            List of dictionaries
+        """
+        if isinstance(data, dict):
+            # Single proposal - wrap in list
+            return [data]
+        if isinstance(data, list):
+            normalized: List[Dict[str, Any]] = []
+            for item in data:
+                if isinstance(item, dict):
+                    normalized.append(item)
+                else:
+                    logger.warning(f"🤖 Unexpected JSON type in list: {type(item)}")
+                    normalized.append({"error": "unexpected_type", "data": str(item)})
+            return normalized
+        # Unexpected type - wrap in error dict
+        logger.warning(f"🤖 Unexpected JSON type: {type(data)}")
+        return [{"error": "unexpected_type", "data": str(data)}]
+    def _handle_raw_response(self, content: str) -> List[Dict[str, Any]]:
+        """Handle non-JSON responses.
+        Wraps raw content in a dict for downstream handling.
+        The "raw" key indicates this needs manual processing.
+        Args:
+            content: Raw response text
+        Returns:
+            List with single dict containing raw content
+        """
+        logger.info(
+            f"🤖 Returning raw response (non-JSON): "
+            f"{content[:100]}{'...' if len(content) > 100 else ''}"
+        )
+        return [{"raw": content}]

lyrics_transcriber/correction/agentic/providers/retry_executor.py ADDED Viewed

@@ -0,0 +1,127 @@
+"""Retry execution logic with exponential backoff."""
+from __future__ import annotations
+import time
+import random
+import logging
+from typing import Callable, TypeVar, Generic
+from dataclasses import dataclass
+from .config import ProviderConfig
+logger = logging.getLogger(__name__)
+T = TypeVar('T')
+@dataclass
+class ExecutionResult(Generic[T]):
+    """Outcome of running an operation through RetryExecutor.
+    On success, ``success`` is True and ``value`` holds what the operation
+    returned; ``error`` keeps its default of None. On failure, ``success``
+    is False and ``error`` holds the text of the last exception raised;
+    ``value`` keeps its default of None.
+    Attributes:
+        success: Whether execution succeeded
+        value: The return value if successful
+        error: Error message if failed
+        attempts: Number of attempts made
+    """
+    # True when some attempt returned without raising.
+    success: bool
+    # Return value of the operation; None unless explicitly supplied.
+    value: T | None = None
+    # Message of the last failure; None unless explicitly supplied.
+    error: str | None = None
+    # How many times the operation was invoked.
+    attempts: int = 0
+class RetryExecutor:
+    """Runs a callable repeatedly until it succeeds or attempts run out.
+    Failed attempts are separated by an exponentially growing delay plus a
+    small random jitter. No model-specific behavior lives here; the retry
+    parameters are read from the supplied configuration.
+    """
+    def __init__(self, config: ProviderConfig):
+        """Keep the configuration that supplies the retry parameters.
+        Args:
+            config: Provider configuration; ``max_retries``,
+                ``retry_backoff_base_seconds`` and ``retry_backoff_factor``
+                are read from it
+        """
+        self._config = config
+    def execute_with_retry(
+        self,
+        operation: Callable[[], T],
+        operation_name: str = "operation"
+    ) -> ExecutionResult[T]:
+        """Call ``operation`` until it returns or the attempt budget is spent.
+        The budget is ``max_retries + 1`` attempts and never less than one.
+        Any ``Exception`` raised by the operation counts as a failed attempt.
+        Args:
+            operation: Zero-argument callable to invoke
+            operation_name: Label used in log messages
+        Returns:
+            ExecutionResult carrying the value on success, or the text of
+            the last exception on failure, plus the number of attempts made
+        """
+        max_attempts = max(1, self._config.max_retries + 1)
+        last_error: Exception | None = None
+        attempt = 0
+        while attempt < max_attempts:
+            try:
+                logger.debug(
+                    f"🤖 Executing {operation_name} "
+                    f"(attempt {attempt + 1}/{max_attempts})"
+                )
+                result = operation()
+            except Exception as e:
+                last_error = e
+                logger.warning(
+                    f"🤖 {operation_name} failed on attempt {attempt + 1}: {e}"
+                )
+                # Only wait when another attempt will follow
+                if attempt + 1 < max_attempts:
+                    sleep_duration = self._calculate_backoff(attempt)
+                    logger.debug(f"🤖 Backing off for {sleep_duration:.2f}s")
+                    time.sleep(sleep_duration)
+            else:
+                logger.debug(f"🤖 {operation_name} succeeded on attempt {attempt + 1}")
+                return ExecutionResult(
+                    success=True,
+                    value=result,
+                    attempts=attempt + 1
+                )
+            attempt += 1
+        # Every attempt raised
+        if last_error:
+            error_msg = str(last_error)
+        else:
+            error_msg = "unknown error"
+        logger.error(
+            f"🤖 {operation_name} failed after {max_attempts} attempts: {error_msg}"
+        )
+        return ExecutionResult(
+            success=False,
+            error=error_msg,
+            attempts=max_attempts
+        )
+    def _calculate_backoff(self, attempt: int) -> float:
+        """Return how long to sleep after the given failed attempt.
+        Formula: base * (factor ^ attempt) + random_jitter
+        Args:
+            attempt: Current attempt number (0-indexed)
+        Returns:
+            Sleep duration in seconds
+        """
+        settings = self._config
+        # Exponential part grows with each failed attempt
+        backoff = settings.retry_backoff_base_seconds * (
+            settings.retry_backoff_factor ** attempt
+        )
+        # Up to 50ms of jitter so concurrent callers do not retry in lockstep
+        return backoff + random.uniform(0, 0.05)

lyrics_transcriber/correction/agentic/router.py ADDED Viewed

@@ -0,0 +1,35 @@
+from __future__ import annotations
+import os
+from typing import Dict, Any
+from .providers.config import ProviderConfig
+class ModelRouter:
+    """Rules-based routing by gap type/length/uncertainty (scaffold)."""
+    def __init__(self, config: ProviderConfig | None = None):
+        self._config = config or ProviderConfig.from_env()
+    def choose_model(self, gap_type: str, uncertainty: float) -> str:
+        """Choose appropriate model based on gap characteristics.
+        Returns model identifier in format "provider/model" for LangChain:
+        - "ollama/gpt-oss:latest" for local Ollama models
+        - "openai/gpt-4" for OpenAI models
+        - "anthropic/claude-3-sonnet-20240229" for Anthropic models
+        """
+        # Simple baseline per technical guidance
+        if self._config.privacy_mode:
+            # Use the actual model from env, or default to a common Ollama model
+            return os.getenv("AGENTIC_AI_MODEL", "ollama/gpt-oss:latest")
+        # For high-uncertainty gaps, use Claude (best reasoning)
+        if uncertainty > 0.5:
+            return "anthropic/claude-3-sonnet-20240229"
+        # Default to GPT-4 for general cases
+        return "openai/gpt-4"

lyrics_transcriber/correction/agentic/workflows/__init__.py ADDED Viewed

@@ -0,0 +1,5 @@
+"""LangGraph workflows for agentic correction (scaffold)."""
+__all__ = []

lyrics_transcriber/correction/agentic/workflows/consensus_workflow.py ADDED Viewed

@@ -0,0 +1,24 @@
+from __future__ import annotations
+from typing import Any, Dict
+def build_consensus_workflow() -> Any:
+    """Return a minimal consensus workflow (scaffold).
+    Returns None if langgraph not installed to avoid hard dependency.
+    """
+    try:
+        from langgraph.graph import StateGraph  # type: ignore
+    except Exception:
+        return None
+    def merge_results(state: Dict[str, Any]) -> Dict[str, Any]:
+        return state
+    g = StateGraph(dict)
+    g.add_node("MergeResults", merge_results)
+    g.set_entry_point("MergeResults")
+    return g.compile()

lyrics_transcriber/correction/agentic/workflows/correction_graph.py ADDED Viewed

@@ -0,0 +1,59 @@
+from __future__ import annotations
+from typing import Dict, Any, List, Annotated
+from typing_extensions import TypedDict
+class CorrectionState(TypedDict):
+    """State dictionary carried through the correction workflow graph.
+    Deliberately minimal for now; it can be expanded as more sophisticated
+    correction logic is added (e.g., multi-step reasoning, validation
+    loops, etc.).
+    """
+    # Prompt text for the correction step (presumably the LLM prompt; confirm against the caller).
+    prompt: str
+    # Correction proposals, one dict per proposal; the per-proposal schema is not defined here.
+    proposals: List[Dict[str, Any]]
+def build_correction_graph(callbacks=None) -> Any:
+    """Build a LangGraph workflow for lyrics correction.
+    Currently a simple pass-through, but structured to allow future
+    expansion with multi-step reasoning, validation loops, etc.
+    Args:
+        callbacks: Optional callbacks (e.g., Langfuse handlers) to attach
+    Returns:
+        Compiled LangGraph or None if LangGraph not installed
+    """
+    try:
+        from langgraph.graph import StateGraph, END
+    except ImportError:
+        return None
+    def correction_node(state: CorrectionState) -> CorrectionState:
+        """Main correction node - currently a pass-through.
+        Future expansion: This could invoke sub-agents, do multi-step
+        reasoning, or implement validation loops.
+        """
+        # For now, just pass through - actual correction happens in provider
+        return state
+    # Build the graph
+    graph_builder = StateGraph(CorrectionState)
+    graph_builder.add_node("correct", correction_node)
+    graph_builder.set_entry_point("correct")
+    graph_builder.set_finish_point("correct")
+    # Compile with optional callbacks
+    # Note: Per Langfuse docs, we can use .with_config() to add callbacks
+    compiled = graph_builder.compile()
+    if callbacks:
+        return compiled.with_config({"callbacks": callbacks})
+    return compiled

lyrics_transcriber/correction/agentic/workflows/feedback_workflow.py ADDED Viewed

@@ -0,0 +1,24 @@
+from __future__ import annotations
+from typing import Any, Dict
+def build_feedback_workflow() -> Any:
+    """Return a minimal feedback processing workflow (scaffold).
+    Returns None if langgraph not installed to avoid hard dependency.
+    """
+    try:
+        from langgraph.graph import StateGraph  # type: ignore
+    except Exception:
+        return None
+    def process_feedback(state: Dict[str, Any]) -> Dict[str, Any]:
+        return state
+    g = StateGraph(dict)
+    g.add_node("ProcessFeedback", process_feedback)
+    g.set_entry_point("ProcessFeedback")
+    return g.compile()