PyPI - karaoke-gen - Versions diffs - 0.75.54__py3-none-any.whl - Mend

karaoke-gen 0.75.54__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of karaoke-gen might be problematic. Click here for more details.

Files changed (287) hide show

karaoke_gen/__init__.py +38 -0
karaoke_gen/audio_fetcher.py +1614 -0
karaoke_gen/audio_processor.py +790 -0
karaoke_gen/config.py +83 -0
karaoke_gen/file_handler.py +387 -0
karaoke_gen/instrumental_review/__init__.py +45 -0
karaoke_gen/instrumental_review/analyzer.py +408 -0
karaoke_gen/instrumental_review/editor.py +322 -0
karaoke_gen/instrumental_review/models.py +171 -0
karaoke_gen/instrumental_review/server.py +475 -0
karaoke_gen/instrumental_review/static/index.html +1529 -0
karaoke_gen/instrumental_review/waveform.py +409 -0
karaoke_gen/karaoke_finalise/__init__.py +1 -0
karaoke_gen/karaoke_finalise/karaoke_finalise.py +1833 -0
karaoke_gen/karaoke_gen.py +1026 -0
karaoke_gen/lyrics_processor.py +474 -0
karaoke_gen/metadata.py +160 -0
karaoke_gen/pipeline/__init__.py +87 -0
karaoke_gen/pipeline/base.py +215 -0
karaoke_gen/pipeline/context.py +230 -0
karaoke_gen/pipeline/executors/__init__.py +21 -0
karaoke_gen/pipeline/executors/local.py +159 -0
karaoke_gen/pipeline/executors/remote.py +257 -0
karaoke_gen/pipeline/stages/__init__.py +27 -0
karaoke_gen/pipeline/stages/finalize.py +202 -0
karaoke_gen/pipeline/stages/render.py +165 -0
karaoke_gen/pipeline/stages/screens.py +139 -0
karaoke_gen/pipeline/stages/separation.py +191 -0
karaoke_gen/pipeline/stages/transcription.py +191 -0
karaoke_gen/resources/AvenirNext-Bold.ttf +0 -0
karaoke_gen/resources/Montserrat-Bold.ttf +0 -0
karaoke_gen/resources/Oswald-Bold.ttf +0 -0
karaoke_gen/resources/Oswald-SemiBold.ttf +0 -0
karaoke_gen/resources/Zurich_Cn_BT_Bold.ttf +0 -0
karaoke_gen/style_loader.py +531 -0
karaoke_gen/utils/__init__.py +18 -0
karaoke_gen/utils/bulk_cli.py +492 -0
karaoke_gen/utils/cli_args.py +432 -0
karaoke_gen/utils/gen_cli.py +978 -0
karaoke_gen/utils/remote_cli.py +3268 -0
karaoke_gen/video_background_processor.py +351 -0
karaoke_gen/video_generator.py +424 -0
karaoke_gen-0.75.54.dist-info/METADATA +718 -0
karaoke_gen-0.75.54.dist-info/RECORD +287 -0
karaoke_gen-0.75.54.dist-info/WHEEL +4 -0
karaoke_gen-0.75.54.dist-info/entry_points.txt +5 -0
karaoke_gen-0.75.54.dist-info/licenses/LICENSE +21 -0
lyrics_transcriber/__init__.py +10 -0
lyrics_transcriber/cli/__init__.py +0 -0
lyrics_transcriber/cli/cli_main.py +285 -0
lyrics_transcriber/core/__init__.py +0 -0
lyrics_transcriber/core/config.py +50 -0
lyrics_transcriber/core/controller.py +594 -0
lyrics_transcriber/correction/__init__.py +0 -0
lyrics_transcriber/correction/agentic/__init__.py +9 -0
lyrics_transcriber/correction/agentic/adapter.py +71 -0
lyrics_transcriber/correction/agentic/agent.py +313 -0
lyrics_transcriber/correction/agentic/feedback/aggregator.py +12 -0
lyrics_transcriber/correction/agentic/feedback/collector.py +17 -0
lyrics_transcriber/correction/agentic/feedback/retention.py +24 -0
lyrics_transcriber/correction/agentic/feedback/store.py +76 -0
lyrics_transcriber/correction/agentic/handlers/__init__.py +24 -0
lyrics_transcriber/correction/agentic/handlers/ambiguous.py +44 -0
lyrics_transcriber/correction/agentic/handlers/background_vocals.py +68 -0
lyrics_transcriber/correction/agentic/handlers/base.py +51 -0
lyrics_transcriber/correction/agentic/handlers/complex_multi_error.py +46 -0
lyrics_transcriber/correction/agentic/handlers/extra_words.py +74 -0
lyrics_transcriber/correction/agentic/handlers/no_error.py +42 -0
lyrics_transcriber/correction/agentic/handlers/punctuation.py +44 -0
lyrics_transcriber/correction/agentic/handlers/registry.py +60 -0
lyrics_transcriber/correction/agentic/handlers/repeated_section.py +44 -0
lyrics_transcriber/correction/agentic/handlers/sound_alike.py +126 -0
lyrics_transcriber/correction/agentic/models/__init__.py +5 -0
lyrics_transcriber/correction/agentic/models/ai_correction.py +31 -0
lyrics_transcriber/correction/agentic/models/correction_session.py +30 -0
lyrics_transcriber/correction/agentic/models/enums.py +38 -0
lyrics_transcriber/correction/agentic/models/human_feedback.py +30 -0
lyrics_transcriber/correction/agentic/models/learning_data.py +26 -0
lyrics_transcriber/correction/agentic/models/observability_metrics.py +28 -0
lyrics_transcriber/correction/agentic/models/schemas.py +46 -0
lyrics_transcriber/correction/agentic/models/utils.py +19 -0
lyrics_transcriber/correction/agentic/observability/__init__.py +5 -0
lyrics_transcriber/correction/agentic/observability/langfuse_integration.py +35 -0
lyrics_transcriber/correction/agentic/observability/metrics.py +46 -0
lyrics_transcriber/correction/agentic/observability/performance.py +19 -0
lyrics_transcriber/correction/agentic/prompts/__init__.py +2 -0
lyrics_transcriber/correction/agentic/prompts/classifier.py +227 -0
lyrics_transcriber/correction/agentic/providers/__init__.py +6 -0
lyrics_transcriber/correction/agentic/providers/base.py +36 -0
lyrics_transcriber/correction/agentic/providers/circuit_breaker.py +145 -0
lyrics_transcriber/correction/agentic/providers/config.py +73 -0
lyrics_transcriber/correction/agentic/providers/constants.py +24 -0
lyrics_transcriber/correction/agentic/providers/health.py +28 -0
lyrics_transcriber/correction/agentic/providers/langchain_bridge.py +212 -0
lyrics_transcriber/correction/agentic/providers/model_factory.py +209 -0
lyrics_transcriber/correction/agentic/providers/response_cache.py +218 -0
lyrics_transcriber/correction/agentic/providers/response_parser.py +111 -0
lyrics_transcriber/correction/agentic/providers/retry_executor.py +127 -0
lyrics_transcriber/correction/agentic/router.py +35 -0
lyrics_transcriber/correction/agentic/workflows/__init__.py +5 -0
lyrics_transcriber/correction/agentic/workflows/consensus_workflow.py +24 -0
lyrics_transcriber/correction/agentic/workflows/correction_graph.py +59 -0
lyrics_transcriber/correction/agentic/workflows/feedback_workflow.py +24 -0
lyrics_transcriber/correction/anchor_sequence.py +919 -0
lyrics_transcriber/correction/corrector.py +760 -0
lyrics_transcriber/correction/feedback/__init__.py +2 -0
lyrics_transcriber/correction/feedback/schemas.py +107 -0
lyrics_transcriber/correction/feedback/store.py +236 -0
lyrics_transcriber/correction/handlers/__init__.py +0 -0
lyrics_transcriber/correction/handlers/base.py +52 -0
lyrics_transcriber/correction/handlers/extend_anchor.py +149 -0
lyrics_transcriber/correction/handlers/levenshtein.py +189 -0
lyrics_transcriber/correction/handlers/llm.py +293 -0
lyrics_transcriber/correction/handlers/llm_providers.py +60 -0
lyrics_transcriber/correction/handlers/no_space_punct_match.py +154 -0
lyrics_transcriber/correction/handlers/relaxed_word_count_match.py +85 -0
lyrics_transcriber/correction/handlers/repeat.py +88 -0
lyrics_transcriber/correction/handlers/sound_alike.py +259 -0
lyrics_transcriber/correction/handlers/syllables_match.py +252 -0
lyrics_transcriber/correction/handlers/word_count_match.py +80 -0
lyrics_transcriber/correction/handlers/word_operations.py +187 -0
lyrics_transcriber/correction/operations.py +352 -0
lyrics_transcriber/correction/phrase_analyzer.py +435 -0
lyrics_transcriber/correction/text_utils.py +30 -0
lyrics_transcriber/frontend/.gitignore +23 -0
lyrics_transcriber/frontend/.yarn/releases/yarn-4.7.0.cjs +935 -0
lyrics_transcriber/frontend/.yarnrc.yml +3 -0
lyrics_transcriber/frontend/README.md +50 -0
lyrics_transcriber/frontend/REPLACE_ALL_FUNCTIONALITY.md +210 -0
lyrics_transcriber/frontend/__init__.py +25 -0
lyrics_transcriber/frontend/eslint.config.js +28 -0
lyrics_transcriber/frontend/index.html +18 -0
lyrics_transcriber/frontend/package.json +42 -0
lyrics_transcriber/frontend/public/android-chrome-192x192.png +0 -0
lyrics_transcriber/frontend/public/android-chrome-512x512.png +0 -0
lyrics_transcriber/frontend/public/apple-touch-icon.png +0 -0
lyrics_transcriber/frontend/public/favicon-16x16.png +0 -0
lyrics_transcriber/frontend/public/favicon-32x32.png +0 -0
lyrics_transcriber/frontend/public/favicon.ico +0 -0
lyrics_transcriber/frontend/public/nomad-karaoke-logo.png +0 -0
lyrics_transcriber/frontend/src/App.tsx +214 -0
lyrics_transcriber/frontend/src/api.ts +254 -0
lyrics_transcriber/frontend/src/components/AIFeedbackModal.tsx +77 -0
lyrics_transcriber/frontend/src/components/AddLyricsModal.tsx +114 -0
lyrics_transcriber/frontend/src/components/AgenticCorrectionMetrics.tsx +204 -0
lyrics_transcriber/frontend/src/components/AudioPlayer.tsx +180 -0
lyrics_transcriber/frontend/src/components/CorrectedWordWithActions.tsx +167 -0
lyrics_transcriber/frontend/src/components/CorrectionAnnotationModal.tsx +359 -0
lyrics_transcriber/frontend/src/components/CorrectionDetailCard.tsx +281 -0
lyrics_transcriber/frontend/src/components/CorrectionMetrics.tsx +162 -0
lyrics_transcriber/frontend/src/components/DurationTimelineView.tsx +257 -0
lyrics_transcriber/frontend/src/components/EditActionBar.tsx +68 -0
lyrics_transcriber/frontend/src/components/EditModal.tsx +702 -0
lyrics_transcriber/frontend/src/components/EditTimelineSection.tsx +496 -0
lyrics_transcriber/frontend/src/components/EditWordList.tsx +379 -0
lyrics_transcriber/frontend/src/components/FileUpload.tsx +77 -0
lyrics_transcriber/frontend/src/components/FindReplaceModal.tsx +467 -0
lyrics_transcriber/frontend/src/components/Header.tsx +413 -0
lyrics_transcriber/frontend/src/components/LyricsAnalyzer.tsx +1387 -0
lyrics_transcriber/frontend/src/components/LyricsSynchronizer/SyncControls.tsx +185 -0
lyrics_transcriber/frontend/src/components/LyricsSynchronizer/TimelineCanvas.tsx +704 -0
lyrics_transcriber/frontend/src/components/LyricsSynchronizer/UpcomingWordsBar.tsx +80 -0
lyrics_transcriber/frontend/src/components/LyricsSynchronizer/index.tsx +905 -0
lyrics_transcriber/frontend/src/components/MetricsDashboard.tsx +51 -0
lyrics_transcriber/frontend/src/components/ModeSelectionModal.tsx +127 -0
lyrics_transcriber/frontend/src/components/ModeSelector.tsx +67 -0
lyrics_transcriber/frontend/src/components/ModelSelector.tsx +23 -0
lyrics_transcriber/frontend/src/components/PreviewVideoSection.tsx +144 -0
lyrics_transcriber/frontend/src/components/ReferenceView.tsx +268 -0
lyrics_transcriber/frontend/src/components/ReplaceAllLyricsModal.tsx +336 -0
lyrics_transcriber/frontend/src/components/ReviewChangesModal.tsx +354 -0
lyrics_transcriber/frontend/src/components/SegmentDetailsModal.tsx +64 -0
lyrics_transcriber/frontend/src/components/TimelineEditor.tsx +376 -0
lyrics_transcriber/frontend/src/components/TimingOffsetModal.tsx +131 -0
lyrics_transcriber/frontend/src/components/TranscriptionView.tsx +256 -0
lyrics_transcriber/frontend/src/components/WordDivider.tsx +187 -0
lyrics_transcriber/frontend/src/components/shared/components/HighlightedText.tsx +379 -0
lyrics_transcriber/frontend/src/components/shared/components/SourceSelector.tsx +56 -0
lyrics_transcriber/frontend/src/components/shared/components/Word.tsx +87 -0
lyrics_transcriber/frontend/src/components/shared/constants.ts +20 -0
lyrics_transcriber/frontend/src/components/shared/hooks/useWordClick.ts +180 -0
lyrics_transcriber/frontend/src/components/shared/styles.ts +13 -0
lyrics_transcriber/frontend/src/components/shared/types.js +2 -0
lyrics_transcriber/frontend/src/components/shared/types.ts +129 -0
lyrics_transcriber/frontend/src/components/shared/utils/keyboardHandlers.ts +177 -0
lyrics_transcriber/frontend/src/components/shared/utils/localStorage.ts +78 -0
lyrics_transcriber/frontend/src/components/shared/utils/referenceLineCalculator.ts +75 -0
lyrics_transcriber/frontend/src/components/shared/utils/segmentOperations.ts +360 -0
lyrics_transcriber/frontend/src/components/shared/utils/timingUtils.ts +110 -0
lyrics_transcriber/frontend/src/components/shared/utils/wordUtils.ts +22 -0
lyrics_transcriber/frontend/src/hooks/useManualSync.ts +435 -0
lyrics_transcriber/frontend/src/main.tsx +17 -0
lyrics_transcriber/frontend/src/theme.ts +177 -0
lyrics_transcriber/frontend/src/types/global.d.ts +9 -0
lyrics_transcriber/frontend/src/types.js +2 -0
lyrics_transcriber/frontend/src/types.ts +199 -0
lyrics_transcriber/frontend/src/validation.ts +132 -0
lyrics_transcriber/frontend/src/vite-env.d.ts +1 -0
lyrics_transcriber/frontend/tsconfig.app.json +26 -0
lyrics_transcriber/frontend/tsconfig.json +25 -0
lyrics_transcriber/frontend/tsconfig.node.json +23 -0
lyrics_transcriber/frontend/tsconfig.tsbuildinfo +1 -0
lyrics_transcriber/frontend/update_version.js +11 -0
lyrics_transcriber/frontend/vite.config.d.ts +2 -0
lyrics_transcriber/frontend/vite.config.js +10 -0
lyrics_transcriber/frontend/vite.config.ts +11 -0
lyrics_transcriber/frontend/web_assets/android-chrome-192x192.png +0 -0
lyrics_transcriber/frontend/web_assets/android-chrome-512x512.png +0 -0
lyrics_transcriber/frontend/web_assets/apple-touch-icon.png +0 -0
lyrics_transcriber/frontend/web_assets/assets/index-BECn1o8Q.js +43288 -0
lyrics_transcriber/frontend/web_assets/assets/index-BECn1o8Q.js.map +1 -0
lyrics_transcriber/frontend/web_assets/favicon-16x16.png +0 -0
lyrics_transcriber/frontend/web_assets/favicon-32x32.png +0 -0
lyrics_transcriber/frontend/web_assets/favicon.ico +0 -0
lyrics_transcriber/frontend/web_assets/index.html +18 -0
lyrics_transcriber/frontend/web_assets/nomad-karaoke-logo.png +0 -0
lyrics_transcriber/frontend/yarn.lock +3752 -0
lyrics_transcriber/lyrics/__init__.py +0 -0
lyrics_transcriber/lyrics/base_lyrics_provider.py +211 -0
lyrics_transcriber/lyrics/file_provider.py +95 -0
lyrics_transcriber/lyrics/genius.py +384 -0
lyrics_transcriber/lyrics/lrclib.py +231 -0
lyrics_transcriber/lyrics/musixmatch.py +156 -0
lyrics_transcriber/lyrics/spotify.py +290 -0
lyrics_transcriber/lyrics/user_input_provider.py +44 -0
lyrics_transcriber/output/__init__.py +0 -0
lyrics_transcriber/output/ass/__init__.py +21 -0
lyrics_transcriber/output/ass/ass.py +2088 -0
lyrics_transcriber/output/ass/ass_specs.txt +732 -0
lyrics_transcriber/output/ass/config.py +180 -0
lyrics_transcriber/output/ass/constants.py +23 -0
lyrics_transcriber/output/ass/event.py +94 -0
lyrics_transcriber/output/ass/formatters.py +132 -0
lyrics_transcriber/output/ass/lyrics_line.py +265 -0
lyrics_transcriber/output/ass/lyrics_screen.py +252 -0
lyrics_transcriber/output/ass/section_detector.py +89 -0
lyrics_transcriber/output/ass/section_screen.py +106 -0
lyrics_transcriber/output/ass/style.py +187 -0
lyrics_transcriber/output/cdg.py +619 -0
lyrics_transcriber/output/cdgmaker/__init__.py +0 -0
lyrics_transcriber/output/cdgmaker/cdg.py +262 -0
lyrics_transcriber/output/cdgmaker/composer.py +2260 -0
lyrics_transcriber/output/cdgmaker/config.py +151 -0
lyrics_transcriber/output/cdgmaker/images/instrumental.png +0 -0
lyrics_transcriber/output/cdgmaker/images/intro.png +0 -0
lyrics_transcriber/output/cdgmaker/pack.py +507 -0
lyrics_transcriber/output/cdgmaker/render.py +346 -0
lyrics_transcriber/output/cdgmaker/transitions/centertexttoplogobottomtext.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/circlein.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/circleout.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/fizzle.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/largecentertexttoplogo.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/rectangle.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/spiral.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/topleftmusicalnotes.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/wipein.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/wipeleft.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/wipeout.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/wiperight.png +0 -0
lyrics_transcriber/output/cdgmaker/utils.py +132 -0
lyrics_transcriber/output/countdown_processor.py +306 -0
lyrics_transcriber/output/fonts/AvenirNext-Bold.ttf +0 -0
lyrics_transcriber/output/fonts/DMSans-VariableFont_opsz,wght.ttf +0 -0
lyrics_transcriber/output/fonts/DMSerifDisplay-Regular.ttf +0 -0
lyrics_transcriber/output/fonts/Oswald-SemiBold.ttf +0 -0
lyrics_transcriber/output/fonts/Zurich_Cn_BT_Bold.ttf +0 -0
lyrics_transcriber/output/fonts/arial.ttf +0 -0
lyrics_transcriber/output/fonts/georgia.ttf +0 -0
lyrics_transcriber/output/fonts/verdana.ttf +0 -0
lyrics_transcriber/output/generator.py +257 -0
lyrics_transcriber/output/lrc_to_cdg.py +61 -0
lyrics_transcriber/output/lyrics_file.py +102 -0
lyrics_transcriber/output/plain_text.py +96 -0
lyrics_transcriber/output/segment_resizer.py +431 -0
lyrics_transcriber/output/subtitles.py +397 -0
lyrics_transcriber/output/video.py +544 -0
lyrics_transcriber/review/__init__.py +0 -0
lyrics_transcriber/review/server.py +676 -0
lyrics_transcriber/storage/__init__.py +0 -0
lyrics_transcriber/storage/dropbox.py +225 -0
lyrics_transcriber/transcribers/__init__.py +0 -0
lyrics_transcriber/transcribers/audioshake.py +379 -0
lyrics_transcriber/transcribers/base_transcriber.py +157 -0
lyrics_transcriber/transcribers/whisper.py +330 -0
lyrics_transcriber/types.py +650 -0
lyrics_transcriber/utils/__init__.py +0 -0
lyrics_transcriber/utils/word_utils.py +27 -0

lyrics_transcriber/correction/agentic/providers/config.py ADDED Viewed

@@ -0,0 +1,73 @@
+from dataclasses import dataclass
+from typing import Optional
+import os
+def _env_number(name, default, cast):
+    """Return environment variable ``name`` converted with ``cast``.
+    Unset or blank variables fall back to ``default``; any other value that
+    ``cast`` rejects raises a ValueError naming the offending variable.
+    """
+    raw = os.getenv(name)
+    if raw is None or not raw.strip():
+        return default
+    try:
+        return cast(raw)
+    except ValueError as exc:
+        raise ValueError(f"Invalid value for {name}: {raw!r}") from exc
+@dataclass(frozen=True)
+class ProviderConfig:
+    """Centralized, immutable configuration for AI providers.
+    Values are loaded from environment variables to keep credentials out of code.
+    This module is safe to import during setup; it does not perform any network I/O.
+    """
+    # Provider credentials; None when the matching environment variable is unset.
+    openai_api_key: Optional[str]
+    anthropic_api_key: Optional[str]
+    google_api_key: Optional[str]
+    openrouter_api_key: Optional[str]
+    # When True, validate_environment() does not warn about missing API keys.
+    privacy_mode: bool
+    # Directory path handed to components that cache provider responses.
+    cache_dir: str
+    # Tuning knobs; each default mirrors the fallback used by from_env().
+    request_timeout_seconds: float = 30.0
+    max_retries: int = 2
+    retry_backoff_base_seconds: float = 0.2
+    retry_backoff_factor: float = 2.0
+    circuit_breaker_failure_threshold: int = 3
+    circuit_breaker_open_seconds: int = 60
+    @staticmethod
+    def from_env(cache_dir: Optional[str] = None) -> "ProviderConfig":
+        """Create config from environment variables.
+        Args:
+            cache_dir: Cache directory path. If None, uses LYRICS_TRANSCRIBER_CACHE_DIR
+                      env var or defaults to ~/lyrics-transcriber-cache
+        Returns:
+            A ProviderConfig populated from the current process environment.
+        Raises:
+            ValueError: If a numeric AGENTIC_* variable holds a non-numeric value.
+                Blank values are treated as unset and use the default.
+        """
+        if cache_dir is None:
+            cache_dir = os.getenv(
+                "LYRICS_TRANSCRIBER_CACHE_DIR",
+                os.path.join(os.path.expanduser("~"), "lyrics-transcriber-cache")
+            )
+        # Surrounding whitespace is ignored so values such as "true " still count.
+        privacy_flag = os.getenv("PRIVACY_MODE", "false").strip().lower()
+        return ProviderConfig(
+            openai_api_key=os.getenv("OPENAI_API_KEY"),
+            anthropic_api_key=os.getenv("ANTHROPIC_API_KEY"),
+            google_api_key=os.getenv("GOOGLE_API_KEY"),
+            openrouter_api_key=os.getenv("OPENROUTER_API_KEY"),
+            privacy_mode=privacy_flag in {"1", "true", "yes"},
+            cache_dir=cache_dir,
+            request_timeout_seconds=_env_number("AGENTIC_TIMEOUT_SECONDS", 30.0, float),
+            max_retries=_env_number("AGENTIC_MAX_RETRIES", 2, int),
+            retry_backoff_base_seconds=_env_number("AGENTIC_BACKOFF_BASE_SECONDS", 0.2, float),
+            retry_backoff_factor=_env_number("AGENTIC_BACKOFF_FACTOR", 2.0, float),
+            circuit_breaker_failure_threshold=_env_number("AGENTIC_CIRCUIT_THRESHOLD", 3, int),
+            circuit_breaker_open_seconds=_env_number("AGENTIC_CIRCUIT_OPEN_SECONDS", 60, int),
+        )
+    def validate_environment(self, logger: Optional[object] = None) -> None:
+        """Warn when no provider API key is configured outside privacy mode.
+        Args:
+            logger: Object exposing ``warning(msg)``. When None the message is
+                printed to stdout instead.
+        """
+        if self.privacy_mode:
+            return
+        if any([self.openai_api_key, self.anthropic_api_key, self.google_api_key, self.openrouter_api_key]):
+            return
+        message = "No AI provider API keys configured; set PRIVACY_MODE=1 to avoid cloud usage or add provider keys."
+        try:
+            if logger is not None:
+                logger.warning(message)
+            else:
+                print(message)
+        except Exception:
+            # Deliberate best-effort: a broken logger must never abort setup.
+            pass

lyrics_transcriber/correction/agentic/providers/constants.py ADDED Viewed

@@ -0,0 +1,24 @@
+"""Constants for the agentic correction providers module."""
+# Logging constants: caps on how much prompt/response text is written to logs
+PROMPT_LOG_LENGTH = 200  # Maximum number of prompt characters included in a log line
+RESPONSE_LOG_LENGTH = 500  # Maximum number of response characters included in a log line
+# Model specification format
+MODEL_SPEC_FORMAT = "provider/model"  # Expected format for model identifiers, e.g. "openai/gpt-4"
+# Default Langfuse host
+DEFAULT_LANGFUSE_HOST = "https://cloud.langfuse.com"
+# Raw response indicator
+RAW_RESPONSE_KEY = "raw"  # Key used to wrap unparsed responses
+# Error response keys: dictionary keys for the error code and its human-readable detail
+ERROR_KEY = "error"
+ERROR_MESSAGE_KEY = "message"
+# Error codes reported under the "error" key of a failure dict. Only the first
+# is circuit-breaker specific; the others cover model construction and
+# provider invocation failures.
+CIRCUIT_OPEN_ERROR = "circuit_open"
+MODEL_INIT_ERROR = "model_init_failed"
+PROVIDER_ERROR = "provider_error"

lyrics_transcriber/correction/agentic/providers/health.py ADDED Viewed

@@ -0,0 +1,28 @@
+from typing import List, Dict, Any
+def is_ollama_available() -> bool:
+    """Report whether a local Ollama server answers a basic list() request.
+    Any failure (client package not installed, server unreachable, unexpected
+    error) is reported as False, so this is safe to call during setup.
+    """
+    try:
+        import ollama  # type: ignore
+        ollama.list()
+    except Exception:
+        return False
+    return True
+def get_ollama_models() -> List[Dict[str, Any]]:
+    """Return available local models from Ollama if available; otherwise empty list.
+    Both response shapes are accepted: a plain dict with a "models" key, and a
+    response object exposing a ``models`` attribute (NOTE(review): newer
+    ollama-python clients appear to return the latter - confirm against the
+    pinned client version). Non-dict entries are converted with their
+    ``model_dump()`` method when they have one and skipped otherwise.
+    Returns:
+        A list of model description dicts; empty on any failure.
+    """
+    try:
+        import ollama  # type: ignore
+        data = ollama.list()
+        if isinstance(data, dict):
+            entries = data.get("models")
+        else:
+            entries = getattr(data, "models", None)
+        models: List[Dict[str, Any]] = []
+        # "entries or []" also covers a present-but-None "models" value.
+        for entry in entries or []:
+            if isinstance(entry, dict):
+                models.append(entry)
+            elif callable(getattr(entry, "model_dump", None)):
+                models.append(entry.model_dump())
+        return models
+    except Exception:
+        return []

lyrics_transcriber/correction/agentic/providers/langchain_bridge.py ADDED Viewed

@@ -0,0 +1,212 @@
+"""Refactored LangChain-based provider bridge using composition.
+This is a much cleaner version that delegates to specialized components:
+- ModelFactory: Creates ChatModels
+- CircuitBreaker: Manages failure state
+- ResponseParser: Parses responses
+- RetryExecutor: Handles retry logic
+- ResponseCache: Caches LLM responses to avoid redundant calls
+Each component has a single responsibility and is independently testable.
+"""
+from __future__ import annotations
+import logging
+import os
+from typing import List, Dict, Any, Optional
+from datetime import datetime
+from .base import BaseAIProvider
+from .config import ProviderConfig
+from .model_factory import ModelFactory
+from .circuit_breaker import CircuitBreaker
+from .response_parser import ResponseParser
+from .retry_executor import RetryExecutor
+from .response_cache import ResponseCache
+from .constants import (
+    PROMPT_LOG_LENGTH,
+    RESPONSE_LOG_LENGTH,
+    CIRCUIT_OPEN_ERROR,
+    MODEL_INIT_ERROR,
+    PROVIDER_ERROR,
+)
+logger = logging.getLogger(__name__)
+class LangChainBridge(BaseAIProvider):
+    """Provider bridge using LangChain ChatModels with reliability patterns.
+    The bridge orchestrates specialized components rather than handling
+    everything itself, which keeps each concern independently testable.
+    Components:
+        - ModelFactory: Creates and configures ChatModels
+        - CircuitBreaker: Protects against cascading failures
+        - ResponseParser: Handles JSON/raw response parsing
+        - RetryExecutor: Implements exponential backoff
+        - ResponseCache: Stores raw responses keyed by prompt and model
+    """
+    def __init__(
+        self,
+        model: str,
+        config: ProviderConfig | None = None,
+        model_factory: ModelFactory | None = None,
+        circuit_breaker: CircuitBreaker | None = None,
+        response_parser: ResponseParser | None = None,
+        retry_executor: RetryExecutor | None = None,
+        response_cache: ResponseCache | None = None,
+    ):
+        """Initialize the bridge with components (dependency injection).
+        Args:
+            model: Model identifier in format "provider/model"
+            config: Provider configuration (creates default if None)
+            model_factory: Factory for creating ChatModels (creates default if None)
+            circuit_breaker: Circuit breaker instance (creates default if None)
+            response_parser: Response parser instance (creates default if None)
+            retry_executor: Retry executor instance (creates default if None)
+            response_cache: Response cache instance (creates default if None)
+        """
+        self._model = model
+        # Compare against None explicitly so an injected component that happens
+        # to be falsy (e.g. an empty container-like cache) is still honoured.
+        self._config = config if config is not None else ProviderConfig.from_env()
+        self._factory = model_factory if model_factory is not None else ModelFactory()
+        self._circuit_breaker = (
+            circuit_breaker if circuit_breaker is not None else CircuitBreaker(self._config)
+        )
+        self._parser = response_parser if response_parser is not None else ResponseParser()
+        self._executor = (
+            retry_executor if retry_executor is not None else RetryExecutor(self._config)
+        )
+        if response_cache is None:
+            # Cache is enabled by default; DISABLE_LLM_CACHE=1/true/yes turns it off.
+            cache_enabled = os.getenv("DISABLE_LLM_CACHE", "0").lower() not in {"1", "true", "yes"}
+            response_cache = ResponseCache(
+                cache_dir=self._config.cache_dir,
+                enabled=cache_enabled
+            )
+        self._cache = response_cache
+        # Lazy-initialized chat model
+        self._chat_model: Optional[Any] = None
+        # Langfuse session id of the call in progress; read by _invoke_model
+        self._session_id: Optional[str] = None
+    def name(self) -> str:
+        """Return provider name for logging."""
+        return f"langchain:{self._model}"
+    def generate_correction_proposals(
+        self,
+        prompt: str,
+        schema: Dict[str, Any],
+        session_id: str | None = None
+    ) -> List[Dict[str, Any]]:
+        """Generate correction proposals using LangChain ChatModel.
+        Order of operations: cache lookup, circuit-breaker check, lazy model
+        creation, invocation through the retry executor, then caching and
+        parsing of the raw response.
+        Args:
+            prompt: The correction prompt
+            schema: Pydantic schema for structured output (for future use;
+                not read by this method)
+            session_id: Optional Langfuse session ID for grouping traces
+        Returns:
+            List of correction proposal dictionaries, or a single-item list
+            holding an error dict ("error" plus "until" or "message") on failure
+        """
+        from datetime import timezone
+        # Store session_id for use in _invoke_model
+        self._session_id = session_id
+        # Step 0: Check cache first
+        cached_response = self._cache.get(prompt, self._model)
+        if cached_response:
+            parsed = self._parser.parse(cached_response)
+            logger.debug("🎯 Using cached response (%d items)", len(parsed))
+            return parsed
+        # Step 1: Check circuit breaker
+        if self._circuit_breaker.is_open(self._model):
+            open_until = self._circuit_breaker.get_open_until(self._model)
+            return [{
+                "error": CIRCUIT_OPEN_ERROR,
+                "until": open_until
+            }]
+        # Step 2: Get or create chat model
+        if self._chat_model is None:
+            try:
+                self._chat_model = self._factory.create_chat_model(
+                    self._model,
+                    self._config
+                )
+            except Exception as e:
+                # A model that cannot be built counts as a provider failure.
+                self._circuit_breaker.record_failure(self._model)
+                logger.error("🤖 Failed to initialize chat model: %s", e)
+                return [{
+                    "error": MODEL_INIT_ERROR,
+                    "message": str(e)
+                }]
+        # Step 3: Execute with retry logic
+        logger.debug(
+            "🤖 [LangChain] Sending prompt to %s: %s...",
+            self._model,
+            prompt[:PROMPT_LOG_LENGTH],
+        )
+        result = self._executor.execute_with_retry(
+            operation=lambda: self._invoke_model(prompt),
+            operation_name=f"invoke_{self._model}"
+        )
+        # Step 4: Handle result and update circuit breaker
+        if not result.success:
+            self._circuit_breaker.record_failure(self._model)
+            return [{
+                "error": PROVIDER_ERROR,
+                "message": result.error or "unknown"
+            }]
+        self._circuit_breaker.record_success(self._model)
+        logger.info(
+            "🤖 [LangChain] Got response from %s: %s...",
+            self._model,
+            result.value[:RESPONSE_LOG_LENGTH],
+        )
+        # Step 5: Cache the raw response for future use
+        self._cache.set(
+            prompt=prompt,
+            model=self._model,
+            response=result.value,
+            metadata={
+                "session_id": session_id,
+                # Timezone-aware UTC; datetime.utcnow() is deprecated and naive.
+                "timestamp": datetime.now(timezone.utc).isoformat()
+            }
+        )
+        # Step 6: Parse response
+        return self._parser.parse(result.value)
+    @staticmethod
+    def _content_to_text(content: Any) -> str:
+        """Flatten LangChain message content into plain text.
+        Message content may be a string or a list of content blocks; list
+        entries that are strings or ``{"type": "text"}`` dicts are joined and
+        every other block type is ignored.
+        """
+        if isinstance(content, str):
+            return content
+        if isinstance(content, list):
+            parts = []
+            for block in content:
+                if isinstance(block, str):
+                    parts.append(block)
+                elif isinstance(block, dict) and block.get("type") == "text":
+                    parts.append(str(block.get("text", "")))
+            return "".join(parts)
+        return str(content)
+    def _invoke_model(self, prompt: str) -> str:
+        """Invoke the chat model with a prompt.
+        This is a simple wrapper that can be passed to the retry executor.
+        Args:
+            prompt: The prompt to send
+        Returns:
+            Response content as string
+        Raises:
+            Exception: Any error from the model invocation
+        """
+        from langchain_core.messages import HumanMessage
+        # Prepare config with session_id in metadata (Langfuse format)
+        config = {}
+        # getattr keeps this safe for instances created without __init__
+        session_id = getattr(self, "_session_id", None)
+        if session_id:
+            config["metadata"] = {"langfuse_session_id": session_id}
+            logger.debug("🤖 [LangChain] Invoking with session_id: %s", session_id)
+        response = self._chat_model.invoke([HumanMessage(content=prompt)], config=config)
+        return self._content_to_text(response.content)

lyrics_transcriber/correction/agentic/providers/model_factory.py ADDED Viewed

@@ -0,0 +1,209 @@
+"""Factory for creating LangChain ChatModels with Langfuse callbacks."""
+from __future__ import annotations
+import logging
+import os
+from typing import Any, Optional, List
+from .config import ProviderConfig
+logger = logging.getLogger(__name__)
+class ModelFactory:
+    """Creates and configures LangChain ChatModels with observability.
+    This factory handles:
+    - Parsing model specifications ("provider/model" format)
+    - Creating Langfuse callbacks when configured
+    - Instantiating the appropriate ChatModel for each provider
+    Single Responsibility: Model creation only, no execution or state management.
+    """
+    def __init__(self):
+        self._langfuse_handler: Optional[Any] = None
+        self._langfuse_initialized = False
+    def create_chat_model(self, model_spec: str, config: ProviderConfig) -> Any:
+        """Create a ChatModel from a model specification.
+        Args:
+            model_spec: Model identifier in format "provider/model"
+                       e.g. "ollama/gpt-oss:latest", "openai/gpt-4"
+            config: Provider configuration with timeouts, retries, etc.
+        Returns:
+            Configured LangChain ChatModel instance
+        Raises:
+            ValueError: If model_spec format is invalid or provider unsupported
+        """
+        provider, model_name = self._parse_model_spec(model_spec)
+        callbacks = self._create_callbacks(model_spec)
+        return self._instantiate_model(provider, model_name, callbacks, config)
+    def _parse_model_spec(self, spec: str) -> tuple[str, str]:
+        """Parse model specification into provider and model name.
+        Args:
+            spec: Model spec in format "provider/model"
+        Returns:
+            Tuple of (provider, model_name)
+        Raises:
+            ValueError: If format is invalid
+        """
+        parts = spec.split("/", 1)
+        if len(parts) != 2:
+            raise ValueError(
+                f"Model spec must be in format 'provider/model', got: {spec}"
+            )
+        return parts[0], parts[1]
+    def _create_callbacks(self, model_spec: str) -> List[Any]:
+        """Create Langfuse callback handlers if configured.
+        Args:
+            model_spec: Model specification for logging
+        Returns:
+            List of callback handlers (may be empty)
+        """
+        # Only initialize Langfuse once
+        if not self._langfuse_initialized:
+            self._initialize_langfuse(model_spec)
+            self._langfuse_initialized = True
+        return [self._langfuse_handler] if self._langfuse_handler else []
+    def _initialize_langfuse(self, model_spec: str) -> None:
+        """Initialize Langfuse callback handler if keys are present.
+        Langfuse reads credentials from environment variables automatically:
+        - LANGFUSE_PUBLIC_KEY
+        - LANGFUSE_SECRET_KEY
+        - LANGFUSE_HOST (optional)
+        Args:
+            model_spec: Model specification for logging
+        Raises:
+            RuntimeError: If Langfuse keys are set but initialization fails
+        """
+        public_key = os.getenv("LANGFUSE_PUBLIC_KEY")
+        secret_key = os.getenv("LANGFUSE_SECRET_KEY")
+        if not (public_key and secret_key):
+            logger.debug("🤖 Langfuse keys not found, tracing disabled")
+            return
+        try:
+            from langfuse import Langfuse
+            from langfuse.langchain import CallbackHandler
+            # Initialize Langfuse client first (this is required!)
+            langfuse_client = Langfuse(
+                public_key=public_key,
+                secret_key=secret_key,
+                host=os.getenv("LANGFUSE_HOST", "https://cloud.langfuse.com"),
+            )
+            # Then create callback handler with the same public_key
+            # The handler will use the initialized client
+            self._langfuse_handler = CallbackHandler(public_key=public_key)
+            logger.info(f"🤖 Langfuse callback handler initialized for {model_spec}")
+        except Exception as e:
+            # If Langfuse keys are set, we MUST fail fast
+            raise RuntimeError(
+                f"Langfuse keys are set but initialization failed: {e}\n"
+                f"This indicates a configuration or dependency problem.\n"
+                f"Check:\n"
+                f"  - LANGFUSE_PUBLIC_KEY: {public_key[:10]}...\n"
+                f"  - LANGFUSE_SECRET_KEY: {'set' if secret_key else 'not set'}\n"
+                f"  - LANGFUSE_HOST: {os.getenv('LANGFUSE_HOST', 'default')}\n"
+                f"  - langfuse package version: pip show langfuse"
+            ) from e
+    def _instantiate_model(
+        self,
+        provider: str,
+        model_name: str,
+        callbacks: List[Any],
+        config: ProviderConfig
+    ) -> Any:
+        """Instantiate the appropriate ChatModel for the provider.
+        Args:
+            provider: Provider name (ollama, openai, anthropic)
+            model_name: Model name within that provider
+            callbacks: List of callback handlers
+            config: Provider configuration
+        Returns:
+            Configured ChatModel instance
+        Raises:
+            ValueError: If provider is not supported
+            ImportError: If provider package is not installed
+        """
+        try:
+            if provider == "ollama":
+                return self._create_ollama_model(model_name, callbacks, config)
+            elif provider == "openai":
+                return self._create_openai_model(model_name, callbacks, config)
+            elif provider == "anthropic":
+                return self._create_anthropic_model(model_name, callbacks, config)
+            else:
+                raise ValueError(f"Unsupported provider: {provider}")
+        except ImportError as e:
+            raise ImportError(
+                f"Failed to import {provider} provider. "
+                f"Install with: pip install langchain-{provider}"
+            ) from e
+    def _create_ollama_model(
+        self, model_name: str, callbacks: List[Any], config: ProviderConfig
+    ) -> Any:
+        """Create ChatOllama model."""
+        from langchain_ollama import ChatOllama
+        model = ChatOllama(
+            model=model_name,
+            timeout=config.request_timeout_seconds,
+            callbacks=callbacks,
+        )
+        logger.debug(f"🤖 Created Ollama model: {model_name}")
+        return model
+    def _create_openai_model(
+        self, model_name: str, callbacks: List[Any], config: ProviderConfig
+    ) -> Any:
+        """Create ChatOpenAI model."""
+        from langchain_openai import ChatOpenAI
+        model = ChatOpenAI(
+            model=model_name,
+            timeout=config.request_timeout_seconds,
+            max_retries=config.max_retries,
+            callbacks=callbacks,
+        )
+        logger.debug(f"🤖 Created OpenAI model: {model_name}")
+        return model
+    def _create_anthropic_model(
+        self, model_name: str, callbacks: List[Any], config: ProviderConfig
+    ) -> Any:
+        """Create ChatAnthropic model."""
+        from langchain_anthropic import ChatAnthropic
+        model = ChatAnthropic(
+            model=model_name,
+            timeout=config.request_timeout_seconds,
+            max_retries=config.max_retries,
+            callbacks=callbacks,
+        )
+        logger.debug(f"🤖 Created Anthropic model: {model_name}")
+        return model