karaoke-gen 0.57.0__py3-none-any.whl → 0.71.23__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (268)
  1. karaoke_gen/audio_fetcher.py +461 -0
  2. karaoke_gen/audio_processor.py +407 -30
  3. karaoke_gen/config.py +62 -113
  4. karaoke_gen/file_handler.py +32 -59
  5. karaoke_gen/karaoke_finalise/karaoke_finalise.py +148 -67
  6. karaoke_gen/karaoke_gen.py +270 -61
  7. karaoke_gen/lyrics_processor.py +13 -1
  8. karaoke_gen/metadata.py +78 -73
  9. karaoke_gen/pipeline/__init__.py +87 -0
  10. karaoke_gen/pipeline/base.py +215 -0
  11. karaoke_gen/pipeline/context.py +230 -0
  12. karaoke_gen/pipeline/executors/__init__.py +21 -0
  13. karaoke_gen/pipeline/executors/local.py +159 -0
  14. karaoke_gen/pipeline/executors/remote.py +257 -0
  15. karaoke_gen/pipeline/stages/__init__.py +27 -0
  16. karaoke_gen/pipeline/stages/finalize.py +202 -0
  17. karaoke_gen/pipeline/stages/render.py +165 -0
  18. karaoke_gen/pipeline/stages/screens.py +139 -0
  19. karaoke_gen/pipeline/stages/separation.py +191 -0
  20. karaoke_gen/pipeline/stages/transcription.py +191 -0
  21. karaoke_gen/style_loader.py +531 -0
  22. karaoke_gen/utils/bulk_cli.py +6 -0
  23. karaoke_gen/utils/cli_args.py +424 -0
  24. karaoke_gen/utils/gen_cli.py +26 -261
  25. karaoke_gen/utils/remote_cli.py +1815 -0
  26. karaoke_gen/video_background_processor.py +351 -0
  27. karaoke_gen-0.71.23.dist-info/METADATA +610 -0
  28. karaoke_gen-0.71.23.dist-info/RECORD +275 -0
  29. {karaoke_gen-0.57.0.dist-info → karaoke_gen-0.71.23.dist-info}/WHEEL +1 -1
  30. {karaoke_gen-0.57.0.dist-info → karaoke_gen-0.71.23.dist-info}/entry_points.txt +1 -0
  31. lyrics_transcriber/__init__.py +10 -0
  32. lyrics_transcriber/cli/__init__.py +0 -0
  33. lyrics_transcriber/cli/cli_main.py +285 -0
  34. lyrics_transcriber/core/__init__.py +0 -0
  35. lyrics_transcriber/core/config.py +50 -0
  36. lyrics_transcriber/core/controller.py +520 -0
  37. lyrics_transcriber/correction/__init__.py +0 -0
  38. lyrics_transcriber/correction/agentic/__init__.py +9 -0
  39. lyrics_transcriber/correction/agentic/adapter.py +71 -0
  40. lyrics_transcriber/correction/agentic/agent.py +313 -0
  41. lyrics_transcriber/correction/agentic/feedback/aggregator.py +12 -0
  42. lyrics_transcriber/correction/agentic/feedback/collector.py +17 -0
  43. lyrics_transcriber/correction/agentic/feedback/retention.py +24 -0
  44. lyrics_transcriber/correction/agentic/feedback/store.py +76 -0
  45. lyrics_transcriber/correction/agentic/handlers/__init__.py +24 -0
  46. lyrics_transcriber/correction/agentic/handlers/ambiguous.py +44 -0
  47. lyrics_transcriber/correction/agentic/handlers/background_vocals.py +68 -0
  48. lyrics_transcriber/correction/agentic/handlers/base.py +51 -0
  49. lyrics_transcriber/correction/agentic/handlers/complex_multi_error.py +46 -0
  50. lyrics_transcriber/correction/agentic/handlers/extra_words.py +74 -0
  51. lyrics_transcriber/correction/agentic/handlers/no_error.py +42 -0
  52. lyrics_transcriber/correction/agentic/handlers/punctuation.py +44 -0
  53. lyrics_transcriber/correction/agentic/handlers/registry.py +60 -0
  54. lyrics_transcriber/correction/agentic/handlers/repeated_section.py +44 -0
  55. lyrics_transcriber/correction/agentic/handlers/sound_alike.py +126 -0
  56. lyrics_transcriber/correction/agentic/models/__init__.py +5 -0
  57. lyrics_transcriber/correction/agentic/models/ai_correction.py +31 -0
  58. lyrics_transcriber/correction/agentic/models/correction_session.py +30 -0
  59. lyrics_transcriber/correction/agentic/models/enums.py +38 -0
  60. lyrics_transcriber/correction/agentic/models/human_feedback.py +30 -0
  61. lyrics_transcriber/correction/agentic/models/learning_data.py +26 -0
  62. lyrics_transcriber/correction/agentic/models/observability_metrics.py +28 -0
  63. lyrics_transcriber/correction/agentic/models/schemas.py +46 -0
  64. lyrics_transcriber/correction/agentic/models/utils.py +19 -0
  65. lyrics_transcriber/correction/agentic/observability/__init__.py +5 -0
  66. lyrics_transcriber/correction/agentic/observability/langfuse_integration.py +35 -0
  67. lyrics_transcriber/correction/agentic/observability/metrics.py +46 -0
  68. lyrics_transcriber/correction/agentic/observability/performance.py +19 -0
  69. lyrics_transcriber/correction/agentic/prompts/__init__.py +2 -0
  70. lyrics_transcriber/correction/agentic/prompts/classifier.py +227 -0
  71. lyrics_transcriber/correction/agentic/providers/__init__.py +6 -0
  72. lyrics_transcriber/correction/agentic/providers/base.py +36 -0
  73. lyrics_transcriber/correction/agentic/providers/circuit_breaker.py +145 -0
  74. lyrics_transcriber/correction/agentic/providers/config.py +73 -0
  75. lyrics_transcriber/correction/agentic/providers/constants.py +24 -0
  76. lyrics_transcriber/correction/agentic/providers/health.py +28 -0
  77. lyrics_transcriber/correction/agentic/providers/langchain_bridge.py +212 -0
  78. lyrics_transcriber/correction/agentic/providers/model_factory.py +209 -0
  79. lyrics_transcriber/correction/agentic/providers/response_cache.py +218 -0
  80. lyrics_transcriber/correction/agentic/providers/response_parser.py +111 -0
  81. lyrics_transcriber/correction/agentic/providers/retry_executor.py +127 -0
  82. lyrics_transcriber/correction/agentic/router.py +35 -0
  83. lyrics_transcriber/correction/agentic/workflows/__init__.py +5 -0
  84. lyrics_transcriber/correction/agentic/workflows/consensus_workflow.py +24 -0
  85. lyrics_transcriber/correction/agentic/workflows/correction_graph.py +59 -0
  86. lyrics_transcriber/correction/agentic/workflows/feedback_workflow.py +24 -0
  87. lyrics_transcriber/correction/anchor_sequence.py +1043 -0
  88. lyrics_transcriber/correction/corrector.py +760 -0
  89. lyrics_transcriber/correction/feedback/__init__.py +2 -0
  90. lyrics_transcriber/correction/feedback/schemas.py +107 -0
  91. lyrics_transcriber/correction/feedback/store.py +236 -0
  92. lyrics_transcriber/correction/handlers/__init__.py +0 -0
  93. lyrics_transcriber/correction/handlers/base.py +52 -0
  94. lyrics_transcriber/correction/handlers/extend_anchor.py +149 -0
  95. lyrics_transcriber/correction/handlers/levenshtein.py +189 -0
  96. lyrics_transcriber/correction/handlers/llm.py +293 -0
  97. lyrics_transcriber/correction/handlers/llm_providers.py +60 -0
  98. lyrics_transcriber/correction/handlers/no_space_punct_match.py +154 -0
  99. lyrics_transcriber/correction/handlers/relaxed_word_count_match.py +85 -0
  100. lyrics_transcriber/correction/handlers/repeat.py +88 -0
  101. lyrics_transcriber/correction/handlers/sound_alike.py +259 -0
  102. lyrics_transcriber/correction/handlers/syllables_match.py +252 -0
  103. lyrics_transcriber/correction/handlers/word_count_match.py +80 -0
  104. lyrics_transcriber/correction/handlers/word_operations.py +187 -0
  105. lyrics_transcriber/correction/operations.py +352 -0
  106. lyrics_transcriber/correction/phrase_analyzer.py +435 -0
  107. lyrics_transcriber/correction/text_utils.py +30 -0
  108. lyrics_transcriber/frontend/.gitignore +23 -0
  109. lyrics_transcriber/frontend/.yarn/releases/yarn-4.7.0.cjs +935 -0
  110. lyrics_transcriber/frontend/.yarnrc.yml +3 -0
  111. lyrics_transcriber/frontend/README.md +50 -0
  112. lyrics_transcriber/frontend/REPLACE_ALL_FUNCTIONALITY.md +210 -0
  113. lyrics_transcriber/frontend/__init__.py +25 -0
  114. lyrics_transcriber/frontend/eslint.config.js +28 -0
  115. lyrics_transcriber/frontend/index.html +18 -0
  116. lyrics_transcriber/frontend/package.json +42 -0
  117. lyrics_transcriber/frontend/public/android-chrome-192x192.png +0 -0
  118. lyrics_transcriber/frontend/public/android-chrome-512x512.png +0 -0
  119. lyrics_transcriber/frontend/public/apple-touch-icon.png +0 -0
  120. lyrics_transcriber/frontend/public/favicon-16x16.png +0 -0
  121. lyrics_transcriber/frontend/public/favicon-32x32.png +0 -0
  122. lyrics_transcriber/frontend/public/favicon.ico +0 -0
  123. lyrics_transcriber/frontend/public/nomad-karaoke-logo.png +0 -0
  124. lyrics_transcriber/frontend/src/App.tsx +212 -0
  125. lyrics_transcriber/frontend/src/api.ts +239 -0
  126. lyrics_transcriber/frontend/src/components/AIFeedbackModal.tsx +77 -0
  127. lyrics_transcriber/frontend/src/components/AddLyricsModal.tsx +114 -0
  128. lyrics_transcriber/frontend/src/components/AgenticCorrectionMetrics.tsx +204 -0
  129. lyrics_transcriber/frontend/src/components/AudioPlayer.tsx +180 -0
  130. lyrics_transcriber/frontend/src/components/CorrectedWordWithActions.tsx +167 -0
  131. lyrics_transcriber/frontend/src/components/CorrectionAnnotationModal.tsx +359 -0
  132. lyrics_transcriber/frontend/src/components/CorrectionDetailCard.tsx +281 -0
  133. lyrics_transcriber/frontend/src/components/CorrectionMetrics.tsx +162 -0
  134. lyrics_transcriber/frontend/src/components/DurationTimelineView.tsx +257 -0
  135. lyrics_transcriber/frontend/src/components/EditActionBar.tsx +68 -0
  136. lyrics_transcriber/frontend/src/components/EditModal.tsx +702 -0
  137. lyrics_transcriber/frontend/src/components/EditTimelineSection.tsx +496 -0
  138. lyrics_transcriber/frontend/src/components/EditWordList.tsx +379 -0
  139. lyrics_transcriber/frontend/src/components/FileUpload.tsx +77 -0
  140. lyrics_transcriber/frontend/src/components/FindReplaceModal.tsx +467 -0
  141. lyrics_transcriber/frontend/src/components/Header.tsx +387 -0
  142. lyrics_transcriber/frontend/src/components/LyricsAnalyzer.tsx +1373 -0
  143. lyrics_transcriber/frontend/src/components/MetricsDashboard.tsx +51 -0
  144. lyrics_transcriber/frontend/src/components/ModeSelector.tsx +67 -0
  145. lyrics_transcriber/frontend/src/components/ModelSelector.tsx +23 -0
  146. lyrics_transcriber/frontend/src/components/PreviewVideoSection.tsx +144 -0
  147. lyrics_transcriber/frontend/src/components/ReferenceView.tsx +268 -0
  148. lyrics_transcriber/frontend/src/components/ReplaceAllLyricsModal.tsx +688 -0
  149. lyrics_transcriber/frontend/src/components/ReviewChangesModal.tsx +354 -0
  150. lyrics_transcriber/frontend/src/components/SegmentDetailsModal.tsx +64 -0
  151. lyrics_transcriber/frontend/src/components/TimelineEditor.tsx +376 -0
  152. lyrics_transcriber/frontend/src/components/TimingOffsetModal.tsx +131 -0
  153. lyrics_transcriber/frontend/src/components/TranscriptionView.tsx +256 -0
  154. lyrics_transcriber/frontend/src/components/WordDivider.tsx +187 -0
  155. lyrics_transcriber/frontend/src/components/shared/components/HighlightedText.tsx +379 -0
  156. lyrics_transcriber/frontend/src/components/shared/components/SourceSelector.tsx +56 -0
  157. lyrics_transcriber/frontend/src/components/shared/components/Word.tsx +87 -0
  158. lyrics_transcriber/frontend/src/components/shared/constants.ts +20 -0
  159. lyrics_transcriber/frontend/src/components/shared/hooks/useWordClick.ts +180 -0
  160. lyrics_transcriber/frontend/src/components/shared/styles.ts +13 -0
  161. lyrics_transcriber/frontend/src/components/shared/types.js +2 -0
  162. lyrics_transcriber/frontend/src/components/shared/types.ts +129 -0
  163. lyrics_transcriber/frontend/src/components/shared/utils/keyboardHandlers.ts +177 -0
  164. lyrics_transcriber/frontend/src/components/shared/utils/localStorage.ts +78 -0
  165. lyrics_transcriber/frontend/src/components/shared/utils/referenceLineCalculator.ts +75 -0
  166. lyrics_transcriber/frontend/src/components/shared/utils/segmentOperations.ts +360 -0
  167. lyrics_transcriber/frontend/src/components/shared/utils/timingUtils.ts +110 -0
  168. lyrics_transcriber/frontend/src/components/shared/utils/wordUtils.ts +22 -0
  169. lyrics_transcriber/frontend/src/hooks/useManualSync.ts +435 -0
  170. lyrics_transcriber/frontend/src/main.tsx +17 -0
  171. lyrics_transcriber/frontend/src/theme.ts +177 -0
  172. lyrics_transcriber/frontend/src/types/global.d.ts +9 -0
  173. lyrics_transcriber/frontend/src/types.js +2 -0
  174. lyrics_transcriber/frontend/src/types.ts +199 -0
  175. lyrics_transcriber/frontend/src/validation.ts +132 -0
  176. lyrics_transcriber/frontend/src/vite-env.d.ts +1 -0
  177. lyrics_transcriber/frontend/tsconfig.app.json +26 -0
  178. lyrics_transcriber/frontend/tsconfig.json +25 -0
  179. lyrics_transcriber/frontend/tsconfig.node.json +23 -0
  180. lyrics_transcriber/frontend/tsconfig.tsbuildinfo +1 -0
  181. lyrics_transcriber/frontend/update_version.js +11 -0
  182. lyrics_transcriber/frontend/vite.config.d.ts +2 -0
  183. lyrics_transcriber/frontend/vite.config.js +10 -0
  184. lyrics_transcriber/frontend/vite.config.ts +11 -0
  185. lyrics_transcriber/frontend/web_assets/android-chrome-192x192.png +0 -0
  186. lyrics_transcriber/frontend/web_assets/android-chrome-512x512.png +0 -0
  187. lyrics_transcriber/frontend/web_assets/apple-touch-icon.png +0 -0
  188. lyrics_transcriber/frontend/web_assets/assets/index-DdJTDWH3.js +42039 -0
  189. lyrics_transcriber/frontend/web_assets/assets/index-DdJTDWH3.js.map +1 -0
  190. lyrics_transcriber/frontend/web_assets/favicon-16x16.png +0 -0
  191. lyrics_transcriber/frontend/web_assets/favicon-32x32.png +0 -0
  192. lyrics_transcriber/frontend/web_assets/favicon.ico +0 -0
  193. lyrics_transcriber/frontend/web_assets/index.html +18 -0
  194. lyrics_transcriber/frontend/web_assets/nomad-karaoke-logo.png +0 -0
  195. lyrics_transcriber/frontend/yarn.lock +3752 -0
  196. lyrics_transcriber/lyrics/__init__.py +0 -0
  197. lyrics_transcriber/lyrics/base_lyrics_provider.py +211 -0
  198. lyrics_transcriber/lyrics/file_provider.py +95 -0
  199. lyrics_transcriber/lyrics/genius.py +384 -0
  200. lyrics_transcriber/lyrics/lrclib.py +231 -0
  201. lyrics_transcriber/lyrics/musixmatch.py +156 -0
  202. lyrics_transcriber/lyrics/spotify.py +290 -0
  203. lyrics_transcriber/lyrics/user_input_provider.py +44 -0
  204. lyrics_transcriber/output/__init__.py +0 -0
  205. lyrics_transcriber/output/ass/__init__.py +21 -0
  206. lyrics_transcriber/output/ass/ass.py +2088 -0
  207. lyrics_transcriber/output/ass/ass_specs.txt +732 -0
  208. lyrics_transcriber/output/ass/config.py +180 -0
  209. lyrics_transcriber/output/ass/constants.py +23 -0
  210. lyrics_transcriber/output/ass/event.py +94 -0
  211. lyrics_transcriber/output/ass/formatters.py +132 -0
  212. lyrics_transcriber/output/ass/lyrics_line.py +265 -0
  213. lyrics_transcriber/output/ass/lyrics_screen.py +252 -0
  214. lyrics_transcriber/output/ass/section_detector.py +89 -0
  215. lyrics_transcriber/output/ass/section_screen.py +106 -0
  216. lyrics_transcriber/output/ass/style.py +187 -0
  217. lyrics_transcriber/output/cdg.py +619 -0
  218. lyrics_transcriber/output/cdgmaker/__init__.py +0 -0
  219. lyrics_transcriber/output/cdgmaker/cdg.py +262 -0
  220. lyrics_transcriber/output/cdgmaker/composer.py +2260 -0
  221. lyrics_transcriber/output/cdgmaker/config.py +151 -0
  222. lyrics_transcriber/output/cdgmaker/images/instrumental.png +0 -0
  223. lyrics_transcriber/output/cdgmaker/images/intro.png +0 -0
  224. lyrics_transcriber/output/cdgmaker/pack.py +507 -0
  225. lyrics_transcriber/output/cdgmaker/render.py +346 -0
  226. lyrics_transcriber/output/cdgmaker/transitions/centertexttoplogobottomtext.png +0 -0
  227. lyrics_transcriber/output/cdgmaker/transitions/circlein.png +0 -0
  228. lyrics_transcriber/output/cdgmaker/transitions/circleout.png +0 -0
  229. lyrics_transcriber/output/cdgmaker/transitions/fizzle.png +0 -0
  230. lyrics_transcriber/output/cdgmaker/transitions/largecentertexttoplogo.png +0 -0
  231. lyrics_transcriber/output/cdgmaker/transitions/rectangle.png +0 -0
  232. lyrics_transcriber/output/cdgmaker/transitions/spiral.png +0 -0
  233. lyrics_transcriber/output/cdgmaker/transitions/topleftmusicalnotes.png +0 -0
  234. lyrics_transcriber/output/cdgmaker/transitions/wipein.png +0 -0
  235. lyrics_transcriber/output/cdgmaker/transitions/wipeleft.png +0 -0
  236. lyrics_transcriber/output/cdgmaker/transitions/wipeout.png +0 -0
  237. lyrics_transcriber/output/cdgmaker/transitions/wiperight.png +0 -0
  238. lyrics_transcriber/output/cdgmaker/utils.py +132 -0
  239. lyrics_transcriber/output/countdown_processor.py +267 -0
  240. lyrics_transcriber/output/fonts/AvenirNext-Bold.ttf +0 -0
  241. lyrics_transcriber/output/fonts/DMSans-VariableFont_opsz,wght.ttf +0 -0
  242. lyrics_transcriber/output/fonts/DMSerifDisplay-Regular.ttf +0 -0
  243. lyrics_transcriber/output/fonts/Oswald-SemiBold.ttf +0 -0
  244. lyrics_transcriber/output/fonts/Zurich_Cn_BT_Bold.ttf +0 -0
  245. lyrics_transcriber/output/fonts/arial.ttf +0 -0
  246. lyrics_transcriber/output/fonts/georgia.ttf +0 -0
  247. lyrics_transcriber/output/fonts/verdana.ttf +0 -0
  248. lyrics_transcriber/output/generator.py +257 -0
  249. lyrics_transcriber/output/lrc_to_cdg.py +61 -0
  250. lyrics_transcriber/output/lyrics_file.py +102 -0
  251. lyrics_transcriber/output/plain_text.py +96 -0
  252. lyrics_transcriber/output/segment_resizer.py +431 -0
  253. lyrics_transcriber/output/subtitles.py +397 -0
  254. lyrics_transcriber/output/video.py +544 -0
  255. lyrics_transcriber/review/__init__.py +0 -0
  256. lyrics_transcriber/review/server.py +676 -0
  257. lyrics_transcriber/storage/__init__.py +0 -0
  258. lyrics_transcriber/storage/dropbox.py +225 -0
  259. lyrics_transcriber/transcribers/__init__.py +0 -0
  260. lyrics_transcriber/transcribers/audioshake.py +290 -0
  261. lyrics_transcriber/transcribers/base_transcriber.py +157 -0
  262. lyrics_transcriber/transcribers/whisper.py +330 -0
  263. lyrics_transcriber/types.py +648 -0
  264. lyrics_transcriber/utils/__init__.py +0 -0
  265. lyrics_transcriber/utils/word_utils.py +27 -0
  266. karaoke_gen-0.57.0.dist-info/METADATA +0 -167
  267. karaoke_gen-0.57.0.dist-info/RECORD +0 -23
  268. {karaoke_gen-0.57.0.dist-info → karaoke_gen-0.71.23.dist-info/licenses}/LICENSE +0 -0
@@ -0,0 +1,212 @@
1
+ """Refactored LangChain-based provider bridge using composition.
2
+
3
+ This is a much cleaner version that delegates to specialized components:
4
+ - ModelFactory: Creates ChatModels
5
+ - CircuitBreaker: Manages failure state
6
+ - ResponseParser: Parses responses
7
+ - RetryExecutor: Handles retry logic
8
+ - ResponseCache: Caches LLM responses to avoid redundant calls
9
+
10
+ Each component has a single responsibility and is independently testable.
11
+ """
12
+ from __future__ import annotations
13
+
14
+ import logging
15
+ import os
16
+ from typing import List, Dict, Any, Optional
17
+ from datetime import datetime
18
+
19
+ from .base import BaseAIProvider
20
+ from .config import ProviderConfig
21
+ from .model_factory import ModelFactory
22
+ from .circuit_breaker import CircuitBreaker
23
+ from .response_parser import ResponseParser
24
+ from .retry_executor import RetryExecutor
25
+ from .response_cache import ResponseCache
26
+ from .constants import (
27
+ PROMPT_LOG_LENGTH,
28
+ RESPONSE_LOG_LENGTH,
29
+ CIRCUIT_OPEN_ERROR,
30
+ MODEL_INIT_ERROR,
31
+ PROVIDER_ERROR,
32
+ )
33
+
34
+ logger = logging.getLogger(__name__)
35
+
36
+
37
class LangChainBridge(BaseAIProvider):
    """Provider bridge using LangChain ChatModels with reliability patterns.

    This bridge delegates to specialized components rather than implementing
    everything itself, which follows the Single Responsibility Principle and
    keeps each piece independently testable.

    Components:
    - ModelFactory: Creates and configures ChatModels
    - CircuitBreaker: Protects against cascading failures
    - ResponseParser: Handles JSON/raw response parsing
    - RetryExecutor: Implements exponential backoff
    - ResponseCache: Caches raw LLM responses to avoid redundant calls
    """

    def __init__(
        self,
        model: str,
        config: ProviderConfig | None = None,
        model_factory: ModelFactory | None = None,
        circuit_breaker: CircuitBreaker | None = None,
        response_parser: ResponseParser | None = None,
        retry_executor: RetryExecutor | None = None,
        response_cache: ResponseCache | None = None,
    ):
        """Initialize the bridge with components (dependency injection).

        Args:
            model: Model identifier in format "provider/model"
            config: Provider configuration (creates default if None)
            model_factory: Factory for creating ChatModels (creates default if None)
            circuit_breaker: Circuit breaker instance (creates default if None)
            response_parser: Response parser instance (creates default if None)
            retry_executor: Retry executor instance (creates default if None)
            response_cache: Response cache instance (creates default if None)
        """
        self._model = model
        self._config = config or ProviderConfig.from_env()

        # Dependency injection with sensible defaults
        self._factory = model_factory or ModelFactory()
        self._circuit_breaker = circuit_breaker or CircuitBreaker(self._config)
        self._parser = response_parser or ResponseParser()
        self._executor = retry_executor or RetryExecutor(self._config)

        # Initialize cache (enabled by default, can be disabled via DISABLE_LLM_CACHE=1)
        cache_enabled = os.getenv("DISABLE_LLM_CACHE", "0").lower() not in {"1", "true", "yes"}
        self._cache = response_cache or ResponseCache(
            cache_dir=self._config.cache_dir,
            enabled=cache_enabled,
        )

        # Lazy-initialized chat model
        self._chat_model: Optional[Any] = None
        # Langfuse session id for the current generate_correction_proposals()
        # call. Fix: the original created this attribute ad-hoc inside
        # generate_correction_proposals, forcing a hasattr() check in
        # _invoke_model; declaring it here removes that.
        self._session_id: Optional[str] = None

    def name(self) -> str:
        """Return provider name for logging."""
        return f"langchain:{self._model}"

    def generate_correction_proposals(
        self,
        prompt: str,
        schema: Dict[str, Any],
        session_id: str | None = None,
    ) -> List[Dict[str, Any]]:
        """Generate correction proposals using LangChain ChatModel.

        Orchestrates the injected components: cache lookup, circuit-breaker
        check, lazy model creation, retried invocation, caching, and parsing.

        Args:
            prompt: The correction prompt
            schema: Pydantic schema for structured output (for future use)
            session_id: Optional Langfuse session ID for grouping traces

        Returns:
            List of correction proposal dictionaries, or error dicts on failure
        """
        # Store session_id for use in _invoke_model
        self._session_id = session_id

        # Step 0: Check cache first. Fix: compare against None so an empty
        # (but valid) cached response still counts as a hit and does not
        # trigger a fresh LLM call.
        cached_response = self._cache.get(prompt, self._model)
        if cached_response is not None:
            parsed = self._parser.parse(cached_response)
            logger.debug(f"🎯 Using cached response ({len(parsed)} items)")
            return parsed

        # Step 1: Check circuit breaker
        if self._circuit_breaker.is_open(self._model):
            open_until = self._circuit_breaker.get_open_until(self._model)
            return [{
                "error": CIRCUIT_OPEN_ERROR,
                "until": open_until
            }]

        # Step 2: Get or create chat model (lazy; init failures trip the breaker)
        if not self._chat_model:
            try:
                self._chat_model = self._factory.create_chat_model(
                    self._model,
                    self._config
                )
            except Exception as e:
                self._circuit_breaker.record_failure(self._model)
                logger.error(f"🤖 Failed to initialize chat model: {e}")
                return [{
                    "error": MODEL_INIT_ERROR,
                    "message": str(e)
                }]

        # Step 3: Execute with retry logic
        logger.debug(
            f"🤖 [LangChain] Sending prompt to {self._model}: "
            f"{prompt[:PROMPT_LOG_LENGTH]}..."
        )

        result = self._executor.execute_with_retry(
            operation=lambda: self._invoke_model(prompt),
            operation_name=f"invoke_{self._model}"
        )

        # Step 4: Handle result and update circuit breaker. Guard clause on
        # failure keeps the success path flat.
        if not result.success:
            self._circuit_breaker.record_failure(self._model)
            return [{
                "error": PROVIDER_ERROR,
                "message": result.error or "unknown"
            }]

        self._circuit_breaker.record_success(self._model)

        logger.info(
            f"🤖 [LangChain] Got response from {self._model}: "
            f"{result.value[:RESPONSE_LOG_LENGTH]}..."
        )

        # Step 5: Cache the raw response for future use.
        # Fix: datetime.utcnow() is deprecated (Python 3.12+) and produces a
        # naive timestamp; use an aware UTC timestamp instead. Local import
        # keeps the module's import block untouched.
        from datetime import timezone

        self._cache.set(
            prompt=prompt,
            model=self._model,
            response=result.value,
            metadata={
                "session_id": session_id,
                "timestamp": datetime.now(timezone.utc).isoformat()
            }
        )

        # Step 6: Parse response
        return self._parser.parse(result.value)

    def _invoke_model(self, prompt: str) -> str:
        """Invoke the chat model with a prompt.

        This is a simple wrapper that can be passed to the retry executor.

        Args:
            prompt: The prompt to send

        Returns:
            Response content as string

        Raises:
            Exception: Any error from the model invocation
        """
        from langchain_core.messages import HumanMessage

        # Prepare config with session_id in metadata (Langfuse format).
        # _session_id is always defined (set in __init__), so no hasattr()
        # check is needed.
        config: Dict[str, Any] = {}
        if self._session_id:
            config["metadata"] = {"langfuse_session_id": self._session_id}
            logger.debug(f"🤖 [LangChain] Invoking with session_id: {self._session_id}")

        response = self._chat_model.invoke([HumanMessage(content=prompt)], config=config)
        return response.content
@@ -0,0 +1,209 @@
1
+ """Factory for creating LangChain ChatModels with Langfuse callbacks."""
2
+ from __future__ import annotations
3
+
4
+ import logging
5
+ import os
6
+ from typing import Any, Optional, List
7
+
8
+ from .config import ProviderConfig
9
+
10
+ logger = logging.getLogger(__name__)
11
+
12
+
13
+ class ModelFactory:
14
+ """Creates and configures LangChain ChatModels with observability.
15
+
16
+ This factory handles:
17
+ - Parsing model specifications ("provider/model" format)
18
+ - Creating Langfuse callbacks when configured
19
+ - Instantiating the appropriate ChatModel for each provider
20
+
21
+ Single Responsibility: Model creation only, no execution or state management.
22
+ """
23
+
24
+ def __init__(self):
25
+ self._langfuse_handler: Optional[Any] = None
26
+ self._langfuse_initialized = False
27
+
28
+ def create_chat_model(self, model_spec: str, config: ProviderConfig) -> Any:
29
+ """Create a ChatModel from a model specification.
30
+
31
+ Args:
32
+ model_spec: Model identifier in format "provider/model"
33
+ e.g. "ollama/gpt-oss:latest", "openai/gpt-4"
34
+ config: Provider configuration with timeouts, retries, etc.
35
+
36
+ Returns:
37
+ Configured LangChain ChatModel instance
38
+
39
+ Raises:
40
+ ValueError: If model_spec format is invalid or provider unsupported
41
+ """
42
+ provider, model_name = self._parse_model_spec(model_spec)
43
+ callbacks = self._create_callbacks(model_spec)
44
+ return self._instantiate_model(provider, model_name, callbacks, config)
45
+
46
+ def _parse_model_spec(self, spec: str) -> tuple[str, str]:
47
+ """Parse model specification into provider and model name.
48
+
49
+ Args:
50
+ spec: Model spec in format "provider/model"
51
+
52
+ Returns:
53
+ Tuple of (provider, model_name)
54
+
55
+ Raises:
56
+ ValueError: If format is invalid
57
+ """
58
+ parts = spec.split("/", 1)
59
+ if len(parts) != 2:
60
+ raise ValueError(
61
+ f"Model spec must be in format 'provider/model', got: {spec}"
62
+ )
63
+ return parts[0], parts[1]
64
+
65
+ def _create_callbacks(self, model_spec: str) -> List[Any]:
66
+ """Create Langfuse callback handlers if configured.
67
+
68
+ Args:
69
+ model_spec: Model specification for logging
70
+
71
+ Returns:
72
+ List of callback handlers (may be empty)
73
+ """
74
+ # Only initialize Langfuse once
75
+ if not self._langfuse_initialized:
76
+ self._initialize_langfuse(model_spec)
77
+ self._langfuse_initialized = True
78
+
79
+ return [self._langfuse_handler] if self._langfuse_handler else []
80
+
81
+ def _initialize_langfuse(self, model_spec: str) -> None:
82
+ """Initialize Langfuse callback handler if keys are present.
83
+
84
+ Langfuse reads credentials from environment variables automatically:
85
+ - LANGFUSE_PUBLIC_KEY
86
+ - LANGFUSE_SECRET_KEY
87
+ - LANGFUSE_HOST (optional)
88
+
89
+ Args:
90
+ model_spec: Model specification for logging
91
+
92
+ Raises:
93
+ RuntimeError: If Langfuse keys are set but initialization fails
94
+ """
95
+ public_key = os.getenv("LANGFUSE_PUBLIC_KEY")
96
+ secret_key = os.getenv("LANGFUSE_SECRET_KEY")
97
+
98
+ if not (public_key and secret_key):
99
+ logger.debug("🤖 Langfuse keys not found, tracing disabled")
100
+ return
101
+
102
+ try:
103
+ from langfuse import Langfuse
104
+ from langfuse.langchain import CallbackHandler
105
+
106
+ # Initialize Langfuse client first (this is required!)
107
+ langfuse_client = Langfuse(
108
+ public_key=public_key,
109
+ secret_key=secret_key,
110
+ host=os.getenv("LANGFUSE_HOST", "https://cloud.langfuse.com"),
111
+ )
112
+
113
+ # Then create callback handler with the same public_key
114
+ # The handler will use the initialized client
115
+ self._langfuse_handler = CallbackHandler(public_key=public_key)
116
+ logger.info(f"🤖 Langfuse callback handler initialized for {model_spec}")
117
+ except Exception as e:
118
+ # If Langfuse keys are set, we MUST fail fast
119
+ raise RuntimeError(
120
+ f"Langfuse keys are set but initialization failed: {e}\n"
121
+ f"This indicates a configuration or dependency problem.\n"
122
+ f"Check:\n"
123
+ f" - LANGFUSE_PUBLIC_KEY: {public_key[:10]}...\n"
124
+ f" - LANGFUSE_SECRET_KEY: {'set' if secret_key else 'not set'}\n"
125
+ f" - LANGFUSE_HOST: {os.getenv('LANGFUSE_HOST', 'default')}\n"
126
+ f" - langfuse package version: pip show langfuse"
127
+ ) from e
128
+
129
+ def _instantiate_model(
130
+ self,
131
+ provider: str,
132
+ model_name: str,
133
+ callbacks: List[Any],
134
+ config: ProviderConfig
135
+ ) -> Any:
136
+ """Instantiate the appropriate ChatModel for the provider.
137
+
138
+ Args:
139
+ provider: Provider name (ollama, openai, anthropic)
140
+ model_name: Model name within that provider
141
+ callbacks: List of callback handlers
142
+ config: Provider configuration
143
+
144
+ Returns:
145
+ Configured ChatModel instance
146
+
147
+ Raises:
148
+ ValueError: If provider is not supported
149
+ ImportError: If provider package is not installed
150
+ """
151
+ try:
152
+ if provider == "ollama":
153
+ return self._create_ollama_model(model_name, callbacks, config)
154
+ elif provider == "openai":
155
+ return self._create_openai_model(model_name, callbacks, config)
156
+ elif provider == "anthropic":
157
+ return self._create_anthropic_model(model_name, callbacks, config)
158
+ else:
159
+ raise ValueError(f"Unsupported provider: {provider}")
160
+ except ImportError as e:
161
+ raise ImportError(
162
+ f"Failed to import {provider} provider. "
163
+ f"Install with: pip install langchain-{provider}"
164
+ ) from e
165
+
166
+ def _create_ollama_model(
167
+ self, model_name: str, callbacks: List[Any], config: ProviderConfig
168
+ ) -> Any:
169
+ """Create ChatOllama model."""
170
+ from langchain_ollama import ChatOllama
171
+
172
+ model = ChatOllama(
173
+ model=model_name,
174
+ timeout=config.request_timeout_seconds,
175
+ callbacks=callbacks,
176
+ )
177
+ logger.debug(f"🤖 Created Ollama model: {model_name}")
178
+ return model
179
+
180
+ def _create_openai_model(
181
+ self, model_name: str, callbacks: List[Any], config: ProviderConfig
182
+ ) -> Any:
183
+ """Create ChatOpenAI model."""
184
+ from langchain_openai import ChatOpenAI
185
+
186
+ model = ChatOpenAI(
187
+ model=model_name,
188
+ timeout=config.request_timeout_seconds,
189
+ max_retries=config.max_retries,
190
+ callbacks=callbacks,
191
+ )
192
+ logger.debug(f"🤖 Created OpenAI model: {model_name}")
193
+ return model
194
+
195
+ def _create_anthropic_model(
196
+ self, model_name: str, callbacks: List[Any], config: ProviderConfig
197
+ ) -> Any:
198
+ """Create ChatAnthropic model."""
199
+ from langchain_anthropic import ChatAnthropic
200
+
201
+ model = ChatAnthropic(
202
+ model=model_name,
203
+ timeout=config.request_timeout_seconds,
204
+ max_retries=config.max_retries,
205
+ callbacks=callbacks,
206
+ )
207
+ logger.debug(f"🤖 Created Anthropic model: {model_name}")
208
+ return model
209
+
@@ -0,0 +1,218 @@
1
+ """Response caching for LLM calls to avoid redundant API requests."""
2
+
3
from __future__ import annotations

import hashlib
import json
import logging
from datetime import datetime, timedelta, timezone
from pathlib import Path
from typing import Any, Dict, Optional
11
+
12
+ logger = logging.getLogger(__name__)
13
+
14
+
15
class ResponseCache:
    """Disk-backed cache of LLM responses keyed by (model, prompt) hash.

    Caching lets callers reuse responses when iterating on frontend/UI
    changes without re-running expensive LLM inference calls.

    The cache is persisted as a single JSON file mapping the SHA-256 hex
    digest of ``"{model}::{prompt}"`` to an entry of the form::

        {
            "prompt": "prompt text (truncated for readability)",
            "response": "llm response",
            "timestamp": "ISO-8601 datetime (UTC)",
            "model": "model identifier",
            "metadata": {...}
        }
    """

    # Stored prompt text is truncated to this many characters so the JSON
    # cache file stays human-readable.
    _PROMPT_PREVIEW_CHARS = 500

    def __init__(self, cache_dir: str = "cache", enabled: bool = True):
        """Initialize the response cache and load existing entries from disk.

        Args:
            cache_dir: Directory to store the cache file (created if needed).
            enabled: Whether caching is enabled; when False, get() always
                misses and set() is a no-op.
        """
        self.cache_dir = Path(cache_dir)
        self.cache_dir.mkdir(parents=True, exist_ok=True)
        self.cache_file = self.cache_dir / "llm_response_cache.json"
        self.enabled = enabled
        self._cache: Dict[str, Dict[str, Any]] = {}
        self._load_cache()

    def _load_cache(self) -> None:
        """Load cache from disk; fall back to an empty cache on any failure."""
        self._cache = {}
        if not self.cache_file.exists():
            return

        try:
            with open(self.cache_file, 'r', encoding='utf-8') as f:
                loaded = json.load(f)
            # Guard against a corrupted file holding non-object JSON (e.g. a
            # list), which would crash later .values()/.items() calls.
            if isinstance(loaded, dict):
                self._cache = loaded
                logger.debug(f"📦 Loaded {len(self._cache)} cached responses")
            else:
                logger.warning("Cache file did not contain a JSON object; ignoring it")
        except Exception as e:
            logger.warning(f"Failed to load cache: {e}")
            self._cache = {}

    def _save_cache(self) -> None:
        """Persist the in-memory cache to disk (best-effort, logs on failure)."""
        try:
            with open(self.cache_file, 'w', encoding='utf-8') as f:
                json.dump(self._cache, f, indent=2, ensure_ascii=False)
            logger.debug(f"💾 Saved {len(self._cache)} cached responses")
        except Exception as e:
            logger.warning(f"Failed to save cache: {e}")

    def _compute_hash(self, prompt: str, model: str) -> str:
        """Compute the cache key for a prompt + model combination.

        Args:
            prompt: The full prompt text
            model: Model identifier

        Returns:
            SHA256 hash as hex string
        """
        # Include both prompt and model in the hash so the same prompt sent
        # to different models gets distinct entries.
        combined = f"{model}::{prompt}"
        return hashlib.sha256(combined.encode('utf-8')).hexdigest()

    @staticmethod
    def _parse_timestamp(value: Any) -> Optional[datetime]:
        """Parse a stored ISO timestamp, assuming UTC for naive values.

        Entries written by older versions used ``datetime.utcnow()`` and are
        therefore naive; attaching UTC makes them comparable with the aware
        datetimes this class now writes. Returns None for missing or
        malformed values so callers can simply skip them.
        """
        if not isinstance(value, str):
            return None
        try:
            parsed = datetime.fromisoformat(value)
        except ValueError:
            return None
        if parsed.tzinfo is None:
            parsed = parsed.replace(tzinfo=timezone.utc)
        return parsed

    def get(self, prompt: str, model: str) -> Optional[str]:
        """Get the cached response for a prompt/model pair if available.

        Args:
            prompt: The prompt text
            model: Model identifier

        Returns:
            Cached response string, or None on a miss or when disabled.
        """
        if not self.enabled:
            return None

        prompt_hash = self._compute_hash(prompt, model)
        cached = self._cache.get(prompt_hash)
        if cached is not None:
            logger.info(f"🎯 Cache HIT for {model} (hash: {prompt_hash[:8]}...)")
            logger.debug(f"   Cached at: {cached.get('timestamp')}")
            return cached.get('response')

        logger.debug(f"📭 Cache MISS for {model} (hash: {prompt_hash[:8]}...)")
        return None

    def set(
        self,
        prompt: str,
        model: str,
        response: str,
        metadata: Optional[Dict[str, Any]] = None
    ) -> None:
        """Store a response in the cache and persist it to disk.

        Args:
            prompt: The prompt text
            model: Model identifier
            response: The LLM response
            metadata: Optional metadata to store with the cache entry
        """
        if not self.enabled:
            return

        prompt_hash = self._compute_hash(prompt, model)
        limit = self._PROMPT_PREVIEW_CHARS
        self._cache[prompt_hash] = {
            # Truncate the stored prompt so the JSON file stays readable.
            "prompt": prompt[:limit] + "..." if len(prompt) > limit else prompt,
            "response": response,
            # Timezone-aware UTC; datetime.utcnow() is deprecated (3.12+).
            "timestamp": datetime.now(timezone.utc).isoformat(),
            "model": model,
            "metadata": metadata or {}
        }

        # Save to disk immediately so the entry persists across runs.
        self._save_cache()
        logger.debug(f"💾 Cached response for {model} (hash: {prompt_hash[:8]}...)")

    def clear(self) -> int:
        """Clear all cached responses and persist the empty cache.

        Returns:
            Number of entries cleared
        """
        count = len(self._cache)
        self._cache = {}
        self._save_cache()
        logger.info(f"🗑️ Cleared {count} cached responses")
        return count

    def get_stats(self) -> Dict[str, Any]:
        """Return summary statistics about the cache contents.

        Returns:
            Dictionary with total and per-model entry counts, oldest/newest
            timestamps, the cache file path, and the enabled flag.
        """
        if not self._cache:
            return {
                "total_entries": 0,
                "cache_file": str(self.cache_file),
                "enabled": self.enabled
            }

        # Count entries by model.
        by_model: Dict[str, int] = {}
        for entry in self._cache.values():
            model = entry.get('model', 'unknown')
            by_model[model] = by_model.get(model, 0) + 1

        # Malformed or missing timestamps are skipped rather than letting a
        # single bad entry crash the whole stats call.
        timestamps = [
            ts
            for ts in (
                self._parse_timestamp(entry.get('timestamp'))
                for entry in self._cache.values()
            )
            if ts is not None
        ]

        return {
            "total_entries": len(self._cache),
            "by_model": by_model,
            "oldest": min(timestamps).isoformat() if timestamps else None,
            "newest": max(timestamps).isoformat() if timestamps else None,
            "cache_file": str(self.cache_file),
            "enabled": self.enabled
        }

    def prune_old_entries(self, days: int = 30) -> int:
        """Remove cache entries older than the specified number of days.

        Args:
            days: Remove entries older than this many days

        Returns:
            Number of entries removed
        """
        cutoff = datetime.now(timezone.utc) - timedelta(days=days)

        # Entries with missing or unparseable timestamps are kept.
        to_remove = [
            prompt_hash
            for prompt_hash, entry in self._cache.items()
            if (ts := self._parse_timestamp(entry.get('timestamp'))) is not None
            and ts < cutoff
        ]

        for prompt_hash in to_remove:
            del self._cache[prompt_hash]

        if to_remove:
            self._save_cache()
            logger.info(f"🗑️ Pruned {len(to_remove)} old cache entries (older than {days} days)")

        return len(to_remove)
218
+