PyPI - lyrics-transcriber - Versions diffs - 0.30.0__py3-none-any.whl → 0.32.1__py3-none-any.whl - Mend

lyrics-transcriber 0.30.0__py3-none-any.whl → 0.32.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (88) hide show

lyrics_transcriber/__init__.py +2 -1
lyrics_transcriber/cli/{main.py → cli_main.py} +47 -14
lyrics_transcriber/core/config.py +35 -0
lyrics_transcriber/core/controller.py +164 -166
lyrics_transcriber/correction/anchor_sequence.py +471 -0
lyrics_transcriber/correction/corrector.py +256 -0
lyrics_transcriber/correction/handlers/__init__.py +0 -0
lyrics_transcriber/correction/handlers/base.py +30 -0
lyrics_transcriber/correction/handlers/extend_anchor.py +91 -0
lyrics_transcriber/correction/handlers/levenshtein.py +147 -0
lyrics_transcriber/correction/handlers/no_space_punct_match.py +98 -0
lyrics_transcriber/correction/handlers/relaxed_word_count_match.py +55 -0
lyrics_transcriber/correction/handlers/repeat.py +71 -0
lyrics_transcriber/correction/handlers/sound_alike.py +223 -0
lyrics_transcriber/correction/handlers/syllables_match.py +182 -0
lyrics_transcriber/correction/handlers/word_count_match.py +54 -0
lyrics_transcriber/correction/handlers/word_operations.py +135 -0
lyrics_transcriber/correction/phrase_analyzer.py +426 -0
lyrics_transcriber/correction/text_utils.py +30 -0
lyrics_transcriber/lyrics/base_lyrics_provider.py +125 -0
lyrics_transcriber/lyrics/genius.py +73 -0
lyrics_transcriber/lyrics/spotify.py +82 -0
lyrics_transcriber/output/ass/__init__.py +21 -0
lyrics_transcriber/output/{ass.py → ass/ass.py} +150 -690
lyrics_transcriber/output/ass/ass_specs.txt +732 -0
lyrics_transcriber/output/ass/config.py +37 -0
lyrics_transcriber/output/ass/constants.py +23 -0
lyrics_transcriber/output/ass/event.py +94 -0
lyrics_transcriber/output/ass/formatters.py +132 -0
lyrics_transcriber/output/ass/lyrics_line.py +219 -0
lyrics_transcriber/output/ass/lyrics_screen.py +252 -0
lyrics_transcriber/output/ass/section_detector.py +89 -0
lyrics_transcriber/output/ass/section_screen.py +106 -0
lyrics_transcriber/output/ass/style.py +187 -0
lyrics_transcriber/output/cdg.py +503 -0
lyrics_transcriber/output/cdgmaker/__init__.py +0 -0
lyrics_transcriber/output/cdgmaker/cdg.py +262 -0
lyrics_transcriber/output/cdgmaker/composer.py +1919 -0
lyrics_transcriber/output/cdgmaker/config.py +151 -0
lyrics_transcriber/output/cdgmaker/images/instrumental.png +0 -0
lyrics_transcriber/output/cdgmaker/images/intro.png +0 -0
lyrics_transcriber/output/cdgmaker/pack.py +507 -0
lyrics_transcriber/output/cdgmaker/render.py +346 -0
lyrics_transcriber/output/cdgmaker/transitions/centertexttoplogobottomtext.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/circlein.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/circleout.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/fizzle.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/largecentertexttoplogo.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/rectangle.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/spiral.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/topleftmusicalnotes.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/wipein.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/wipeleft.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/wipeout.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/wiperight.png +0 -0
lyrics_transcriber/output/cdgmaker/utils.py +132 -0
lyrics_transcriber/output/fonts/AvenirNext-Bold.ttf +0 -0
lyrics_transcriber/output/fonts/DMSans-VariableFont_opsz,wght.ttf +0 -0
lyrics_transcriber/output/fonts/DMSerifDisplay-Regular.ttf +0 -0
lyrics_transcriber/output/fonts/Oswald-SemiBold.ttf +0 -0
lyrics_transcriber/output/fonts/Zurich_Cn_BT_Bold.ttf +0 -0
lyrics_transcriber/output/fonts/arial.ttf +0 -0
lyrics_transcriber/output/fonts/georgia.ttf +0 -0
lyrics_transcriber/output/fonts/verdana.ttf +0 -0
lyrics_transcriber/output/generator.py +140 -171
lyrics_transcriber/output/lyrics_file.py +102 -0
lyrics_transcriber/output/plain_text.py +91 -0
lyrics_transcriber/output/segment_resizer.py +416 -0
lyrics_transcriber/output/subtitles.py +328 -302
lyrics_transcriber/output/video.py +219 -0
lyrics_transcriber/review/__init__.py +1 -0
lyrics_transcriber/review/server.py +138 -0
lyrics_transcriber/storage/dropbox.py +110 -134
lyrics_transcriber/transcribers/audioshake.py +171 -105
lyrics_transcriber/transcribers/base_transcriber.py +149 -0
lyrics_transcriber/transcribers/whisper.py +267 -133
lyrics_transcriber/types.py +454 -0
{lyrics_transcriber-0.30.0.dist-info → lyrics_transcriber-0.32.1.dist-info}/METADATA +14 -3
lyrics_transcriber-0.32.1.dist-info/RECORD +86 -0
{lyrics_transcriber-0.30.0.dist-info → lyrics_transcriber-0.32.1.dist-info}/WHEEL +1 -1
lyrics_transcriber-0.32.1.dist-info/entry_points.txt +4 -0
lyrics_transcriber/core/corrector.py +0 -56
lyrics_transcriber/core/fetcher.py +0 -143
lyrics_transcriber/storage/tokens.py +0 -116
lyrics_transcriber/transcribers/base.py +0 -31
lyrics_transcriber-0.30.0.dist-info/RECORD +0 -22
lyrics_transcriber-0.30.0.dist-info/entry_points.txt +0 -3
{lyrics_transcriber-0.30.0.dist-info → lyrics_transcriber-0.32.1.dist-info}/LICENSE +0 -0

lyrics_transcriber/__init__.py CHANGED Viewed

@@ -1,3 +1,4 @@
-from .core.controller import LyricsTranscriber, TranscriberConfig, LyricsConfig, OutputConfig
+from lyrics_transcriber.core.config import TranscriberConfig, LyricsConfig, OutputConfig
+from lyrics_transcriber.core.controller import LyricsTranscriber
 __all__ = ["LyricsTranscriber", "TranscriberConfig", "LyricsConfig", "OutputConfig"]

lyrics_transcriber/cli/{main.py → cli_main.py} RENAMED Viewed

@@ -60,9 +60,14 @@ def create_arg_parser() -> argparse.ArgumentParser:
     output_group.add_argument(
         "--cache_dir",
         type=Path,
-        default=Path("/tmp/lyrics-transcriber-cache/"),
         help="Directory to cache downloaded/generated files. Default: /tmp/lyrics-transcriber-cache/",
     )
+    output_group.add_argument(
+        "--output_styles_json",
+        type=Path,
+        help="JSON file containing output style configurations for CDG and video generation",
+    )
+    output_group.add_argument("--generate_cdg", action="store_true", help="Generate CDG karaoke files")
     # Video options
     video_group = parser.add_argument_group("Video Options")
@@ -70,16 +75,22 @@ def create_arg_parser() -> argparse.ArgumentParser:
     video_group.add_argument(
         "--video_resolution", choices=["4k", "1080p", "720p", "360p"], default="360p", help="Resolution of the karaoke video. Default: 360p"
     )
-    video_group.add_argument("--video_background_image", type=Path, help="Image file to use for karaoke video background")
-    video_group.add_argument(
-        "--video_background_color",
-        default="black",
-        help="Color for karaoke video background (hex format or FFmpeg color name). Default: black",
-    )
     return parser
+def parse_args(parser: argparse.ArgumentParser, args_list: list[str] | None = None) -> argparse.Namespace:
+    """Parse and process command line arguments."""
+    # Use provided args_list for testing, otherwise use sys.argv
+    args = parser.parse_args(args_list)
+    # Set default cache_dir if not provided
+    if not hasattr(args, "cache_dir") or args.cache_dir is None:
+        args.cache_dir = Path(os.getenv("LYRICS_TRANSCRIBER_CACHE_DIR", "/tmp/lyrics-transcriber-cache/"))
+    return args
 def get_config_from_env() -> Dict[str, str]:
     """Load configuration from environment variables."""
     load_dotenv()
@@ -121,12 +132,12 @@ def create_configs(args: argparse.Namespace, env_config: Dict[str, str]) -> tupl
     )
     output_config = OutputConfig(
-        output_dir=str(args.output_dir) if args.output_dir else None,
+        output_styles_json=str(args.output_styles_json),
+        output_dir=str(args.output_dir) if args.output_dir else os.getcwd(),
         cache_dir=str(args.cache_dir),
         render_video=args.render_video,
+        generate_cdg=args.generate_cdg,
         video_resolution=args.video_resolution,
-        video_background_image=str(args.video_background_image) if args.video_background_image else None,
-        video_background_color=args.video_background_color,
     )
     return transcriber_config, lyrics_config, output_config
@@ -151,7 +162,7 @@ def validate_args(args: argparse.Namespace, parser: argparse.ArgumentParser, log
 def main() -> None:
     """Main entry point for the CLI."""
     parser = create_arg_parser()
-    args = parser.parse_args()
+    args = parse_args(parser)
     # Set up logging first
     logger = setup_logging(args.log_level)
@@ -182,13 +193,35 @@ def main() -> None:
         # Log results
         logger.info("*** Success! ***")
+        # Log all generated output files
+        if results.original_txt:
+            logger.info(f"Generated original transcription: {results.original_txt}")
+        if results.corrections_json:
+            logger.info(f"Generated corrections data: {results.corrections_json}")
+        if results.corrected_txt:
+            logger.info(f"Generated corrected lyrics: {results.corrected_txt}")
         if results.lrc_filepath:
             logger.info(f"Generated LRC file: {results.lrc_filepath}")
+        if results.cdg_filepath:
+            logger.info(f"Generated CDG file: {results.cdg_filepath}")
+        if results.mp3_filepath:
+            logger.info(f"Generated MP3 file: {results.mp3_filepath}")
+        if results.cdg_zip_filepath:
+            logger.info(f"Generated CDG ZIP archive: {results.cdg_zip_filepath}")
         if results.ass_filepath:
-            logger.info(f"Generated ASS file: {results.ass_filepath}")
+            logger.info(f"Generated ASS subtitles: {results.ass_filepath}")
         if results.video_filepath:
-            logger.info(f"Generated video file: {results.video_filepath}")
+            logger.info(f"Generated video: {results.video_filepath}")
     except Exception as e:
-        logger.error(f"Processing failed: {str(e)}")
+        # Get the full exception traceback
+        import traceback
+        error_details = traceback.format_exc()
+        # Log both the error message and the full traceback
+        logger.error(f"Processing failed: {str(e)}\n\nFull traceback:\n{error_details}")
         exit(1)

lyrics_transcriber/core/config.py ADDED Viewed

@@ -0,0 +1,35 @@
+import os
+from dataclasses import dataclass, field
+from typing import Any, Dict, Optional
+@dataclass
+class TranscriberConfig:
+    """Configuration for transcription services."""
+    audioshake_api_token: Optional[str] = None
+    runpod_api_key: Optional[str] = None
+    whisper_runpod_id: Optional[str] = None
+@dataclass
+class LyricsConfig:
+    """Configuration for lyrics services."""
+    genius_api_token: Optional[str] = None
+    spotify_cookie: Optional[str] = None
+@dataclass
+class OutputConfig:
+    """Configuration for output generation."""
+    output_styles_json: str
+    max_line_length: int = 36
+    styles: Dict[str, Any] = field(default_factory=dict)
+    output_dir: Optional[str] = os.getcwd()
+    cache_dir: str = os.getenv("LYRICS_TRANSCRIBER_CACHE_DIR", "/tmp/lyrics-transcriber-cache/")
+    render_video: bool = False
+    generate_cdg: bool = False
+    video_resolution: str = "360p"
+    enable_review: bool = True

lyrics_transcriber/core/controller.py CHANGED Viewed

@@ -1,65 +1,44 @@
 import os
 import logging
-from dataclasses import dataclass
+from dataclasses import dataclass, field
 from typing import Dict, Optional, List
-from ..transcribers.base import BaseTranscriber
-from ..transcribers.audioshake import AudioShakeTranscriber
-from ..transcribers.whisper import WhisperTranscriber
-from .fetcher import LyricsFetcher
-from ..output.generator import OutputGenerator
-from .corrector import LyricsTranscriptionCorrector
+from lyrics_transcriber.types import (
+    LyricsData,
+    TranscriptionResult,
+    CorrectionResult,
+)
+from lyrics_transcriber.transcribers.base_transcriber import BaseTranscriber
+from lyrics_transcriber.transcribers.audioshake import AudioShakeTranscriber, AudioShakeConfig
+from lyrics_transcriber.transcribers.whisper import WhisperTranscriber, WhisperConfig
+from lyrics_transcriber.lyrics.base_lyrics_provider import BaseLyricsProvider, LyricsProviderConfig
+from lyrics_transcriber.lyrics.genius import GeniusProvider
+from lyrics_transcriber.lyrics.spotify import SpotifyProvider
+from lyrics_transcriber.output.generator import OutputGenerator
+from lyrics_transcriber.correction.corrector import LyricsCorrector
+from lyrics_transcriber.core.config import TranscriberConfig, LyricsConfig, OutputConfig
 @dataclass
-class TranscriberConfig:
-    """Configuration for transcription services."""
-    audioshake_api_token: Optional[str] = None
-    runpod_api_key: Optional[str] = None
-    whisper_runpod_id: Optional[str] = None
-@dataclass
-class LyricsConfig:
-    """Configuration for lyrics services."""
-    genius_api_token: Optional[str] = None
-    spotify_cookie: Optional[str] = None
-@dataclass
-class OutputConfig:
-    """Configuration for output generation."""
-    output_dir: Optional[str] = None
-    cache_dir: str = "/tmp/lyrics-transcriber-cache/"
-    render_video: bool = False
-    video_resolution: str = "360p"
-    video_background_image: Optional[str] = None
-    video_background_color: str = "black"
-@dataclass
-class TranscriptionResult:
+class LyricsControllerResult:
     """Holds the results of the transcription and correction process."""
-    # Lyrics from internet sources
-    lyrics_text: Optional[str] = None
-    lyrics_source: Optional[str] = None
-    lyrics_genius: Optional[str] = None
-    lyrics_spotify: Optional[str] = None
-    spotify_lyrics_data: Optional[Dict] = None
+    # Results from different sources
+    lyrics_results: List[LyricsData] = field(default_factory=list)
+    transcription_results: List[TranscriptionResult] = field(default_factory=list)
-    # Transcription results
-    transcription_whisper: Optional[Dict] = None
-    transcription_audioshake: Optional[Dict] = None
-    transcription_primary: Optional[Dict] = None
-    transcription_corrected: Optional[Dict] = None
+    # Corrected results
+    transcription_corrected: Optional[CorrectionResult] = None
     # Output files
     lrc_filepath: Optional[str] = None
     ass_filepath: Optional[str] = None
     video_filepath: Optional[str] = None
+    mp3_filepath: Optional[str] = None
+    cdg_filepath: Optional[str] = None
+    cdg_zip_filepath: Optional[str] = None
+    original_txt: Optional[str] = None
+    corrected_txt: Optional[str] = None
+    corrections_json: Optional[str] = None
 class LyricsTranscriber:
@@ -79,8 +58,9 @@ class LyricsTranscriber:
         transcriber_config: Optional[TranscriberConfig] = None,
         lyrics_config: Optional[LyricsConfig] = None,
         output_config: Optional[OutputConfig] = None,
-        lyrics_fetcher: Optional[LyricsFetcher] = None,
-        corrector: Optional[LyricsTranscriptionCorrector] = None,
+        transcribers: Optional[Dict[str, BaseTranscriber]] = None,
+        lyrics_providers: Optional[Dict[str, BaseLyricsProvider]] = None,
+        corrector: Optional[LyricsCorrector] = None,
         output_generator: Optional[OutputGenerator] = None,
         logger: Optional[logging.Logger] = None,
         log_level: int = logging.DEBUG,
@@ -109,175 +89,193 @@ class LyricsTranscriber:
         self.title = title
         self.output_prefix = f"{artist} - {title}" if artist and title else os.path.splitext(os.path.basename(audio_filepath))[0]
+        # Add after creating necessary folders
+        self.logger.debug(f"Using cache directory: {self.output_config.cache_dir}")
+        self.logger.debug(f"Using output directory: {self.output_config.output_dir}")
         # Create necessary folders
         os.makedirs(self.output_config.cache_dir, exist_ok=True)
-        if self.output_config.output_dir:
-            os.makedirs(self.output_config.output_dir, exist_ok=True)
+        os.makedirs(self.output_config.output_dir, exist_ok=True)
         # Initialize results
-        self.results = TranscriptionResult()
+        self.results = LyricsControllerResult()
         # Initialize components (with dependency injection)
-        self.transcribers = self._initialize_transcribers()
-        self.lyrics_fetcher = lyrics_fetcher or self._initialize_lyrics_fetcher()
-        self.corrector = corrector or LyricsTranscriptionCorrector(logger=self.logger)
+        self.transcribers = transcribers or self._initialize_transcribers()
+        self.lyrics_providers = lyrics_providers or self._initialize_lyrics_providers()
+        self.corrector = corrector or LyricsCorrector(cache_dir=self.output_config.cache_dir, logger=self.logger)
         self.output_generator = output_generator or self._initialize_output_generator()
     def _initialize_transcribers(self) -> Dict[str, BaseTranscriber]:
         """Initialize available transcription services."""
         transcribers = {}
+        # Add debug logging for config values
+        self.logger.debug(f"Initializing transcribers with config: {self.transcriber_config}")
+        self.logger.debug(f"Using cache directory for transcribers: {self.output_config.cache_dir}")
         if self.transcriber_config.audioshake_api_token:
-            transcribers["audioshake"] = AudioShakeTranscriber(api_token=self.transcriber_config.audioshake_api_token, logger=self.logger)
+            self.logger.debug("Initializing AudioShake transcriber")
+            transcribers["audioshake"] = {
+                "instance": AudioShakeTranscriber(
+                    cache_dir=self.output_config.cache_dir,
+                    config=AudioShakeConfig(api_token=self.transcriber_config.audioshake_api_token),
+                    logger=self.logger,
+                ),
+                "priority": 1,  # AudioShake has highest priority
+            }
+        else:
+            self.logger.debug("Skipping AudioShake transcriber - no API token provided")
         if self.transcriber_config.runpod_api_key and self.transcriber_config.whisper_runpod_id:
-            transcribers["whisper"] = WhisperTranscriber(
-                logger=self.logger,
-                runpod_api_key=self.transcriber_config.runpod_api_key,
-                endpoint_id=self.transcriber_config.whisper_runpod_id,
-            )
+            self.logger.debug("Initializing Whisper transcriber")
+            transcribers["whisper"] = {
+                "instance": WhisperTranscriber(
+                    cache_dir=self.output_config.cache_dir,
+                    config=WhisperConfig(
+                        runpod_api_key=self.transcriber_config.runpod_api_key, endpoint_id=self.transcriber_config.whisper_runpod_id
+                    ),
+                    logger=self.logger,
+                ),
+                "priority": 2,  # Whisper has lower priority
+            }
+        else:
+            self.logger.debug("Skipping Whisper transcriber - missing runpod_api_key or whisper_runpod_id")
         return transcribers
-    def _initialize_lyrics_fetcher(self) -> LyricsFetcher:
-        """Initialize lyrics fetching service."""
-        return LyricsFetcher(
-            genius_api_token=self.lyrics_config.genius_api_token, spotify_cookie=self.lyrics_config.spotify_cookie, logger=self.logger
+    def _initialize_lyrics_providers(self) -> Dict[str, BaseLyricsProvider]:
+        """Initialize available lyrics providers."""
+        providers = {}
+        # Create provider config with all necessary parameters
+        provider_config = LyricsProviderConfig(
+            genius_api_token=self.lyrics_config.genius_api_token,
+            spotify_cookie=self.lyrics_config.spotify_cookie,
+            cache_dir=self.output_config.cache_dir,
+            audio_filepath=self.audio_filepath,
         )
+        if provider_config.genius_api_token:
+            self.logger.debug("Initializing Genius lyrics provider")
+            providers["genius"] = GeniusProvider(config=provider_config, logger=self.logger)
+        else:
+            self.logger.debug("Skipping Genius provider - no API token provided")
+        if provider_config.spotify_cookie:
+            self.logger.debug("Initializing Spotify lyrics provider")
+            providers["spotify"] = SpotifyProvider(config=provider_config, logger=self.logger)
+        else:
+            self.logger.debug("Skipping Spotify provider - no cookie provided")
+        return providers
     def _initialize_output_generator(self) -> OutputGenerator:
         """Initialize output generation service."""
-        return OutputGenerator(
-            logger=self.logger,
-            output_dir=self.output_config.output_dir,
-            cache_dir=self.output_config.cache_dir,
-            video_resolution=self.output_config.video_resolution,
-            video_background_image=self.output_config.video_background_image,
-            video_background_color=self.output_config.video_background_color,
-        )
+        return OutputGenerator(config=self.output_config, logger=self.logger)
-    def process(self) -> TranscriptionResult:
+    def process(self) -> LyricsControllerResult:
         """
         Main processing method that orchestrates the entire workflow.
         Returns:
-            TranscriptionResult containing all outputs and generated files.
+            LyricsControllerResult containing all outputs and generated files.
         Raises:
             Exception: If a critical error occurs during processing.
         """
-        try:
-            # Step 1: Fetch lyrics if artist and title are provided
-            if self.artist and self.title:
-                self.fetch_lyrics()
-            # Step 2: Run transcription
-            self.transcribe()
+        # Step 1: Fetch lyrics if artist and title are provided
+        if self.artist and self.title:
+            self.fetch_lyrics()
-            # Step 3: Process and correct lyrics
-            if self.results.transcription_primary:
-                self.correct_lyrics()
+        # Step 2: Run transcription
+        self.transcribe()
-            # Step 4: Generate outputs
-            if self.results.transcription_corrected:
-                self.generate_outputs()
+        # Step 3: Process and correct lyrics
+        self.correct_lyrics()
-            self.logger.info("Processing completed successfully")
-            return self.results
+        # Step 4: Generate outputs
+        self.generate_outputs()
-        except Exception as e:
-            self.logger.error(f"Error during processing: {str(e)}")
-            raise
+        self.logger.info("Processing completed successfully")
+        return self.results
     def fetch_lyrics(self) -> None:
-        """Fetch lyrics from online sources."""
+        """Fetch lyrics from available providers."""
         self.logger.info(f"Fetching lyrics for {self.artist} - {self.title}")
-        try:
-            lyrics_result = self.lyrics_fetcher.fetch_lyrics(self.artist, self.title)
-            # Update results
-            self.results.lyrics_text = lyrics_result["lyrics"]
-            self.results.lyrics_source = lyrics_result["source"]
-            self.results.lyrics_genius = lyrics_result["genius_lyrics"]
-            self.results.lyrics_spotify = lyrics_result["spotify_lyrics"]
-            self.results.spotify_lyrics_data = lyrics_result.get("spotify_lyrics_data")
+        for name, provider in self.lyrics_providers.items():
+            try:
+                result = provider.fetch_lyrics(self.artist, self.title)
+                if result:
+                    self.results.lyrics_results.append(result)
+                    self.logger.info(f"Successfully fetched lyrics from {name}")
-            if lyrics_result["lyrics"]:
-                self.logger.info(f"Successfully fetched lyrics from {lyrics_result['source']}")
-            else:
-                self.logger.warning("No lyrics found from any source")
+            except Exception as e:
+                self.logger.error(f"Failed to fetch lyrics from {name}: {str(e)}")
+                continue
-        except Exception as e:
-            self.logger.error(f"Failed to fetch lyrics: {str(e)}")
-            # Don't raise - we can continue without lyrics
+        if not self.results.lyrics_results:
+            self.logger.warning("No lyrics found from any source")
     def transcribe(self) -> None:
         """Run transcription using all available transcribers."""
-        self.logger.info("Starting transcription process")
-        for name, transcriber in self.transcribers.items():
-            try:
-                result = transcriber.transcribe(self.audio_filepath)
+        self.logger.info(f"Starting transcription with providers: {list(self.transcribers.keys())}")
-                # Store result based on transcriber type
-                if name == "whisper":
-                    self.results.transcription_whisper = result
-                elif name == "audioshake":
-                    self.results.transcription_audioshake = result
+        for name, transcriber_info in self.transcribers.items():
+            self.logger.info(f"Running transcription with {name}")
+            result = transcriber_info["instance"].transcribe(self.audio_filepath)
+            if result:
+                # Add the transcriber name and priority to the result
+                self.results.transcription_results.append(
+                    TranscriptionResult(name=name, priority=transcriber_info["priority"], result=result)
+                )
+                self.logger.debug(f"Transcription completed for {name}")
-                # Use first successful transcription as primary
-                if not self.results.transcription_primary:
-                    self.results.transcription_primary = result
-            except Exception as e:
-                self.logger.error(f"Transcription failed for {name}: {str(e)}")
-                continue
+        if not self.results.transcription_results:
+            self.logger.warning("No successful transcriptions from any provider")
     def correct_lyrics(self) -> None:
         """Run lyrics correction using transcription and internet lyrics."""
         self.logger.info("Starting lyrics correction process")
-        try:
-            # Set input data for correction
-            self.corrector.set_input_data(
-                spotify_lyrics_data_dict=self.results.spotify_lyrics_data,
-                spotify_lyrics_text=self.results.lyrics_spotify,
-                genius_lyrics_text=self.results.lyrics_genius,
-                transcription_data_dict_whisper=self.results.transcription_whisper,
-                transcription_data_dict_audioshake=self.results.transcription_audioshake,
-            )
-            # Run correction
-            corrected_data = self.corrector.run_corrector()
-            # Store corrected results
-            self.results.transcription_corrected = corrected_data
-            self.logger.info("Lyrics correction completed")
-        except Exception as e:
-            self.logger.error(f"Failed to correct lyrics: {str(e)}")
-            # Use uncorrected transcription as fallback
-            self.results.transcription_corrected = self.results.transcription_primary
-            self.logger.warning("Using uncorrected transcription as fallback")
+        # Run correction
+        corrected_data = self.corrector.run(
+            transcription_results=self.results.transcription_results, lyrics_results=self.results.lyrics_results
+        )
+        # Store corrected results
+        self.results.transcription_corrected = corrected_data
+        self.logger.info("Lyrics correction completed")
+        # Add human review step
+        if self.output_config.enable_review:  # We'll need to add this config option
+            from ..review import start_review_server
+            self.logger.info("Starting human review process")
+            self.results.transcription_corrected = start_review_server(corrected_data)
+            self.logger.info("Human review completed")
     def generate_outputs(self) -> None:
         """Generate output files."""
         self.logger.info("Generating output files")
-        try:
-            output_files = self.output_generator.generate_outputs(
-                transcription_data=self.results.transcription_corrected,
-                output_prefix=self.output_prefix,
-                audio_filepath=self.audio_filepath,
-                render_video=self.output_config.render_video,
-            )
-            # Store output paths
-            self.results.lrc_filepath = output_files.get("lrc")
-            self.results.ass_filepath = output_files.get("ass")
-            self.results.video_filepath = output_files.get("video")
-        except Exception as e:
-            self.logger.error(f"Failed to generate outputs: {str(e)}")
-            raise
+        output_files = self.output_generator.generate_outputs(
+            transcription_corrected=self.results.transcription_corrected,
+            lyrics_results=self.results.lyrics_results,
+            output_prefix=self.output_prefix,
+            audio_filepath=self.audio_filepath,
+            artist=self.artist,
+            title=self.title,
+        )
+        # Store all output paths in results
+        self.results.lrc_filepath = output_files.lrc
+        self.results.ass_filepath = output_files.ass
+        self.results.video_filepath = output_files.video
+        self.results.original_txt = output_files.original_txt
+        self.results.corrected_txt = output_files.corrected_txt
+        self.results.corrections_json = output_files.corrections_json
+        self.results.cdg_filepath = output_files.cdg
+        self.results.mp3_filepath = output_files.mp3
+        self.results.cdg_zip_filepath = output_files.cdg_zip

lyrics-transcriber 0.30.0__py3-none-any.whl → 0.32.1__py3-none-any.whl

lyrics-transcriber 0.30.0__py3-none-any.whl → 0.32.1__py3-none-any.whl