PyPI - lyrics-transcriber - Versions diffs - 0.30.0__py3-none-any.whl → 0.30.1__py3-none-any.whl - Mend

lyrics-transcriber 0.30.0__py3-none-any.whl → 0.30.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (25) hide show

lyrics_transcriber/cli/{main.py → cli_main.py} +15 -3
lyrics_transcriber/core/controller.py +129 -95
lyrics_transcriber/correction/base_strategy.py +29 -0
lyrics_transcriber/correction/corrector.py +52 -0
lyrics_transcriber/correction/strategy_diff.py +263 -0
lyrics_transcriber/lyrics/base_lyrics_provider.py +201 -0
lyrics_transcriber/lyrics/genius.py +70 -0
lyrics_transcriber/lyrics/spotify.py +82 -0
lyrics_transcriber/output/generator.py +158 -97
lyrics_transcriber/output/subtitles.py +12 -12
lyrics_transcriber/storage/dropbox.py +110 -134
lyrics_transcriber/transcribers/audioshake.py +170 -105
lyrics_transcriber/transcribers/base_transcriber.py +186 -0
lyrics_transcriber/transcribers/whisper.py +268 -133
{lyrics_transcriber-0.30.0.dist-info → lyrics_transcriber-0.30.1.dist-info}/METADATA +1 -1
lyrics_transcriber-0.30.1.dist-info/RECORD +25 -0
lyrics_transcriber-0.30.1.dist-info/entry_points.txt +3 -0
lyrics_transcriber/core/corrector.py +0 -56
lyrics_transcriber/core/fetcher.py +0 -143
lyrics_transcriber/storage/tokens.py +0 -116
lyrics_transcriber/transcribers/base.py +0 -31
lyrics_transcriber-0.30.0.dist-info/RECORD +0 -22
lyrics_transcriber-0.30.0.dist-info/entry_points.txt +0 -3
{lyrics_transcriber-0.30.0.dist-info → lyrics_transcriber-0.30.1.dist-info}/LICENSE +0 -0
{lyrics_transcriber-0.30.0.dist-info → lyrics_transcriber-0.30.1.dist-info}/WHEEL +0 -0

lyrics_transcriber/transcribers/whisper.py CHANGED Viewed

@@ -1,134 +1,60 @@
 #! /usr/bin/env python3
+from dataclasses import dataclass
 import os
-import sys
 import json
 import requests
 import hashlib
 import tempfile
-from time import sleep
+import time
+from typing import Optional, Dict, Any, Protocol, Union
+from pathlib import Path
 from pydub import AudioSegment
-from .base import BaseTranscriber
-from ..storage.dropbox import DropboxHandler
+from .base_transcriber import BaseTranscriber, TranscriptionData, LyricsSegment, Word, TranscriptionError
-class WhisperTranscriber(BaseTranscriber):
-    """Transcription service using Whisper API via RunPod."""
+@dataclass
+class WhisperConfig:
+    """Configuration for Whisper transcription service."""
-    def __init__(
-        self,
-        logger=None,
-        runpod_api_key=None,
-        endpoint_id=None,
-        dropbox_app_key=None,
-        dropbox_app_secret=None,
-        dropbox_refresh_token=None,
-        dropbox_access_token=None,
-    ):
-        super().__init__(logger)
-        self.runpod_api_key = runpod_api_key or os.getenv("RUNPOD_API_KEY")
-        self.endpoint_id = endpoint_id or os.getenv("WHISPER_RUNPOD_ID")
-        if not self.runpod_api_key or not self.endpoint_id:
-            raise ValueError("RunPod API key and endpoint ID must be provided either directly or via environment variables")
-        self.dbx = DropboxHandler(
-            app_key=dropbox_app_key or os.getenv("WHISPER_DROPBOX_APP_KEY"),
-            app_secret=dropbox_app_secret or os.getenv("WHISPER_DROPBOX_APP_SECRET"),
-            refresh_token=dropbox_refresh_token or os.getenv("WHISPER_DROPBOX_REFRESH_TOKEN"),
-            access_token=dropbox_access_token or os.getenv("WHISPER_DROPBOX_ACCESS_TOKEN"),
-        )
+    runpod_api_key: Optional[str] = None
+    endpoint_id: Optional[str] = None
+    dropbox_app_key: Optional[str] = None
+    dropbox_app_secret: Optional[str] = None
+    dropbox_refresh_token: Optional[str] = None
+    timeout_minutes: int = 10
-    def get_name(self) -> str:
-        return "Whisper"
-    def transcribe(self, audio_filepath: str) -> dict:
-        """
-        Transcribe an audio file using Whisper API via RunPod.
+class FileStorageProtocol(Protocol):
+    """Protocol for file storage operations."""
-        Args:
-            audio_filepath: Path to the audio file to transcribe
+    def file_exists(self, path: str) -> bool: ...  # pragma: no cover
+    def upload_with_retry(self, file: Any, path: str) -> None: ...  # pragma: no cover
+    def create_or_get_shared_link(self, path: str) -> str: ...  # pragma: no cover
-        Returns:
-            Dict containing:
-                - segments: List of segments with start/end times and word-level data
-                - text: Full text transcription
-                - metadata: Dict of additional info
-        """
-        self.logger.info(f"Starting transcription for {audio_filepath} using Whisper API")
-        # Calculate MD5 hash and prepare file
-        file_hash = self._get_file_md5(audio_filepath)
-        processed_filepath = self._convert_to_flac(audio_filepath)
+class RunPodWhisperAPI:
+    """Handles interactions with RunPod API."""
-        try:
-            # Upload to Dropbox and get URL
-            dropbox_path = f"/transcription_temp/{file_hash}{os.path.splitext(processed_filepath)[1]}"
-            audio_url = self._upload_and_get_link(processed_filepath, dropbox_path)
-            # Get transcription from API
-            result = self._run_transcription(audio_url)
-            # Add metadata
-            result["metadata"] = {
-                "service": self.get_name(),
-                "model": "large-v2",
-                "language": "en",
-            }
+    def __init__(self, config: WhisperConfig, logger):
+        self.config = config
+        self.logger = logger
+        self._validate_config()
-            return result
+    def _validate_config(self) -> None:
+        """Validate API configuration."""
+        if not self.config.runpod_api_key or not self.config.endpoint_id:
+            raise ValueError("RunPod API key and endpoint ID must be provided")
-        finally:
-            # Clean up temporary FLAC file if one was created
-            if processed_filepath != audio_filepath:
-                self.logger.debug(f"Cleaning up temporary file: {processed_filepath}")
-                os.unlink(processed_filepath)
-    def _convert_to_flac(self, filepath: str) -> str:
-        """Convert WAV to FLAC if needed for faster upload."""
-        if not filepath.lower().endswith(".wav"):
-            return filepath
-        self.logger.info("Converting WAV to FLAC for faster upload...")
-        audio = AudioSegment.from_wav(filepath)
-        with tempfile.NamedTemporaryFile(suffix=".flac", delete=False) as temp_flac:
-            flac_path = temp_flac.name
-            audio.export(flac_path, format="flac")
-        return flac_path
-    def _get_file_md5(self, filepath: str) -> str:
-        """Calculate MD5 hash of a file."""
-        md5_hash = hashlib.md5()
-        with open(filepath, "rb") as f:
-            for chunk in iter(lambda: f.read(4096), b""):
-                md5_hash.update(chunk)
-        return md5_hash.hexdigest()
-    def _upload_and_get_link(self, filepath: str, dropbox_path: str) -> str:
-        """Upload file to Dropbox and return shared link."""
-        if not self.dbx.file_exists(dropbox_path):
-            self.logger.info("Uploading file to Dropbox...")
-            with open(filepath, "rb") as f:
-                self.dbx.upload_with_retry(f, dropbox_path)
-        else:
-            self.logger.info("File already exists in Dropbox, skipping upload...")
-        audio_url = self.dbx.create_or_get_shared_link(dropbox_path)
-        self.logger.debug(f"Using shared link: {audio_url}")
-        return audio_url
-    def _run_transcription(self, audio_url: str) -> dict:
-        """Submit transcription job to RunPod and get results."""
-        run_url = f"https://api.runpod.ai/v2/{self.endpoint_id}/run"
-        status_url = f"https://api.runpod.ai/v2/{self.endpoint_id}/status"
-        headers = {"Authorization": f"Bearer {self.runpod_api_key}"}
+    def submit_job(self, audio_url: str) -> str:
+        """Submit transcription job and return job ID."""
+        run_url = f"https://api.runpod.ai/v2/{self.config.endpoint_id}/run"
+        headers = {"Authorization": f"Bearer {self.config.runpod_api_key}"}
         payload = {
             "input": {
                 "audio": audio_url,
                 "word_timestamps": True,
-                "model": "large-v2",
+                "model": "medium",
                 "temperature": 0.2,
                 "best_of": 5,
                 "compression_ratio_threshold": 2.8,
@@ -138,49 +64,258 @@ class WhisperTranscriber(BaseTranscriber):
             }
         }
-        # Submit job
         self.logger.info("Submitting transcription job...")
         response = requests.post(run_url, json=payload, headers=headers)
         self.logger.debug(f"Response status code: {response.status_code}")
+        # Try to parse and log the JSON response
         try:
-            self.logger.debug(f"Response content: {json.dumps(response.json(), indent=2)}")
-        except:
+            response_json = response.json()
+            self.logger.debug(f"Response content: {json.dumps(response_json, indent=2)}")
+        except ValueError:
             self.logger.debug(f"Raw response content: {response.text}")
+            # Re-raise if we can't parse the response at all
+            raise TranscriptionError(f"Invalid JSON response: {response.text}")
+        response.raise_for_status()
+        return response_json["id"]
+    def get_job_status(self, job_id: str) -> Dict[str, Any]:
+        """Get job status and results."""
+        status_url = f"https://api.runpod.ai/v2/{self.config.endpoint_id}/status/{job_id}"
+        headers = {"Authorization": f"Bearer {self.config.runpod_api_key}"}
+        response = requests.get(status_url, headers=headers)
         response.raise_for_status()
-        job_id = response.json()["id"]
+        return response.json()
+    def cancel_job(self, job_id: str) -> None:
+        """Cancel a running job."""
+        cancel_url = f"https://api.runpod.ai/v2/{self.config.endpoint_id}/cancel/{job_id}"
+        headers = {"Authorization": f"Bearer {self.config.runpod_api_key}"}
+        try:
+            response = requests.post(cancel_url, headers=headers)
+            response.raise_for_status()
+        except Exception as e:
+            self.logger.warning(f"Failed to cancel job {job_id}: {e}")
+    def wait_for_job_result(self, job_id: str) -> Dict[str, Any]:
+        """Poll for job completion and return results."""
+        self.logger.info(f"Getting job result for job {job_id}")
+        start_time = time.time()
+        last_status_log = start_time
+        timeout_seconds = self.config.timeout_minutes * 60
-        # Poll for results
-        self.logger.info("Waiting for results...")
         while True:
-            status_response = requests.get(f"{status_url}/{job_id}", headers=headers)
-            status_response.raise_for_status()
-            status_data = status_response.json()
+            current_time = time.time()
+            elapsed_time = current_time - start_time
+            if elapsed_time > timeout_seconds:
+                self.cancel_job(job_id)
+                raise TranscriptionError(f"Transcription timed out after {self.config.timeout_minutes} minutes")
+            # Log status periodically
+            if current_time - last_status_log >= 60:
+                self.logger.info(f"Still waiting for transcription... Elapsed time: {int(elapsed_time/60)} minutes")
+                last_status_log = current_time
+            status_data = self.get_job_status(job_id)
             if status_data["status"] == "COMPLETED":
                 return status_data["output"]
             elif status_data["status"] == "FAILED":
-                raise Exception(f"Transcription failed: {status_data.get('error', 'Unknown error')}")
+                error_msg = status_data.get("error", "Unknown error")
+                self.logger.error(f"Job failed with error: {error_msg}")
+                raise TranscriptionError(f"Transcription failed: {error_msg}")
+            time.sleep(5)
+class AudioProcessor:
+    """Handles audio file processing."""
+    def __init__(self, logger):
+        self.logger = logger
+    def get_file_md5(self, filepath: str) -> str:
+        """Calculate MD5 hash of a file."""
+        md5_hash = hashlib.md5()
+        with open(filepath, "rb") as f:
+            for chunk in iter(lambda: f.read(4096), b""):
+                md5_hash.update(chunk)
+        return md5_hash.hexdigest()
+    def convert_to_flac(self, filepath: str) -> str:
+        """Convert WAV to FLAC if needed for faster upload."""
+        if not filepath.lower().endswith(".wav"):
+            return filepath
+        self.logger.info("Converting WAV to FLAC for faster upload...")
+        audio = AudioSegment.from_wav(filepath)
+        with tempfile.NamedTemporaryFile(suffix=".flac", delete=False) as temp_flac:
+            flac_path = temp_flac.name
+            audio.export(flac_path, format="flac")
+        return flac_path
+class WhisperTranscriber(BaseTranscriber):
+    """Transcription service using Whisper API via RunPod."""
+    def __init__(
+        self,
+        cache_dir: Union[str, Path],
+        config: Optional[WhisperConfig] = None,
+        logger: Optional[Any] = None,
+        runpod_client: Optional[RunPodWhisperAPI] = None,
+        storage_client: Optional[FileStorageProtocol] = None,
+        audio_processor: Optional[AudioProcessor] = None,
+    ):
+        """Initialize Whisper transcriber."""
+        super().__init__(cache_dir=cache_dir, logger=logger)
+        # Initialize configuration
+        self.config = config or WhisperConfig(
+            runpod_api_key=os.getenv("RUNPOD_API_KEY"),
+            endpoint_id=os.getenv("WHISPER_RUNPOD_ID"),
+            dropbox_app_key=os.getenv("WHISPER_DROPBOX_APP_KEY"),
+            dropbox_app_secret=os.getenv("WHISPER_DROPBOX_APP_SECRET"),
+            dropbox_refresh_token=os.getenv("WHISPER_DROPBOX_REFRESH_TOKEN"),
+        )
+        # Initialize components (with dependency injection)
+        self.runpod = runpod_client or RunPodWhisperAPI(self.config, self.logger)
+        self.storage = storage_client or self._initialize_storage()
+        self.audio_processor = audio_processor or AudioProcessor(self.logger)
+    def _initialize_storage(self) -> FileStorageProtocol:
+        """Initialize storage client."""
+        from ..storage.dropbox import DropboxHandler, DropboxConfig
-            sleep(2)  # Wait 2 seconds before checking again
+        # Create config using os.getenv directly
+        config = DropboxConfig(
+            app_key=os.getenv("WHISPER_DROPBOX_APP_KEY"),
+            app_secret=os.getenv("WHISPER_DROPBOX_APP_SECRET"),
+            refresh_token=os.getenv("WHISPER_DROPBOX_REFRESH_TOKEN"),
+        )
+        # Log the actual config values being used
+        self.logger.debug("Initializing DropboxHandler with config")
+        return DropboxHandler(config=config)
+    def get_name(self) -> str:
+        return "Whisper"
+    def _perform_transcription(self, audio_filepath: str) -> TranscriptionData:
+        """Actually perform the whisper transcription using Whisper API."""
+        self.logger.info(f"Starting transcription for {audio_filepath}")
-if __name__ == "__main__":
-    # Example usage
-    import logging
+        # Start transcription and get results
+        job_id = self.start_transcription(audio_filepath)
+        result = self.get_transcription_result(job_id)
+        return result
-    logging.basicConfig(level=logging.INFO)
+    def start_transcription(self, audio_filepath: str) -> str:
+        """Prepare audio and start whisper transcription job."""
+        audio_url, temp_filepath = self._prepare_audio_url(audio_filepath)
+        try:
+            return self.runpod.submit_job(audio_url)
+        except Exception as e:
+            if temp_filepath:
+                self._cleanup_temporary_files(temp_filepath)
+            raise TranscriptionError(f"Failed to submit job: {str(e)}") from e
+    def _prepare_audio_url(self, audio_filepath: str) -> tuple[str, Optional[str]]:
+        """Process audio file and return URL for API and path to any temporary files."""
+        if audio_filepath.startswith(("http://", "https://")):
+            return audio_filepath, None
+        file_hash = self.audio_processor.get_file_md5(audio_filepath)
+        temp_flac_filepath = self.audio_processor.convert_to_flac(audio_filepath)
+        # Upload and get URL
+        dropbox_path = f"/transcription_temp/{file_hash}{os.path.splitext(temp_flac_filepath)[1]}"
+        url = self._upload_and_get_link(temp_flac_filepath, dropbox_path)
+        return url, temp_flac_filepath
+    def get_transcription_result(self, job_id: str) -> Dict[str, Any]:
+        """Poll for whisper job completion and return raw results."""
+        raw_data = self.runpod.wait_for_job_result(job_id)
+        # Add job_id to raw data for later use
+        raw_data["job_id"] = job_id
+        return raw_data
+    def _convert_result_format(self, raw_data: Dict[str, Any]) -> TranscriptionData:
+        """Convert Whisper API response to standard format."""
+        self._validate_response(raw_data)
+        job_id = raw_data.get("job_id")
+        all_words = []
+        # First collect all words from word_timestamps
+        word_list = [
+            Word(
+                text=word["word"].strip(),
+                start_time=word["start"],
+                end_time=word["end"],
+                confidence=word.get("probability"),  # Only set if provided
+            )
+            for word in raw_data.get("word_timestamps", [])
+        ]
+        all_words.extend(word_list)
+        # Then create segments, using the words that fall within each segment's time range
+        segments = []
+        for seg in raw_data["segments"]:
+            segment_words = [word for word in word_list if seg["start"] <= word.start_time < seg["end"]]
+            segments.append(LyricsSegment(text=seg["text"].strip(), words=segment_words, start_time=seg["start"], end_time=seg["end"]))
+        return TranscriptionData(
+            segments=segments,
+            words=all_words,
+            text=raw_data["transcription"],
+            source=self.get_name(),
+            metadata={
+                "language": raw_data.get("detected_language", "en"),
+                "model": raw_data.get("model"),
+                "job_id": job_id,
+            },
+        )
-    if len(sys.argv) > 1:
-        audio_file = sys.argv[1]
-    else:
-        audio_file = input("Enter the path to your audio file: ")
+    def _upload_and_get_link(self, filepath: str, dropbox_path: str) -> str:
+        """Upload file to storage and return shared link."""
+        if not self.storage.file_exists(dropbox_path):
+            self.logger.info("Uploading file to storage...")
+            with open(filepath, "rb") as f:
+                self.storage.upload_with_retry(f, dropbox_path)
+        else:
+            self.logger.info("File already exists in storage, skipping upload...")
-    transcriber = WhisperTranscriber()
-    results = transcriber.transcribe(audio_file)
+        audio_url = self.storage.create_or_get_shared_link(dropbox_path)
+        self.logger.debug(f"Using shared link: {audio_url}")
+        return audio_url
-    output_file = f"transcription_results_{WhisperTranscriber._get_file_md5(audio_file)}.json"
-    with open(output_file, "w", encoding="utf-8") as f:
-        json.dump(results, f, indent=2)
-    print(f"Transcription completed! Results saved to {output_file}")
+    def _cleanup_temporary_files(self, *filepaths: Optional[str]) -> None:
+        """Clean up any temporary files that were created during transcription."""
+        for filepath in filepaths:
+            if filepath and os.path.exists(filepath):
+                try:
+                    os.remove(filepath)
+                    self.logger.debug(f"Cleaned up temporary file: {filepath}")
+                except Exception as e:
+                    self.logger.warning(f"Failed to clean up temporary file {filepath}: {e}")
+    def _validate_response(self, raw_data: Dict[str, Any]) -> None:
+        """Validate the response contains required fields."""
+        if not isinstance(raw_data, dict):
+            raise TranscriptionError(f"Invalid response format: {raw_data}")
+        if "segments" not in raw_data:
+            raise TranscriptionError("Response missing required 'segments' field")
+        if "transcription" not in raw_data:
+            raise TranscriptionError("Response missing required 'transcription' field")

{lyrics_transcriber-0.30.0.dist-info → lyrics_transcriber-0.30.1.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.1
 Name: lyrics-transcriber
-Version: 0.30.0
+Version: 0.30.1
 Summary: Automatically create synchronised lyrics files in ASS and MidiCo LRC formats with word-level timestamps, using Whisper and lyrics from Genius and Spotify
 Home-page: https://github.com/karaokenerds/python-lyrics-transcriber
 License: MIT

lyrics_transcriber-0.30.1.dist-info/RECORD ADDED Viewed

@@ -0,0 +1,25 @@
+lyrics_transcriber/__init__.py,sha256=Hj2HdSBAl6kmiqa5s3MDo_RobkITadzuF-81-ON3awA,180
+lyrics_transcriber/cli/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
+lyrics_transcriber/cli/cli_main.py,sha256=-h3W9E4P5lHEjIBWiDvY0v7avldhA-cfYoAVwMlv0Zo,8137
+lyrics_transcriber/core/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
+lyrics_transcriber/core/controller.py,sha256=k_moklU2NqpHOGxWTRVyImWgX6_dv1NES0j50-FRGxw,13057
+lyrics_transcriber/correction/base_strategy.py,sha256=vEKsj19ZNZZkvHRP0J7cZamJWqjLZHbRJ9sN0AyHbAA,867
+lyrics_transcriber/correction/corrector.py,sha256=lsXJ1l5sNoZjIU65A3yWTXkOcraz7QP9KU8OUzA_UTc,2147
+lyrics_transcriber/correction/strategy_diff.py,sha256=xJTFnmVcuE18zZcitweVaRqB82jCMm9Ey29zAFB4LsI,10188
+lyrics_transcriber/lyrics/base_lyrics_provider.py,sha256=s5IDrlT6OudAA_gIlAQzeD0bPqoUFsiYftSQQm7XxOE,7518
+lyrics_transcriber/lyrics/genius.py,sha256=zDiv0t2f7wphnPdcyPH6tahXBfOnbE63Nu8eRG0nqg4,3195
+lyrics_transcriber/lyrics/spotify.py,sha256=Sic3nPFcpSWW7lE-yr3stb6D5m5WFSQXCwzWj3lW0Ls,3584
+lyrics_transcriber/output/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
+lyrics_transcriber/output/ass.py,sha256=b8lnjgXGD1OD1ld_b1xxUmSOf4nSEfz9BpgSkh16R4g,90291
+lyrics_transcriber/output/generator.py,sha256=idUsuS01bnaIB5spDFZlxE0wsvJ2I071SmJfXO9BCCk,10870
+lyrics_transcriber/output/subtitles.py,sha256=JEehSPl81hxhK6cS6RK4XAC_OLentCxiMCE7UYI9B64,11851
+lyrics_transcriber/storage/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
+lyrics_transcriber/storage/dropbox.py,sha256=Dyam1ULTkoxD1X5trkZ5dGp5XhBGCn998moC8IS9-68,9804
+lyrics_transcriber/transcribers/audioshake.py,sha256=0sXvD1FJYXxISH72n5HaN9fnTxgmaQrqmY1W5Lb6Yu8,8631
+lyrics_transcriber/transcribers/base_transcriber.py,sha256=9XWUlBSwBCjKvz7Gs1NT7EIysMyacS-YlvDjpwlqwgI,6985
+lyrics_transcriber/transcribers/whisper.py,sha256=QE9Dsb6emGOaFcepJHrECjVdCfAJZRncGj7uXy-0mAk,12942
+lyrics_transcriber-0.30.1.dist-info/LICENSE,sha256=BiPihPDxhxIPEx6yAxVfAljD5Bhm_XG2teCbPEj_m0Y,1069
+lyrics_transcriber-0.30.1.dist-info/METADATA,sha256=c6P3R-KVxCJ10m-92bezeetdztdB7vvv5RMlTnF4Xbg,5485
+lyrics_transcriber-0.30.1.dist-info/WHEEL,sha256=Nq82e9rUAnEjt98J6MlVmMCZb-t9cYE2Ir1kpBmnWfs,88
+lyrics_transcriber-0.30.1.dist-info/entry_points.txt,sha256=KHZMIwodpv7TQUN9z28G-0knEFsRta9ZBAcIbmBAT40,75
+lyrics_transcriber-0.30.1.dist-info/RECORD,,

lyrics_transcriber-0.30.1.dist-info/entry_points.txt ADDED Viewed

@@ -0,0 +1,3 @@
+[console_scripts]
+lyrics-transcriber=lyrics_transcriber.cli.cli_main:main

lyrics_transcriber/core/corrector.py DELETED Viewed

@@ -1,56 +0,0 @@
-import json
-import logging
-from typing import Dict, Optional
-class LyricsTranscriptionCorrector:
-    def __init__(
-        self,
-        logger: Optional[logging.Logger] = None,
-    ):
-        self.logger = logger or logging.getLogger(__name__)
-        # Initialize instance variables for input data
-        self.spotify_lyrics_data_dict = None
-        self.spotify_lyrics_text = None
-        self.genius_lyrics_text = None
-        self.transcription_data_dict_whisper = None
-        self.transcription_data_dict_audioshake = None
-    def set_input_data(
-        self,
-        spotify_lyrics_data_dict: Optional[Dict] = None,
-        spotify_lyrics_text: Optional[str] = None,
-        genius_lyrics_text: Optional[str] = None,
-        transcription_data_dict_whisper: Optional[Dict] = None,
-        transcription_data_dict_audioshake: Optional[Dict] = None,
-    ) -> None:
-        """Store the input data as instance variables"""
-        self.spotify_lyrics_data_dict = spotify_lyrics_data_dict
-        self.spotify_lyrics_text = spotify_lyrics_text
-        self.genius_lyrics_text = genius_lyrics_text
-        self.transcription_data_dict_whisper = transcription_data_dict_whisper
-        self.transcription_data_dict_audioshake = transcription_data_dict_audioshake
-    def run_corrector(self) -> Dict:
-        """
-        Test implementation that replaces every third word with 'YOLO' in the AudioShake transcription.
-        """
-        self.logger.info("Running corrector (test implementation - replacing every 3rd word with YOLO)")
-        # Create a deep copy to avoid modifying the original
-        modified_data = json.loads(json.dumps(self.transcription_data_dict_audioshake))
-        # Process each segment
-        for segment in modified_data["segments"]:
-            # Replace every third word in the words list
-            for i in range(2, len(segment["words"]), 3):
-                segment["words"][i]["text"] = "YOLO"
-            # Reconstruct the segment text from the modified words
-            segment["text"] = " ".join(word["text"] for word in segment["words"])
-        # Reconstruct the full text from all segments
-        modified_data["text"] = "".join(segment["text"] for segment in modified_data["segments"])
-        return modified_data

lyrics-transcriber 0.30.0__py3-none-any.whl → 0.30.1__py3-none-any.whl

lyrics-transcriber 0.30.0__py3-none-any.whl → 0.30.1__py3-none-any.whl