PyPI - karaoke-gen - Versions diffs - 0.90.1__py3-none-any.whl → 0.96.0__py3-none-any.whl - Mend

karaoke-gen 0.90.1-py3-none-any.whl → 0.96.0-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (187) hide show

backend/.coveragerc +20 -0
backend/.gitignore +37 -0
backend/Dockerfile +43 -0
backend/Dockerfile.base +74 -0
backend/README.md +242 -0
backend/__init__.py +0 -0
backend/api/__init__.py +0 -0
backend/api/dependencies.py +457 -0
backend/api/routes/__init__.py +0 -0
backend/api/routes/admin.py +742 -0
backend/api/routes/audio_search.py +903 -0
backend/api/routes/auth.py +348 -0
backend/api/routes/file_upload.py +2076 -0
backend/api/routes/health.py +344 -0
backend/api/routes/internal.py +435 -0
backend/api/routes/jobs.py +1610 -0
backend/api/routes/review.py +652 -0
backend/api/routes/themes.py +162 -0
backend/api/routes/users.py +1014 -0
backend/config.py +172 -0
backend/main.py +133 -0
backend/middleware/__init__.py +5 -0
backend/middleware/audit_logging.py +124 -0
backend/models/__init__.py +0 -0
backend/models/job.py +519 -0
backend/models/requests.py +123 -0
backend/models/theme.py +153 -0
backend/models/user.py +254 -0
backend/models/worker_log.py +164 -0
backend/pyproject.toml +29 -0
backend/quick-check.sh +93 -0
backend/requirements.txt +29 -0
backend/run_tests.sh +60 -0
backend/services/__init__.py +0 -0
backend/services/audio_analysis_service.py +243 -0
backend/services/audio_editing_service.py +278 -0
backend/services/audio_search_service.py +702 -0
backend/services/auth_service.py +630 -0
backend/services/credential_manager.py +792 -0
backend/services/discord_service.py +172 -0
backend/services/dropbox_service.py +301 -0
backend/services/email_service.py +1093 -0
backend/services/encoding_interface.py +454 -0
backend/services/encoding_service.py +405 -0
backend/services/firestore_service.py +512 -0
backend/services/flacfetch_client.py +573 -0
backend/services/gce_encoding/README.md +72 -0
backend/services/gce_encoding/__init__.py +22 -0
backend/services/gce_encoding/main.py +589 -0
backend/services/gce_encoding/requirements.txt +16 -0
backend/services/gdrive_service.py +356 -0
backend/services/job_logging.py +258 -0
backend/services/job_manager.py +842 -0
backend/services/job_notification_service.py +271 -0
backend/services/local_encoding_service.py +590 -0
backend/services/local_preview_encoding_service.py +407 -0
backend/services/lyrics_cache_service.py +216 -0
backend/services/metrics.py +413 -0
backend/services/packaging_service.py +287 -0
backend/services/rclone_service.py +106 -0
backend/services/storage_service.py +209 -0
backend/services/stripe_service.py +275 -0
backend/services/structured_logging.py +254 -0
backend/services/template_service.py +330 -0
backend/services/theme_service.py +469 -0
backend/services/tracing.py +543 -0
backend/services/user_service.py +721 -0
backend/services/worker_service.py +558 -0
backend/services/youtube_service.py +112 -0
backend/services/youtube_upload_service.py +445 -0
backend/tests/__init__.py +4 -0
backend/tests/conftest.py +224 -0
backend/tests/emulator/__init__.py +7 -0
backend/tests/emulator/conftest.py +88 -0
backend/tests/emulator/test_e2e_cli_backend.py +1053 -0
backend/tests/emulator/test_emulator_integration.py +356 -0
backend/tests/emulator/test_style_loading_direct.py +436 -0
backend/tests/emulator/test_worker_logs_direct.py +229 -0
backend/tests/emulator/test_worker_logs_subcollection.py +443 -0
backend/tests/requirements-test.txt +10 -0
backend/tests/requirements.txt +6 -0
backend/tests/test_admin_email_endpoints.py +411 -0
backend/tests/test_api_integration.py +460 -0
backend/tests/test_api_routes.py +93 -0
backend/tests/test_audio_analysis_service.py +294 -0
backend/tests/test_audio_editing_service.py +386 -0
backend/tests/test_audio_search.py +1398 -0
backend/tests/test_audio_services.py +378 -0
backend/tests/test_auth_firestore.py +231 -0
backend/tests/test_config_extended.py +68 -0
backend/tests/test_credential_manager.py +377 -0
backend/tests/test_dependencies.py +54 -0
backend/tests/test_discord_service.py +244 -0
backend/tests/test_distribution_services.py +820 -0
backend/tests/test_dropbox_service.py +472 -0
backend/tests/test_email_service.py +492 -0
backend/tests/test_emulator_integration.py +322 -0
backend/tests/test_encoding_interface.py +412 -0
backend/tests/test_file_upload.py +1739 -0
backend/tests/test_flacfetch_client.py +632 -0
backend/tests/test_gdrive_service.py +524 -0
backend/tests/test_instrumental_api.py +431 -0
backend/tests/test_internal_api.py +343 -0
backend/tests/test_job_creation_regression.py +583 -0
backend/tests/test_job_manager.py +339 -0
backend/tests/test_job_manager_notifications.py +329 -0
backend/tests/test_job_notification_service.py +443 -0
backend/tests/test_jobs_api.py +273 -0
backend/tests/test_local_encoding_service.py +423 -0
backend/tests/test_local_preview_encoding_service.py +567 -0
backend/tests/test_main.py +87 -0
backend/tests/test_models.py +918 -0
backend/tests/test_packaging_service.py +382 -0
backend/tests/test_requests.py +201 -0
backend/tests/test_routes_jobs.py +282 -0
backend/tests/test_routes_review.py +337 -0
backend/tests/test_services.py +556 -0
backend/tests/test_services_extended.py +112 -0
backend/tests/test_storage_service.py +448 -0
backend/tests/test_style_upload.py +261 -0
backend/tests/test_template_service.py +295 -0
backend/tests/test_theme_service.py +516 -0
backend/tests/test_unicode_sanitization.py +522 -0
backend/tests/test_upload_api.py +256 -0
backend/tests/test_validate.py +156 -0
backend/tests/test_video_worker_orchestrator.py +847 -0
backend/tests/test_worker_log_subcollection.py +509 -0
backend/tests/test_worker_logging.py +365 -0
backend/tests/test_workers.py +1116 -0
backend/tests/test_workers_extended.py +178 -0
backend/tests/test_youtube_service.py +247 -0
backend/tests/test_youtube_upload_service.py +568 -0
backend/validate.py +173 -0
backend/version.py +27 -0
backend/workers/README.md +597 -0
backend/workers/__init__.py +11 -0
backend/workers/audio_worker.py +618 -0
backend/workers/lyrics_worker.py +683 -0
backend/workers/render_video_worker.py +483 -0
backend/workers/screens_worker.py +525 -0
backend/workers/style_helper.py +198 -0
backend/workers/video_worker.py +1277 -0
backend/workers/video_worker_orchestrator.py +701 -0
backend/workers/worker_logging.py +278 -0
karaoke_gen/instrumental_review/static/index.html +7 -4
karaoke_gen/karaoke_finalise/karaoke_finalise.py +6 -1
karaoke_gen/utils/__init__.py +163 -8
karaoke_gen/video_background_processor.py +9 -4
{karaoke_gen-0.90.1.dist-info → karaoke_gen-0.96.0.dist-info}/METADATA +1 -1
{karaoke_gen-0.90.1.dist-info → karaoke_gen-0.96.0.dist-info}/RECORD +186 -41
lyrics_transcriber/correction/agentic/providers/config.py +9 -5
lyrics_transcriber/correction/agentic/providers/langchain_bridge.py +1 -51
lyrics_transcriber/correction/corrector.py +192 -130
lyrics_transcriber/correction/operations.py +24 -9
lyrics_transcriber/frontend/package-lock.json +2 -2
lyrics_transcriber/frontend/package.json +1 -1
lyrics_transcriber/frontend/src/components/AIFeedbackModal.tsx +1 -1
lyrics_transcriber/frontend/src/components/CorrectedWordWithActions.tsx +11 -7
lyrics_transcriber/frontend/src/components/EditActionBar.tsx +31 -5
lyrics_transcriber/frontend/src/components/EditModal.tsx +28 -10
lyrics_transcriber/frontend/src/components/EditTimelineSection.tsx +123 -27
lyrics_transcriber/frontend/src/components/EditWordList.tsx +112 -60
lyrics_transcriber/frontend/src/components/Header.tsx +90 -76
lyrics_transcriber/frontend/src/components/LyricsAnalyzer.tsx +53 -31
lyrics_transcriber/frontend/src/components/LyricsSynchronizer/SyncControls.tsx +44 -13
lyrics_transcriber/frontend/src/components/LyricsSynchronizer/TimelineCanvas.tsx +66 -50
lyrics_transcriber/frontend/src/components/LyricsSynchronizer/index.tsx +124 -30
lyrics_transcriber/frontend/src/components/ReferenceView.tsx +1 -1
lyrics_transcriber/frontend/src/components/TimelineEditor.tsx +12 -5
lyrics_transcriber/frontend/src/components/TimingOffsetModal.tsx +3 -3
lyrics_transcriber/frontend/src/components/TranscriptionView.tsx +1 -1
lyrics_transcriber/frontend/src/components/WordDivider.tsx +11 -7
lyrics_transcriber/frontend/src/components/shared/components/Word.tsx +4 -2
lyrics_transcriber/frontend/src/hooks/useManualSync.ts +103 -1
lyrics_transcriber/frontend/src/theme.ts +42 -15
lyrics_transcriber/frontend/tsconfig.tsbuildinfo +1 -1
lyrics_transcriber/frontend/vite.config.js +5 -0
lyrics_transcriber/frontend/web_assets/assets/{index-BECn1o8Q.js → index-BSMgOq4Z.js} +6959 -5782
lyrics_transcriber/frontend/web_assets/assets/index-BSMgOq4Z.js.map +1 -0
lyrics_transcriber/frontend/web_assets/index.html +6 -2
lyrics_transcriber/frontend/web_assets/nomad-karaoke-logo.svg +5 -0
lyrics_transcriber/output/generator.py +17 -3
lyrics_transcriber/output/video.py +60 -95
lyrics_transcriber/frontend/web_assets/assets/index-BECn1o8Q.js.map +0 -1
{karaoke_gen-0.90.1.dist-info → karaoke_gen-0.96.0.dist-info}/WHEEL +0 -0
{karaoke_gen-0.90.1.dist-info → karaoke_gen-0.96.0.dist-info}/entry_points.txt +0 -0
{karaoke_gen-0.90.1.dist-info → karaoke_gen-0.96.0.dist-info}/licenses/LICENSE +0 -0

backend/workers/video_worker_orchestrator.py ADDED Viewed

@@ -0,0 +1,701 @@
+"""
+Video Worker Orchestrator.
+Coordinates the video generation pipeline stages in a unified way,
+regardless of whether encoding happens locally or on GCE.
+This resolves the code path divergence where GCE encoding bypassed
+features like YouTube upload, Discord notifications, and CDG/TXT packaging.
+Pipeline stages:
+1. Setup - Download files, prepare directories
+2. Packaging - CDG/TXT generation (if enabled)
+3. Encoding - GCE or Local via EncodingBackend interface
+4. Organization - Brand code, folder structure
+5. Distribution - YouTube, Dropbox, Google Drive uploads
+6. Notification - Discord notifications
+"""
+import logging
+import os
+import time
+from dataclasses import dataclass, field
+from typing import Optional, Dict, Any, List
+from pathlib import Path
+from backend.models.job import JobStatus
+from backend.services.job_manager import JobManager
+from backend.services.storage_service import StorageService
+from backend.services.tracing import job_span, add_span_event
+from karaoke_gen.utils import sanitize_filename
+logger = logging.getLogger(__name__)
+@dataclass
+class OrchestratorConfig:
+    """
+    Configuration for the video worker orchestrator.
+    Bundles the job identity, input file paths, feature flags and service
+    settings that VideoWorkerOrchestrator reads while running the pipeline.
+    """
+    # Job identity: job_id tags progress updates, tracing spans and GCS paths;
+    # artist/title are used to build output file names and the YouTube title
+    job_id: str
+    artist: str
+    title: str
+    # Input file paths (in temp_dir)
+    # The three required paths and end_video_path are handed to the encoding backend;
+    # instrumental_audio_path is also the audio source for CDG packaging
+    title_video_path: str
+    karaoke_video_path: str
+    instrumental_audio_path: str
+    end_video_path: Optional[str] = None
+    # CDG/TXT packaging is skipped when this is unset or not an existing file
+    lrc_file_path: Optional[str] = None
+    # Passed to the YouTube upload as the thumbnail
+    title_jpg_path: Optional[str] = None
+    # Output directory
+    # Packaging outputs and downloaded GCE files are written here, and the
+    # whole directory is uploaded to Dropbox
+    output_dir: str = ""
+    # Feature flags
+    enable_cdg: bool = False
+    enable_txt: bool = False
+    # YouTube upload additionally requires youtube_credentials to be set
+    enable_youtube_upload: bool = False
+    # Service configurations
+    # brand_prefix together with dropbox_path enables brand code generation and Dropbox upload
+    brand_prefix: Optional[str] = None
+    # Discord notification is skipped when no webhook URL is set
+    discord_webhook_url: Optional[str] = None
+    youtube_credentials: Optional[Dict[str, Any]] = None
+    # Used as the base of the YouTube description (empty string when unset)
+    youtube_description_template: Optional[str] = None
+    # Forwarded to the packaging service
+    cdg_styles: Optional[Dict[str, Any]] = None
+    # Dropbox/GDrive configuration
+    dropbox_path: Optional[str] = None
+    gdrive_folder_id: Optional[str] = None
+    # Keep existing brand code (for re-processing)
+    # When set it is used as-is and brand code generation is skipped
+    keep_brand_code: Optional[str] = None
+    # Encoding backend preference
+    encoding_backend: str = "auto"  # "auto", "local", "gce"
+    # Additional options
+    # dry_run is forwarded to the encoding, packaging, YouTube and Discord services;
+    # non_interactive is forwarded to the packaging and YouTube services
+    dry_run: bool = False
+    non_interactive: bool = True
+@dataclass
+class OrchestratorResult:
+    """
+    Result from the video worker orchestrator.
+    Created with success=False and filled in stage by stage while the
+    pipeline runs; optional fields stay None when the matching stage was
+    skipped or failed.
+    """
+    # True only after every pipeline stage has returned without raising
+    success: bool
+    # Text of the exception that aborted the pipeline, if any
+    error_message: Optional[str] = None
+    # Generated files
+    # Set from the encoding output; for the GCE backend each path is replaced by the
+    # local download path, or reset to None when that download fails
+    final_video: Optional[str] = None  # Lossless 4K MP4
+    final_video_mkv: Optional[str] = None  # Lossless 4K MKV
+    final_video_lossy: Optional[str] = None  # Lossy 4K MP4
+    final_video_720p: Optional[str] = None  # Lossy 720p MP4
+    # Zip archives produced by the packaging stage
+    final_karaoke_cdg_zip: Optional[str] = None
+    final_karaoke_txt_zip: Optional[str] = None
+    # Organization
+    # Either the preserved code from the config or one generated via Dropbox
+    brand_code: Optional[str] = None
+    # Distribution results
+    youtube_url: Optional[str] = None
+    dropbox_link: Optional[str] = None
+    # Value returned by the Google Drive upload; starts as an empty dict
+    gdrive_files: Optional[Dict[str, str]] = field(default_factory=dict)
+    # Timing
+    # encoding_time_seconds is copied from the encoding output and may be None
+    encoding_time_seconds: Optional[float] = None
+    # Wall-clock duration of run(), recorded on both success and failure
+    total_time_seconds: Optional[float] = None
+class VideoWorkerOrchestrator:
+    """
+    Orchestrates the video generation pipeline.
+    This class coordinates all stages of video generation in a unified way,
+    ensuring that features like YouTube upload and Discord notifications
+    work regardless of whether GCE or local encoding is used.
+    """
+    def __init__(
+        self,
+        config: OrchestratorConfig,
+        job_manager: Optional[JobManager] = None,
+        storage: Optional[StorageService] = None,
+        job_logger: Optional[logging.Logger] = None,
+    ):
+        """
+        Initialize the orchestrator.
+        Args:
+            config: Orchestrator configuration
+            job_manager: Job manager for state updates (optional)
+            storage: Storage service for file downloads (optional)
+            job_logger: Job-specific logger (optional)
+        """
+        self.config = config
+        self.job_manager = job_manager
+        self.storage = storage
+        self.job_log = job_logger or logging.getLogger(__name__)
+        # Services (lazy-loaded)
+        self._encoding_backend = None
+        self._packaging_service = None
+        self._youtube_service = None
+        self._discord_service = None
+        # State
+        self.result = OrchestratorResult(success=False)
+    def _get_encoding_backend(self):
+        """Lazy-load the encoding backend."""
+        if self._encoding_backend is None:
+            from backend.services.encoding_interface import get_encoding_backend
+            self._encoding_backend = get_encoding_backend(
+                backend_type=self.config.encoding_backend,
+                dry_run=self.config.dry_run,
+                logger=self.job_log,
+            )
+        return self._encoding_backend
+    def _get_packaging_service(self):
+        """Lazy-load the packaging service."""
+        if self._packaging_service is None:
+            from backend.services.packaging_service import PackagingService
+            self._packaging_service = PackagingService(
+                cdg_styles=self.config.cdg_styles,
+                dry_run=self.config.dry_run,
+                non_interactive=self.config.non_interactive,
+                logger=self.job_log,
+            )
+        return self._packaging_service
+    def _get_youtube_service(self):
+        """Lazy-load the YouTube upload service."""
+        if self._youtube_service is None:
+            from backend.services.youtube_upload_service import YouTubeUploadService
+            self._youtube_service = YouTubeUploadService(
+                credentials=self.config.youtube_credentials,
+                non_interactive=self.config.non_interactive,
+                server_side_mode=True,
+                dry_run=self.config.dry_run,
+                logger=self.job_log,
+            )
+        return self._youtube_service
+    def _get_discord_service(self):
+        """Lazy-load the Discord notification service."""
+        if self._discord_service is None:
+            from backend.services.discord_service import DiscordNotificationService
+            self._discord_service = DiscordNotificationService(
+                webhook_url=self.config.discord_webhook_url,
+                dry_run=self.config.dry_run,
+                logger=self.job_log,
+            )
+        return self._discord_service
+    def _update_progress(self, status: JobStatus, progress: int, message: str):
+        """Update job progress if job_manager is available."""
+        if self.job_manager:
+            self.job_manager.transition_to_state(
+                job_id=self.config.job_id,
+                new_status=status,
+                progress=progress,
+                message=message
+            )
+    async def run(self) -> OrchestratorResult:
+        """
+        Run the full video generation pipeline.
+        Returns:
+            OrchestratorResult with generated files and metadata
+        """
+        start_time = time.time()
+        try:
+            with job_span("orchestrator", self.config.job_id) as span:
+                self.job_log.info(f"Starting orchestrated video generation for {self.config.artist} - {self.config.title}")
+                # Stage 1: Packaging (CDG/TXT) - runs BEFORE encoding
+                # This depends on LRC file, not on encoded videos
+                if self.config.enable_cdg or self.config.enable_txt:
+                    await self._run_packaging()
+                # Stage 2: Encoding
+                await self._run_encoding()
+                # Stage 3: Organization (brand code)
+                await self._run_organization()
+                # Stage 4: Distribution (YouTube, Dropbox, GDrive)
+                await self._run_distribution()
+                # Stage 5: Notifications (Discord)
+                await self._run_notifications()
+                self.result.success = True
+                self.result.total_time_seconds = time.time() - start_time
+                self.job_log.info(f"Orchestrated video generation complete in {self.result.total_time_seconds:.1f}s")
+        except Exception as e:
+            self.result.success = False
+            self.result.error_message = str(e)
+            self.result.total_time_seconds = time.time() - start_time
+            self.job_log.error(f"Orchestrated video generation failed: {e}")
+            logger.error(f"[job:{self.config.job_id}] Orchestration failed: {e}")
+        return self.result
+    async def _run_packaging(self):
+        """Run the packaging stage (CDG/TXT generation)."""
+        self.job_log.info("Starting packaging stage (CDG/TXT)")
+        if not self.config.lrc_file_path or not os.path.isfile(self.config.lrc_file_path):
+            self.job_log.warning("No LRC file available, skipping CDG/TXT packaging")
+            return
+        base_name = f"{self.config.artist} - {self.config.title}"
+        packaging_service = self._get_packaging_service()
+        # Generate CDG package
+        if self.config.enable_cdg:
+            self.job_log.info("Generating CDG package")
+            try:
+                cdg_zip_path = os.path.join(
+                    self.config.output_dir,
+                    f"{base_name} (Final Karaoke CDG).zip"
+                )
+                mp3_path = os.path.join(
+                    self.config.output_dir,
+                    f"{base_name} (Karaoke).mp3"
+                )
+                cdg_path = os.path.join(
+                    self.config.output_dir,
+                    f"{base_name} (Karaoke).cdg"
+                )
+                zip_file, mp3_file, cdg_file = packaging_service.create_cdg_package(
+                    lrc_file=self.config.lrc_file_path,
+                    audio_file=self.config.instrumental_audio_path,
+                    output_zip_path=cdg_zip_path,
+                    artist=self.config.artist,
+                    title=self.config.title,
+                    output_mp3_path=mp3_path,
+                    output_cdg_path=cdg_path,
+                )
+                self.result.final_karaoke_cdg_zip = zip_file
+                self.job_log.info(f"CDG package created: {zip_file}")
+            except Exception as e:
+                self.job_log.error(f"CDG generation failed: {e}")
+                # Don't fail the pipeline, CDG is optional
+        # Generate TXT package
+        if self.config.enable_txt:
+            self.job_log.info("Generating TXT package")
+            try:
+                # TXT package needs MP3 file (from CDG generation or create it)
+                mp3_path = os.path.join(
+                    self.config.output_dir,
+                    f"{base_name} (Karaoke).mp3"
+                )
+                if not os.path.isfile(mp3_path):
+                    self.job_log.info("MP3 not found, CDG must be enabled first for TXT")
+                    return
+                txt_zip_path = os.path.join(
+                    self.config.output_dir,
+                    f"{base_name} (Final Karaoke TXT).zip"
+                )
+                zip_file, txt_file = packaging_service.create_txt_package(
+                    lrc_file=self.config.lrc_file_path,
+                    mp3_file=mp3_path,
+                    output_zip_path=txt_zip_path,
+                )
+                self.result.final_karaoke_txt_zip = zip_file
+                self.job_log.info(f"TXT package created: {zip_file}")
+            except Exception as e:
+                self.job_log.error(f"TXT generation failed: {e}")
+                # Don't fail the pipeline, TXT is optional
+    async def _run_encoding(self):
+        """Run the encoding stage."""
+        self.job_log.info("Starting encoding stage")
+        self._update_progress(JobStatus.ENCODING, 75, "Encoding videos")
+        encoding_backend = self._get_encoding_backend()
+        self.job_log.info(f"Using encoding backend: {encoding_backend.name}")
+        # Build encoding input
+        from backend.services.encoding_interface import EncodingInput
+        from backend.config import settings
+        # For GCE encoding, we need to provide GCS paths
+        gcs_bucket = settings.gcs_bucket_name
+        input_gcs_path = f"gs://{gcs_bucket}/jobs/{self.config.job_id}/"
+        output_gcs_path = f"gs://{gcs_bucket}/jobs/{self.config.job_id}/finals/"
+        encoding_input = EncodingInput(
+            title_video_path=self.config.title_video_path,
+            karaoke_video_path=self.config.karaoke_video_path,
+            instrumental_audio_path=self.config.instrumental_audio_path,
+            end_video_path=self.config.end_video_path,
+            artist=self.config.artist,
+            title=self.config.title,
+            brand_code=self.config.keep_brand_code,
+            output_dir=self.config.output_dir,
+            options={
+                "job_id": self.config.job_id,
+                "input_gcs_path": input_gcs_path,
+                "output_gcs_path": output_gcs_path,
+            },
+        )
+        # Run encoding
+        with job_span("encoding", self.config.job_id) as span:
+            add_span_event("encoding_started", {"backend": encoding_backend.name})
+            output = await encoding_backend.encode(encoding_input)
+            add_span_event("encoding_completed", {
+                "success": output.success,
+                "duration": output.encoding_time_seconds or 0
+            })
+        if not output.success:
+            raise Exception(f"Encoding failed: {output.error_message}")
+        # Store results - for GCE backend, these are GCS blob paths that need to be downloaded
+        self.result.final_video = output.lossless_4k_mp4_path
+        self.result.final_video_mkv = output.lossless_mkv_path
+        self.result.final_video_lossy = output.lossy_4k_mp4_path
+        self.result.final_video_720p = output.lossy_720p_mp4_path
+        self.result.encoding_time_seconds = output.encoding_time_seconds
+        # For GCE encoding, download the encoded files from GCS to local directory
+        # This is required for YouTube upload and other local file operations
+        if encoding_backend.name == "gce" and self.storage:
+            await self._download_gce_encoded_files(output)
+        self.job_log.info(f"Encoding complete ({encoding_backend.name}) in {output.encoding_time_seconds:.1f}s")
+    async def _download_gce_encoded_files(self, output):
+        """
+        Download GCE-encoded files from GCS to the local output directory.
+        GCE encoding stores files in GCS and returns blob paths like:
+        'jobs/{job_id}/finals/Artist - Title (Final Karaoke Lossless 4k).mp4'
+        This method downloads those files locally so that subsequent stages
+        (YouTube upload, etc.) can access them as local files.
+        Args:
+            output: EncodingOutput from the GCE backend with GCS blob paths
+        """
+        self.job_log.info("Downloading GCE-encoded files from GCS")
+        # Map of result attributes to download
+        file_mappings = [
+            ('lossless_4k_mp4_path', 'final_video'),
+            ('lossless_mkv_path', 'final_video_mkv'),
+            ('lossy_4k_mp4_path', 'final_video_lossy'),
+            ('lossy_720p_mp4_path', 'final_video_720p'),
+        ]
+        downloaded_count = 0
+        for output_attr, result_attr in file_mappings:
+            gcs_path = getattr(output, output_attr, None)
+            if not gcs_path:
+                continue
+            # Extract filename from GCS path
+            filename = os.path.basename(gcs_path)
+            local_path = os.path.join(self.config.output_dir, filename)
+            try:
+                self.job_log.info(f"Downloading {filename} from GCS")
+                self.storage.download_file(gcs_path, local_path)
+                # Update the result to point to local file
+                setattr(self.result, result_attr, local_path)
+                downloaded_count += 1
+                self.job_log.info(f"Downloaded {filename} to {local_path}")
+            except Exception as e:
+                self.job_log.error(f"Failed to download {filename}: {e}")
+                # Clear the result attribute so downstream doesn't try to use invalid GCS path
+                setattr(self.result, result_attr, None)
+                # Don't fail - some formats might not be generated
+        self.job_log.info(f"Downloaded {downloaded_count} encoded files from GCS")
+    async def _run_organization(self):
+        """Run the organization stage (brand code generation)."""
+        self.job_log.info("Starting organization stage")
+        # Use existing brand code if provided
+        if self.config.keep_brand_code:
+            self.result.brand_code = self.config.keep_brand_code
+            self.job_log.info(f"Using preserved brand code: {self.result.brand_code}")
+            return
+        # Generate brand code from Dropbox if configured
+        if self.config.dropbox_path and self.config.brand_prefix:
+            try:
+                from backend.services.dropbox_service import get_dropbox_service
+                dropbox = get_dropbox_service()
+                if dropbox.is_configured:
+                    brand_code = dropbox.get_next_brand_code(
+                        self.config.dropbox_path,
+                        self.config.brand_prefix
+                    )
+                    self.result.brand_code = brand_code
+                    self.job_log.info(f"Generated brand code: {brand_code}")
+                else:
+                    self.job_log.warning("Dropbox not configured, skipping brand code generation")
+            except Exception as e:
+                self.job_log.error(f"Brand code generation failed: {e}")
+                # Don't fail - brand code is optional
+    async def _run_distribution(self):
+        """Run the distribution stage (YouTube, Dropbox, GDrive uploads)."""
+        self.job_log.info("Starting distribution stage")
+        self._update_progress(JobStatus.PACKAGING, 90, "Uploading files")
+        # YouTube upload
+        if self.config.enable_youtube_upload and self.config.youtube_credentials:
+            await self._upload_to_youtube()
+        # Dropbox upload
+        if self.config.dropbox_path and self.config.brand_prefix:
+            await self._upload_to_dropbox()
+        # Google Drive upload
+        if self.config.gdrive_folder_id:
+            await self._upload_to_gdrive()
+    async def _upload_to_youtube(self):
+        """Upload video to YouTube."""
+        self.job_log.info("Uploading to YouTube")
+        # Find the best video file to upload (prefer MKV for FLAC audio, then lossless MP4)
+        video_to_upload = None
+        if self.result.final_video_mkv and os.path.isfile(self.result.final_video_mkv):
+            video_to_upload = self.result.final_video_mkv
+        elif self.result.final_video and os.path.isfile(self.result.final_video):
+            video_to_upload = self.result.final_video
+        elif self.result.final_video_lossy and os.path.isfile(self.result.final_video_lossy):
+            video_to_upload = self.result.final_video_lossy
+        if not video_to_upload:
+            self.job_log.warning("No video file available for YouTube upload")
+            return
+        try:
+            youtube_service = self._get_youtube_service()
+            # Build video title
+            title = f"{self.config.artist} - {self.config.title} (Karaoke)"
+            # Build description
+            description = self.config.youtube_description_template or ""
+            if self.result.brand_code:
+                description = f"{description}\n\nBrand Code: {self.result.brand_code}".strip()
+            # Upload
+            video_id, video_url = youtube_service.upload_video(
+                video_path=video_to_upload,
+                title=title,
+                description=description,
+                thumbnail_path=self.config.title_jpg_path,
+                tags=["karaoke", self.config.artist, self.config.title],
+                replace_existing=True,  # Server-side always replaces
+            )
+            if video_url:
+                self.result.youtube_url = video_url
+                self.job_log.info(f"Uploaded to YouTube: {video_url}")
+            else:
+                self.job_log.warning("YouTube upload did not return a URL")
+        except Exception as e:
+            self.job_log.error(f"YouTube upload failed: {e}")
+            # Don't fail the pipeline - YouTube is optional
+    async def _upload_to_dropbox(self):
+        """Upload files to Dropbox."""
+        self.job_log.info("Uploading to Dropbox")
+        try:
+            from backend.services.dropbox_service import get_dropbox_service
+            dropbox = get_dropbox_service()
+            if not dropbox.is_configured:
+                self.job_log.warning("Dropbox not configured, skipping upload")
+                return
+            # Sanitize artist/title to handle Unicode characters (curly quotes, em dashes, etc.)
+            safe_artist = sanitize_filename(self.config.artist) if self.config.artist else "Unknown"
+            safe_title = sanitize_filename(self.config.title) if self.config.title else "Unknown"
+            base_name = f"{safe_artist} - {safe_title}"
+            folder_name = f"{self.result.brand_code or 'TRACK-0000'} - {base_name}"
+            remote_folder = f"{self.config.dropbox_path}/{folder_name}"
+            # Upload entire output directory
+            dropbox.upload_folder(self.config.output_dir, remote_folder)
+            # Create sharing link
+            try:
+                sharing_link = dropbox.create_shared_link(remote_folder)
+                self.result.dropbox_link = sharing_link
+                self.job_log.info(f"Dropbox sharing link: {sharing_link}")
+            except Exception as e:
+                self.job_log.warning(f"Failed to create Dropbox sharing link: {e}")
+            self.job_log.info("Dropbox upload complete")
+        except Exception as e:
+            self.job_log.error(f"Dropbox upload failed: {e}")
+            # Don't fail the pipeline - Dropbox is optional
+    async def _upload_to_gdrive(self):
+        """Upload files to Google Drive."""
+        self.job_log.info("Uploading to Google Drive")
+        try:
+            from backend.services.gdrive_service import get_gdrive_service
+            gdrive = get_gdrive_service()
+            if not gdrive.is_configured:
+                self.job_log.warning("Google Drive not configured, skipping upload")
+                return
+            base_name = f"{self.config.artist} - {self.config.title}"
+            brand_code = self.result.brand_code or f"{self.config.brand_prefix or 'TRACK'}-0000"
+            # Map result files to expected keys
+            output_files = {
+                'final_karaoke_lossy_mp4': self.result.final_video_lossy,
+                'final_karaoke_lossy_720p_mp4': self.result.final_video_720p,
+                'final_karaoke_cdg_zip': self.result.final_karaoke_cdg_zip,
+            }
+            uploaded = gdrive.upload_to_public_share(
+                root_folder_id=self.config.gdrive_folder_id,
+                brand_code=brand_code,
+                base_name=base_name,
+                output_files=output_files,
+            )
+            self.result.gdrive_files = uploaded
+            self.job_log.info(f"Google Drive upload complete: {len(uploaded)} files")
+        except Exception as e:
+            self.job_log.error(f"Google Drive upload failed: {e}")
+            # Don't fail the pipeline - GDrive is optional
+    async def _run_notifications(self):
+        """Run the notifications stage (Discord)."""
+        self.job_log.info("Starting notifications stage")
+        if not self.config.discord_webhook_url:
+            self.job_log.debug("No Discord webhook configured, skipping notification")
+            return
+        if not self.result.youtube_url:
+            self.job_log.info("No YouTube URL available, skipping Discord notification")
+            return
+        try:
+            discord_service = self._get_discord_service()
+            discord_service.post_video_notification(self.result.youtube_url)
+            self.job_log.info("Discord notification sent")
+        except Exception as e:
+            self.job_log.error(f"Discord notification failed: {e}")
+            # Don't fail the pipeline - notifications are optional
+def create_orchestrator_config_from_job(
+    job,
+    temp_dir: str,
+    youtube_credentials: Optional[Dict[str, Any]] = None,
+    cdg_styles: Optional[Dict[str, Any]] = None,
+) -> OrchestratorConfig:
+    """
+    Create an OrchestratorConfig from a job object.
+    This is a helper function to bridge the existing job structure
+    with the new orchestrator configuration.
+    Args:
+        job: Job object from Firestore
+        temp_dir: Temporary directory with downloaded files
+        youtube_credentials: Pre-loaded YouTube credentials
+        cdg_styles: CDG style configuration
+    Returns:
+        OrchestratorConfig for the orchestrator
+    """
+    # Sanitize artist/title to handle Unicode characters (curly quotes, em dashes, etc.)
+    safe_artist = sanitize_filename(job.artist) if job.artist else "Unknown"
+    safe_title = sanitize_filename(job.title) if job.title else "Unknown"
+    base_name = f"{safe_artist} - {safe_title}"
+    # Determine instrumental file path
+    instrumental_selection = job.state_data.get('instrumental_selection', 'clean')
+    existing_instrumental = getattr(job, 'existing_instrumental_gcs_path', None)
+    if existing_instrumental:
+        ext = Path(existing_instrumental).suffix.lower()
+        instrumental_path = os.path.join(temp_dir, f"{base_name} (Instrumental User){ext}")
+    else:
+        instrumental_suffix = "Clean" if instrumental_selection == 'clean' else "Backing"
+        instrumental_path = os.path.join(temp_dir, f"{base_name} (Instrumental {instrumental_suffix}).flac")
+    return OrchestratorConfig(
+        job_id=job.job_id,
+        artist=job.artist,
+        title=job.title,
+        # Input files
+        title_video_path=os.path.join(temp_dir, f"{base_name} (Title).mov"),
+        karaoke_video_path=os.path.join(temp_dir, f"{base_name} (With Vocals).mov"),
+        instrumental_audio_path=instrumental_path,
+        end_video_path=os.path.join(temp_dir, f"{base_name} (End).mov"),
+        lrc_file_path=os.path.join(temp_dir, f"{base_name} (Karaoke).lrc"),
+        title_jpg_path=os.path.join(temp_dir, f"{base_name} (Title).jpg"),
+        # Output directory
+        output_dir=temp_dir,
+        # Feature flags
+        enable_cdg=getattr(job, 'enable_cdg', False),
+        enable_txt=getattr(job, 'enable_txt', False),
+        enable_youtube_upload=getattr(job, 'enable_youtube_upload', False),
+        # Service configurations
+        brand_prefix=getattr(job, 'brand_prefix', None),
+        discord_webhook_url=getattr(job, 'discord_webhook_url', None),
+        youtube_credentials=youtube_credentials,
+        youtube_description_template=getattr(job, 'youtube_description_template', None),
+        cdg_styles=cdg_styles,
+        # Dropbox/GDrive
+        dropbox_path=getattr(job, 'dropbox_path', None),
+        gdrive_folder_id=getattr(job, 'gdrive_folder_id', None),
+        # Keep existing brand code
+        keep_brand_code=getattr(job, 'keep_brand_code', None),
+        # Encoding backend - auto selects GCE if available
+        encoding_backend="auto",
+        # Server-side defaults
+        dry_run=False,
+        non_interactive=True,
+    )

karaoke-gen 0.90.1__py3-none-any.whl → 0.96.0__py3-none-any.whl

karaoke-gen 0.90.1py3-none-any.whl → 0.96.0py3-none-any.whl