PyPI - karaoke-gen - Versions diffs - 0.57.0__py3-none-any.whl → 0.71.27__py3-none-any.whl - Mend

karaoke-gen 0.57.0__py3-none-any.whl → 0.71.27__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (268) hide show

karaoke_gen/audio_fetcher.py +461 -0
karaoke_gen/audio_processor.py +407 -30
karaoke_gen/config.py +62 -113
karaoke_gen/file_handler.py +32 -59
karaoke_gen/karaoke_finalise/karaoke_finalise.py +148 -67
karaoke_gen/karaoke_gen.py +270 -61
karaoke_gen/lyrics_processor.py +13 -1
karaoke_gen/metadata.py +78 -73
karaoke_gen/pipeline/__init__.py +87 -0
karaoke_gen/pipeline/base.py +215 -0
karaoke_gen/pipeline/context.py +230 -0
karaoke_gen/pipeline/executors/__init__.py +21 -0
karaoke_gen/pipeline/executors/local.py +159 -0
karaoke_gen/pipeline/executors/remote.py +257 -0
karaoke_gen/pipeline/stages/__init__.py +27 -0
karaoke_gen/pipeline/stages/finalize.py +202 -0
karaoke_gen/pipeline/stages/render.py +165 -0
karaoke_gen/pipeline/stages/screens.py +139 -0
karaoke_gen/pipeline/stages/separation.py +191 -0
karaoke_gen/pipeline/stages/transcription.py +191 -0
karaoke_gen/style_loader.py +531 -0
karaoke_gen/utils/bulk_cli.py +6 -0
karaoke_gen/utils/cli_args.py +424 -0
karaoke_gen/utils/gen_cli.py +26 -261
karaoke_gen/utils/remote_cli.py +1965 -0
karaoke_gen/video_background_processor.py +351 -0
karaoke_gen-0.71.27.dist-info/METADATA +610 -0
karaoke_gen-0.71.27.dist-info/RECORD +275 -0
{karaoke_gen-0.57.0.dist-info → karaoke_gen-0.71.27.dist-info}/WHEEL +1 -1
{karaoke_gen-0.57.0.dist-info → karaoke_gen-0.71.27.dist-info}/entry_points.txt +1 -0
lyrics_transcriber/__init__.py +10 -0
lyrics_transcriber/cli/__init__.py +0 -0
lyrics_transcriber/cli/cli_main.py +285 -0
lyrics_transcriber/core/__init__.py +0 -0
lyrics_transcriber/core/config.py +50 -0
lyrics_transcriber/core/controller.py +520 -0
lyrics_transcriber/correction/__init__.py +0 -0
lyrics_transcriber/correction/agentic/__init__.py +9 -0
lyrics_transcriber/correction/agentic/adapter.py +71 -0
lyrics_transcriber/correction/agentic/agent.py +313 -0
lyrics_transcriber/correction/agentic/feedback/aggregator.py +12 -0
lyrics_transcriber/correction/agentic/feedback/collector.py +17 -0
lyrics_transcriber/correction/agentic/feedback/retention.py +24 -0
lyrics_transcriber/correction/agentic/feedback/store.py +76 -0
lyrics_transcriber/correction/agentic/handlers/__init__.py +24 -0
lyrics_transcriber/correction/agentic/handlers/ambiguous.py +44 -0
lyrics_transcriber/correction/agentic/handlers/background_vocals.py +68 -0
lyrics_transcriber/correction/agentic/handlers/base.py +51 -0
lyrics_transcriber/correction/agentic/handlers/complex_multi_error.py +46 -0
lyrics_transcriber/correction/agentic/handlers/extra_words.py +74 -0
lyrics_transcriber/correction/agentic/handlers/no_error.py +42 -0
lyrics_transcriber/correction/agentic/handlers/punctuation.py +44 -0
lyrics_transcriber/correction/agentic/handlers/registry.py +60 -0
lyrics_transcriber/correction/agentic/handlers/repeated_section.py +44 -0
lyrics_transcriber/correction/agentic/handlers/sound_alike.py +126 -0
lyrics_transcriber/correction/agentic/models/__init__.py +5 -0
lyrics_transcriber/correction/agentic/models/ai_correction.py +31 -0
lyrics_transcriber/correction/agentic/models/correction_session.py +30 -0
lyrics_transcriber/correction/agentic/models/enums.py +38 -0
lyrics_transcriber/correction/agentic/models/human_feedback.py +30 -0
lyrics_transcriber/correction/agentic/models/learning_data.py +26 -0
lyrics_transcriber/correction/agentic/models/observability_metrics.py +28 -0
lyrics_transcriber/correction/agentic/models/schemas.py +46 -0
lyrics_transcriber/correction/agentic/models/utils.py +19 -0
lyrics_transcriber/correction/agentic/observability/__init__.py +5 -0
lyrics_transcriber/correction/agentic/observability/langfuse_integration.py +35 -0
lyrics_transcriber/correction/agentic/observability/metrics.py +46 -0
lyrics_transcriber/correction/agentic/observability/performance.py +19 -0
lyrics_transcriber/correction/agentic/prompts/__init__.py +2 -0
lyrics_transcriber/correction/agentic/prompts/classifier.py +227 -0
lyrics_transcriber/correction/agentic/providers/__init__.py +6 -0
lyrics_transcriber/correction/agentic/providers/base.py +36 -0
lyrics_transcriber/correction/agentic/providers/circuit_breaker.py +145 -0
lyrics_transcriber/correction/agentic/providers/config.py +73 -0
lyrics_transcriber/correction/agentic/providers/constants.py +24 -0
lyrics_transcriber/correction/agentic/providers/health.py +28 -0
lyrics_transcriber/correction/agentic/providers/langchain_bridge.py +212 -0
lyrics_transcriber/correction/agentic/providers/model_factory.py +209 -0
lyrics_transcriber/correction/agentic/providers/response_cache.py +218 -0
lyrics_transcriber/correction/agentic/providers/response_parser.py +111 -0
lyrics_transcriber/correction/agentic/providers/retry_executor.py +127 -0
lyrics_transcriber/correction/agentic/router.py +35 -0
lyrics_transcriber/correction/agentic/workflows/__init__.py +5 -0
lyrics_transcriber/correction/agentic/workflows/consensus_workflow.py +24 -0
lyrics_transcriber/correction/agentic/workflows/correction_graph.py +59 -0
lyrics_transcriber/correction/agentic/workflows/feedback_workflow.py +24 -0
lyrics_transcriber/correction/anchor_sequence.py +1043 -0
lyrics_transcriber/correction/corrector.py +760 -0
lyrics_transcriber/correction/feedback/__init__.py +2 -0
lyrics_transcriber/correction/feedback/schemas.py +107 -0
lyrics_transcriber/correction/feedback/store.py +236 -0
lyrics_transcriber/correction/handlers/__init__.py +0 -0
lyrics_transcriber/correction/handlers/base.py +52 -0
lyrics_transcriber/correction/handlers/extend_anchor.py +149 -0
lyrics_transcriber/correction/handlers/levenshtein.py +189 -0
lyrics_transcriber/correction/handlers/llm.py +293 -0
lyrics_transcriber/correction/handlers/llm_providers.py +60 -0
lyrics_transcriber/correction/handlers/no_space_punct_match.py +154 -0
lyrics_transcriber/correction/handlers/relaxed_word_count_match.py +85 -0
lyrics_transcriber/correction/handlers/repeat.py +88 -0
lyrics_transcriber/correction/handlers/sound_alike.py +259 -0
lyrics_transcriber/correction/handlers/syllables_match.py +252 -0
lyrics_transcriber/correction/handlers/word_count_match.py +80 -0
lyrics_transcriber/correction/handlers/word_operations.py +187 -0
lyrics_transcriber/correction/operations.py +352 -0
lyrics_transcriber/correction/phrase_analyzer.py +435 -0
lyrics_transcriber/correction/text_utils.py +30 -0
lyrics_transcriber/frontend/.gitignore +23 -0
lyrics_transcriber/frontend/.yarn/releases/yarn-4.7.0.cjs +935 -0
lyrics_transcriber/frontend/.yarnrc.yml +3 -0
lyrics_transcriber/frontend/README.md +50 -0
lyrics_transcriber/frontend/REPLACE_ALL_FUNCTIONALITY.md +210 -0
lyrics_transcriber/frontend/__init__.py +25 -0
lyrics_transcriber/frontend/eslint.config.js +28 -0
lyrics_transcriber/frontend/index.html +18 -0
lyrics_transcriber/frontend/package.json +42 -0
lyrics_transcriber/frontend/public/android-chrome-192x192.png +0 -0
lyrics_transcriber/frontend/public/android-chrome-512x512.png +0 -0
lyrics_transcriber/frontend/public/apple-touch-icon.png +0 -0
lyrics_transcriber/frontend/public/favicon-16x16.png +0 -0
lyrics_transcriber/frontend/public/favicon-32x32.png +0 -0
lyrics_transcriber/frontend/public/favicon.ico +0 -0
lyrics_transcriber/frontend/public/nomad-karaoke-logo.png +0 -0
lyrics_transcriber/frontend/src/App.tsx +212 -0
lyrics_transcriber/frontend/src/api.ts +239 -0
lyrics_transcriber/frontend/src/components/AIFeedbackModal.tsx +77 -0
lyrics_transcriber/frontend/src/components/AddLyricsModal.tsx +114 -0
lyrics_transcriber/frontend/src/components/AgenticCorrectionMetrics.tsx +204 -0
lyrics_transcriber/frontend/src/components/AudioPlayer.tsx +180 -0
lyrics_transcriber/frontend/src/components/CorrectedWordWithActions.tsx +167 -0
lyrics_transcriber/frontend/src/components/CorrectionAnnotationModal.tsx +359 -0
lyrics_transcriber/frontend/src/components/CorrectionDetailCard.tsx +281 -0
lyrics_transcriber/frontend/src/components/CorrectionMetrics.tsx +162 -0
lyrics_transcriber/frontend/src/components/DurationTimelineView.tsx +257 -0
lyrics_transcriber/frontend/src/components/EditActionBar.tsx +68 -0
lyrics_transcriber/frontend/src/components/EditModal.tsx +702 -0
lyrics_transcriber/frontend/src/components/EditTimelineSection.tsx +496 -0
lyrics_transcriber/frontend/src/components/EditWordList.tsx +379 -0
lyrics_transcriber/frontend/src/components/FileUpload.tsx +77 -0
lyrics_transcriber/frontend/src/components/FindReplaceModal.tsx +467 -0
lyrics_transcriber/frontend/src/components/Header.tsx +387 -0
lyrics_transcriber/frontend/src/components/LyricsAnalyzer.tsx +1373 -0
lyrics_transcriber/frontend/src/components/MetricsDashboard.tsx +51 -0
lyrics_transcriber/frontend/src/components/ModeSelector.tsx +67 -0
lyrics_transcriber/frontend/src/components/ModelSelector.tsx +23 -0
lyrics_transcriber/frontend/src/components/PreviewVideoSection.tsx +144 -0
lyrics_transcriber/frontend/src/components/ReferenceView.tsx +268 -0
lyrics_transcriber/frontend/src/components/ReplaceAllLyricsModal.tsx +688 -0
lyrics_transcriber/frontend/src/components/ReviewChangesModal.tsx +354 -0
lyrics_transcriber/frontend/src/components/SegmentDetailsModal.tsx +64 -0
lyrics_transcriber/frontend/src/components/TimelineEditor.tsx +376 -0
lyrics_transcriber/frontend/src/components/TimingOffsetModal.tsx +131 -0
lyrics_transcriber/frontend/src/components/TranscriptionView.tsx +256 -0
lyrics_transcriber/frontend/src/components/WordDivider.tsx +187 -0
lyrics_transcriber/frontend/src/components/shared/components/HighlightedText.tsx +379 -0
lyrics_transcriber/frontend/src/components/shared/components/SourceSelector.tsx +56 -0
lyrics_transcriber/frontend/src/components/shared/components/Word.tsx +87 -0
lyrics_transcriber/frontend/src/components/shared/constants.ts +20 -0
lyrics_transcriber/frontend/src/components/shared/hooks/useWordClick.ts +180 -0
lyrics_transcriber/frontend/src/components/shared/styles.ts +13 -0
lyrics_transcriber/frontend/src/components/shared/types.js +2 -0
lyrics_transcriber/frontend/src/components/shared/types.ts +129 -0
lyrics_transcriber/frontend/src/components/shared/utils/keyboardHandlers.ts +177 -0
lyrics_transcriber/frontend/src/components/shared/utils/localStorage.ts +78 -0
lyrics_transcriber/frontend/src/components/shared/utils/referenceLineCalculator.ts +75 -0
lyrics_transcriber/frontend/src/components/shared/utils/segmentOperations.ts +360 -0
lyrics_transcriber/frontend/src/components/shared/utils/timingUtils.ts +110 -0
lyrics_transcriber/frontend/src/components/shared/utils/wordUtils.ts +22 -0
lyrics_transcriber/frontend/src/hooks/useManualSync.ts +435 -0
lyrics_transcriber/frontend/src/main.tsx +17 -0
lyrics_transcriber/frontend/src/theme.ts +177 -0
lyrics_transcriber/frontend/src/types/global.d.ts +9 -0
lyrics_transcriber/frontend/src/types.js +2 -0
lyrics_transcriber/frontend/src/types.ts +199 -0
lyrics_transcriber/frontend/src/validation.ts +132 -0
lyrics_transcriber/frontend/src/vite-env.d.ts +1 -0
lyrics_transcriber/frontend/tsconfig.app.json +26 -0
lyrics_transcriber/frontend/tsconfig.json +25 -0
lyrics_transcriber/frontend/tsconfig.node.json +23 -0
lyrics_transcriber/frontend/tsconfig.tsbuildinfo +1 -0
lyrics_transcriber/frontend/update_version.js +11 -0
lyrics_transcriber/frontend/vite.config.d.ts +2 -0
lyrics_transcriber/frontend/vite.config.js +10 -0
lyrics_transcriber/frontend/vite.config.ts +11 -0
lyrics_transcriber/frontend/web_assets/android-chrome-192x192.png +0 -0
lyrics_transcriber/frontend/web_assets/android-chrome-512x512.png +0 -0
lyrics_transcriber/frontend/web_assets/apple-touch-icon.png +0 -0
lyrics_transcriber/frontend/web_assets/assets/index-DdJTDWH3.js +42039 -0
lyrics_transcriber/frontend/web_assets/assets/index-DdJTDWH3.js.map +1 -0
lyrics_transcriber/frontend/web_assets/favicon-16x16.png +0 -0
lyrics_transcriber/frontend/web_assets/favicon-32x32.png +0 -0
lyrics_transcriber/frontend/web_assets/favicon.ico +0 -0
lyrics_transcriber/frontend/web_assets/index.html +18 -0
lyrics_transcriber/frontend/web_assets/nomad-karaoke-logo.png +0 -0
lyrics_transcriber/frontend/yarn.lock +3752 -0
lyrics_transcriber/lyrics/__init__.py +0 -0
lyrics_transcriber/lyrics/base_lyrics_provider.py +211 -0
lyrics_transcriber/lyrics/file_provider.py +95 -0
lyrics_transcriber/lyrics/genius.py +384 -0
lyrics_transcriber/lyrics/lrclib.py +231 -0
lyrics_transcriber/lyrics/musixmatch.py +156 -0
lyrics_transcriber/lyrics/spotify.py +290 -0
lyrics_transcriber/lyrics/user_input_provider.py +44 -0
lyrics_transcriber/output/__init__.py +0 -0
lyrics_transcriber/output/ass/__init__.py +21 -0
lyrics_transcriber/output/ass/ass.py +2088 -0
lyrics_transcriber/output/ass/ass_specs.txt +732 -0
lyrics_transcriber/output/ass/config.py +180 -0
lyrics_transcriber/output/ass/constants.py +23 -0
lyrics_transcriber/output/ass/event.py +94 -0
lyrics_transcriber/output/ass/formatters.py +132 -0
lyrics_transcriber/output/ass/lyrics_line.py +265 -0
lyrics_transcriber/output/ass/lyrics_screen.py +252 -0
lyrics_transcriber/output/ass/section_detector.py +89 -0
lyrics_transcriber/output/ass/section_screen.py +106 -0
lyrics_transcriber/output/ass/style.py +187 -0
lyrics_transcriber/output/cdg.py +619 -0
lyrics_transcriber/output/cdgmaker/__init__.py +0 -0
lyrics_transcriber/output/cdgmaker/cdg.py +262 -0
lyrics_transcriber/output/cdgmaker/composer.py +2260 -0
lyrics_transcriber/output/cdgmaker/config.py +151 -0
lyrics_transcriber/output/cdgmaker/images/instrumental.png +0 -0
lyrics_transcriber/output/cdgmaker/images/intro.png +0 -0
lyrics_transcriber/output/cdgmaker/pack.py +507 -0
lyrics_transcriber/output/cdgmaker/render.py +346 -0
lyrics_transcriber/output/cdgmaker/transitions/centertexttoplogobottomtext.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/circlein.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/circleout.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/fizzle.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/largecentertexttoplogo.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/rectangle.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/spiral.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/topleftmusicalnotes.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/wipein.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/wipeleft.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/wipeout.png +0 -0
lyrics_transcriber/output/cdgmaker/transitions/wiperight.png +0 -0
lyrics_transcriber/output/cdgmaker/utils.py +132 -0
lyrics_transcriber/output/countdown_processor.py +267 -0
lyrics_transcriber/output/fonts/AvenirNext-Bold.ttf +0 -0
lyrics_transcriber/output/fonts/DMSans-VariableFont_opsz,wght.ttf +0 -0
lyrics_transcriber/output/fonts/DMSerifDisplay-Regular.ttf +0 -0
lyrics_transcriber/output/fonts/Oswald-SemiBold.ttf +0 -0
lyrics_transcriber/output/fonts/Zurich_Cn_BT_Bold.ttf +0 -0
lyrics_transcriber/output/fonts/arial.ttf +0 -0
lyrics_transcriber/output/fonts/georgia.ttf +0 -0
lyrics_transcriber/output/fonts/verdana.ttf +0 -0
lyrics_transcriber/output/generator.py +257 -0
lyrics_transcriber/output/lrc_to_cdg.py +61 -0
lyrics_transcriber/output/lyrics_file.py +102 -0
lyrics_transcriber/output/plain_text.py +96 -0
lyrics_transcriber/output/segment_resizer.py +431 -0
lyrics_transcriber/output/subtitles.py +397 -0
lyrics_transcriber/output/video.py +544 -0
lyrics_transcriber/review/__init__.py +0 -0
lyrics_transcriber/review/server.py +676 -0
lyrics_transcriber/storage/__init__.py +0 -0
lyrics_transcriber/storage/dropbox.py +225 -0
lyrics_transcriber/transcribers/__init__.py +0 -0
lyrics_transcriber/transcribers/audioshake.py +290 -0
lyrics_transcriber/transcribers/base_transcriber.py +157 -0
lyrics_transcriber/transcribers/whisper.py +330 -0
lyrics_transcriber/types.py +648 -0
lyrics_transcriber/utils/__init__.py +0 -0
lyrics_transcriber/utils/word_utils.py +27 -0
karaoke_gen-0.57.0.dist-info/METADATA +0 -167
karaoke_gen-0.57.0.dist-info/RECORD +0 -23
{karaoke_gen-0.57.0.dist-info → karaoke_gen-0.71.27.dist-info/licenses}/LICENSE +0 -0

karaoke_gen/style_loader.py ADDED Viewed

@@ -0,0 +1,531 @@
+"""
+Unified style loading and configuration module.
+This module provides a single source of truth for:
+- Default style configurations (intro, karaoke, end, cdg)
+- Asset key mappings (GCS asset keys -> style JSON paths)
+- Style loading from local files
+- Style loading from GCS with asset path updates
+Used by both the local CLI (karaoke-gen) and the cloud backend workers.
+"""
+import json
+import logging
+import os
+from pathlib import Path
+from typing import Any, Callable, Dict, List, Optional, Tuple, Union
+logger = logging.getLogger(__name__)
+# =============================================================================
+# DEFAULT STYLE CONFIGURATIONS
+# =============================================================================
+# Baseline settings for the intro (title) screen. get_intro_format() copies this
+# dict and overlays the "intro" section of a loaded style file on top of it.
+DEFAULT_INTRO_STYLE = {
+    "video_duration": 5,  # get_video_durations() documents this value as seconds
+    "existing_image": None,  # read back by get_existing_images() as the title image
+    "background_color": "#000000",
+    "background_image": None,  # overwritten by update_asset_paths() for intro background assets
+    "font": "Montserrat-Bold.ttf",  # overwritten by update_asset_paths() for font assets
+    "artist_color": "#ffdf6b",
+    "artist_gradient": None,
+    "artist_text_transform": None,
+    "title_color": "#ffffff",
+    "title_gradient": None,
+    "title_text_transform": None,
+    # NOTE(review): the region strings look like "x, y, width, height" — confirm against the renderer.
+    "title_region": "370, 200, 3100, 480",
+    "artist_region": "370, 700, 3100, 480",
+    "extra_text": None,
+    "extra_text_color": "#ffffff",
+    "extra_text_gradient": None,
+    "extra_text_region": "370, 1200, 3100, 480",
+    "extra_text_text_transform": None,
+}
+# Baseline settings for the end screen. get_end_format() copies this dict and
+# overlays the "end" section of a loaded style file on top of it.
+# Same keys as DEFAULT_INTRO_STYLE; the values differ only in the three *_region
+# entries (None here), extra_text and extra_text_color.
+DEFAULT_END_STYLE = {
+    "video_duration": 5,  # get_video_durations() documents this value as seconds
+    "existing_image": None,  # read back by get_existing_images() as the end image
+    "background_color": "#000000",
+    "background_image": None,  # overwritten by update_asset_paths() for end background assets
+    "font": "Montserrat-Bold.ttf",  # overwritten by update_asset_paths() for font assets
+    "artist_color": "#ffdf6b",
+    "artist_gradient": None,
+    "artist_text_transform": None,
+    "title_color": "#ffffff",
+    "title_gradient": None,
+    "title_text_transform": None,
+    "title_region": None,
+    "artist_region": None,
+    "extra_text": "THANK YOU FOR SINGING!",
+    "extra_text_color": "#ff7acc",
+    "extra_text_gradient": None,
+    "extra_text_region": None,
+    "extra_text_text_transform": None,
+}
+# Baseline settings for the karaoke (lyrics) video. get_karaoke_format() copies
+# this dict and overlays the "karaoke" section of a loaded style file on top of it;
+# get_minimal_karaoke_styles() and get_default_style_params() return copies of it.
+DEFAULT_KARAOKE_STYLE = {
+    # Video background
+    "background_color": "#000000",
+    "background_image": None,  # overwritten by update_asset_paths() for karaoke background assets
+    # Font settings
+    "font": "Arial",
+    "font_path": "",  # Must be string, not None (for ASS generator)
+    "ass_name": "Default",
+    # Colors in "R, G, B, A" format (required by ASS)
+    "primary_color": "112, 112, 247, 255",
+    "secondary_color": "255, 255, 255, 255",
+    "outline_color": "26, 58, 235, 255",
+    "back_color": "0, 0, 0, 0",
+    # Boolean style options
+    # (apply_style_overrides() parses overrides for bool-valued keys from words such as "true"/"yes")
+    "bold": False,
+    "italic": False,
+    "underline": False,
+    "strike_out": False,
+    # Numeric style options (all required for ASS)
+    # (apply_style_overrides() casts overrides to the type of the value stored here, e.g. int or float)
+    "scale_x": 100,
+    "scale_y": 100,
+    "spacing": 0,
+    "angle": 0.0,
+    "border_style": 1,
+    "outline": 1,
+    "shadow": 0,
+    "margin_l": 0,
+    "margin_r": 0,
+    "margin_v": 0,
+    "encoding": 0,
+    # Layout settings
+    "max_line_length": 40,
+    "top_padding": 200,
+    "font_size": 100,
+}
+# Baseline CDG settings. Every entry defaults to None; update_asset_paths() fills
+# them in when matching font / CDG background assets are supplied.
+DEFAULT_CDG_STYLE = {
+    "font_path": None,
+    "instrumental_background": None,
+    "title_screen_background": None,
+    "outro_background": None,
+}
+# Combined defaults for convenience
+# Each section is a shallow copy taken once at import time. Note that
+# get_default_style_params() builds its result from the per-section constants
+# above, not from this dict.
+DEFAULT_STYLE_PARAMS = {
+    "intro": DEFAULT_INTRO_STYLE.copy(),
+    "end": DEFAULT_END_STYLE.copy(),
+    "karaoke": DEFAULT_KARAOKE_STYLE.copy(),
+    "cdg": DEFAULT_CDG_STYLE.copy(),
+}
+# =============================================================================
+# ASSET KEY MAPPINGS
+# =============================================================================
+# Maps GCS/upload asset keys to (section, field) paths in the style JSON.
+# Some assets map to multiple fields (e.g., font applies to intro, karaoke, end).
+# A value is either one (section, field) tuple or a list of such tuples;
+# update_asset_paths() wraps a bare tuple into a one-element list before iterating.
+# Every "style_*" key maps to the same target(s) as its unprefixed counterpart.
+ASSET_KEY_MAPPINGS: Dict[str, Union[Tuple[str, str], List[Tuple[str, str]]]] = {
+    # Background images - each maps to one section
+    "intro_background": ("intro", "background_image"),
+    "style_intro_background": ("intro", "background_image"),  # CLI upload key
+    "karaoke_background": ("karaoke", "background_image"),
+    "style_karaoke_background": ("karaoke", "background_image"),  # CLI upload key
+    "end_background": ("end", "background_image"),
+    "style_end_background": ("end", "background_image"),  # CLI upload key
+    # Font - maps to multiple sections
+    # (the field is "font" for intro/end but "font_path" for karaoke/cdg)
+    "font": [
+        ("intro", "font"),
+        ("karaoke", "font_path"),
+        ("end", "font"),
+        ("cdg", "font_path"),
+    ],
+    "style_font": [  # CLI upload key
+        ("intro", "font"),
+        ("karaoke", "font_path"),
+        ("end", "font"),
+        ("cdg", "font_path"),
+    ],
+    # CDG-specific backgrounds
+    # (the "cdg_title_background" keys target the "title_screen_background" field)
+    "cdg_instrumental_background": ("cdg", "instrumental_background"),
+    "style_cdg_instrumental_background": ("cdg", "instrumental_background"),
+    "cdg_title_background": ("cdg", "title_screen_background"),
+    "style_cdg_title_background": ("cdg", "title_screen_background"),
+    "cdg_outro_background": ("cdg", "outro_background"),
+    "style_cdg_outro_background": ("cdg", "outro_background"),
+}
+# =============================================================================
+# STYLE LOADING FUNCTIONS
+# =============================================================================
+def load_style_params_from_file(
+    style_json_path: Optional[str],
+    logger: Optional[logging.Logger] = None,
+    exit_on_error: bool = True,
+) -> Dict[str, Any]:
+    """
+    Load style parameters from a local JSON file.
+    The file content is returned exactly as parsed; it is NOT merged with the
+    defaults here (the get_*_format helpers do that per section).
+    Args:
+        style_json_path: Path to the style JSON file. None or an empty string
+                         selects the built-in defaults.
+        logger: Optional logger for messages; falls back to this module's logger.
+        exit_on_error: If True, calls sys.exit(1) on any load error.
+                       If False, re-raises the original exception instead.
+    Returns:
+        Dictionary of style parameters (loaded or defaults).
+    Raises:
+        FileNotFoundError: If file not found and exit_on_error=False.
+        json.JSONDecodeError: If invalid JSON and exit_on_error=False.
+        Exception: Any other load error (e.g. permissions, undecodable bytes)
+                   when exit_on_error=False.
+        SystemExit: On any of the above when exit_on_error=True.
+    """
+    import sys
+    log = logger or logging.getLogger(__name__)
+    if not style_json_path:
+        log.info("No style parameters JSON file provided. Using default styles.")
+        return get_default_style_params()
+    try:
+        # JSON text is UTF-8; do not depend on the platform's locale encoding,
+        # which would mis-decode non-ASCII text (e.g. extra_text) on some systems.
+        with open(style_json_path, "r", encoding="utf-8") as f:
+            style_params = json.load(f)
+    except FileNotFoundError:
+        log.error(f"Style parameters configuration file not found: {style_json_path}")
+        if exit_on_error:
+            sys.exit(1)
+        raise
+    except json.JSONDecodeError as e:
+        log.error(f"Invalid JSON in style parameters configuration file: {e}")
+        if exit_on_error:
+            sys.exit(1)
+        raise
+    except Exception as e:
+        # Boundary handler: report anything else (permissions, decoding, ...) the same way.
+        log.error(f"Error loading style parameters file {style_json_path}: {e}")
+        if exit_on_error:
+            sys.exit(1)
+        raise
+    log.info(f"Loaded style parameters from {style_json_path}")
+    return style_params
+def apply_style_overrides(
+    style_params: Dict[str, Any],
+    overrides: Dict[str, str],
+    logger: Optional[logging.Logger] = None,
+) -> None:
+    """
+    Apply dotted-key overrides to nested style parameters (in place).
+    Each override key is split on '.'; all parts but the last are walked as
+    nested dicts and the last part names the entry to replace. Only entries
+    that already exist are overridden; anything else is logged and skipped.
+    The new value is cast to the type of the existing value: bools are parsed
+    from the words 'true', '1', 't', 'y', 'yes' (case-insensitive), None-valued
+    entries take the override unchanged, and a failed cast keeps the raw value.
+    Args:
+        style_params: Style parameters dict to modify.
+        overrides: Dict of "section.key" -> value overrides.
+        logger: Optional logger for messages.
+    """
+    log = logger or logging.getLogger(__name__)
+    for dotted_key, raw_value in overrides.items():
+        *parent_parts, leaf = dotted_key.split('.')
+        # Walk down to the dict that should hold the leaf entry.
+        node = style_params
+        for part in parent_parts:
+            if part not in node or not isinstance(node[part], dict):
+                log.warning(
+                    f"Override key part '{part}' not found or not a dictionary for key '{dotted_key}'."
+                )
+                break
+            node = node[part]
+        else:
+            if leaf not in node:
+                log.warning(f"Override key '{dotted_key}' not found in style parameters.")
+                continue
+            existing = node[leaf]
+            new_value = raw_value
+            # Cast to original type if possible
+            try:
+                existing_type = type(existing)
+                if existing_type is bool:
+                    new_value = str(raw_value).lower() in ('true', '1', 't', 'y', 'yes')
+                elif existing is not None:
+                    new_value = existing_type(raw_value)
+            except (ValueError, TypeError) as e:
+                log.warning(
+                    f"Could not cast override value '{raw_value}' for key '{dotted_key}' "
+                    f"to original type. Using as string. Error: {e}"
+                )
+            node[leaf] = new_value
+            log.info(f"Overrode style: {dotted_key} = {new_value}")
+def update_asset_paths(
+    style_data: Dict[str, Any],
+    local_assets: Dict[str, str],
+    logger: Optional[logging.Logger] = None,
+) -> bool:
+    """
+    Rewrite asset fields in the style data so they reference local files.
+    For every asset key that appears in ASSET_KEY_MAPPINGS, the mapped
+    (section, field) entries are set to the asset's local path. Asset keys
+    without a mapping are ignored, as are sections that are absent from
+    style_data or are not dicts.
+    Args:
+        style_data: Style parameters dict to modify (in place).
+        local_assets: Dict mapping asset keys to local file paths.
+        logger: Optional logger for messages.
+    Returns:
+        True if any paths were updated, False otherwise.
+    """
+    log = logger or logging.getLogger(__name__)
+    changed = False
+    for asset_key, local_path in local_assets.items():
+        if asset_key not in ASSET_KEY_MAPPINGS:
+            continue
+        entry = ASSET_KEY_MAPPINGS[asset_key]
+        # A single (section, field) tuple is treated as a one-element list.
+        targets = [entry] if isinstance(entry, tuple) else entry
+        for section, field in targets:
+            if section not in style_data or not isinstance(style_data[section], dict):
+                continue
+            section_values = style_data[section]
+            previous = section_values.get(field, 'NOT SET')
+            section_values[field] = local_path
+            log.info(f"Updated {section}.{field}: {previous} -> {local_path}")
+            changed = True
+    return changed
+def save_style_params(
+    style_data: Dict[str, Any],
+    output_path: str,
+    logger: Optional[logging.Logger] = None,
+) -> str:
+    """
+    Write style parameters to a JSON file (2-space indented).
+    An existing file at output_path is overwritten.
+    Args:
+        style_data: Style parameters dict to save.
+        output_path: Path to save the JSON file.
+        logger: Optional logger for messages.
+    Returns:
+        The output path, unchanged.
+    """
+    log = logger if logger else logging.getLogger(__name__)
+    with open(output_path, 'w') as out_file:
+        json.dump(style_data, out_file, indent=2)
+    log.info(f"Saved style parameters to: {output_path}")
+    return output_path
+# =============================================================================
+# GCS STYLE LOADING (for backend workers)
+# =============================================================================
+def _download_style_assets(
+    style_assets: Optional[Dict[str, str]],
+    style_dir: str,
+    download_func: Callable[[str, str], None],
+    log: logging.Logger,
+) -> Dict[str, str]:
+    """Download each style asset into style_dir; return asset_key -> local path for the successes."""
+    local_assets: Dict[str, str] = {}
+    if not style_assets:
+        return local_assets
+    log.info(f"Downloading {len(style_assets)} style assets...")
+    for asset_key, gcs_path in style_assets.items():
+        if asset_key == 'style_params':
+            continue  # Already downloaded
+        try:
+            # Keep the remote file's extension; fall back to '.png' when it has none.
+            ext = os.path.splitext(gcs_path)[1] or '.png'
+            local_path = os.path.join(style_dir, f"{asset_key}{ext}")
+            download_func(gcs_path, local_path)
+            local_assets[asset_key] = local_path
+            log.info(f"  Downloaded {asset_key}: {local_path}")
+        except Exception as e:
+            # Best effort: one failed asset must not abort the remaining downloads.
+            log.warning(f"  Failed to download {asset_key}: {e}")
+    return local_assets
+def load_styles_from_gcs(
+    style_params_gcs_path: Optional[str],
+    style_assets: Optional[Dict[str, str]],
+    temp_dir: str,
+    download_func: Callable[[str, str], None],
+    logger: Optional[logging.Logger] = None,
+) -> Tuple[str, Dict[str, Any]]:
+    """
+    Download and process style configuration from GCS.
+    This is the main entry point for backend workers to load styles.
+    It handles:
+    1. Downloading style_params.json from GCS into <temp_dir>/style/styles.json
+    2. Downloading all style assets (backgrounds, fonts) next to it
+    3. Updating paths in the style JSON to point to local files
+    4. Saving the updated JSON (only when at least one path changed)
+    Any failure while downloading or parsing the style JSON is logged as a
+    warning and the minimal default styles are written and returned instead;
+    a failure of an individual asset download only skips that asset.
+    Args:
+        style_params_gcs_path: GCS path to style_params.json, or None.
+        style_assets: Dict of asset_key -> GCS path for style assets.
+        temp_dir: Temporary directory for downloaded files.
+        download_func: Function(gcs_path, local_path) to download files.
+        logger: Optional logger for messages.
+    Returns:
+        Tuple of (local_styles_path, style_data_dict).
+        If no custom styles, returns (minimal_styles_path, minimal_styles_dict).
+    """
+    log = logger or logging.getLogger(__name__)
+    style_dir = os.path.join(temp_dir, "style")
+    os.makedirs(style_dir, exist_ok=True)
+    styles_path = os.path.join(style_dir, "styles.json")
+    if not style_params_gcs_path:
+        log.info("No custom style_params_gcs_path found, using minimal/default styles")
+        minimal_styles = get_minimal_karaoke_styles()
+        save_style_params(minimal_styles, styles_path, log)
+        return styles_path, minimal_styles
+    try:
+        log.info(f"Downloading custom styles from {style_params_gcs_path}")
+        download_func(style_params_gcs_path, styles_path)
+        # JSON text is UTF-8; do not depend on the worker's locale encoding.
+        with open(styles_path, 'r', encoding='utf-8') as f:
+            style_data = json.load(f)
+        log.info(f"Loaded style sections: {list(style_data.keys())}")
+        # Download style assets
+        local_assets = _download_style_assets(style_assets, style_dir, download_func, log)
+        # Update paths in style_data
+        if local_assets:
+            updates_made = update_asset_paths(style_data, local_assets, log)
+            if updates_made:
+                save_style_params(style_data, styles_path, log)
+        # Log karaoke style for debugging
+        if 'karaoke' in style_data:
+            k = style_data['karaoke']
+            log.info(
+                f"Final karaoke style: background_image={k.get('background_image', 'NOT SET')}, "
+                f"font_path={k.get('font_path', 'NOT SET')}"
+            )
+        return styles_path, style_data
+    except Exception as e:
+        # Deliberate best effort: fall back to the minimal styles rather than fail the job.
+        log.warning(f"Failed to download custom styles: {e}, using defaults")
+        minimal_styles = get_minimal_karaoke_styles()
+        save_style_params(minimal_styles, styles_path, log)
+        return styles_path, minimal_styles
+# =============================================================================
+# HELPER FUNCTIONS
+# =============================================================================
+def get_default_style_params() -> Dict[str, Any]:
+    """Return a new dict holding a shallow copy of each section's default style."""
+    section_defaults = (
+        ("intro", DEFAULT_INTRO_STYLE),
+        ("end", DEFAULT_END_STYLE),
+        ("karaoke", DEFAULT_KARAOKE_STYLE),
+        ("cdg", DEFAULT_CDG_STYLE),
+    )
+    return {section: defaults.copy() for section, defaults in section_defaults}
+def get_minimal_karaoke_styles() -> Dict[str, Any]:
+    """
+    Build the minimal style set for karaoke video generation.
+    Used when no custom styles are provided: contains only the "karaoke" and
+    "cdg" sections (copies of their defaults), i.e. just enough configuration
+    for the ASS subtitle generator and CDG generator.
+    """
+    minimal: Dict[str, Any] = {}
+    minimal["karaoke"] = DEFAULT_KARAOKE_STYLE.copy()
+    minimal["cdg"] = DEFAULT_CDG_STYLE.copy()
+    return minimal
+def get_intro_format(style_params: Dict[str, Any]) -> Dict[str, Any]:
+    """
+    Extract intro/title screen format from style parameters.
+    Merges custom intro params over a copy of DEFAULT_INTRO_STYLE; custom
+    values win. A missing or null "intro" section yields the plain defaults.
+    """
+    # `or {}` also covers an explicit null section ("intro": null in the JSON),
+    # which would otherwise make update() raise TypeError.
+    intro_params = style_params.get("intro") or {}
+    result = DEFAULT_INTRO_STYLE.copy()
+    result.update(intro_params)
+    return result
+def get_end_format(style_params: Dict[str, Any]) -> Dict[str, Any]:
+    """
+    Extract end screen format from style parameters.
+    Merges custom end params over a copy of DEFAULT_END_STYLE; custom values
+    win. A missing or null "end" section yields the plain defaults.
+    """
+    # `or {}` also covers an explicit null section ("end": null in the JSON),
+    # which would otherwise make update() raise TypeError.
+    end_params = style_params.get("end") or {}
+    result = DEFAULT_END_STYLE.copy()
+    result.update(end_params)
+    return result
+def get_karaoke_format(style_params: Dict[str, Any]) -> Dict[str, Any]:
+    """
+    Extract karaoke video format from style parameters.
+    Merges custom karaoke params over a copy of DEFAULT_KARAOKE_STYLE; custom
+    values win. A missing or null "karaoke" section yields the plain defaults.
+    """
+    # `or {}` also covers an explicit null section ("karaoke": null in the JSON),
+    # which would otherwise make update() raise TypeError.
+    karaoke_params = style_params.get("karaoke") or {}
+    result = DEFAULT_KARAOKE_STYLE.copy()
+    result.update(karaoke_params)
+    return result
+def get_cdg_format(style_params: Dict[str, Any]) -> Optional[Dict[str, Any]]:
+    """
+    Extract CDG generation format from style parameters.
+    Returns None if no CDG section is defined (key missing, or set to null).
+    Otherwise merges the section over a copy of DEFAULT_CDG_STYLE; an empty
+    section therefore yields the plain defaults.
+    """
+    cdg_params = style_params.get("cdg")
+    # A null section is treated like an absent one instead of crashing in update().
+    if cdg_params is None:
+        return None
+    result = DEFAULT_CDG_STYLE.copy()
+    result.update(cdg_params)
+    return result
+def get_video_durations(style_params: Dict[str, Any]) -> Tuple[int, int]:
+    """
+    Get intro and end video durations from style parameters.
+    A section that is missing or null, or that has no "video_duration" entry,
+    falls back to the default for that section.
+    Returns:
+        Tuple of (intro_duration, end_duration) in seconds.
+    """
+    # `or {}` guards against an explicit null section, on which .get() would fail.
+    intro_section = style_params.get("intro") or {}
+    end_section = style_params.get("end") or {}
+    intro_duration = intro_section.get(
+        "video_duration", DEFAULT_INTRO_STYLE["video_duration"]
+    )
+    end_duration = end_section.get(
+        "video_duration", DEFAULT_END_STYLE["video_duration"]
+    )
+    return intro_duration, end_duration
+def get_existing_images(style_params: Dict[str, Any]) -> Tuple[Optional[str], Optional[str]]:
+    """
+    Get existing title and end images from style parameters.
+    Reads "existing_image" from the "intro" and "end" sections; a section that
+    is missing or null contributes None.
+    Returns:
+        Tuple of (existing_title_image, existing_end_image) paths or None.
+    """
+    # `or {}` guards against an explicit null section, on which .get() would fail.
+    intro_section = style_params.get("intro") or {}
+    end_section = style_params.get("end") or {}
+    existing_title_image = intro_section.get("existing_image")
+    existing_end_image = end_section.get("existing_image")
+    return existing_title_image, existing_end_image

karaoke_gen/utils/bulk_cli.py CHANGED Viewed

@@ -1,4 +1,10 @@
 #!/usr/bin/env python
+# Suppress SyntaxWarnings from third-party dependencies (pydub, syrics)
+# that have invalid escape sequences in regex patterns (not yet fixed for Python 3.12+)
+import warnings
+warnings.filterwarnings("ignore", category=SyntaxWarning, module="pydub")
+warnings.filterwarnings("ignore", category=SyntaxWarning, module="syrics")
 import argparse
 import logging
 import pkg_resources

karaoke-gen 0.57.0__py3-none-any.whl → 0.71.27__py3-none-any.whl

karaoke-gen 0.57.0__py3-none-any.whl → 0.71.27__py3-none-any.whl