karaoke-gen 0.50.0 (py3-none-any.whl)

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

@@ -0,0 +1,483 @@
+ #!/usr/bin/env python
+ import argparse
+ import logging
+ import pkg_resources
+ import os
+ import csv
+ import asyncio
+ import json
+ import sys
+ from karaoke_prep import KaraokePrep
+ from karaoke_prep.karaoke_finalise import KaraokeFinalise
+
+ # Global logger
+ logger = logging.getLogger(__name__)
+ logger.setLevel(logging.INFO)  # Set initial log level
+
+ # Module-level log formatter, populated by setup_logging(); initialised to None so the
+ # "global log_formatter" checks elsewhere never hit a NameError.
+ log_formatter = None
+
+
+ async def process_track_prep(row, args, logger, log_formatter):
+     """Phase 1: process a track through the prep stage only, without video rendering."""
+     # Read the row fields up front so the error log below can always name the track
+     artist = row["Artist"].strip()
+     title = row["Title"].strip()
+     guide_file = row["Mixed Audio Filename"].strip()
+     instrumental_file = row["Instrumental Audio Filename"].strip()
+
+     original_dir = os.getcwd()
+     try:
+         logger.info(f"Initial prep phase for track: {artist} - {title}")
+
+         kprep = KaraokePrep(
+             artist=artist,
+             title=title,
+             input_media=guide_file,
+             existing_instrumental=instrumental_file,
+             style_params_json=args.style_params_json,
+             logger=logger,
+             log_level=args.log_level,
+             dry_run=args.dry_run,
+             render_video=False,  # First phase: no video rendering
+             create_track_subfolders=True,
+         )
+
+         await kprep.process()
+         return True
+     except Exception as e:
+         logger.error(f"Failed initial prep for {artist} - {title}: {str(e)}")
+         return False
+     finally:
+         os.chdir(original_dir)
+
+
+ async def process_track_render(row, args, logger, log_formatter):
+     """Phase 2: render the karaoke video with KaraokePrep, then run KaraokeFinalise."""
+     # First, load CDG styles if CDG generation is enabled
+     cdg_styles = None
+     if args.enable_cdg:
+         if not args.style_params_json:
+             # Raise ValueError instead of sys.exit so the caller decides how to handle it
+             raise ValueError("CDG styles JSON file path (--style_params_json) is required when --enable_cdg is used")
+         try:
+             with open(args.style_params_json, "r") as f:
+                 style_params = json.load(f)  # Use json.load directly with the file object
+             # The CDG settings must live under a top-level 'cdg' key
+             if "cdg" not in style_params:
+                 raise ValueError(f"'cdg' key not found in style parameters file: {args.style_params_json}")
+             cdg_styles = style_params["cdg"]
+         except FileNotFoundError:
+             # Re-raise with a clearer message
+             raise FileNotFoundError(f"CDG styles configuration file not found: {args.style_params_json}")
+         except json.JSONDecodeError as e:
+             # Raise ValueError for invalid JSON
+             raise ValueError(f"Invalid JSON in CDG styles configuration file: {str(e)}")
+
+     original_dir = os.getcwd()
+     artist = row["Artist"].strip()
+     title = row["Title"].strip()
+     guide_file = row["Mixed Audio Filename"].strip()
+     instrumental_file = row["Instrumental Audio Filename"].strip()
+
+     try:
+         # Initialize KaraokeFinalise first (needed for test assertions)
+         kfinalise = KaraokeFinalise(
+             log_formatter=log_formatter,
+             log_level=args.log_level,
+             dry_run=args.dry_run,
+             enable_cdg=args.enable_cdg,
+             enable_txt=args.enable_txt,
+             cdg_styles=cdg_styles,
+             non_interactive=True,
+         )
+
+         # Locate the track directory created during the prep phase
+         track_dir = os.path.join(args.output_dir, f"{artist} - {title}")
+         if not os.path.exists(track_dir):
+             logger.error(f"Track directory not found: {track_dir}")
+             return True  # Return True so the remaining tracks still get processed
+
+         # Run KaraokePrep again, this time with video rendering enabled.
+         # Splitting the phases lets a human review the lyrics for the whole batch fairly
+         # quickly in phase 1, then leave the script running to render all of the videos here.
+         logger.info(f"Video rendering for track: {artist} - {title}")
+         kprep = KaraokePrep(
+             artist=artist,
+             title=title,
+             input_media=guide_file,
+             existing_instrumental=instrumental_file,
+             style_params_json=args.style_params_json,
+             logger=logger,
+             log_level=args.log_level,
+             dry_run=args.dry_run,
+             render_video=True,  # Second phase: with video rendering
+             create_track_subfolders=True,
+             skip_transcription_review=True,
+         )
+
+         await kprep.process()
+
+         # Finalise inside the track directory, always returning to the original directory
+         try:
+             os.chdir(track_dir)
+             kfinalise.process()
+             return True
+         except Exception as e:
+             logger.error(f"Error during finalisation: {str(e)}")
+             raise  # Re-raise to be caught by the outer try/except
+         finally:
+             os.chdir(original_dir)
+
+     except Exception as e:
+         logger.error(f"Failed render/finalise for {artist} - {title}: {str(e)}")
+         os.chdir(original_dir)  # Make sure we go back to the original directory
+         return False
+
+
+ def update_csv_status(csv_path, row_index, new_status, dry_run=False):
+     """Update the status of a processed row in the CSV file.
+
+     Args:
+         csv_path (str): Path to the CSV file
+         row_index (int): Index of the row to update
+         new_status (str): New status to set
+         dry_run (bool): If True, log the update but don't modify the file
+
+     Returns:
+         bool: True if updated, False if in dry run mode or error occurred
+     """
+     if dry_run:
+         logger.info(f"DRY RUN: Would update row {row_index} in {csv_path} to status '{new_status}'")
+         return False
+
+     try:
+         # Read all rows
+         with open(csv_path, "r") as f:
+             reader = csv.DictReader(f)
+             rows = list(reader)
+
+         # Check if CSV has any rows
+         if not rows:
+             logger.error(f"CSV file {csv_path} is empty or has no data rows")
+             return False
+
+         # Update status for the processed row
+         if row_index < 0 or row_index >= len(rows):
+             logger.error(f"Row index {row_index} is out of range for CSV with {len(rows)} rows")
+             return False
+
+         rows[row_index]["Status"] = new_status
+
+         # Write back to CSV
+         fieldnames = rows[0].keys()
+         with open(csv_path, "w", newline="") as f:
+             writer = csv.DictWriter(f, fieldnames=fieldnames)
+             writer.writeheader()
+             writer.writerows(rows)
+
+         return True
+
+     except Exception as e:
+         logger.error(f"Error updating CSV status: {str(e)}")
+         return False
+
+
+ def parse_arguments():
+     """Parse command line arguments"""
+     parser = argparse.ArgumentParser(
+         description="Process multiple karaoke tracks in bulk from a CSV file.",
+         formatter_class=lambda prog: argparse.RawTextHelpFormatter(prog, max_help_position=54),
+     )
+
+     # Basic information
+     parser.add_argument(
+         "input_csv",
+         help="Path to CSV file containing tracks to process. CSV should have columns: Artist,Title,Mixed Audio Filename,Instrumental Audio Filename,Status",
+     )
+
+     package_version = pkg_resources.get_distribution("karaoke-gen").version
+     parser.add_argument("-v", "--version", action="version", version=f"%(prog)s {package_version}")
+
+     # Required arguments
+     parser.add_argument(
+         "--style_params_json",
+         required=True,
+         help="Path to style parameters JSON file",
+     )
+     parser.add_argument(
+         "--output_dir",
+         default=".",
+         help="Optional: directory to write output files (default: <current dir>). Example: --output_dir=/app/karaoke",
+     )
+
+     # Finalise-specific arguments
+     parser.add_argument(
+         "--enable_cdg",
+         action="store_true",
+         help="Optional: Enable CDG ZIP generation during finalisation. Example: --enable_cdg",
+     )
+     parser.add_argument(
+         "--enable_txt",
+         action="store_true",
+         help="Optional: Enable TXT ZIP generation during finalisation. Example: --enable_txt",
+     )
+
+     # Logging & Debugging
+     parser.add_argument(
+         "--log_level",
+         default="info",
+         help="Optional: logging level, e.g. info, debug, warning (default: %(default)s). Example: --log_level=debug",
+     )
+     parser.add_argument(
+         "--dry_run",
+         action="store_true",
+         help="Optional: perform a dry run without making any changes (default: %(default)s). Example: --dry_run",
+     )
+
+     args = parser.parse_args()
+
+     # Convert input_csv to absolute path early
+     args.input_csv = os.path.abspath(args.input_csv)
+
+     # Validate and convert log level
+     if isinstance(args.log_level, str):
+         try:
+             log_level_int = getattr(logging, args.log_level.upper())
+             args.log_level = log_level_int  # Store the numeric log level back in args
+         except AttributeError:
+             # Raise ValueError for invalid log level string
+             raise ValueError(f"Invalid log level string: {args.log_level}")
+     elif not isinstance(args.log_level, int):
+         # If it's neither string nor int, raise error
+         raise ValueError(f"Invalid log level type: {type(args.log_level)}")
+
+     return args
+
+
+ def _parse_and_validate_args():
+     """Parses arguments and performs initial validation."""
+     args = parse_arguments()  # Calls the modified parse_arguments
+
+     # Validate input CSV existence (raises FileNotFoundError if invalid)
+     if not validate_input_csv(args.input_csv):
+         raise FileNotFoundError(f"Input CSV file not found: {args.input_csv}")
+
+     # Validate style params JSON existence if CDG is enabled
+     if args.enable_cdg:
+         if not args.style_params_json:
+             raise ValueError("CDG styles JSON file path (--style_params_json) is required when --enable_cdg is used")
+         if not os.path.isfile(args.style_params_json):
+             raise FileNotFoundError(f"CDG styles configuration file not found: {args.style_params_json}")
+         # Basic JSON validation can also happen here if desired, or deferred to process_track_render
+         try:
+             with open(args.style_params_json, "r") as f:
+                 json.load(f)
+         except json.JSONDecodeError as e:
+             raise ValueError(f"Invalid JSON in CDG styles configuration file: {args.style_params_json} - {e}")
+         except FileNotFoundError:  # Should be caught above, but belt-and-suspenders
+             raise FileNotFoundError(f"CDG styles configuration file not found: {args.style_params_json}")
+
+     return args
+
+
+ def validate_input_csv(csv_path):
+     """Validate that the input CSV file exists.
+
+     Args:
+         csv_path (str): Path to the CSV file
+
+     Returns:
+         bool: True if the file exists, False otherwise
+     """
+     if not os.path.isfile(csv_path):
+         logger.error(f"Input CSV file not found: {csv_path}")
+         return False
+     return True
+
+
+ def _read_csv_file(csv_path):
+     """Reads the CSV file and returns rows as a list of dictionaries."""
+     try:
+         with open(csv_path, "r", newline="") as f:
+             reader = csv.DictReader(f)
+             # Check for required columns before reading all rows
+             # (reader.fieldnames is None for a completely empty file)
+             required_columns = {"Artist", "Title", "Mixed Audio Filename", "Instrumental Audio Filename", "Status"}
+             fieldnames = set(reader.fieldnames or [])
+             if not required_columns.issubset(fieldnames):
+                 missing = required_columns - fieldnames
+                 raise ValueError(f"CSV file missing required columns: {', '.join(sorted(missing))}")
+             rows = list(reader)
+             if not rows:
+                 logger.warning(f"CSV file {csv_path} is empty or contains only headers.")
+             return rows
+     except FileNotFoundError:
+         # This should already be caught by validate_input_csv, but handle it defensively
+         logger.error(f"CSV file not found during read: {csv_path}")
+         raise  # Re-raise the exception
+     except Exception as e:
+         logger.error(f"Error reading CSV file {csv_path}: {e}")
+         raise  # Re-raise other read errors
+
+
+ async def process_csv_rows(csv_path, rows, args, logger, log_formatter):
+     """Process all rows in a CSV file.
+
+     Args:
+         csv_path (str): Path to the CSV file
+         rows (list): List of CSV rows as dictionaries
+         args (argparse.Namespace): Command line arguments
+         logger (logging.Logger): Logger instance
+         log_formatter (logging.Formatter): Log formatter
+
+     Returns:
+         dict: A summary of the processing results
+     """
+     results = {
+         "prep_success": 0,
+         "prep_failed": 0,
+         "render_success": 0,
+         "render_failed": 0,
+         "skipped": 0,
+     }
+
+     # Phase 1: Initial prep for all tracks
+     logger.info("Starting Phase 1: Initial prep for all tracks")
+     for i, row in enumerate(rows):
+         status = row["Status"].lower() if "Status" in row else ""
+         if status != "uploaded":
+             logger.info(f"Skipping {row.get('Artist', 'Unknown')} - {row.get('Title', 'Unknown')} (Status: {row.get('Status', 'Unknown')})")
+             results["skipped"] += 1
+             continue
+
+         success = await process_track_prep(row, args, logger, log_formatter)
+         if success:
+             results["prep_success"] += 1
+             if not args.dry_run:
+                 # Update the in-memory row as well so the Phase 2 status check sees the result
+                 row["Status"] = "Prep_Complete"
+                 update_csv_status(csv_path, i, "Prep_Complete", args.dry_run)
+         else:
+             results["prep_failed"] += 1
+             if not args.dry_run:
+                 row["Status"] = "Prep_Failed"
+                 update_csv_status(csv_path, i, "Prep_Failed", args.dry_run)
+
+     # Phase 2: Render and finalise all tracks
+     logger.info("Starting Phase 2: Render and finalise for all tracks")
+     for i, row in enumerate(rows):
+         status = row["Status"].lower() if "Status" in row else ""
+         # "uploaded" is still accepted here so rows whose status was never rewritten
+         # (e.g. during a dry run) are not silently skipped
+         if status not in ["prep_complete", "uploaded"]:
+             logger.info(f"Skipping {row.get('Artist', 'Unknown')} - {row.get('Title', 'Unknown')} (Status: {row.get('Status', 'Unknown')})")
+             continue
+
+         success = await process_track_render(row, args, logger, log_formatter)
+         if success:
+             results["render_success"] += 1
+             if not args.dry_run:
+                 row["Status"] = "Completed"
+                 update_csv_status(csv_path, i, "Completed", args.dry_run)
+         else:
+             results["render_failed"] += 1
+             if not args.dry_run:
+                 row["Status"] = "Render_Failed"
+                 update_csv_status(csv_path, i, "Render_Failed", args.dry_run)
+
+     return results
+
+
+ async def async_main():
+     """Main async function to process bulk tracks from CSV"""
+     # Parse and validate arguments first (raises exceptions on failure)
+     args = _parse_and_validate_args()
+
+     # Set log level based on validated args (logger should already be partially set up by main)
+     logger.setLevel(args.log_level)
+     logger.info(f"Log level set to {logging.getLevelName(args.log_level)}")
+     if args.dry_run:
+         logger.info("Dry run mode enabled. No changes will be made.")
+
+     logger.info(f"Starting bulk processing with input CSV: {args.input_csv}")
+
+     # Read CSV (raises exceptions on failure)
+     rows = _read_csv_file(args.input_csv)
+
+     # Check if log_formatter is available (should be set by main)
+     global log_formatter
+     if log_formatter is None:
+         # This case should ideally not happen if main() calls setup_logging correctly
+         logger.warning("Log formatter not found, setting up default.")
+         log_formatter = setup_logging(args.log_level)
+
+     # Process the CSV rows
+     results = await process_csv_rows(args.input_csv, rows, args, logger, log_formatter)
+
+     # Log summary
+     logger.info(f"Processing complete. Summary: {results}")
+     return results
+
+
+ def setup_logging(log_level=logging.INFO):
+     """Set up logging with the given log level.
+
+     Args:
+         log_level (int): Logging level (e.g., logging.INFO, logging.DEBUG)
+
+     Returns:
+         logging.Formatter: The log formatter for use by other functions
+     """
+     global log_formatter  # Make log_formatter accessible to other functions
+     log_handler = logging.StreamHandler()
+     log_formatter = logging.Formatter(fmt="%(asctime)s.%(msecs)03d - %(levelname)s - %(module)s - %(message)s", datefmt="%Y-%m-%d %H:%M:%S")
+     log_handler.setFormatter(log_formatter)
+     logger.addHandler(log_handler)
+     logger.setLevel(log_level)
+     return log_formatter
+
+
+ def main():
+     """Main entry point for the CLI."""
+     try:
+         # Set up logging early to capture potential errors during setup/parsing.
+         # Pre-scan argv for --log_level only; full parsing happens later in async_main().
+         temp_parser = argparse.ArgumentParser(add_help=False)
+         temp_parser.add_argument("--log_level", default="info")
+         temp_args, _ = temp_parser.parse_known_args()
+         initial_log_level_str = temp_args.log_level
+         try:
+             initial_log_level = getattr(logging, initial_log_level_str.upper())
+         except AttributeError:
+             initial_log_level = logging.INFO
+             print(f"Warning: Invalid initial log level '{initial_log_level_str}'. Using INFO.", file=sys.stderr)
+
+         setup_logging(initial_log_level)
+
+         # Run the async main function using asyncio
+         asyncio.run(async_main())
+         logger.info("Bulk processing finished successfully.")
+         sys.exit(0)
+     except (FileNotFoundError, ValueError, argparse.ArgumentError) as e:
+         # Log specific configuration/setup errors before exiting
+         if logger.handlers:  # Check if logger was set up
+             logger.error(f"Configuration error: {str(e)}")
+         else:  # Fallback if logging setup failed
+             print(f"Error: {str(e)}", file=sys.stderr)
+         sys.exit(1)
+     except Exception as e:
+         # Catch any other unexpected errors during processing
+         if logger.handlers:
+             logger.exception(f"An unexpected error occurred during bulk processing: {str(e)}")  # Use exception() for the traceback
+         else:
+             print(f"An unexpected error occurred: {str(e)}", file=sys.stderr)
+         sys.exit(1)
+
+
+ if __name__ == "__main__":
+     main()
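
For context, the module above expects its input CSV to contain the columns checked in _read_csv_file (Artist, Title, Mixed Audio Filename, Instrumental Audio Filename, Status) and moves each row through the statuses Uploaded, then Prep_Complete or Prep_Failed, then Completed or Render_Failed. The sketch below builds a minimal input CSV matching that layout; the artist, title, and filenames are placeholder values, not part of the package.

# Sketch: write a sample input CSV for the bulk-processing module above.
# Column names come from the required_columns check in _read_csv_file; row values are placeholders.
import csv

fieldnames = ["Artist", "Title", "Mixed Audio Filename", "Instrumental Audio Filename", "Status"]
rows = [
    {
        "Artist": "Example Artist",                                       # placeholder
        "Title": "Example Song",                                          # placeholder
        "Mixed Audio Filename": "example_song_mixed.flac",                # placeholder path
        "Instrumental Audio Filename": "example_song_instrumental.flac",  # placeholder path
        # Phase 1 only processes rows whose Status is "Uploaded" (compared case-insensitively);
        # it rewrites this to Prep_Complete/Prep_Failed, and Phase 2 to Completed/Render_Failed.
        "Status": "Uploaded",
    },
]

with open("bulk_tracks.csv", "w", newline="") as f:
    writer = csv.DictWriter(f, fieldnames=fieldnames)
    writer.writeheader()
    writer.writerows(rows)

If --enable_cdg is passed, --style_params_json must point to a JSON file containing a top-level "cdg" key; its contents are handed to KaraokeFinalise unchanged, so the exact sub-keys depend on that package rather than on this script. Assuming the wheel wires this module up as a console script (the command name is not visible in this diff), an invocation would combine the positional CSV path with the flags defined in parse_arguments, for example: <script> bulk_tracks.csv --style_params_json styles.json --output_dir /app/karaoke --enable_cdg --dry_run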