PyPI - peg-this - Versions diffs - 4.0.0__py3-none-any.whl → 4.1.0__py3-none-any.whl - Mend

peg-this 4.0.0 (py3-none-any.whl) → 4.1.0 (py3-none-any.whl)

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (18) hide show

peg_this/features/audio.py +63 -16
peg_this/features/batch.py +105 -79
peg_this/features/convert.py +179 -95
peg_this/features/crop.py +63 -34
peg_this/features/inspect.py +71 -21
peg_this/features/join.py +85 -31
peg_this/features/subtitle.py +397 -0
peg_this/features/trim.py +40 -10
peg_this/peg_this.py +4 -1
peg_this/utils/validation.py +228 -0
peg_this-4.1.0.dist-info/METADATA +283 -0
peg_this-4.1.0.dist-info/RECORD +21 -0
{peg_this-4.0.0.dist-info → peg_this-4.1.0.dist-info}/WHEEL +1 -1
peg_this-4.0.0.dist-info/METADATA +0 -164
peg_this-4.0.0.dist-info/RECORD +0 -19
{peg_this-4.0.0.dist-info → peg_this-4.1.0.dist-info}/entry_points.txt +0 -0
{peg_this-4.0.0.dist-info → peg_this-4.1.0.dist-info}/licenses/LICENSE +0 -0
{peg_this-4.0.0.dist-info → peg_this-4.1.0.dist-info}/top_level.txt +0 -0

peg_this/features/subtitle.py ADDED Viewed

@@ -0,0 +1,397 @@
+import os
+import tempfile
+from pathlib import Path
+import ffmpeg
+import questionary
+from rich.console import Console
+from rich.progress import Progress, SpinnerColumn, TextColumn, BarColumn, TimeElapsedColumn
+from peg_this.utils.ffmpeg_utils import run_command, has_audio_stream
+from peg_this.utils.validation import (
+    validate_input_file, check_output_file, check_disk_space,
+    get_video_duration, format_duration, press_continue
+)
+console = Console()
+def check_existing_subtitles(file_path):
+    """Report whether *file_path* already contains subtitle streams.
+
+    Returns a ``(has_subtitles, count)`` tuple. Any failure while probing or
+    inspecting the streams is treated as "no subtitles" and yields
+    ``(False, 0)``.
+    """
+    try:
+        streams = ffmpeg.probe(file_path).get('streams', [])
+        count = sum(1 for stream in streams if stream.get('codec_type') == 'subtitle')
+        return count > 0, count
+    except Exception:
+        # Best effort: an unreadable file simply reports no subtitle tracks.
+        return False, 0
+def sanitize_path_for_filter(path):
+    """Escape a filesystem path for use inside an ffmpeg filter argument.
+
+    Backslashes become forward slashes, and colons and single quotes are
+    prefixed with a backslash. *path* may be a string or any object whose
+    ``str()`` is the path; the escaped string is returned.
+    """
+    # One translate pass is enough: the backslashes inserted in front of
+    # ':' and "'" are never themselves rewritten.
+    escapes = str.maketrans({"\\": "/", ":": "\\:", "'": "\\'"})
+    return str(path).translate(escapes)
+def extract_audio_for_whisper(input_file, temp_dir):
+    """Extract the audio of *input_file* into ``temp_audio.wav`` inside *temp_dir*.
+
+    The ffmpeg job is run with one audio channel (``ac=1``), a 16000 Hz sample
+    rate (``ar=16000``) and video disabled (``vn``).
+
+    Returns:
+        The path of the WAV file, or ``None`` after printing an error when
+        ffmpeg fails or the resulting file is missing or empty.
+    """
+    wav_target = os.path.join(temp_dir, "temp_audio.wav")
+    try:
+        console.print("[cyan]Extracting audio for analysis...[/cyan]")
+        job = ffmpeg.input(input_file).output(
+            wav_target, ac=1, ar=16000, vn=None, loglevel="error"
+        ).overwrite_output()
+        job.run(capture_stdout=True, capture_stderr=True)
+        # ffmpeg can exit cleanly without producing usable output, so verify it.
+        if not os.path.exists(wav_target):
+            console.print("[bold red]Error: Failed to extract audio file.[/bold red]")
+            return None
+        if os.path.getsize(wav_target) == 0:
+            console.print("[bold red]Error: Extracted audio is empty.[/bold red]")
+            return None
+        return wav_target
+    except ffmpeg.Error as exc:
+        detail = exc.stderr.decode() if exc.stderr else "Unknown error"
+        console.print(f"[bold red]Failed to extract audio: {detail}[/bold red]")
+        return None
+def format_timestamp(seconds):
+    """Format a time offset in seconds as an SRT timestamp (``HH:MM:SS,mmm``).
+
+    Args:
+        seconds: Offset from the start of the media, in seconds. Negative
+            values are clamped to zero.
+
+    Returns:
+        The timestamp string, with a comma before the milliseconds.
+    """
+    # Round once to whole milliseconds and split with integer arithmetic.
+    # Truncating the float's fractional part instead loses a millisecond to
+    # representation error (4.35 would yield 349 rather than 350).
+    total_millis = max(0, round(seconds * 1000))
+    total_secs, millis = divmod(total_millis, 1000)
+    total_mins, secs = divmod(total_secs, 60)
+    hours, minutes = divmod(total_mins, 60)
+    return f"{hours:02d}:{minutes:02d}:{secs:02d},{millis:03d}"
+def format_timestamp_vtt(seconds):
+    """Format a time offset in seconds as a WebVTT timestamp (``HH:MM:SS.mmm``).
+
+    Args:
+        seconds: Offset from the start of the media, in seconds. Negative
+            values are clamped to zero.
+
+    Returns:
+        The timestamp string, with a dot before the milliseconds.
+    """
+    # Round once to whole milliseconds and split with integer arithmetic.
+    # Truncating the float's fractional part instead loses a millisecond to
+    # representation error (4.35 would yield 349 rather than 350).
+    total_millis = max(0, round(seconds * 1000))
+    total_secs, millis = divmod(total_millis, 1000)
+    total_mins, secs = divmod(total_secs, 60)
+    hours, minutes = divmod(total_mins, 60)
+    return f"{hours:02d}:{minutes:02d}:{secs:02d}.{millis:03d}"
+def segments_to_srt(segments):
+    """Render transcription segments as SubRip (SRT) text.
+
+    Each segment must expose ``start``, ``end`` and ``text``. Cues are
+    numbered from 1 and separated by a blank line.
+    """
+    cues = [
+        f"{index}\n{format_timestamp(seg.start)} --> {format_timestamp(seg.end)}\n{seg.text.strip()}\n"
+        for index, seg in enumerate(segments, 1)
+    ]
+    return "\n".join(cues)
+def segments_to_vtt(segments):
+    """Render transcription segments as WebVTT text.
+
+    The output starts with the ``WEBVTT`` header, followed by one cue per
+    segment; each segment must expose ``start``, ``end`` and ``text``.
+    """
+    blocks = ["WEBVTT\n"]
+    blocks.extend(
+        f"{format_timestamp_vtt(seg.start)} --> {format_timestamp_vtt(seg.end)}\n{seg.text.strip()}\n"
+        for seg in segments
+    )
+    return "\n".join(blocks)
+def segments_to_txt(segments):
+    """Return the plain transcript: each segment's stripped text on its own line."""
+    lines = [seg.text.strip() for seg in segments]
+    return "\n".join(lines)
+def segments_to_lrc(segments):
+    """Render transcription segments as LRC lyric lines (``[MM:SS.xx]text``).
+
+    Args:
+        segments: Iterable of objects exposing ``start`` (seconds) and ``text``.
+
+    Returns:
+        One LRC line per segment, joined with newlines.
+    """
+    lrc_lines = []
+    for segment in segments:
+        # Round to centiseconds before splitting into minutes and seconds.
+        # Formatting the raw remainder with ".2f" can round up to "60.00"
+        # (e.g. 59.999 s) without carrying into the minutes field.
+        total_centis = max(0, round(segment.start * 100))
+        minutes, rest = divmod(total_centis, 6000)
+        secs, centis = divmod(rest, 100)
+        lrc_lines.append(f"[{minutes:02d}:{secs:02d}.{centis:02d}]{segment.text.strip()}")
+    return "\n".join(lrc_lines)
+def generate_subtitles(file_path):
+    """Interactively transcribe *file_path* with Whisper and deliver subtitles.
+
+    The flow is: validate the input, ask for model / language / processing
+    mode / delivery action, extract the audio to a temporary WAV, transcribe
+    it with ``faster_whisper``, then either write a sidecar file, embed the
+    subtitles as a soft track, or burn them into a re-encoded video.
+
+    Args:
+        file_path: Path of the media file to transcribe.
+
+    Returns:
+        None. Progress, results and errors are reported on the console; the
+        function returns early when the user cancels a prompt or a step fails.
+    """
+    if not validate_input_file(file_path):
+        press_continue()
+        return
+    if not has_audio_stream(file_path):
+        console.print("[bold red]Error: File has no audio stream.[/bold red]")
+        console.print("[dim]Subtitles require audio to transcribe.[/dim]")
+        press_continue()
+        return
+    has_subs, sub_count = check_existing_subtitles(file_path)
+    if has_subs:
+        console.print(f"[yellow]Note: This video already has {sub_count} subtitle track(s) embedded.[/yellow]")
+        if not questionary.confirm("Continue generating new subtitles?", default=True).ask():
+            return
+    duration = get_video_duration(file_path)
+    if duration > 3600:
+        console.print(f"[yellow]Note: This is a long video ({format_duration(duration)}).[/yellow]")
+        console.print("[dim]Transcription may take a while. Consider using a smaller model for faster results.[/dim]")
+        if not questionary.confirm("Continue?", default=True).ask():
+            return
+    # Imported lazily so the rest of the tool works without faster-whisper.
+    try:
+        from faster_whisper import WhisperModel
+    except ImportError:
+        console.print("[bold red]Error: faster-whisper is not installed.[/bold red]")
+        console.print("[yellow]Install it with: pip install faster-whisper[/yellow]")
+        press_continue()
+        return
+    console.print("\n[bold cyan]Subtitle Generation (Whisper AI)[/bold cyan]")
+    if duration > 0:
+        console.print(f"[dim]Video duration: {format_duration(duration)}[/dim]")
+    # Pre-select the smallest model for media longer than 30 minutes.
+    if duration > 1800:
+        default_model = "tiny.en (fastest, English only, ~75MB)"
+        console.print("[dim]Tip: For long videos, smaller models are recommended.[/dim]")
+    else:
+        default_model = "small.en (balanced, English only, ~500MB)"
+    model_choice = questionary.select(
+        "Select Whisper model:",
+        choices=[
+            "tiny.en (fastest, English only, ~75MB)",
+            "base.en (fast, English only, ~150MB)",
+            "small.en (balanced, English only, ~500MB)",
+            "medium.en (accurate, English only, ~1.5GB)",
+            "small (balanced, multilingual, ~500MB)",
+            "medium (accurate, multilingual, ~1.5GB)",
+            "large-v3 (best quality, multilingual, ~3GB)",
+        ],
+        default=default_model
+    ).ask()
+    if not model_choice:
+        return
+    # The model identifier is the first word of the menu label.
+    model_name = model_choice.split(" ")[0]
+    language = "en"
+    # Only multilingual models (no ".en" suffix) offer a language choice.
+    if not model_name.endswith(".en"):
+        if questionary.confirm("Change language? (default: English)", default=False).ask():
+            # Each print carries its own balanced [dim] tags: a closing tag
+            # with no opening tag in the same call makes Rich raise MarkupError.
+            console.print("\n[dim]Common codes: en (English), ta (Tamil), hi (Hindi), te (Telugu),[/dim]")
+            console.print("[dim]ml (Malayalam), kn (Kannada), fr (French), de (German), es (Spanish), zh (Chinese)[/dim]")
+            console.print("[dim]Full list: https://en.wikipedia.org/wiki/List_of_ISO_639-1_codes[/dim]")
+            language = questionary.text(
+                "Enter language code (or 'auto' to detect automatically):",
+                default="en"
+            ).ask()
+            if not language:
+                return
+            # Normalize so inputs such as " EN" or "Auto" behave like "en"/"auto".
+            language = language.strip().lower()
+            if not language:
+                return
+            if language == "auto":
+                # None is passed to transcribe() as the language in this case.
+                language = None
+    processing_mode = questionary.select(
+        "Select processing mode:",
+        choices=[
+            "Fast (Recommended) - Optimized for speed, great accuracy",
+            "Accurate - Best quality, slower processing",
+        ],
+        default="Fast (Recommended) - Optimized for speed, great accuracy"
+    ).ask()
+    if not processing_mode:
+        return
+    compute_type = "int8" if "Fast" in processing_mode else "float32"
+    action = questionary.select(
+        "What do you want to do with the subtitles?",
+        choices=[
+            "Export as sidecar file (.srt/.vtt)",
+            "Embed into video (Soft Subtitles)",
+            "Burn into video (Hard Subtitles)"
+        ]
+    ).ask()
+    if not action:
+        return
+    output_format = "srt"
+    if "sidecar" in action:
+        output_format = questionary.select(
+            "Select format:",
+            choices=["srt", "vtt", "txt", "lrc"]
+        ).ask()
+        if not output_format:
+            return
+    input_p = Path(file_path)
+    # Outputs are placed next to the input file, named after its stem.
+    if "sidecar" in action:
+        output_path = input_p.with_name(f"{input_p.stem}.{output_format}")
+        action_result, final_output_path = check_output_file(str(output_path), "Subtitle file")
+    elif "Embed" in action:
+        output_path = input_p.with_name(f"{input_p.stem}_softsub{input_p.suffix}")
+        action_result, final_output_path = check_output_file(str(output_path), "Video file")
+    elif "Burn" in action:
+        output_path = input_p.with_name(f"{input_p.stem}_hardsub{input_p.suffix}")
+        action_result, final_output_path = check_output_file(str(output_path), "Video file")
+        # NOTE(review): this returns without press_continue(); presumably
+        # check_disk_space reports the problem itself - confirm.
+        if action_result != 'cancel' and not check_disk_space(file_path, multiplier=2):
+            return
+    else:
+        action_result = 'proceed'
+        final_output_path = None
+    if action_result == 'cancel':
+        console.print("[yellow]Operation cancelled.[/yellow]")
+        press_continue()
+        return
+    crf = "23"
+    if "Burn" in action:
+        quality = questionary.select(
+            "Select Video Quality (CRF):",
+            choices=["High (18)", "Medium (23)", "Low (28)"],
+            default="Medium (23)"
+        ).ask()
+        if not quality:
+            return
+        # Pull the number out of a label such as "Medium (23)".
+        crf = quality.split("(")[1].strip(")")
+    # The temporary WAV and subtitle file live only for the duration of this block.
+    with tempfile.TemporaryDirectory() as temp_dir:
+        wav_path = extract_audio_for_whisper(file_path, temp_dir)
+        if not wav_path:
+            press_continue()
+            return
+        console.print(f"[cyan]Loading Whisper model '{model_name}'...[/cyan]")
+        console.print("[dim]First run will download the model (may take a few minutes)[/dim]")
+        try:
+            model = WhisperModel(model_name, device="cpu", compute_type=compute_type)
+        except Exception as e:
+            # Map common failure texts to friendlier hints.
+            error_msg = str(e)
+            if "out of memory" in error_msg.lower():
+                console.print("[bold red]Error: Not enough memory to load model.[/bold red]")
+                console.print("[yellow]Try using a smaller model (tiny or base).[/yellow]")
+            elif "network" in error_msg.lower() or "connection" in error_msg.lower():
+                console.print("[bold red]Error: Failed to download model. Check your internet connection.[/bold red]")
+            else:
+                console.print(f"[bold red]Failed to load model: {e}[/bold red]")
+            press_continue()
+            return
+        console.print("[cyan]Transcribing audio...[/cyan]")
+        try:
+            with Progress(
+                SpinnerColumn(),
+                TextColumn("[progress.description]{task.description}"),
+                BarColumn(),
+                TimeElapsedColumn(),
+                console=console
+            ) as progress:
+                # total=None: the amount of work is not known up front.
+                task = progress.add_task("Transcribing...", total=None)
+                segments_generator, info = model.transcribe(
+                    wav_path,
+                    language=language,
+                    beam_size=5,
+                    vad_filter=True,
+                    vad_parameters=dict(min_silence_duration_ms=500)
+                )
+                # Consume the generator inside the progress context so the
+                # spinner stays visible while the segments are produced.
+                segments = list(segments_generator)
+                progress.update(task, completed=100)
+        except KeyboardInterrupt:
+            console.print("\n[yellow]Transcription cancelled by user.[/yellow]")
+            press_continue()
+            return
+        except Exception as e:
+            error_msg = str(e)
+            if "out of memory" in error_msg.lower():
+                console.print("[bold red]Error: Ran out of memory during transcription.[/bold red]")
+                console.print("[yellow]Try using a smaller model or processing a shorter video.[/yellow]")
+            else:
+                console.print(f"[bold red]Transcription failed: {e}[/bold red]")
+            press_continue()
+            return
+        if not segments:
+            console.print("[bold yellow]No speech detected in audio.[/bold yellow]")
+            console.print("[dim]The video might be silent, have only music, or the audio quality is too low.[/dim]")
+            press_continue()
+            return
+        detected_lang = info.language if language is None else language
+        # Only call the language "detected" when Whisper actually detected it.
+        lang_label = "Detected language" if language is None else "Language"
+        console.print(f"[green]{lang_label}: {detected_lang}[/green]")
+        console.print(f"[green]Transcribed {len(segments)} segments[/green]")
+        # Embedding and burning always go through SRT; only sidecar export
+        # honours the other formats.
+        if output_format == "srt" or "Embed" in action or "Burn" in action:
+            subtitle_content = segments_to_srt(segments)
+            sub_ext = "srt"
+        elif output_format == "vtt":
+            subtitle_content = segments_to_vtt(segments)
+            sub_ext = "vtt"
+        elif output_format == "txt":
+            subtitle_content = segments_to_txt(segments)
+            sub_ext = "txt"
+        elif output_format == "lrc":
+            subtitle_content = segments_to_lrc(segments)
+            sub_ext = "lrc"
+        else:
+            subtitle_content = segments_to_srt(segments)
+            sub_ext = "srt"
+        if not subtitle_content.strip():
+            console.print("[bold yellow]Warning: Generated subtitles are empty.[/bold yellow]")
+            press_continue()
+            return
+        # The temporary copy is the subtitle input for the embed/burn ffmpeg jobs.
+        sub_temp_path = os.path.join(temp_dir, f"output.{sub_ext}")
+        try:
+            with open(sub_temp_path, "w", encoding="utf-8") as f:
+                f.write(subtitle_content)
+        except IOError as e:
+            console.print(f"[bold red]Error writing subtitle file: {e}[/bold red]")
+            press_continue()
+            return
+        try:
+            if "sidecar" in action:
+                with open(final_output_path, "w", encoding="utf-8") as f:
+                    f.write(subtitle_content)
+                console.print(f"[bold green]Saved subtitles to: {final_output_path}[/bold green]")
+            elif "Embed" in action:
+                console.print("[cyan]Embedding subtitles (Soft Subs)...[/cyan]")
+                ext = input_p.suffix.lower()
+                # mov_text for .mp4/.m4v/.mov inputs, srt for every other extension.
+                scodec = "mov_text" if ext in ['.mp4', '.m4v', '.mov'] else "srt"
+                stream = ffmpeg.input(file_path)
+                sub_stream = ffmpeg.input(sub_temp_path)
+                out = ffmpeg.output(
+                    stream, sub_stream, str(final_output_path),
+                    c='copy', **{'c:s': scodec}, **{'metadata:s:s:0': f'language={detected_lang}'}
+                )
+                if action_result == 'overwrite':
+                    out = out.overwrite_output()
+                if run_command(out, "Embedding subtitles...", show_progress=True):
+                    console.print(f"[bold green]Created: {final_output_path}[/bold green]")
+                else:
+                    console.print("[bold red]Failed to embed subtitles.[/bold red]")
+            elif "Burn" in action:
+                console.print("[cyan]Burning subtitles (Hard Subs)...[/cyan]")
+                console.print("[dim]This requires re-encoding and may take a while...[/dim]")
+                stream = ffmpeg.input(file_path)
+                video = stream.video.filter('subtitles', sub_temp_path)
+                audio = stream.audio
+                # Video is re-encoded with libx264; the audio stream is copied.
+                out = ffmpeg.output(
+                    video, audio, str(final_output_path),
+                    vcodec='libx264', acodec='copy', crf=crf, preset='fast'
+                )
+                if action_result == 'overwrite':
+                    out = out.overwrite_output()
+                if run_command(out, "Burning subtitles (Re-encoding)...", show_progress=True):
+                    console.print(f"[bold green]Created: {final_output_path}[/bold green]")
+                else:
+                    console.print("[bold red]Failed to burn subtitles.[/bold red]")
+        except PermissionError:
+            console.print("[bold red]Error: Permission denied. Cannot write to output location.[/bold red]")
+            console.print("[dim]Try saving to a different location or check folder permissions.[/dim]")
+        except IOError as e:
+            console.print(f"[bold red]Error writing output: {e}[/bold red]")
+        except Exception as e:
+            console.print(f"[bold red]Unexpected error: {e}[/bold red]")
+    press_continue()

peg_this/features/trim.py CHANGED Viewed

@@ -1,4 +1,3 @@
 from pathlib import Path
 import ffmpeg
@@ -6,21 +5,52 @@ import questionary
 from rich.console import Console
 from peg_this.utils.ffmpeg_utils import run_command
+from peg_this.utils.validation import (
+    validate_input_file, check_output_file, get_video_duration,
+    validate_time_range, format_duration, press_continue
+)
 console = Console()
 def trim_video(file_path):
-    """Cut a video by specifying start and end times."""
+    if not validate_input_file(file_path):
+        press_continue()
+        return
+    duration = get_video_duration(file_path)
+    if duration > 0:
+        console.print(f"[dim]Video duration: {format_duration(duration)}[/dim]")
     start_time = questionary.text("Enter start time (HH:MM:SS or seconds):").ask()
-    if not start_time: return
+    if not start_time:
+        return
     end_time = questionary.text("Enter end time (HH:MM:SS or seconds):").ask()
-    if not end_time: return
+    if not end_time:
+        return
+    start_secs, end_secs = validate_time_range(start_time, end_time, duration if duration > 0 else None)
+    if start_secs is None:
+        press_continue()
+        return
     output_file = f"{Path(file_path).stem}_trimmed{Path(file_path).suffix}"
-    stream = ffmpeg.input(file_path, ss=start_time, to=end_time).output(output_file, c='copy', y=None)
-    run_command(stream, "Trimming video...", show_progress=True)
-    console.print(f"[bold green]Successfully trimmed to {output_file}[/bold green]")
-    questionary.press_any_key_to_continue().ask()
+    action_result, final_output = check_output_file(output_file, "Video file")
+    if action_result == 'cancel':
+        console.print("[yellow]Operation cancelled.[/yellow]")
+        press_continue()
+        return
+    stream = ffmpeg.input(file_path, ss=start_secs, to=end_secs).output(final_output, c='copy')
+    if action_result == 'overwrite':
+        stream = stream.overwrite_output()
+    if run_command(stream, "Trimming video...", show_progress=True):
+        console.print(f"[bold green]Successfully trimmed to {final_output}[/bold green]")
+    else:
+        console.print("[bold red]Failed to trim video.[/bold red]")
+    press_continue()

peg_this/peg_this.py CHANGED Viewed

@@ -13,6 +13,7 @@ from peg_this.features.convert import convert_file, convert_image, resize_image,
 from peg_this.features.crop import crop_video, crop_image
 from peg_this.features.inspect import inspect_file
 from peg_this.features.join import join_videos
+from peg_this.features.subtitle import generate_subtitles
 from peg_this.features.trim import trim_video
 from peg_this.utils.ffmpeg_utils import check_ffmpeg_ffprobe
 from peg_this.utils.ui_utils import select_media_file
@@ -77,6 +78,7 @@ def action_menu(file_path):
             choices=[
                 "Inspect File Details",
                 "Convert",
+                "Generate Subtitles (Whisper)",
                 "Trim Video",
                 "Crop Video (Visual)",
                 "Extract Audio",
@@ -93,6 +95,7 @@ def action_menu(file_path):
         actions = {
             "Inspect File Details": inspect_file,
             "Convert": convert_file,
+            "Generate Subtitles (Whisper)": generate_subtitles,
             "Trim Video": trim_video,
             "Crop Video (Visual)": crop_video,
             "Extract Audio": extract_audio,
@@ -137,7 +140,7 @@ def main_menu():
 def main():
-    """Main entry point for the application script."""
+    """Main entry point for the application."""
     try:
         main_menu()
     except (KeyboardInterrupt, EOFError):

peg-this 4.0.0__py3-none-any.whl → 4.1.0__py3-none-any.whl

peg-this 4.0.0 (py3-none-any.whl) → 4.1.0 (py3-none-any.whl)