PyPI - lattifai - Versions diffs - 1.2.1__py3-none-any.whl → 1.3.0__py3-none-any.whl - Mend

lattifai 1.2.1py3-none-any.whl → 1.3.0py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (59) hide show

lattifai/_init.py +20 -0
lattifai/alignment/__init__.py +9 -1
lattifai/alignment/lattice1_aligner.py +175 -54
lattifai/alignment/lattice1_worker.py +47 -4
lattifai/alignment/punctuation.py +38 -0
lattifai/alignment/segmenter.py +3 -2
lattifai/alignment/text_align.py +441 -0
lattifai/alignment/tokenizer.py +134 -65
lattifai/audio2.py +162 -183
lattifai/cli/__init__.py +2 -1
lattifai/cli/alignment.py +5 -0
lattifai/cli/caption.py +111 -4
lattifai/cli/transcribe.py +2 -6
lattifai/cli/youtube.py +7 -1
lattifai/client.py +72 -123
lattifai/config/__init__.py +28 -0
lattifai/config/alignment.py +14 -0
lattifai/config/caption.py +45 -31
lattifai/config/client.py +16 -0
lattifai/config/event.py +102 -0
lattifai/config/media.py +20 -0
lattifai/config/transcription.py +25 -1
lattifai/data/__init__.py +8 -0
lattifai/data/caption.py +228 -0
lattifai/diarization/__init__.py +41 -1
lattifai/errors.py +78 -53
lattifai/event/__init__.py +65 -0
lattifai/event/lattifai.py +166 -0
lattifai/mixin.py +49 -32
lattifai/transcription/base.py +8 -2
lattifai/transcription/gemini.py +147 -16
lattifai/transcription/lattifai.py +25 -63
lattifai/types.py +1 -1
lattifai/utils.py +7 -13
lattifai/workflow/__init__.py +28 -4
lattifai/workflow/file_manager.py +2 -5
lattifai/youtube/__init__.py +43 -0
lattifai/youtube/client.py +1265 -0
lattifai/youtube/types.py +23 -0
lattifai-1.3.0.dist-info/METADATA +678 -0
lattifai-1.3.0.dist-info/RECORD +57 -0
{lattifai-1.2.1.dist-info → lattifai-1.3.0.dist-info}/entry_points.txt +1 -2
lattifai/__init__.py +0 -88
lattifai/alignment/sentence_splitter.py +0 -219
lattifai/caption/__init__.py +0 -20
lattifai/caption/caption.py +0 -1467
lattifai/caption/gemini_reader.py +0 -462
lattifai/caption/gemini_writer.py +0 -173
lattifai/caption/supervision.py +0 -34
lattifai/caption/text_parser.py +0 -145
lattifai/cli/app_installer.py +0 -142
lattifai/cli/server.py +0 -44
lattifai/server/app.py +0 -427
lattifai/workflow/youtube.py +0 -577
lattifai-1.2.1.dist-info/METADATA +0 -1134
lattifai-1.2.1.dist-info/RECORD +0 -58
{lattifai-1.2.1.dist-info → lattifai-1.3.0.dist-info}/WHEEL +0 -0
{lattifai-1.2.1.dist-info → lattifai-1.3.0.dist-info}/licenses/LICENSE +0 -0
{lattifai-1.2.1.dist-info → lattifai-1.3.0.dist-info}/top_level.txt +0 -0

lattifai/youtube/client.py ADDED Viewed

@@ -0,0 +1,1265 @@
+"""
+YouTube client for metadata extraction and media download using yt-dlp
+"""
+import asyncio
+import logging
+import os
+import re
+import tempfile
+from pathlib import Path
+from typing import Any, Dict, List, Optional
+try:
+    import yt_dlp
+except ImportError:
+    yt_dlp = None
+from lattifai.caption.config import CAPTION_FORMATS
+from ..errors import LattifAIError
+from ..workflow.base import setup_workflow_logger
+from ..workflow.file_manager import TRANSCRIBE_CHOICE, FileExistenceManager
+from .types import CaptionTrack, VideoMetadata
+logger = logging.getLogger(__name__)
+class YouTubeError(LattifAIError):
+    """Base error for YouTube operations"""
+    pass
+class VideoUnavailableError(YouTubeError):
+    """Video is not available (private, deleted, etc)"""
+    pass
+class YoutubeLoader:
+    """Lightweight YouTube metadata and caption content loader
+    Use this class when you need to:
+    - Fetch video metadata quickly
+    - Get caption content in memory (not save to disk)
+    - Support proxy and cookies configuration
+    """
+    def __init__(self, proxy: Optional[str] = None, cookies: Optional[str] = None):
+        if yt_dlp is None:
+            raise ImportError("yt-dlp is required. Install with `pip install yt-dlp`")
+        # Auto-load from environment if not specified
+        if proxy is None:
+            proxy = os.getenv("YOUTUBE_PROXY")
+        if cookies is None:
+            cookies = os.getenv("YOUTUBE_COOKIE_FILE") or os.getenv("YOUTUBE_COOKIE_BROWSER")
+        self.proxy = proxy
+        self.cookies = cookies
+        # Base configuration for metadata extraction
+        self._base_opts = {
+            "quiet": True,
+            "no_warnings": True,
+            "skip_download": True,
+            "extract_flat": False,  # Need full info for captions
+            "youtube_include_dash_manifest": False,
+            "youtube_include_hls_manifest": False,
+        }
+        if self.proxy:
+            self._base_opts["proxy"] = self.proxy
+            logger.info(f"🌐 Using proxy: {self.proxy}")
+        # Cookie configuration
+        if self.cookies:
+            # Check if it's a browser name (chrome, firefox, safari, etc.)
+            browser_names = ["chrome", "firefox", "safari", "edge", "opera", "brave"]
+            if self.cookies.lower() in browser_names:
+                # Use cookies from browser directly
+                self._base_opts["cookiesfrombrowser"] = (self.cookies.lower(),)
+                logger.info(f"🍪 Using cookies from browser: {self.cookies}")
+            else:
+                # Use cookie file
+                cookie_path = Path(self.cookies).expanduser()
+                if cookie_path.exists():
+                    self._base_opts["cookiefile"] = str(cookie_path)
+                    logger.info(f"🍪 Using cookie file: {cookie_path}")
+                else:
+                    logger.warning(f"⚠️ Cookie file not found: {cookie_path}")
+                    logger.warning("💡 Tip: Run 'yt-dlp --cookies-from-browser chrome' to extract cookies")
+        # Note: player_client configuration is removed to avoid format availability issues
+        # with certain videos. Let yt-dlp automatically select the best client.
+        # Previous config caused "Requested format is not available" errors for some videos.
+    def get_video_info(self, video_id: str) -> Dict[str, Any]:
+        """
+        Fetch basic video metadata and list of available captions.
+        Returns a dict with 'metadata' (VideoMetadata) and 'captions' (List[CaptionTrack]).
+        """
+        url = f"https://www.youtube.com/watch?v={video_id}"
+        opts = {
+            **self._base_opts,
+            "writesubtitles": True,
+            "writeautomaticsub": True,
+        }
+        try:
+            with yt_dlp.YoutubeDL(opts) as ydl:
+                info = ydl.extract_info(url, download=False)
+                # Parse metadata
+                metadata = VideoMetadata(
+                    video_id=info.get("id", video_id),
+                    title=info.get("title", "Unknown"),
+                    description=info.get("description", ""),
+                    duration=float(info.get("duration", 0)),
+                    thumbnail_url=info.get("thumbnail", ""),
+                    channel_name=info.get("uploader", "Unknown"),
+                    view_count=info.get("view_count", 0),
+                    upload_date=info.get("upload_date"),
+                )
+                # Parse captions
+                tracks: List[CaptionTrack] = []
+                # Manual captions
+                subtitles = info.get("subtitles", {})
+                for lang, formats in subtitles.items():
+                    for fmt in formats:
+                        tracks.append(
+                            CaptionTrack(
+                                language_code=lang,
+                                language_name=self._get_lang_name(formats),
+                                kind="manual",
+                                ext=fmt.get("ext", ""),
+                                url=fmt.get("url"),
+                            )
+                        )
+                # Auto captions
+                auto_subs = info.get("automatic_captions", {})
+                for lang, formats in auto_subs.items():
+                    for fmt in formats:
+                        tracks.append(
+                            CaptionTrack(
+                                language_code=lang,
+                                language_name=self._get_lang_name(formats),
+                                kind="asr",
+                                ext=fmt.get("ext", ""),
+                                url=fmt.get("url"),
+                            )
+                        )
+                return {"metadata": metadata, "captions": tracks}
+        except yt_dlp.utils.DownloadError as e:
+            msg = str(e)
+            if "Sign in to confirm" in msg or "not a bot" in msg:
+                # Bot detection error - provide helpful guidance
+                error_msg = (
+                    f"🤖 YouTube Bot Detection: Video {video_id} requires authentication.\n\n"
+                    "Solutions:\n"
+                    "1. Use browser cookies (recommended):\n"
+                    "   loader = YoutubeLoader(cookies='chrome')  # or 'firefox', 'safari'\n\n"
+                    "2. Export cookie file:\n"
+                    "   yt-dlp --cookies-from-browser chrome --cookies cookies.txt <video_url>\n"
+                    "   loader = YoutubeLoader(cookies='cookies.txt')\n\n"
+                    "3. Environment variable:\n"
+                    "   export YOUTUBE_COOKIE_BROWSER=chrome\n\n"
+                    f"Original error: {msg}"
+                )
+                raise VideoUnavailableError(error_msg) from e
+            elif "Private video" in msg:
+                raise VideoUnavailableError(f"Video {video_id} is private") from e
+            raise YouTubeError(f"yt-dlp failed: {msg}") from e
+        except Exception as e:
+            raise YouTubeError(f"Unexpected error: {str(e)}") from e
+    def get_caption(self, video_id: str, lang: str = "en") -> Dict[str, str]:
+        """
+        Fetch transcript for a specific language.
+        Returns a dict with 'content' (raw string) and 'fmt' (format extension).
+        """
+        url = f"https://www.youtube.com/watch?v={video_id}"
+        # We need to download json3 or vtt to parse.
+        # Ideally we want json3 for precision, but yt-dlp prefers vtt/srv3
+        opts = {
+            **self._base_opts,
+            "writesubtitles": True,
+            "writeautomaticsub": True,
+            "subtitleslangs": [lang],
+            "skip_download": True,
+        }
+        try:
+            with yt_dlp.YoutubeDL(opts) as ydl:
+                info = ydl.extract_info(url, download=False)
+                # Look for the requested language in subtitles or automatic_captions
+                subs = info.get("subtitles", {}).get(lang)
+                if not subs:
+                    subs = info.get("automatic_captions", {}).get(lang)
+                if not subs:
+                    raise YouTubeError(f"No captions found for language: {lang}")
+                # Sort to find best format (json3 > vtt > ttml > srv3)
+                best_fmt = self._find_best_format(subs)
+                if not best_fmt or not best_fmt.get("url"):
+                    raise YouTubeError("Could not find a download URL for captions")
+                caption_url = best_fmt["url"]
+                ext = best_fmt.get("ext")
+                content = self._fetch_caption(caption_url)
+                return {"content": content, "fmt": ext}
+        except Exception as e:
+            raise YouTubeError(f"Failed to fetch transcript: {str(e)}") from e
+    def _get_lang_name(self, formats: List[Dict]) -> str:
+        if formats and "name" in formats[0]:
+            return formats[0]["name"]
+        return "Unknown"
+    def _find_best_format(self, formats: List[Dict]) -> Optional[Dict]:
+        # Prefer json3 (best precision), srv3 (word-level timing), then vtt
+        priority = ["json3", "srv3", "vtt", "ttml", "srv2", "srv1"]
+        for fmt_ext in priority:
+            for f in formats:
+                if f.get("ext") == fmt_ext:
+                    return f
+        return formats[0] if formats else None
+    def _fetch_caption(self, url: str) -> str:
+        import requests
+        try:
+            resp = requests.get(url, proxies={"https": self.proxy} if self.proxy else None)
+            resp.raise_for_status()
+            return resp.text
+        except Exception as e:
+            logger.error(f"Error fetching caption: {e}")
+            raise YouTubeError("Failed to fetch caption content") from e
+    def get_audio_url(
+        self,
+        video_id: str,
+        format_preference: str = "m4a",
+        quality: str = "best",
+        audio_track_id: Optional[str] = None,
+    ) -> Dict[str, Any]:
+        """
+        Get direct audio-only stream URL for a YouTube video.
+        Args:
+            video_id: YouTube video ID
+            format_preference: Preferred audio format (m4a, webm, opus)
+            quality: Audio quality - "best" (highest bitrate), "medium" (~128kbps),
+                    "low" (~50kbps), or specific bitrate like "128", "64"
+            audio_track_id: Specific audio track ID for multi-language videos (e.g., "en.2")
+        Returns:
+            Dict with url, mime_type, bitrate, content_length, format_id, ext
+        """
+        url = f"https://www.youtube.com/watch?v={video_id}"
+        # Use base opts (includes proxy and cookie config) + DASH manifest
+        opts = {
+            **self._base_opts,
+            "youtube_include_dash_manifest": True,
+        }
+        try:
+            with yt_dlp.YoutubeDL(opts) as ydl:
+                info = ydl.extract_info(url, download=False)
+                # Get all formats and filter for audio-only (no video track)
+                formats = info.get("formats", [])
+                def is_direct_url(url: str) -> bool:
+                    """Check if URL is a direct stream URL (not HLS manifest)"""
+                    if not url:
+                        return False
+                    # HLS manifests contain these patterns
+                    hls_patterns = ["manifest.googlevideo.com", "/hls_playlist/", ".m3u8"]
+                    return not any(p in url for p in hls_patterns)
+                audio_formats = [
+                    f
+                    for f in formats
+                    if f.get("acodec") not in (None, "none")
+                    and f.get("vcodec") in (None, "none")
+                    and f.get("url")  # Must have a direct URL
+                    and is_direct_url(f.get("url"))  # Exclude HLS manifests
+                ]
+                if not audio_formats:
+                    # Fallback: If no audio-only formats, use lowest resolution video with audio
+                    # This happens with HLS-only videos (e.g., protected content)
+                    logger.warning("No audio-only formats found. Falling back to lowest resolution video with audio.")
+                    audio_formats = [
+                        f
+                        for f in formats
+                        if f.get("acodec") not in (None, "none")
+                        and f.get("vcodec") not in (None, "none")
+                        and f.get("url")
+                        and is_direct_url(f.get("url"))  # Exclude HLS manifests
+                    ]
+                    # Sort by resolution (lowest first) for minimal bandwidth
+                    audio_formats.sort(key=lambda f: f.get("height") or f.get("width") or 9999)
+                if not audio_formats:
+                    # Check if there are HLS-only formats (common for Shorts)
+                    # HLS can still work with server-side streaming (same IP)
+                    hls_with_audio = [f for f in formats if f.get("acodec") not in (None, "none") and f.get("url")]
+                    if hls_with_audio:
+                        logger.warning("Only HLS streams available. Returning HLS URL for server-side streaming.")
+                        # Sort: prefer audio-only, then by resolution (lowest first)
+                        hls_with_audio.sort(
+                            key=lambda f: (
+                                0 if f.get("vcodec") in (None, "none") else 1,
+                                f.get("height") or f.get("width") or 9999,
+                            )
+                        )
+                        audio_formats = hls_with_audio
+                    else:
+                        raise YouTubeError(
+                            "No formats with audio available. YouTube may require authentication for this video."
+                        )
+                # Filter by audio_track_id if specified (for multi-language audio)
+                if audio_track_id:
+                    # yt-dlp uses format_id patterns like "251-0" or "audio_track" field
+                    # Try matching by format_id suffix or audio_track field
+                    track_filtered = [
+                        f
+                        for f in audio_formats
+                        if f.get("audio_track", {}).get("id") == audio_track_id
+                        or (f.get("format_id") and audio_track_id in f.get("format_id", ""))
+                        or f.get("language") == audio_track_id.split(".")[0]  # e.g., "en" from "en.2"
+                    ]
+                    if track_filtered:
+                        audio_formats = track_filtered
+                        logger.info(f"Filtered to {len(audio_formats)} formats for audio_track_id={audio_track_id}")
+                # Parse quality parameter
+                # "best" = highest bitrate, "medium" ~128kbps, "low" ~50kbps
+                quality_tier = quality.lower()
+                if quality_tier == "best":
+                    max_bitrate = float("inf")
+                elif quality_tier == "medium":
+                    max_bitrate = 160  # Allow up to 160kbps for "medium"
+                elif quality_tier == "low":
+                    max_bitrate = 70  # Allow up to 70kbps for "low"
+                elif quality_tier.isdigit():
+                    max_bitrate = int(quality_tier) + 20  # Allow some tolerance
+                else:
+                    max_bitrate = float("inf")  # Default to best
+                # Sort by preference: format match > bitrate (within limit)
+                def score_format(f: Dict) -> tuple:
+                    ext = f.get("ext", "")
+                    ext_match = 2 if ext == format_preference else 0
+                    # Prefer m4a/webm over other formats
+                    common_format = 1 if ext in ("m4a", "webm", "opus") else 0
+                    bitrate = f.get("abr") or f.get("tbr") or 0
+                    # For quality tiers, filter then maximize
+                    if bitrate <= max_bitrate:
+                        quality_score = bitrate  # Higher is better within limit
+                    else:
+                        quality_score = -1000  # Exclude formats exceeding limit
+                    return (ext_match, common_format, quality_score)
+                audio_formats.sort(key=score_format, reverse=True)
+                best = audio_formats[0]
+                # Check if selected format is HLS (requires server-side streaming)
+                best_url = best.get("url", "")
+                is_hls = not is_direct_url(best_url)
+                return {
+                    "url": best_url,
+                    "mime_type": best.get("ext", format_preference),
+                    "bitrate": best.get("abr") or best.get("tbr"),
+                    "sample_rate": best.get("asr"),  # Audio sample rate
+                    "content_length": best.get("filesize") or best.get("filesize_approx"),
+                    "format_id": best.get("format_id"),
+                    "ext": best.get("ext"),
+                    "is_hls": is_hls,  # True = use server streaming, False = use proxy
+                }
+        except yt_dlp.utils.DownloadError as e:
+            msg = str(e)
+            if "Sign in to confirm" in msg or "not a bot" in msg:
+                raise YouTubeError(
+                    f"🤖 YouTube Bot Detection: Cookie configuration required to access this video. "
+                    f"Reference: YoutubeLoader(cookies='chrome') or set environment variable YOUTUBE_COOKIE_BROWSER=chrome. "
+                    f"Original error: {msg}"
+                ) from e
+            raise YouTubeError(f"Failed to get audio URL: {msg}") from e
+        except Exception as e:
+            raise YouTubeError(f"Unexpected error getting audio URL: {str(e)}") from e
+    def get_video_url(self, video_id: str, format_preference: str = "mp4", quality: str = "best") -> Dict[str, Any]:
+        """
+        Get direct video stream URL for a YouTube video.
+        Args:
+            video_id: YouTube video ID
+            format_preference: Preferred video format (mp4, webm)
+            quality: Video quality (best, 1080, 720, 480, 360)
+        Returns:
+            Dict with url, mime_type, width, height, fps, vcodec, acodec, bitrate, content_length, format_id, ext
+        Note:
+            Prioritizes formats that include both video AND audio to avoid silent videos.
+            YouTube separates high-quality video and audio streams; we prefer pre-muxed formats.
+        """
+        url = f"https://www.youtube.com/watch?v={video_id}"
+        # Use base opts (includes proxy and cookie config) + DASH and HLS manifests
+        opts = {
+            **self._base_opts,
+            "youtube_include_dash_manifest": True,
+            "youtube_include_hls_manifest": True,
+        }
+        try:
+            with yt_dlp.YoutubeDL(opts) as ydl:
+                info = ydl.extract_info(url, download=False)
+                # Get all formats
+                formats = info.get("formats", [])
+                def is_direct_url(url: str) -> bool:
+                    """Check if URL is a direct stream URL (not HLS manifest)"""
+                    if not url:
+                        return False
+                    hls_patterns = ["manifest.googlevideo.com", "/hls_playlist/", ".m3u8"]
+                    return not any(p in url for p in hls_patterns)
+                # Filter for video formats:
+                # - Must have video codec
+                # - Must have a URL
+                # - Prefer direct URLs (DASH) over HLS manifests
+                def is_usable_video(f: Dict) -> bool:
+                    if f.get("vcodec") in (None, "none"):
+                        return False
+                    if not f.get("url"):
+                        return False
+                    return True
+                # First try: direct URLs only (exclude HLS)
+                video_formats = [f for f in formats if is_usable_video(f) and is_direct_url(f.get("url", ""))]
+                # Fallback: include HLS if no direct formats
+                if not video_formats:
+                    logger.warning("No direct video URLs found. Falling back to HLS formats.")
+                    video_formats = [f for f in formats if is_usable_video(f)]
+                if not video_formats:
+                    raise YouTubeError("No video formats available")
+                # Parse target height from quality parameter
+                target_height = None
+                if quality != "best" and quality.isdigit():
+                    target_height = int(quality)
+                # Sort by preference: has_audio (MOST IMPORTANT) > format match > resolution > bitrate
+                # YouTube high-quality streams are often video-only; we MUST prefer formats with audio
+                def score_format(f: Dict) -> tuple:
+                    ext = f.get("ext", "")
+                    ext_match = 1 if ext == format_preference else 0
+                    height = f.get("height") or 0
+                    bitrate = f.get("tbr") or f.get("vbr") or 0
+                    # has_audio is now the HIGHEST priority - video without audio is useless for most users
+                    has_audio = 10 if f.get("acodec") not in (None, "none") else 0
+                    # For quality filtering, penalize formats exceeding target
+                    height_score = height
+                    if target_height and height > target_height:
+                        height_score = -1000  # Heavily penalize exceeding target
+                    return (has_audio, ext_match, height_score, bitrate)
+                video_formats.sort(key=score_format, reverse=True)
+                best = video_formats[0]
+                # Check if selected format is HLS
+                best_url = best.get("url", "")
+                is_hls = not is_direct_url(best_url)
+                # Log selection for debugging
+                logger.info(
+                    f"Selected video format: {best.get('format_id')} "
+                    f"({best.get('width')}x{best.get('height')}, "
+                    f"vcodec={best.get('vcodec')}, acodec={best.get('acodec')}, is_hls={is_hls})"
+                )
+                return {
+                    "url": best_url,
+                    "mime_type": best.get("ext", format_preference),
+                    "width": best.get("width"),
+                    "height": best.get("height"),
+                    "fps": best.get("fps"),
+                    "vcodec": best.get("vcodec"),
+                    "acodec": best.get("acodec"),
+                    "bitrate": best.get("tbr") or best.get("vbr"),
+                    "content_length": best.get("filesize") or best.get("filesize_approx"),
+                    "format_id": best.get("format_id"),
+                    "ext": best.get("ext"),
+                    "is_hls": is_hls,
+                }
+        except yt_dlp.utils.DownloadError as e:
+            msg = str(e)
+            if "Sign in to confirm" in msg or "not a bot" in msg:
+                raise YouTubeError(
+                    f"🤖 YouTube Bot Detection: Cookie configuration required to access this video. "
+                    f"Reference: YoutubeLoader(cookies='chrome') or set environment variable YOUTUBE_COOKIE_BROWSER=chrome. "
+                    f"Original error: {msg}"
+                ) from e
+            raise YouTubeError(f"Failed to get video URL: {msg}") from e
+        except Exception as e:
+            raise YouTubeError(f"Unexpected error getting video URL: {str(e)}") from e
+class YouTubeDownloader:
+    """YouTube media and caption file downloader using yt-dlp
+    Use this class when you need to:
+    - Download audio/video files to disk
+    - Download caption files to disk
+    - Manage file existence and overwrite options
+    - Async download support
+    """
+    def __init__(self):
+        if yt_dlp is None:
+            raise ImportError("yt-dlp is required. Install with `pip install yt-dlp`")
+        self.logger = setup_workflow_logger("youtube")
+        self.logger.info(f"yt-dlp version: {yt_dlp.version.__version__}")
+    def _normalize_audio_quality(self, quality: str) -> str:
+        """
+        Normalize quality parameter for audio downloads.
+        Handles cross-type quality values (e.g., video resolution used for audio).
+        Args:
+            quality: Raw quality string
+        Returns:
+            Normalized audio quality string
+        """
+        quality_lower = quality.lower()
+        # Direct audio quality values
+        if quality_lower in ("best", "medium", "low"):
+            return quality_lower
+        # Numeric values need interpretation
+        if quality_lower.isdigit():
+            value = int(quality_lower)
+            # Values > 320 are likely video resolutions, not audio bitrates
+            if value > 320:
+                self.logger.warning(f"⚠️ Quality '{quality}' looks like video resolution, using 'best' for audio")
+                return "best"
+            # Values <= 320 are reasonable audio bitrates
+            return quality_lower
+        # Unknown value, default to best
+        return "best"
+    def _normalize_video_quality(self, quality: str) -> str:
+        """
+        Normalize quality parameter for video downloads.
+        Handles cross-type quality values (e.g., audio bitrate/quality used for video).
+        Args:
+            quality: Raw quality string
+        Returns:
+            Normalized video quality string
+        """
+        quality_lower = quality.lower()
+        # Map audio quality terms to video equivalents
+        if quality_lower == "low":
+            self.logger.info("🎬 Mapping audio quality 'low' to video 360p")
+            return "360"
+        elif quality_lower == "medium":
+            self.logger.info("🎬 Mapping audio quality 'medium' to video 720p")
+            return "720"
+        elif quality_lower == "best":
+            return "best"
+        # Numeric values
+        if quality_lower.isdigit():
+            value = int(quality_lower)
+            # Values <= 320 are likely audio bitrates, not video resolutions
+            if value <= 320:
+                self.logger.warning(f"⚠️ Quality '{quality}' looks like audio bitrate, using 'best' for video")
+                return "best"
+            # Values > 320 are reasonable video resolutions
+            return quality_lower
+        # Unknown value, default to best
+        return "best"
+    def _build_audio_format_selector(self, audio_track_id: Optional[str], quality: str = "best") -> str:
+        """
+        Build yt-dlp format selector string for audio track and quality selection.
+        Args:
+            audio_track_id: Audio track selection:
+                - "original": Select the original audio track (format_id contains "drc")
+                - Language code (e.g., "en", "ja"): Select by language
+                - Format ID (e.g., "251-drc"): Select specific format
+                - None: No filtering
+            quality: Audio quality:
+                - "best": Highest bitrate (default)
+                - "medium": ~128 kbps
+                - "low": ~50 kbps
+                - Numeric string (e.g., "128"): Target bitrate in kbps
+        Returns:
+            yt-dlp format selector string
+        """
+        # Normalize quality for audio context
+        quality_lower = self._normalize_audio_quality(quality)
+        # Build quality filter
+        quality_filter = ""
+        if quality_lower == "medium":
+            quality_filter = "[abr<=160]"
+            self.logger.info("🎵 Audio quality: medium (~128 kbps)")
+        elif quality_lower == "low":
+            quality_filter = "[abr<=70]"
+            self.logger.info("🎵 Audio quality: low (~50 kbps)")
+        elif quality_lower.isdigit():
+            max_bitrate = int(quality_lower) + 20  # Allow some tolerance
+            quality_filter = f"[abr<={max_bitrate}]"
+            self.logger.info(f"🎵 Audio quality: ~{quality_lower} kbps")
+        # "best" = no filter, use bestaudio
+        # Build track filter
+        if audio_track_id is None:
+            return f"bestaudio{quality_filter}/bestaudio/best"
+        if audio_track_id.lower() == "original":
+            self.logger.info("🎵 Selecting original audio track (format_id contains 'drc')")
+            return f"bestaudio[format_id*=drc]{quality_filter}/bestaudio{quality_filter}/bestaudio/best"
+        # Check if it looks like a format_id (contains hyphen or is numeric)
+        if "-" in audio_track_id or audio_track_id.isdigit():
+            self.logger.info(f"🎵 Selecting audio by format_id: {audio_track_id}")
+            return f"bestaudio[format_id={audio_track_id}]{quality_filter}/bestaudio{quality_filter}/bestaudio/best"
+        # Assume it's a language code
+        self.logger.info(f"🎵 Selecting audio by language: {audio_track_id}")
+        return f"bestaudio[language^={audio_track_id}]{quality_filter}/bestaudio{quality_filter}/bestaudio/best"
+    def _build_video_format_selector(self, audio_format_selector: str, quality: str = "best") -> str:
+        """
+        Build yt-dlp format selector string for video with quality selection.
+        Args:
+            audio_format_selector: Audio format selector from _build_audio_format_selector
+            quality: Video quality:
+                - "best": Highest resolution (default)
+                - "low": 360p
+                - "medium": 720p
+                - "1080", "720", "480", "360": Target resolution
+        Returns:
+            yt-dlp format selector string
+        """
+        # Normalize quality for video context
+        quality_lower = self._normalize_video_quality(quality)
+        if quality_lower.isdigit():
+            height = int(quality_lower)
+            self.logger.info(f"🎬 Video quality: {height}p")
+            return f"bestvideo[height<={height}]+{audio_format_selector}/best[height<={height}]/best"
+        # "best" or fallback
+        return f"bestvideo*+{audio_format_selector}/best"
+    @staticmethod
+    def extract_video_id(url: str) -> str:
+        """
+        Extract video ID from YouTube URL
+        Supports various YouTube URL formats:
+        - https://www.youtube.com/watch?v=VIDEO_ID
+        - https://youtu.be/VIDEO_ID
+        - https://www.youtube.com/shorts/VIDEO_ID
+        - https://m.youtube.com/watch?v=VIDEO_ID
+        Returns:
+            Video ID (e.g., 'cprOj8PWepY')
+        """
+        patterns = [
+            r"(?:youtube\.com/watch\?v=|youtu\.be/|youtube\.com/shorts/)([a-zA-Z0-9_-]{11})",
+            r"youtube\.com/embed/([a-zA-Z0-9_-]{11})",
+            r"youtube\.com/v/([a-zA-Z0-9_-]{11})",
+        ]
+        for pattern in patterns:
+            match = re.search(pattern, url)
+            if match:
+                return match.group(1)
+        return "youtube_media"
+    async def get_video_info(self, url: str) -> Dict[str, Any]:
+        """Get video metadata without downloading"""
+        self.logger.info(f"🔍 Extracting video info for: {url}")
+        opts = {
+            "quiet": True,
+            "no_warnings": True,
+            "skip_download": True,
+        }
+        try:
+            # Run in thread pool to avoid blocking
+            loop = asyncio.get_event_loop()
+            def _extract_info():
+                with yt_dlp.YoutubeDL(opts) as ydl:
+                    return ydl.extract_info(url, download=False)
+            metadata = await loop.run_in_executor(None, _extract_info)
+            # Extract relevant info
+            info = {
+                "title": metadata.get("title", "Unknown"),
+                "duration": metadata.get("duration", 0),
+                "uploader": metadata.get("uploader", "Unknown"),
+                "upload_date": metadata.get("upload_date", "Unknown"),
+                "view_count": metadata.get("view_count", 0),
+                "description": metadata.get("description", ""),
+                "thumbnail": metadata.get("thumbnail", ""),
+                "webpage_url": metadata.get("webpage_url", url),
+            }
+            self.logger.info(f'✅ Video info extracted: {info["title"]}')
+            return info
+        except yt_dlp.utils.DownloadError as e:
+            self.logger.error(f"Failed to extract video info: {str(e)}")
+            raise RuntimeError(f"Failed to extract video info: {str(e)}")
+        except Exception as e:
+            self.logger.error(f"Failed to parse video metadata: {str(e)}")
+            raise RuntimeError(f"Failed to parse video metadata: {str(e)}")
+    async def download_media(
+        self,
+        url: str,
+        output_dir: Optional[str] = None,
+        media_format: Optional[str] = None,
+        force_overwrite: bool = False,
+        audio_track_id: Optional[str] = "original",
+        quality: str = "best",
+    ) -> str:
+        """
+        Download media (audio or video) from YouTube URL based on format
+        This is a unified method that automatically selects between audio and video
+        download based on the media format extension.
+        Args:
+            url: YouTube URL
+            output_dir: Output directory (default: temp directory)
+            media_format: Media format - audio (mp3, wav, m4a, aac, opus, ogg, flac, aiff)
+                         or video (mp4, webm, mkv, avi, mov, etc.) (default: mp3)
+            force_overwrite: Skip user confirmation and overwrite existing files
+            audio_track_id: Audio track selection for multi-language videos:
+                - "original": Select the original audio track (default)
+                - Language code (e.g., "en", "ja"): Select by language
+                - Format ID (e.g., "251-drc"): Select specific format
+                - None: No filtering, use yt-dlp default
+            quality: Media quality selection:
+                For audio: "best", "medium", "low", or bitrate like "128"
+                For video: "best", "1080", "720", "480", "360"
+        Returns:
+            Path to downloaded media file
+        """
+        media_format = media_format or "mp3"
+        # Determine if format is audio or video
+        audio_formats = ["mp3", "wav", "m4a", "aac", "opus", "ogg", "flac", "aiff"]
+        is_audio = media_format.lower() in audio_formats
+        if is_audio:
+            self.logger.info(f"🎵 Detected audio format: {media_format}")
+            return await self.download_audio(
+                url=url,
+                output_dir=output_dir,
+                media_format=media_format,
+                force_overwrite=force_overwrite,
+                audio_track_id=audio_track_id,
+                quality=quality,
+            )
+        else:
+            self.logger.info(f"🎬 Detected video format: {media_format}")
+            return await self.download_video(
+                url=url,
+                output_dir=output_dir,
+                video_format=media_format,
+                force_overwrite=force_overwrite,
+                audio_track_id=audio_track_id,
+                quality=quality,
+            )
+    async def _download_media_internal(
+        self,
+        url: str,
+        output_dir: str,
+        media_format: str,
+        is_audio: bool,
+        force_overwrite: bool = False,
+        audio_track_id: Optional[str] = "original",
+        quality: str = "best",
+    ) -> str:
+        """
+        Internal unified method for downloading audio or video from YouTube
+        Args:
+            url: YouTube URL
+            output_dir: Output directory
+            media_format: Media format (audio or video extension)
+            is_audio: True for audio download, False for video download
+            force_overwrite: Skip user confirmation and overwrite existing files
+            audio_track_id: Audio track selection for multi-language videos:
+                - "original": Select the original audio track (default)
+                - Language code (e.g., "en", "ja"): Select by language
+                - Format ID (e.g., "251-drc"): Select specific format
+                - None: No filtering, use yt-dlp default
+            quality: Media quality selection:
+                For audio: "best", "medium", "low", or bitrate like "128"
+                For video: "best", "1080", "720", "480", "360"
+        Returns:
+            Path to downloaded media file
+        """
+        target_dir = Path(output_dir).expanduser()
+        media_type = "audio" if is_audio else "video"
+        emoji = "🎵" if is_audio else "🎬"
+        self.logger.info(f"{emoji} Downloading {media_type} from: {url}")
+        self.logger.info(f"📁 Output directory: {target_dir}")
+        self.logger.info(f'{"🎶" if is_audio else "🎥"} Media format: {media_format}')
+        # Create output directory if it doesn't exist
+        target_dir.mkdir(parents=True, exist_ok=True)
+        # Extract video ID and check for existing files
+        video_id = self.extract_video_id(url)
+        existing_files = FileExistenceManager.check_existing_files(video_id, str(target_dir), [media_format])
+        # Handle existing files
+        if existing_files["media"] and not force_overwrite:
+            if FileExistenceManager.is_interactive_mode():
+                user_choice = FileExistenceManager.prompt_user_confirmation(
+                    {"media": existing_files["media"]}, "media download"
+                )
+                if user_choice == "cancel":
+                    raise RuntimeError("Media download cancelled by user")
+                elif user_choice == "overwrite":
+                    # Continue with download
+                    pass
+                elif user_choice in existing_files["media"]:
+                    # User selected a specific file
+                    return user_choice
+                else:
+                    # Fallback: use first file
+                    self.logger.info(f'✅ Using existing media file: {existing_files["media"][0]}')
+                    return existing_files["media"][0]
+            else:
+                # Non-interactive mode: use existing file
+                self.logger.info(f'✅ Using existing media file: {existing_files["media"][0]}')
+                return existing_files["media"][0]
+        # Generate output filename template
+        output_template = str(target_dir / f"{video_id}.%(ext)s")
+        # Build format selector with audio track and quality filtering
+        audio_format_selector = self._build_audio_format_selector(audio_track_id, quality)
+        # Build yt-dlp options based on media type
+        if is_audio:
+            opts = {
+                "format": audio_format_selector,
+                "postprocessors": [
+                    {
+                        "key": "FFmpegExtractAudio",
+                        "preferredcodec": media_format,
+                        "preferredquality": "0",  # Best quality for conversion
+                    }
+                ],
+                "outtmpl": output_template,
+                "noplaylist": True,
+                "quiet": False,
+                "no_warnings": True,
+            }
+        else:
+            # For video, combine video with selected audio track
+            video_format_selector = self._build_video_format_selector(audio_format_selector, quality)
+            opts = {
+                "format": video_format_selector,
+                "merge_output_format": media_format,
+                "outtmpl": output_template,
+                "noplaylist": True,
+                "quiet": False,
+                "no_warnings": True,
+            }
+        try:
+            # Run in thread pool to avoid blocking
+            loop = asyncio.get_event_loop()
+            def _download():
+                with yt_dlp.YoutubeDL(opts) as ydl:
+                    ydl.download([url])
+            await loop.run_in_executor(None, _download)
+            self.logger.info(f"✅ {media_type.capitalize()} download completed")
+            # Check for expected file format
+            expected_file = target_dir / f"{video_id}.{media_format}"
+            if expected_file.exists():
+                self.logger.info(f"{emoji} Downloaded {media_type}: {expected_file}")
+                return str(expected_file)
+            # Fallback: search for media files with this video_id
+            if is_audio:
+                fallback_extensions = [media_format, "mp3", "wav", "m4a", "aac"]
+            else:
+                fallback_extensions = [media_format, "mp4", "webm", "mkv"]
+            for ext in fallback_extensions:
+                files = list(target_dir.glob(f"{video_id}*.{ext}"))
+                if files:
+                    latest_file = max(files, key=os.path.getctime)
+                    self.logger.info(f"{emoji} Found {media_type} file: {latest_file}")
+                    return str(latest_file)
+            raise RuntimeError(f"Downloaded {media_type} file not found")
+        except yt_dlp.utils.DownloadError as e:
+            self.logger.error(f"Failed to download {media_type}: {str(e)}")
+            raise RuntimeError(f"Failed to download {media_type}: {str(e)}")
+        except Exception as e:
+            self.logger.error(f"Failed to download {media_type}: {str(e)}")
+            raise RuntimeError(f"Failed to download {media_type}: {str(e)}")
+    async def download_audio(
+        self,
+        url: str,
+        output_dir: Optional[str] = None,
+        media_format: Optional[str] = None,
+        force_overwrite: bool = False,
+        audio_track_id: Optional[str] = "original",
+        quality: str = "best",
+    ) -> str:
+        """
+        Download audio from YouTube URL
+        Args:
+            url: YouTube URL
+            output_dir: Output directory (default: temp directory)
+            media_format: Audio format (default: mp3)
+            force_overwrite: Skip user confirmation and overwrite existing files
+            audio_track_id: Audio track selection for multi-language videos
+            quality: Audio quality ("best", "medium", "low", or bitrate like "128")
+        Returns:
+            Path to downloaded audio file
+        """
+        target_dir = output_dir or tempfile.gettempdir()
+        media_format = media_format or "mp3"
+        return await self._download_media_internal(
+            url,
+            target_dir,
+            media_format,
+            is_audio=True,
+            force_overwrite=force_overwrite,
+            audio_track_id=audio_track_id,
+            quality=quality,
+        )
+    async def download_video(
+        self,
+        url: str,
+        output_dir: Optional[str] = None,
+        video_format: str = "mp4",
+        force_overwrite: bool = False,
+        audio_track_id: Optional[str] = "original",
+        quality: str = "best",
+    ) -> str:
+        """
+        Download video from YouTube URL
+        Args:
+            url: YouTube URL
+            output_dir: Output directory (default: temp directory)
+            video_format: Video format
+            force_overwrite: Skip user confirmation and overwrite existing files
+            audio_track_id: Audio track selection for multi-language videos
+            quality: Video quality ("best", "1080", "720", "480", "360")
+        Returns:
+            Path to downloaded video file
+        """
+        target_dir = output_dir or tempfile.gettempdir()
+        return await self._download_media_internal(
+            url,
+            target_dir,
+            video_format,
+            is_audio=False,
+            force_overwrite=force_overwrite,
+            audio_track_id=audio_track_id,
+            quality=quality,
+        )
+    async def download_captions(
+        self,
+        url: str,
+        output_dir: str,
+        force_overwrite: bool = False,
+        source_lang: Optional[str] = None,
+        transcriber_name: Optional[str] = None,
+    ) -> Optional[str]:
+        """
+        Download video captions using yt-dlp
+        Args:
+            url: YouTube URL
+            output_dir: Output directory
+            force_overwrite: Skip user confirmation and overwrite existing files
+            source_lang: Specific caption language/track to download (e.g., 'en')
+                          If None, downloads all available captions
+            transcriber_name: Name of the transcriber (for user prompts)
+        Returns:
+            Path to downloaded transcript file or None if not available
+        """
+        target_dir = Path(output_dir).expanduser()
+        # Create output directory if it doesn't exist
+        target_dir.mkdir(parents=True, exist_ok=True)
+        # Extract video ID and check for existing caption files
+        video_id = self.extract_video_id(url)
+        if not force_overwrite:
+            existing_files = FileExistenceManager.check_existing_files(
+                video_id, str(target_dir), caption_formats=CAPTION_FORMATS
+            )
+            # Handle existing caption files
+            if existing_files["caption"] and not force_overwrite:
+                if FileExistenceManager.is_interactive_mode():
+                    user_choice = FileExistenceManager.prompt_user_confirmation(
+                        {"caption": existing_files["caption"]}, "caption download", transcriber_name=transcriber_name
+                    )
+                    if user_choice == "cancel":
+                        raise RuntimeError("Caption download cancelled by user")
+                    elif user_choice == "overwrite":
+                        # Continue with download
+                        pass
+                    elif user_choice == TRANSCRIBE_CHOICE:
+                        return TRANSCRIBE_CHOICE
+                    elif user_choice in existing_files["caption"]:
+                        # User selected a specific file
+                        caption_file = Path(user_choice)
+                        self.logger.info(f"✅ Using selected caption file: {caption_file}")
+                        return str(caption_file)
+                    else:
+                        # Fallback: use first file
+                        caption_file = Path(existing_files["caption"][0])
+                        self.logger.info(f"✅ Using existing caption file: {caption_file}")
+                        return str(caption_file)
+                else:
+                    caption_file = Path(existing_files["caption"][0])
+                    self.logger.info(f"🔍 Found existing caption: {caption_file}")
+                    return str(caption_file)
+        self.logger.info(f"📥 Downloading caption for: {url}")
+        if source_lang:
+            self.logger.info(f"🎯 Targeting specific caption track: {source_lang}")
+        output_template = str(target_dir / f"{video_id}.%(ext)s")
+        # Configure yt-dlp options for caption download
+        opts = {
+            "skip_download": True,  # Don't download video/audio
+            "writesubtitles": True,
+            "writeautomaticsub": True,
+            "subtitlesformat": "best",
+            "outtmpl": output_template,
+            "quiet": False,
+            "no_warnings": True,
+        }
+        # Add caption language selection if specified
+        if source_lang:
+            opts["subtitleslangs"] = [f"{source_lang}*"]
+        try:
+            # Run in thread pool to avoid blocking
+            loop = asyncio.get_event_loop()
+            def _download_subs():
+                with yt_dlp.YoutubeDL(opts) as ydl:
+                    ydl.download([url])
+            await loop.run_in_executor(None, _download_subs)
+        except yt_dlp.utils.DownloadError as e:
+            error_msg = str(e)
+            # Check for specific error conditions
+            if "No automatic or manual captions found" in error_msg:
+                self.logger.warning("No captions available for this video")
+            elif "HTTP Error 429" in error_msg or "Too Many Requests" in error_msg:
+                self.logger.error("YouTube rate limit exceeded. Please try again later or use a different method.")
+                self.logger.error(
+                    "YouTube rate limit exceeded (HTTP 429). "
+                    "Try again later or use --cookies option with authenticated cookies. "
+                    "See: https://github.com/yt-dlp/yt-dlp/wiki/FAQ#how-do-i-pass-cookies-to-yt-dlp"
+                )
+            else:
+                self.logger.error(f"Failed to download transcript: {error_msg}")
+        except Exception as e:
+            self.logger.error(f"Failed to download transcript: {str(e)}")
+        # Find the downloaded transcript file
+        caption_patterns = [
+            f"{video_id}.*vtt",
+            f"{video_id}.*srt",
+            f"{video_id}.*sub",
+            f"{video_id}.*sbv",
+            f"{video_id}.*ssa",
+            f"{video_id}.*ass",
+        ]
+        caption_files = []
+        for pattern in caption_patterns:
+            _caption_files = list(target_dir.glob(pattern))
+            for caption_file in _caption_files:
+                self.logger.info(f"📥 Downloaded caption: {caption_file}")
+            caption_files.extend(_caption_files)
+        # If only one caption file, return it directly
+        if len(caption_files) == 1:
+            self.logger.info(f"✅ Using caption: {caption_files[0]}")
+            return str(caption_files[0])
+        # Multiple caption files found, let user choose
+        if FileExistenceManager.is_interactive_mode():
+            self.logger.info(f"📋 Found {len(caption_files)} caption files")
+            caption_choice = FileExistenceManager.prompt_file_selection(
+                file_type="caption",
+                files=[str(f) for f in caption_files],
+                operation="use",
+                transcriber_name=transcriber_name,
+            )
+            if caption_choice == "cancel":
+                raise RuntimeError("Caption selection cancelled by user")
+            elif caption_choice == TRANSCRIBE_CHOICE:
+                return caption_choice
+            elif caption_choice:
+                self.logger.info(f"✅ Selected caption: {caption_choice}")
+                return caption_choice
+            elif caption_files:
+                # Fallback to first file
+                self.logger.info(f"✅ Using first caption: {caption_files[0]}")
+                return str(caption_files[0])
+            else:
+                self.logger.warning("No caption files available after download")
+                return None
+        elif caption_files:
+            # Non-interactive mode: use first file
+            self.logger.info(f"✅ Using first caption: {caption_files[0]}")
+            return str(caption_files[0])
+        else:
+            self.logger.warning("No caption files available after download")
+            return None
+    async def list_available_captions(self, url: str) -> List[Dict[str, Any]]:
+        """
+        List all available caption tracks for a YouTube video
+        Args:
+            url: YouTube URL
+        Returns:
+            List of caption track information dictionaries
+        """
+        self.logger.info(f"📋 Listing available captions for: {url}")
+        opts = {
+            "skip_download": True,
+            "listsubtitles": True,
+            "quiet": True,
+            "no_warnings": True,
+        }
+        try:
+            # Run in thread pool to avoid blocking
+            loop = asyncio.get_event_loop()
+            def _get_info():
+                with yt_dlp.YoutubeDL(opts) as ydl:
+                    return ydl.extract_info(url, download=False)
+            info = await loop.run_in_executor(None, _get_info)
+            caption_info = []
+            # Parse manual captions
+            subtitles = info.get("subtitles", {})
+            for lang, formats in subtitles.items():
+                if formats:
+                    format_names = [f.get("ext", "") for f in formats]
+                    lang_name = formats[0].get("name", lang) if formats else lang
+                    caption_info.append(
+                        {"language": lang, "name": lang_name, "formats": format_names, "kind": "manual"}
+                    )
+            # Parse automatic captions
+            auto_subs = info.get("automatic_captions", {})
+            for lang, formats in auto_subs.items():
+                if formats:
+                    format_names = [f.get("ext", "") for f in formats]
+                    lang_name = formats[0].get("name", lang) if formats else lang
+                    caption_info.append({"language": lang, "name": lang_name, "formats": format_names, "kind": "asr"})
+            self.logger.info(f"✅ Found {len(caption_info)} caption tracks")
+            return caption_info
+        except yt_dlp.utils.DownloadError as e:
+            self.logger.error(f"Failed to list captions: {str(e)}")
+            raise RuntimeError(f"Failed to list captions: {str(e)}")
+        except Exception as e:
+            self.logger.error(f"Failed to list captions: {str(e)}")
+            raise RuntimeError(f"Failed to list captions: {str(e)}")

lattifai 1.2.1__py3-none-any.whl → 1.3.0__py3-none-any.whl

lattifai 1.2.1py3-none-any.whl → 1.3.0py3-none-any.whl