PyPI - lattifai - Versions diffs - 1.2.2__py3-none-any.whl → 1.3.0__py3-none-any.whl - Mend

lattifai 1.2.2__py3-none-any.whl → 1.3.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (62) hide show

lattifai/_init.py +20 -0
lattifai/alignment/__init__.py +2 -3
lattifai/alignment/lattice1_aligner.py +117 -4
lattifai/alignment/lattice1_worker.py +47 -4
lattifai/alignment/segmenter.py +3 -2
lattifai/alignment/text_align.py +2 -1
lattifai/alignment/tokenizer.py +56 -29
lattifai/audio2.py +162 -183
lattifai/cli/alignment.py +5 -0
lattifai/cli/caption.py +6 -6
lattifai/cli/transcribe.py +1 -5
lattifai/cli/youtube.py +3 -0
lattifai/client.py +41 -12
lattifai/config/__init__.py +21 -3
lattifai/config/alignment.py +7 -0
lattifai/config/caption.py +13 -243
lattifai/config/client.py +16 -0
lattifai/config/event.py +102 -0
lattifai/config/transcription.py +25 -1
lattifai/data/__init__.py +8 -0
lattifai/data/caption.py +228 -0
lattifai/errors.py +78 -53
lattifai/event/__init__.py +65 -0
lattifai/event/lattifai.py +166 -0
lattifai/mixin.py +22 -17
lattifai/transcription/base.py +2 -1
lattifai/transcription/gemini.py +147 -16
lattifai/transcription/lattifai.py +8 -11
lattifai/types.py +1 -1
lattifai/youtube/client.py +143 -48
{lattifai-1.2.2.dist-info → lattifai-1.3.0.dist-info}/METADATA +117 -54
lattifai-1.3.0.dist-info/RECORD +57 -0
lattifai/__init__.py +0 -88
lattifai/alignment/sentence_splitter.py +0 -350
lattifai/caption/__init__.py +0 -96
lattifai/caption/caption.py +0 -661
lattifai/caption/formats/__init__.py +0 -199
lattifai/caption/formats/base.py +0 -211
lattifai/caption/formats/gemini.py +0 -722
lattifai/caption/formats/json.py +0 -194
lattifai/caption/formats/lrc.py +0 -309
lattifai/caption/formats/nle/__init__.py +0 -9
lattifai/caption/formats/nle/audition.py +0 -561
lattifai/caption/formats/nle/avid.py +0 -423
lattifai/caption/formats/nle/fcpxml.py +0 -549
lattifai/caption/formats/nle/premiere.py +0 -589
lattifai/caption/formats/pysubs2.py +0 -642
lattifai/caption/formats/sbv.py +0 -147
lattifai/caption/formats/tabular.py +0 -338
lattifai/caption/formats/textgrid.py +0 -193
lattifai/caption/formats/ttml.py +0 -652
lattifai/caption/formats/vtt.py +0 -469
lattifai/caption/parsers/__init__.py +0 -9
lattifai/caption/parsers/text_parser.py +0 -147
lattifai/caption/standardize.py +0 -636
lattifai/caption/supervision.py +0 -34
lattifai/caption/utils.py +0 -474
lattifai-1.2.2.dist-info/RECORD +0 -76
{lattifai-1.2.2.dist-info → lattifai-1.3.0.dist-info}/WHEEL +0 -0
{lattifai-1.2.2.dist-info → lattifai-1.3.0.dist-info}/entry_points.txt +0 -0
{lattifai-1.2.2.dist-info → lattifai-1.3.0.dist-info}/licenses/LICENSE +0 -0
{lattifai-1.2.2.dist-info → lattifai-1.3.0.dist-info}/top_level.txt +0 -0

lattifai/caption/formats/nle/avid.py DELETED Viewed

@@ -1,423 +0,0 @@
-"""Avid DS Subtitle format writer for Avid Media Composer integration.
-This module provides functionality to export captions in Avid DS format,
-which is the native format for Avid Media Composer's SubCap plugin.
-Format specification:
-- Header: "@ This file written with the Avid Caption plugin, version 1"
-- Body: Tab-separated timecode (HH:MM:SS:FF) and text
-- Timecodes are frame-based, not millisecond-based
-"""
-from dataclasses import dataclass
-from enum import Enum
-from pathlib import Path
-from typing import List, Optional, Union
-from lhotse.utils import Pathlike
-from ...supervision import Supervision
-from .. import register_writer
-from ..base import FormatReader, FormatWriter
class FrameRate(Enum):
    """Frame rates commonly used in professional video editing.

    Each member's value is the rate in frames per second.

    Note:
        ``FPS_29_97_NDF`` and ``FPS_29_97_DF`` carry the same value (29.97).
        ``Enum`` treats a repeated value as an alias, so ``FPS_29_97_DF`` is
        the very same member as ``FPS_29_97_NDF`` and does not show up when
        iterating over ``FrameRate``. Drop-frame versus non-drop-frame
        therefore cannot be told apart from the member alone.
    """

    # Film transferred with 24p pulldown.
    FPS_23_976 = 23.976
    # Film.
    FPS_24 = 24.0
    # PAL / 25p.
    FPS_25 = 25.0
    # NTSC, non-drop-frame timecode.
    FPS_29_97_NDF = 29.97
    # NTSC, drop-frame timecode (alias of FPS_29_97_NDF, see class note).
    FPS_29_97_DF = 29.97
    # 30p.
    FPS_30 = 30.0
    # PAL 50p.
    FPS_50 = 50.0
    # NTSC 60p.
    FPS_59_94 = 59.94
    # 60p.
    FPS_60 = 60.0
@dataclass
class AvidDSConfig:
    """Options that control how captions are exported to Avid DS text.

    Attributes:
        fps: Frame rate used to turn seconds into frame-based timecode.
        drop_frame: Request drop-frame timecode; only meaningful at 29.97 fps.
        max_line_length: Upper bound on characters per text line
            (Avid SubCap typically limits lines to 32-40 characters).
        include_speaker: Prefix the caption text with the speaker label.
    """

    # Frames per second for timecode calculation.
    fps: float = 25.0
    # Drop-frame timecode switch (for 29.97 fps material).
    drop_frame: bool = False
    # Maximum characters per wrapped line.
    max_line_length: int = 40
    # Whether speaker labels are written in front of the text.
    include_speaker: bool = True
class AvidDSWriter:
    """Writer for Avid DS subtitle format.

    This writer generates files intended for Avid Media Composer's SubCap
    plugin. The output produced by this class is the ``HEADER`` line, one
    blank line, and then one record per supervision in the form
    ``START_TC<TAB>END_TC<TAB>TEXT``. Text longer than the configured line
    length is wrapped on whitespace and the wrapped lines are joined with
    newlines inside the record.

    Example:
        >>> from lattifai.caption import Caption
        >>> from lattifai.caption.formats.nle.avid import AvidDSWriter, AvidDSConfig
        >>> caption = Caption.read("input.srt")
        >>> config = AvidDSConfig(fps=25.0)
        >>> AvidDSWriter.write(caption.supervisions, "output_avid.txt", config)
    """

    # Avid DS file header (required for SubCap plugin)
    HEADER = "@ This file written with the Avid Caption plugin, version 1"

    @classmethod
    def seconds_to_timecode(
        cls,
        seconds: float,
        fps: float = 25.0,
        drop_frame: bool = False,
    ) -> str:
        """Convert seconds to SMPTE timecode (HH:MM:SS:FF).

        Args:
            seconds: Time in seconds; negative values are clamped to 0.
            fps: Frame rate (e.g., 23.976, 24, 25, 29.97, 30)
            drop_frame: Use drop-frame timecode (only honoured for 29.97fps)

        Returns:
            Timecode string in HH:MM:SS:FF format (or HH:MM:SS;FF for drop-frame)

        Note:
            Drop-frame timecode skips frame numbers 0 and 1 at the start of each
            minute except every 10th minute to keep timecode in sync with real time
            for 29.97fps video.

            In the non-drop branch the seconds field is obtained by dividing the
            frame count by ``fps`` itself, so for fractional rates the result is
            elapsed seconds plus residual frames rather than a count on a
            nominal integer timebase.
        """
        if seconds < 0:
            seconds = 0

        if drop_frame and abs(fps - 29.97) < 0.01:
            # Real frame count at 29.97fps.
            total_frames = int(round(seconds * 29.97))

            # 2 labels are skipped every minute except every 10th minute, i.e.
            # 18 per 10-minute block of 17982 real frames. The block
            # compensation must be applied unconditionally: previously it was
            # skipped when the remainder was 0 or 1, so exact 10-minute marks
            # came out 18 frames short (e.g. 600s -> 00:09:59;12).
            ten_minute_blocks, remainder = divmod(total_frames, 17982)
            skipped_labels = 18 * ten_minute_blocks
            if remainder >= 2:
                # Within the block, 2 more labels are skipped per elapsed minute
                # after the first (1798 real frames per dropped minute).
                skipped_labels += 2 * ((remainder - 2) // 1798)
            total_frames += skipped_labels

            frames = total_frames % 30
            total_seconds = total_frames // 30
            secs = total_seconds % 60
            total_minutes = total_seconds // 60
            mins = total_minutes % 60
            hours = total_minutes // 60
            # Drop-frame uses semicolon separator before the frame field
            return f"{hours:02d}:{mins:02d}:{secs:02d};{frames:02d}"

        # Non-drop frame calculation
        total_frames = int(round(seconds * fps))
        frames = int(total_frames % fps)
        total_seconds = int(total_frames // fps)
        secs = total_seconds % 60
        total_minutes = total_seconds // 60
        mins = total_minutes % 60
        hours = total_minutes // 60
        return f"{hours:02d}:{mins:02d}:{secs:02d}:{frames:02d}"

    @classmethod
    def wrap_text(cls, text: str, max_length: int = 40) -> List[str]:
        """Wrap text to fit within maximum line length.

        Text that already fits is returned unchanged as a single line. Longer
        text is split on whitespace and packed greedily; a single word longer
        than ``max_length`` is kept whole on its own line.

        Args:
            text: Text to wrap
            max_length: Maximum characters per line

        Returns:
            List of wrapped lines
        """
        if len(text) <= max_length:
            return [text]

        lines: List[str] = []
        current_line: List[str] = []
        current_length = 0
        for word in text.split():
            # One extra character for the joining space, except for the first word.
            separator = 1 if current_line else 0
            if current_length + separator + len(word) <= max_length:
                current_line.append(word)
                current_length += separator + len(word)
            else:
                if current_line:
                    lines.append(" ".join(current_line))
                current_line = [word]
                current_length = len(word)
        if current_line:
            lines.append(" ".join(current_line))
        return lines

    @classmethod
    def _format_record(cls, sup, config) -> str:
        """Render one supervision as ``START_TC<TAB>END_TC<TAB>TEXT``."""
        start_tc = cls.seconds_to_timecode(sup.start, config.fps, config.drop_frame)
        end_tc = cls.seconds_to_timecode(sup.end, config.fps, config.drop_frame)

        text = sup.text.strip() if sup.text else ""

        # The speaker prefix is written only when enabled, a speaker is set, and
        # the supervision's custom data does not flag "original_speaker" as falsy.
        include_this_speaker = config.include_speaker and sup.speaker
        if include_this_speaker and hasattr(sup, "custom") and sup.custom:
            if not sup.custom.get("original_speaker", True):
                include_this_speaker = False
        if include_this_speaker:
            text = f"{sup.speaker}: {text}"

        # Wrap text to max line length
        text = "\n".join(cls.wrap_text(text, config.max_line_length))
        return f"{start_tc}\t{end_tc}\t{text}"

    @classmethod
    def _render(cls, supervisions, config) -> str:
        """Build the complete file content (header, blank line, records)."""
        if config is None:
            config = AvidDSConfig()
        lines = [cls.HEADER, ""]  # Header + blank line
        lines.extend(cls._format_record(sup, config) for sup in supervisions)
        return "\n".join(lines)

    @classmethod
    def write(
        cls,
        supervisions: List[Supervision],
        output_path: Pathlike,
        config: Optional[AvidDSConfig] = None,
    ) -> Path:
        """Write supervisions to Avid DS format file.

        Args:
            supervisions: List of supervision segments
            output_path: Output file path
            config: Avid DS export configuration (defaults to ``AvidDSConfig()``)

        Returns:
            Path to written file
        """
        content = cls._render(supervisions, config)
        output_path = Path(output_path)
        with open(output_path, "w", encoding="utf-8") as f:
            f.write(content)
        return output_path

    @classmethod
    def to_bytes(
        cls,
        supervisions: List[Supervision],
        config: Optional[AvidDSConfig] = None,
    ) -> bytes:
        """Convert supervisions to Avid DS format bytes.

        Args:
            supervisions: List of supervision segments
            config: Avid DS export configuration (defaults to ``AvidDSConfig()``)

        Returns:
            Avid DS content as UTF-8 encoded bytes
        """
        return cls._render(supervisions, config).encode("utf-8")
@register_writer("avid_ds")
class AvidDSFormat(FormatWriter):
    """Registered ``avid_ds`` writer that forwards to ``AvidDSWriter``."""

    format_id = "avid_ds"
    extensions = [".txt"]
    description = "Avid DS Caption Format"

    @classmethod
    def _make_config(cls, include_speaker: bool, options: dict) -> AvidDSConfig:
        """Build an ``AvidDSConfig`` from caller-supplied keyword options.

        The options word_level, karaoke, karaoke_config and metadata are not
        supported by Avid DS and are discarded; everything else is passed to
        ``AvidDSConfig`` unchanged.
        """
        for unsupported in ("word_level", "karaoke", "karaoke_config", "metadata"):
            options.pop(unsupported, None)
        return AvidDSConfig(include_speaker=include_speaker, **options)

    @classmethod
    def write(
        cls,
        supervisions: List[Supervision],
        output_path: Pathlike,
        include_speaker: bool = True,
        **kwargs,
    ):
        """Export supervisions to an Avid DS file.

        Args:
            supervisions: List of supervision segments
            output_path: Path to output file
            include_speaker: Whether to include speaker labels
            **kwargs: Additional config options (fps, drop_frame, etc.)

        Returns:
            Path to written file
        """
        config = cls._make_config(include_speaker, kwargs)
        return AvidDSWriter.write(supervisions, output_path, config)

    @classmethod
    def to_bytes(
        cls,
        supervisions: List[Supervision],
        include_speaker: bool = True,
        **kwargs,
    ) -> bytes:
        """Serialize supervisions to Avid DS content in memory.

        Args:
            supervisions: List of supervision segments
            include_speaker: Whether to include speaker labels
            **kwargs: Additional config options

        Returns:
            Avid DS content as bytes
        """
        config = cls._make_config(include_speaker, kwargs)
        return AvidDSWriter.to_bytes(supervisions, config)
class AvidDSReader:
    """Reader for Avid DS subtitle format.

    Parses tab-separated ``START_TC<TAB>END_TC<TAB>TEXT`` records. Lines with
    fewer than three tab-separated fields are skipped, so continuation lines
    of multi-line cue text are not recovered.
    """

    @classmethod
    def _timecode_to_seconds(cls, tc: str, fps: float = 25.0) -> float:
        """Convert SMPTE timecode (HH:MM:SS:FF or HH:MM:SS;FF) to seconds.

        Args:
            tc: Timecode string; ``;`` marks drop-frame timecode.
            fps: Frame rate used to convert the frame field.

        Returns:
            Time in seconds, or 0.0 when the timecode does not consist of
            four integer fields.
        """
        is_drop_frame = ";" in tc
        fields = tc.replace(";", ":").split(":")
        if len(fields) != 4:
            return 0.0
        try:
            h, m, s, f = map(int, fields)
        except ValueError:
            # Non-numeric field: treat like any other malformed timecode
            # instead of aborting the whole read.
            return 0.0

        whole_seconds = h * 3600 + m * 60 + s
        if is_drop_frame and abs(fps - 29.97) < 0.01:
            # Drop-frame labels skip 2 frame numbers every minute except every
            # 10th minute; subtract them to get the real frame count before
            # dividing by the frame rate.
            total_minutes = h * 60 + m
            frame_number = whole_seconds * 30 + f - 2 * (total_minutes - total_minutes // 10)
            return frame_number / fps
        return whole_seconds + (f / fps)

    @classmethod
    def read(cls, source: str, normalize_text: bool = True) -> List[Supervision]:
        """Read Avid DS content and return supervisions sorted by start time.

        Args:
            source: Full text content of an Avid DS file.
            normalize_text: Strip surrounding whitespace from each cue text.

        Returns:
            Supervisions for every record whose end time is after its start time.
        """
        supervisions = []
        for raw_line in source.splitlines():
            line = raw_line.strip()
            # Skip blanks, the "@" header and "#" comment lines.
            if not line or line.startswith(("@", "#")):
                continue

            parts = line.split("\t")
            if len(parts) < 3:
                continue
            start_tc, end_tc = parts[0], parts[1]
            # Heuristic: a timecode must contain at least one colon.
            if ":" not in start_tc:
                continue
            # Re-join in case the text itself contained tabs.
            text = "\t".join(parts[2:])

            # The file carries no frame-rate hint: assume 25 fps unless a ';'
            # separator signals drop-frame (29.97).
            fps = 29.97 if (";" in start_tc or ";" in end_tc) else 25.0
            start_sec = cls._timecode_to_seconds(start_tc, fps)
            end_sec = cls._timecode_to_seconds(end_tc, fps)

            if end_sec > start_sec:
                supervisions.append(
                    Supervision(
                        id=str(uuid.uuid4()),
                        recording_id="avid_import",
                        start=start_sec,
                        duration=end_sec - start_sec,
                        text=text.strip() if normalize_text else text,
                    )
                )
        return sorted(supervisions, key=lambda s: s.start)
-import uuid
-from .. import register_reader
@register_reader("avid_ds")
class AvidDSReaderHandler(FormatReader):
    """Registered ``avid_ds`` reader that forwards to ``AvidDSReader``."""

    format_id = "avid_ds"
    extensions = [".txt"]

    @classmethod
    def can_read(cls, path: Union[Pathlike, str]) -> bool:
        """Report whether ``path`` names a ``.txt`` file.

        Only the extension is checked; the file content is not inspected, so
        format detection is left to the caller or to explicit format selection.
        ``is_content`` is not defined in this class (presumably inherited from
        ``FormatReader`` — verify); anything it classifies as content is rejected.
        """
        treated_as_path = isinstance(path, (str, Path)) and not cls.is_content(path)
        if not treated_as_path:
            return False
        return str(path).lower().endswith(".txt")

    @classmethod
    def read(cls, source: Union[Pathlike, str], normalize_text: bool = True, **kwargs) -> List[Supervision]:
        """Parse Avid DS captions from a file path or from raw content.

        A ``str``/``Path`` that ``is_content`` does not classify as content is
        opened as a UTF-8 text file; any other source is converted with
        ``str()`` and parsed directly. Extra keyword arguments are ignored.
        """
        treated_as_path = isinstance(source, (str, Path)) and not cls.is_content(source)
        if treated_as_path:
            content = Path(source).read_text(encoding="utf-8")
        else:
            content = str(source)
        return AvidDSReader.read(content, normalize_text=normalize_text)

lattifai 1.2.2__py3-none-any.whl → 1.3.0__py3-none-any.whl

lattifai 1.2.2__py3-none-any.whl → 1.3.0__py3-none-any.whl