lattifai 0.1.4__py3-none-any.whl → 0.1.5__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- lattifai/__init__.py +63 -0
- lattifai/client.py +5 -7
- lattifai/tokenizers/phonemizer.py +1 -1
- lattifai/tokenizers/tokenizer.py +7 -3
- lattifai/workers/lattice1_alpha.py +7 -5
- {lattifai-0.1.4.dist-info → lattifai-0.1.5.dist-info}/METADATA +54 -77
- lattifai-0.1.5.dist-info/RECORD +24 -0
- {lattifai-0.1.4.dist-info → lattifai-0.1.5.dist-info}/entry_points.txt +1 -0
- {lattifai-0.1.4.dist-info → lattifai-0.1.5.dist-info}/top_level.txt +1 -0
- scripts/__init__.py +1 -0
- scripts/install_k2.py +520 -0
- lattifai-0.1.4.dist-info/RECORD +0 -22
- {lattifai-0.1.4.dist-info → lattifai-0.1.5.dist-info}/WHEEL +0 -0
- {lattifai-0.1.4.dist-info → lattifai-0.1.5.dist-info}/licenses/LICENSE +0 -0
lattifai/__init__.py
CHANGED
|
@@ -1,3 +1,7 @@
|
|
|
1
|
+
import os
|
|
2
|
+
import sys
|
|
3
|
+
import warnings
|
|
4
|
+
|
|
1
5
|
from .base_client import LattifAIError
|
|
2
6
|
from .io import SubtitleIO
|
|
3
7
|
|
|
@@ -13,6 +17,65 @@ except Exception:
|
|
|
13
17
|
__version__ = '0.1.0' # fallback version
|
|
14
18
|
|
|
15
19
|
|
|
20
|
+
# Check and auto-install k2 if not present
|
|
21
|
+
def _check_and_install_k2():
|
|
22
|
+
"""Check if k2 is installed and attempt to install it if not."""
|
|
23
|
+
try:
|
|
24
|
+
import k2
|
|
25
|
+
|
|
26
|
+
return True
|
|
27
|
+
except ImportError:
|
|
28
|
+
pass
|
|
29
|
+
|
|
30
|
+
# k2 not found, try to install it
|
|
31
|
+
if os.environ.get('SKIP_K2_INSTALL'):
|
|
32
|
+
warnings.warn(
|
|
33
|
+
'\n' + '=' * 70 + '\n'
|
|
34
|
+
' k2 is not installed and auto-installation is disabled.\n'
|
|
35
|
+
' \n'
|
|
36
|
+
' To use lattifai, please install k2 by running:\n'
|
|
37
|
+
' \n'
|
|
38
|
+
' install-k2\n'
|
|
39
|
+
' \n' + '=' * 70,
|
|
40
|
+
RuntimeWarning,
|
|
41
|
+
stacklevel=2,
|
|
42
|
+
)
|
|
43
|
+
return False
|
|
44
|
+
|
|
45
|
+
print('\n' + '=' * 70)
|
|
46
|
+
print(' k2 is not installed. Attempting to install it now...')
|
|
47
|
+
print(' This is a one-time setup and may take a few minutes.')
|
|
48
|
+
print('=' * 70 + '\n')
|
|
49
|
+
|
|
50
|
+
try:
|
|
51
|
+
# Import and run the installation script
|
|
52
|
+
from scripts.install_k2 import install_k2_main
|
|
53
|
+
|
|
54
|
+
install_k2_main(dry_run=False)
|
|
55
|
+
|
|
56
|
+
print('\n' + '=' * 70)
|
|
57
|
+
print(' k2 has been installed successfully!')
|
|
58
|
+
print('=' * 70 + '\n')
|
|
59
|
+
return True
|
|
60
|
+
except Exception as e:
|
|
61
|
+
warnings.warn(
|
|
62
|
+
'\n' + '=' * 70 + '\n'
|
|
63
|
+
f' Failed to auto-install k2: {e}\n'
|
|
64
|
+
' \n'
|
|
65
|
+
' Please install k2 manually by running:\n'
|
|
66
|
+
' \n'
|
|
67
|
+
' install-k2\n'
|
|
68
|
+
' \n' + '=' * 70,
|
|
69
|
+
RuntimeWarning,
|
|
70
|
+
stacklevel=2,
|
|
71
|
+
)
|
|
72
|
+
return False
|
|
73
|
+
|
|
74
|
+
|
|
75
|
+
# Auto-install k2 on first import
|
|
76
|
+
_check_and_install_k2()
|
|
77
|
+
|
|
78
|
+
|
|
16
79
|
# Lazy import for LattifAI to avoid dependency issues during basic import
|
|
17
80
|
def __getattr__(name):
|
|
18
81
|
if name == 'LattifAI':
|
lattifai/client.py
CHANGED
|
@@ -24,8 +24,9 @@ class LattifAI(SyncAPIClient):
|
|
|
24
24
|
self,
|
|
25
25
|
*,
|
|
26
26
|
api_key: Optional[str] = None,
|
|
27
|
-
|
|
27
|
+
model_name_or_path: str = 'Lattifai/Lattice-1-Alpha',
|
|
28
28
|
device: str = 'cpu',
|
|
29
|
+
base_url: Optional[str] = None,
|
|
29
30
|
timeout: Union[float, int] = 60.0,
|
|
30
31
|
max_retries: int = 2,
|
|
31
32
|
default_headers: Optional[Dict[str, str]] = None,
|
|
@@ -52,19 +53,16 @@ class LattifAI(SyncAPIClient):
|
|
|
52
53
|
)
|
|
53
54
|
|
|
54
55
|
# Initialize components
|
|
55
|
-
model_name_or_path = '/Users/feiteng/GEEK/OmniCaptions/HF_models/Lattice-1-Alpha'
|
|
56
|
-
|
|
57
56
|
if not Path(model_name_or_path).exists():
|
|
58
|
-
from huggingface_hub import
|
|
57
|
+
from huggingface_hub import snapshot_download
|
|
59
58
|
|
|
60
|
-
model_path =
|
|
59
|
+
model_path = snapshot_download(repo_id=model_name_or_path, repo_type='model')
|
|
61
60
|
else:
|
|
62
61
|
model_path = model_name_or_path
|
|
63
62
|
|
|
64
63
|
self.tokenizer = LatticeTokenizer.from_pretrained(
|
|
65
64
|
client_wrapper=self,
|
|
66
|
-
model_path=
|
|
67
|
-
g2p_model_path=f'{model_path}/g2p.bin' if Path(f'{model_path}/g2p.bin').exists() else None,
|
|
65
|
+
model_path=model_path,
|
|
68
66
|
device=device,
|
|
69
67
|
)
|
|
70
68
|
self.worker = Lattice1AlphaWorker(model_path, device=device, num_threads=8)
|
lattifai/tokenizers/tokenizer.py
CHANGED
|
@@ -33,22 +33,26 @@ class LatticeTokenizer:
|
|
|
33
33
|
def from_pretrained(
|
|
34
34
|
client_wrapper: SyncAPIClient,
|
|
35
35
|
model_path: str,
|
|
36
|
-
g2p_model_path: Optional[str] = None,
|
|
37
36
|
device: str = 'cpu',
|
|
38
37
|
compressed: bool = True,
|
|
39
38
|
):
|
|
40
39
|
"""Load tokenizer from exported binary file"""
|
|
40
|
+
from pathlib import Path
|
|
41
|
+
|
|
42
|
+
words_model_path = f'{model_path}/words.bin'
|
|
41
43
|
if compressed:
|
|
42
|
-
with gzip.open(
|
|
44
|
+
with gzip.open(words_model_path, 'rb') as f:
|
|
43
45
|
data = pickle.load(f)
|
|
44
46
|
else:
|
|
45
|
-
with open(
|
|
47
|
+
with open(words_model_path, 'rb') as f:
|
|
46
48
|
data = pickle.load(f)
|
|
47
49
|
|
|
48
50
|
tokenizer = LatticeTokenizer(client_wrapper=client_wrapper)
|
|
49
51
|
tokenizer.words = data['words']
|
|
50
52
|
tokenizer.dictionaries = defaultdict(list, data['dictionaries'])
|
|
51
53
|
tokenizer.oov_word = data['oov_word']
|
|
54
|
+
|
|
55
|
+
g2p_model_path = f'{model_path}/g2p.bin' if Path(f'{model_path}/g2p.bin').exists() else None
|
|
52
56
|
if g2p_model_path:
|
|
53
57
|
tokenizer.g2p_model = G2Phonemizer(g2p_model_path, device=device)
|
|
54
58
|
return tokenizer
|
|
@@ -5,8 +5,9 @@ from typing import Any, BinaryIO, Dict, Tuple, Union
|
|
|
5
5
|
|
|
6
6
|
import numpy as np
|
|
7
7
|
import onnxruntime as ort
|
|
8
|
+
import resampy
|
|
9
|
+
import soundfile as sf
|
|
8
10
|
import torch
|
|
9
|
-
import torchaudio
|
|
10
11
|
from lhotse import FbankConfig
|
|
11
12
|
from lhotse.features.kaldi.layers import Wav2LogFilterBank
|
|
12
13
|
from lhotse.utils import Pathlike
|
|
@@ -58,11 +59,12 @@ class Lattice1AlphaWorker:
|
|
|
58
59
|
|
|
59
60
|
def load_audio(self, audio: Union[Pathlike, BinaryIO]) -> Tuple[torch.Tensor, int]:
|
|
60
61
|
# load audio
|
|
61
|
-
waveform, sample_rate =
|
|
62
|
-
if waveform.
|
|
63
|
-
waveform =
|
|
62
|
+
waveform, sample_rate = sf.read(audio, always_2d=True, dtype='float32')
|
|
63
|
+
if waveform.shape[1] > 1: # TODO: support choose channel
|
|
64
|
+
waveform = np.mean(waveform, axis=1, keepdims=True)
|
|
64
65
|
if sample_rate != self.config['sample_rate']:
|
|
65
|
-
waveform =
|
|
66
|
+
waveform = resampy.resample(waveform, sample_rate, self.config['sample_rate'], axis=0)
|
|
67
|
+
waveform = torch.from_numpy(waveform.T).to(self.device) # (1, L)
|
|
66
68
|
return waveform
|
|
67
69
|
|
|
68
70
|
def alignment(
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: lattifai
|
|
3
|
-
Version: 0.1.
|
|
3
|
+
Version: 0.1.5
|
|
4
4
|
Summary: Lattifai Python SDK: Seamless Integration with Lattifai's Speech and Video AI Services
|
|
5
5
|
Author-email: Lattifai Technologies <tech@lattifai.com>
|
|
6
6
|
Maintainer-email: Lattice <tech@lattifai.com>
|
|
@@ -26,10 +26,10 @@ License: MIT License
|
|
|
26
26
|
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
|
|
27
27
|
SOFTWARE.
|
|
28
28
|
Project-URL: Homepage, https://github.com/lattifai/lattifai-python
|
|
29
|
-
Project-URL: Documentation, https://github.com/lattifai/lattifai-python/
|
|
29
|
+
Project-URL: Documentation, https://github.com/lattifai/lattifai-python/README.md
|
|
30
30
|
Project-URL: Bug Tracker, https://github.com/lattifai/lattifai-python/issues
|
|
31
31
|
Project-URL: Discussions, https://github.com/lattifai/lattifai-python/discussions
|
|
32
|
-
Project-URL: Changelog, https://github.com/lattifai/lattifai-python/CHANGELOG
|
|
32
|
+
Project-URL: Changelog, https://github.com/lattifai/lattifai-python/CHANGELOG.md
|
|
33
33
|
Keywords: lattifai,speech recognition,video analysis,ai,sdk,api client
|
|
34
34
|
Classifier: Development Status :: 5 - Production/Stable
|
|
35
35
|
Classifier: Intended Audience :: Developers
|
|
@@ -54,6 +54,12 @@ Requires-Dist: python-dotenv
|
|
|
54
54
|
Requires-Dist: lhotse>=1.26.0
|
|
55
55
|
Requires-Dist: colorful>=0.5.6
|
|
56
56
|
Requires-Dist: lattifai-core>=0.1.4
|
|
57
|
+
Requires-Dist: pysubs2
|
|
58
|
+
Requires-Dist: praatio
|
|
59
|
+
Requires-Dist: tgt
|
|
60
|
+
Requires-Dist: onnxruntime
|
|
61
|
+
Requires-Dist: resampy
|
|
62
|
+
Requires-Dist: g2p-phonemizer>=0.1.1
|
|
57
63
|
Provides-Extra: numpy
|
|
58
64
|
Requires-Dist: numpy; extra == "numpy"
|
|
59
65
|
Provides-Extra: test
|
|
@@ -70,24 +76,51 @@ Dynamic: license-file
|
|
|
70
76
|
|
|
71
77
|
# LattifAI Python
|
|
72
78
|
|
|
73
|
-
|
|
79
|
+
<!-- <p align="center">
|
|
80
|
+
<a href="https://badge.fury.io/py/lattifai"><img src="https://badge.fury.io/py/lattifai.svg" alt="PyPI version"></a>
|
|
81
|
+
</p> -->
|
|
74
82
|
|
|
75
83
|
[](https://badge.fury.io/py/lattifai)
|
|
76
84
|
|
|
77
|
-
|
|
85
|
+
<p align="center">
|
|
86
|
+
   🖥️ <a href="https://github.com/lattifai/lattifai-python">GitHub</a>    |   🤗 <a href="https://huggingface.co/Lattifai/Lattice-1-Alpha">Lattifai/Lattice-1-Alpha</a>   |    📑 <a href="https://lattifai.com/blogs">Blog</a>    |    <a href="https://discord.gg/gTZqdaBJ"><img src="https://img.shields.io/badge/Discord-Join-5865F2?logo=discord&logoColor=white" alt="Discord" style="vertical-align: middle;"></a>  
|
|
87
|
+
</p>
|
|
88
|
+
|
|
89
|
+
The official Python library for the LattifAI API - Advanced forced alignment and subtitle generation powered by `[Lattifai/Lattice-1-Alpha](https://huggingface.co/Lattifai/Lattice-1-Alpha)` model.
|
|
78
90
|
|
|
79
91
|
## Installation
|
|
80
92
|
|
|
81
93
|
```bash
|
|
82
94
|
pip install lattifai
|
|
95
|
+
|
|
96
|
+
install-k2 # Required: This step must be executed to install k2 dependencies
|
|
83
97
|
```
|
|
84
98
|
|
|
99
|
+
> **⚠️ Important**: After installing `lattifai`, you **must** run `install-k2` to install the required k2 library. The library will not function properly without this step.
|
|
100
|
+
|
|
85
101
|
## GPU Support Status
|
|
86
102
|
|
|
87
|
-
> **🚧 GPU Support Coming Soon**:
|
|
103
|
+
> **🚧 GPU Support Coming Soon**: The current version supports CPU-only processing. NVIDIA GPU and Apple Silicon acceleration will be available in an upcoming release, providing significant performance improvements for large audio files.
|
|
88
104
|
|
|
89
105
|
## Quick Start
|
|
90
106
|
|
|
107
|
+
### Command Line Interface
|
|
108
|
+
|
|
109
|
+
The library provides powerful command-line tools for batch processing and automation.
|
|
110
|
+
|
|
111
|
+
#### Using the Main CLI
|
|
112
|
+
|
|
113
|
+
```bash
|
|
114
|
+
# Show available commands
|
|
115
|
+
lattifai --help
|
|
116
|
+
|
|
117
|
+
# Perform alignment (same as lattifai-align)
|
|
118
|
+
lattifai align input_audio.wav input_subtitle.srt output.srt
|
|
119
|
+
|
|
120
|
+
# Subtitle format conversion
|
|
121
|
+
lattifai subtitle convert input.srt output.vtt
|
|
122
|
+
```
|
|
123
|
+
|
|
91
124
|
### Python API
|
|
92
125
|
|
|
93
126
|
```python
|
|
@@ -97,6 +130,7 @@ from lattifai import LattifAI
|
|
|
97
130
|
# Initialize client
|
|
98
131
|
client = LattifAI(
|
|
99
132
|
api_key=os.environ.get("LATTIFAI_API_KEY"), # Optional if set in environment
|
|
133
|
+
model_name_or_path='Lattifai/Lattice-1-Alpha',
|
|
100
134
|
device='cpu', # Currently only CPU is supported, GPU support coming soon
|
|
101
135
|
)
|
|
102
136
|
|
|
@@ -111,35 +145,6 @@ result = client.alignment(
|
|
|
111
145
|
print(f"Alignment complete! Output saved to: {result}")
|
|
112
146
|
```
|
|
113
147
|
|
|
114
|
-
### Command Line Interface
|
|
115
|
-
|
|
116
|
-
The library provides powerful command-line tools for batch processing and automation.
|
|
117
|
-
|
|
118
|
-
#### Basic Alignment
|
|
119
|
-
|
|
120
|
-
```bash
|
|
121
|
-
# Align audio with subtitle file
|
|
122
|
-
lattifai-align input_audio.wav input_subtitle.srt output_aligned.srt
|
|
123
|
-
|
|
124
|
-
# Specify input format explicitly
|
|
125
|
-
lattifai-align -F srt input_audio.wav transcript.txt output.srt
|
|
126
|
-
|
|
127
|
-
# Auto-detect input format (default)
|
|
128
|
-
lattifai-align input_audio.wav subtitle_file.vtt output.vtt
|
|
129
|
-
```
|
|
130
|
-
|
|
131
|
-
#### Using the Main CLI
|
|
132
|
-
|
|
133
|
-
```bash
|
|
134
|
-
# Show available commands
|
|
135
|
-
lattifai --help
|
|
136
|
-
|
|
137
|
-
# Perform alignment (same as lattifai-align)
|
|
138
|
-
lattifai align input_audio.wav input_subtitle.srt output.srt
|
|
139
|
-
|
|
140
|
-
# Subtitle format conversion
|
|
141
|
-
lattifai subtitle convert input.srt output.vtt
|
|
142
|
-
```
|
|
143
148
|
|
|
144
149
|
#### Supported Input Formats
|
|
145
150
|
|
|
@@ -163,12 +168,11 @@ lattifai subtitle convert input.srt output.vtt
|
|
|
163
168
|
```python
|
|
164
169
|
LattifAI(
|
|
165
170
|
api_key: Optional[str] = None, # API key (or set LATTIFAI_API_KEY env var)
|
|
166
|
-
base_url: Optional[str] = None, # API base URL (or set LATTIFAI_BASE_URL env var)
|
|
167
171
|
device: str = 'cpu', # Device for processing (currently only 'cpu' supported)
|
|
168
172
|
)
|
|
169
173
|
```
|
|
170
174
|
|
|
171
|
-
> **Note**: The `device` parameter currently only supports `'cpu'`. GPU support
|
|
175
|
+
> **Note**: The `device` parameter currently only supports `'cpu'`. GPU support will be available in future releases.
|
|
172
176
|
|
|
173
177
|
#### Methods
|
|
174
178
|
|
|
@@ -194,41 +198,11 @@ def alignment(
|
|
|
194
198
|
**Returns:**
|
|
195
199
|
- Path to output file (if `output_subtitle_path` specified) or alignment results
|
|
196
200
|
|
|
197
|
-
**Example:**
|
|
198
|
-
```python
|
|
199
|
-
# Basic usage
|
|
200
|
-
result = client.alignment("audio.wav", "subtitle.srt")
|
|
201
|
-
|
|
202
|
-
# With explicit format and output path
|
|
203
|
-
result = client.alignment(
|
|
204
|
-
audio="interview.mp3",
|
|
205
|
-
subtitle="transcript.txt",
|
|
206
|
-
format="txt",
|
|
207
|
-
output_subtitle_path="aligned_interview.srt"
|
|
208
|
-
)
|
|
209
|
-
```
|
|
210
|
-
|
|
211
|
-
|
|
212
201
|
## Configuration
|
|
213
202
|
|
|
214
203
|
### Environment Variables
|
|
215
204
|
|
|
216
205
|
- `LATTIFAI_API_KEY`: Your LattifAI API key (required)
|
|
217
|
-
- `LATTIFAI_BASE_URL`: Base URL for the API (default: `https://api.lattifai.com/v1`)
|
|
218
|
-
|
|
219
|
-
### Device Configuration
|
|
220
|
-
|
|
221
|
-
> **Note**: GPU/CUDA support is currently under development and will be available in a future release. Currently, only CPU processing is supported.
|
|
222
|
-
|
|
223
|
-
The library is designed to support both CPU and GPU processing:
|
|
224
|
-
|
|
225
|
-
```python
|
|
226
|
-
# CPU processing (currently supported)
|
|
227
|
-
client = LattifAI(device='cpu')
|
|
228
|
-
|
|
229
|
-
# GPU processing (coming soon)
|
|
230
|
-
# client = LattifAI(device='cuda') # Will be available in future releases
|
|
231
|
-
```
|
|
232
206
|
|
|
233
207
|
### Performance Tuning
|
|
234
208
|
|
|
@@ -236,11 +210,11 @@ For better performance with large files:
|
|
|
236
210
|
|
|
237
211
|
```python
|
|
238
212
|
client = LattifAI(
|
|
239
|
-
device='cpu', # Currently only CPU is supported
|
|
213
|
+
device='cpu', # Currently only CPU is supported, cuda/mps will be supported in upcoming releases.
|
|
240
214
|
)
|
|
241
215
|
```
|
|
242
216
|
|
|
243
|
-
> **GPU Acceleration**: CUDA support is in active development and will significantly improve processing speed for large audio files. Expected in upcoming releases.
|
|
217
|
+
> **GPU Acceleration**: CUDA and Apple Silicon(MPS) support is in active development and will significantly improve processing speed for large audio files. Expected in upcoming releases.
|
|
244
218
|
|
|
245
219
|
## Examples
|
|
246
220
|
|
|
@@ -340,7 +314,7 @@ except Exception as e:
|
|
|
340
314
|
|
|
341
315
|
## Model Information
|
|
342
316
|
|
|
343
|
-
This library uses the **Lattice-1-Alpha** model for high-quality forced alignment and subtitle generation.
|
|
317
|
+
This library uses the **[Lattice-1-Alpha](https://huggingface.co/Lattifai/Lattice-1-Alpha)** model for high-quality forced alignment and subtitle generation.
|
|
344
318
|
|
|
345
319
|
### Model Features
|
|
346
320
|
- **High Accuracy**: State-of-the-art alignment precision
|
|
@@ -360,7 +334,7 @@ This library uses the **Lattice-1-Alpha** model for high-quality forced alignmen
|
|
|
360
334
|
- **Core Dependencies**:
|
|
361
335
|
- httpx (HTTP client)
|
|
362
336
|
- lhotse (audio processing)
|
|
363
|
-
-
|
|
337
|
+
- k2 (audio computation)
|
|
364
338
|
- python-dotenv (environment management)
|
|
365
339
|
- click (command line interface)
|
|
366
340
|
|
|
@@ -397,21 +371,24 @@ To manually run these tools:
|
|
|
397
371
|
|
|
398
372
|
```bash
|
|
399
373
|
# Sort imports
|
|
400
|
-
isort src/ tests/
|
|
374
|
+
isort src/ tests/ scripts/
|
|
401
375
|
|
|
402
376
|
# Run linter
|
|
403
|
-
ruff check src/ tests/
|
|
377
|
+
ruff check src/ tests/ scripts/
|
|
404
378
|
|
|
405
379
|
# Run formatter
|
|
406
|
-
ruff format src/ tests/
|
|
380
|
+
ruff format src/ tests/ scripts/
|
|
407
381
|
|
|
408
382
|
# Fix issues automatically
|
|
409
|
-
ruff check --fix src/ tests/
|
|
383
|
+
ruff check --fix src/ tests/ scripts/
|
|
410
384
|
```
|
|
411
385
|
|
|
412
386
|
### Running Tests
|
|
413
387
|
|
|
414
388
|
```bash
|
|
389
|
+
# Install test dependencies first
|
|
390
|
+
pip install -e ".[test]"
|
|
391
|
+
|
|
415
392
|
# Run all tests
|
|
416
393
|
pytest
|
|
417
394
|
|
|
@@ -461,7 +438,7 @@ This project is licensed under the Apache License 2.0 - see the [LICENSE](LICENS
|
|
|
461
438
|
|
|
462
439
|
## Support
|
|
463
440
|
|
|
464
|
-
- **Documentation**: [API Documentation](https://github.com/lattifai/lattifai-python/
|
|
441
|
+
- **Documentation**: [API Documentation](https://github.com/lattifai/lattifai-python/README.md)
|
|
465
442
|
- **Issues**: [GitHub Issues](https://github.com/lattifai/lattifai-python/issues)
|
|
466
443
|
- **Discussions**: [GitHub Discussions](https://github.com/lattifai/lattifai-python/discussions)
|
|
467
|
-
- **Changelog**: [CHANGELOG.md](https://github.com/lattifai/lattifai-python/CHANGELOG)
|
|
444
|
+
- **Changelog**: [CHANGELOG.md](https://github.com/lattifai/lattifai-python/CHANGELOG.md)
|
|
@@ -0,0 +1,24 @@
|
|
|
1
|
+
lattifai/__init__.py,sha256=wPE3D03AK8Ktu2WFXqJ6rx6jvPVWKstFQgyPq0tndUU,2324
|
|
2
|
+
lattifai/base_client.py,sha256=ktFtATjL9pLSJUD-VqeJKA1FHkrsGHX7Uq_x00H7gO8,3322
|
|
3
|
+
lattifai/client.py,sha256=p9mFkyOINKBGB87TE6P4y6Z3fPOPSqi6HAyz00TMuag,4520
|
|
4
|
+
lattifai/bin/__init__.py,sha256=7YhmtEM8kbxJtz2-KIskvpLKBZAvkMSceVx8z4fkgQ4,61
|
|
5
|
+
lattifai/bin/align.py,sha256=uX8VaATzn8CgdHUtry1ZGhXiz0Jr89ELdfRK6GWC1t8,989
|
|
6
|
+
lattifai/bin/cli_base.py,sha256=4xlN4cnJZh54ErhHUHgJpyVsrcB-ftwniFzRQL_7SlU,289
|
|
7
|
+
lattifai/bin/subtitle.py,sha256=bUWImAHpvyY59Vskqb5loQiD5ytQOxR8lTQRiQ4LyNA,647
|
|
8
|
+
lattifai/io/__init__.py,sha256=vHWRN7MvAch-GUeFqqO-gM57SM-4YOpGUjIxFJdjfPA,671
|
|
9
|
+
lattifai/io/reader.py,sha256=ErPnPMUvYQpjZ7Vd86EsHUkOcEfKdoI8iM3yKHRzSOQ,2576
|
|
10
|
+
lattifai/io/supervision.py,sha256=5UfSsgBhXoDU3-6drDtoD7y8HIiA4xRKZnbOKgeejwM,354
|
|
11
|
+
lattifai/io/writer.py,sha256=1eAEFLlL8kricxRDPFBtVmeC4IiFyFnjbWXvw0VU-q4,2036
|
|
12
|
+
lattifai/tokenizers/__init__.py,sha256=aqv44PDtq6g3oFFKW_l4HSR5ywT5W8eP1dHHywIvBfs,72
|
|
13
|
+
lattifai/tokenizers/phonemizer.py,sha256=SfRi1KIMpmaao6OVmR1h_I_3QU-vrE6D5bh72Afg5XM,1759
|
|
14
|
+
lattifai/tokenizers/tokenizer.py,sha256=u4lgS6-jN9cLuMNIojA4Swfsqb1EcyI7Bh_iw7tuL-s,5818
|
|
15
|
+
lattifai/workers/__init__.py,sha256=s6YfkIq4FDIAzY9sPjRpXnJfszj2repqnMTqydRM5Zw,83
|
|
16
|
+
lattifai/workers/lattice1_alpha.py,sha256=5OJ6APnFpWvi1azKlkbJqF85e2n5JyZ_m8L1XQ2r3qg,4862
|
|
17
|
+
lattifai-0.1.5.dist-info/licenses/LICENSE,sha256=LNuoH5jpXXNKgjQ3XLwztFq8D3O7kZI-LSg81o4ym2M,1065
|
|
18
|
+
scripts/__init__.py,sha256=4nwVNeJeEuGiWGBACgySViLlm5DrqcvFOWpo7Ds8MUA,49
|
|
19
|
+
scripts/install_k2.py,sha256=iGdy_VZrwaBJfdKy5EDvPX0x5V4dH_lm3f8DEiVWcOQ,21166
|
|
20
|
+
lattifai-0.1.5.dist-info/METADATA,sha256=LsJCRZPTmnuF279cKjO6jtK1ZzG8JrL0sEnOfjvoNxk,13644
|
|
21
|
+
lattifai-0.1.5.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
|
|
22
|
+
lattifai-0.1.5.dist-info/entry_points.txt,sha256=CwTI2NbJvF9msIHboAfTA99cmDr_HOWoODjS8R64JOw,131
|
|
23
|
+
lattifai-0.1.5.dist-info/top_level.txt,sha256=-OVWZ68YYFcTN13ARkLasp2OUappe9wEVq-CKes7jM4,17
|
|
24
|
+
lattifai-0.1.5.dist-info/RECORD,,
|
scripts/__init__.py
ADDED
|
@@ -0,0 +1 @@
|
|
|
1
|
+
"""Scripts for lattifai package installation."""
|
scripts/install_k2.py
ADDED
|
@@ -0,0 +1,520 @@
|
|
|
1
|
+
#!/usr/bin/env python3
|
|
2
|
+
# -*- coding: utf-8 -*-
|
|
3
|
+
|
|
4
|
+
"""
|
|
5
|
+
Auto-install the latest k2 wheel that matches the current machine.
|
|
6
|
+
- Prints in English.
|
|
7
|
+
- Sources:
|
|
8
|
+
Linux CUDA wheels: https://k2-fsa.github.io/k2/installation/pre-compiled-cuda-wheels-linux/index.html
|
|
9
|
+
macOS CPU wheels: https://k2-fsa.github.io/k2/installation/pre-compiled-cpu-wheels-macos/index.html
|
|
10
|
+
Windows CPU wheels: https://k2-fsa.github.io/k2/installation/pre-compiled-cpu-wheels-windows/index.html
|
|
11
|
+
|
|
12
|
+
Usage:
|
|
13
|
+
python install_k2_auto.py # install immediately
|
|
14
|
+
python install_k2_auto.py --dry-run # only show what would be installed
|
|
15
|
+
"""
|
|
16
|
+
|
|
17
|
+
import argparse
|
|
18
|
+
import os
|
|
19
|
+
import platform
|
|
20
|
+
import re
|
|
21
|
+
import subprocess
|
|
22
|
+
import sys
|
|
23
|
+
import urllib.request
|
|
24
|
+
from html.parser import HTMLParser
|
|
25
|
+
from typing import List, Optional, Tuple
|
|
26
|
+
|
|
27
|
+
os.environ['KMP_DUPLICATE_LIB_OK'] = 'TRUE'
|
|
28
|
+
os.environ['OMP_NUM_THREADS'] = '4'
|
|
29
|
+
|
|
30
|
+
CUDA_LINUX_URL = 'https://k2-fsa.github.io/k2/installation/pre-compiled-cuda-wheels-linux/index.html'
|
|
31
|
+
MAC_CPU_URL = 'https://k2-fsa.github.io/k2/installation/pre-compiled-cpu-wheels-macos/index.html'
|
|
32
|
+
WIN_CPU_URL = 'https://k2-fsa.github.io/k2/installation/pre-compiled-cpu-wheels-windows/index.html'
|
|
33
|
+
|
|
34
|
+
|
|
35
|
+
class WheelLinkParser(HTMLParser):
|
|
36
|
+
def __init__(self, parse_mode='wheels'):
|
|
37
|
+
super().__init__()
|
|
38
|
+
self.links: List[str] = []
|
|
39
|
+
self.parse_mode = parse_mode # 'wheels' or 'versions'
|
|
40
|
+
|
|
41
|
+
def handle_starttag(self, tag, attrs):
|
|
42
|
+
if tag.lower() == 'a':
|
|
43
|
+
href = dict(attrs).get('href')
|
|
44
|
+
if href:
|
|
45
|
+
if self.parse_mode == 'wheels' and href.endswith('.whl'):
|
|
46
|
+
self.links.append(href)
|
|
47
|
+
elif self.parse_mode == 'versions' and re.match(r'^\d+\.\d+\.\d+\.html$', href):
|
|
48
|
+
# Match version links like "2.8.0.html"
|
|
49
|
+
self.links.append(href)
|
|
50
|
+
|
|
51
|
+
|
|
52
|
+
def fetch_wheel_links(
|
|
53
|
+
page_url: str, target_torch_version: Optional[str] = None, cuda_version: Optional[str] = None
|
|
54
|
+
) -> List[str]:
|
|
55
|
+
"""
|
|
56
|
+
Fetch wheel links from k2 pages. The structure is:
|
|
57
|
+
- Index page contains links to version-specific pages (e.g., 2.8.0.html)
|
|
58
|
+
- Version pages contain actual .whl file links
|
|
59
|
+
|
|
60
|
+
Args:
|
|
61
|
+
page_url: The base URL to fetch wheels from
|
|
62
|
+
target_torch_version: If specified, only fetch wheels for this torch version (e.g., "2.8.0")
|
|
63
|
+
cuda_version: If specified, prefer wheels with this CUDA version (e.g., "12.1")
|
|
64
|
+
"""
|
|
65
|
+
with urllib.request.urlopen(page_url) as resp:
|
|
66
|
+
html = resp.read().decode('utf-8', errors='ignore')
|
|
67
|
+
|
|
68
|
+
# First, try to find version page links
|
|
69
|
+
version_parser = WheelLinkParser(parse_mode='versions')
|
|
70
|
+
version_parser.feed(html)
|
|
71
|
+
|
|
72
|
+
if version_parser.links:
|
|
73
|
+
# If we found version links, this is an index page
|
|
74
|
+
# Filter version links if target_torch_version is specified
|
|
75
|
+
version_links_to_process = version_parser.links
|
|
76
|
+
if target_torch_version:
|
|
77
|
+
target_filename = f'{target_torch_version}.html'
|
|
78
|
+
version_links_to_process = [link for link in version_parser.links if link == target_filename]
|
|
79
|
+
if not version_links_to_process:
|
|
80
|
+
print(f'[WARN] No page found for torch version {target_torch_version}')
|
|
81
|
+
return []
|
|
82
|
+
print(f'[INFO] Found torch version {target_torch_version}, fetching wheels from {target_filename}')
|
|
83
|
+
else:
|
|
84
|
+
# If no target version specified, choose the highest version (latest torch version)
|
|
85
|
+
def parse_version_from_link(link: str) -> Tuple[int, int, int]:
|
|
86
|
+
# Extract version from "2.8.0.html" -> (2, 8, 0)
|
|
87
|
+
match = re.match(r'^(\d+)\.(\d+)\.(\d+)\.html$', link)
|
|
88
|
+
if match:
|
|
89
|
+
return (int(match.group(1)), int(match.group(2)), int(match.group(3)))
|
|
90
|
+
return (0, 0, 0)
|
|
91
|
+
|
|
92
|
+
# Sort by version and take the highest
|
|
93
|
+
sorted_versions = sorted(version_parser.links, key=parse_version_from_link, reverse=True)
|
|
94
|
+
if sorted_versions:
|
|
95
|
+
latest_version = sorted_versions[0]
|
|
96
|
+
version_links_to_process = [latest_version]
|
|
97
|
+
version_str = latest_version.replace('.html', '')
|
|
98
|
+
print(f'[INFO] No target torch version specified, using latest version: {version_str}')
|
|
99
|
+
|
|
100
|
+
# Fetch wheel links from version pages
|
|
101
|
+
all_wheel_links = []
|
|
102
|
+
base_url = page_url.rsplit('/', 1)[0]
|
|
103
|
+
py_tag, abi_tag = py_tags()
|
|
104
|
+
|
|
105
|
+
for version_link in version_links_to_process:
|
|
106
|
+
version_url = f'{base_url}/{version_link}'
|
|
107
|
+
try:
|
|
108
|
+
with urllib.request.urlopen(version_url) as resp:
|
|
109
|
+
version_html = resp.read().decode('utf-8', errors='ignore')
|
|
110
|
+
wheel_parser = WheelLinkParser(parse_mode='wheels')
|
|
111
|
+
wheel_parser.feed(version_html)
|
|
112
|
+
|
|
113
|
+
# If target version specified or using latest version, find matching wheels
|
|
114
|
+
if target_torch_version or len(version_links_to_process) == 1:
|
|
115
|
+
matching_wheels = []
|
|
116
|
+
for wheel_link in wheel_parser.links:
|
|
117
|
+
if py_tag in wheel_link and abi_tag in wheel_link:
|
|
118
|
+
matching_wheels.append(wheel_link)
|
|
119
|
+
|
|
120
|
+
if cuda_version and matching_wheels:
|
|
121
|
+
# First try to find wheels with the specified CUDA version
|
|
122
|
+
cuda_specific_wheels = []
|
|
123
|
+
for wheel_link in matching_wheels:
|
|
124
|
+
wheel_cuda = parse_cuda_from_filename(wheel_link)
|
|
125
|
+
if wheel_cuda and wheel_cuda == cuda_version:
|
|
126
|
+
cuda_specific_wheels.append(wheel_link)
|
|
127
|
+
|
|
128
|
+
if cuda_specific_wheels:
|
|
129
|
+
# Found wheels with specified CUDA version, pick the latest one by dev date
|
|
130
|
+
def sort_by_devdate(wheel: str) -> int:
|
|
131
|
+
return parse_devdate(wheel) or 0
|
|
132
|
+
|
|
133
|
+
best_wheel = max(cuda_specific_wheels, key=sort_by_devdate)
|
|
134
|
+
print(
|
|
135
|
+
f'[INFO] Found matching wheel for Python {py_tag} and CUDA {cuda_version}: {best_wheel}'
|
|
136
|
+
)
|
|
137
|
+
return [best_wheel] if best_wheel.startswith('http') else [best_wheel]
|
|
138
|
+
else:
|
|
139
|
+
print(f'[WARN] No wheel found for CUDA {cuda_version}, falling back to latest version')
|
|
140
|
+
|
|
141
|
+
# If no CUDA version specified or no matching CUDA wheels found, use the latest wheel
|
|
142
|
+
if matching_wheels:
|
|
143
|
+
|
|
144
|
+
def sort_by_devdate(wheel: str) -> int:
|
|
145
|
+
return parse_devdate(wheel) or 0
|
|
146
|
+
|
|
147
|
+
best_wheel = max(matching_wheels, key=sort_by_devdate)
|
|
148
|
+
cuda_info = (
|
|
149
|
+
f' (CUDA {parse_cuda_from_filename(best_wheel)})'
|
|
150
|
+
if parse_cuda_from_filename(best_wheel)
|
|
151
|
+
else ''
|
|
152
|
+
)
|
|
153
|
+
print(f'[INFO] Found matching wheel for Python {py_tag}{cuda_info}: {best_wheel}')
|
|
154
|
+
return [best_wheel]
|
|
155
|
+
|
|
156
|
+
version_str = version_link.replace('.html', '')
|
|
157
|
+
print(f'[WARN] No wheel found for Python {py_tag} in torch {version_str}')
|
|
158
|
+
else:
|
|
159
|
+
all_wheel_links.extend(wheel_parser.links)
|
|
160
|
+
except Exception as e:
|
|
161
|
+
print(f'[WARN] Failed to fetch {version_url}: {e}')
|
|
162
|
+
continue
|
|
163
|
+
|
|
164
|
+
# If target version specified or latest version but no matching wheel found
|
|
165
|
+
if target_torch_version or len(version_links_to_process) == 1:
|
|
166
|
+
return []
|
|
167
|
+
|
|
168
|
+
# Normalize to absolute URLs for all wheels case
|
|
169
|
+
abs_links = []
|
|
170
|
+
for href in all_wheel_links:
|
|
171
|
+
if href.startswith('http://') or href.startswith('https://'):
|
|
172
|
+
abs_links.append(href)
|
|
173
|
+
else:
|
|
174
|
+
# For huggingface links, they are already absolute in the href
|
|
175
|
+
abs_links.append(href)
|
|
176
|
+
return abs_links
|
|
177
|
+
|
|
178
|
+
else:
|
|
179
|
+
raise ValueError('No version links found on the page; unexpected page structure.')
|
|
180
|
+
|
|
181
|
+
|
|
182
|
+
def py_tags() -> Tuple[str, str]:
|
|
183
|
+
"""Return (py_tag, abi_tag), e.g. ('cp310', 'cp310') for CPython."""
|
|
184
|
+
impl = platform.python_implementation().lower()
|
|
185
|
+
if impl != 'cpython':
|
|
186
|
+
# Wheels are for CPython; still try cpXY
|
|
187
|
+
pass
|
|
188
|
+
major, minor = sys.version_info.major, sys.version_info.minor
|
|
189
|
+
tag = f'cp{major}{minor}'
|
|
190
|
+
return tag, tag
|
|
191
|
+
|
|
192
|
+
|
|
193
|
+
def detect_torch_version() -> Optional[str]:
|
|
194
|
+
"""
|
|
195
|
+
Detect installed PyTorch version string like '2.8.0'.
|
|
196
|
+
Returns None if PyTorch is not installed.
|
|
197
|
+
"""
|
|
198
|
+
try:
|
|
199
|
+
import importlib
|
|
200
|
+
|
|
201
|
+
torch = importlib.import_module('torch')
|
|
202
|
+
version = getattr(torch, '__version__', None)
|
|
203
|
+
if version:
|
|
204
|
+
# Extract major.minor.patch from version string (remove +cu118 etc suffixes)
|
|
205
|
+
version_match = re.match(r'(\d+\.\d+\.\d+)', str(version))
|
|
206
|
+
if version_match:
|
|
207
|
+
return version_match.group(1)
|
|
208
|
+
except Exception:
|
|
209
|
+
pass
|
|
210
|
+
return None
|
|
211
|
+
|
|
212
|
+
|
|
213
|
+
def detect_cuda_version_linux() -> Optional[str]:
|
|
214
|
+
"""
|
|
215
|
+
Detect CUDA version string like '12.1'.
|
|
216
|
+
Priority: torch.version.cuda -> nvidia-smi -> None
|
|
217
|
+
"""
|
|
218
|
+
# Try PyTorch if installed
|
|
219
|
+
try:
|
|
220
|
+
import importlib
|
|
221
|
+
|
|
222
|
+
torch = importlib.import_module('torch')
|
|
223
|
+
v = getattr(getattr(torch, 'version', None), 'cuda', None)
|
|
224
|
+
if v:
|
|
225
|
+
return str(v)
|
|
226
|
+
except Exception:
|
|
227
|
+
pass
|
|
228
|
+
|
|
229
|
+
# # Try nvidia-smi
|
|
230
|
+
# try:
|
|
231
|
+
# out = subprocess.check_output(["nvidia-smi"], stderr=subprocess.STDOUT, text=True)
|
|
232
|
+
# m = re.search(r"CUDA Version:\s*([\d.]+)", out)
|
|
233
|
+
# if m:
|
|
234
|
+
# return m.group(1)
|
|
235
|
+
# except Exception:
|
|
236
|
+
# pass
|
|
237
|
+
|
|
238
|
+
return None
|
|
239
|
+
|
|
240
|
+
|
|
241
|
+
def parse_cuda_from_filename(name: str) -> Optional[str]:
    """Extract the CUDA version ('12.1', '11.8', ...) from a wheel name, else None."""
    found = re.search(r'cuda(\d+(?:\.\d+)?)', name)
    if found is None:
        return None
    return found.group(1)
|
|
245
|
+
|
|
246
|
+
|
|
247
|
+
def parse_devdate(name: str) -> Optional[int]:
    """Return the 8-digit dev snapshot date (e.g. 20240606) in a wheel name, or None."""
    found = re.search(r'dev(\d{8})', name)
    return None if found is None else int(found.group(1))
|
|
251
|
+
|
|
252
|
+
|
|
253
|
+
def parse_version_tuple(name: str) -> Tuple[int, ...]:
    """Parse the k2 version embedded in a wheel name into an int tuple; () if absent."""
    found = re.search(r'k2-([\d]+(?:\.[\d]+)*)', name)
    if found is None:
        return ()
    return tuple(int(piece) for piece in found.group(1).split('.'))
|
|
259
|
+
|
|
260
|
+
|
|
261
|
+
def best_match_cuda(candidates: List[str], installed_cuda: Optional[str]) -> List[str]:
    """Narrow *candidates* to CUDA wheels for the most appropriate CUDA release.

    With *installed_cuda* given, wheels closest to that version win (same
    major preferred; versions not exceeding the target break ties).
    Without it, the highest CUDA version present is kept.  Returns [] when
    no CUDA wheel exists at all.
    """
    cuda_only = [name for name in candidates if 'cuda' in name.lower()]
    if not cuda_only:
        return []

    def as_pair(version: str) -> Tuple[int, int]:
        # '12.1' -> (12, 1); a bare major like '12' -> (12, 0)
        pieces = version.split('.')
        return (int(pieces[0]), int(pieces[1]) if len(pieces) > 1 else 0)

    if installed_cuda:
        wanted = as_pair(installed_cuda)

        def rank(name: str) -> Tuple[int, int, int]:
            pair = as_pair(parse_cuda_from_filename(name) or '0')
            # Weighted absolute distance in (major, minor).
            distance = abs(pair[0] - wanted[0]) * 100 + abs(pair[1] - wanted[1])
            same_major = 0 if pair[0] == wanted[0] else 1
            # Prefer wheels that do not exceed the installed CUDA version.
            within = 0 if pair <= wanted else 1
            return (distance, same_major, within)

        ordered = sorted(cuda_only, key=rank)
        chosen = parse_cuda_from_filename(ordered[0])
        return [name for name in ordered if parse_cuda_from_filename(name) == chosen]

    # No installed CUDA detected: keep wheels for the highest CUDA on the page.
    ordered = sorted(
        cuda_only,
        key=lambda name: as_pair(parse_cuda_from_filename(name) or '0'),
        reverse=True,
    )
    chosen = parse_cuda_from_filename(ordered[0])
    return [name for name in ordered if parse_cuda_from_filename(name) == chosen]
|
|
309
|
+
|
|
310
|
+
|
|
311
|
+
def platform_tag_filters() -> List[str]:
    """Wheel platform-tag substrings acceptable on the current host, [] if unknown."""
    os_name = platform.system().lower()
    arch = platform.machine().lower()
    is_arm = 'aarch64' in arch or 'arm64' in arch

    if os_name == 'linux':
        # The index typically lists plain 'linux_*' tags; match manylinux variants too.
        return ['linux_aarch64', 'manylinux_aarch64'] if is_arm else ['linux_x86_64', 'manylinux_x86_64']

    if os_name == 'darwin':
        if is_arm:
            return ['macosx_11_0_arm64', 'macosx_12_0_arm64', 'macosx_13_0_arm64', 'macosx_14_0_arm64']
        # Intel macs
        return [f'macosx_{ver}_x86_64' for ver in ('10_9', '11_0', '12_0', '13_0', '14_0')]

    if os_name == 'windows':
        # win_arm64 wheels do not exist yet, but match them if they appear.
        return ['win_arm64'] if 'arm64' in arch else ['win_amd64']

    return []
|
|
341
|
+
|
|
342
|
+
|
|
343
|
+
def choose_best_wheel(links: List[str], require_cuda: bool) -> Optional[str]:
    """Pick the most suitable wheel URL from *links*, or None.

    Filters by the interpreter's python/abi tags and the host platform tag,
    then (when *require_cuda*) narrows to the best-matching CUDA build or
    (otherwise) drops CUDA builds, finally preferring the newest dev-date
    and highest version.
    """
    python_tag, abi = py_tags()
    host_tags = platform_tag_filters()

    def acceptable(url: str) -> bool:
        # Interpreter tags and one known platform substring must all appear.
        if python_tag not in url or abi not in url:
            return False
        return any(tag in url for tag in host_tags)

    pool = [url for url in links if acceptable(url)]
    if not pool:
        return None

    if require_cuda:
        pool = best_match_cuda(pool, detect_cuda_version_linux())
        if not pool:
            return None
    else:
        # CPU install: exclude CUDA builds outright.
        pool = [url for url in pool if 'cuda' not in url.lower()]

    # Newest dev snapshot first, then highest version, URL as tie-breaker.
    pool.sort(
        key=lambda url: (parse_devdate(url) or 0, parse_version_tuple(url), url),
        reverse=True,
    )
    return pool[0] if pool else None
|
|
376
|
+
|
|
377
|
+
|
|
378
|
+
def run_pip_install(wheel_url: str, dry_run: bool):
    """Install *wheel_url* with pip; exit the process with pip's code on failure.

    With dry_run=True only the command is printed and nothing is installed.
    """
    command = [sys.executable, '-m', 'pip', 'install', '--upgrade', '--no-cache-dir', wheel_url]
    print('[INFO] Pip command:', ' '.join(command))
    if dry_run:
        print('[DRY-RUN] Skipping actual installation.')
        return
    try:
        subprocess.check_call(command)
    except subprocess.CalledProcessError as err:
        print('[ERROR] pip install failed with exit code:', err.returncode)
        sys.exit(err.returncode)
    else:
        print('[SUCCESS] k2 has been installed successfully.')
|
|
390
|
+
|
|
391
|
+
|
|
392
|
+
def install_k2_main(dry_run: bool = False):
    """Detect the platform, pick the best k2 wheel, and pip-install it.

    Linux gets CUDA wheels (matched against the detected CUDA version when
    possible); macOS and Windows get CPU wheels.  Exits non-zero when no
    suitable wheel is found (1) or the OS is unsupported (3).

    Args:
        dry_run: when True, print the chosen wheel / pip command without installing.
    """
    system = platform.system().lower()
    print(f'[INFO] Detected OS: {system}')
    print(f'[INFO] Python: {platform.python_version()} | Impl: {platform.python_implementation()}')

    # Check if torch is already installed; an exact torch match is tried first.
    torch_version = detect_torch_version()
    if torch_version:
        print(f'[INFO] Detected PyTorch version: {torch_version}')
    else:
        print('[INFO] PyTorch not detected, will search all available versions')

    if system == 'linux':
        print('[INFO] Target: Linux (CUDA wheels)')
        cuda_version = detect_cuda_version_linux()
        if not cuda_version:
            print('[WARN] No CUDA detected on Linux.')
        print(f'[INFO] Detected CUDA version: {cuda_version}')

        wheel = None
        # Try (torch match, cuda match) first, then progressively relax.
        for candidate_torch in ([torch_version, None] if torch_version else [None]):
            for candidate_cuda in ([cuda_version, None] if cuda_version else [None]):
                links = fetch_wheel_links(CUDA_LINUX_URL, candidate_torch, cuda_version=candidate_cuda)
                if candidate_torch and links:
                    # Exact torch-version hit on the index: take the first link.
                    wheel = links[0]
                else:
                    # Fallback to tag/CUDA-based selection over the full page.
                    if not links:
                        links = fetch_wheel_links(CUDA_LINUX_URL)
                    wheel = choose_best_wheel(links, require_cuda=candidate_cuda is not None)
                    if not candidate_torch and links and not wheel:
                        wheel = links[0]  # last resort: first available wheel

                if wheel:
                    break
                if candidate_cuda:
                    # BUG FIX: message previously contained literal '" + \\' junk
                    # from a botched manual line split.
                    print(f'[WARN] No suitable wheel found for CUDA {candidate_cuda}, trying without CUDA preference...')

            if wheel:
                break
            if candidate_torch:
                print(f'[WARN] Tried torch version {candidate_torch}, but not found wheel, trying without torch version...')

        if not wheel:
            # BUG FIX: previously fell through to run_pip_install(None) and
            # crashed with a TypeError; fail loudly like the other branches.
            print('[ERROR] Could not find a suitable Linux CUDA wheel for your Python/platform.')
            sys.exit(1)
        print(f'[INFO] Selected wheel:\n  {wheel}')
        run_pip_install(wheel, dry_run)
        return

    if system == 'darwin':
        print('[INFO] Target: macOS (CPU wheels)')
        _install_cpu_wheel(MAC_CPU_URL, torch_version, 'macOS', dry_run)
        return

    if system == 'windows':
        print('[INFO] Target: Windows (CPU wheels)')
        # BUG FIX: the retry loop previously ignored its loop variable and
        # always queried with the original torch_version, so the
        # "without torch version" fallback never ran on Windows.
        _install_cpu_wheel(WIN_CPU_URL, torch_version, 'Windows', dry_run)
        return

    print(f'[ERROR] Unsupported OS: {system}')
    sys.exit(3)


def _install_cpu_wheel(index_url: str, torch_version: Optional[str], os_label: str, dry_run: bool) -> None:
    """Select the best CPU wheel from *index_url* and install it; exit(1) if none.

    Shared by the macOS and Windows branches: tries an exact torch-version
    match first, then falls back to selection without a torch preference.
    """
    wheel = None
    for candidate_torch in ([torch_version, None] if torch_version else [None]):
        links = fetch_wheel_links(index_url, candidate_torch)
        if candidate_torch and links:
            # Exact torch-version hit: take the first link directly.
            wheel = links[0]
        else:
            if not links:
                links = fetch_wheel_links(index_url)
            wheel = choose_best_wheel(links, require_cuda=False)
            if links and not wheel:
                wheel = links[0]  # last resort: first available wheel
        if wheel:
            break

    if not wheel:
        print(f'[ERROR] Could not find a suitable {os_label} CPU wheel for your Python/platform.')
        sys.exit(1)
    print(f'[INFO] Selected wheel:\n  {wheel}')
    run_pip_install(wheel, dry_run)
|
|
509
|
+
|
|
510
|
+
|
|
511
|
+
def install_k2():
    """Console-script entry point: parse CLI flags and run the installer."""
    cli = argparse.ArgumentParser(description='Auto-install the latest k2 wheel for your environment.')
    cli.add_argument('--dry-run', action='store_true', help='Show what would be installed without making changes.')
    options = cli.parse_args()
    install_k2_main(dry_run=options.dry_run)
|
|
517
|
+
|
|
518
|
+
|
|
519
|
+
# Allow running this module directly: `python install_k2.py [--dry-run]`.
if __name__ == '__main__':
    install_k2()
|
lattifai-0.1.4.dist-info/RECORD
DELETED
|
@@ -1,22 +0,0 @@
|
|
|
1
|
-
lattifai/__init__.py,sha256=8vZF9_yObaoDZ6sUaJBuQqUp5mGBRfD4z0SdTY_8BcQ,672
|
|
2
|
-
lattifai/base_client.py,sha256=ktFtATjL9pLSJUD-VqeJKA1FHkrsGHX7Uq_x00H7gO8,3322
|
|
3
|
-
lattifai/client.py,sha256=szz9aT_GTa5JKA2ZGsd7XHr56aG_H-nf83yqRcPUVxs,4664
|
|
4
|
-
lattifai/bin/__init__.py,sha256=7YhmtEM8kbxJtz2-KIskvpLKBZAvkMSceVx8z4fkgQ4,61
|
|
5
|
-
lattifai/bin/align.py,sha256=uX8VaATzn8CgdHUtry1ZGhXiz0Jr89ELdfRK6GWC1t8,989
|
|
6
|
-
lattifai/bin/cli_base.py,sha256=4xlN4cnJZh54ErhHUHgJpyVsrcB-ftwniFzRQL_7SlU,289
|
|
7
|
-
lattifai/bin/subtitle.py,sha256=bUWImAHpvyY59Vskqb5loQiD5ytQOxR8lTQRiQ4LyNA,647
|
|
8
|
-
lattifai/io/__init__.py,sha256=vHWRN7MvAch-GUeFqqO-gM57SM-4YOpGUjIxFJdjfPA,671
|
|
9
|
-
lattifai/io/reader.py,sha256=ErPnPMUvYQpjZ7Vd86EsHUkOcEfKdoI8iM3yKHRzSOQ,2576
|
|
10
|
-
lattifai/io/supervision.py,sha256=5UfSsgBhXoDU3-6drDtoD7y8HIiA4xRKZnbOKgeejwM,354
|
|
11
|
-
lattifai/io/writer.py,sha256=1eAEFLlL8kricxRDPFBtVmeC4IiFyFnjbWXvw0VU-q4,2036
|
|
12
|
-
lattifai/tokenizers/__init__.py,sha256=aqv44PDtq6g3oFFKW_l4HSR5ywT5W8eP1dHHywIvBfs,72
|
|
13
|
-
lattifai/tokenizers/phonemizer.py,sha256=Q5Z-4rbT3AjAPLNPnyvWGcEaJuKXRudgeIK6tUhVsJs,1741
|
|
14
|
-
lattifai/tokenizers/tokenizer.py,sha256=Qqg12zihl192Tlax6plVyxthrnzBciGLSRuzFQRgOdc,5663
|
|
15
|
-
lattifai/workers/__init__.py,sha256=s6YfkIq4FDIAzY9sPjRpXnJfszj2repqnMTqydRM5Zw,83
|
|
16
|
-
lattifai/workers/lattice1_alpha.py,sha256=kR5wNLMn1qN14PvRA6RlWjQUGblYrJ636ILC-XkvS0s,4770
|
|
17
|
-
lattifai-0.1.4.dist-info/licenses/LICENSE,sha256=LNuoH5jpXXNKgjQ3XLwztFq8D3O7kZI-LSg81o4ym2M,1065
|
|
18
|
-
lattifai-0.1.4.dist-info/METADATA,sha256=HEsoKRRfjRoeNwUff7Cx44sYP9trid_bdtX3j5WqK6o,13628
|
|
19
|
-
lattifai-0.1.4.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
|
|
20
|
-
lattifai-0.1.4.dist-info/entry_points.txt,sha256=BaixG8HYzE3Ff0QDAmsbX8cjsxZSLwUv5u4cnIpunr0,88
|
|
21
|
-
lattifai-0.1.4.dist-info/top_level.txt,sha256=tHSoXF26r-IGfbIP_JoYATqbmf14h5NrnNJGH4j5reI,9
|
|
22
|
-
lattifai-0.1.4.dist-info/RECORD,,
|
|
File without changes
|
|
File without changes
|