PyPI - kabigon - Versions diffs - 0.8.1__py3-none-any.whl → 0.8.2__py3-none-any.whl - Mend

kabigon 0.8.1__py3-none-any.whl → 0.8.2__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (7) hide show

kabigon/youtube.py CHANGED Viewed

@@ -1,6 +1,5 @@
 import aioytt
 import aioytt.video_id
-import timeout_decorator
 from youtube_transcript_api import YouTubeTranscriptApi
 from .loader import Loader
@@ -12,7 +11,6 @@ class YoutubeLoader(Loader):
     def __init__(self, languages: list[str] | None = None) -> None:
         self.languages = languages or DEFAULT_LANGUAGES
-    @timeout_decorator.timeout(20)
     def load(self, url: str) -> str:
         video_id = aioytt.video_id.parse_video_id(url)

kabigon/ytdlp.py CHANGED Viewed

@@ -1,25 +1,21 @@
-import functools
+# import functools
 import hashlib
 import os
-import subprocess
+# import subprocess
 import tempfile
 from typing import Final
-import numpy as np
-import timeout_decorator
-import whisper
+# import numpy as np
 import yt_dlp
 from loguru import logger
 from .loader import Loader
 try:
-    import mlx_whisper  # noqa: F401 # type: ignore
-    _mlx_whisper_installed = True
+    import whisper
 except ImportError:
-    _mlx_whisper_installed = False
+    logger.info("OpenAI Whisper not installed. Please install it with `pip install openai-whisper`.")
 DEFAULT_FFMPEG_PATH: Final[str] = "ffmpeg"
@@ -65,68 +61,58 @@ def download_audio(url: str) -> str:
     return filename + ".mp3"
-def load_audio(file: str, sr: int = 16000):
-    """
-    Open an audio file and read as mono waveform, resampling as necessary
-    Parameters
-    ----------
-    file: str
-        The audio file to open
-    sr: int
-        The sample rate to resample the audio if necessary
-    Returns
-    -------
-    A NumPy array containing the audio waveform, in float32 dtype.
-    """
-    ffmpeg_path = get_ffmpeg_path()
-    # This launches a subprocess to decode audio while down-mixing
-    # and resampling as necessary.  Requires the ffmpeg CLI in PATH.
-    # fmt: off
-    cmd = [
-        ffmpeg_path,
-        "-nostdin",
-        "-threads", "0",
-        "-i", file,
-        "-f", "s16le",
-        "-ac", "1",
-        "-acodec", "pcm_s16le",
-        "-ar", str(sr),
-        "-"
-    ]
-    # fmt: on
-    try:
-        out = subprocess.run(cmd, capture_output=True, check=True).stdout
-    except subprocess.CalledProcessError as e:
-        raise RuntimeError(f"Failed to load audio: {e.stderr.decode()}") from e
-    return np.frombuffer(out, np.int16).flatten().astype(np.float32) / 32768.0
-@functools.cache
-def _load_whisper_model() -> whisper.Whisper:
-    return whisper.load_model("tiny")
-def _transcribe(audio: np.ndarray) -> dict:
-    if _mlx_whisper_installed:
-        return mlx_whisper.transcribe(audio, path_or_hf_repo="mlx-community/whisper-tiny")
-    model = _load_whisper_model()
-    return model.transcribe(audio)
+# def load_audio(file: str, sr: int = 16000):
+#     """
+#     Open an audio file and read as mono waveform, resampling as necessary
+#     Parameters
+#     ----------
+#     file: str
+#         The audio file to open
+#     sr: int
+#         The sample rate to resample the audio if necessary
+#     Returns
+#     -------
+#     A NumPy array containing the audio waveform, in float32 dtype.
+#     """
+#     ffmpeg_path = get_ffmpeg_path()
+#     # This launches a subprocess to decode audio while down-mixing
+#     # and resampling as necessary.  Requires the ffmpeg CLI in PATH.
+#     # fmt: off
+#     cmd = [
+#         ffmpeg_path,
+#         "-nostdin",
+#         "-threads", "0",
+#         "-i", file,
+#         "-f", "s16le",
+#         "-ac", "1",
+#         "-acodec", "pcm_s16le",
+#         "-ar", str(sr),
+#         "-"
+#     ]
+#     # fmt: on
+#     try:
+#         out = subprocess.run(cmd, capture_output=True, check=True).stdout
+#     except subprocess.CalledProcessError as e:
+#         raise RuntimeError(f"Failed to load audio: {e.stderr.decode()}") from e
+#     return np.frombuffer(out, np.int16).flatten().astype(np.float32) / 32768.0
 class YtdlpLoader(Loader):
-    @timeout_decorator.timeout(300)
+    def __init__(self, model: str = "tiny") -> None:
+        self.model = whisper.load_model(model)
     def load(self, url: str) -> str:
         audio_file = download_audio(url)
-        audio = load_audio(audio_file)
+        # audio = load_audio(audio_file)
+        audio = whisper.load_audio(audio_file)
         # Clean up the audio file
         os.remove(audio_file)
-        result = _transcribe(audio)
+        result = self.model.transcribe(audio)
         return result.get("text", "")

{kabigon-0.8.1.dist-info → kabigon-0.8.2.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: kabigon
-Version: 0.8.1
+Version: 0.8.2
 Author-email: narumi <toucans-cutouts0f@icloud.com>
 License-File: LICENSE
 Requires-Python: >=3.10
@@ -9,14 +9,19 @@ Requires-Dist: firecrawl-py>=2.4.1
 Requires-Dist: httpx>=0.28.1
 Requires-Dist: loguru>=0.7.3
 Requires-Dist: markdownify>=0.14.1
-Requires-Dist: openai-whisper>=20240930
-Requires-Dist: playwright>=1.52.0
+Requires-Dist: numpy>=2.2.5
 Requires-Dist: pypdf>=5.3.0
 Requires-Dist: rich>=13.9.4
-Requires-Dist: timeout-decorator>=0.5.0
 Requires-Dist: typer>=0.15.3
 Requires-Dist: youtube-transcript-api>=0.6.3
 Requires-Dist: yt-dlp>=2025.4.30
+Provides-Extra: all
+Requires-Dist: openai-whisper>=20240930; extra == 'all'
+Requires-Dist: playwright>=1.52.0; extra == 'all'
+Provides-Extra: playwright
+Requires-Dist: playwright>=1.52.0; extra == 'playwright'
+Provides-Extra: whisper
+Requires-Dist: openai-whisper>=20240930; extra == 'whisper'
 Description-Content-Type: text/markdown
 # kabigon

{kabigon-0.8.1.dist-info → kabigon-0.8.2.dist-info}/RECORD RENAMED Viewed

@@ -11,10 +11,10 @@ kabigon/py.typed,sha256=AbpHGcgLb-kRsJGnwFEktk7uzpZOCcBY74-YBdrKVGs,1
 kabigon/reel.py,sha256=qOwWCvcp7xNKg0JDunq_Bsl8yqqMzrnAOI9k5mSqrOU,874
 kabigon/twitter.py,sha256=aRqAiFxIwln6lteWdoF6SmvbzO62yBTQRzcB7UcVJwk,1046
 kabigon/utils.py,sha256=eNTLtHLSB2erDac2HH3jWemgfr8Ou_ozwVb8h9BD-4g,922
-kabigon/youtube.py,sha256=HoiFNq0ookPL7_rO_wloBaY8yTIX6xP8A77F7y02q64,1166
-kabigon/ytdlp.py,sha256=_QRcyFx9s7NnI1MvcWdKKxlX-hHLnqtduCSL5_UH6dU,3140
-kabigon-0.8.1.dist-info/METADATA,sha256=8nZX3ukADj-qndGHMMuZluG_HdI8-wqNu8QJBoplPRc,1079
-kabigon-0.8.1.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
-kabigon-0.8.1.dist-info/entry_points.txt,sha256=O3FYAO9w-NQvlGMJrBvtrnGHSK2QkUnQBTa30YXRbVE,45
-kabigon-0.8.1.dist-info/licenses/LICENSE,sha256=H2T3_RTgmcngMeC7p_SXT3GwBLkd2DaNgAZuxulcfiA,1066
-kabigon-0.8.1.dist-info/RECORD,,
+kabigon/youtube.py,sha256=F9GpLa0iUy03wYU94RrrnrXa6ExqbG6CZpqx5bPENWE,1106
+kabigon/ytdlp.py,sha256=oeFoE7nWZWaT0dR9nwt_SZh_FE0gJ6Gulh6QzGCB6xo,2956
+kabigon-0.8.2.dist-info/METADATA,sha256=UEq0yUqP0dgzyqMhxiHgLvP0wT_nf0PlQLy8VkufrEg,1287
+kabigon-0.8.2.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
+kabigon-0.8.2.dist-info/entry_points.txt,sha256=O3FYAO9w-NQvlGMJrBvtrnGHSK2QkUnQBTa30YXRbVE,45
+kabigon-0.8.2.dist-info/licenses/LICENSE,sha256=H2T3_RTgmcngMeC7p_SXT3GwBLkd2DaNgAZuxulcfiA,1066
+kabigon-0.8.2.dist-info/RECORD,,

{kabigon-0.8.1.dist-info → kabigon-0.8.2.dist-info}/WHEEL RENAMED Viewed

File without changes

{kabigon-0.8.1.dist-info → kabigon-0.8.2.dist-info}/entry_points.txt RENAMED Viewed

File without changes

{kabigon-0.8.1.dist-info → kabigon-0.8.2.dist-info}/licenses/LICENSE RENAMED Viewed

File without changes

kabigon 0.8.1__py3-none-any.whl → 0.8.2__py3-none-any.whl

kabigon 0.8.1__py3-none-any.whl → 0.8.2__py3-none-any.whl