PyPI - s2t - Versions diffs - 0.1.0.post1.dev2__py3-none-any.whl → 0.1.1__py3-none-any.whl - Mend

s2t 0.1.0.post1.dev2__py3-none-any.whl → 0.1.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (8) hide show

s2t/cli.py +2 -0
s2t/whisper_engine.py +22 -1
{s2t-0.1.0.post1.dev2.dist-info → s2t-0.1.1.dist-info}/METADATA +1 -1
s2t-0.1.1.dist-info/RECORD +14 -0
s2t-0.1.0.post1.dev2.dist-info/RECORD +0 -14
{s2t-0.1.0.post1.dev2.dist-info → s2t-0.1.1.dist-info}/WHEEL +0 -0
{s2t-0.1.0.post1.dev2.dist-info → s2t-0.1.1.dist-info}/entry_points.txt +0 -0
{s2t-0.1.0.post1.dev2.dist-info → s2t-0.1.1.dist-info}/top_level.txt +0 -0

s2t/cli.py CHANGED Viewed

@@ -256,6 +256,8 @@ def run_session(opts: SessionOptions) -> int:
     else:
         print("—" * 60)
         print("Transcript (clipboard text):")
+        # Visual separator before the actual transcript text
+        print("=" * 60)
         print(text_final.rstrip("\n"))
     if opts.profile:

s2t/whisper_engine.py CHANGED Viewed

@@ -75,10 +75,31 @@ class WhisperEngine:
         frames: int,
         initial_prompt: str | None = None,
     ) -> TranscriptionResult:
+        # Load audio without ffmpeg by reading via soundfile and passing a numpy array
+        # to Whisper. We ensure mono float32 at 16 kHz as expected by Whisper's API.
         task = "translate" if self.translate else "transcribe"
+        import numpy as np
+        try:
+            import soundfile as sf
+        except Exception as e:
+            raise RuntimeError("soundfile is required to read recorded audio.") from e
+        from .utils import resample_linear
+        # Read audio from file (supports WAV/FLAC via libsndfile), convert to mono
+        data, sr = sf.read(str(audio_path), dtype="float32", always_2d=True)
+        # data shape: (n_frames, n_channels). Convert to mono by averaging if needed
+        if data.ndim == 2 and data.shape[1] > 1:
+            mono = data.mean(axis=1)
+        else:
+            mono = data.reshape(-1)
+        # Resample to 16k expected by Whisper when passing arrays
+        mono_16k: np.ndarray = resample_linear(mono, int(sr), 16000)
         t0 = time.perf_counter()
         res: dict[str, Any] = model.transcribe(
-            str(audio_path),
+            mono_16k,
             task=task,
             language=self.language,
             fp16=False,

{s2t-0.1.0.post1.dev2.dist-info → s2t-0.1.1.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: s2t
-Version: 0.1.0.post1.dev2
+Version: 0.1.1
 Summary: Speech to Text (s2t): Record audio, run Whisper, export formats, and copy transcript to clipboard.
 Author: Maintainers
 License-Expression: LicenseRef-Proprietary

s2t-0.1.1.dist-info/RECORD ADDED Viewed

@@ -0,0 +1,14 @@
+s2t/__init__.py,sha256=wV4E9i-7KrUn1dOtLUQB3ZGEKx9gRWH3hPHlpw-ZdWc,332
+s2t/cli.py,sha256=_7zIhcdI7DI_3Dxs2EcvQkE-fSGclkJ2TjCvDYlI65E,15871
+s2t/config.py,sha256=mzz6ljGEupNDAzlUwf5kvl0iKqO8WZ4TWsU4nSVtp0M,409
+s2t/outputs.py,sha256=Lo8VcARZ7QPuuQQNu8myD5J4c4NO1Rs0L1DLnzLe9tM,1546
+s2t/py.typed,sha256=AbpHGcgLb-kRsJGnwFEktk7uzpZOCcBY74-YBdrKVGs,1
+s2t/recorder.py,sha256=uBD9mYf-uUCkRJw8fQitVnDrX6PwRNXJycyY4dBfXL0,8076
+s2t/types.py,sha256=BuMyWuueS7EZbk7I_CkIWSb69Yi6g9-wr7CZLAZKflw,242
+s2t/utils.py,sha256=YU6YhiuONmqhrKte4DY5tiC5PP-yFExJMMBzFUiA8qA,3416
+s2t/whisper_engine.py,sha256=T_M2ghXfUbFgJqiDI46ZQB1GugzjIRb7hv22fqls65M,5996
+s2t-0.1.1.dist-info/METADATA,sha256=G2dB1li8K3NRKXhpKgySgKAo94AiqxXa141Wb_-v1-4,4557
+s2t-0.1.1.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
+s2t-0.1.1.dist-info/entry_points.txt,sha256=JISIUlZAJ3DX1dB6zT3X_E3vcXI-eWEQKwHiT35fPKs,37
+s2t-0.1.1.dist-info/top_level.txt,sha256=o8N0JcuHdIrfX3iGHvntHiDC2XgN7__joyNu08ZOh0s,4
+s2t-0.1.1.dist-info/RECORD,,

s2t-0.1.0.post1.dev2.dist-info/RECORD DELETED Viewed

@@ -1,14 +0,0 @@
-s2t/__init__.py,sha256=wV4E9i-7KrUn1dOtLUQB3ZGEKx9gRWH3hPHlpw-ZdWc,332
-s2t/cli.py,sha256=5Z0YxLPwvfV8wrU-vN1s1HzzOLmA0HYi5uVf6brUtQQ,15786
-s2t/config.py,sha256=mzz6ljGEupNDAzlUwf5kvl0iKqO8WZ4TWsU4nSVtp0M,409
-s2t/outputs.py,sha256=Lo8VcARZ7QPuuQQNu8myD5J4c4NO1Rs0L1DLnzLe9tM,1546
-s2t/py.typed,sha256=AbpHGcgLb-kRsJGnwFEktk7uzpZOCcBY74-YBdrKVGs,1
-s2t/recorder.py,sha256=uBD9mYf-uUCkRJw8fQitVnDrX6PwRNXJycyY4dBfXL0,8076
-s2t/types.py,sha256=BuMyWuueS7EZbk7I_CkIWSb69Yi6g9-wr7CZLAZKflw,242
-s2t/utils.py,sha256=YU6YhiuONmqhrKte4DY5tiC5PP-yFExJMMBzFUiA8qA,3416
-s2t/whisper_engine.py,sha256=s9NBPtyptdhKauKQB4moq2SeGDQp2z7qc13e8C00SxY,5075
-s2t-0.1.0.post1.dev2.dist-info/METADATA,sha256=c-7jrltbRiLjW0ixPZwgf49L8Ar7p7N5Dc7b0QO_pUo,4568
-s2t-0.1.0.post1.dev2.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
-s2t-0.1.0.post1.dev2.dist-info/entry_points.txt,sha256=JISIUlZAJ3DX1dB6zT3X_E3vcXI-eWEQKwHiT35fPKs,37
-s2t-0.1.0.post1.dev2.dist-info/top_level.txt,sha256=o8N0JcuHdIrfX3iGHvntHiDC2XgN7__joyNu08ZOh0s,4
-s2t-0.1.0.post1.dev2.dist-info/RECORD,,

{s2t-0.1.0.post1.dev2.dist-info → s2t-0.1.1.dist-info}/WHEEL RENAMED Viewed

File without changes

{s2t-0.1.0.post1.dev2.dist-info → s2t-0.1.1.dist-info}/entry_points.txt RENAMED Viewed

File without changes

{s2t-0.1.0.post1.dev2.dist-info → s2t-0.1.1.dist-info}/top_level.txt RENAMED Viewed

File without changes

s2t 0.1.0.post1.dev2__py3-none-any.whl → 0.1.1__py3-none-any.whl

s2t 0.1.0.post1.dev2__py3-none-any.whl → 0.1.1__py3-none-any.whl