PyPI - s2t - Versions diffs - 0.1.3__py3-none-any.whl → 0.1.4__py3-none-any.whl - Mend

s2t 0.1.3__py3-none-any.whl → 0.1.4__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (6)

s2t/recorder.py CHANGED Viewed

@@ -1,5 +1,6 @@
 from __future__ import annotations
+import os
 import queue
 import select
 import sys
@@ -46,6 +47,8 @@ class Recorder:
             raise RuntimeError("sounddevice/soundfile required for recording.") from e
         evt_q: queue.Queue[str] = queue.Queue()
+        # Control queue is separate from audio frames to avoid control backpressure.
+        ctrl_q: queue.Queue[str] = queue.Queue()
         stop_evt = threading.Event()
         def key_reader() -> None:
@@ -61,10 +64,14 @@ class Recorder:
                     ms = cast(_MSVCRT, msvcrt)
                     last_space = 0.0
+                    if self.verbose:
+                        print("[key] using msvcrt (Windows)", file=sys.stderr)
                     while not stop_evt.is_set():
                         if ms.kbhit():
                             ch = ms.getwch()
                             if ch in ("\r", "\n"):
+                                if self.verbose:
+                                    print("[key] ENTER", file=sys.stderr)
                                 evt_q.put("ENTER")
                                 break
                             if ch == " ":
@@ -74,33 +81,118 @@ class Recorder:
                                 ):
                                     continue
                                 last_space = now
+                                if self.verbose:
+                                    print("[key] SPACE", file=sys.stderr)
                                 evt_q.put("SPACE")
                         time.sleep(0.01)
                 else:
-                    fd = sys.stdin.fileno()
-                    old = termios.tcgetattr(fd)
-                    tty.setcbreak(fd)
-                    last_space = 0.0
+                    # Prefer sys.stdin when it's a TTY (original, proven path). If not a TTY, try /dev/tty, else fallback to stdin line reads.
                     try:
-                        while not stop_evt.is_set():
-                            r, _, _ = select.select([sys.stdin], [], [], 0.05)
-                            if r:
-                                ch = sys.stdin.read(1)
-                                if ch in ("\n", "\r"):
-                                    evt_q.put("ENTER")
-                                    break
-                                if ch == " ":
-                                    now = time.perf_counter()
-                                    if self.debounce_ms and (now - last_space) < (
-                                        self.debounce_ms / 1000.0
-                                    ):
+                        if sys.stdin.isatty():
+                            fd = sys.stdin.fileno()
+                            if self.verbose:
+                                print("[key] using sys.stdin (isatty, fd read)", file=sys.stderr)
+                            old = termios.tcgetattr(fd)
+                            tty.setcbreak(fd)
+                            last_space = 0.0
+                            try:
+                                while not stop_evt.is_set():
+                                    r, _, _ = select.select([fd], [], [], 0.05)
+                                    if r:
+                                        try:
+                                            ch_b = os.read(fd, 1)
+                                        except BlockingIOError:
+                                            continue
+                                        if not ch_b:
+                                            continue
+                                        ch = ch_b.decode(errors="ignore")
+                                        if ch in ("\n", "\r"):
+                                            if self.verbose:
+                                                print("[key] ENTER", file=sys.stderr)
+                                            evt_q.put("ENTER")
+                                            break
+                                        if ch == " ":
+                                            now = time.perf_counter()
+                                            if self.debounce_ms and (now - last_space) < (
+                                                self.debounce_ms / 1000.0
+                                            ):
+                                                continue
+                                            last_space = now
+                                            if self.verbose:
+                                                print("[key] SPACE", file=sys.stderr)
+                                            evt_q.put("SPACE")
+                            finally:
+                                termios.tcsetattr(fd, termios.TCSADRAIN, old)
+                        else:
+                            # Try /dev/tty when stdin is not a TTY
+                            using_devtty = False
+                            fd = None
+                            try:
+                                fd = os.open("/dev/tty", os.O_RDONLY)
+                                using_devtty = True
+                                if self.verbose:
+                                    print("[key] using /dev/tty (stdin not TTY)", file=sys.stderr)
+                                old = termios.tcgetattr(fd)
+                                tty.setcbreak(fd)
+                                last_space = 0.0
+                                try:
+                                    while not stop_evt.is_set():
+                                        r, _, _ = select.select([fd], [], [], 0.05)
+                                        if r:
+                                            ch_b = os.read(fd, 1)
+                                            if not ch_b:
+                                                continue
+                                            ch = ch_b.decode(errors="ignore")
+                                            if ch in ("\n", "\r"):
+                                                if self.verbose:
+                                                    print("[key] ENTER", file=sys.stderr)
+                                                evt_q.put("ENTER")
+                                                break
+                                            if ch == " ":
+                                                now = time.perf_counter()
+                                                if self.debounce_ms and (now - last_space) < (
+                                                    self.debounce_ms / 1000.0
+                                                ):
+                                                    continue
+                                                last_space = now
+                                                if self.verbose:
+                                                    print("[key] SPACE", file=sys.stderr)
+                                                evt_q.put("SPACE")
+                                finally:
+                                    termios.tcsetattr(fd, termios.TCSADRAIN, old)
+                            except Exception:
+                                if using_devtty and fd is not None:
+                                    try:
+                                        os.close(fd)
+                                    except Exception:
+                                        pass
+                                print(
+                                    "Warning: no TTY for key input; falling back to stdin line mode.",
+                                    file=sys.stderr,
+                                )
+                                # Last resort: line-buffered stdin; Enter will still end.
+                                while not stop_evt.is_set():
+                                    line = sys.stdin.readline()
+                                    if not line:
+                                        time.sleep(0.05)
                                         continue
-                                    last_space = now
-                                    evt_q.put("SPACE")
-                    finally:
-                        termios.tcsetattr(fd, termios.TCSADRAIN, old)
-            except Exception:
-                pass
+                                    # If user hits Enter on empty line, treat as ENTER
+                                    if line == "\n" or line == "\r\n":
+                                        if self.verbose:
+                                            print("[key] ENTER (line mode)", file=sys.stderr)
+                                        evt_q.put("ENTER")
+                                        break
+                                    # If first non-empty char is space, treat as SPACE
+                                    if line and line[0] == " ":
+                                        if self.verbose:
+                                            print("[key] SPACE (line mode)", file=sys.stderr)
+                                        evt_q.put("SPACE")
+                    except Exception as e:
+                        print(f"Warning: key reader failed: {e}", file=sys.stderr)
+            except Exception as e:
+                # Log unexpected key reader errors to aid debugging, but keep recording running.
+                print(f"Warning: key reader stopped unexpectedly: {e}", file=sys.stderr)
         audio_q: queue.Queue[tuple[str, Any]] = queue.Queue(maxsize=128)
         chunk_index = 1
@@ -117,67 +209,106 @@ class Recorder:
                 str(cur_path), mode="w", samplerate=self.samplerate, channels=self.channels
             )
             while True:
-                kind, payload = audio_q.get()
+                # First, handle any pending control commands so SPACE/ENTER are never blocked by frames backlog.
+                try:
+                    while True:
+                        cmd = ctrl_q.get_nowait()
+                        if cmd == "split":
+                            fh.flush()
+                            fh.close()
+                            if frames_written > 0:
+                                dur = frames_written / float(self.samplerate)
+                                chunk_paths.append(cur_path)
+                                chunk_frames.append(frames_written)
+                                chunk_offsets.append(offset_seconds_total)
+                                offset_seconds_total += dur
+                                if self.verbose:
+                                    print(
+                                        f"Saved chunk: {cur_path.name} ({dur:.2f}s)",
+                                        file=sys.stderr,
+                                    )
+                                tx_queue.put(
+                                    (chunk_index, cur_path, frames_written, chunk_offsets[-1])
+                                )
+                            else:
+                                try:
+                                    cur_path.unlink(missing_ok=True)
+                                except Exception:
+                                    pass
+                            frames_written = 0
+                            chunk_index += 1
+                            if (
+                                self.pause_after_first_chunk
+                                and chunk_index == 2
+                                and self.resume_event is not None
+                            ):
+                                self._paused = True
+                                self.resume_event.wait()
+                                self._paused = False
+                            cur_path = self.session_dir / f"chunk_{chunk_index:04d}{self.ext}"
+                            fh = sf.SoundFile(
+                                str(cur_path),
+                                mode="w",
+                                samplerate=self.samplerate,
+                                channels=self.channels,
+                            )
+                        elif cmd == "finish":
+                            fh.flush()
+                            fh.close()
+                            if frames_written > 0:
+                                dur = frames_written / float(self.samplerate)
+                                chunk_paths.append(cur_path)
+                                chunk_frames.append(frames_written)
+                                chunk_offsets.append(offset_seconds_total)
+                                offset_seconds_total += dur
+                                if self.verbose:
+                                    print(
+                                        f"Saved chunk: {cur_path.name} ({dur:.2f}s)",
+                                        file=sys.stderr,
+                                    )
+                                tx_queue.put(
+                                    (chunk_index, cur_path, frames_written, chunk_offsets[-1])
+                                )
+                            else:
+                                try:
+                                    cur_path.unlink(missing_ok=True)
+                                except Exception:
+                                    pass
+                            tx_queue.put((-1, Path(), 0, 0.0))
+                            return
+                except queue.Empty:
+                    pass
+                # Then, write frames if available; short timeout to re-check control queue regularly.
+                try:
+                    kind, payload = audio_q.get(timeout=0.05)
+                except queue.Empty:
+                    continue
                 if kind == "frames":
                     data = payload
                     fh.write(data)
                     frames_written += len(data)
-                elif kind == "split":
-                    fh.flush()
-                    fh.close()
-                    if frames_written > 0:
-                        dur = frames_written / float(self.samplerate)
-                        chunk_paths.append(cur_path)
-                        chunk_frames.append(frames_written)
-                        chunk_offsets.append(offset_seconds_total)
-                        offset_seconds_total += dur
-                        if self.verbose:
-                            print(f"Saved chunk: {cur_path.name} ({dur:.2f}s)", file=sys.stderr)
-                        tx_queue.put((chunk_index, cur_path, frames_written, chunk_offsets[-1]))
-                    else:
-                        try:
-                            cur_path.unlink(missing_ok=True)
-                        except Exception:
-                            pass
-                    frames_written = 0
-                    chunk_index += 1
-                    if (
-                        self.pause_after_first_chunk
-                        and chunk_index == 2
-                        and self.resume_event is not None
-                    ):
-                        self._paused = True
-                        self.resume_event.wait()
-                        self._paused = False
-                    cur_path = self.session_dir / f"chunk_{chunk_index:04d}{self.ext}"
-                    fh = sf.SoundFile(
-                        str(cur_path), mode="w", samplerate=self.samplerate, channels=self.channels
-                    )
-                elif kind == "finish":
-                    fh.flush()
-                    fh.close()
-                    if frames_written > 0:
-                        dur = frames_written / float(self.samplerate)
-                        chunk_paths.append(cur_path)
-                        chunk_frames.append(frames_written)
-                        chunk_offsets.append(offset_seconds_total)
-                        offset_seconds_total += dur
-                        if self.verbose:
-                            print(f"Saved chunk: {cur_path.name} ({dur:.2f}s)", file=sys.stderr)
-                        tx_queue.put((chunk_index, cur_path, frames_written, chunk_offsets[-1]))
-                    else:
-                        try:
-                            cur_path.unlink(missing_ok=True)
-                        except Exception:
-                            pass
-                    break
             tx_queue.put((-1, Path(), 0, 0.0))
+        # Timestamp of last dropped-frame warning (throttling for verbose mode)
+        last_drop_log = 0.0
         def cb(indata: Any, frames: int, time_info: Any, status: Any) -> None:
+            nonlocal last_drop_log
             if status:
                 print(status, file=sys.stderr)
             if not self._paused:
-                audio_q.put(("frames", indata.copy()))
+                try:
+                    audio_q.put_nowait(("frames", indata.copy()))
+                except queue.Full:
+                    # Drop frame if the queue is saturated; throttle warnings.
+                    now = time.perf_counter()
+                    if self.verbose and (now - last_drop_log) > 1.0:
+                        print(
+                            "Warning: audio queue full; dropping input frames.",
+                            file=sys.stderr,
+                        )
+                        last_drop_log = now
         key_t = threading.Thread(target=key_reader, daemon=True)
         writer_t = threading.Thread(target=writer_fn, daemon=True)
@@ -197,9 +328,9 @@ class Recorder:
                 except queue.Empty:
                     continue
                 if evt == "SPACE":
-                    audio_q.put(("split", None))
+                    ctrl_q.put("split")
                 elif evt == "ENTER":
-                    audio_q.put(("finish", None))
+                    ctrl_q.put("finish")
                     break
         writer_t.join()
         return chunk_paths, chunk_frames, chunk_offsets

{s2t-0.1.3.dist-info → s2t-0.1.4.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: s2t
-Version: 0.1.3
+Version: 0.1.4
 Summary: Speech to Text (s2t): Record audio, run Whisper, export formats, and copy transcript to clipboard.
 Author: Maintainers
 License-Expression: LicenseRef-Proprietary

{s2t-0.1.3.dist-info → s2t-0.1.4.dist-info}/RECORD RENAMED Viewed

@@ -3,14 +3,14 @@ s2t/cli.py,sha256=Qf6Hz0Ew9ncLbQQoCPDG7ZiYWeGbwBcZMZi_WbEu54w,20018
 s2t/config.py,sha256=lFc_x5fIx_q0JpTcI4Lm4aubxhIXVH34foBvLMUNFGs,437
 s2t/outputs.py,sha256=Lo8VcARZ7QPuuQQNu8myD5J4c4NO1Rs0L1DLnzLe9tM,1546
 s2t/py.typed,sha256=AbpHGcgLb-kRsJGnwFEktk7uzpZOCcBY74-YBdrKVGs,1
-s2t/recorder.py,sha256=uBD9mYf-uUCkRJw8fQitVnDrX6PwRNXJycyY4dBfXL0,8076
+s2t/recorder.py,sha256=0sw1UJqQIRdiJO5dugUxRjTN5kFU0CBETVjoQz99a8E,16055
 s2t/types.py,sha256=jBiRN-tr0qVw-lhaXvnsyKrVGDyLkqEbxs9qkQ6qGqI,339
 s2t/utils.py,sha256=YU6YhiuONmqhrKte4DY5tiC5PP-yFExJMMBzFUiA8qA,3416
 s2t/whisper_engine.py,sha256=x-V7ST9e3JnwMWdbMh4C7dHjA420jaOtXH2-igeh7vc,6492
 s2t/translator/__init__.py,sha256=K-MKves7kZ4-62POfrmWeOcBaTjsTzeFSu8QNHqYuus,239
 s2t/translator/argos_backend.py,sha256=VW_OYFFBuNZgcWM-fbvR6XGokuxS2fptkCMFIO9MD1I,19068
-s2t-0.1.3.dist-info/METADATA,sha256=V0l2MbvH4Kd5nt9Qk3jAoLQIoo1If0w2pSjjG901CQA,4642
-s2t-0.1.3.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
-s2t-0.1.3.dist-info/entry_points.txt,sha256=JISIUlZAJ3DX1dB6zT3X_E3vcXI-eWEQKwHiT35fPKs,37
-s2t-0.1.3.dist-info/top_level.txt,sha256=o8N0JcuHdIrfX3iGHvntHiDC2XgN7__joyNu08ZOh0s,4
-s2t-0.1.3.dist-info/RECORD,,
+s2t-0.1.4.dist-info/METADATA,sha256=oQYIN7eNFsSBvLQZTaORC_TvJtp0AUuhkuVmMIsfI28,4642
+s2t-0.1.4.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
+s2t-0.1.4.dist-info/entry_points.txt,sha256=JISIUlZAJ3DX1dB6zT3X_E3vcXI-eWEQKwHiT35fPKs,37
+s2t-0.1.4.dist-info/top_level.txt,sha256=o8N0JcuHdIrfX3iGHvntHiDC2XgN7__joyNu08ZOh0s,4
+s2t-0.1.4.dist-info/RECORD,,

{s2t-0.1.3.dist-info → s2t-0.1.4.dist-info}/WHEEL RENAMED Viewed

File without changes

{s2t-0.1.3.dist-info → s2t-0.1.4.dist-info}/entry_points.txt RENAMED Viewed

File without changes

{s2t-0.1.3.dist-info → s2t-0.1.4.dist-info}/top_level.txt RENAMED Viewed

File without changes

s2t 0.1.3__py3-none-any.whl → 0.1.4__py3-none-any.whl

s2t 0.1.3__py3-none-any.whl → 0.1.4__py3-none-any.whl