PyPI - pygpt-net - Versions diffs - 2.6.29__py3-none-any.whl → 2.6.31__py3-none-any.whl - Mend

pygpt-net 2.6.29__py3-none-any.whl → 2.6.31__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (182) hide show

pygpt_net/CHANGELOG.txt +15 -0
pygpt_net/__init__.py +3 -3
pygpt_net/app.py +4 -0
pygpt_net/{container.py → app_core.py} +5 -6
pygpt_net/controller/__init__.py +5 -2
pygpt_net/controller/access/control.py +1 -9
pygpt_net/controller/assistant/assistant.py +4 -4
pygpt_net/controller/assistant/batch.py +7 -7
pygpt_net/controller/assistant/files.py +4 -4
pygpt_net/controller/assistant/threads.py +3 -3
pygpt_net/controller/attachment/attachment.py +4 -7
pygpt_net/controller/audio/audio.py +25 -1
pygpt_net/controller/audio/ui.py +2 -2
pygpt_net/controller/chat/audio.py +1 -8
pygpt_net/controller/chat/common.py +30 -4
pygpt_net/controller/chat/handler/stream_worker.py +1124 -0
pygpt_net/controller/chat/output.py +8 -3
pygpt_net/controller/chat/stream.py +4 -405
pygpt_net/controller/chat/text.py +3 -2
pygpt_net/controller/chat/vision.py +11 -19
pygpt_net/controller/config/placeholder.py +1 -1
pygpt_net/controller/ctx/ctx.py +1 -1
pygpt_net/controller/ctx/summarizer.py +1 -1
pygpt_net/controller/kernel/kernel.py +11 -3
pygpt_net/controller/kernel/reply.py +5 -1
pygpt_net/controller/mode/mode.py +21 -12
pygpt_net/controller/plugins/settings.py +3 -2
pygpt_net/controller/presets/editor.py +112 -99
pygpt_net/controller/realtime/__init__.py +12 -0
pygpt_net/controller/realtime/manager.py +53 -0
pygpt_net/controller/realtime/realtime.py +268 -0
pygpt_net/controller/theme/theme.py +3 -2
pygpt_net/controller/ui/mode.py +7 -0
pygpt_net/controller/ui/ui.py +19 -1
pygpt_net/controller/ui/vision.py +4 -4
pygpt_net/core/agents/legacy.py +2 -2
pygpt_net/core/agents/runners/openai_workflow.py +2 -2
pygpt_net/core/assistants/files.py +5 -5
pygpt_net/core/assistants/store.py +4 -4
pygpt_net/core/audio/audio.py +6 -1
pygpt_net/core/audio/backend/native/__init__.py +12 -0
pygpt_net/core/audio/backend/{native.py → native/native.py} +426 -127
pygpt_net/core/audio/backend/native/player.py +139 -0
pygpt_net/core/audio/backend/native/realtime.py +250 -0
pygpt_net/core/audio/backend/pyaudio/__init__.py +12 -0
pygpt_net/core/audio/backend/pyaudio/playback.py +194 -0
pygpt_net/core/audio/backend/pyaudio/pyaudio.py +923 -0
pygpt_net/core/audio/backend/pyaudio/realtime.py +275 -0
pygpt_net/core/audio/backend/pygame/__init__.py +12 -0
pygpt_net/core/audio/backend/{pygame.py → pygame/pygame.py} +130 -19
pygpt_net/core/audio/backend/shared/__init__.py +38 -0
pygpt_net/core/audio/backend/shared/conversions.py +211 -0
pygpt_net/core/audio/backend/shared/envelope.py +38 -0
pygpt_net/core/audio/backend/shared/player.py +137 -0
pygpt_net/core/audio/backend/shared/rt.py +52 -0
pygpt_net/core/audio/capture.py +5 -0
pygpt_net/core/audio/output.py +13 -2
pygpt_net/core/audio/whisper.py +6 -2
pygpt_net/core/bridge/bridge.py +4 -3
pygpt_net/core/bridge/worker.py +31 -9
pygpt_net/core/debug/console/console.py +2 -2
pygpt_net/core/debug/presets.py +2 -2
pygpt_net/core/dispatcher/dispatcher.py +37 -1
pygpt_net/core/events/__init__.py +2 -1
pygpt_net/core/events/realtime.py +55 -0
pygpt_net/core/experts/experts.py +2 -2
pygpt_net/core/image/image.py +51 -1
pygpt_net/core/modes/modes.py +2 -2
pygpt_net/core/presets/presets.py +3 -3
pygpt_net/core/realtime/options.py +87 -0
pygpt_net/core/realtime/shared/__init__.py +0 -0
pygpt_net/core/realtime/shared/audio.py +213 -0
pygpt_net/core/realtime/shared/loop.py +64 -0
pygpt_net/core/realtime/shared/session.py +59 -0
pygpt_net/core/realtime/shared/text.py +37 -0
pygpt_net/core/realtime/shared/tools.py +276 -0
pygpt_net/core/realtime/shared/turn.py +38 -0
pygpt_net/core/realtime/shared/types.py +16 -0
pygpt_net/core/realtime/worker.py +164 -0
pygpt_net/core/tokens/tokens.py +4 -4
pygpt_net/core/types/__init__.py +1 -0
pygpt_net/core/types/image.py +48 -0
pygpt_net/core/types/mode.py +5 -2
pygpt_net/core/vision/analyzer.py +1 -1
pygpt_net/data/config/config.json +13 -4
pygpt_net/data/config/models.json +219 -101
pygpt_net/data/config/modes.json +3 -9
pygpt_net/data/config/settings.json +135 -27
pygpt_net/data/config/settings_section.json +2 -2
pygpt_net/data/locale/locale.de.ini +7 -7
pygpt_net/data/locale/locale.en.ini +25 -12
pygpt_net/data/locale/locale.es.ini +7 -7
pygpt_net/data/locale/locale.fr.ini +7 -7
pygpt_net/data/locale/locale.it.ini +7 -7
pygpt_net/data/locale/locale.pl.ini +8 -8
pygpt_net/data/locale/locale.uk.ini +7 -7
pygpt_net/data/locale/locale.zh.ini +3 -3
pygpt_net/data/locale/plugin.audio_input.en.ini +4 -0
pygpt_net/data/locale/plugin.audio_output.en.ini +4 -0
pygpt_net/item/model.py +23 -3
pygpt_net/plugin/audio_input/plugin.py +37 -4
pygpt_net/plugin/audio_input/simple.py +57 -8
pygpt_net/plugin/cmd_files/worker.py +3 -0
pygpt_net/plugin/openai_dalle/plugin.py +4 -4
pygpt_net/plugin/openai_vision/plugin.py +12 -13
pygpt_net/provider/agents/openai/agent.py +5 -5
pygpt_net/provider/agents/openai/agent_b2b.py +5 -5
pygpt_net/provider/agents/openai/agent_planner.py +5 -6
pygpt_net/provider/agents/openai/agent_with_experts.py +5 -5
pygpt_net/provider/agents/openai/agent_with_experts_feedback.py +4 -4
pygpt_net/provider/agents/openai/agent_with_feedback.py +4 -4
pygpt_net/provider/agents/openai/bot_researcher.py +2 -2
pygpt_net/provider/agents/openai/bots/research_bot/agents/planner_agent.py +1 -1
pygpt_net/provider/agents/openai/bots/research_bot/agents/search_agent.py +1 -1
pygpt_net/provider/agents/openai/bots/research_bot/agents/writer_agent.py +1 -1
pygpt_net/provider/agents/openai/evolve.py +5 -5
pygpt_net/provider/agents/openai/supervisor.py +4 -4
pygpt_net/provider/api/__init__.py +27 -0
pygpt_net/provider/api/anthropic/__init__.py +68 -0
pygpt_net/provider/api/google/__init__.py +295 -0
pygpt_net/provider/api/google/audio.py +121 -0
pygpt_net/provider/api/google/chat.py +591 -0
pygpt_net/provider/api/google/image.py +427 -0
pygpt_net/provider/api/google/realtime/__init__.py +12 -0
pygpt_net/provider/api/google/realtime/client.py +1945 -0
pygpt_net/provider/api/google/realtime/realtime.py +186 -0
pygpt_net/provider/api/google/tools.py +222 -0
pygpt_net/provider/api/google/vision.py +129 -0
pygpt_net/provider/{gpt → api/openai}/__init__.py +24 -4
pygpt_net/provider/api/openai/agents/__init__.py +0 -0
pygpt_net/provider/{gpt → api/openai}/agents/computer.py +1 -1
pygpt_net/provider/{gpt → api/openai}/agents/experts.py +1 -1
pygpt_net/provider/{gpt → api/openai}/agents/response.py +1 -1
pygpt_net/provider/{gpt → api/openai}/assistants.py +1 -1
pygpt_net/provider/{gpt → api/openai}/chat.py +15 -8
pygpt_net/provider/{gpt → api/openai}/completion.py +1 -1
pygpt_net/provider/{gpt → api/openai}/image.py +1 -1
pygpt_net/provider/api/openai/realtime/__init__.py +12 -0
pygpt_net/provider/api/openai/realtime/client.py +1828 -0
pygpt_net/provider/api/openai/realtime/realtime.py +194 -0
pygpt_net/provider/{gpt → api/openai}/remote_tools.py +1 -1
pygpt_net/provider/{gpt → api/openai}/responses.py +34 -20
pygpt_net/provider/{gpt → api/openai}/store.py +2 -2
pygpt_net/provider/{gpt → api/openai}/vision.py +1 -1
pygpt_net/provider/api/openai/worker/__init__.py +0 -0
pygpt_net/provider/{gpt → api/openai}/worker/assistants.py +4 -4
pygpt_net/provider/{gpt → api/openai}/worker/importer.py +10 -10
pygpt_net/provider/audio_input/google_genai.py +103 -0
pygpt_net/provider/audio_input/openai_whisper.py +1 -1
pygpt_net/provider/audio_output/google_genai_tts.py +229 -0
pygpt_net/provider/audio_output/openai_tts.py +9 -6
pygpt_net/provider/core/config/patch.py +26 -0
pygpt_net/provider/core/model/patch.py +20 -0
pygpt_net/provider/core/preset/json_file.py +2 -4
pygpt_net/provider/llms/anthropic.py +2 -5
pygpt_net/provider/llms/base.py +4 -3
pygpt_net/provider/llms/google.py +8 -9
pygpt_net/provider/llms/openai.py +1 -1
pygpt_net/provider/loaders/hub/image_vision/base.py +1 -1
pygpt_net/ui/dialog/preset.py +71 -55
pygpt_net/ui/layout/toolbox/footer.py +16 -0
pygpt_net/ui/layout/toolbox/image.py +5 -0
pygpt_net/ui/main.py +6 -4
pygpt_net/ui/widget/option/combo.py +15 -1
pygpt_net/utils.py +9 -0
{pygpt_net-2.6.29.dist-info → pygpt_net-2.6.31.dist-info}/METADATA +55 -55
{pygpt_net-2.6.29.dist-info → pygpt_net-2.6.31.dist-info}/RECORD +181 -135
pygpt_net/core/audio/backend/pyaudio.py +0 -554
/pygpt_net/{provider/gpt/agents → controller/chat/handler}/__init__.py +0 -0
/pygpt_net/{provider/gpt/worker → core/realtime}/__init__.py +0 -0
/pygpt_net/provider/{gpt → api/openai}/agents/client.py +0 -0
/pygpt_net/provider/{gpt → api/openai}/agents/remote_tools.py +0 -0
/pygpt_net/provider/{gpt → api/openai}/agents/utils.py +0 -0
/pygpt_net/provider/{gpt → api/openai}/audio.py +0 -0
/pygpt_net/provider/{gpt → api/openai}/computer.py +0 -0
/pygpt_net/provider/{gpt → api/openai}/container.py +0 -0
/pygpt_net/provider/{gpt → api/openai}/summarizer.py +0 -0
/pygpt_net/provider/{gpt → api/openai}/tools.py +0 -0
/pygpt_net/provider/{gpt → api/openai}/utils.py +0 -0
{pygpt_net-2.6.29.dist-info → pygpt_net-2.6.31.dist-info}/LICENSE +0 -0
{pygpt_net-2.6.29.dist-info → pygpt_net-2.6.31.dist-info}/WHEEL +0 -0
{pygpt_net-2.6.29.dist-info → pygpt_net-2.6.31.dist-info}/entry_points.txt +0 -0

pygpt_net/core/audio/backend/pyaudio/realtime.py ADDED Viewed

@@ -0,0 +1,275 @@
+#!/usr/bin/env python3
+# -*- coding: utf-8 -*-
+# ================================================== #
+# This file is a part of PYGPT package               #
+# Website: https://pygpt.net                         #
+# GitHub:  https://github.com/szczyglis-dev/py-gpt   #
+# MIT License                                        #
+# Created By  : Marcin Szczygliński                  #
+# Updated Date: 2025.08.31 23:00:00                  #
+# ================================================== #
+import threading
+from typing import Optional
+import numpy as np
+from PySide6.QtCore import QTimer, QObject, Qt
+class RealtimeSessionPyAudio(QObject):
+    """
+    Realtime PCM playback session using PyAudio in callback mode.
+    Consumes already-converted PCM frames, keeps GUI responsive and emits volume updates.
+    """
+    def __init__(
+            self,
+            device_index: int,
+            rate: int,
+            channels: int,
+            width_bytes: int = 2,
+            parent: Optional[QObject] = None,
+            volume_emitter: Optional[callable] = None,
+    ):
+        super().__init__(parent)
+        import pyaudio  # local import to keep backend import-safe
+        self._pa = pyaudio.PyAudio()
+        self.device_index = int(device_index)
+        self.rate = int(rate)
+        self.channels = int(channels)
+        self.width = int(width_bytes)
+        self.frame_bytes = max(1, self.channels * self.width)
+        self.bytes_per_ms = max(1, int(self.rate * self.frame_bytes / 1000))
+        # choose PyAudio format from width
+        self.pa_format = self._pa.get_format_from_width(
+            self.width,
+            unsigned=(self.width == 1)
+        )
+        # internal buffers/flags
+        self._buffer = bytearray()
+        self._buf_lock = threading.Lock()
+        self._final = False
+        self._tail_ms = 60  # add a small silence tail to avoid clicks
+        # volume metering
+        self._volume_emitter = volume_emitter
+        self._vol_buffer = bytearray()
+        self._vol_lock = threading.Lock()
+        self._vol_timer = QTimer(self)
+        self._vol_timer.setTimerType(Qt.PreciseTimer)
+        self._vol_timer.setInterval(33)  # ~30 Hz meter
+        self._vol_timer.timeout.connect(self._emit_volume_tick)
+        self._vol_timer.start()
+        # open callback-based output stream
+        self._stream = self._pa.open(
+            format=self.pa_format,
+            channels=self.channels,
+            rate=self.rate,
+            output=True,
+            output_device_index=self.device_index,
+            stream_callback=self._callback,
+            frames_per_buffer=max(256, int(self.rate / 100))  # ~10 ms
+        )
+        try:
+            self._stream.start_stream()
+        except Exception:
+            pass
+        # stop callback (set by backend)
+        self.on_stopped = None
+    def is_active(self) -> bool:
+        """
+        Return True if PortAudio stream is active.
+        :return: True if active
+        """
+        try:
+            return self._stream is not None and self._stream.is_active()
+        except Exception:
+            return False
+    def is_finalized(self) -> bool:
+        """
+        Return True if session was marked final.
+        :return: True if final
+        """
+        return bool(self._final)
+    def feed(self, data: bytes) -> None:
+        """
+        Append PCM bytes (already in session/device format).
+        :param data: bytes to append
+        """
+        if not data:
+            return
+        with self._buf_lock:
+            self._buffer.extend(data)
+        # push to volume window from the same bytes
+        self._vol_push(data)
+    def mark_final(self) -> None:
+        """No more data will be supplied; add a small silence tail."""
+        if not self._final:
+            pad = self.bytes_per_ms * self._tail_ms
+            pad -= (pad % self.frame_bytes)
+            if pad > 0:
+                with self._buf_lock:
+                    self._buffer.extend(self._silence(pad))
+        self._final = True
+    def stop(self) -> None:
+        """Stop playback and free resources."""
+        try:
+            if self._vol_timer:
+                self._vol_timer.stop()
+        except Exception:
+            pass
+        try:
+            if self._stream and self._stream.is_active():
+                self._stream.stop_stream()
+        except Exception:
+            pass
+        try:
+            if self._stream:
+                self._stream.close()
+        except Exception:
+            pass
+        try:
+            if self._pa:
+                self._pa.terminate()
+        except Exception:
+            pass
+        # zero the meter
+        try:
+            if self._volume_emitter:
+                self._volume_emitter(0)
+        except Exception:
+            pass
+        self._stream = None
+        self._pa = None
+        cb = self.on_stopped
+        self.on_stopped = None
+        if cb:
+            try:
+                cb()
+            except Exception:
+                pass
+        self.deleteLater()
+    # ---- internal ----
+    def _callback(self, in_data, frame_count, time_info, status):
+        """
+        PortAudio callback: deliver frames from buffer.
+        :param in_data: input data (ignored)
+        :param frame_count: number of frames requested
+        :param time_info: timing info (ignored)
+        :param status: status flags (ignored)
+        :return: (data bytes, flag)
+        """
+        import pyaudio
+        need = frame_count * self.frame_bytes
+        out = b""
+        with self._buf_lock:
+            if len(self._buffer) >= need:
+                out = bytes(self._buffer[:need])
+                del self._buffer[:need]
+            elif len(self._buffer) > 0:
+                out = bytes(self._buffer)
+                self._buffer.clear()
+        if len(out) < need:
+            out += self._silence(need - len(out))
+        # meter push from what is actually written
+        self._vol_push(out)
+        # auto-finish: when final and nothing more to play, complete and stop()
+        if self._final and self._buffer_empty():
+            QTimer.singleShot(0, self.stop)  # stop on the GUI thread
+            return out, pyaudio.paComplete
+        return out, pyaudio.paContinue
+    def _buffer_empty(self) -> bool:
+        """
+        Check if internal buffer is empty.
+        :return: True if empty
+        """
+        with self._buf_lock:
+            return len(self._buffer) == 0
+    def _silence(self, n: int) -> bytes:
+        """
+        Generate n bytes of silence.
+        :param n: number of bytes
+        :return: bytes of silence
+        """
+        if n <= 0:
+            return b""
+        if self.width == 1:
+            return bytes([128]) * n  # silence for unsigned 8-bit
+        return b"\x00" * n
+    def _vol_push(self, chunk: bytes) -> None:
+        """
+        Push chunk to volume buffer and trim if needed.
+        :param chunk: bytes to push to volume buffer
+        """
+        if not chunk:
+            return
+        with self._vol_lock:
+            self._vol_buffer.extend(chunk)
+            max_bytes = max(1, self.bytes_per_ms * 100)  # ~100 ms window
+            if len(self._vol_buffer) > max_bytes:
+                del self._vol_buffer[:len(self._vol_buffer) - max_bytes]
+    def _emit_volume_tick(self) -> None:
+        """Emit volume level based on current volume buffer."""
+        if self._volume_emitter is None:
+            return
+        with self._vol_lock:
+            buf = bytes(self._vol_buffer)
+        if not buf:
+            try:
+                self._volume_emitter(0)
+            except Exception:
+                pass
+            return
+        try:
+            # decode by sample width
+            if self.width == 1:
+                arr = np.frombuffer(buf, dtype=np.uint8).astype(np.int16)
+                arr = (arr - 128).astype(np.float32) / 128.0
+            elif self.width == 2:
+                arr = np.frombuffer(buf, dtype=np.int16).astype(np.float32) / 32768.0
+            elif self.width == 4:
+                arr = np.frombuffer(buf, dtype=np.int32).astype(np.float32) / 2147483648.0
+            else:
+                arr = np.frombuffer(buf, dtype=np.int16).astype(np.float32) / 32768.0
+            if arr.size == 0:
+                self._volume_emitter(0)
+                return
+            rms = float(np.sqrt(np.mean(arr.astype(np.float64) ** 2)))
+            db = -60.0 if rms <= 1e-9 else 20.0 * float(np.log10(min(1.0, rms)))
+            db = max(-60.0, min(0.0, db))
+            volume = int(((db + 60.0) / 60.0) * 100.0)
+            self._volume_emitter(volume)
+        except Exception:
+            pass

pygpt_net/core/audio/backend/pygame/__init__.py ADDED Viewed

@@ -0,0 +1,12 @@
+#!/usr/bin/env python3
+# -*- coding: utf-8 -*-
+# ================================================== #
+# This file is a part of PYGPT package               #
+# Website: https://pygpt.net                         #
+# GitHub:  https://github.com/szczyglis-dev/py-gpt   #
+# MIT License                                        #
+# Created By  : Marcin Szczygliński                  #
+# Updated Date: 2025.08.31 23:00:00                  #
+# ================================================== #
+from .pygame import PygameBackend

pygpt_net/core/audio/backend/{pygame.py → pygame/pygame.py} RENAMED Viewed

@@ -6,15 +6,20 @@
 # GitHub:  https://github.com/szczyglis-dev/py-gpt   #
 # MIT License                                        #
 # Created By  : Marcin Szczygliński                  #
-# Updated Date: 2025.08.27 07:00:00                  #
+# Updated Date: 2025.08.31 04:00:00                  #
 # ================================================== #
 import time
 import wave
+import numpy as np
 from typing import List, Tuple
+from collections import deque
+from threading import Lock
 from PySide6.QtCore import QTimer
+from ..shared import f32_to_s16le, build_rt_input_delta_event
 class PygameBackend:
     MIN_FRAMES = 25  # minimum frames to start transcription
@@ -22,6 +27,8 @@ class PygameBackend:
         """
         Audio input capture core using pygame's SDL2 audio capture backend.
         Captured devices are stored as device name strings.
+        :param window: Window instance
         """
         self.window = window
         self.path = None
@@ -55,10 +62,14 @@ class PygameBackend:
         self.initialized = False
         self.mode = "input"  # input|control
+        # --- REALTIME INPUT (mic -> dispatcher) ---
+        self._rt_signals = None           # set with set_rt_signals()
+        self._rt_queue = deque()          # queue of raw float32 chunks from SDL audio thread
+        self._rt_lock = Lock()            # protects _rt_queue
+        self._is_recording = False        # suppress updates after stop
     def init(self):
-        """
-        Initialize the pygame audio system if not already initialized.
-        """
+        """Initialize the pygame audio system if not already initialized."""
         if not self.initialized:
             import pygame
             from pygame._sdl2 import (
@@ -110,10 +121,20 @@ class PygameBackend:
         """
         self.path = path
+    def set_rt_signals(self, signals) -> None:
+        """
+        Set signals object for realtime events.
+        :param signals: Signals object
+        """
+        self._rt_signals = signals
     def start(self):
         """
         Start audio recording using pygame’s SDL2 audio capture.
         Returns True if started successfully.
+        :return: True if started
         """
         self.init()
         # Clear previously recorded frames.
@@ -136,15 +157,23 @@ class PygameBackend:
         self.timer.timeout.connect(self._update_level)
         self.timer.start(50)  # update every 50ms
+        # mark recording as active after setup
+        self._is_recording = True
         return True
     def stop(self):
         """
         Stop audio recording.
         Returns True if stopped and audio data was saved (if path is set).
+        :return: True if stopped and saved
         """
         self.init()
         result = False
+        # immediately mark as not recording
+        self._is_recording = False
         if self.audio_source is not None:
             if self.timer is not None:
                 self.timer.stop()
@@ -154,6 +183,12 @@ class PygameBackend:
             self.audio_source.pause(1)
             self.audio_source = None
+            # Emit final input chunk marker for realtime consumers
+            try:
+                self._emit_rt_input_delta(b"", final=True)
+            except Exception:
+                pass
             if self.frames:
                 if self.path:
                     self.save_audio_file(self.path)
@@ -162,35 +197,48 @@ class PygameBackend:
                     print("File path is not set.")
             else:
                 print("No audio data recorded")
+        # reset level indicator
+        try:
+            self.reset_audio_level()
+        except Exception:
+            pass
         return result
     def has_source(self) -> bool:
         """
         Check if the audio source is available.
+        :return: True if audio source is available
         """
         return self.audio_source is not None
     def has_frames(self) -> bool:
         """
         Check if any audio frames have been recorded.
+        :return: True if any frames recorded
         """
         return bool(self.frames)
     def has_min_frames(self) -> bool:
         """
         Check if at least MIN_FRAMES audio frames have been recorded.
+        :return: True if at least MIN_FRAMES recorded
         """
         return len(self.frames) >= self.MIN_FRAMES
     def reset_audio_level(self):
-        """
-        Reset the audio level bar (if available).
-        """
+        """Reset the audio level bar (if available)."""
         self.window.controller.audio.ui.on_input_volume_change(0, self.mode)
     def check_audio_input(self) -> bool:
         """
         Check if a default audio input device is available using pygame.
+        :return: True if an audio input device is available
         """
         from pygame._sdl2 import (
             get_audio_device_names,
@@ -226,6 +274,8 @@ class PygameBackend:
     def device_changed(self, index: int):
         """
         Change the selected audio input device by its index in the devices list.
+        :param index: Index of the device in the devices list.
         """
         self.init()
         if 0 <= index < len(self.devices):
@@ -234,9 +284,7 @@ class PygameBackend:
             self.selected_device = None
     def prepare_device(self):
-        """
-        Set the current audio input device based on configuration.
-        """
+        """Set the current audio input device based on configuration."""
         self.init()
         if self.window is not None and hasattr(self.window, "core"):
             device_index = int(self.window.core.config.get('audio.input.device', 0))
@@ -251,14 +299,26 @@ class PygameBackend:
         """
         Callback function called in the audio thread.
         It receives a memoryview of audio data which is converted to bytes and appended.
+        :param audiodevice: The audio device instance (not used here).
+        :param audiomemoryview: MemoryView of the captured audio data.
         """
+        if not self._is_recording:
+            return
         # Append captured audio bytes to the frames list.
-        self.frames.append(bytes(audiomemoryview))
+        chunk = bytes(audiomemoryview)
+        self.frames.append(chunk)
+        # Enqueue chunk for realtime emission (processed on the Qt thread).
+        try:
+            with self._rt_lock:
+                self._rt_queue.append(chunk)
+        except Exception:
+            pass
     def setup_audio_input(self):
-        """
-        Create an AudioDevice with the selected device name and start recording.
-        """
+        """Create an AudioDevice with the selected device name and start recording."""
         self.init()
         from pygame._sdl2 import (
             AudioDevice,
@@ -289,16 +349,18 @@ class PygameBackend:
         Periodically called (via QTimer) to compute RMS from the last captured audio chunk
         and update the audio level bar.
         """
+        # Drain realtime queue first to keep latency low.
+        self._drain_rt_queue()
         if not self.frames:
             return
-        import numpy as np
         # Use the last captured chunk.
         last_chunk = self.frames[-1]
         try:
             # Interpret the bytes as float32 samples.
             samples = np.frombuffer(last_chunk, dtype=np.float32)
-        except Exception as e:
+        except Exception:
             return
         if samples.size == 0:
             return
@@ -329,7 +391,6 @@ class PygameBackend:
         :param filename: The path to the output WAV file.
         """
-        import numpy as np
         full_data = b"".join(self.frames)
         try:
             data_array = np.frombuffer(full_data, dtype=np.float32)
@@ -337,7 +398,7 @@ class PygameBackend:
             print("Error converting audio data:", e)
             return
         # Convert float32 values in the range -1.0 ... 1.0 to PCM int16.
-        int_data = (data_array * 32767).astype(np.int16)
+        int_data = (np.clip(data_array, -1.0, 1.0) * 32767.0).astype(np.int16)
         new_data = int_data.tobytes()
         with wave.open(filename, 'wb') as wf:
             wf.setnchannels(self.channels)
@@ -490,11 +551,61 @@ class PygameBackend:
     def get_default_input_device(self) -> tuple:
         """
         Retrieve the default input device using PyAudio.
+        :return: (index, name)
         """
         return 0, "Default Input Device"
     def get_default_output_device(self) -> tuple:
         """
         Retrieve the default output device using PyAudio.
+        :return: (index, name)
         """
-        return 0, "Default Output Device"
+        return 0, "Default Output Device"
+    # --------------------
+    # REALTIME INPUT HELPERS
+    # --------------------
+    def _emit_rt_input_delta(self, data: bytes, final: bool) -> None:
+        """
+        Emit RT_INPUT_AUDIO_DELTA with a provider-agnostic payload.
+        Standardizes to PCM16, little-endian, and includes rate/channels.
+        :param data: PCM16LE audio bytes
+        :param final: True if this is the final chunk
+        """
+        if not self._rt_signals:
+            return
+        try:
+            event = build_rt_input_delta_event(
+                rate=int(self.rate),
+                channels=int(self.channels),
+                data=data or b"",
+                final=bool(final),
+            )
+            # Ensure emission on the Qt thread
+            QTimer.singleShot(0, lambda: self._rt_signals.response.emit(event))
+        except Exception:
+            pass
+    def _drain_rt_queue(self) -> None:
+        """
+        Drain queued float32 chunks from the audio thread, convert to PCM16,
+        and emit a single realtime delta event.
+        """
+        if not self._rt_signals:
+            # nothing to emit
+            with self._rt_lock:
+                self._rt_queue.clear()
+            return
+        with self._rt_lock:
+            if not self._rt_queue:
+                return
+            raw = b"".join(self._rt_queue)
+            self._rt_queue.clear()
+        s16 = f32_to_s16le(raw)
+        if s16:
+            self._emit_rt_input_delta(s16, final=False)

pygpt_net/core/audio/backend/shared/__init__.py ADDED Viewed

@@ -0,0 +1,38 @@
+#!/usr/bin/env python3
+# -*- coding: utf-8 -*-
+# ================================================== #
+# This file is a part of PYGPT package               #
+# Website: https://pygpt.net                         #
+# GitHub:  https://github.com/szczyglis-dev/py-gpt   #
+# MIT License                                        #
+# Created By  : Marcin Szczygliński                  #
+# Updated Date: 2025.08.31 23:00:00                  #
+# ================================================== #
+# Shared helpers for audio backends
+from .rt import (
+    build_rt_input_delta_event,
+    build_output_volume_event,
+)
+from .conversions import (
+    qaudio_dtype,
+    qaudio_norm_factor,
+    qaudio_to_s16le,
+    pyaudio_to_s16le,
+    f32_to_s16le,
+    convert_s16_pcm,
+)
+from .envelope import compute_envelope_from_file
+__all__ = [
+    "build_rt_input_delta_event",
+    "build_output_volume_event",
+    "qaudio_dtype",
+    "qaudio_norm_factor",
+    "qaudio_to_s16le",
+    "pyaudio_to_s16le",
+    "f32_to_s16le",
+    "convert_s16_pcm",
+    "compute_envelope_from_file",
+]

pygpt-net 2.6.29__py3-none-any.whl → 2.6.31__py3-none-any.whl

pygpt-net 2.6.29__py3-none-any.whl → 2.6.31__py3-none-any.whl