pygpt-net 2.6.29__py3-none-any.whl → 2.6.31__py3-none-any.whl

This diff compares the contents of publicly released package versions as they appear in their respective public registries, and is provided for informational purposes only.
Files changed (182)
  1. pygpt_net/CHANGELOG.txt +15 -0
  2. pygpt_net/__init__.py +3 -3
  3. pygpt_net/app.py +4 -0
  4. pygpt_net/{container.py → app_core.py} +5 -6
  5. pygpt_net/controller/__init__.py +5 -2
  6. pygpt_net/controller/access/control.py +1 -9
  7. pygpt_net/controller/assistant/assistant.py +4 -4
  8. pygpt_net/controller/assistant/batch.py +7 -7
  9. pygpt_net/controller/assistant/files.py +4 -4
  10. pygpt_net/controller/assistant/threads.py +3 -3
  11. pygpt_net/controller/attachment/attachment.py +4 -7
  12. pygpt_net/controller/audio/audio.py +25 -1
  13. pygpt_net/controller/audio/ui.py +2 -2
  14. pygpt_net/controller/chat/audio.py +1 -8
  15. pygpt_net/controller/chat/common.py +30 -4
  16. pygpt_net/controller/chat/handler/stream_worker.py +1124 -0
  17. pygpt_net/controller/chat/output.py +8 -3
  18. pygpt_net/controller/chat/stream.py +4 -405
  19. pygpt_net/controller/chat/text.py +3 -2
  20. pygpt_net/controller/chat/vision.py +11 -19
  21. pygpt_net/controller/config/placeholder.py +1 -1
  22. pygpt_net/controller/ctx/ctx.py +1 -1
  23. pygpt_net/controller/ctx/summarizer.py +1 -1
  24. pygpt_net/controller/kernel/kernel.py +11 -3
  25. pygpt_net/controller/kernel/reply.py +5 -1
  26. pygpt_net/controller/mode/mode.py +21 -12
  27. pygpt_net/controller/plugins/settings.py +3 -2
  28. pygpt_net/controller/presets/editor.py +112 -99
  29. pygpt_net/controller/realtime/__init__.py +12 -0
  30. pygpt_net/controller/realtime/manager.py +53 -0
  31. pygpt_net/controller/realtime/realtime.py +268 -0
  32. pygpt_net/controller/theme/theme.py +3 -2
  33. pygpt_net/controller/ui/mode.py +7 -0
  34. pygpt_net/controller/ui/ui.py +19 -1
  35. pygpt_net/controller/ui/vision.py +4 -4
  36. pygpt_net/core/agents/legacy.py +2 -2
  37. pygpt_net/core/agents/runners/openai_workflow.py +2 -2
  38. pygpt_net/core/assistants/files.py +5 -5
  39. pygpt_net/core/assistants/store.py +4 -4
  40. pygpt_net/core/audio/audio.py +6 -1
  41. pygpt_net/core/audio/backend/native/__init__.py +12 -0
  42. pygpt_net/core/audio/backend/{native.py → native/native.py} +426 -127
  43. pygpt_net/core/audio/backend/native/player.py +139 -0
  44. pygpt_net/core/audio/backend/native/realtime.py +250 -0
  45. pygpt_net/core/audio/backend/pyaudio/__init__.py +12 -0
  46. pygpt_net/core/audio/backend/pyaudio/playback.py +194 -0
  47. pygpt_net/core/audio/backend/pyaudio/pyaudio.py +923 -0
  48. pygpt_net/core/audio/backend/pyaudio/realtime.py +275 -0
  49. pygpt_net/core/audio/backend/pygame/__init__.py +12 -0
  50. pygpt_net/core/audio/backend/{pygame.py → pygame/pygame.py} +130 -19
  51. pygpt_net/core/audio/backend/shared/__init__.py +38 -0
  52. pygpt_net/core/audio/backend/shared/conversions.py +211 -0
  53. pygpt_net/core/audio/backend/shared/envelope.py +38 -0
  54. pygpt_net/core/audio/backend/shared/player.py +137 -0
  55. pygpt_net/core/audio/backend/shared/rt.py +52 -0
  56. pygpt_net/core/audio/capture.py +5 -0
  57. pygpt_net/core/audio/output.py +13 -2
  58. pygpt_net/core/audio/whisper.py +6 -2
  59. pygpt_net/core/bridge/bridge.py +4 -3
  60. pygpt_net/core/bridge/worker.py +31 -9
  61. pygpt_net/core/debug/console/console.py +2 -2
  62. pygpt_net/core/debug/presets.py +2 -2
  63. pygpt_net/core/dispatcher/dispatcher.py +37 -1
  64. pygpt_net/core/events/__init__.py +2 -1
  65. pygpt_net/core/events/realtime.py +55 -0
  66. pygpt_net/core/experts/experts.py +2 -2
  67. pygpt_net/core/image/image.py +51 -1
  68. pygpt_net/core/modes/modes.py +2 -2
  69. pygpt_net/core/presets/presets.py +3 -3
  70. pygpt_net/core/realtime/options.py +87 -0
  71. pygpt_net/core/realtime/shared/__init__.py +0 -0
  72. pygpt_net/core/realtime/shared/audio.py +213 -0
  73. pygpt_net/core/realtime/shared/loop.py +64 -0
  74. pygpt_net/core/realtime/shared/session.py +59 -0
  75. pygpt_net/core/realtime/shared/text.py +37 -0
  76. pygpt_net/core/realtime/shared/tools.py +276 -0
  77. pygpt_net/core/realtime/shared/turn.py +38 -0
  78. pygpt_net/core/realtime/shared/types.py +16 -0
  79. pygpt_net/core/realtime/worker.py +164 -0
  80. pygpt_net/core/tokens/tokens.py +4 -4
  81. pygpt_net/core/types/__init__.py +1 -0
  82. pygpt_net/core/types/image.py +48 -0
  83. pygpt_net/core/types/mode.py +5 -2
  84. pygpt_net/core/vision/analyzer.py +1 -1
  85. pygpt_net/data/config/config.json +13 -4
  86. pygpt_net/data/config/models.json +219 -101
  87. pygpt_net/data/config/modes.json +3 -9
  88. pygpt_net/data/config/settings.json +135 -27
  89. pygpt_net/data/config/settings_section.json +2 -2
  90. pygpt_net/data/locale/locale.de.ini +7 -7
  91. pygpt_net/data/locale/locale.en.ini +25 -12
  92. pygpt_net/data/locale/locale.es.ini +7 -7
  93. pygpt_net/data/locale/locale.fr.ini +7 -7
  94. pygpt_net/data/locale/locale.it.ini +7 -7
  95. pygpt_net/data/locale/locale.pl.ini +8 -8
  96. pygpt_net/data/locale/locale.uk.ini +7 -7
  97. pygpt_net/data/locale/locale.zh.ini +3 -3
  98. pygpt_net/data/locale/plugin.audio_input.en.ini +4 -0
  99. pygpt_net/data/locale/plugin.audio_output.en.ini +4 -0
  100. pygpt_net/item/model.py +23 -3
  101. pygpt_net/plugin/audio_input/plugin.py +37 -4
  102. pygpt_net/plugin/audio_input/simple.py +57 -8
  103. pygpt_net/plugin/cmd_files/worker.py +3 -0
  104. pygpt_net/plugin/openai_dalle/plugin.py +4 -4
  105. pygpt_net/plugin/openai_vision/plugin.py +12 -13
  106. pygpt_net/provider/agents/openai/agent.py +5 -5
  107. pygpt_net/provider/agents/openai/agent_b2b.py +5 -5
  108. pygpt_net/provider/agents/openai/agent_planner.py +5 -6
  109. pygpt_net/provider/agents/openai/agent_with_experts.py +5 -5
  110. pygpt_net/provider/agents/openai/agent_with_experts_feedback.py +4 -4
  111. pygpt_net/provider/agents/openai/agent_with_feedback.py +4 -4
  112. pygpt_net/provider/agents/openai/bot_researcher.py +2 -2
  113. pygpt_net/provider/agents/openai/bots/research_bot/agents/planner_agent.py +1 -1
  114. pygpt_net/provider/agents/openai/bots/research_bot/agents/search_agent.py +1 -1
  115. pygpt_net/provider/agents/openai/bots/research_bot/agents/writer_agent.py +1 -1
  116. pygpt_net/provider/agents/openai/evolve.py +5 -5
  117. pygpt_net/provider/agents/openai/supervisor.py +4 -4
  118. pygpt_net/provider/api/__init__.py +27 -0
  119. pygpt_net/provider/api/anthropic/__init__.py +68 -0
  120. pygpt_net/provider/api/google/__init__.py +295 -0
  121. pygpt_net/provider/api/google/audio.py +121 -0
  122. pygpt_net/provider/api/google/chat.py +591 -0
  123. pygpt_net/provider/api/google/image.py +427 -0
  124. pygpt_net/provider/api/google/realtime/__init__.py +12 -0
  125. pygpt_net/provider/api/google/realtime/client.py +1945 -0
  126. pygpt_net/provider/api/google/realtime/realtime.py +186 -0
  127. pygpt_net/provider/api/google/tools.py +222 -0
  128. pygpt_net/provider/api/google/vision.py +129 -0
  129. pygpt_net/provider/{gpt → api/openai}/__init__.py +24 -4
  130. pygpt_net/provider/api/openai/agents/__init__.py +0 -0
  131. pygpt_net/provider/{gpt → api/openai}/agents/computer.py +1 -1
  132. pygpt_net/provider/{gpt → api/openai}/agents/experts.py +1 -1
  133. pygpt_net/provider/{gpt → api/openai}/agents/response.py +1 -1
  134. pygpt_net/provider/{gpt → api/openai}/assistants.py +1 -1
  135. pygpt_net/provider/{gpt → api/openai}/chat.py +15 -8
  136. pygpt_net/provider/{gpt → api/openai}/completion.py +1 -1
  137. pygpt_net/provider/{gpt → api/openai}/image.py +1 -1
  138. pygpt_net/provider/api/openai/realtime/__init__.py +12 -0
  139. pygpt_net/provider/api/openai/realtime/client.py +1828 -0
  140. pygpt_net/provider/api/openai/realtime/realtime.py +194 -0
  141. pygpt_net/provider/{gpt → api/openai}/remote_tools.py +1 -1
  142. pygpt_net/provider/{gpt → api/openai}/responses.py +34 -20
  143. pygpt_net/provider/{gpt → api/openai}/store.py +2 -2
  144. pygpt_net/provider/{gpt → api/openai}/vision.py +1 -1
  145. pygpt_net/provider/api/openai/worker/__init__.py +0 -0
  146. pygpt_net/provider/{gpt → api/openai}/worker/assistants.py +4 -4
  147. pygpt_net/provider/{gpt → api/openai}/worker/importer.py +10 -10
  148. pygpt_net/provider/audio_input/google_genai.py +103 -0
  149. pygpt_net/provider/audio_input/openai_whisper.py +1 -1
  150. pygpt_net/provider/audio_output/google_genai_tts.py +229 -0
  151. pygpt_net/provider/audio_output/openai_tts.py +9 -6
  152. pygpt_net/provider/core/config/patch.py +26 -0
  153. pygpt_net/provider/core/model/patch.py +20 -0
  154. pygpt_net/provider/core/preset/json_file.py +2 -4
  155. pygpt_net/provider/llms/anthropic.py +2 -5
  156. pygpt_net/provider/llms/base.py +4 -3
  157. pygpt_net/provider/llms/google.py +8 -9
  158. pygpt_net/provider/llms/openai.py +1 -1
  159. pygpt_net/provider/loaders/hub/image_vision/base.py +1 -1
  160. pygpt_net/ui/dialog/preset.py +71 -55
  161. pygpt_net/ui/layout/toolbox/footer.py +16 -0
  162. pygpt_net/ui/layout/toolbox/image.py +5 -0
  163. pygpt_net/ui/main.py +6 -4
  164. pygpt_net/ui/widget/option/combo.py +15 -1
  165. pygpt_net/utils.py +9 -0
  166. {pygpt_net-2.6.29.dist-info → pygpt_net-2.6.31.dist-info}/METADATA +55 -55
  167. {pygpt_net-2.6.29.dist-info → pygpt_net-2.6.31.dist-info}/RECORD +181 -135
  168. pygpt_net/core/audio/backend/pyaudio.py +0 -554
  169. /pygpt_net/{provider/gpt/agents → controller/chat/handler}/__init__.py +0 -0
  170. /pygpt_net/{provider/gpt/worker → core/realtime}/__init__.py +0 -0
  171. /pygpt_net/provider/{gpt → api/openai}/agents/client.py +0 -0
  172. /pygpt_net/provider/{gpt → api/openai}/agents/remote_tools.py +0 -0
  173. /pygpt_net/provider/{gpt → api/openai}/agents/utils.py +0 -0
  174. /pygpt_net/provider/{gpt → api/openai}/audio.py +0 -0
  175. /pygpt_net/provider/{gpt → api/openai}/computer.py +0 -0
  176. /pygpt_net/provider/{gpt → api/openai}/container.py +0 -0
  177. /pygpt_net/provider/{gpt → api/openai}/summarizer.py +0 -0
  178. /pygpt_net/provider/{gpt → api/openai}/tools.py +0 -0
  179. /pygpt_net/provider/{gpt → api/openai}/utils.py +0 -0
  180. {pygpt_net-2.6.29.dist-info → pygpt_net-2.6.31.dist-info}/LICENSE +0 -0
  181. {pygpt_net-2.6.29.dist-info → pygpt_net-2.6.31.dist-info}/WHEEL +0 -0
  182. {pygpt_net-2.6.29.dist-info → pygpt_net-2.6.31.dist-info}/entry_points.txt +0 -0
pygpt_net/data/locale/locale.uk.ini CHANGED
@@ -845,7 +845,7 @@ mode.agent_openai.tooltip = Просунуті агенти (OpenAI)
  mode.agent.tooltip = Прості агенти (legacy)
  mode.assistant = Помічник
  mode.assistant.tooltip = Чат за допомогою API Асистентів
- mode.audio = Чат з аудіо
+ mode.audio = Realtime + audio
  mode.chat = Чат
  mode.chat.tooltip = Режим чату (за замовчуванням)
  mode.completion = Завершення
@@ -1174,9 +1174,9 @@ settings.ctx.sources = Показати джерела індексу Llama
  settings.ctx.sources.desc = Якщо включено, використані джерела будуть відображатися в відповіді (якщо доступно, не працюватиме в потоковому чаті)
  settings.ctx.use_extra = Використовувати додатковий контекст виводу
  settings.ctx.use_extra.desc = Якщо увімкнено, звичайний текстовий вивід (якщо доступний) з результатів команд буде відображений поруч з JSON виводом.
+ settings.debug.show_menu = Показати меню налагодження
  settings.defaults.app.confirm = Завантажити заводські налаштування додатку?
  settings.defaults.user.confirm = Відмінити поточні зміни?
- settings.developer.debug = Показати меню налагодження
  settings.dict.delete.confirm = Видалити елемент зі списку?
  settings.download.dir = Директорія для завантаження файлів
  settings.download.dir.desc = Піддиректорія для завантажених файлів, наприклад, у режимі помічників, всередині "data"
@@ -1197,9 +1197,9 @@ settings.frequency_penalty = Частотний штраф
  settings.func_call.native = Використовувати рідні виклики функцій API
  settings.func_call.native.desc = Якщо увімкнено, програма буде використовувати рідні виклики функцій API замість внутрішнього формату pygpt і нижченаведених запитів команд не використовуватимуться. Лише режими чату та асистентів.
  settings.img_dialog_open = Відкрити діалогове вікно зображення після генерації (Режим зображення)
- settings.img_prompt_model = DALL-E: модель генерації запиту
- settings.img_quality = DALL-E: якість зображення
- settings.img_resolution = DALL-E: розмір зображення
+ settings.img_prompt_model = Модель Генерації Запиту
+ settings.img_quality = Якість Зображення
+ settings.img_resolution = Розмір Зображення
  settings.layout.animation.disable = Вимкнути анімації
  settings.layout.animation.disable.desc = Вимикає анімації макета, як анімовані завантажувачі тощо.
  settings.layout.density = Щільність компонування
@@ -1294,7 +1294,7 @@ settings.prompt.ctx.auto_summary.user = Контекст: авто-резюме
  settings.prompt.ctx.auto_summary.user.desc = Заповнювачі: {input}, {output}
  settings.prompt.expert = Експерт: Основний запит
  settings.prompt.expert.desc = Інструкція (системний запит) для ведучого експерта, як керувати підеекспертами. Інструкції для підеекспертів даються з їхніх налаштувань.
- settings.prompt.img = DALL-E: генерація зображення
+ settings.prompt.img = Генерація зображення
  settings.prompt.img.desc = Підказка для генерації команддля DALL-E (якщо вимкнено сирівний режим). Тільки режим зображення.
  settings.remote_tools.code_interpreter = Інтерпретатор коду
  settings.remote_tools.code_interpreter.desc = Увімкніть віддалений інструмент `code_interpreter` у режимі Чат / через Responses API OpenAI.
@@ -1336,7 +1336,7 @@ settings.section.audio.cache = Кеш
  settings.section.audio.device = Пристрої
  settings.section.audio.options = Параметри
  settings.section.ctx = Контекст
- settings.section.developer = Розробник
+ settings.section.debug = Налагодження
  settings.section.files = Файли та вкладення
  settings.section.general = Загальні
  settings.section.images = Зображення
pygpt_net/data/locale/locale.zh.ini CHANGED
@@ -845,7 +845,7 @@ mode.agent_openai.tooltip = 高级代理 (OpenAI)
  mode.agent.tooltip = 简单代理(自主)
  mode.assistant = 助手
  mode.assistant.tooltip = 使用助手API進行聊天
- mode.audio = 语音聊天
+ mode.audio = Realtime + audio
  mode.chat = 聊天模式
  mode.chat.tooltip = 聊天模式(預設)
  mode.completion = 完成模式
@@ -1174,9 +1174,9 @@ settings.ctx.sources = 显示Llama索引源
  settings.ctx.sources.desc = 如果启用,使用的源将在回应中显示(如果可用,不适用于流式聊天)
  settings.ctx.use_extra = 使用额外的上下文输出
  settings.ctx.use_extra.desc = 如果启用,将在命令结果的 JSON 输出旁边显示纯文本输出(如果有)。
+ settings.debug.show_menu = 显示调试菜单
  settings.defaults.app.confirm = 加载出厂应用程序设置?
  settings.defaults.user.confirm = 撤销当前更改?
- settings.developer.debug = 显示调试菜单
  settings.dict.delete.confirm = 从列表中移除项目?
  settings.download.dir = 文件下载目录
  settings.download.dir.desc = 下载文件的子目录,例如在助手模式下,位于 "data" 内部
@@ -1336,7 +1336,7 @@ settings.section.audio.cache = 缓存
  settings.section.audio.device = 设备
  settings.section.audio.options = 选项
  settings.section.ctx = 上下文
- settings.section.developer = 開發者
+ settings.section.debug = 调试
  settings.section.files = 文件和附件
  settings.section.general = 一般
  settings.section.images = 圖像
pygpt_net/data/locale/plugin.audio_input.en.ini CHANGED
@@ -17,6 +17,10 @@ google_args.tooltip = Provide additional keyword arguments for recognize_google(
  google_cloud_args.description = Additional keyword arguments for r.recognize_google_cloud(audio, **kwargs).
  google_cloud_args.label = Additional keyword arguments
  google_cloud_args.tooltip = Provide additional keyword arguments for recognize_google_cloud()
+ google_genai_audio_model.description = Specify Gemini model supporting audio, e.g., gemini-2.5-flash
+ google_genai_audio_model.label = Model
+ google_genai_audio_prompt.description = System prompt for transcription
+ google_genai_audio_prompt.label = System Prompt
  magic_word.description = Activate listening only after the magic word is provided, like 'Hey GPT' or 'OK GPT'. Default: False.
  magic_word.label = Magic word
  magic_word_phrase_length.description = Magic word phrase length. Default: 2.
pygpt_net/data/locale/plugin.audio_output.en.ini CHANGED
@@ -15,6 +15,10 @@ eleven_labs_voice.description = Specify the Voice ID.
  eleven_labs_voice.label = Voice ID
  google_api_key.description = You can obtain your own API key here: https://console.cloud.google.com/apis/library/texttospeech.googleapis.com
  google_api_key.label = Google Cloud Text-to-speech API Key
+ google_genai_tts_model.description = Specify Gemini TTS model, e.g.: gemini-2.5-flash-preview-tts or gemini-2.5-pro-preview-tts
+ google_genai_tts_model.label = Model
+ google_genai_tts_voice.description = Specify voice, e.g.: Puck, Kore, Charon, Leda, Zephyr... (case-sensitive)
+ google_genai_tts_voice.label = Voice
  google_lang.description = Specify the language code.
  google_lang.label = Language code
  google_voice.description = Specify the voice.
pygpt_net/item/model.py CHANGED
@@ -6,7 +6,7 @@
  # GitHub: https://github.com/szczyglis-dev/py-gpt #
  # MIT License #
  # Created By : Marcin Szczygliński #
- # Updated Date: 2025.08.23 15:00:00 #
+ # Updated Date: 2025.08.28 09:00:00 #
  # ================================================== #
 
  import json
@@ -253,7 +253,17 @@ class ModelItem:
 
          :return: True if supports image input
          """
-         if MODE_VISION in self.mode or MULTIMODAL_IMAGE in self.input:
+         if MULTIMODAL_IMAGE in self.input:
+             return True
+         return False
+
+     def is_image_output(self) -> bool:
+         """
+         Check if model supports image output
+
+         :return: True if supports image output
+         """
+         if "image" in self.output or MODE_VISION in self.mode:
              return True
          return False
 
@@ -263,7 +273,17 @@ class ModelItem:
 
          :return: True if supports audio input
          """
-         if MODE_AUDIO in self.mode or MULTIMODAL_AUDIO in self.input:
+         if MULTIMODAL_AUDIO in self.input:
+             return True
+         return False
+
+     def is_audio_output(self) -> bool:
+         """
+         Check if model supports audio output
+
+         :return: True if supports audio output
+         """
+         if MULTIMODAL_AUDIO in self.output:
              return True
          return False
 
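Note on the change above: input and output capabilities are now checked separately. Image and audio input support is read only from the model's declared multimodal inputs; the legacy MODE_VISION now counts toward image output instead, and MODE_AUDIO no longer implies audio input at all. A minimal standalone sketch of the same checks (the constants and the sample model below are simplified stand-ins, not the real ModelItem):

MULTIMODAL_IMAGE = "image"
MULTIMODAL_AUDIO = "audio"
MODE_VISION = "vision"

class Model:
    """Simplified stand-in for pygpt_net.item.model.ModelItem."""
    def __init__(self, mode, input, output):
        self.mode = mode      # chat modes, e.g. ["chat", "vision"]
        self.input = input    # multimodal inputs, e.g. ["text", "image"]
        self.output = output  # multimodal outputs, e.g. ["text"]

    def is_image_input(self):
        return MULTIMODAL_IMAGE in self.input

    def is_image_output(self):
        return "image" in self.output or MODE_VISION in self.mode

    def is_audio_input(self):
        return MULTIMODAL_AUDIO in self.input

    def is_audio_output(self):
        return MULTIMODAL_AUDIO in self.output

# a text+image-in, text-out model reports image input but no image output
m = Model(mode=["chat"], input=["text", "image"], output=["text"])
assert m.is_image_input() and not m.is_image_output()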

pygpt_net/plugin/audio_input/plugin.py CHANGED
@@ -6,7 +6,7 @@
  # GitHub: https://github.com/szczyglis-dev/py-gpt #
  # MIT License #
  # Created By : Marcin Szczygliński #
- # Updated Date: 2024.11.26 19:00:00 #
+ # Updated Date: 2025.08.31 23:00:00 #
  # ================================================== #
 
  import os
@@ -23,6 +23,7 @@ from pygpt_net.utils import trans
  from .config import Config
  from .worker import Worker
  from .simple import Simple
+ from ...core.types import MODE_AUDIO
 
 
  class Plugin(BasePlugin):
@@ -124,13 +125,31 @@ class Plugin(BasePlugin):
          words = [x.strip() for x in words]  # remove white-spaces
          return words
 
-     def toggle_recording_simple(self):
+     def toggle_recording_simple(
+             self,
+             state: bool = None,
+             auto: bool = False
+     ):
          """
          Event: AUDIO_INPUT_RECORD_TOGGLE
 
          Toggle recording
+
+         :param state: state to set
+         :param auto: True if called automatically (not by user)
+         """
+         if self.window.controller.realtime.is_enabled():
+             self.handler_simple.toggle_realtime(state=state, auto=auto)
+             return
+         self.handler_simple.toggle_recording(state=state)
+
+     def is_recording(self) -> bool:
          """
-         self.handler_simple.toggle_recording()
+         Check if is recording (simple mode)
+
+         :return: True if is recording
+         """
+         return self.handler_simple.is_recording
 
      def toggle_speech(self, state: bool):
          """
@@ -214,7 +233,9 @@ class Plugin(BasePlugin):
              self.toggle_speech(data['value'])
 
          elif name == Event.AUDIO_INPUT_RECORD_TOGGLE:
-             self.toggle_recording_simple()
+             state = data['state'] if 'value' in data else None
+             auto = data['auto'] if 'auto' in data else False
+             self.toggle_recording_simple(state=state, auto=auto)
 
          elif name == Event.AUDIO_INPUT_STOP:
              self.on_stop()
@@ -492,6 +513,18 @@ class Plugin(BasePlugin):
          self.window.dispatch(event)  # send text, input clear in send method
          self.set_status('')
 
+     def handle_realtime_stopped(self):
+         """Handle realtime stopped"""
+         context = BridgeContext()
+         context.prompt = "..."
+         extra = {}
+         event = KernelEvent(KernelEvent.INPUT_SYSTEM, {
+             'context': context,
+             'extra': extra,
+         })
+         self.window.dispatch(event)  # send text, input clear in send method
+         self.set_status('')
+
      @Slot(object)
      def handle_status(self, data: str):
          """

pygpt_net/plugin/audio_input/simple.py CHANGED
@@ -6,14 +6,14 @@
  # GitHub: https://github.com/szczyglis-dev/py-gpt #
  # MIT License #
  # Created By : Marcin Szczygliński #
- # Updated Date: 2025.08.27 07:00:00 #
+ # Updated Date: 2025.08.31 23:00:00 #
  # ================================================== #
 
  import os
 
  from PySide6.QtCore import QTimer
 
- from pygpt_net.core.events import AppEvent
+ from pygpt_net.core.events import AppEvent, RealtimeEvent
  from pygpt_net.core.tabs.tab import Tab
  from pygpt_net.utils import trans
 
@@ -32,8 +32,46 @@ class Simple:
          self.is_recording = False
          self.timer = None
 
-     def toggle_recording(self):
-         """Toggle recording"""
+     def toggle_realtime(
+             self,
+             state: bool = None,
+             auto: bool = False
+     ):
+         """
+         Toggle recording
+
+         :param state: True to start recording, False to stop recording, None to toggle
+         :param auto: True if called automatically (not by user)
+         """
+         if state is not None:
+             if state and not self.is_recording:
+                 self.start_recording(realtime=True)
+             elif not state:
+                 self.force_stop()
+             else:
+                 self.force_stop()
+             return
+         if self.is_recording:
+             self.stop_recording(realtime=True)
+             if not auto:
+                 self.plugin.window.dispatch(RealtimeEvent(RealtimeEvent.RT_INPUT_AUDIO_MANUAL_STOP))
+         else:
+             self.start_recording(realtime=True)
+             if not auto:
+                 self.plugin.window.dispatch(RealtimeEvent(RealtimeEvent.RT_INPUT_AUDIO_MANUAL_START))
+
+     def toggle_recording(self, state: bool = None):
+         """
+         Toggle recording
+
+         :param state: True to start recording, False to stop recording, None to toggle
+         """
+         if state is not None:
+             if state and not self.is_recording:
+                 self.start_recording()
+             elif not state:
+                 self.force_stop()
+             return
          if self.is_recording:
              self.stop_recording()
          else:
@@ -51,11 +89,12 @@ class Simple:
          """Stop timeout"""
          self.stop_recording(timeout=True)
 
-     def start_recording(self, force: bool = False):
+     def start_recording(self, force: bool = False, realtime: bool = False):
          """
          Start recording
 
          :param force: True to force recording
+         :param realtime: True if called from realtime callback
          """
          # display snap warning if not displayed yet
          if (not self.plugin.window.core.config.get("audio.input.snap", False)
@@ -89,7 +128,7 @@ class Simple:
          # disable in continuous mode
          timeout = int(self.plugin.window.core.config.get('audio.input.timeout', 120) or 0)  # get timeout
          timeout_continuous = self.plugin.window.core.config.get('audio.input.timeout.continuous', False)  # enable continuous timeout
-         if timeout > 0:
+         if timeout > 0 and not realtime:
              if self.timer is None and (not continuous_enabled or timeout_continuous):
                  self.timer = QTimer()
                  self.timer.timeout.connect(self.stop_timeout)
@@ -119,11 +158,12 @@ class Simple:
              )
              self.switch_btn_start()  # switch button to start
 
-     def stop_recording(self, timeout: bool = False):
+     def stop_recording(self, timeout: bool = False, realtime: bool = False):
          """
          Stop recording
 
          :param timeout: True if stopped due to timeout
+         :param realtime: True if called from realtime callback
          """
          self.plugin.window.core.audio.capture.reset_audio_level()
          self.is_recording = False
@@ -143,7 +183,7 @@ class Simple:
              return
 
          if self.plugin.window.core.audio.capture.has_frames():
-             if not self.plugin.window.core.audio.capture.has_min_frames():
+             if not self.plugin.window.core.audio.capture.has_min_frames() and not realtime:
                  self.plugin.window.update_status(trans("status.audio.too_short"))
                  self.plugin.window.dispatch(AppEvent(AppEvent.VOICE_CONTROL_STOPPED))  # app event
                  return
@@ -152,6 +192,15 @@ class Simple:
          else:
              self.plugin.window.update_status("")
 
+     def force_stop(self):
+         """Stop recording"""
+         self.is_recording = False
+         self.plugin.window.dispatch(AppEvent(AppEvent.INPUT_VOICE_LISTEN_STOPPED))  # app event
+         self.switch_btn_start()  # switch button to start
+         if self.plugin.window.core.audio.capture.has_source():
+             self.plugin.window.core.audio.capture.stop()  # stop recording
+         return
+
      def on_stop(self):
          """Handle auto-transcribe"""
          path = os.path.join(self.plugin.window.core.config.path, self.plugin.input_file)
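The toggle methods above share a tri-state convention: state=None flips the current state, state=True starts only when not already recording, and state=False always forces a stop. A self-contained sketch of that pattern with the audio and UI plumbing replaced by prints (an illustration of the convention, not the real Simple class):

class Recorder:
    """Tri-state toggle: None = flip, True = ensure started, False = force stop."""
    def __init__(self):
        self.is_recording = False

    def toggle(self, state=None):
        if state is not None:
            if state and not self.is_recording:
                self.start()       # explicit start; no-op if already running
            elif not state:
                self.force_stop()  # explicit stop always wins
            return
        if self.is_recording:      # no explicit state: plain flip
            self.stop()
        else:
            self.start()

    def start(self):
        self.is_recording = True
        print("recording started")

    def stop(self):
        self.is_recording = False
        print("recording stopped")

    def force_stop(self):
        self.is_recording = False
        print("recording force-stopped")

r = Recorder()
r.toggle(True)   # starts
r.toggle(True)   # no-op, already recording
r.toggle(False)  # force stop
r.toggle()       # flips: starts again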

pygpt_net/plugin/cmd_files/worker.py CHANGED
@@ -920,6 +920,9 @@ class Worker(BaseWorker):
          :param context: context data
          :return: extra data
          """
+         # disabled in v2.6.31
+         # reason: do not duplicate context in chat
+         return {}
          cmd = item["cmd"]
          extra = {
              'plugin': "cmd_files",

pygpt_net/plugin/openai_dalle/plugin.py CHANGED
@@ -6,7 +6,7 @@
  # GitHub: https://github.com/szczyglis-dev/py-gpt #
  # MIT License #
  # Created By : Marcin Szczygliński #
- # Updated Date: 2025.07.30 00:00:00 #
+ # Updated Date: 2025.08.28 09:00:00 #
  # ================================================== #
 
  from pygpt_net.core.types import (
@@ -42,8 +42,8 @@ class Plugin(BasePlugin):
          ]
          self.allowed_modes = [
              MODE_CHAT,
-             MODE_LANGCHAIN,
-             MODE_VISION,
+             # MODE_LANGCHAIN,
+             # MODE_VISION,
              MODE_LLAMA_INDEX,
              MODE_ASSISTANT,
              MODE_AGENT,
@@ -166,7 +166,7 @@ class Plugin(BasePlugin):
              sync = False
              if self.window.core.config.get("mode") in [MODE_AGENT_LLAMA, MODE_AGENT_OPENAI]:
                  sync = True
-             self.window.core.gpt.image.generate(bridge_context, extra, sync)  # force inline mode, async call
+             self.window.core.api.openai.image.generate(bridge_context, extra, sync)  # force inline mode, async call
          except Exception as e:
              self.log("Error: " + str(e))
              return
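This is the first of many call sites migrated from the old window.core.gpt namespace to window.core.api.openai, matching the provider/{gpt → api/openai} file moves listed above. Downstream code that reached into the old attribute could bridge both layouts with a small shim; a hedged sketch (the probe order is an assumption, not project-provided API):

def get_openai_image_api(window):
    # prefer the new layout, fall back to the legacy one
    core = window.core
    if hasattr(core, "api") and hasattr(core.api, "openai"):
        return core.api.openai.image
    return core.gpt.image

# usage: get_openai_image_api(window).generate(bridge_context, extra, sync)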

pygpt_net/plugin/openai_vision/plugin.py CHANGED
@@ -6,7 +6,7 @@
  # GitHub: https://github.com/szczyglis-dev/py-gpt #
  # MIT License #
  # Created By : Marcin Szczygliński #
- # Updated Date: 2025.08.15 23:00:00 #
+ # Updated Date: 2025.08.28 09:00:00 #
  # ================================================== #
 
  from pygpt_net.core.types import (
@@ -102,7 +102,7 @@ class Plugin(BasePlugin):
              )  # mode change
 
          elif name == Event.MODEL_BEFORE:
-             if "mode" in data and data["mode"] == MODE_VISION:
+             if data.get("mode") == MODE_CHAT:
                  key = self.get_option_value("model")
                  if self.window.core.models.has(key):
                      data['model'] = self.window.core.models.get(key)
@@ -119,7 +119,7 @@ class Plugin(BasePlugin):
              data['value'] = self.on_system_prompt(data['value'])
 
          elif name == Event.UI_ATTACHMENTS:
-             mode = data["mode"]
+             mode = data.get("mode")
              if mode in [MODE_AGENT, MODE_AGENT_LLAMA, MODE_AGENT_OPENAI] and not self.window.core.config.get("cmd"):
                  pass
              else:
@@ -263,8 +263,7 @@ class Plugin(BasePlugin):
          # append vision prompt only if vision is provided or enabled
          if not self.is_vision_provided():
              return prompt
-         prompt = "Image attachment has been already sent.\n\n" + prompt
-         return prompt
+         return "Image attachment has been already sent.\n\n" + prompt
 
      def on_pre_prompt(self, prompt: str) -> str:
          """
@@ -294,12 +293,12 @@ class Plugin(BasePlugin):
          """
          mode = self.window.core.config.get('mode')
          attachments = self.window.core.attachments.get_all(mode)
-         self.window.core.gpt.vision.build_content(
+         self.window.core.api.openai.vision.build_content(
              str(self.prompt),
              attachments,
          )  # tmp build content, provide attachments from global mode
 
-         built_attachments = self.window.core.gpt.vision.attachments
+         built_attachments = self.window.core.api.openai.vision.attachments
          if len(built_attachments) > 0:
              return True
          return False
@@ -313,13 +312,13 @@ class Plugin(BasePlugin):
          result = False
          mode = self.window.core.config.get('mode')
          attachments = self.window.core.attachments.get_all(mode)  # from global mode
-         self.window.core.gpt.vision.build_content(
+         self.window.core.api.openai.vision.build_content(
              str(self.prompt),
              attachments,
          )  # tmp build content, provide attachments from global mode
 
-         built_attachments = self.window.core.gpt.vision.attachments
-         built_urls = self.window.core.gpt.vision.urls
+         built_attachments = self.window.core.api.openai.vision.attachments
+         built_urls = self.window.core.api.openai.vision.urls
 
          # check for images in URLs found in prompt
          img_urls = []
@@ -343,13 +342,13 @@ class Plugin(BasePlugin):
          :return: updated mode
          """
          # abort if already in vision mode or command enabled
-         if mode == MODE_VISION or mode in self.disabled_mode_switch:
+         if mode in self.disabled_mode_switch:
              return mode  # keep current mode
 
-         # if already used in this ctx then keep vision mode
+         # if already used in this ctx then keep vision (in CHAT) mode
          if self.is_vision_provided():
              ctx.is_vision = True
-             return MODE_VISION
+             return MODE_CHAT
 
          return mode  # keep current mode
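Two behavioral details in this file are easy to miss: event payloads are now read defensively (data.get("mode") instead of data["mode"], so a missing key yields None rather than a KeyError), and the automatic mode switch no longer jumps to the retired vision mode but stays in chat with the context flagged for vision. A minimal sketch of the updated switch logic (simplified stand-ins for the real constants and context object):

MODE_CHAT = "chat"

def switch_mode(mode, ctx, vision_provided, disabled_mode_switch=()):
    # abort if switching is disabled for this mode
    if mode in disabled_mode_switch:
        return mode
    # vision content keeps the session in chat mode; only the ctx is marked
    if vision_provided:
        ctx.is_vision = True
        return MODE_CHAT
    return mode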

pygpt_net/provider/agents/openai/agent.py CHANGED
@@ -26,12 +26,12 @@ from pygpt_net.core.types import (
  from pygpt_net.item.ctx import CtxItem
  from pygpt_net.item.model import ModelItem
 
- from pygpt_net.provider.gpt.agents.remote_tools import is_computer_tool, append_tools
- from pygpt_net.provider.gpt.agents.computer import Agent as ComputerAgent, LocalComputer
- from pygpt_net.provider.gpt.agents.response import StreamHandler
+ from pygpt_net.provider.api.openai.agents.remote_tools import is_computer_tool, append_tools
+ from pygpt_net.provider.api.openai.agents.computer import Agent as ComputerAgent, LocalComputer
+ from pygpt_net.provider.api.openai.agents.response import StreamHandler
+ from pygpt_net.provider.api.openai.agents.experts import get_experts
 
  from ..base import BaseAgent
- from ...gpt.agents.experts import get_experts
 
  class Agent(BaseAgent):
      def __init__(self, *args, **kwargs):
@@ -159,7 +159,7 @@ class Agent(BaseAgent):
              agent,
              **kwargs
          )
-         final_output, last_response_id = window.core.gpt.responses.unpack_agent_response(result, ctx)
+         final_output, last_response_id = window.core.api.openai.responses.unpack_agent_response(result, ctx)
          response_id = result.last_response_id
          if verbose:
              print("Final response:", result)

pygpt_net/provider/agents/openai/agent_b2b.py CHANGED
@@ -29,12 +29,12 @@ from pygpt_net.item.ctx import CtxItem
  from pygpt_net.item.model import ModelItem
  from pygpt_net.item.preset import PresetItem
 
- from pygpt_net.provider.gpt.agents.remote_tools import append_tools
- from pygpt_net.provider.gpt.agents.response import StreamHandler
+ from pygpt_net.provider.api.openai.agents.remote_tools import append_tools
+ from pygpt_net.provider.api.openai.agents.response import StreamHandler
+ from pygpt_net.provider.api.openai.agents.experts import get_experts
  from pygpt_net.utils import trans
 
  from ..base import BaseAgent
- from ...gpt.agents.experts import get_experts
 
 
  class Agent(BaseAgent):
@@ -274,7 +274,7 @@ class Agent(BaseAgent):
          if verbose:
              print("Final response:", result)
 
-         final_output, last_response_id = window.core.gpt.responses.unpack_agent_response(result, ctx)
+         final_output, last_response_id = window.core.api.openai.responses.unpack_agent_response(result, ctx)
 
          if bridge.stopped():
              bridge.on_stop(ctx)
@@ -305,7 +305,7 @@ class Agent(BaseAgent):
          if verbose:
              print("Final response:", result)
 
-         final_output, last_response_id = window.core.gpt.responses.unpack_agent_response(result, ctx)
+         final_output, last_response_id = window.core.api.openai.responses.unpack_agent_response(result, ctx)
          if bridge.stopped():
              bridge.on_stop(ctx)
              break

pygpt_net/provider/agents/openai/agent_planner.py CHANGED
@@ -30,14 +30,13 @@ from pygpt_net.item.ctx import CtxItem
  from pygpt_net.item.model import ModelItem
  from pygpt_net.item.preset import PresetItem
 
- from pygpt_net.provider.gpt.agents.client import get_custom_model_provider, set_openai_env
- from pygpt_net.provider.gpt.agents.remote_tools import append_tools
- from pygpt_net.provider.gpt.agents.response import StreamHandler
+ from pygpt_net.provider.api.openai.agents.client import get_custom_model_provider, set_openai_env
+ from pygpt_net.provider.api.openai.agents.remote_tools import append_tools
+ from pygpt_net.provider.api.openai.agents.response import StreamHandler
+ from pygpt_net.provider.api.openai.agents.experts import get_experts
  from pygpt_net.utils import trans
 
  from ..base import BaseAgent
- from ...gpt.agents.experts import get_experts
-
 
  @dataclass
  class EvaluationFeedback:
@@ -327,7 +326,7 @@ class Agent(BaseAgent):
              print("Final response:", result)
 
          input_items = result.to_input_list()
-         final_output, last_response_id = window.core.gpt.responses.unpack_agent_response(result, ctx)
+         final_output, last_response_id = window.core.api.openai.responses.unpack_agent_response(result, ctx)
 
          if bridge.stopped():
              bridge.on_stop(ctx)

pygpt_net/provider/agents/openai/agent_with_experts.py CHANGED
@@ -29,12 +29,12 @@ from pygpt_net.item.ctx import CtxItem
  from pygpt_net.item.model import ModelItem
  from pygpt_net.item.preset import PresetItem
 
- from pygpt_net.provider.gpt.agents.client import get_custom_model_provider, set_openai_env
- from pygpt_net.provider.gpt.agents.remote_tools import append_tools
- from pygpt_net.provider.gpt.agents.response import StreamHandler
+ from pygpt_net.provider.api.openai.agents.client import get_custom_model_provider, set_openai_env
+ from pygpt_net.provider.api.openai.agents.remote_tools import append_tools
+ from pygpt_net.provider.api.openai.agents.response import StreamHandler
+ from pygpt_net.provider.api.openai.agents.experts import get_experts
 
  from ..base import BaseAgent
- from ...gpt.agents.experts import get_experts
 
 
  class Agent(BaseAgent):
@@ -137,7 +137,7 @@ class Agent(BaseAgent):
              agent,
              **kwargs
          )
-         final_output, last_response_id = window.core.gpt.responses.unpack_agent_response(result, ctx)
+         final_output, last_response_id = window.core.api.openai.responses.unpack_agent_response(result, ctx)
          response_id = result.last_response_id
          if verbose:
              print("Final response:", result)

pygpt_net/provider/agents/openai/agent_with_experts_feedback.py CHANGED
@@ -29,12 +29,12 @@ from pygpt_net.item.ctx import CtxItem
  from pygpt_net.item.model import ModelItem
  from pygpt_net.item.preset import PresetItem
 
- from pygpt_net.provider.gpt.agents.remote_tools import append_tools
- from pygpt_net.provider.gpt.agents.response import StreamHandler
+ from pygpt_net.provider.api.openai.agents.remote_tools import append_tools
+ from pygpt_net.provider.api.openai.agents.response import StreamHandler
+ from pygpt_net.provider.api.openai.agents.experts import get_experts
  from pygpt_net.utils import trans
 
  from ..base import BaseAgent
- from ...gpt.agents.experts import get_experts
 
 
  @dataclass
@@ -221,7 +221,7 @@ class Agent(BaseAgent):
              print("Final response:", result)
 
          input_items = result.to_input_list()
-         final_output, last_response_id = window.core.gpt.responses.unpack_agent_response(result, ctx)
+         final_output, last_response_id = window.core.api.openai.responses.unpack_agent_response(result, ctx)
 
          if bridge.stopped():
              bridge.on_stop(ctx)

pygpt_net/provider/agents/openai/agent_with_feedback.py CHANGED
@@ -29,12 +29,12 @@ from pygpt_net.item.ctx import CtxItem
  from pygpt_net.item.model import ModelItem
  from pygpt_net.item.preset import PresetItem
 
- from pygpt_net.provider.gpt.agents.remote_tools import append_tools
- from pygpt_net.provider.gpt.agents.response import StreamHandler
+ from pygpt_net.provider.api.openai.agents.remote_tools import append_tools
+ from pygpt_net.provider.api.openai.agents.response import StreamHandler
+ from pygpt_net.provider.api.openai.agents.experts import get_experts
  from pygpt_net.utils import trans
 
  from ..base import BaseAgent
- from ...gpt.agents.experts import get_experts
 
 
  @dataclass
@@ -221,7 +221,7 @@ class Agent(BaseAgent):
              print("Final response:", result)
 
          input_items = result.to_input_list()
-         final_output, last_response_id = window.core.gpt.responses.unpack_agent_response(result, ctx)
+         final_output, last_response_id = window.core.api.openai.responses.unpack_agent_response(result, ctx)
 
          if bridge.stopped():
              bridge.on_stop(ctx)