pygpt-net 2.6.28__py3-none-any.whl → 2.6.30__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (115) hide show
  1. pygpt_net/CHANGELOG.txt +13 -0
  2. pygpt_net/__init__.py +3 -3
  3. pygpt_net/{container.py → app_core.py} +5 -6
  4. pygpt_net/controller/access/control.py +1 -9
  5. pygpt_net/controller/assistant/assistant.py +4 -4
  6. pygpt_net/controller/assistant/batch.py +7 -7
  7. pygpt_net/controller/assistant/files.py +4 -4
  8. pygpt_net/controller/assistant/threads.py +3 -3
  9. pygpt_net/controller/attachment/attachment.py +4 -7
  10. pygpt_net/controller/chat/common.py +1 -1
  11. pygpt_net/controller/chat/stream.py +961 -294
  12. pygpt_net/controller/chat/vision.py +11 -19
  13. pygpt_net/controller/config/placeholder.py +1 -1
  14. pygpt_net/controller/ctx/ctx.py +1 -1
  15. pygpt_net/controller/ctx/summarizer.py +1 -1
  16. pygpt_net/controller/mode/mode.py +21 -12
  17. pygpt_net/controller/plugins/settings.py +3 -2
  18. pygpt_net/controller/presets/editor.py +112 -99
  19. pygpt_net/controller/theme/common.py +2 -0
  20. pygpt_net/controller/theme/theme.py +6 -2
  21. pygpt_net/controller/ui/vision.py +4 -4
  22. pygpt_net/core/agents/legacy.py +2 -2
  23. pygpt_net/core/agents/runners/openai_workflow.py +2 -2
  24. pygpt_net/core/assistants/files.py +5 -5
  25. pygpt_net/core/assistants/store.py +4 -4
  26. pygpt_net/core/bridge/bridge.py +3 -3
  27. pygpt_net/core/bridge/worker.py +28 -9
  28. pygpt_net/core/debug/console/console.py +2 -2
  29. pygpt_net/core/debug/presets.py +2 -2
  30. pygpt_net/core/experts/experts.py +2 -2
  31. pygpt_net/core/idx/llm.py +21 -3
  32. pygpt_net/core/modes/modes.py +2 -2
  33. pygpt_net/core/presets/presets.py +3 -3
  34. pygpt_net/core/tokens/tokens.py +4 -4
  35. pygpt_net/core/types/mode.py +5 -2
  36. pygpt_net/core/vision/analyzer.py +1 -1
  37. pygpt_net/data/config/config.json +6 -3
  38. pygpt_net/data/config/models.json +75 -3
  39. pygpt_net/data/config/modes.json +3 -9
  40. pygpt_net/data/config/settings.json +112 -55
  41. pygpt_net/data/config/settings_section.json +2 -2
  42. pygpt_net/data/locale/locale.de.ini +2 -2
  43. pygpt_net/data/locale/locale.en.ini +9 -2
  44. pygpt_net/data/locale/locale.es.ini +2 -2
  45. pygpt_net/data/locale/locale.fr.ini +2 -2
  46. pygpt_net/data/locale/locale.it.ini +2 -2
  47. pygpt_net/data/locale/locale.pl.ini +3 -3
  48. pygpt_net/data/locale/locale.uk.ini +2 -2
  49. pygpt_net/data/locale/locale.zh.ini +2 -2
  50. pygpt_net/item/model.py +23 -3
  51. pygpt_net/plugin/openai_dalle/plugin.py +4 -4
  52. pygpt_net/plugin/openai_vision/plugin.py +12 -13
  53. pygpt_net/provider/agents/openai/agent.py +5 -5
  54. pygpt_net/provider/agents/openai/agent_b2b.py +5 -5
  55. pygpt_net/provider/agents/openai/agent_planner.py +5 -6
  56. pygpt_net/provider/agents/openai/agent_with_experts.py +5 -5
  57. pygpt_net/provider/agents/openai/agent_with_experts_feedback.py +4 -4
  58. pygpt_net/provider/agents/openai/agent_with_feedback.py +4 -4
  59. pygpt_net/provider/agents/openai/bot_researcher.py +2 -2
  60. pygpt_net/provider/agents/openai/bots/research_bot/agents/planner_agent.py +1 -1
  61. pygpt_net/provider/agents/openai/bots/research_bot/agents/search_agent.py +1 -1
  62. pygpt_net/provider/agents/openai/bots/research_bot/agents/writer_agent.py +1 -1
  63. pygpt_net/provider/agents/openai/evolve.py +5 -5
  64. pygpt_net/provider/agents/openai/supervisor.py +4 -4
  65. pygpt_net/provider/api/__init__.py +27 -0
  66. pygpt_net/provider/api/anthropic/__init__.py +68 -0
  67. pygpt_net/provider/api/google/__init__.py +262 -0
  68. pygpt_net/provider/api/google/audio.py +114 -0
  69. pygpt_net/provider/api/google/chat.py +552 -0
  70. pygpt_net/provider/api/google/image.py +287 -0
  71. pygpt_net/provider/api/google/tools.py +222 -0
  72. pygpt_net/provider/api/google/vision.py +129 -0
  73. pygpt_net/provider/{gpt → api/openai}/__init__.py +2 -2
  74. pygpt_net/provider/{gpt → api/openai}/agents/computer.py +1 -1
  75. pygpt_net/provider/{gpt → api/openai}/agents/experts.py +1 -1
  76. pygpt_net/provider/{gpt → api/openai}/agents/response.py +1 -1
  77. pygpt_net/provider/{gpt → api/openai}/assistants.py +1 -1
  78. pygpt_net/provider/{gpt → api/openai}/chat.py +15 -8
  79. pygpt_net/provider/{gpt → api/openai}/completion.py +1 -1
  80. pygpt_net/provider/{gpt → api/openai}/image.py +1 -1
  81. pygpt_net/provider/{gpt → api/openai}/remote_tools.py +1 -1
  82. pygpt_net/provider/{gpt → api/openai}/responses.py +34 -20
  83. pygpt_net/provider/{gpt → api/openai}/store.py +2 -2
  84. pygpt_net/provider/{gpt → api/openai}/vision.py +1 -1
  85. pygpt_net/provider/{gpt → api/openai}/worker/assistants.py +4 -4
  86. pygpt_net/provider/{gpt → api/openai}/worker/importer.py +10 -10
  87. pygpt_net/provider/audio_input/openai_whisper.py +1 -1
  88. pygpt_net/provider/audio_output/google_tts.py +12 -0
  89. pygpt_net/provider/audio_output/openai_tts.py +1 -1
  90. pygpt_net/provider/core/config/patch.py +11 -0
  91. pygpt_net/provider/core/model/patch.py +9 -0
  92. pygpt_net/provider/core/preset/json_file.py +2 -4
  93. pygpt_net/provider/llms/anthropic.py +2 -5
  94. pygpt_net/provider/llms/base.py +4 -3
  95. pygpt_net/provider/llms/openai.py +1 -1
  96. pygpt_net/provider/loaders/hub/image_vision/base.py +1 -1
  97. pygpt_net/ui/dialog/preset.py +71 -55
  98. pygpt_net/ui/main.py +6 -4
  99. pygpt_net/utils.py +9 -0
  100. {pygpt_net-2.6.28.dist-info → pygpt_net-2.6.30.dist-info}/METADATA +42 -48
  101. {pygpt_net-2.6.28.dist-info → pygpt_net-2.6.30.dist-info}/RECORD +115 -107
  102. /pygpt_net/provider/{gpt → api/openai}/agents/__init__.py +0 -0
  103. /pygpt_net/provider/{gpt → api/openai}/agents/client.py +0 -0
  104. /pygpt_net/provider/{gpt → api/openai}/agents/remote_tools.py +0 -0
  105. /pygpt_net/provider/{gpt → api/openai}/agents/utils.py +0 -0
  106. /pygpt_net/provider/{gpt → api/openai}/audio.py +0 -0
  107. /pygpt_net/provider/{gpt → api/openai}/computer.py +0 -0
  108. /pygpt_net/provider/{gpt → api/openai}/container.py +0 -0
  109. /pygpt_net/provider/{gpt → api/openai}/summarizer.py +0 -0
  110. /pygpt_net/provider/{gpt → api/openai}/tools.py +0 -0
  111. /pygpt_net/provider/{gpt → api/openai}/utils.py +0 -0
  112. /pygpt_net/provider/{gpt → api/openai}/worker/__init__.py +0 -0
  113. {pygpt_net-2.6.28.dist-info → pygpt_net-2.6.30.dist-info}/LICENSE +0 -0
  114. {pygpt_net-2.6.28.dist-info → pygpt_net-2.6.30.dist-info}/WHEEL +0 -0
  115. {pygpt_net-2.6.28.dist-info → pygpt_net-2.6.30.dist-info}/entry_points.txt +0 -0
@@ -6,12 +6,12 @@
6
6
  # GitHub: https://github.com/szczyglis-dev/py-gpt #
7
7
  # MIT License #
8
8
  # Created By : Marcin Szczygliński #
9
- # Updated Date: 2025.08.14 13:00:00 #
9
+ # Updated Date: 2025.08.28 09:00:00 #
10
10
  # ================================================== #
11
11
 
12
12
  from PySide6.QtCore import Qt
13
13
  from PySide6.QtWidgets import QPushButton, QHBoxLayout, QLabel, QVBoxLayout, QSplitter, QWidget, QSizePolicy, \
14
- QTabWidget, QLineEdit, QFileDialog
14
+ QTabWidget, QFileDialog
15
15
 
16
16
  from pygpt_net.core.types import (
17
17
  MODE_AGENT,
@@ -51,12 +51,8 @@ class Preset(BaseConfigDialog):
51
51
  """Setup preset editor dialog"""
52
52
  self.window.ui.nodes['preset.btn.current'] = QPushButton(trans("dialog.preset.btn.current"))
53
53
  self.window.ui.nodes['preset.btn.save'] = QPushButton(trans("dialog.preset.btn.save"))
54
- self.window.ui.nodes['preset.btn.current'].clicked.connect(
55
- lambda: self.window.controller.presets.editor.from_current()
56
- )
57
- self.window.ui.nodes['preset.btn.save'].clicked.connect(
58
- lambda: self.window.controller.presets.editor.save()
59
- )
54
+ self.window.ui.nodes['preset.btn.current'].clicked.connect(self.window.controller.presets.editor.from_current)
55
+ self.window.ui.nodes['preset.btn.save'].clicked.connect(self.window.controller.presets.editor.save)
60
56
 
61
57
  self.window.ui.nodes['preset.btn.current'].setAutoDefault(False)
62
58
  self.window.ui.nodes['preset.btn.save'].setAutoDefault(True)
@@ -119,14 +115,14 @@ class Preset(BaseConfigDialog):
119
115
  mode_keys_middle = [
120
116
  MODE_COMPLETION,
121
117
  MODE_IMAGE,
122
- MODE_VISION,
118
+ # MODE_VISION,
123
119
  MODE_COMPUTER,
120
+ MODE_EXPERT,
124
121
  ]
125
122
  mode_keys_right = [
126
123
  MODE_AGENT_LLAMA,
127
124
  MODE_AGENT_OPENAI,
128
125
  MODE_AGENT,
129
- MODE_EXPERT,
130
126
  ]
131
127
 
132
128
  rows_mode_left = QVBoxLayout()
@@ -156,17 +152,20 @@ class Preset(BaseConfigDialog):
156
152
  rows_mode.addStretch(1)
157
153
 
158
154
  # modes
159
- self.window.ui.nodes['preset.editor.modes'] = QWidget()
160
- self.window.ui.nodes['preset.editor.modes'].setLayout(rows_mode)
161
- self.window.ui.nodes['preset.editor.modes'].setContentsMargins(0, 0, 0, 0)
155
+ modes = QWidget()
156
+ modes.setLayout(rows_mode)
157
+ modes.setContentsMargins(0, 0, 0, 0)
158
+ self.window.ui.nodes['preset.editor.modes'] = modes
162
159
 
163
160
  # experts
164
161
  self.window.ui.nodes['preset.editor.experts'] = ExpertsEditor(self.window)
165
162
 
166
163
  # desc and prompt
167
- self.window.ui.nodes['preset.editor.description'] = QWidget()
168
- self.window.ui.nodes['preset.editor.description'].setLayout(options['description'])
169
- self.window.ui.nodes['preset.editor.description'].setContentsMargins(0, 5, 0, 5)
164
+ desc = QWidget()
165
+ desc.setLayout(options['description'])
166
+ desc.setContentsMargins(0, 5, 0, 5)
167
+ self.window.ui.nodes['preset.editor.description'] = desc
168
+
170
169
 
171
170
  # prompt + extra options
172
171
  prompt_layout = QVBoxLayout()
@@ -195,6 +194,7 @@ class Preset(BaseConfigDialog):
195
194
  "agent_provider_openai",
196
195
  "idx",
197
196
  ]
197
+ # personalize tab
198
198
  personalize_keys = [
199
199
  "ai_name",
200
200
  "user_name",
@@ -202,15 +202,18 @@ class Preset(BaseConfigDialog):
202
202
  "ai_personalize",
203
203
  ]
204
204
  for key in left_keys:
205
- self.window.ui.nodes['preset.editor.' + key] = QWidget()
206
- self.window.ui.nodes['preset.editor.' + key].setLayout(options[key])
207
- self.window.ui.nodes['preset.editor.' + key].setContentsMargins(0, 0, 0, 0)
208
- rows.addWidget(self.window.ui.nodes['preset.editor.' + key])
205
+ node_key = f"preset.editor.{key}"
206
+ node = QWidget()
207
+ node.setLayout(options[key])
208
+ node.setContentsMargins(0, 0, 0, 0)
209
+ rows.addWidget(node)
210
+ self.window.ui.nodes[node_key] = node
209
211
 
210
212
  # remote tools
211
- self.window.ui.nodes['preset.editor.remote_tools'] = QWidget()
212
- self.window.ui.nodes['preset.editor.remote_tools'].setLayout(options['remote_tools'])
213
- self.window.ui.nodes['preset.editor.remote_tools'].setContentsMargins(0, 0, 0, 0)
213
+ remote_tools = QWidget()
214
+ remote_tools.setLayout(options['remote_tools'])
215
+ remote_tools.setContentsMargins(0, 0, 0, 0)
216
+ self.window.ui.nodes['preset.editor.remote_tools'] = remote_tools
214
217
 
215
218
  rows_remote_tools = QVBoxLayout()
216
219
  rows_remote_tools.addWidget(self.window.ui.nodes['preset.editor.remote_tools'])
@@ -222,10 +225,12 @@ class Preset(BaseConfigDialog):
222
225
  # personalize
223
226
  personalize_rows = QVBoxLayout()
224
227
  for key in personalize_keys:
225
- self.window.ui.nodes['preset.editor.' + key] = QWidget()
226
- self.window.ui.nodes['preset.editor.' + key].setLayout(options[key])
227
- self.window.ui.nodes['preset.editor.' + key].setContentsMargins(0, 0, 0, 0)
228
- personalize_rows.addWidget(self.window.ui.nodes['preset.editor.' + key])
228
+ node_key = f"preset.editor.{key}"
229
+ node = QWidget()
230
+ node.setLayout(options[key])
231
+ node.setContentsMargins(0, 0, 0, 0)
232
+ personalize_rows.addWidget(node)
233
+ self.window.ui.nodes[node_key] = node
229
234
 
230
235
  self.window.ui.nodes['preset.editor.ai_avatar'].setVisible(False)
231
236
 
@@ -255,11 +260,12 @@ class Preset(BaseConfigDialog):
255
260
  widget_main = QWidget()
256
261
  widget_main.setLayout(main)
257
262
 
258
- self.window.ui.splitters['editor.presets'] = QSplitter(Qt.Vertical)
259
- self.window.ui.splitters['editor.presets'].addWidget(widget_main)
260
- self.window.ui.splitters['editor.presets'].addWidget(widget_prompt)
261
- self.window.ui.splitters['editor.presets'].setStretchFactor(0, 1)
262
- self.window.ui.splitters['editor.presets'].setStretchFactor(1, 2)
263
+ splitter = QSplitter(Qt.Vertical)
264
+ splitter.addWidget(widget_main)
265
+ splitter.addWidget(widget_prompt)
266
+ splitter.setStretchFactor(0, 1)
267
+ splitter.setStretchFactor(1, 2)
268
+ self.window.ui.splitters['editor.presets'] = splitter
263
269
 
264
270
  widget_personalize = QWidget()
265
271
  widget_personalize.setLayout(personalize_rows)
@@ -270,24 +276,26 @@ class Preset(BaseConfigDialog):
270
276
  widget_experts = QWidget()
271
277
  widget_experts.setLayout(experts_rows)
272
278
 
273
- self.window.ui.tabs['preset.editor.tabs'] = QTabWidget()
274
- self.window.ui.tabs['preset.editor.tabs'].addTab(self.window.ui.splitters['editor.presets'], trans("preset.tab.general"))
275
- self.window.ui.tabs['preset.editor.tabs'].addTab(widget_personalize, trans("preset.tab.personalize"))
276
- self.window.ui.tabs['preset.editor.tabs'].addTab(widget_experts, trans("preset.tab.experts"))
277
- self.window.ui.tabs['preset.editor.tabs'].addTab(widget_remote_tools, trans("preset.tab.remote_tools"))
279
+ tabs = QTabWidget()
280
+ tabs.addTab(splitter, trans("preset.tab.general"))
281
+ tabs.addTab(widget_personalize, trans("preset.tab.personalize"))
282
+ tabs.addTab(widget_experts, trans("preset.tab.experts"))
283
+ tabs.addTab(widget_remote_tools, trans("preset.tab.remote_tools"))
284
+ self.window.ui.tabs['preset.editor.tabs'] = tabs
278
285
 
279
286
  layout = QVBoxLayout()
280
287
  layout.addWidget(self.window.ui.tabs['preset.editor.tabs'])
281
288
  layout.addLayout(footer)
282
289
 
283
- self.window.ui.dialog['editor.' + self.dialog_id] = EditorDialog(self.window, self.dialog_id)
284
- self.window.ui.dialog['editor.' + self.dialog_id].setSizeGripEnabled(True)
285
- self.window.ui.dialog['editor.' + self.dialog_id].setWindowFlags(
286
- self.window.ui.dialog['editor.' + self.dialog_id].windowFlags() | Qt.WindowMaximizeButtonHint
290
+ dialog = EditorDialog(self.window, self.dialog_id)
291
+ dialog.setSizeGripEnabled(True)
292
+ dialog.setWindowFlags(
293
+ dialog.windowFlags() | Qt.WindowMaximizeButtonHint
287
294
  )
288
- self.window.ui.dialog['editor.' + self.dialog_id].setLayout(layout)
289
- self.window.ui.dialog['editor.' + self.dialog_id].setWindowTitle(trans('dialog.preset'))
290
- self.window.ui.dialog['editor.' + self.dialog_id].on_close_callback = self.on_close
295
+ dialog.setLayout(layout)
296
+ dialog.setWindowTitle(trans('dialog.preset'))
297
+ dialog.on_close_callback = self.on_close
298
+ self.window.ui.dialog['editor.' + self.dialog_id] = dialog
291
299
 
292
300
 
293
301
  def prepare_extra_config(self, prompt_layout):
@@ -301,15 +309,17 @@ class Preset(BaseConfigDialog):
301
309
  prompt_widget.setLayout(prompt_layout)
302
310
 
303
311
  self.window.ui.nodes['preset.editor.extra'] = {}
304
- self.window.ui.tabs['preset.editor.extra'] = QTabWidget()
305
- self.window.ui.tabs['preset.editor.extra'].addTab(
312
+
313
+ tabs = QTabWidget()
314
+ tabs.addTab(
306
315
  prompt_widget,
307
316
  trans("preset.prompt"),
308
317
  )
309
- self.window.ui.tabs['preset.editor.extra'].setSizePolicy(QSizePolicy.Expanding, QSizePolicy.Expanding)
310
- self.window.ui.tabs['preset.editor.extra'].setMinimumHeight(150)
318
+ tabs.setSizePolicy(QSizePolicy.Expanding, QSizePolicy.Expanding)
319
+ tabs.setMinimumHeight(150)
311
320
  layout = QVBoxLayout()
312
- layout.addWidget(self.window.ui.tabs['preset.editor.extra'])
321
+ layout.addWidget(tabs)
322
+ self.window.ui.tabs['preset.editor.extra'] = tabs
313
323
  return layout
314
324
 
315
325
 
@@ -368,6 +378,7 @@ class AvatarWidget(QWidget):
368
378
  self.init_ui()
369
379
 
370
380
  def init_ui(self):
381
+ """Initialize the avatar widget UI."""
371
382
  main_layout = QVBoxLayout(self)
372
383
  main_layout.setContentsMargins(0, 0, 0, 0)
373
384
 
@@ -397,13 +408,19 @@ class AvatarWidget(QWidget):
397
408
  main_layout.addStretch()
398
409
 
399
410
  def open_file_dialog(self):
411
+ """Open a file dialog to select an avatar image file."""
400
412
  file_name, _ = QFileDialog.getOpenFileName(
401
413
  self, trans("preset.personalize.avatar.choose.title"), "", "Images (*.png *.jpg *.jpeg *.bmp *.gif *.webp)"
402
414
  )
403
415
  if file_name:
404
416
  self.window.controller.presets.editor.upload_avatar(file_name)
405
417
 
406
- def load_avatar(self, file_path):
418
+ def load_avatar(self, file_path: str):
419
+ """
420
+ Load and display the avatar image from the given file path.
421
+
422
+ :param file_path: Path to the avatar image file
423
+ """
407
424
  from PySide6.QtGui import QPixmap
408
425
  pixmap = QPixmap(file_path)
409
426
  if not pixmap.isNull():
@@ -420,9 +437,7 @@ class AvatarWidget(QWidget):
420
437
  self.remove_button.setEnabled(enabled)
421
438
 
422
439
  def disable_remove_button(self):
423
- """
424
- Disable the remove button.
425
- """
440
+ """Disable the remove button."""
426
441
  self.enable_remove_button(False)
427
442
 
428
443
  def get_cover_pixmap(self, pixmap, target_width, target_height):
@@ -432,6 +447,7 @@ class AvatarWidget(QWidget):
432
447
  :param pixmap: Original pixmap
433
448
  :param target_width: Target width for the avatar preview
434
449
  :param target_height: Target height for the avatar preview
450
+ :return: Scaled and cropped pixmap
435
451
  """
436
452
  factor = max(target_width / pixmap.width(), target_height / pixmap.height())
437
453
  new_width = int(pixmap.width() * factor)
@@ -439,9 +455,9 @@ class AvatarWidget(QWidget):
439
455
  scaled_pix = pixmap.scaled(new_width, new_height, Qt.KeepAspectRatio, Qt.SmoothTransformation)
440
456
  x = (scaled_pix.width() - target_width) // 2
441
457
  y = (scaled_pix.height() - target_height) // 2
442
- cropped_pix = scaled_pix.copy(x, y, target_width, target_height)
443
- return cropped_pix
458
+ return scaled_pix.copy(x, y, target_width, target_height)
444
459
 
445
460
  def remove_avatar(self):
461
+ """Remove the current avatar image."""
446
462
  self.avatar_preview.clear()
447
463
  self.remove_button.setEnabled(False)
pygpt_net/ui/main.py CHANGED
@@ -17,12 +17,13 @@ from PySide6.QtWidgets import QMainWindow, QApplication
17
17
  from qt_material import QtStyleTools
18
18
 
19
19
  from pygpt_net.core.events import BaseEvent, KernelEvent, ControlEvent
20
- from pygpt_net.container import Container
20
+ from pygpt_net.app_core import Core
21
21
  from pygpt_net.controller import Controller
22
22
  from pygpt_net.tools import Tools
23
23
  from pygpt_net.ui import UI
24
24
  from pygpt_net.ui.widget.textarea.web import ChatWebOutput
25
- from pygpt_net.utils import get_app_meta
25
+ from pygpt_net.utils import get_app_meta, freeze_updates
26
+
26
27
 
27
28
  class MainWindow(QMainWindow, QtStyleTools):
28
29
 
@@ -63,7 +64,7 @@ class MainWindow(QMainWindow, QtStyleTools):
63
64
  self.meta = get_app_meta()
64
65
 
65
66
  # setup service container
66
- self.core = Container(self)
67
+ self.core = Core(self)
67
68
  self.core.init()
68
69
  self.core.patch() # patch version if needed
69
70
  self.core.post_setup()
@@ -85,7 +86,8 @@ class MainWindow(QMainWindow, QtStyleTools):
85
86
 
86
87
  # setup UI
87
88
  self.ui = UI(self)
88
- self.ui.init()
89
+ with freeze_updates(self):
90
+ self.ui.init()
89
91
 
90
92
  # global shortcuts
91
93
  self.shortcuts = []
pygpt_net/utils.py CHANGED
@@ -13,6 +13,7 @@ import json
13
13
  import os
14
14
  import re
15
15
  from datetime import datetime
16
+ from contextlib import contextmanager
16
17
 
17
18
  from PySide6 import QtCore, QtGui
18
19
  from PySide6.QtWidgets import QApplication
@@ -61,6 +62,14 @@ def trans(key: str, reload: bool = False, domain: str = None) -> str:
61
62
  return locale.get(key, domain)
62
63
 
63
64
 
65
+ @contextmanager
66
+ def freeze_updates(widget):
67
+ widget.setUpdatesEnabled(False)
68
+ try:
69
+ yield
70
+ finally:
71
+ widget.setUpdatesEnabled(True)
72
+
64
73
  def get_init_value(key: str = "__version__") -> str:
65
74
  """
66
75
  Return config value from __init__.py
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.3
2
2
  Name: pygpt-net
3
- Version: 2.6.28
3
+ Version: 2.6.30
4
4
  Summary: Desktop AI Assistant powered by: OpenAI GPT-5, GPT-4, o1, o3, Gemini, Claude, Grok, DeepSeek, and other models supported by Llama Index, and Ollama. Chatbot, agents, completion, image generation, vision analysis, speech-to-text, plugins, internet access, file handling, command execution and more.
5
5
  License: MIT
6
6
  Keywords: ai,api,api key,app,assistant,bielik,chat,chatbot,chatgpt,claude,dall-e,deepseek,desktop,gemini,gpt,gpt-3.5,gpt-4,gpt-4-vision,gpt-4o,gpt-5,gpt-oss,gpt3.5,gpt4,grok,langchain,llama-index,llama3,mistral,o1,o3,ollama,openai,presets,py-gpt,py_gpt,pygpt,pyside,qt,text completion,tts,ui,vision,whisper
@@ -117,7 +117,7 @@ Description-Content-Type: text/markdown
117
117
 
118
118
  [![pygpt](https://snapcraft.io/pygpt/badge.svg)](https://snapcraft.io/pygpt)
119
119
 
120
- Release: **2.6.28** | build: **2025-08-27** | Python: **>=3.10, <3.14**
120
+ Release: **2.6.30** | build: **2025-08-29** | Python: **>=3.10, <3.14**
121
121
 
122
122
  > Official website: https://pygpt.net | Documentation: https://pygpt.readthedocs.io
123
123
  >
@@ -157,7 +157,7 @@ You can download compiled 64-bit versions for Windows and Linux here: https://py
157
157
 
158
158
  - Desktop AI Assistant for `Linux`, `Windows` and `Mac`, written in Python.
159
159
  - Works similarly to `ChatGPT`, but locally (on a desktop computer).
160
- - 12 modes of operation: Chat, Chat with Files, Chat with Audio, Research (Perplexity), Completion, Image generation, Vision, Assistants, Experts, Computer use, Agents and Autonomous Mode.
160
+ - 11 modes of operation: Chat, Chat with Files, Chat with Audio, Research (Perplexity), Completion, Image generation, Assistants, Experts, Computer use, Agents and Autonomous Mode.
161
161
  - Supports multiple models like `OpenAI GPT-5`, `GPT-4`, `o1`, `o3`, `o4`, `Google Gemini`, `Anthropic Claude`, `xAI Grok`, `DeepSeek V3/R1`, `Perplexity / Sonar`, and any model accessible through `LlamaIndex` and `Ollama` such as `DeepSeek`, `gpt-oss`, `Llama 3`, `Mistral`, `Bielik`, etc.
162
162
  - Chat with your own Files: integrated `LlamaIndex` support: chat with data such as: `txt`, `pdf`, `csv`, `html`, `md`, `docx`, `json`, `epub`, `xlsx`, `xml`, webpages, `Google`, `GitHub`, video/audio, images and other data types, or use conversation history as additional context provided to the model.
163
163
  - Built-in vector databases support and automated files and data embedding.
@@ -181,7 +181,7 @@ You can download compiled 64-bit versions for Windows and Linux here: https://py
181
181
  - Includes simple painter / drawing tool.
182
182
  - Supports multiple languages.
183
183
  - Requires no previous knowledge of using AI models.
184
- - Simplifies image generation using `DALL-E`.
184
+ - Simplifies image generation using image models like `DALL-E` and `Imagen`.
185
185
  - Fully configurable.
186
186
  - Themes support.
187
187
  - Real-time code syntax highlighting.
@@ -439,9 +439,9 @@ Alternatively, you can try removing snap and reinstalling it:
439
439
  `sudo snap install pygpt`
440
440
 
441
441
 
442
- **Access to microphone and audio in Windows version:**
442
+ **Access to a microphone and audio in the Windows version:**
443
443
 
444
- If you have a problems with audio or microphone in the non-binary PIP/Python version on Windows, check to see if FFmpeg is installed. If it's not, install it and add it to the PATH. You can find a tutorial on how to do this here: https://phoenixnap.com/kb/ffmpeg-windows. The binary version already includes FFmpeg.
444
+ If you have problems with audio or a microphone in the non-binary PIP/Python version on Windows, check to see if FFmpeg is installed. If it's not, install it and add it to the PATH. You can find a tutorial on how to do this here: https://phoenixnap.com/kb/ffmpeg-windows. The binary version already includes FFmpeg.
445
445
 
446
446
  **Windows and VC++ Redistributable**
447
447
 
@@ -519,9 +519,16 @@ Here, you can add or manage API keys for any supported provider.
519
519
 
520
520
  **+ Inline Vision and Image generation**
521
521
 
522
- This mode in **PyGPT** mirrors `ChatGPT`, allowing you to chat with models such as `GPT-5`, `GPT-4`, `o1`, `o3`, and`Claude`, `Gemini`, `Grok`, `Perplexity (sonar)`, `Deepseek`, and others. It works by using the `Responses` and `ChatCompletions` OpenAI API (or compatible). You can select the API endpoint to use in: `Config -> Settings -> API Keys`.
522
+ In **PyGPT**, this mode mirrors `ChatGPT`, allowing you to chat with models like `GPT-5`, `GPT-4`, `o1`, `o3`, `Claude`, `Gemini`, `Grok`, `Perplexity (Sonar)`, `Deepseek`, and more. It works using the OpenAI API `Responses` and `ChatCompletions`, or the `Google GenAI SDK` if the Google native client is enabled. You can choose the API endpoint for `ChatCompletions` in `Config -> Settings -> API Keys`.
523
523
 
524
- **Tip: This mode directly uses the OpenAI SDK. Other models, such as Gemini, Claude, Grok, Sonar, or Llama3, are supported in Chat mode via LlamaIndex or OpenAI API compatible endpoints (if available), which the application switches to in the background when working with models other than OpenAI.**
524
+ **Tip:** This mode uses the provider SDK directly. If there's no native client built into the app, models like Gemini, Claude, Grok, Sonar, or Llama3 are supported in Chat mode via LlamaIndex or compatible OpenAI API endpoints. The app automatically switches to these endpoints when using non-OpenAI models.
525
+
526
+ Currently built-in native clients:
527
+
528
+ - OpenAI SDK
529
+ - Google GenAI SDK
530
+
531
+ Support for Anthropic and xAI native clients is coming soon.
525
532
 
526
533
  The main part of the interface is a chat window where you see your conversations. Below it is a message box for typing. On the right side, you can set up or change the model and system prompt. You can also save these settings as presets to easily switch between models or tasks.
527
534
 
@@ -683,17 +690,16 @@ From version `2.0.107` the `davinci` models are deprecated and has been replaced
683
690
 
684
691
  ## Image generation
685
692
 
686
- ### DALL-E 3
693
+ ### OpenAI DALL-E 3 / Google Imagen 3 and 4
687
694
 
688
- **PyGPT** enables quick and easy image creation with `DALL-E 3` or `gpt-image-1`.
689
- The older model version, `DALL-E 2`, is also accessible. Generating images is akin to a chat conversation - a user's prompt triggers the generation, followed by downloading, saving to the computer,
690
- and displaying the image onscreen. You can send raw prompt to `DALL-E` in `Image generation` mode or ask the model for the best prompt.
695
+ **PyGPT** enables quick and easy image creation with image models like `DALL-E 3`, `gpt-image-1` or `Google Imagen`.
696
+ Generating images is akin to a chat conversation - a user's prompt triggers the generation, followed by downloading, saving to the computer, and displaying the image onscreen. You can send a raw prompt to the model in `Image generation` mode or ask the model for the best prompt.
691
697
 
692
698
  ![v3_img](https://github.com/szczyglis-dev/py-gpt/raw/master/docs/source/images/v3_img.png)
693
699
 
694
- Image generation using DALL-E is available in every mode via plugin `Image Generation (inline)`. Just ask any model, in any mode, like e.g. GPT-4 to generate an image and it will do it inline, without need to mode change.
700
+ Image generation using image models is also available in every mode via the plugin `Image Generation (inline)`. Just ask any model, in any mode (e.g. GPT or Gemini), to generate an image and it will do it inline, without the need to change modes.
695
701
 
696
- If you want to generate images (using DALL-E) directly in chat you must enable plugin **Image generation (inline)** in the Plugins menu.
702
+ If you want to generate images directly in chat you must enable plugin **Image generation (inline)** in the Plugins menu.
697
703
  Plugin allows you to generate images in Chat mode:
698
704
 
699
705
  ![v3_img_chat](https://github.com/szczyglis-dev/py-gpt/raw/master/docs/source/images/v3_img_chat.png)
@@ -708,7 +714,7 @@ the bottom of the screen. This replaces the conversation temperature slider when
708
714
 
709
715
  There is an option for switching prompt generation mode.
710
716
 
711
- If **Raw Mode** is enabled, DALL-E will receive the prompt exactly as you have provided it.
717
+ If **Raw Mode** is enabled, a model will receive the prompt exactly as you have provided it.
712
718
  If **Raw Mode** is disabled, a model will generate the best prompt for you based on your instructions.
713
719
 
714
720
  ### Image storage
@@ -724,31 +730,6 @@ prompts for creating new images.
724
730
 
725
731
  Images are stored in ``img`` directory in **PyGPT** user data folder.
726
732
 
727
-
728
- ## Vision
729
-
730
- This mode enables image analysis using the `GPT-5`, `GPT-4o` and other vision (multimodal) models. Functioning much like the chat mode,
731
- it also allows you to upload images or provide URLs to images. The vision feature can analyze both local
732
- images and those found online.
733
-
734
- Vision is also integrated into any chat mode via plugin `Vision (inline)`. Just enable the plugin and use Vision in other work modes, such as Chat or Chat with Files.
735
-
736
- Vision mode also includes real-time video capture from camera. To capture image from camera and append it to chat just click on video at left side. You can also enable `Auto capture` - image will be captured and appended to chat message every time you send message.
737
-
738
- **1) Video camera real-time image capture**
739
-
740
- ![v3_vision_chat](https://github.com/szczyglis-dev/py-gpt/raw/master/docs/source/images/v3_vision_chat.png)
741
-
742
- **2) you can also provide an image URL**
743
-
744
- ![v2_mode_vision](https://github.com/szczyglis-dev/py-gpt/raw/master/docs/source/images/v2_mode_vision.png)
745
-
746
- **3) or you can just upload your local images or use the inline Vision in the standard chat mode:**
747
-
748
- ![v2_mode_vision_upload](https://github.com/szczyglis-dev/py-gpt/raw/master/docs/source/images/v2_mode_vision_upload.png)
749
-
750
- **Tip:** When using `Vision (inline)` by utilizing a plugin in standard mode, such as `Chat` (not `Vision` mode), the `+ Vision` label will appear at the bottom of the Chat window.
751
-
752
733
  ## Assistants
753
734
 
754
735
  This mode uses the OpenAI's **Assistants API**.
@@ -2363,8 +2344,6 @@ Config -> Settings...
2363
2344
 
2364
2345
  - `Directory for file downloads`: Subdirectory for downloaded files, e.g. in Assistants mode, inside "data". Default: "download"
2365
2346
 
2366
- - `Verbose mode`: Enabled verbose mode when using attachment as additional context.
2367
-
2368
2347
  - `Model for querying index`: Model to use for preparing query and querying the index when the RAG option is selected.
2369
2348
 
2370
2349
  - `Model for attachment content summary`: Model to use when generating a summary for the content of a file when the Summary option is selected.
@@ -2569,8 +2548,6 @@ Enable/disable remote tools, like Web Search or Image generation to use in OpenA
2569
2548
 
2570
2549
  **General**
2571
2550
 
2572
- - `Verbose` - enables verbose mode.
2573
-
2574
2551
  - `Auto retrieve additional context from RAG`: Auto retrieve additional context from RAG at the beginning if the index is provided.
2575
2552
 
2576
2553
  - `Display a tray notification when the goal is achieved.`: If enabled, a notification will be displayed after goal achieved / finished run.
@@ -2641,10 +2618,12 @@ Enable/disable remote tools, like Web Search or Image generation to use in OpenA
2641
2618
 
2642
2619
  - `Check for updates in background`: Enables checking for updates in background (checking every 5 minutes). Default: True.
2643
2620
 
2644
- **Developer**
2621
+ **Debug**
2645
2622
 
2646
2623
  - `Show debug menu`: Enables debug (developer) menu.
2647
2624
 
2625
+ - `Log level`: toggle log level (ERROR|WARNING|INFO|DEBUG)
2626
+
2648
2627
  - `Log and debug context`: Enables logging of context input/output.
2649
2628
 
2650
2629
  - `Log and debug events`: Enables logging of event dispatch.
@@ -2653,12 +2632,14 @@ Enable/disable remote tools, like Web Search or Image generation to use in OpenA
2653
2632
 
2654
2633
  - `Log DALL-E usage to console`: Enables logging of DALL-E usage to console.
2655
2634
 
2635
+ - `Log attachments usage to console`: Enables logging of attachments usage to console.
2636
+
2637
+ - `Log Agents usage to console`: Enables logging of Agents usage to console.
2638
+
2656
2639
  - `Log LlamaIndex usage to console`: Enables logging of LlamaIndex usage to console.
2657
2640
 
2658
2641
  - `Log Assistants usage to console`: Enables logging of Assistants API usage to console.
2659
2642
 
2660
- - `Log level`: toggle log level (ERROR|WARNING|INFO|DEBUG)
2661
-
2662
2643
 
2663
2644
  ## JSON files
2664
2645
 
@@ -3363,7 +3344,7 @@ These wrappers are loaded into the application during startup using `launcher.ad
3363
3344
  ```python
3364
3345
  # app.py
3365
3346
 
3366
- from pygpt_net.provider.llms.openai import OpenAILLM
3347
+ from pygpt_net.provider.api.openai import OpenAILLM
3367
3348
  from pygpt_net.provider.llms.azure_openai import AzureOpenAILLM
3368
3349
  from pygpt_net.provider.llms.anthropic import AnthropicLLM
3369
3350
  from pygpt_net.provider.llms.hugging_face import HuggingFaceLLM
@@ -3575,6 +3556,19 @@ may consume additional tokens that are not displayed in the main window.
3575
3556
 
3576
3557
  ## Recent changes:
3577
3558
 
3559
+ **2.6.30 (2025-08-29)**
3560
+
3561
+ - Added native Google GenAI API support (beta); live audio is not supported yet (#132).
3562
+ - Added new predefined models for image generation: Google Imagen3 and Imagen4.
3563
+ - Optimized token usage in the Responses API.
3564
+ - Removed Vision mode (it is now integrated into Chat).
3565
+
3566
+ **2.6.29 (2025-08-28)**
3567
+
3568
+ - Verbose options have been moved to the Developer section in settings.
3569
+ - Enhanced logging of embeddings usage.
3570
+ - Fixed styles list.
3571
+
3578
3572
  **2.6.28 (2025-08-27)**
3579
3573
 
3580
3574
  - Added new plugins: Tuya (IoT) and Wikipedia.