pygpt-net 2.6.29__py3-none-any.whl → 2.6.31__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (182)
  1. pygpt_net/CHANGELOG.txt +15 -0
  2. pygpt_net/__init__.py +3 -3
  3. pygpt_net/app.py +4 -0
  4. pygpt_net/{container.py → app_core.py} +5 -6
  5. pygpt_net/controller/__init__.py +5 -2
  6. pygpt_net/controller/access/control.py +1 -9
  7. pygpt_net/controller/assistant/assistant.py +4 -4
  8. pygpt_net/controller/assistant/batch.py +7 -7
  9. pygpt_net/controller/assistant/files.py +4 -4
  10. pygpt_net/controller/assistant/threads.py +3 -3
  11. pygpt_net/controller/attachment/attachment.py +4 -7
  12. pygpt_net/controller/audio/audio.py +25 -1
  13. pygpt_net/controller/audio/ui.py +2 -2
  14. pygpt_net/controller/chat/audio.py +1 -8
  15. pygpt_net/controller/chat/common.py +30 -4
  16. pygpt_net/controller/chat/handler/stream_worker.py +1124 -0
  17. pygpt_net/controller/chat/output.py +8 -3
  18. pygpt_net/controller/chat/stream.py +4 -405
  19. pygpt_net/controller/chat/text.py +3 -2
  20. pygpt_net/controller/chat/vision.py +11 -19
  21. pygpt_net/controller/config/placeholder.py +1 -1
  22. pygpt_net/controller/ctx/ctx.py +1 -1
  23. pygpt_net/controller/ctx/summarizer.py +1 -1
  24. pygpt_net/controller/kernel/kernel.py +11 -3
  25. pygpt_net/controller/kernel/reply.py +5 -1
  26. pygpt_net/controller/mode/mode.py +21 -12
  27. pygpt_net/controller/plugins/settings.py +3 -2
  28. pygpt_net/controller/presets/editor.py +112 -99
  29. pygpt_net/controller/realtime/__init__.py +12 -0
  30. pygpt_net/controller/realtime/manager.py +53 -0
  31. pygpt_net/controller/realtime/realtime.py +268 -0
  32. pygpt_net/controller/theme/theme.py +3 -2
  33. pygpt_net/controller/ui/mode.py +7 -0
  34. pygpt_net/controller/ui/ui.py +19 -1
  35. pygpt_net/controller/ui/vision.py +4 -4
  36. pygpt_net/core/agents/legacy.py +2 -2
  37. pygpt_net/core/agents/runners/openai_workflow.py +2 -2
  38. pygpt_net/core/assistants/files.py +5 -5
  39. pygpt_net/core/assistants/store.py +4 -4
  40. pygpt_net/core/audio/audio.py +6 -1
  41. pygpt_net/core/audio/backend/native/__init__.py +12 -0
  42. pygpt_net/core/audio/backend/{native.py → native/native.py} +426 -127
  43. pygpt_net/core/audio/backend/native/player.py +139 -0
  44. pygpt_net/core/audio/backend/native/realtime.py +250 -0
  45. pygpt_net/core/audio/backend/pyaudio/__init__.py +12 -0
  46. pygpt_net/core/audio/backend/pyaudio/playback.py +194 -0
  47. pygpt_net/core/audio/backend/pyaudio/pyaudio.py +923 -0
  48. pygpt_net/core/audio/backend/pyaudio/realtime.py +275 -0
  49. pygpt_net/core/audio/backend/pygame/__init__.py +12 -0
  50. pygpt_net/core/audio/backend/{pygame.py → pygame/pygame.py} +130 -19
  51. pygpt_net/core/audio/backend/shared/__init__.py +38 -0
  52. pygpt_net/core/audio/backend/shared/conversions.py +211 -0
  53. pygpt_net/core/audio/backend/shared/envelope.py +38 -0
  54. pygpt_net/core/audio/backend/shared/player.py +137 -0
  55. pygpt_net/core/audio/backend/shared/rt.py +52 -0
  56. pygpt_net/core/audio/capture.py +5 -0
  57. pygpt_net/core/audio/output.py +13 -2
  58. pygpt_net/core/audio/whisper.py +6 -2
  59. pygpt_net/core/bridge/bridge.py +4 -3
  60. pygpt_net/core/bridge/worker.py +31 -9
  61. pygpt_net/core/debug/console/console.py +2 -2
  62. pygpt_net/core/debug/presets.py +2 -2
  63. pygpt_net/core/dispatcher/dispatcher.py +37 -1
  64. pygpt_net/core/events/__init__.py +2 -1
  65. pygpt_net/core/events/realtime.py +55 -0
  66. pygpt_net/core/experts/experts.py +2 -2
  67. pygpt_net/core/image/image.py +51 -1
  68. pygpt_net/core/modes/modes.py +2 -2
  69. pygpt_net/core/presets/presets.py +3 -3
  70. pygpt_net/core/realtime/options.py +87 -0
  71. pygpt_net/core/realtime/shared/__init__.py +0 -0
  72. pygpt_net/core/realtime/shared/audio.py +213 -0
  73. pygpt_net/core/realtime/shared/loop.py +64 -0
  74. pygpt_net/core/realtime/shared/session.py +59 -0
  75. pygpt_net/core/realtime/shared/text.py +37 -0
  76. pygpt_net/core/realtime/shared/tools.py +276 -0
  77. pygpt_net/core/realtime/shared/turn.py +38 -0
  78. pygpt_net/core/realtime/shared/types.py +16 -0
  79. pygpt_net/core/realtime/worker.py +164 -0
  80. pygpt_net/core/tokens/tokens.py +4 -4
  81. pygpt_net/core/types/__init__.py +1 -0
  82. pygpt_net/core/types/image.py +48 -0
  83. pygpt_net/core/types/mode.py +5 -2
  84. pygpt_net/core/vision/analyzer.py +1 -1
  85. pygpt_net/data/config/config.json +13 -4
  86. pygpt_net/data/config/models.json +219 -101
  87. pygpt_net/data/config/modes.json +3 -9
  88. pygpt_net/data/config/settings.json +135 -27
  89. pygpt_net/data/config/settings_section.json +2 -2
  90. pygpt_net/data/locale/locale.de.ini +7 -7
  91. pygpt_net/data/locale/locale.en.ini +25 -12
  92. pygpt_net/data/locale/locale.es.ini +7 -7
  93. pygpt_net/data/locale/locale.fr.ini +7 -7
  94. pygpt_net/data/locale/locale.it.ini +7 -7
  95. pygpt_net/data/locale/locale.pl.ini +8 -8
  96. pygpt_net/data/locale/locale.uk.ini +7 -7
  97. pygpt_net/data/locale/locale.zh.ini +3 -3
  98. pygpt_net/data/locale/plugin.audio_input.en.ini +4 -0
  99. pygpt_net/data/locale/plugin.audio_output.en.ini +4 -0
  100. pygpt_net/item/model.py +23 -3
  101. pygpt_net/plugin/audio_input/plugin.py +37 -4
  102. pygpt_net/plugin/audio_input/simple.py +57 -8
  103. pygpt_net/plugin/cmd_files/worker.py +3 -0
  104. pygpt_net/plugin/openai_dalle/plugin.py +4 -4
  105. pygpt_net/plugin/openai_vision/plugin.py +12 -13
  106. pygpt_net/provider/agents/openai/agent.py +5 -5
  107. pygpt_net/provider/agents/openai/agent_b2b.py +5 -5
  108. pygpt_net/provider/agents/openai/agent_planner.py +5 -6
  109. pygpt_net/provider/agents/openai/agent_with_experts.py +5 -5
  110. pygpt_net/provider/agents/openai/agent_with_experts_feedback.py +4 -4
  111. pygpt_net/provider/agents/openai/agent_with_feedback.py +4 -4
  112. pygpt_net/provider/agents/openai/bot_researcher.py +2 -2
  113. pygpt_net/provider/agents/openai/bots/research_bot/agents/planner_agent.py +1 -1
  114. pygpt_net/provider/agents/openai/bots/research_bot/agents/search_agent.py +1 -1
  115. pygpt_net/provider/agents/openai/bots/research_bot/agents/writer_agent.py +1 -1
  116. pygpt_net/provider/agents/openai/evolve.py +5 -5
  117. pygpt_net/provider/agents/openai/supervisor.py +4 -4
  118. pygpt_net/provider/api/__init__.py +27 -0
  119. pygpt_net/provider/api/anthropic/__init__.py +68 -0
  120. pygpt_net/provider/api/google/__init__.py +295 -0
  121. pygpt_net/provider/api/google/audio.py +121 -0
  122. pygpt_net/provider/api/google/chat.py +591 -0
  123. pygpt_net/provider/api/google/image.py +427 -0
  124. pygpt_net/provider/api/google/realtime/__init__.py +12 -0
  125. pygpt_net/provider/api/google/realtime/client.py +1945 -0
  126. pygpt_net/provider/api/google/realtime/realtime.py +186 -0
  127. pygpt_net/provider/api/google/tools.py +222 -0
  128. pygpt_net/provider/api/google/vision.py +129 -0
  129. pygpt_net/provider/{gpt → api/openai}/__init__.py +24 -4
  130. pygpt_net/provider/api/openai/agents/__init__.py +0 -0
  131. pygpt_net/provider/{gpt → api/openai}/agents/computer.py +1 -1
  132. pygpt_net/provider/{gpt → api/openai}/agents/experts.py +1 -1
  133. pygpt_net/provider/{gpt → api/openai}/agents/response.py +1 -1
  134. pygpt_net/provider/{gpt → api/openai}/assistants.py +1 -1
  135. pygpt_net/provider/{gpt → api/openai}/chat.py +15 -8
  136. pygpt_net/provider/{gpt → api/openai}/completion.py +1 -1
  137. pygpt_net/provider/{gpt → api/openai}/image.py +1 -1
  138. pygpt_net/provider/api/openai/realtime/__init__.py +12 -0
  139. pygpt_net/provider/api/openai/realtime/client.py +1828 -0
  140. pygpt_net/provider/api/openai/realtime/realtime.py +194 -0
  141. pygpt_net/provider/{gpt → api/openai}/remote_tools.py +1 -1
  142. pygpt_net/provider/{gpt → api/openai}/responses.py +34 -20
  143. pygpt_net/provider/{gpt → api/openai}/store.py +2 -2
  144. pygpt_net/provider/{gpt → api/openai}/vision.py +1 -1
  145. pygpt_net/provider/api/openai/worker/__init__.py +0 -0
  146. pygpt_net/provider/{gpt → api/openai}/worker/assistants.py +4 -4
  147. pygpt_net/provider/{gpt → api/openai}/worker/importer.py +10 -10
  148. pygpt_net/provider/audio_input/google_genai.py +103 -0
  149. pygpt_net/provider/audio_input/openai_whisper.py +1 -1
  150. pygpt_net/provider/audio_output/google_genai_tts.py +229 -0
  151. pygpt_net/provider/audio_output/openai_tts.py +9 -6
  152. pygpt_net/provider/core/config/patch.py +26 -0
  153. pygpt_net/provider/core/model/patch.py +20 -0
  154. pygpt_net/provider/core/preset/json_file.py +2 -4
  155. pygpt_net/provider/llms/anthropic.py +2 -5
  156. pygpt_net/provider/llms/base.py +4 -3
  157. pygpt_net/provider/llms/google.py +8 -9
  158. pygpt_net/provider/llms/openai.py +1 -1
  159. pygpt_net/provider/loaders/hub/image_vision/base.py +1 -1
  160. pygpt_net/ui/dialog/preset.py +71 -55
  161. pygpt_net/ui/layout/toolbox/footer.py +16 -0
  162. pygpt_net/ui/layout/toolbox/image.py +5 -0
  163. pygpt_net/ui/main.py +6 -4
  164. pygpt_net/ui/widget/option/combo.py +15 -1
  165. pygpt_net/utils.py +9 -0
  166. {pygpt_net-2.6.29.dist-info → pygpt_net-2.6.31.dist-info}/METADATA +55 -55
  167. {pygpt_net-2.6.29.dist-info → pygpt_net-2.6.31.dist-info}/RECORD +181 -135
  168. pygpt_net/core/audio/backend/pyaudio.py +0 -554
  169. /pygpt_net/{provider/gpt/agents → controller/chat/handler}/__init__.py +0 -0
  170. /pygpt_net/{provider/gpt/worker → core/realtime}/__init__.py +0 -0
  171. /pygpt_net/provider/{gpt → api/openai}/agents/client.py +0 -0
  172. /pygpt_net/provider/{gpt → api/openai}/agents/remote_tools.py +0 -0
  173. /pygpt_net/provider/{gpt → api/openai}/agents/utils.py +0 -0
  174. /pygpt_net/provider/{gpt → api/openai}/audio.py +0 -0
  175. /pygpt_net/provider/{gpt → api/openai}/computer.py +0 -0
  176. /pygpt_net/provider/{gpt → api/openai}/container.py +0 -0
  177. /pygpt_net/provider/{gpt → api/openai}/summarizer.py +0 -0
  178. /pygpt_net/provider/{gpt → api/openai}/tools.py +0 -0
  179. /pygpt_net/provider/{gpt → api/openai}/utils.py +0 -0
  180. {pygpt_net-2.6.29.dist-info → pygpt_net-2.6.31.dist-info}/LICENSE +0 -0
  181. {pygpt_net-2.6.29.dist-info → pygpt_net-2.6.31.dist-info}/WHEEL +0 -0
  182. {pygpt_net-2.6.29.dist-info → pygpt_net-2.6.31.dist-info}/entry_points.txt +0 -0
@@ -25,12 +25,12 @@ from pygpt_net.core.types import (
  from pygpt_net.item.ctx import CtxItem
  from pygpt_net.item.model import ModelItem

- from pygpt_net.provider.gpt.agents.remote_tools import append_tools
+ from pygpt_net.provider.api.openai.agents.remote_tools import append_tools
+ from pygpt_net.provider.api.openai.agents.experts import get_experts
  from pygpt_net.utils import trans

  from ..base import BaseAgent
  from .bots.research_bot.manager import ResearchManager
- from ...gpt.agents.experts import get_experts


  class Agent(BaseAgent):
@@ -15,7 +15,7 @@ from pydantic import BaseModel
  from agents import Agent

  from pygpt_net.item.preset import PresetItem
- from pygpt_net.provider.gpt.agents.remote_tools import append_tools
+ from pygpt_net.provider.api.openai.agents.remote_tools import append_tools


  class WebSearchItem(BaseModel):
@@ -14,7 +14,7 @@ from agents.model_settings import ModelSettings

  from pygpt_net.core.types import OPENAI_REMOTE_TOOL_DISABLE_WEB_SEARCH
  from pygpt_net.item.preset import PresetItem
- from pygpt_net.provider.gpt.agents.remote_tools import append_tools
+ from pygpt_net.provider.api.openai.agents.remote_tools import append_tools


  def get_search_agent(
@@ -15,7 +15,7 @@ from pydantic import BaseModel
  from agents import Agent

  from pygpt_net.item.preset import PresetItem
- from pygpt_net.provider.gpt.agents.remote_tools import append_tools
+ from pygpt_net.provider.api.openai.agents.remote_tools import append_tools


  class ReportData(BaseModel):
@@ -30,12 +30,12 @@ from pygpt_net.item.ctx import CtxItem
  from pygpt_net.item.model import ModelItem
  from pygpt_net.item.preset import PresetItem

- from pygpt_net.provider.gpt.agents.remote_tools import append_tools
- from pygpt_net.provider.gpt.agents.response import StreamHandler
+ from pygpt_net.provider.api.openai.agents.remote_tools import append_tools
+ from pygpt_net.provider.api.openai.agents.response import StreamHandler
+ from pygpt_net.provider.api.openai.agents.experts import get_experts
  from pygpt_net.utils import trans

  from ..base import BaseAgent
- from ...gpt.agents.experts import get_experts


  @dataclass
@@ -340,7 +340,7 @@ class Agent(BaseAgent):

  print("Winner: agent ", choose)

- final_output, last_response_id = window.core.gpt.responses.unpack_agent_response(results[choose], ctx)
+ final_output, last_response_id = window.core.api.openai.responses.unpack_agent_response(results[choose], ctx)
  input_items = results[choose].to_input_list()

  if bridge.stopped():
@@ -437,7 +437,7 @@ class Agent(BaseAgent):
  bridge.on_stop(ctx)
  break

- window.core.gpt.responses.unpack_agent_response(results[choose], ctx)
+ window.core.api.openai.responses.unpack_agent_response(results[choose], ctx)
  input_items = results[choose].to_input_list()

  evaluator_result = await Runner.run(evaluator, input_items)
@@ -31,9 +31,9 @@ from pygpt_net.core.types import (
  from pygpt_net.item.ctx import CtxItem
  from pygpt_net.item.model import ModelItem

- from pygpt_net.provider.gpt.agents.remote_tools import append_tools
- from pygpt_net.provider.gpt.agents.response import StreamHandler
- from pygpt_net.provider.gpt.agents.experts import get_experts
+ from pygpt_net.provider.api.openai.agents.remote_tools import append_tools
+ from pygpt_net.provider.api.openai.agents.response import StreamHandler
+ from pygpt_net.provider.api.openai.agents.experts import get_experts
  from pygpt_net.utils import trans

  from ..base import BaseAgent
@@ -218,7 +218,7 @@ class Agent(BaseAgent):
  agent,
  **kwargs
  )
- final_output, last_response_id = window.core.gpt.responses.unpack_agent_response(result, ctx)
+ final_output, last_response_id = window.core.api.openai.responses.unpack_agent_response(result, ctx)
  response_id = result.last_response_id
  if verbose:
  print("Final response:", result)
@@ -0,0 +1,27 @@
+ #!/usr/bin/env python3
+ # -*- coding: utf-8 -*-
+ # ================================================== #
+ # This file is a part of PYGPT package #
+ # Website: https://pygpt.net #
+ # GitHub: https://github.com/szczyglis-dev/py-gpt #
+ # MIT License #
+ # Created By : Marcin Szczygliński #
+ # Updated Date: 2025.08.28 20:00:00 #
+ # ================================================== #
+
+ from .anthropic import ApiAnthropic
+ from .google import ApiGoogle
+ from .openai import ApiOpenAI
+
+ class Api:
+
+     def __init__(self, window=None):
+         """
+         API wrappers core
+
+         :param window: Window instance
+         """
+         self.window = window
+         self.anthropic = ApiAnthropic(window)
+         self.google = ApiGoogle(window)
+         self.openai = ApiOpenAI(window)
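This new aggregate is what the earlier hunks switch to: call sites that previously used window.core.gpt.responses now go through window.core.api.openai.responses. A minimal access sketch, assuming window.core.api is wired to this Api class (as those renamed call sites suggest):

    # Sketch only: per-provider wrappers reachable through the new aggregate.
    api = window.core.api                           # Api instance
    openai_api = api.openai                         # ApiOpenAI (previously window.core.gpt)
    google_client = api.google.get_client()         # google-genai Client
    anthropic_client = api.anthropic.get_client()   # anthropic.Anthropic client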
@@ -0,0 +1,68 @@
+ #!/usr/bin/env python3
+ # -*- coding: utf-8 -*-
+ # ================================================== #
+ # This file is a part of PYGPT package #
+ # Website: https://pygpt.net #
+ # GitHub: https://github.com/szczyglis-dev/py-gpt #
+ # MIT License #
+ # Created By : Marcin Szczygliński #
+ # Updated Date: 2025.08.28 09:00:00 #
+ # ================================================== #
+
+ from anthropic import Anthropic
+
+ from pygpt_net.core.types import (
+     MODE_CHAT,
+ )
+ from pygpt_net.item.model import ModelItem
+
+ class ApiAnthropic:
+
+     def __init__(self, window=None):
+         """
+         Anthropic API wrapper core
+
+         :param window: Window instance
+         """
+         self.window = window
+         self.client = None
+         self.locked = False
+
+     def get_client(
+             self,
+             mode: str = MODE_CHAT,
+             model: ModelItem = None
+     ) -> Anthropic:
+         """
+         Return Anthropic client
+
+         :param mode: Mode
+         :param model: Model
+         :return: Anthropic client
+         """
+         if self.client is not None:
+             try:
+                 self.client.close()  # close previous client if exists
+             except Exception as e:
+                 self.window.core.debug.log(e)
+                 print("Error closing previous Anthropic client:", e)
+         self.client = Anthropic(
+             api_key=self.window.core.config.get('api_key_anthropic', "")
+         )
+         return self.client
+
+     def stop(self):
+         """On global event stop"""
+         pass
+
+     def close(self):
+         """Close Anthropic client"""
+         if self.locked:
+             return
+         if self.client is not None:
+             try:
+                 pass
+                 # self.client.close()
+             except Exception as e:
+                 self.window.core.debug.log(e)
+                 print("Error closing Anthropic client:", e)
@@ -0,0 +1,295 @@
+ #!/usr/bin/env python3
+ # -*- coding: utf-8 -*-
+ # ================================================== #
+ # This file is a part of PYGPT package #
+ # Website: https://pygpt.net #
+ # GitHub: https://github.com/szczyglis-dev/py-gpt #
+ # MIT License #
+ # Created By : Marcin Szczygliński #
+ # Updated Date: 2025.08.30 06:00:00 #
+ # ================================================== #
+
+ from typing import Optional, Dict, Any
+
+ from google.genai import types as gtypes
+ from google import genai
+
+ from pygpt_net.core.types import (
+     MODE_ASSISTANT,
+     MODE_AUDIO,
+     MODE_CHAT,
+     MODE_COMPLETION,
+     MODE_IMAGE,
+     MODE_RESEARCH,
+ )
+ from pygpt_net.core.bridge.context import BridgeContext
+ from pygpt_net.item.model import ModelItem
+
+ from .chat import Chat
+ from .vision import Vision
+ from .tools import Tools
+ from .audio import Audio
+ from .image import Image
+ from .realtime import Realtime
+
+ class ApiGoogle:
+     def __init__(self, window=None):
+         """
+         Google GenAI API SDK wrapper
+
+         :param window: Window instance
+         """
+         self.window = window
+         self.chat = Chat(window)
+         self.vision = Vision(window)
+         self.tools = Tools(window)
+         self.audio = Audio(window)
+         self.image = Image(window)
+         self.realtime = Realtime(window)
+         self.client: Optional[genai.Client] = None
+         self.locked = False
+         self.last_client_args: Optional[Dict[str, Any]] = None
+
+     def get_client(
+             self,
+             mode: str = MODE_CHAT,
+             model: ModelItem = None
+     ) -> genai.Client:
+         """
+         Get or create Google GenAI client
+
+         :param mode: Mode (chat, completion, image, etc.)
+         :param model: ModelItem
+         :return: genai.Client instance
+         """
+         if not model:
+             model = ModelItem()
+             model.provider = "google"
+         args = self.window.core.models.prepare_client_args(mode, model)
+         filtered = {}
+         if args.get("api_key"):
+             filtered["api_key"] = args["api_key"]
+         if self.client is None or self.last_client_args != filtered:
+             self.client = genai.Client(**filtered)
+             self.last_client_args = filtered
+         return self.client
+
+     def call(
+             self,
+             context: BridgeContext,
+             extra: dict = None,
+             rt_signals = None
+     ) -> bool:
+         """
+         Make an API call to Google GenAI
+
+         :param context: BridgeContext
+         :param extra: Extra parameters
+         :param rt_signals: Realtime signals for audio streaming
+         :return: True if successful, False otherwise
+         """
+         mode = context.mode
+         model = context.model
+         stream = context.stream
+         ctx = context.ctx
+         ai_name = ctx.output_name if ctx else "assistant"
+
+         # No Responses API in google-genai
+         if ctx:
+             ctx.use_responses_api = False
+
+         used_tokens = 0
+         response = None
+
+         if mode in [MODE_COMPLETION, MODE_CHAT, MODE_AUDIO, MODE_RESEARCH]:
+
+             # Live API for audio streaming
+             if mode == MODE_AUDIO and stream:
+                 is_realtime = self.realtime.begin(
+                     context=context,
+                     model=model,
+                     extra=extra or {},
+                     rt_signals=rt_signals
+                 )
+                 if is_realtime:
+                     return True
+
+             response = self.chat.send(context=context, extra=extra)
+             used_tokens = self.chat.get_used_tokens()
+             if ctx:
+                 self.vision.append_images(ctx)
+
+         elif mode == MODE_IMAGE:
+             return self.image.generate(context=context, extra=extra)
+
+         elif mode == MODE_ASSISTANT:
+             return False  # not implemented for Google
+
+         if stream:
+             if ctx:
+                 ctx.stream = response
+                 ctx.set_output("", ai_name)
+                 ctx.input_tokens = used_tokens
+             return True
+
+         if response is None:
+             return False
+
+         if isinstance(response, dict) and "error" in response:
+             return False
+
+         if ctx:
+             ctx.ai_name = ai_name
+             self.chat.unpack_response(mode, response, ctx)
+             try:
+                 import json
+                 for tc in getattr(ctx, "tool_calls", []) or []:
+                     fn = tc.get("function") or {}
+                     args = fn.get("arguments")
+                     if isinstance(args, str):
+                         try:
+                             fn["arguments"] = json.loads(args)
+                         except Exception:
+                             fn["arguments"] = {}
+             except Exception:
+                 pass
+         return True
+
+     def quick_call(
+             self,
+             context: BridgeContext,
+             extra: dict = None
+     ) -> str:
+         """
+         Make a quick API call to Google GenAI and return the output text
+
+         :param context: BridgeContext
+         :param extra: Extra parameters
+         :return: Output text
+         """
+         if context.request:
+             context.stream = False
+             context.mode = MODE_CHAT
+             self.locked = True
+             self.call(context, extra)
+             self.locked = False
+             return context.ctx.output
+
+         self.locked = True
+         try:
+             ctx = context.ctx
+             prompt = context.prompt
+             system_prompt = context.system_prompt
+             temperature = context.temperature
+             history = context.history
+             functions = context.external_functions
+             model = context.model or self.window.core.models.from_defaults()
+
+             client = self.get_client(MODE_CHAT, model)
+             tools = self.tools.prepare(model, functions)
+
+             """
+             # with remote tools
+             base_tools = self.tools.prepare(model, functions)
+             remote_tools = self.build_remote_tools(model)
+             tools = (base_tools or []) + (remote_tools or [])
+             """
+
+             inputs = self.chat.build_input(
+                 prompt=prompt,
+                 system_prompt=system_prompt,
+                 model=model,
+                 history=history,
+                 attachments=context.attachments,
+                 multimodal_ctx=context.multimodal_ctx,
+             )
+             cfg = genai.types.GenerateContentConfig(
+                 temperature=temperature if temperature is not None else self.window.core.config.get('temperature'),
+                 top_p=self.window.core.config.get('top_p'),
+                 max_output_tokens=context.max_tokens if context.max_tokens else None,
+                 system_instruction=system_prompt if system_prompt else None,
+                 tools=tools if tools else None,
+             )
+             resp = client.models.generate_content(
+                 model=model.id,
+                 contents=inputs,
+                 config=cfg,
+             )
+
+             if ctx:
+                 calls = self.chat.extract_tool_calls(resp)
+                 if calls:
+                     ctx.tool_calls = calls
+             return self.chat.extract_text(resp)
+         except Exception as e:
+             self.window.core.debug.log(e)
+             return ""
+         finally:
+             self.locked = False
+
+     def build_remote_tools(self, model: ModelItem = None) -> list:
+         """
+         Build Google GenAI remote tools based on config flags.
+         - remote_tools.google.web_search: enables grounding via Google Search (Gemini 2.x)
+           or GoogleSearchRetrieval (Gemini 1.5 fallback).
+         - remote_tools.google.code_interpreter: enables code execution tool.
+
+         Returns a list of gtypes.Tool objects (can be empty).
+
+         :param model: ModelItem
+         :return: list of gtypes.Tool
+         """
+         tools: list = []
+         cfg = self.window.core.config
+         model_id = (model.id if model and getattr(model, "id", None) else "").lower()
+
+         # Google Search tool
+         if cfg.get("remote_tools.google.web_search") and "image" not in model.id:
+             try:
+                 if not model_id.startswith("gemini-1.5") and not model_id.startswith("models/gemini-1.5"):
+                     # Gemini 2.x uses GoogleSearch
+                     tools.append(gtypes.Tool(google_search=gtypes.GoogleSearch()))
+                 else:
+                     # Gemini 1.5 fallback uses GoogleSearchRetrieval
+                     # Note: Supported only for 1.5 models.
+                     tools.append(gtypes.Tool(
+                         google_search_retrieval=gtypes.GoogleSearchRetrieval()
+                     ))
+             except Exception as e:
+                 # Do not break the request if tool construction fails
+                 self.window.core.debug.log(e)
+
+         # Code Execution tool
+         if cfg.get("remote_tools.google.code_interpreter") and "image" not in model.id:
+             try:
+                 tools.append(gtypes.Tool(code_execution=gtypes.ToolCodeExecution))
+             except Exception as e:
+                 self.window.core.debug.log(e)
+
+         # URL Context tool
+         if cfg.get("remote_tools.google.url_ctx") and "image" not in model.id:
+             try:
+                 # Supported on Gemini 2.x+ models (not on 1.5)
+                 if not model_id.startswith("gemini-1.5") and not model_id.startswith("models/gemini-1.5"):
+                     tools.append(gtypes.Tool(url_context=gtypes.UrlContext))
+             except Exception as e:
+                 self.window.core.debug.log(e)
+
+         return tools
+
+
+     def stop(self):
+         """On global event stop"""
+         pass
+
+     def close(self):
+         """Close Google client"""
+         if self.locked:
+             return
+         if self.client is not None:
+             try:
+                 pass
+                 # self.client.close()
+             except Exception as e:
+                 self.window.core.debug.log(e)
+                 print("Error closing Google client:", e)
@@ -0,0 +1,121 @@
+ #!/usr/bin/env python3
+ # -*- coding: utf-8 -*-
+ # ================================================== #
+ # This file is a part of PYGPT package #
+ # Website: https://pygpt.net #
+ # GitHub: https://github.com/szczyglis-dev/py-gpt #
+ # MIT License #
+ # Created By : Marcin Szczygliński #
+ # Updated Date: 2025.08.28 20:00:00 #
+ # ================================================== #
+
+ import base64
+ import io
+ import wave
+ from typing import Optional, Tuple
+
+ from google.genai.types import Part
+ from pygpt_net.core.bridge.context import MultimodalContext
+
+
+ class Audio:
+     def __init__(self, window=None):
+         """
+         Audio helpers for Google GenAI.
+         - Build audio input parts for requests
+         - Convert Google PCM output to WAV (base64) for UI compatibility
+
+         :param window: Window instance
+         """
+         self.window = window
+
+     # ---------- INPUT (user -> model) ----------
+
+     def build_part(
+             self,
+             multimodal_ctx: Optional[MultimodalContext]
+     ) -> Optional[Part]:
+         """
+         Build audio Part from multimodal context (inline bytes).
+
+         :param multimodal_ctx: MultimodalContext
+         :return: Part or None
+         """
+         if not multimodal_ctx or not multimodal_ctx.is_audio_input or not multimodal_ctx.audio_data:
+             return None
+         audio_format = (multimodal_ctx.audio_format or "wav").lower()
+         mime = f"audio/{audio_format}"
+         return Part.from_bytes(data=multimodal_ctx.audio_data, mime_type=mime)
+
+     # ---------- OUTPUT (model -> UI) ----------
+
+     def extract_first_audio_part(
+             self,
+             response
+     ) -> Tuple[Optional[bytes], Optional[str]]:
+         """
+         Extract first audio inline_data from a non-streaming response.
+
+         :param response: Google response object
+         :return: (audio_bytes, mime_type) or (None, None)
+         """
+         try:
+             candidates = getattr(response, "candidates", None) or []
+             for cand in candidates:
+                 content = getattr(cand, "content", None)
+                 parts = getattr(content, "parts", None) or []
+                 for p in parts:
+                     inline = getattr(p, "inline_data", None)
+                     if not inline:
+                         continue
+                     mime = (getattr(inline, "mime_type", "") or "").lower()
+                     if not mime.startswith("audio/"):
+                         continue
+                     data = getattr(inline, "data", None)
+                     audio_bytes = self._ensure_bytes(data)
+                     if audio_bytes:
+                         return audio_bytes, mime
+         except Exception:
+             pass
+         return None, None
+
+     def pcm16_to_wav_base64(
+             self,
+             pcm_bytes: bytes,
+             rate: int = 24000,
+             channels: int = 1,
+             sample_width: int = 2
+     ) -> str:
+         """
+         Wrap raw PCM16 mono @ 24kHz into WAV and return base64-encoded payload.
+
+         :param pcm_bytes: Raw PCM16 bytes
+         :param rate: Sample rate (Hz), default 24000 for Google TTS
+         :param channels: Channels, default 1
+         :param sample_width: Bytes per sample, default 2 for PCM16
+         :return: Base64-encoded WAV
+         """
+         buf = io.BytesIO()
+         with wave.open(buf, "wb") as wf:
+             wf.setnchannels(channels)
+             wf.setsampwidth(sample_width)
+             wf.setframerate(rate)
+             wf.writeframes(pcm_bytes)
+         return base64.b64encode(buf.getvalue()).decode("utf-8")
+
+     @staticmethod
+     def _ensure_bytes(data) -> Optional[bytes]:
+         """
+         Return raw bytes from inline_data.data (bytes or base64 string).
+
+         :param data: bytes or base64 string
+         :return: bytes or None
+         """
+         try:
+             if isinstance(data, (bytes, bytearray)):
+                 return bytes(data)
+             if isinstance(data, str):
+                 return base64.b64decode(data)
+         except Exception:
+             return None
+         return None
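Together, extract_first_audio_part() and pcm16_to_wav_base64() turn a non-streaming Gemini audio response into the base64 WAV payload the UI expects. A short composition sketch, assuming audio is the Audio helper above and response is a google-genai response object:

    # Sketch only: non-streaming Gemini audio -> base64 WAV for playback in the UI.
    pcm, mime = audio.extract_first_audio_part(response)
    if pcm and mime and mime.startswith("audio/"):
        wav_b64 = audio.pcm16_to_wav_base64(pcm)  # 24 kHz mono PCM16 wrapped into WAV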