pygpt-net 2.6.29__py3-none-any.whl → 2.6.31__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- pygpt_net/CHANGELOG.txt +15 -0
- pygpt_net/__init__.py +3 -3
- pygpt_net/app.py +4 -0
- pygpt_net/{container.py → app_core.py} +5 -6
- pygpt_net/controller/__init__.py +5 -2
- pygpt_net/controller/access/control.py +1 -9
- pygpt_net/controller/assistant/assistant.py +4 -4
- pygpt_net/controller/assistant/batch.py +7 -7
- pygpt_net/controller/assistant/files.py +4 -4
- pygpt_net/controller/assistant/threads.py +3 -3
- pygpt_net/controller/attachment/attachment.py +4 -7
- pygpt_net/controller/audio/audio.py +25 -1
- pygpt_net/controller/audio/ui.py +2 -2
- pygpt_net/controller/chat/audio.py +1 -8
- pygpt_net/controller/chat/common.py +30 -4
- pygpt_net/controller/chat/handler/stream_worker.py +1124 -0
- pygpt_net/controller/chat/output.py +8 -3
- pygpt_net/controller/chat/stream.py +4 -405
- pygpt_net/controller/chat/text.py +3 -2
- pygpt_net/controller/chat/vision.py +11 -19
- pygpt_net/controller/config/placeholder.py +1 -1
- pygpt_net/controller/ctx/ctx.py +1 -1
- pygpt_net/controller/ctx/summarizer.py +1 -1
- pygpt_net/controller/kernel/kernel.py +11 -3
- pygpt_net/controller/kernel/reply.py +5 -1
- pygpt_net/controller/mode/mode.py +21 -12
- pygpt_net/controller/plugins/settings.py +3 -2
- pygpt_net/controller/presets/editor.py +112 -99
- pygpt_net/controller/realtime/__init__.py +12 -0
- pygpt_net/controller/realtime/manager.py +53 -0
- pygpt_net/controller/realtime/realtime.py +268 -0
- pygpt_net/controller/theme/theme.py +3 -2
- pygpt_net/controller/ui/mode.py +7 -0
- pygpt_net/controller/ui/ui.py +19 -1
- pygpt_net/controller/ui/vision.py +4 -4
- pygpt_net/core/agents/legacy.py +2 -2
- pygpt_net/core/agents/runners/openai_workflow.py +2 -2
- pygpt_net/core/assistants/files.py +5 -5
- pygpt_net/core/assistants/store.py +4 -4
- pygpt_net/core/audio/audio.py +6 -1
- pygpt_net/core/audio/backend/native/__init__.py +12 -0
- pygpt_net/core/audio/backend/{native.py → native/native.py} +426 -127
- pygpt_net/core/audio/backend/native/player.py +139 -0
- pygpt_net/core/audio/backend/native/realtime.py +250 -0
- pygpt_net/core/audio/backend/pyaudio/__init__.py +12 -0
- pygpt_net/core/audio/backend/pyaudio/playback.py +194 -0
- pygpt_net/core/audio/backend/pyaudio/pyaudio.py +923 -0
- pygpt_net/core/audio/backend/pyaudio/realtime.py +275 -0
- pygpt_net/core/audio/backend/pygame/__init__.py +12 -0
- pygpt_net/core/audio/backend/{pygame.py → pygame/pygame.py} +130 -19
- pygpt_net/core/audio/backend/shared/__init__.py +38 -0
- pygpt_net/core/audio/backend/shared/conversions.py +211 -0
- pygpt_net/core/audio/backend/shared/envelope.py +38 -0
- pygpt_net/core/audio/backend/shared/player.py +137 -0
- pygpt_net/core/audio/backend/shared/rt.py +52 -0
- pygpt_net/core/audio/capture.py +5 -0
- pygpt_net/core/audio/output.py +13 -2
- pygpt_net/core/audio/whisper.py +6 -2
- pygpt_net/core/bridge/bridge.py +4 -3
- pygpt_net/core/bridge/worker.py +31 -9
- pygpt_net/core/debug/console/console.py +2 -2
- pygpt_net/core/debug/presets.py +2 -2
- pygpt_net/core/dispatcher/dispatcher.py +37 -1
- pygpt_net/core/events/__init__.py +2 -1
- pygpt_net/core/events/realtime.py +55 -0
- pygpt_net/core/experts/experts.py +2 -2
- pygpt_net/core/image/image.py +51 -1
- pygpt_net/core/modes/modes.py +2 -2
- pygpt_net/core/presets/presets.py +3 -3
- pygpt_net/core/realtime/options.py +87 -0
- pygpt_net/core/realtime/shared/__init__.py +0 -0
- pygpt_net/core/realtime/shared/audio.py +213 -0
- pygpt_net/core/realtime/shared/loop.py +64 -0
- pygpt_net/core/realtime/shared/session.py +59 -0
- pygpt_net/core/realtime/shared/text.py +37 -0
- pygpt_net/core/realtime/shared/tools.py +276 -0
- pygpt_net/core/realtime/shared/turn.py +38 -0
- pygpt_net/core/realtime/shared/types.py +16 -0
- pygpt_net/core/realtime/worker.py +164 -0
- pygpt_net/core/tokens/tokens.py +4 -4
- pygpt_net/core/types/__init__.py +1 -0
- pygpt_net/core/types/image.py +48 -0
- pygpt_net/core/types/mode.py +5 -2
- pygpt_net/core/vision/analyzer.py +1 -1
- pygpt_net/data/config/config.json +13 -4
- pygpt_net/data/config/models.json +219 -101
- pygpt_net/data/config/modes.json +3 -9
- pygpt_net/data/config/settings.json +135 -27
- pygpt_net/data/config/settings_section.json +2 -2
- pygpt_net/data/locale/locale.de.ini +7 -7
- pygpt_net/data/locale/locale.en.ini +25 -12
- pygpt_net/data/locale/locale.es.ini +7 -7
- pygpt_net/data/locale/locale.fr.ini +7 -7
- pygpt_net/data/locale/locale.it.ini +7 -7
- pygpt_net/data/locale/locale.pl.ini +8 -8
- pygpt_net/data/locale/locale.uk.ini +7 -7
- pygpt_net/data/locale/locale.zh.ini +3 -3
- pygpt_net/data/locale/plugin.audio_input.en.ini +4 -0
- pygpt_net/data/locale/plugin.audio_output.en.ini +4 -0
- pygpt_net/item/model.py +23 -3
- pygpt_net/plugin/audio_input/plugin.py +37 -4
- pygpt_net/plugin/audio_input/simple.py +57 -8
- pygpt_net/plugin/cmd_files/worker.py +3 -0
- pygpt_net/plugin/openai_dalle/plugin.py +4 -4
- pygpt_net/plugin/openai_vision/plugin.py +12 -13
- pygpt_net/provider/agents/openai/agent.py +5 -5
- pygpt_net/provider/agents/openai/agent_b2b.py +5 -5
- pygpt_net/provider/agents/openai/agent_planner.py +5 -6
- pygpt_net/provider/agents/openai/agent_with_experts.py +5 -5
- pygpt_net/provider/agents/openai/agent_with_experts_feedback.py +4 -4
- pygpt_net/provider/agents/openai/agent_with_feedback.py +4 -4
- pygpt_net/provider/agents/openai/bot_researcher.py +2 -2
- pygpt_net/provider/agents/openai/bots/research_bot/agents/planner_agent.py +1 -1
- pygpt_net/provider/agents/openai/bots/research_bot/agents/search_agent.py +1 -1
- pygpt_net/provider/agents/openai/bots/research_bot/agents/writer_agent.py +1 -1
- pygpt_net/provider/agents/openai/evolve.py +5 -5
- pygpt_net/provider/agents/openai/supervisor.py +4 -4
- pygpt_net/provider/api/__init__.py +27 -0
- pygpt_net/provider/api/anthropic/__init__.py +68 -0
- pygpt_net/provider/api/google/__init__.py +295 -0
- pygpt_net/provider/api/google/audio.py +121 -0
- pygpt_net/provider/api/google/chat.py +591 -0
- pygpt_net/provider/api/google/image.py +427 -0
- pygpt_net/provider/api/google/realtime/__init__.py +12 -0
- pygpt_net/provider/api/google/realtime/client.py +1945 -0
- pygpt_net/provider/api/google/realtime/realtime.py +186 -0
- pygpt_net/provider/api/google/tools.py +222 -0
- pygpt_net/provider/api/google/vision.py +129 -0
- pygpt_net/provider/{gpt → api/openai}/__init__.py +24 -4
- pygpt_net/provider/api/openai/agents/__init__.py +0 -0
- pygpt_net/provider/{gpt → api/openai}/agents/computer.py +1 -1
- pygpt_net/provider/{gpt → api/openai}/agents/experts.py +1 -1
- pygpt_net/provider/{gpt → api/openai}/agents/response.py +1 -1
- pygpt_net/provider/{gpt → api/openai}/assistants.py +1 -1
- pygpt_net/provider/{gpt → api/openai}/chat.py +15 -8
- pygpt_net/provider/{gpt → api/openai}/completion.py +1 -1
- pygpt_net/provider/{gpt → api/openai}/image.py +1 -1
- pygpt_net/provider/api/openai/realtime/__init__.py +12 -0
- pygpt_net/provider/api/openai/realtime/client.py +1828 -0
- pygpt_net/provider/api/openai/realtime/realtime.py +194 -0
- pygpt_net/provider/{gpt → api/openai}/remote_tools.py +1 -1
- pygpt_net/provider/{gpt → api/openai}/responses.py +34 -20
- pygpt_net/provider/{gpt → api/openai}/store.py +2 -2
- pygpt_net/provider/{gpt → api/openai}/vision.py +1 -1
- pygpt_net/provider/api/openai/worker/__init__.py +0 -0
- pygpt_net/provider/{gpt → api/openai}/worker/assistants.py +4 -4
- pygpt_net/provider/{gpt → api/openai}/worker/importer.py +10 -10
- pygpt_net/provider/audio_input/google_genai.py +103 -0
- pygpt_net/provider/audio_input/openai_whisper.py +1 -1
- pygpt_net/provider/audio_output/google_genai_tts.py +229 -0
- pygpt_net/provider/audio_output/openai_tts.py +9 -6
- pygpt_net/provider/core/config/patch.py +26 -0
- pygpt_net/provider/core/model/patch.py +20 -0
- pygpt_net/provider/core/preset/json_file.py +2 -4
- pygpt_net/provider/llms/anthropic.py +2 -5
- pygpt_net/provider/llms/base.py +4 -3
- pygpt_net/provider/llms/google.py +8 -9
- pygpt_net/provider/llms/openai.py +1 -1
- pygpt_net/provider/loaders/hub/image_vision/base.py +1 -1
- pygpt_net/ui/dialog/preset.py +71 -55
- pygpt_net/ui/layout/toolbox/footer.py +16 -0
- pygpt_net/ui/layout/toolbox/image.py +5 -0
- pygpt_net/ui/main.py +6 -4
- pygpt_net/ui/widget/option/combo.py +15 -1
- pygpt_net/utils.py +9 -0
- {pygpt_net-2.6.29.dist-info → pygpt_net-2.6.31.dist-info}/METADATA +55 -55
- {pygpt_net-2.6.29.dist-info → pygpt_net-2.6.31.dist-info}/RECORD +181 -135
- pygpt_net/core/audio/backend/pyaudio.py +0 -554
- /pygpt_net/{provider/gpt/agents → controller/chat/handler}/__init__.py +0 -0
- /pygpt_net/{provider/gpt/worker → core/realtime}/__init__.py +0 -0
- /pygpt_net/provider/{gpt → api/openai}/agents/client.py +0 -0
- /pygpt_net/provider/{gpt → api/openai}/agents/remote_tools.py +0 -0
- /pygpt_net/provider/{gpt → api/openai}/agents/utils.py +0 -0
- /pygpt_net/provider/{gpt → api/openai}/audio.py +0 -0
- /pygpt_net/provider/{gpt → api/openai}/computer.py +0 -0
- /pygpt_net/provider/{gpt → api/openai}/container.py +0 -0
- /pygpt_net/provider/{gpt → api/openai}/summarizer.py +0 -0
- /pygpt_net/provider/{gpt → api/openai}/tools.py +0 -0
- /pygpt_net/provider/{gpt → api/openai}/utils.py +0 -0
- {pygpt_net-2.6.29.dist-info → pygpt_net-2.6.31.dist-info}/LICENSE +0 -0
- {pygpt_net-2.6.29.dist-info → pygpt_net-2.6.31.dist-info}/WHEEL +0 -0
- {pygpt_net-2.6.29.dist-info → pygpt_net-2.6.31.dist-info}/entry_points.txt +0 -0
|
@@ -0,0 +1,229 @@
|
|
|
1
|
+
#!/usr/bin/env python3
# -*- coding: utf-8 -*-
# ================================================== #
# This file is a part of PYGPT package               #
# Website: https://pygpt.net                         #
# GitHub: https://github.com/szczyglis-dev/py-gpt    #
# MIT License                                        #
# Created By  : Marcin Szczygliński                  #
# Updated Date: 2025.08.29 18:00:00                  #
# ================================================== #

import os
import wave
import base64

from .base import BaseProvider


class GoogleGenAITextToSpeech(BaseProvider):
    def __init__(self, *args, **kwargs):
        """
        Google GenAI Text-to-Speech provider (Gemini TTS via API).

        :param args: args
        :param kwargs: kwargs
        """
        super(GoogleGenAITextToSpeech, self).__init__(*args, **kwargs)
        self.plugin = kwargs.get("plugin")
        self.id = "google_genai_tts"
        self.name = "Google GenAI TTS"

        # Supported preview TTS models (fallback to flash if invalid)
        self.allowed_models = [
            "gemini-2.5-flash-preview-tts",
            "gemini-2.5-pro-preview-tts",
        ]

        # Prebuilt voice names exposed by Gemini TTS.
        # Keep list in sync with official docs; default voice is "Kore".
        self.allowed_voices = [
            "Zephyr", "Puck", "Charon", "Kore", "Fenrir", "Leda", "Orus",
            "Aoede", "Callirrhoe", "Autonoe", "Enceladus", "Iapetus",
            "Umbriel", "Algieba", "Despina", "Erinome", "Algenib",
            "Rasalgethi", "Laomedeia", "Achernar", "Alnilam", "Schedar",
            "Gacrux", "Pulcherrima", "Achird", "Zubenelgenubi",
            "Vindemiatrix", "Sadachbia", "Sadaltager", "Sulafat",
        ]

    def init_options(self):
        """Initialize plugin options (model + voice text fields)."""
        # Keep option names consistent with the app style; simple text fields are enough.
        self.plugin.add_option(
            "google_genai_tts_model",
            type="text",
            value="gemini-2.5-flash-preview-tts",
            label="Model",
            tab="google_genai_tts",
            description="Specify Gemini TTS model, e.g.: gemini-2.5-flash-preview-tts or gemini-2.5-pro-preview-tts",
        )
        self.plugin.add_option(
            "google_genai_tts_voice",
            type="text",
            value="Kore",
            label="Voice",
            tab="google_genai_tts",
            description="Specify voice, e.g.: Puck, Kore, Charon, Leda, Zephyr... (case-sensitive)",
            urls={
                "Voices": "https://ai.google.dev/gemini-api/docs/speech-generation"
            },
        )

    def speech(self, text: str) -> str:
        """
        Text to speech synthesis using Google GenAI (Gemini TTS).

        :param text: text to synthesize
        :return: path to generated audio file
        :raises RuntimeError: if the SDK is missing or no audio data is returned
        """
        # Get pre-configured GenAI client
        client = self.plugin.window.core.api.google.get_client()

        # Resolve path where audio should be written
        output_file = self.plugin.output_file
        path = os.path.join(self.plugin.window.core.config.path, output_file)

        # Validate/select model (strip optional "models/" prefix first)
        model = self.plugin.get_option_value("google_genai_tts_model") or "gemini-2.5-flash-preview-tts"
        model = self._normalize_model_name(model)
        if model not in self.allowed_models:
            model = "gemini-2.5-flash-preview-tts"

        # Validate/select voice
        # NOTE: voice validation intentionally disabled; the API rejects
        # unknown voices itself, and the allowed list may lag behind docs.
        voice = self.plugin.get_option_value("google_genai_tts_voice") or "Kore"
        # if voice not in self.allowed_voices:
        #     voice = "Kore"

        # Build generation config for audio modality + voice
        # Using explicit types for clarity and forward-compatibility
        try:
            from google.genai import types
        except Exception as ex:
            # Fail fast if SDK is missing or incompatible
            raise RuntimeError("google.genai SDK is not available. Please install/update Google GenAI SDK.") from ex

        gen_config = types.GenerateContentConfig(
            response_modalities=["AUDIO"],
            speech_config=types.SpeechConfig(
                voice_config=types.VoiceConfig(
                    prebuilt_voice_config=types.PrebuiltVoiceConfig(
                        voice_name=voice
                    )
                )
            ),
            temperature=0.8,  # balanced default; keep configurable later if needed
        )

        # Perform TTS request
        response = client.models.generate_content(
            model=model,
            contents=text,
            config=gen_config,
        )

        # Extract PCM bytes from the first candidate
        pcm = self._extract_pcm_bytes(response)

        # Persist as standard WAV (PCM 16-bit, mono, 24 kHz — Gemini TTS output format)
        self._save_wav(path, pcm, channels=1, rate=24000, sample_width=2)

        return str(path)

    def _extract_pcm_bytes(self, response) -> bytes:
        """
        Extract PCM bytes from a generate_content response.

        :param response: Google GenAI response object
        :return: raw PCM byte data
        :raises RuntimeError: if no audio payload is present or its type is unsupported
        """
        # Defensive extraction to support minor SDK variations:
        # scan all parts of the first candidate for inline audio data.
        data = None
        try:
            parts = response.candidates[0].content.parts
            for part in parts:
                inline = getattr(part, "inline_data", None)
                if inline is not None and getattr(inline, "data", None):
                    data = inline.data
                    break
        except Exception:
            pass

        if data is None:
            raise RuntimeError("No audio data returned by Gemini TTS response.")

        # Normalize to raw bytes
        if isinstance(data, (bytes, bytearray)):
            return bytes(data)
        if isinstance(data, str):
            # Some SDK builds return base64-encoded PCM as str
            return base64.b64decode(data)

        # Last resort: try bytes() cast
        try:
            return bytes(data)
        except Exception as ex:
            raise RuntimeError("Unsupported audio payload type returned by Gemini TTS.") from ex

    def _save_wav(
            self,
            filename: str,
            pcm_bytes: bytes,
            channels: int = 1,
            rate: int = 24000,
            sample_width: int = 2
    ):
        """
        Save raw PCM bytes to a WAV file.

        :param filename: output WAV file path
        :param pcm_bytes: raw PCM byte data
        :param channels: number of audio channels (1=mono, 2=stereo)
        :param rate: sample rate in Hz (e.g., 24000)
        :param sample_width: sample width in bytes (e.g., 2 for 16-bit)
        """
        # Ensure parent directory exists; dirname() is "" for a bare
        # filename and os.makedirs("") would raise, so guard it.
        parent = os.path.dirname(filename)
        if parent:
            os.makedirs(parent, exist_ok=True)

        # Write PCM payload as WAV
        with wave.open(filename, "wb") as wf:
            wf.setnchannels(channels)
            wf.setsampwidth(sample_width)  # bytes per sample (2 -> 16-bit)
            wf.setframerate(rate)
            wf.writeframes(pcm_bytes)

    def _normalize_model_name(self, model: str) -> str:
        """
        Normalize model id (strip optional 'models/' prefix).

        :param model: model id
        :return: normalized model id
        """
        try:
            return model.split("/")[-1]
        except Exception:
            return model

    def is_configured(self) -> bool:
        """
        Check if provider is configured (Google API key present).

        :return: True if configured, False otherwise
        """
        api_key = self.plugin.window.core.config.get("api_key_google")
        return api_key is not None and api_key != ""

    def get_config_message(self) -> str:
        """
        Return message to display when provider is not configured.

        :return: message
        """
        return "Google GenAI API key is not set yet. Please configure it in settings."
|
|
@@ -6,7 +6,7 @@
|
|
|
6
6
|
# GitHub: https://github.com/szczyglis-dev/py-gpt #
|
|
7
7
|
# MIT License #
|
|
8
8
|
# Created By : Marcin Szczygliński #
|
|
9
|
-
# Updated Date: 2025.08.
|
|
9
|
+
# Updated Date: 2025.08.29 18:00:00 #
|
|
10
10
|
# ================================================== #
|
|
11
11
|
|
|
12
12
|
import os
|
|
@@ -51,6 +51,9 @@ class OpenAITextToSpeech(BaseProvider):
|
|
|
51
51
|
use="audio_tts_whisper_voices",
|
|
52
52
|
description="Specify voice, available voices: "
|
|
53
53
|
"alloy, echo, fable, onyx, nova, shimmer",
|
|
54
|
+
urls={
|
|
55
|
+
"Voices": "https://platform.openai.com/docs/guides/text-to-speech/voice-options"
|
|
56
|
+
},
|
|
54
57
|
)
|
|
55
58
|
|
|
56
59
|
def speech(self, text: str) -> str:
|
|
@@ -60,15 +63,15 @@ class OpenAITextToSpeech(BaseProvider):
|
|
|
60
63
|
:param text: text to speech
|
|
61
64
|
:return: path to generated audio file or None if audio playback is handled here
|
|
62
65
|
"""
|
|
63
|
-
client = self.plugin.window.core.
|
|
66
|
+
client = self.plugin.window.core.api.openai.get_client()
|
|
64
67
|
output_file = self.plugin.output_file
|
|
65
68
|
voice = self.plugin.get_option_value('openai_voice')
|
|
66
69
|
model = self.plugin.get_option_value('openai_model')
|
|
67
70
|
allowed_voices = self.plugin.window.core.audio.whisper.get_voices()
|
|
68
|
-
if model not in self.allowed_models:
|
|
69
|
-
model = 'tts-1'
|
|
70
|
-
if voice not in allowed_voices:
|
|
71
|
-
voice = 'alloy'
|
|
71
|
+
# if model not in self.allowed_models:
|
|
72
|
+
# model = 'tts-1'
|
|
73
|
+
# if voice not in allowed_voices:
|
|
74
|
+
# voice = 'alloy'
|
|
72
75
|
path = os.path.join(
|
|
73
76
|
self.plugin.window.core.config.path,
|
|
74
77
|
output_file,
|
|
@@ -2355,6 +2355,32 @@ class Patch:
|
|
|
2355
2355
|
self.window.core.updater.patch_css('web-chatgpt_wide.light.css', True)
|
|
2356
2356
|
updated = True
|
|
2357
2357
|
|
|
2358
|
+
# < 2.6.30
|
|
2359
|
+
if old < parse_version("2.6.30"):
|
|
2360
|
+
print("Migrating config from < 2.6.30...")
|
|
2361
|
+
if "api_native_google" not in data:
|
|
2362
|
+
data["api_native_google"] = True
|
|
2363
|
+
if "remote_tools.google.web_search" not in data:
|
|
2364
|
+
data["remote_tools.google.web_search"] = True
|
|
2365
|
+
if "remote_tools.google.code_interpreter" not in data:
|
|
2366
|
+
data["remote_tools.google.code_interpreter"] = False
|
|
2367
|
+
updated = True
|
|
2368
|
+
|
|
2369
|
+
# < 2.6.31
|
|
2370
|
+
if old < parse_version("2.6.31"):
|
|
2371
|
+
print("Migrating config from < 2.6.31...")
|
|
2372
|
+
if "log.realtime" not in data:
|
|
2373
|
+
data["log.realtime"] = False
|
|
2374
|
+
if "remote_tools.google.url_ctx" not in data:
|
|
2375
|
+
data["remote_tools.google.url_ctx"] = False
|
|
2376
|
+
if "audio.input.auto_turn" not in data:
|
|
2377
|
+
data["audio.input.auto_turn"] = False
|
|
2378
|
+
if "audio.input.vad.prefix" not in data:
|
|
2379
|
+
data["audio.input.vad.prefix"] = 300
|
|
2380
|
+
if "audio.input.vad.silence" not in data:
|
|
2381
|
+
data["audio.input.vad.silence"] = 2000
|
|
2382
|
+
updated = True
|
|
2383
|
+
|
|
2358
2384
|
# update file
|
|
2359
2385
|
migrated = False
|
|
2360
2386
|
if updated:
|
|
@@ -763,6 +763,26 @@ class Patch:
|
|
|
763
763
|
model.mode.append(MODE_AGENT_OPENAI)
|
|
764
764
|
updated = True
|
|
765
765
|
|
|
766
|
+
# < 2.6.30 <--- add Google Imagen models
|
|
767
|
+
if old < parse_version("2.6.30"):
|
|
768
|
+
print("Migrating models from < 2.6.30...")
|
|
769
|
+
if "imagen-3.0-generate-002" not in data:
|
|
770
|
+
data["imagen-3.0-generate-002"] = base_data["imagen-3.0-generate-002"]
|
|
771
|
+
if "imagen-4.0-generate-001" not in data:
|
|
772
|
+
data["imagen-4.0-generate-001"] = base_data["imagen-4.0-generate-001"]
|
|
773
|
+
updated = True
|
|
774
|
+
|
|
775
|
+
# < 2.6.31 <--- add realtime models
|
|
776
|
+
if old < parse_version("2.6.31"):
|
|
777
|
+
print("Migrating models from < 2.6.31...")
|
|
778
|
+
if "gemini-2.5-flash-preview-native-audio-dialog" not in data:
|
|
779
|
+
data["gemini-2.5-flash-preview-native-audio-dialog"] = base_data["gemini-2.5-flash-preview-native-audio-dialog"]
|
|
780
|
+
if "gpt-realtime" not in data:
|
|
781
|
+
data["gpt-realtime"] = base_data["gpt-realtime"]
|
|
782
|
+
if "gpt-4o-realtime-preview" not in data:
|
|
783
|
+
data["gpt-4o-realtime-preview"] = base_data["gpt-4o-realtime-preview"]
|
|
784
|
+
updated = True
|
|
785
|
+
|
|
766
786
|
# update file
|
|
767
787
|
if updated:
|
|
768
788
|
data = dict(sorted(data.items()))
|
|
@@ -6,7 +6,7 @@
|
|
|
6
6
|
# GitHub: https://github.com/szczyglis-dev/py-gpt #
|
|
7
7
|
# MIT License #
|
|
8
8
|
# Created By : Marcin Szczygliński #
|
|
9
|
-
# Updated Date: 2025.08.
|
|
9
|
+
# Updated Date: 2025.08.28 09:00:00 #
|
|
10
10
|
# ================================================== #
|
|
11
11
|
|
|
12
12
|
import json
|
|
@@ -192,7 +192,7 @@ class JsonFileProvider(BaseProvider):
|
|
|
192
192
|
MODE_CHAT: item.chat,
|
|
193
193
|
MODE_COMPLETION: item.completion,
|
|
194
194
|
MODE_IMAGE: item.img,
|
|
195
|
-
MODE_VISION: item.vision,
|
|
195
|
+
# MODE_VISION: item.vision,
|
|
196
196
|
# MODE_LANGCHAIN: item.langchain,
|
|
197
197
|
MODE_ASSISTANT: item.assistant,
|
|
198
198
|
MODE_LLAMA_INDEX: item.llama_index,
|
|
@@ -250,8 +250,6 @@ class JsonFileProvider(BaseProvider):
|
|
|
250
250
|
item.llama_index = data[MODE_LLAMA_INDEX]
|
|
251
251
|
if MODE_RESEARCH in data:
|
|
252
252
|
item.research = data[MODE_RESEARCH]
|
|
253
|
-
if MODE_VISION in data:
|
|
254
|
-
item.vision = data[MODE_VISION]
|
|
255
253
|
|
|
256
254
|
if 'agent_provider' in data:
|
|
257
255
|
item.agent_provider = data['agent_provider']
|
|
@@ -6,7 +6,7 @@
|
|
|
6
6
|
# GitHub: https://github.com/szczyglis-dev/py-gpt #
|
|
7
7
|
# MIT License #
|
|
8
8
|
# Created By : Marcin Szczygliński #
|
|
9
|
-
# Updated Date: 2025.08.
|
|
9
|
+
# Updated Date: 2025.08.28 09:00:00 #
|
|
10
10
|
# ================================================== #
|
|
11
11
|
|
|
12
12
|
from typing import List, Dict, Optional
|
|
@@ -93,10 +93,7 @@ class AnthropicLLM(BaseLLM):
|
|
|
93
93
|
:param window: window instance
|
|
94
94
|
:return: list of models
|
|
95
95
|
"""
|
|
96
|
-
|
|
97
|
-
client = anthropic.Anthropic(
|
|
98
|
-
api_key=window.core.config.get('api_key_anthropic', "")
|
|
99
|
-
)
|
|
96
|
+
client = window.core.api.anthropic.get_client()
|
|
100
97
|
models_list = client.models.list()
|
|
101
98
|
items = []
|
|
102
99
|
if models_list.data:
|
pygpt_net/provider/llms/base.py
CHANGED
|
@@ -6,7 +6,7 @@
|
|
|
6
6
|
# GitHub: https://github.com/szczyglis-dev/py-gpt #
|
|
7
7
|
# MIT License #
|
|
8
8
|
# Created By : Marcin Szczygliński #
|
|
9
|
-
# Updated Date: 2025.08.
|
|
9
|
+
# Updated Date: 2025.08.28 09:00:00 #
|
|
10
10
|
# ================================================== #
|
|
11
11
|
|
|
12
12
|
import os
|
|
@@ -18,7 +18,8 @@ from llama_index.core.multi_modal_llms import MultiModalLLM as LlamaMultiModalLL
|
|
|
18
18
|
|
|
19
19
|
from pygpt_net.core.types import (
|
|
20
20
|
MODE_LANGCHAIN,
|
|
21
|
-
MODE_LLAMA_INDEX,
|
|
21
|
+
MODE_LLAMA_INDEX,
|
|
22
|
+
MODE_CHAT,
|
|
22
23
|
)
|
|
23
24
|
from pygpt_net.item.model import ModelItem
|
|
24
25
|
from pygpt_net.utils import parse_args
|
|
@@ -221,7 +222,7 @@ class BaseLLM:
|
|
|
221
222
|
"""
|
|
222
223
|
model = ModelItem()
|
|
223
224
|
model.provider = self.id
|
|
224
|
-
return window.core.
|
|
225
|
+
return window.core.api.openai.get_client(
|
|
225
226
|
mode=MODE_CHAT,
|
|
226
227
|
model=model,
|
|
227
228
|
)
|
|
@@ -6,7 +6,7 @@
|
|
|
6
6
|
# GitHub: https://github.com/szczyglis-dev/py-gpt #
|
|
7
7
|
# MIT License #
|
|
8
8
|
# Created By : Marcin Szczygliński #
|
|
9
|
-
# Updated Date: 2025.08.
|
|
9
|
+
# Updated Date: 2025.08.30 06:00:00 #
|
|
10
10
|
# ================================================== #
|
|
11
11
|
|
|
12
12
|
from typing import Optional, List, Dict
|
|
@@ -92,13 +92,12 @@ class GoogleLLM(BaseLLM):
|
|
|
92
92
|
:return: list of models
|
|
93
93
|
"""
|
|
94
94
|
items = []
|
|
95
|
-
client =
|
|
95
|
+
client = window.core.api.google.get_client()
|
|
96
96
|
models_list = client.models.list()
|
|
97
|
-
|
|
98
|
-
|
|
99
|
-
|
|
100
|
-
|
|
101
|
-
|
|
102
|
-
|
|
103
|
-
})
|
|
97
|
+
for item in models_list:
|
|
98
|
+
id = item.name.replace("models/", "")
|
|
99
|
+
items.append({
|
|
100
|
+
"id": id,
|
|
101
|
+
"name": id, # TODO: token limit get from API
|
|
102
|
+
})
|
|
104
103
|
return items
|
|
@@ -99,7 +99,7 @@ class OpenAILLM(BaseLLM):
|
|
|
99
99
|
|
|
100
100
|
if window.core.config.get('api_use_responses_llama', False):
|
|
101
101
|
tools = []
|
|
102
|
-
tools = window.core.
|
|
102
|
+
tools = window.core.api.openai.remote_tools.append_to_tools(
|
|
103
103
|
mode=MODE_LLAMA_INDEX,
|
|
104
104
|
model=model,
|
|
105
105
|
stream=stream,
|
|
@@ -145,7 +145,7 @@ class ImageVisionLLMReader(BaseReader):
|
|
|
145
145
|
image = image.convert("RGB")
|
|
146
146
|
image_str = img_2_b64(image)
|
|
147
147
|
|
|
148
|
-
client = self._window.core.
|
|
148
|
+
client = self._window.core.api.openai.get_client()
|
|
149
149
|
encoded = self._encode_image(str(file))
|
|
150
150
|
content = [
|
|
151
151
|
{
|