PyPI - pygpt-net - Versions diffs - 2.7.7__py3-none-any.whl → 2.7.8__py3-none-any.whl - Mend

pygpt-net 2.7.7__py3-none-any.whl → 2.7.8__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (93) hide show

pygpt_net/CHANGELOG.txt +7 -0
pygpt_net/__init__.py +3 -3
pygpt_net/app.py +5 -1
pygpt_net/controller/assistant/batch.py +2 -2
pygpt_net/controller/assistant/files.py +7 -6
pygpt_net/controller/assistant/threads.py +0 -0
pygpt_net/controller/chat/command.py +0 -0
pygpt_net/controller/dialogs/confirm.py +35 -58
pygpt_net/controller/lang/mapping.py +9 -9
pygpt_net/controller/remote_store/{google/batch.py → batch.py} +209 -252
pygpt_net/controller/remote_store/remote_store.py +982 -13
pygpt_net/core/command/command.py +0 -0
pygpt_net/core/db/viewer.py +1 -1
pygpt_net/core/realtime/worker.py +3 -1
pygpt_net/{controller/remote_store/google → core/remote_store/anthropic}/__init__.py +0 -1
pygpt_net/core/remote_store/anthropic/files.py +211 -0
pygpt_net/core/remote_store/anthropic/store.py +208 -0
pygpt_net/core/remote_store/openai/store.py +5 -4
pygpt_net/core/remote_store/remote_store.py +5 -1
pygpt_net/{controller/remote_store/openai → core/remote_store/xai}/__init__.py +0 -1
pygpt_net/core/remote_store/xai/files.py +225 -0
pygpt_net/core/remote_store/xai/store.py +219 -0
pygpt_net/data/config/config.json +9 -6
pygpt_net/data/config/models.json +5 -4
pygpt_net/data/config/settings.json +54 -1
pygpt_net/data/icons/folder_eye.svg +1 -0
pygpt_net/data/icons/folder_eye_filled.svg +1 -0
pygpt_net/data/icons/folder_open.svg +1 -0
pygpt_net/data/icons/folder_open_filled.svg +1 -0
pygpt_net/data/locale/locale.de.ini +4 -3
pygpt_net/data/locale/locale.en.ini +14 -4
pygpt_net/data/locale/locale.es.ini +4 -3
pygpt_net/data/locale/locale.fr.ini +4 -3
pygpt_net/data/locale/locale.it.ini +4 -3
pygpt_net/data/locale/locale.pl.ini +5 -4
pygpt_net/data/locale/locale.uk.ini +4 -3
pygpt_net/data/locale/locale.zh.ini +4 -3
pygpt_net/icons.qrc +4 -0
pygpt_net/icons_rc.py +282 -138
pygpt_net/provider/api/anthropic/__init__.py +2 -0
pygpt_net/provider/api/anthropic/chat.py +84 -1
pygpt_net/provider/api/anthropic/store.py +307 -0
pygpt_net/provider/api/anthropic/stream.py +75 -0
pygpt_net/provider/api/anthropic/worker/__init__.py +0 -0
pygpt_net/provider/api/anthropic/worker/importer.py +278 -0
pygpt_net/provider/api/google/chat.py +59 -2
pygpt_net/provider/api/google/store.py +124 -3
pygpt_net/provider/api/google/stream.py +91 -24
pygpt_net/provider/api/google/worker/importer.py +16 -28
pygpt_net/provider/api/openai/assistants.py +2 -2
pygpt_net/provider/api/openai/store.py +4 -1
pygpt_net/provider/api/openai/worker/importer.py +19 -61
pygpt_net/provider/api/openai/worker/importer_assistants.py +230 -0
pygpt_net/provider/api/x_ai/__init__.py +30 -6
pygpt_net/provider/api/x_ai/audio.py +43 -11
pygpt_net/provider/api/x_ai/chat.py +92 -4
pygpt_net/provider/api/x_ai/realtime/__init__.py +12 -0
pygpt_net/provider/api/x_ai/realtime/client.py +1825 -0
pygpt_net/provider/api/x_ai/realtime/realtime.py +198 -0
pygpt_net/provider/api/x_ai/remote_tools.py +19 -1
pygpt_net/provider/api/x_ai/store.py +610 -0
pygpt_net/provider/api/x_ai/stream.py +30 -9
pygpt_net/provider/api/x_ai/worker/importer.py +308 -0
pygpt_net/provider/audio_input/xai_grok_voice.py +390 -0
pygpt_net/provider/audio_output/xai_tts.py +325 -0
pygpt_net/provider/core/config/patch.py +18 -3
pygpt_net/provider/core/config/patches/patch_before_2_6_42.py +2 -2
pygpt_net/provider/core/model/patch.py +13 -0
pygpt_net/tools/image_viewer/tool.py +334 -34
pygpt_net/tools/image_viewer/ui/dialogs.py +317 -21
pygpt_net/ui/dialog/assistant.py +1 -1
pygpt_net/ui/dialog/plugins.py +13 -5
pygpt_net/ui/dialog/remote_store.py +552 -0
pygpt_net/ui/dialogs.py +3 -5
pygpt_net/ui/layout/ctx/ctx_list.py +58 -7
pygpt_net/ui/menu/tools.py +6 -13
pygpt_net/ui/widget/dialog/{remote_store_google.py → remote_store.py} +10 -10
pygpt_net/ui/widget/element/button.py +4 -4
pygpt_net/ui/widget/image/display.py +2 -2
pygpt_net/ui/widget/lists/context.py +2 -2
{pygpt_net-2.7.7.dist-info → pygpt_net-2.7.8.dist-info}/METADATA +9 -2
{pygpt_net-2.7.7.dist-info → pygpt_net-2.7.8.dist-info}/RECORD +82 -70
pygpt_net/controller/remote_store/google/store.py +0 -615
pygpt_net/controller/remote_store/openai/batch.py +0 -524
pygpt_net/controller/remote_store/openai/store.py +0 -699
pygpt_net/ui/dialog/remote_store_google.py +0 -539
pygpt_net/ui/dialog/remote_store_openai.py +0 -539
pygpt_net/ui/widget/dialog/remote_store_openai.py +0 -56
pygpt_net/ui/widget/lists/remote_store_google.py +0 -248
pygpt_net/ui/widget/lists/remote_store_openai.py +0 -317
{pygpt_net-2.7.7.dist-info → pygpt_net-2.7.8.dist-info}/LICENSE +0 -0
{pygpt_net-2.7.7.dist-info → pygpt_net-2.7.8.dist-info}/WHEEL +0 -0
{pygpt_net-2.7.7.dist-info → pygpt_net-2.7.8.dist-info}/entry_points.txt +0 -0

pygpt_net/provider/audio_output/xai_tts.py ADDED Viewed

@@ -0,0 +1,325 @@
+#!/usr/bin/env python3
+# -*- coding: utf-8 -*-
+# ================================================== #
+# This file is a part of PYGPT package               #
+# Website: https://pygpt.net                         #
+# GitHub:  https://github.com/szczyglis-dev/py-gpt   #
+# MIT License                                        #
+# Created By  : Marcin Szczygliński                  #
+# Updated Date: 2026.01.06 20:00:00                  #
+# ================================================== #
+import asyncio
+import base64
+import json
+import os
+import queue
+import threading
+import wave
+from typing import Optional, Tuple
+from .base import BaseProvider
+class XAITextToSpeech(BaseProvider):
+    def __init__(self, *args, **kwargs):
+        """
+        xAI Grok Voice Agent text-to-speech provider (via WebSocket).
+        :param args: args
+        :param kwargs: kwargs
+        """
+        super(XAITextToSpeech, self).__init__(*args, **kwargs)
+        self.plugin = kwargs.get("plugin")
+        self.id = "xai_tts"
+        self.name = "xAI TTS"
+        self.supported_voices = ["Ara", "Rex", "Sal", "Eve", "Leo"]
+    def init_options(self):
+        """Initialize options"""
+        self.plugin.add_option(
+            "xai_tts_voice",
+            type="text",
+            value="Ara",
+            label="Voice",
+            tab="xai_tts",
+            description="Specify xAI Grok Voice name (Ara, Rex, Sal, Eve, Leo)",
+            urls={"Voices": "https://docs.x.ai/docs/guides/voice/agent"},
+        )
+        self.plugin.add_option(
+            "xai_tts_sample_rate",
+            type="text",
+            value="24000",
+            label="Sample rate (Hz)",
+            tab="xai_tts",
+            description="PCM sample rate for output audio, e.g., 16000 or 24000",
+        )
+        self.plugin.add_option(
+            "xai_tts_instructions",
+            type="textarea",
+            value="You are a neutral TTS voice. Speak clearly and read the text verbatim.",
+            label="System Prompt",
+            tab="xai_tts",
+            description="System prompt to guide TTS style",
+            tooltip="System prompt for voice output",
+            persist=True,
+        )
+        self.plugin.add_option(
+            "xai_tts_file_container",
+            type="text",
+            value="wav",
+            label="File container",
+            tab="xai_tts",
+            description="wav or raw",
+        )
+        self.plugin.add_option(
+            "xai_tts_region",
+            type="text",
+            value="",
+            label="Region (optional)",
+            tab="xai_tts",
+            description="Regional endpoint like us-east-1; leave empty for global",
+        )
+    def speech(self, text: str) -> str:
+        """
+        Speech text to audio
+        :param text: text to speech
+        :return: path to generated audio file
+        """
+        try:
+            _ = self.plugin.window.core.api.xai.get_client()
+        except Exception:
+            pass
+        api_key = self._get_api_key()
+        if not api_key:
+            raise RuntimeError("xAI API key is not set. Please configure it in settings.")
+        voice = (self.plugin.get_option_value("xai_tts_voice") or "Ara").strip() or "Ara"
+        sr_opt = str(self.plugin.get_option_value("xai_tts_sample_rate") or "24000").strip()
+        try:
+            sample_rate = max(8000, int(sr_opt))
+        except Exception:
+            sample_rate = 24000
+        instructions = self.plugin.get_option_value("xai_tts_instructions") or ""
+        container = (self.plugin.get_option_value("xai_tts_file_container") or "wav").strip().lower()
+        if container not in ("wav", "raw"):
+            container = "wav"
+        region = (self.plugin.get_option_value("xai_tts_region") or "").strip()
+        host = f"{region}.api.x.ai" if region else "api.x.ai"
+        ws_uri = f"wss://{host}/v1/realtime"
+        base_dir = self.plugin.window.core.config.path
+        default_name = getattr(self.plugin, "output_file", "output.wav")
+        out_path = os.path.join(base_dir, default_name)
+        out_path = self._ensure_extension(out_path, ".wav" if container == "wav" else ".raw")
+        result_queue: queue.Queue[Tuple[bool, Optional[str], Optional[bytes]]] = queue.Queue()
+        def _runner():
+            loop = asyncio.new_event_loop()
+            try:
+                asyncio.set_event_loop(loop)
+                ok, err, pcm = loop.run_until_complete(
+                    self._synthesize_async(
+                        ws_uri=ws_uri,
+                        api_key=api_key,
+                        input_text=text,
+                        voice=voice,
+                        sample_rate=sample_rate,
+                        instructions=instructions,
+                    )
+                )
+                result_queue.put((ok, err, pcm))
+            finally:
+                try:
+                    loop.close()
+                except Exception:
+                    pass
+        t = threading.Thread(target=_runner, daemon=True)
+        t.start()
+        t.join()
+        ok, err, pcm_bytes = result_queue.get() if not result_queue.empty() else (False, "Unknown error", None)
+        if not ok or not pcm_bytes:
+            raise RuntimeError(err or "xAI TTS failed.")
+        if container == "wav":
+            self._write_wav(out_path, sample_rate, pcm_bytes)
+        else:
+            with open(out_path, "wb") as f:
+                f.write(pcm_bytes)
+        return str(out_path)
+    async def _synthesize_async(
+        self,
+        ws_uri: str,
+        api_key: str,
+        input_text: str,
+        voice: str,
+        sample_rate: int,
+        instructions: str,
+    ) -> Tuple[bool, Optional[str], Optional[bytes]]:
+        """
+        Connects to xAI Voice Agent realtime WebSocket and requests audio for the given text.
+        Returns (ok, error_message, pcm_bytes).
+        """
+        try:
+            import websockets  # type: ignore
+            from websockets.asyncio.client import ClientConnection  # type: ignore
+        except Exception:
+            return False, (
+                "The 'websockets' package is required for xAI TTS. Please install it in your environment."
+            ), None
+        audio_buf = bytearray()
+        transcript_buf = []
+        try:
+            async with websockets.connect(
+                uri=ws_uri,
+                ssl=True,
+                open_timeout=30,
+                close_timeout=10,
+                additional_headers={"Authorization": f"Bearer {api_key}"},
+                max_size=None,
+            ) as ws:  # type: ClientConnection
+                session_config = {
+                    "type": "session.update",
+                    "session": {
+                        "instructions": instructions,
+                        "voice": voice,
+                        "turn_detection": {"type": None},
+                        "audio": {
+                            "input": {"format": {"type": "audio/pcm", "rate": sample_rate}},
+                            "output": {"format": {"type": "audio/pcm", "rate": sample_rate}},
+                        },
+                    },
+                }
+                await ws.send(json.dumps(session_config))
+                await ws.send(
+                    json.dumps(
+                        {
+                            "type": "conversation.item.create",
+                            "item": {
+                                "type": "message",
+                                "role": "user",
+                                "content": [{"type": "input_text", "text": input_text}],
+                            },
+                        }
+                    )
+                )
+                await ws.send(
+                    json.dumps(
+                        {
+                            "type": "response.create",
+                            "response": {
+                                "modalities": ["text", "audio"],
+                            },
+                        }
+                    )
+                )
+                end_time = asyncio.get_event_loop().time() + 90.0
+                got_any_audio = False
+                while True:
+                    remaining = end_time - asyncio.get_event_loop().time()
+                    if remaining <= 0:
+                        return False, "Timed out waiting for xAI audio output.", None
+                    try:
+                        msg = await asyncio.wait_for(ws.recv(), timeout=remaining)
+                    except asyncio.TimeoutError:
+                        return False, "Timed out waiting for xAI audio output.", None
+                    except Exception as e:
+                        return False, f"WebSocket error: {e}", None
+                    try:
+                        event = json.loads(msg)
+                    except Exception:
+                        continue
+                    etype = event.get("type", "")
+                    if etype == "response.output_audio.delta":
+                        # xAI sends base64 audio in the 'delta' field
+                        chunk_b64 = event.get("delta")
+                        if chunk_b64:
+                            try:
+                                audio_buf.extend(base64.b64decode(chunk_b64))
+                                got_any_audio = True
+                            except Exception:
+                                pass
+                    elif etype == "response.output_audio_transcript.delta":
+                        # Collect transcript (not used for file, helpful for debugging)
+                        delta_txt = event.get("delta")
+                        if delta_txt:
+                            transcript_buf.append(delta_txt)
+                    elif etype == "response.output_audio.done":
+                        # Wait for response.done to ensure turn completion
+                        continue
+                    elif etype == "response.done":
+                        break
+                    elif etype == "response.error":
+                        return False, event.get("message") or "xAI TTS error.", None
+                if not got_any_audio:
+                    # Provide a more helpful error if we at least got transcript
+                    if transcript_buf:
+                        return False, "Empty audio from xAI TTS, but transcript was returned.", None
+                    return False, "Empty audio from xAI TTS.", None
+                return True, None, bytes(audio_buf)
+        except Exception as e:
+            return False, f"WebSocket connection failed: {e}", None
+    def _write_wav(self, path: str, sample_rate: int, pcm_bytes: bytes):
+        """
+        Writes PCM16LE mono samples into a WAV container.
+        """
+        with wave.open(path, "wb") as wf:
+            wf.setnchannels(1)
+            wf.setsampwidth(2)
+            wf.setframerate(sample_rate)
+            wf.writeframes(pcm_bytes)
+    def _ensure_extension(self, path: str, desired_ext: str) -> str:
+        """
+        Replaces the file extension with desired_ext.
+        """
+        root, _ = os.path.splitext(path)
+        return root + desired_ext
+    def _get_api_key(self) -> Optional[str]:
+        """
+        Resolve xAI API key from the app's configuration or environment.
+        """
+        key = self.plugin.window.core.config.get("api_key_xai")
+        if key:
+            return key
+        return os.getenv("XAI_API_KEY")
+    def is_configured(self) -> bool:
+        """
+        Check if provider is configured
+        :return: True if configured, False otherwise
+        """
+        api_key = self._get_api_key()
+        return api_key is not None and api_key != ""
+    def get_config_message(self) -> str:
+        """
+        Return message to display when provider is not configured
+        :return: message
+        """
+        return "xAI API key is not set yet. Please configure it in settings."

pygpt_net/provider/core/config/patch.py CHANGED Viewed

@@ -6,7 +6,7 @@
 # GitHub:  https://github.com/szczyglis-dev/py-gpt   #
 # MIT License                                        #
 # Created By  : Marcin Szczygliński                  #
-# Updated Date: 2026.01.05 20:00:00                  #
+# Updated Date: 2026.01.06 06:00:00                  #
 # ================================================== #
 import copy
@@ -234,8 +234,8 @@ class Patch:
                     data["remote_tools.google.file_search.args"] = ""
                 if "remote_tools.google.maps" not in data:
                     data["remote_tools.google.maps"] = False
-                if "remote_store.openai.hide_threads" not in data:
-                    data["remote_store.openai.hide_threads"] = True
+                if "remote_store.hide_threads" not in data:
+                    data["remote_store.hide_threads"] = True
                 updated = True
             # < 2.7.7
@@ -259,6 +259,21 @@ class Patch:
                         data[key] = cfg_get_base(key)
                 updated = True
+            # < 2.7.8
+            if old < parse_version("2.7.8"):
+                print("Migrating config from < 2.7.8...")
+                to_add = [
+                    "remote_store.hide_threads",
+                    "remote_store.provider",
+                    "api_key_management_xai",
+                    "remote_tools.xai.collections",
+                    "remote_tools.xai.collections.args",
+                ]
+                for key in to_add:
+                    if key not in data:
+                        data[key] = cfg_get_base(key)
+                updated = True
         # update file
         migrated = False
         if updated:

pygpt_net/provider/core/config/patches/patch_before_2_6_42.py CHANGED Viewed

@@ -1404,8 +1404,8 @@ class Patch:
             # < 2.1.79
             if old < parse_version("2.1.79"):
                 print("Migrating config from < 2.1.79...")
-                if 'remote_store.openai.hide_threads' not in data:
-                    data["remote_store.openai.hide_threads"] = True
+                if 'remote_store.hide_threads' not in data:
+                    data["remote_store.hide_threads"] = True
                 updated = True
             # < 2.2.2

pygpt_net/provider/core/model/patch.py CHANGED Viewed

@@ -141,6 +141,19 @@ class Patch:
                             m.input.append("image")
                 updated = True
+            # <  2.7.8 <--- add missing image input
+            if old < parse_version("2.7.8"):
+                print("Migrating models from < 2.7.8...")
+                models_to_update = [
+                    "grok-4"
+                ]
+                for model in models_to_update:
+                    if model in data:
+                        m = data[model]
+                        if not m.is_image_input():
+                            m.input.append("image")
+                updated = True
         # update file
         if updated:
             # fix empty/broken data

pygpt-net 2.7.7__py3-none-any.whl → 2.7.8__py3-none-any.whl

pygpt-net 2.7.7__py3-none-any.whl → 2.7.8__py3-none-any.whl