pygpt-net 2.5.14__py3-none-any.whl → 2.5.16__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (43)
  1. pygpt_net/CHANGELOG.txt +12 -0
  2. pygpt_net/__init__.py +3 -3
  3. pygpt_net/controller/chat/input.py +9 -2
  4. pygpt_net/controller/chat/stream.py +65 -17
  5. pygpt_net/controller/lang/mapping.py +4 -2
  6. pygpt_net/controller/model/__init__.py +3 -1
  7. pygpt_net/controller/model/importer.py +337 -0
  8. pygpt_net/controller/settings/editor.py +3 -0
  9. pygpt_net/core/bridge/worker.py +4 -2
  10. pygpt_net/core/command/__init__.py +33 -2
  11. pygpt_net/core/models/__init__.py +6 -3
  12. pygpt_net/core/models/ollama.py +7 -2
  13. pygpt_net/data/config/config.json +9 -4
  14. pygpt_net/data/config/models.json +22 -22
  15. pygpt_net/data/locale/locale.de.ini +18 -0
  16. pygpt_net/data/locale/locale.en.ini +19 -2
  17. pygpt_net/data/locale/locale.es.ini +18 -0
  18. pygpt_net/data/locale/locale.fr.ini +18 -0
  19. pygpt_net/data/locale/locale.it.ini +18 -0
  20. pygpt_net/data/locale/locale.pl.ini +19 -1
  21. pygpt_net/data/locale/locale.uk.ini +18 -0
  22. pygpt_net/data/locale/locale.zh.ini +17 -0
  23. pygpt_net/item/ctx.py +2 -1
  24. pygpt_net/item/model.py +5 -1
  25. pygpt_net/plugin/cmd_files/__init__.py +2 -2
  26. pygpt_net/plugin/cmd_files/worker.py +2 -2
  27. pygpt_net/provider/core/model/json_file.py +3 -0
  28. pygpt_net/provider/core/model/patch.py +24 -1
  29. pygpt_net/provider/gpt/__init__.py +54 -21
  30. pygpt_net/provider/gpt/responses.py +279 -0
  31. pygpt_net/provider/gpt/vision.py +40 -16
  32. pygpt_net/provider/llms/ollama.py +7 -2
  33. pygpt_net/provider/llms/ollama_custom.py +693 -0
  34. pygpt_net/ui/dialog/models_importer.py +82 -0
  35. pygpt_net/ui/dialogs.py +3 -1
  36. pygpt_net/ui/menu/config.py +18 -7
  37. pygpt_net/ui/widget/dialog/model_importer.py +55 -0
  38. pygpt_net/ui/widget/lists/model_importer.py +151 -0
  39. {pygpt_net-2.5.14.dist-info → pygpt_net-2.5.16.dist-info}/METADATA +75 -9
  40. {pygpt_net-2.5.14.dist-info → pygpt_net-2.5.16.dist-info}/RECORD +43 -37
  41. {pygpt_net-2.5.14.dist-info → pygpt_net-2.5.16.dist-info}/LICENSE +0 -0
  42. {pygpt_net-2.5.14.dist-info → pygpt_net-2.5.16.dist-info}/WHEEL +0 -0
  43. {pygpt_net-2.5.14.dist-info → pygpt_net-2.5.16.dist-info}/entry_points.txt +0 -0

pygpt_net/provider/gpt/__init__.py
@@ -6,7 +6,7 @@
 # GitHub: https://github.com/szczyglis-dev/py-gpt #
 # MIT License #
 # Created By : Marcin Szczygliński #
-# Updated Date: 2025.03.02 19:00:00 #
+# Updated Date: 2025.06.25 02:00:00 #
 # ================================================== #

 from httpx_socks import SyncProxyTransport
@@ -29,6 +29,7 @@ from .assistants import Assistants
 from .chat import Chat
 from .completion import Completion
 from .image import Image
+from .responses import Responses
 from .store import Store
 from .summarizer import Summarizer
 from .vision import Vision
@@ -47,6 +48,7 @@ class Gpt:
         self.chat = Chat(window)
         self.completion = Completion(window)
         self.image = Image(window)
+        self.responses = Responses(window)
         self.store = Store(window)
         self.summarizer = Summarizer(window)
         self.vision = Vision(window)
@@ -108,6 +110,12 @@ class Gpt:
         ai_name = ctx.output_name
         thread_id = ctx.thread  # from ctx

+        # --- responses API ---- /beta/
+        use_responses_api = False
+        if mode == MODE_CHAT:
+            use_responses_api = True  # use responses API for chat, audio, research modes
+        ctx.use_responses_api = use_responses_api  # set in context
+
         # get model id
         model_id = None
         if model is not None:
@@ -128,20 +136,30 @@
             )
             used_tokens = self.completion.get_used_tokens()

-        # chat (OpenAI) | research (Perplexity)
+        # chat, audio (OpenAI) | research (Perplexity)
         elif mode in [
             MODE_CHAT,
             MODE_AUDIO,
             MODE_RESEARCH
         ]:
-            response = self.chat.send(
-                context=context,
-                extra=extra,
-            )
-            if hasattr(response, "citations"):
-                if response.citations:
-                    ctx.urls = response.citations
-            used_tokens = self.chat.get_used_tokens()
+            # responses API
+            if use_responses_api:
+                response = self.responses.send(
+                    context=context,
+                    extra=extra,
+                )
+                used_tokens = self.responses.get_used_tokens()
+            else:
+                # chat completion API
+                response = self.chat.send(
+                    context=context,
+                    extra=extra,
+                )
+                if hasattr(response, "citations"):
+                    if response.citations:
+                        ctx.urls = response.citations
+                used_tokens = self.chat.get_used_tokens()
+
             self.vision.append_images(ctx)  # append images to ctx if provided

         # image
@@ -184,7 +202,7 @@

         # if stream
         if stream:
-            ctx.stream = response
+            ctx.stream = response  # generator
             ctx.set_output("", ai_name)  # set empty output
             ctx.input_tokens = used_tokens  # get from input tokens calculation
             return True
@@ -206,13 +224,21 @@
             MODE_VISION,
             MODE_RESEARCH
         ]:
-            if response.choices[0]:
-                if response.choices[0].message.content:
-                    output = response.choices[0].message.content.strip()
-                elif response.choices[0].message.tool_calls:
-                    ctx.tool_calls = self.window.core.command.unpack_tool_calls(
-                        response.choices[0].message.tool_calls,
+            if use_responses_api:
+                if response.output_text:
+                    output = response.output_text.strip()
+                if response.output:
+                    ctx.tool_calls = self.window.core.command.unpack_tool_calls_responses(
+                        response.output,
                     )
+            else:
+                if response.choices[0]:
+                    if response.choices[0].message.content:
+                        output = response.choices[0].message.content.strip()
+                    elif response.choices[0].message.tool_calls:
+                        ctx.tool_calls = self.window.core.command.unpack_tool_calls(
+                            response.choices[0].message.tool_calls,
+                        )
         # audio
         elif mode in [MODE_AUDIO]:
             if response.choices[0]:
@@ -234,10 +260,17 @@
             )

         ctx.set_output(output, ai_name)
-        ctx.set_tokens(
-            response.usage.prompt_tokens,
-            response.usage.completion_tokens,
-        )
+
+        if not use_responses_api:
+            ctx.set_tokens(
+                response.usage.prompt_tokens,
+                response.usage.completion_tokens,
+            )
+        else:
+            ctx.set_tokens(
+                response.usage.input_tokens,
+                response.usage.output_tokens,
+            )
         return True

     def quick_call(self, context: BridgeContext, extra: dict = None) -> str:
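
Note on the last hunk above: a Chat Completions response reports usage.prompt_tokens / usage.completion_tokens, while a Responses API response reports usage.input_tokens / usage.output_tokens, which is why ctx.set_tokens() now branches on use_responses_api. A compact sketch of the same mapping, reusing the names from the hunk (illustrative, not code from the package):

# equivalent mapping of the usage fields consumed by ctx.set_tokens()
in_tok, out_tok = (
    (response.usage.input_tokens, response.usage.output_tokens)            # Responses API
    if use_responses_api
    else (response.usage.prompt_tokens, response.usage.completion_tokens)  # Chat Completions
)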

pygpt_net/provider/gpt/responses.py (new file)
@@ -0,0 +1,279 @@
+#!/usr/bin/env python3
+# -*- coding: utf-8 -*-
+# ================================================== #
+# This file is a part of PYGPT package #
+# Website: https://pygpt.net #
+# GitHub: https://github.com/szczyglis-dev/py-gpt #
+# MIT License #
+# Created By : Marcin Szczygliński #
+# Updated Date: 2025.06.25 02:00:00 #
+# ================================================== #
+
+import json
+import time
+from typing import Optional, Dict, Any, List
+
+from pygpt_net.core.types import (
+    MODE_CHAT,
+    MODE_VISION,
+    MODE_AUDIO,
+    MODE_RESEARCH,
+)
+from pygpt_net.core.bridge.context import BridgeContext, MultimodalContext
+from pygpt_net.item.ctx import CtxItem
+from pygpt_net.item.model import ModelItem
+
+from .utils import sanitize_name
+from pygpt_net.item.attachment import AttachmentItem
+
+
+class Responses:
+    def __init__(self, window=None):
+        """
+        Responses API wrapper
+
+        :param window: Window instance
+        """
+        self.window = window
+        self.input_tokens = 0
+        self.audio_prev_id = None
+        self.audio_prev_expires_ts = None
+
+    def send(
+            self,
+            context: BridgeContext,
+            extra: Optional[Dict[str, Any]] = None
+    ):
+        """
+        Call OpenAI API for chat
+
+        :param context: Bridge context
+        :param extra: Extra arguments
+        :return: response or stream chunks
+        """
+        prompt = context.prompt
+        stream = context.stream
+        max_tokens = int(context.max_tokens or 0)
+        system_prompt = context.system_prompt
+        mode = context.mode
+        model = context.model
+        functions = context.external_functions
+        attachments = context.attachments
+        multimodal_ctx = context.multimodal_ctx
+
+        ctx = context.ctx
+        if ctx is None:
+            ctx = CtxItem()  # create empty context
+        user_name = ctx.input_name  # from ctx
+        ai_name = ctx.output_name  # from ctx
+
+        client = self.window.core.gpt.get_client(mode)
+
+        # build chat messages
+        messages = self.build(
+            prompt=prompt,
+            system_prompt=system_prompt,
+            model=model,
+            history=context.history,
+            attachments=attachments,
+            ai_name=ai_name,
+            user_name=user_name,
+            multimodal_ctx=multimodal_ctx,
+        )
+        msg_tokens = self.window.core.tokens.from_messages(
+            messages,
+            model.id,
+        )
+        # check if max tokens not exceeded
+        if max_tokens > 0:
+            if msg_tokens + int(max_tokens) > model.ctx:
+                max_tokens = model.ctx - msg_tokens - 1
+                if max_tokens < 0:
+                    max_tokens = 0
+
+        # extra API kwargs
+        response_kwargs = {}
+
+        # tools / functions
+        tools = []
+        if functions is not None and isinstance(functions, list):
+            for function in functions:
+                if str(function['name']).strip() == '' or function['name'] is None:
+                    continue
+                params = {}
+                if function['params'] is not None and function['params'] != "":
+                    params = json.loads(function['params'])  # unpack JSON from string
+                tools.append({
+                    "type": "function",
+                    "name": function['name'],
+                    "parameters": params,
+                    "description": function['desc'],
+                })
+
+        # extra arguments, o3 only
+        if model.extra and "reasoning_effort" in model.extra:
+            response_kwargs['reasoning'] = {}
+            response_kwargs['reasoning']['effort'] = model.extra["reasoning_effort"]
+
+        # extend tools with external tools
+        if not model.id.startswith("o1") and not model.id.startswith("o3"):
+            tools.append({"type": "web_search_preview"})
+
+        # tool calls are not supported for o1-mini and o1-preview
+        if (model.id is not None
+                and model.id not in ["o1-mini", "o1-preview"]):
+            if len(tools) > 0:
+                response_kwargs['tools'] = tools
+
+        # audio mode
+        if mode in [MODE_AUDIO]:
+            stream = False
+            voice_id = "alloy"
+            tmp_voice = self.window.core.plugins.get_option("audio_output", "openai_voice")
+            if tmp_voice:
+                voice_id = tmp_voice
+            response_kwargs["modalities"] = ["text", "audio"]
+            response_kwargs["audio"] = {
+                "voice": voice_id,
+                "format": "wav"
+            }
+
+        response = client.responses.create(
+            input=messages,
+            model=model.id,
+            stream=stream,
+            **response_kwargs,
+        )
+        return response
+
+    def build(
+            self,
+            prompt: str,
+            system_prompt: str,
+            model: ModelItem,
+            history: Optional[List[CtxItem]] = None,
+            attachments: Optional[Dict[str, AttachmentItem]] = None,
+            ai_name: Optional[str] = None,
+            user_name: Optional[str] = None,
+            multimodal_ctx: Optional[MultimodalContext] = None,
+    ) -> list:
+        """
+        Build list of chat messages
+
+        :param prompt: user prompt
+        :param system_prompt: system prompt
+        :param history: history
+        :param model: model item
+        :param attachments: attachments
+        :param ai_name: AI name
+        :param user_name: username
+        :param multimodal_ctx: Multimodal context
+        :return: messages list
+        """
+        messages = []
+
+        # tokens config
+        mode = MODE_CHAT
+        allowed_system = True
+        if (model.id is not None
+                and model.id in ["o1-mini", "o1-preview"]):
+            allowed_system = False
+
+        used_tokens = self.window.core.tokens.from_user(
+            prompt,
+            system_prompt,
+        )  # threshold and extra included
+        max_ctx_tokens = self.window.core.config.get('max_total_tokens')  # max context window
+
+        # fit to max model tokens
+        if max_ctx_tokens > model.ctx:
+            max_ctx_tokens = model.ctx
+
+        # input tokens: reset
+        self.reset_tokens()
+
+        # append system prompt
+        if allowed_system:
+            if system_prompt is not None and system_prompt != "":
+                messages.append({"role": "developer", "content": system_prompt})
+
+        # append messages from context (memory)
+        if self.window.core.config.get('use_context'):
+            items = self.window.core.ctx.get_history(
+                history,
+                model.id,
+                mode,
+                used_tokens,
+                max_ctx_tokens,
+            )
+            for item in items:
+                # input
+                if item.final_input is not None and item.final_input != "":
+                    messages.append({
+                        "role": "user",
+                        "content": item.final_input,
+                    })
+
+                # output
+                if item.final_output is not None and item.final_output != "":
+                    msg = {
+                        "role": "assistant",
+                        "content": item.final_output,
+                    }
+                    # append previous audio ID
+                    if MODE_AUDIO in model.mode:
+                        if item.audio_id:
+                            # at first check expires_at - expired audio throws error in API
+                            current_timestamp = time.time()
+                            audio_timestamp = int(item.audio_expires_ts) if item.audio_expires_ts else 0
+                            if audio_timestamp and audio_timestamp > current_timestamp:
+                                msg["audio"] = {
+                                    "id": item.audio_id
+                                }
+                        elif self.audio_prev_id:
+                            current_timestamp = time.time()
+                            audio_timestamp = int(self.audio_prev_expires_ts) if self.audio_prev_expires_ts else 0
+                            if audio_timestamp and audio_timestamp > current_timestamp:
+                                msg["audio"] = {
+                                    "id": self.audio_prev_id
+                                }
+                    messages.append(msg)
+
+        # use vision and audio if available in current model
+        content = str(prompt)
+        if MODE_VISION in model.mode:
+            content = self.window.core.gpt.vision.build_content(
+                content=content,
+                attachments=attachments,
+                responses_api=True,
+            )
+        if MODE_AUDIO in model.mode:
+            content = self.window.core.gpt.audio.build_content(
+                content=content,
+                multimodal_ctx=multimodal_ctx,
+            )
+
+        # append current prompt
+        messages.append({
+            "role": "user",
+            "content": content,
+        })
+
+        # input tokens: update
+        self.input_tokens += self.window.core.tokens.from_messages(
+            messages,
+            model.id,
+        )
+        return messages
+
+    def reset_tokens(self):
+        """Reset input tokens counter"""
+        self.input_tokens = 0
+
+    def get_used_tokens(self) -> int:
+        """
+        Get input tokens counter
+
+        :return: input tokens
+        """
+        return self.input_tokens
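
For orientation, the attributes consumed above and in gpt/__init__.py (output_text, output, usage.input_tokens / usage.output_tokens) come from the object returned by client.responses.create(). A minimal standalone sketch with the official openai SDK, assuming openai>=1.x with Responses API support and OPENAI_API_KEY set in the environment; the model id and prompts are illustrative, not taken from this package:

from openai import OpenAI

client = OpenAI()  # reads OPENAI_API_KEY from the environment
response = client.responses.create(
    model="gpt-4o",  # illustrative model id
    input=[
        {"role": "developer", "content": "You are a helpful assistant."},
        {"role": "user", "content": "Hello!"},
    ],
    stream=False,
)
print(response.output_text)  # aggregated text output
print(response.usage.input_tokens, response.usage.output_tokens)  # counts fed to ctx.set_tokens()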

pygpt_net/provider/gpt/vision.py
@@ -6,7 +6,7 @@
 # GitHub: https://github.com/szczyglis-dev/py-gpt #
 # MIT License #
 # Created By : Marcin Szczygliński #
-# Updated Date: 2024.12.14 22:00:00 #
+# Updated Date: 2025.06.25 02:00:00 #
 # ================================================== #

 import base64
@@ -168,18 +168,26 @@ class Vision:
             self,
             content: Union[str, list],
             attachments: Optional[Dict[str, AttachmentItem]] = None,
+            responses_api: Optional[bool] = False,
     ) -> List[dict]:
         """
         Build vision content

         :param content: content (str or list)
         :param attachments: attachments (dict, optional)
+        :param responses_api: if True, use responses API format
         :return: List of contents
         """
+        type_text = "text"
+        type_image = "image_url"
+        if responses_api:
+            type_text = "input_text"
+            type_image = "input_image"
+
         if not isinstance(content, list):
             content = [
                 {
-                    "type": "text",
+                    "type": type_text,
                     "text": str(content)
                 }
             ]
@@ -193,14 +201,22 @@
         urls = self.extract_urls(prompt)
         if len(urls) > 0:
             for url in urls:
-                content.append(
-                    {
-                        "type": "image_url",
-                        "image_url": {
-                            "url": url,
+                if not responses_api:
+                    content.append(
+                        {
+                            "type": type_image,
+                            "image_url": {
+                                "url": url,
+                            }
+                        }
+                    )
+                else:
+                    content.append(
+                        {
+                            "type": type_image,
+                            "image_url": url,
                         }
-                    }
-                )
+                    )
                 self.urls.append(url)

         # local images (attachments)
@@ -211,14 +227,22 @@
                 # check if it's an image
                 if self.is_image(attachment.path):
                     base64_image = self.encode_image(attachment.path)
-                    content.append(
-                        {
-                            "type": "image_url",
-                            "image_url": {
-                                "url": f"data:image/jpeg;base64,{base64_image}",
+                    if not responses_api:
+                        content.append(
+                            {
+                                "type": type_image,
+                                "image_url": {
+                                    "url": f"data:image/jpeg;base64,{base64_image}",
+                                }
                             }
-                        }
-                    )
+                        )
+                    else:
+                        content.append(
+                            {
+                                "type": type_image,
+                                "image_url": f"data:image/jpeg;base64,{base64_image}",
+                            }
+                        )
                     self.attachments[id] = attachment.path
                     attachment.consumed = True

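The responses_api flag only changes the shape of the content parts that build_content() emits. A hedged before/after sketch for a single attached image, using the field names from the hunks above (variable names are illustrative, the base64 payload is elided):

# Chat Completions format (responses_api=False) - unchanged behaviour
part_chat = {
    "type": "image_url",
    "image_url": {"url": "data:image/jpeg;base64,..."},
}

# Responses API format (responses_api=True) - new in this release
part_responses = {
    "type": "input_image",
    "image_url": "data:image/jpeg;base64,...",
}

# Text parts switch from {"type": "text", ...} to {"type": "input_text", ...} in the same way.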

pygpt_net/provider/llms/ollama.py
@@ -6,7 +6,7 @@
 # GitHub: https://github.com/szczyglis-dev/py-gpt #
 # MIT License #
 # Created By : Marcin Szczygliński #
-# Updated Date: 2025.01.31 19:00:00 #
+# Updated Date: 2025.06.24 16:00:00 #
 # ================================================== #

 import os
@@ -14,7 +14,8 @@ from typing import Optional, List, Dict

 from langchain_community.chat_models import ChatOllama

-from llama_index.llms.ollama import Ollama
+from .ollama_custom import Ollama
+
 from llama_index.core.llms.llm import BaseLLM as LlamaBaseLLM
 from llama_index.core.base.embeddings.base import BaseEmbedding
 from llama_index.embeddings.ollama import OllamaEmbedding
@@ -85,6 +86,8 @@ class OllamaLLM(BaseLLM):
         args = self.parse_args(model.llama_index)
         if "request_timeout" not in args:
             args["request_timeout"] = 120
+        if 'OLLAMA_API_BASE' in os.environ:
+            args["base_url"] = os.environ['OLLAMA_API_BASE']
         return Ollama(**args)

     def get_embeddings_model(
@@ -104,6 +107,8 @@ class OllamaLLM(BaseLLM):
         args = self.parse_args({
             "args": config,
         })
+        if 'OLLAMA_API_BASE' in os.environ:
+            args["base_url"] = os.environ['OLLAMA_API_BASE']
         return OllamaEmbedding(**args)

     def init_embeddings(
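
Both builders above now honour the OLLAMA_API_BASE environment variable, so a non-default Ollama endpoint can be selected without touching the model config. A small sketch, assuming an Ollama server reachable at the given address (the URL is illustrative):

import os

# set before the provider constructs its clients; picked up by the code shown above
os.environ["OLLAMA_API_BASE"] = "http://192.168.1.50:11434"  # illustrative address

# with the variable set, the builders pass it as base_url to Ollama(**args) and
# OllamaEmbedding(**args); without it, the libraries' default local endpoint is used.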