PyPI - pygpt-net - Versions diffs - 2.7.6__py3-none-any.whl → 2.7.7__py3-none-any.whl - Mend

pygpt-net 2.7.6__py3-none-any.whl → 2.7.7__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (57)

pygpt_net/CHANGELOG.txt +6 -0
pygpt_net/__init__.py +3 -3
pygpt_net/controller/chat/remote_tools.py +3 -9
pygpt_net/controller/chat/stream.py +2 -2
pygpt_net/controller/chat/{handler/worker.py → stream_worker.py} +13 -35
pygpt_net/core/debug/models.py +2 -2
pygpt_net/data/config/config.json +14 -4
pygpt_net/data/config/models.json +192 -4
pygpt_net/data/config/settings.json +125 -35
pygpt_net/data/locale/locale.de.ini +2 -0
pygpt_net/data/locale/locale.en.ini +32 -8
pygpt_net/data/locale/locale.es.ini +2 -0
pygpt_net/data/locale/locale.fr.ini +2 -0
pygpt_net/data/locale/locale.it.ini +2 -0
pygpt_net/data/locale/locale.pl.ini +3 -1
pygpt_net/data/locale/locale.uk.ini +2 -0
pygpt_net/data/locale/locale.zh.ini +2 -0
pygpt_net/plugin/cmd_mouse_control/worker.py +2 -1
pygpt_net/plugin/cmd_mouse_control/worker_sandbox.py +2 -1
pygpt_net/provider/api/anthropic/__init__.py +8 -3
pygpt_net/provider/api/anthropic/chat.py +259 -11
pygpt_net/provider/api/anthropic/computer.py +844 -0
pygpt_net/provider/api/anthropic/remote_tools.py +172 -0
pygpt_net/{controller/chat/handler/anthropic_stream.py → provider/api/anthropic/stream.py} +24 -10
pygpt_net/provider/api/anthropic/tools.py +32 -77
pygpt_net/provider/api/anthropic/utils.py +30 -0
pygpt_net/provider/api/google/chat.py +3 -7
pygpt_net/{controller/chat/handler/google_stream.py → provider/api/google/stream.py} +1 -1
pygpt_net/provider/api/google/utils.py +185 -0
pygpt_net/{controller/chat/handler → provider/api/langchain}/__init__.py +0 -0
pygpt_net/{controller/chat/handler/langchain_stream.py → provider/api/langchain/stream.py} +1 -1
pygpt_net/provider/api/llama_index/__init__.py +0 -0
pygpt_net/{controller/chat/handler/llamaindex_stream.py → provider/api/llama_index/stream.py} +1 -1
pygpt_net/provider/api/openai/image.py +2 -2
pygpt_net/{controller/chat/handler/openai_stream.py → provider/api/openai/stream.py} +1 -1
pygpt_net/provider/api/openai/utils.py +69 -3
pygpt_net/provider/api/x_ai/__init__.py +109 -10
pygpt_net/provider/api/x_ai/chat.py +0 -0
pygpt_net/provider/api/x_ai/image.py +149 -47
pygpt_net/provider/api/x_ai/{remote.py → remote_tools.py} +165 -70
pygpt_net/provider/api/x_ai/responses.py +507 -0
pygpt_net/{controller/chat/handler/xai_stream.py → provider/api/x_ai/stream.py} +12 -1
pygpt_net/provider/api/x_ai/tools.py +59 -8
pygpt_net/{controller/chat/handler → provider/api/x_ai}/utils.py +1 -2
pygpt_net/provider/api/x_ai/vision.py +1 -4
pygpt_net/provider/core/config/patch.py +22 -1
pygpt_net/provider/core/model/patch.py +26 -1
pygpt_net/tools/image_viewer/ui/dialogs.py +3 -2
pygpt_net/tools/text_editor/ui/dialogs.py +3 -2
pygpt_net/tools/text_editor/ui/widgets.py +0 -0
pygpt_net/ui/widget/dialog/base.py +16 -5
pygpt_net/ui/widget/textarea/editor.py +0 -0
{pygpt_net-2.7.6.dist-info → pygpt_net-2.7.7.dist-info}/METADATA +8 -2
{pygpt_net-2.7.6.dist-info → pygpt_net-2.7.7.dist-info}/RECORD +54 -48
{pygpt_net-2.7.6.dist-info → pygpt_net-2.7.7.dist-info}/LICENSE +0 -0
{pygpt_net-2.7.6.dist-info → pygpt_net-2.7.7.dist-info}/WHEEL +0 -0
{pygpt_net-2.7.6.dist-info → pygpt_net-2.7.7.dist-info}/entry_points.txt +0 -0

pygpt_net/provider/api/anthropic/chat.py CHANGED Viewed

@@ -6,12 +6,13 @@
 # GitHub:  https://github.com/szczyglis-dev/py-gpt   #
 # MIT License                                        #
 # Created By  : Marcin Szczygliński                  #
-# Updated Date: 2025.09.05 01:00:00                  #
+# Updated Date: 2026.01.05 20:00:00                  #
 # ================================================== #
-from typing import Optional, Dict, Any, List
+import json
+from typing import Optional, Dict, Any, List, Set
-from pygpt_net.core.types import MODE_CHAT, MODE_AUDIO
+from pygpt_net.core.types import MODE_CHAT, MODE_AUDIO, MODE_COMPUTER
 from pygpt_net.core.bridge.context import BridgeContext, MultimodalContext
 from pygpt_net.item.attachment import AttachmentItem
 from pygpt_net.item.ctx import CtxItem
@@ -51,20 +52,43 @@ class Chat:
         api = self.window.core.api.anthropic
         client: anthropic.Anthropic = api.get_client(context.mode, model)
-        msgs = self.build_input(
-            prompt=prompt,
-            system_prompt=system_prompt,
+        # Tool result turn (Computer Use): if previous assistant emitted tool_use and we have tool output,
+        # build a minimal message triplet: [user(prompt that triggered tool), assistant(tool_use), user(tool_result + images)].
+        tool_result_messages = self._build_tool_result_messages_if_needed(
             model=model,
             history=context.history,
             attachments=attachments,
-            multimodal_ctx=multimodal_ctx,
         )
+        if tool_result_messages is not None:
+            msgs = tool_result_messages
+        else:
+            msgs = self.build_input(
+                prompt=prompt,
+                system_prompt=system_prompt,
+                model=model,
+                history=context.history,
+                attachments=attachments,
+                multimodal_ctx=multimodal_ctx,
+            )
         self.reset_tokens()
         count_msgs = self._build_count_messages(prompt, system_prompt, model, context.history)
         self.input_tokens += self.window.core.tokens.from_messages(count_msgs, model.id)
+        # Build tools (client tools + Anthropic server tools)
         tools = api.tools.get_all_tools(model, functions)
+        # Enable Computer Use tool in computer mode (use the official Tool/ComputerUse object)
+        if mode == MODE_COMPUTER or (model and isinstance(model.id, str) and "computer-use" in model.id.lower()):
+            tool = self.window.core.api.anthropic.computer.get_tool()
+            tools = [tool]  # reset tools to only Computer Use (multiple tools not supported together)
+        # MCP: servers from config
+        mcp_servers = self._load_mcp_servers_from_cfg()
+        # Compute betas required by selected server tools or MCP
+        betas = self._compute_required_betas(tools, mcp_servers)
         max_tokens = context.max_tokens if context.max_tokens else 1024
         temperature = self.window.core.config.get('temperature')
         top_p = self.window.core.config.get('top_p')
@@ -83,14 +107,25 @@ class Chat:
             params["top_p"] = top_p
         if tools:  # only include when non-empty list
             params["tools"] = tools  # must be a valid list per API
+        if mcp_servers:
+            params["mcp_servers"] = mcp_servers  # MCP connector servers per docs
         if mode == MODE_AUDIO:
             stream = False  # no native TTS
+        # Decide whether to call stable or beta endpoint
+        use_beta = len(betas) > 0
         if stream:
-            return client.messages.create(stream=True, **params)
+            if use_beta:
+                return client.beta.messages.create(stream=True, betas=list(betas), **params)
+            else:
+                return client.messages.create(stream=True, **params)
         else:
-            return client.messages.create(**params)
+            if use_beta:
+                return client.beta.messages.create(betas=list(betas), **params)
+            else:
+                return client.messages.create(**params)
     def unpack_response(self, mode: str, response: Message, ctx: CtxItem):
         """
@@ -115,7 +150,19 @@ class Chat:
                 ctx.set_tokens(p, c)
                 if not isinstance(ctx.extra, dict):
                     ctx.extra = {}
-                ctx.extra["usage"] = {"vendor": "anthropic", "input_tokens": p, "output_tokens": c}
+                # include server_tool_use counts if present
+                server_tool_use = {}
+                if hasattr(usage, "server_tool_use"):
+                    try:
+                        server_tool_use = dict(getattr(usage, "server_tool_use"))
+                    except Exception:
+                        server_tool_use = {}
+                ctx.extra["usage"] = {
+                    "vendor": "anthropic",
+                    "input_tokens": p,
+                    "output_tokens": c,
+                    "server_tool_use": server_tool_use,
+                }
         except Exception:
             pass
@@ -125,6 +172,12 @@ class Chat:
         except Exception:
             pass
+        # Collect fetched URLs from web_fetch_tool_result blocks
+        try:
+            self._collect_web_fetch_urls(response, ctx)
+        except Exception:
+            pass
     def extract_text(self, response: Message) -> str:
         """
         Extract text from response content blocks.
@@ -210,6 +263,39 @@ class Chat:
                 if u not in ctx.urls:
                     ctx.urls.append(u)
+    def _collect_web_fetch_urls(self, response: Message, ctx: CtxItem):
+        """
+        Collect URLs from web_fetch_tool_result blocks and attach to ctx.urls.
+        :param response: Message response from API
+        :param ctx: CtxItem to update
+        """
+        urls: List[str] = []
+        try:
+            for blk in getattr(response, "content", []) or []:
+                if getattr(blk, "type", "") == "web_fetch_tool_result":
+                    content = getattr(blk, "content", {}) or {}
+                    if isinstance(content, dict):
+                        if content.get("type") == "web_fetch_result":
+                            u = (content.get("url") or "").strip()
+                            if u.startswith("http://") or u.startswith("https://"):
+                                urls.append(u)
+                        # citations may embed multiple URLs
+                        if content.get("type") == "web_fetch_result" and isinstance(content.get("citations"), list):
+                            for cit in content["citations"]:
+                                u = (cit.get("url") or "").strip()
+                                if u.startswith("http://") or u.startswith("https://"):
+                                    urls.append(u)
+        except Exception:
+            pass
+        if urls:
+            if ctx.urls is None:
+                ctx.urls = []
+            for u in urls:
+                if u not in ctx.urls:
+                    ctx.urls.append(u)
     def build_input(
             self,
             prompt: str,
@@ -271,6 +357,7 @@ class Chat:
         if attachments:
             img_parts = self.window.core.api.anthropic.vision.build_blocks(content, attachments)
             parts.extend(img_parts)
+            content = ""  # image-first; do not duplicate text if build_blocks already added it
         if content:
             parts.append({"type": "text", "text": str(content)})
@@ -338,4 +425,165 @@ class Chat:
         :return: used input tokens
         """
-        return self.input_tokens
+        return self.input_tokens
+    def _load_mcp_servers_from_cfg(self) -> List[dict]:
+        """
+        Load MCP servers definition from config JSON string(s).
+        Supports keys:
+          - remote_tools.anthropic.mcp.mcp_servers
+        :return: list of MCP servers dicts
+        """
+        cfg = self.window.core.config
+        enabled = cfg.get("remote_tools.anthropic.mcp", False)
+        if not enabled:
+            return []  # do not load if MCP is disabled
+        raw = cfg.get("remote_tools.anthropic.mcp.mcp_servers")
+        if not raw:
+            return []
+        try:
+            if isinstance(raw, (list, dict)):
+                # ensure list
+                return list(raw) if isinstance(raw, list) else [raw]
+            return json.loads(raw) or []
+        except Exception:
+            return []
+    def _compute_required_betas(self, tools: List[dict], mcp_servers: List[dict]) -> Set[str]:
+        """
+        Compute required beta headers for enabled server tools.
+        :param tools: Final tools list
+        :param mcp_servers: MCP servers list
+        :return: set of beta header strings
+        """
+        betas: Set[str] = set()
+        is_mcp = False
+        for t in tools or []:
+            ttype = str(t.get("type") or "")
+            if ttype.startswith("web_fetch_"):
+                betas.add("web-fetch-2025-09-10")
+            elif ttype.startswith("code_execution_"):
+                betas.add("code-execution-2025-08-25")
+            elif ttype in ("tool_search_tool_regex_20251119", "tool_search_tool_bm25_20251119"):
+                betas.add("advanced-tool-use-2025-11-20")
+            elif ttype == "mcp_toolset":
+                is_mcp = True
+                betas.add("mcp-client-2025-11-20")
+            elif ttype.startswith("computer_"):
+                betas.add("computer-use-2025-01-24")
+        if is_mcp and mcp_servers:
+            betas.add("mcp-client-2025-11-20")
+        return betas
+    # -------------------------- Tool Result helpers (Anthropic Computer Use) -------------------------- #
+    def _build_tool_result_messages_if_needed(
+            self,
+            model: ModelItem,
+            history: Optional[List[CtxItem]],
+            attachments: Optional[Dict[str, AttachmentItem]],
+    ) -> Optional[List[dict]]:
+        """
+        If the previous assistant turn emitted tool_use (computer) and the plugin produced tool_output,
+        construct a minimal continuation with tool_result content block(s), as required by Anthropic.
+        Returns a messages list or None.
+        """
+        if not self.window.core.config.get('use_context'):
+            return None
+        items: List[CtxItem] = self.window.core.ctx.get_history(
+            history,
+            model.id,
+            MODE_CHAT,
+            self.window.core.tokens.from_user("", ""),
+            self._fit_ctx(model),
+        )
+        if not items:
+            return None
+        last = items[-1]
+        if not isinstance(getattr(last, "extra", None), dict):
+            return None
+        tool_uses = last.extra.get("anthropic_tool_uses") or []
+        tool_output = last.extra.get("tool_output") or []
+        if not tool_uses or not tool_output:
+            return None
+        # Build prior user message (the one that triggered the tool use)
+        prior_user_text = ""
+        if len(items) >= 2 and getattr(items[-2], "final_input", None):
+            prior_user_text = str(items[-2].final_input)
+        elif getattr(last, "input", None):
+            prior_user_text = str(last.input)
+        user_msg_1 = None
+        if prior_user_text:
+            user_msg_1 = {"role": "user", "content": [{"type": "text", "text": prior_user_text}]}
+        # Recreate assistant tool_use block(s)
+        assistant_parts: List[dict] = []
+        for tu in tool_uses:
+            tid = str(tu.get("id", "") or "")
+            name = str(tu.get("name", "") or "computer")
+            inp = tu.get("input", {}) or {}
+            assistant_parts.append({
+                "type": "tool_use",
+                "id": tid,
+                "name": name,
+                "input": inp,
+            })
+        assistant_msg = {"role": "assistant", "content": assistant_parts} if assistant_parts else None
+        # Build tool_result with last tool output; attach screenshot images (if any) as additional blocks
+        result_text = self._best_tool_result_text(tool_output)
+        last_tool_use_id = str(tool_uses[-1].get("id", "") or "")
+        tool_result_block = {
+            "type": "tool_result",
+            "tool_use_id": last_tool_use_id,
+            "content": [{"type": "text", "text": result_text}],
+        }
+        # Convert current attachments to image blocks and append after tool_result in the same user message
+        image_blocks: List[dict] = []
+        if attachments:
+            img_parts = self.window.core.api.anthropic.vision.build_blocks("", attachments)
+            for part in img_parts:
+                if isinstance(part, dict) and part.get("type") in ("image", "input_image", "document"):
+                    image_blocks.append(part)
+        user_msg_2 = {"role": "user", "content": [tool_result_block] + image_blocks}
+        out: List[dict] = []
+        if user_msg_1:
+            out.append(user_msg_1)
+        if assistant_msg:
+            out.append(assistant_msg)
+        out.append(user_msg_2)
+        return out
+    @staticmethod
+    def _best_tool_result_text(tool_output: List[dict]) -> str:
+        """
+        Build a compact text payload from plugin tool_output list.
+        Prefers the last item with 'result' field; falls back to the last dict JSON.
+        """
+        if not tool_output:
+            return "ok"
+        last = tool_output[-1]
+        try:
+            if isinstance(last, dict):
+                if "result" in last:
+                    val = last["result"]
+                    if isinstance(val, (dict, list)):
+                        return json.dumps(val, ensure_ascii=False)
+                    return str(val)
+                return json.dumps(last, ensure_ascii=False)
+            return str(last)
+        except Exception:
+            return "ok"

pygpt-net 2.7.6__py3-none-any.whl → 2.7.7__py3-none-any.whl

pygpt-net 2.7.6__py3-none-any.whl → 2.7.7__py3-none-any.whl