wcgw-5.5.4-py3-none-any.whl

This diff shows the content of publicly available package versions as released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their public registries.
@@ -0,0 +1,404 @@
+ import base64
+ import json
+ import mimetypes
+ import os
+ import subprocess
+ import tempfile
+ import traceback
+ import uuid
+ from pathlib import Path
+ from typing import DefaultDict, Optional, cast
+
+ import openai
+ import petname  # type: ignore[import-untyped]
+ import rich
+ import tokenizers  # type: ignore[import-untyped]
+ from dotenv import load_dotenv
+ from openai import OpenAI
+ from openai.types.chat import (
+     ChatCompletionContentPartParam,
+     ChatCompletionMessageParam,
+     ChatCompletionUserMessageParam,
+ )
+ from pydantic import BaseModel
+ from typer import Typer
+
+ from wcgw.client.bash_state.bash_state import BashState
+ from wcgw.client.common import CostData, History, Models, discard_input
+ from wcgw.client.memory import load_memory
+ from wcgw.client.tool_prompts import TOOL_PROMPTS
+ from wcgw.client.tools import (
+     Context,
+     ImageData,
+     default_enc,
+     get_tool_output,
+     initialize,
+     which_tool,
+     which_tool_name,
+ )
+
+ from .openai_utils import get_input_cost, get_output_cost
+
+
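+ # Per-session spend settings: `cost_file` maps a model name to its CostData
+ # (price per million input/output tokens), and `cost_limit` caps total spend.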
+ class Config(BaseModel):
+     model: Models
+     cost_limit: float
+     cost_file: dict[Models, CostData]
+     cost_unit: str = "$"
+
+
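+ # Read the user's message from stdin; an empty line falls back to opening
+ # $EDITOR (vim by default) on a temp file and using whatever was saved there.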
+ def text_from_editor(console: rich.console.Console) -> str:
+     # First consume all the input till now
+     discard_input()
+     console.print("\n---------------------------------------\n# User message")
+     data = input()
+     if data:
+         return data
+     editor = os.environ.get("EDITOR", "vim")
+     with tempfile.NamedTemporaryFile(suffix=".tmp") as tf:
+         subprocess.run([editor, tf.name], check=True)
+         with open(tf.name, "r") as f:
+             data = f.read()
+     console.print(data)
+     return data
+
+
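+ # Persist the transcript under .wcgw/, named after the first user message
+ # plus the short session id, e.g. .wcgw/fix_the_build_ab12cd.json
+ # (filename shown here is illustrative).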
+ def save_history(history: History, session_id: str) -> None:
+     myid = str(history[1]["content"]).replace("/", "_").replace(" ", "_").lower()[:60]
+     myid += "_" + session_id
+     myid = myid + ".json"
+
+     mypath = Path(".wcgw") / myid
+     mypath.parent.mkdir(parents=True, exist_ok=True)
+     with open(mypath, "w") as f:
+         json.dump(history, f, indent=3)
+
+
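+ # Lines beginning with `%` are in-message commands; only `%image <path>` is
+ # supported. For example, the message
+ #     what's in this screenshot?
+ #     %image /tmp/shot.png
+ # becomes one text part plus one base64-encoded image_url part.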
+ def parse_user_message_special(msg: str) -> ChatCompletionUserMessageParam:
+     # Search for lines starting with `%` and treat them as special commands
+     parts: list[ChatCompletionContentPartParam] = []
+     for line in msg.split("\n"):
+         if line.startswith("%"):
+             args = line[1:].strip().split(" ")
+             command = args[0]
+             assert command == "image"
+             image_path = " ".join(args[1:])
+             with open(image_path, "rb") as f:
+                 image_bytes = f.read()
+             image_b64 = base64.b64encode(image_bytes).decode("utf-8")
+             image_type = mimetypes.guess_type(image_path)[0]
+             dataurl = f"data:{image_type};base64,{image_b64}"
+             parts.append(
+                 {"type": "image_url", "image_url": {"url": dataurl, "detail": "auto"}}
+             )
+         else:
+             if len(parts) > 0 and parts[-1]["type"] == "text":
+                 parts[-1]["text"] += "\n" + line
+             else:
+                 parts.append({"type": "text", "text": line})
+     return {"role": "user", "content": parts}
+
+
+ app = Typer(pretty_exceptions_show_locals=False)
+
+
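+ # The interactive chat loop. Note that `loop` itself is passed into
+ # get_tool_output further down, apparently so tools can run nested
+ # conversations; it returns the final message and the accumulated cost.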
+ @app.command()
+ def loop(
+     first_message: Optional[str] = None,
+     limit: Optional[float] = None,
+     resume: Optional[str] = None,
+ ) -> tuple[str, float]:
+     load_dotenv()
+
+     session_id = str(uuid.uuid4())[:6]
+
+     history: History = []
+     waiting_for_assistant = False
+
+     memory = None
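+     # `--resume` first tries to load a saved task memory by id; if that file
+     # lookup fails (OSError) it is treated as a history JSON path, where
+     # "latest" picks the most recently modified file under .wcgw/.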
+     if resume:
+         try:
+             _, memory, _ = load_memory(
+                 resume,
+                 24000,  # coding_max_tokens
+                 8000,  # noncoding_max_tokens
+                 lambda x: default_enc.encoder(x),
+                 lambda x: default_enc.decoder(x),
+             )
+         except OSError:
+             if resume == "latest":
+                 resume_path = sorted(Path(".wcgw").iterdir(), key=os.path.getmtime)[-1]
+             else:
+                 resume_path = Path(resume)
+             if not resume_path.exists():
+                 raise FileNotFoundError(f"File {resume} not found")
+             with resume_path.open() as f:
+                 history = json.load(f)
+             if len(history) <= 2:
+                 raise ValueError("Invalid history file")
+             first_message = ""
+             waiting_for_assistant = history[-1]["role"] != "assistant"
+
+     my_dir = os.path.dirname(__file__)
+
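+     # Default model and its hard-coded per-million-token prices; the
+     # OPENAI_MODEL env var overrides the model name.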
+     config = Config(
+         model=cast(Models, os.getenv("OPENAI_MODEL", "gpt-4o-2024-08-06").lower()),
+         cost_limit=0.1,
+         cost_unit="$",
+         cost_file={
+             "gpt-4o-2024-08-06": CostData(
+                 cost_per_1m_input_tokens=5, cost_per_1m_output_tokens=15
+             ),
+         },
+     )
+
+     if limit is not None:
+         config.cost_limit = limit
+     limit = config.cost_limit
+
+     enc = tokenizers.Tokenizer.from_pretrained("Xenova/gpt-4o")
+
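+     # Publish every wcgw tool except Initialize as an OpenAI function tool,
+     # using each tool's pydantic schema.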
+     tools = [
+         openai.pydantic_function_tool(
+             which_tool_name(tool.name), description=tool.description
+         )
+         for tool in TOOL_PROMPTS
+         if tool.name != "Initialize"
+     ]
+
+     cost: float = 0
+     input_toks = 0
+     output_toks = 0
+     system_console = rich.console.Console(style="blue", highlight=False, markup=False)
+     error_console = rich.console.Console(style="red", highlight=False, markup=False)
+     user_console = rich.console.Console(
+         style="bright_black", highlight=False, markup=False
+     )
+     assistant_console = rich.console.Console(
+         style="white bold", highlight=False, markup=False
+     )
+
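+     # All tool calls run against one persistent shell session; BashState is a
+     # context manager, so the underlying shell is cleaned up on exit.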
+     with BashState(
+         system_console, os.getcwd(), None, None, None, None, True, None
+     ) as bash_state:
+         context = Context(bash_state, system_console)
+         system, context, _ = initialize(
+             "first_call",
+             context,
+             os.getcwd(),
+             [],
+             resume if (memory and resume) else "",
+             24000,  # coding_max_tokens
+             8000,  # noncoding_max_tokens
+             mode="wcgw",
+             thread_id="",
+         )
+
+         if not history:
+             history = [{"role": "system", "content": system}]
+         else:
+             if history[-1]["role"] == "tool":
+                 waiting_for_assistant = True
+
+         client = OpenAI()
+
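+         # Main turn loop: stop once accumulated cost exceeds the limit;
+         # otherwise prompt the user, unless the assistant still owes a reply
+         # to a pending tool result.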
+         while True:
+             if cost > limit:
+                 system_console.print(
+                     f"\nCost limit exceeded. Current cost: {cost}, input tokens: {input_toks}, output tokens: {output_toks}"
+                 )
+                 break
+
+             if not waiting_for_assistant:
+                 if first_message:
+                     msg = first_message
+                     first_message = ""
+                 else:
+                     msg = text_from_editor(user_console)
+
+                 history.append(parse_user_message_special(msg))
+             else:
+                 waiting_for_assistant = False
+
+             cost_, input_toks_ = get_input_cost(
+                 config.cost_file[config.model], enc, history
+             )
+             cost += cost_
+             input_toks += input_toks_
+
+             stream = client.chat.completions.create(
+                 messages=history,
+                 model=config.model,
+                 stream=True,
+                 tools=tools,
+             )
+
+             system_console.print(
+                 "\n---------------------------------------\n# Assistant response",
+                 style="bold",
+             )
+             tool_call_args_by_id = DefaultDict[str, DefaultDict[int, str]](
+                 lambda: DefaultDict(str)
+             )
+             _histories: History = []
+             item: ChatCompletionMessageParam
+             full_response: str = ""
+             image_histories: History = []
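+             # Consume the stream: text deltas are echoed as they arrive, and
+             # tool-call argument fragments are accumulated per (id, index)
+             # until a finish_reason marks the message complete.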
+             try:
+                 for chunk in stream:
+                     if chunk.choices[0].finish_reason == "tool_calls":
+                         assert tool_call_args_by_id
+                         item = {
+                             "role": "assistant",
+                             "content": full_response,
+                             "tool_calls": [
+                                 {
+                                     "id": tool_call_id + str(toolindex),
+                                     "type": "function",
+                                     "function": {
+                                         "arguments": tool_args,
+                                         "name": type(which_tool(tool_args)).__name__,
+                                     },
+                                 }
+                                 for tool_call_id, toolcallargs in tool_call_args_by_id.items()
+                                 for toolindex, tool_args in toolcallargs.items()
+                             ],
+                         }
+                         cost_, output_toks_ = get_output_cost(
+                             config.cost_file[config.model], enc, item
+                         )
+                         cost += cost_
+                         system_console.print(
+                             f"\n---------------------------------------\n# Assistant invoked tools: {[which_tool(tool['function']['arguments']) for tool in item['tool_calls']]}"
+                         )
+                         system_console.print(
+                             f"\nTotal cost: {config.cost_unit}{cost:.3f}"
+                         )
+                         output_toks += output_toks_
+
+                         _histories.append(item)
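+                         # Execute each completed tool call; a failure is fed
+                         # back to the model as the tool's output instead of
+                         # crashing the session.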
+                         for tool_call_id, toolcallargs in tool_call_args_by_id.items():
+                             for toolindex, tool_args in toolcallargs.items():
+                                 try:
+                                     output_or_dones, cost_ = get_tool_output(
+                                         context,
+                                         json.loads(tool_args),
+                                         enc,
+                                         limit - cost,
+                                         loop,
+                                         24000,  # coding_max_tokens
+                                         8000,  # noncoding_max_tokens
+                                     )
+                                     output_or_done = output_or_dones[0]
+                                 except Exception as e:
+                                     output_or_done = (
+                                         f"GOT EXCEPTION while calling tool. Error: {e}"
+                                     )
+                                     tb = traceback.format_exc()
+                                     error_console.print(output_or_done + "\n" + tb)
+                                     cost_ = 0
+                                 cost += cost_
+                                 system_console.print(
+                                     f"\nTotal cost: {config.cost_unit}{cost:.3f}"
+                                 )
+
+                                 output = output_or_done
+
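+                                 # Tool results are text-only in the chat API,
+                                 # so image outputs are instead appended as a
+                                 # separate user message, and the tool result
+                                 # only references the generated image id.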
+                                 if isinstance(output, ImageData):
+                                     randomId = petname.Generate(2, "-")
+                                     if not image_histories:
+                                         image_histories.extend(
+                                             [
+                                                 {
+                                                     "role": "assistant",
+                                                     "content": f"Share images with ids: {randomId}",
+                                                 },
+                                                 {
+                                                     "role": "user",
+                                                     "content": [
+                                                         {
+                                                             "type": "image_url",
+                                                             "image_url": {
+                                                                 "url": output.dataurl,
+                                                                 "detail": "auto",
+                                                             },
+                                                         }
+                                                     ],
+                                                 },
+                                             ]
+                                         )
+                                     else:
+                                         image_histories[0]["content"] += ", " + randomId
+                                         second_content = image_histories[1]["content"]
+                                         assert isinstance(second_content, list)
+                                         second_content.append(
+                                             {
+                                                 "type": "image_url",
+                                                 "image_url": {
+                                                     "url": output.dataurl,
+                                                     "detail": "auto",
+                                                 },
+                                             }
+                                         )
+
+                                     item = {
+                                         "role": "tool",
+                                         "content": f"Ask user for image id: {randomId}",
+                                         "tool_call_id": tool_call_id + str(toolindex),
+                                     }
+                                 else:
+                                     item = {
+                                         "role": "tool",
+                                         "content": str(output),
+                                         "tool_call_id": tool_call_id + str(toolindex),
+                                     }
+                                 cost_, output_toks_ = get_output_cost(
+                                     config.cost_file[config.model], enc, item
+                                 )
+                                 cost += cost_
+                                 output_toks += output_toks_
+
+                                 _histories.append(item)
+                         waiting_for_assistant = True
+                         break
+                     elif chunk.choices[0].finish_reason:
+                         assistant_console.print("")
+                         item = {
+                             "role": "assistant",
+                             "content": full_response,
+                         }
+                         cost_, output_toks_ = get_output_cost(
+                             config.cost_file[config.model], enc, item
+                         )
+                         cost += cost_
+                         output_toks += output_toks_
+
+                         system_console.print(
+                             f"\nTotal cost: {config.cost_unit}{cost:.3f}"
+                         )
+                         _histories.append(item)
+                         break
+
+                     if chunk.choices[0].delta.tool_calls:
+                         tool_call = chunk.choices[0].delta.tool_calls[0]
+                         if tool_call.function and tool_call.function.arguments:
+                             tool_call_args_by_id[tool_call.id or ""][
+                                 tool_call.index
+                             ] += tool_call.function.arguments
+
+                     chunk_str = chunk.choices[0].delta.content or ""
+                     assistant_console.print(chunk_str, end="")
+                     full_response += chunk_str
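+             # Ctrl-C discards this turn's partial results: the except path
+             # skips the else-block below, so _histories is never committed to
+             # history, and the turn is redone from the same state.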
+             except KeyboardInterrupt:
+                 waiting_for_assistant = False
+                 input("Interrupted...enter to redo the current turn")
+             else:
+                 history.extend(_histories)
+                 history.extend(image_histories)
+                 save_history(history, session_id)
+
+     return "Couldn't finish the task", cost
+
+
+ if __name__ == "__main__":
+     app()
@@ -0,0 +1,67 @@
+ from typing import cast
+
+ from openai.types.chat import (
+     ChatCompletionAssistantMessageParam,
+     ChatCompletionMessage,
+     ChatCompletionMessageParam,
+     ParsedChatCompletionMessage,
+ )
+ from tokenizers import Tokenizer  # type: ignore[import-untyped]
+
+ from wcgw.client.common import CostData, History
+
+
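+ # Token-count the full message list and price it at the model's input rate.
+ # E.g. 2,000 input tokens at $5 per 1M tokens costs 2000 * 5 / 1_000_000 = $0.01.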
+ def get_input_cost(
+     cost_map: CostData, enc: Tokenizer, history: History
+ ) -> tuple[float, int]:
+     input_tokens = 0
+     for msg in history:
+         content = msg["content"]
+         refusal = msg.get("refusal")
+         if isinstance(content, list):
+             for part in content:
+                 if "text" in part:
+                     input_tokens += len(enc.encode(part["text"]))
+         elif content is None:
+             if refusal is None:
+                 raise ValueError("Expected content or refusal to be present")
+             input_tokens += len(enc.encode(str(refusal)))
+         elif not isinstance(content, str):
+             raise ValueError(f"Expected content to be string, got {type(content)}")
+         else:
+             input_tokens += len(enc.encode(content))
+     cost = input_tokens * cost_map.cost_per_1m_input_tokens / 1_000_000
+     return cost, input_tokens
+
+
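+ # Price an assistant message at the output rate. Tool messages return (0, 0):
+ # their text is produced by the tools rather than the model, and it is billed
+ # at the input rate on the next turn anyway, since get_input_cost walks the
+ # whole history.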
+ def get_output_cost(
+     cost_map: CostData,
+     enc: Tokenizer,
+     item: ChatCompletionMessage | ChatCompletionMessageParam,
+ ) -> tuple[float, int]:
+     if isinstance(item, ChatCompletionMessage):
+         content = item.content
+         if not isinstance(content, str):
+             raise ValueError(f"Expected content to be string, got {type(content)}")
+     else:
+         if not isinstance(item["content"], str):
+             raise ValueError(
+                 f"Expected content to be string, got {type(item['content'])}"
+             )
+         content = item["content"]
+         if item["role"] == "tool":
+             return 0, 0
+     output_tokens = len(enc.encode(content))
+
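+     # Arguments the model generated for tool calls count as output tokens
+     # too, whether the message is a plain dict or a parsed pydantic message.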
+ if "tool_calls" in item:
57
+ item = cast(ChatCompletionAssistantMessageParam, item)
58
+ toolcalls = item["tool_calls"]
59
+ for tool_call in toolcalls or []:
60
+ output_tokens += len(enc.encode(tool_call["function"]["arguments"]))
61
+ elif isinstance(item, ParsedChatCompletionMessage):
62
+ if item.tool_calls:
63
+ for tool_callf in item.tool_calls:
64
+ output_tokens += len(enc.encode(tool_callf.function.arguments))
65
+
66
+ cost = output_tokens * cost_map.cost_per_1m_output_tokens / 1_000_000
67
+ return cost, output_tokens