PyPI - universal-mcp-agents - Versions diffs - 0.1.10__tar.gz → 0.1.11__tar.gz - Mend

universal-mcp-agents 0.1.10 (tar.gz) → 0.1.11 (tar.gz)

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of universal-mcp-agents might be problematic. Click here for more details.

Files changed (61)

{universal_mcp_agents-0.1.10 → universal_mcp_agents-0.1.11}/GEMINI.md RENAMED Viewed

@@ -43,4 +43,8 @@ Common commands (copy/paste)
 - Remove: `uv remove <pkg>`
 - Run app: `uv run python -m <your_module>` or `uv run main.py`
 - Tests: `uv run pytest -q`
-- Lint/format: `uv run ruff check .` and/or `uv run ruff format .`
+- Lint/format: `uv run ruff check .` and/or `uv run ruff format .`
+NEVER commit or push changes without asking explicitly.

{universal_mcp_agents-0.1.10 → universal_mcp_agents-0.1.11}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: universal-mcp-agents
-Version: 0.1.10
+Version: 0.1.11
 Summary: Add your description here
 Project-URL: Homepage, https://github.com/universal-mcp/applications
 Project-URL: Repository, https://github.com/universal-mcp/applications

{universal_mcp_agents-0.1.10 → universal_mcp_agents-0.1.11}/bump_and_release.sh RENAMED Viewed

@@ -9,7 +9,7 @@ uv sync --all-extras
 # Run tests with pytest
 echo "Running tests with pytest..."
-# uv run pytest
+uv run pytest
 echo "Tests passed!"

{universal_mcp_agents-0.1.10 → universal_mcp_agents-0.1.11}/pyproject.toml RENAMED Viewed

@@ -6,7 +6,7 @@ build-backend = "hatchling.build"
 [project]
 name = "universal-mcp-agents"
-version = "0.1.10"
+version = "0.1.11"
 description = "Add your description here"
 readme = "README.md"
 authors = [

{universal_mcp_agents-0.1.10 → universal_mcp_agents-0.1.11}/src/universal_mcp/agents/codeact/agent.py RENAMED Viewed

@@ -11,8 +11,6 @@ from universal_mcp.types import ToolConfig, ToolFormat
 from universal_mcp.agents.base import BaseAgent
 from universal_mcp.agents.codeact.prompts import (
-    REFLECTION_PROMPT,
-    RETRY_PROMPT,
     create_default_prompt,
     make_safe_function_name,
 )
@@ -39,11 +37,6 @@ class CodeActAgent(BaseAgent):
         self.tools_config = tools or {}
         self.registry = registry
         self.eval_fn = eval_unsafe
-        self.reflection_prompt = REFLECTION_PROMPT
-        self.reflection_model = self.model_instance
-        self.max_reflections = 3
-        self.tools_context = {}
-        self.context = {}
         self.sandbox_timeout = sandbox_timeout
         self.processed_tools: list[StructuredTool | Callable] = []
@@ -57,13 +50,6 @@ class CodeActAgent(BaseAgent):
         self.instructions = create_default_prompt(self.processed_tools, self.instructions)
-        for tool in self.processed_tools:
-            safe_name = make_safe_function_name(tool.name)
-            tool_callable = tool.coroutine if hasattr(tool, "coroutine") and tool.coroutine is not None else tool.func
-            self.tools_context[safe_name] = tool_callable
-        self.context = {**self.context, **self.tools_context}
         agent = StateGraph(CodeActState)
         agent.add_node("call_model", self.call_model)
         agent.add_node("sandbox", self.sandbox)
@@ -97,64 +83,56 @@ class CodeActAgent(BaseAgent):
         return content
     async def call_model(self, state: CodeActState) -> dict:
+        logger.debug(f"Calling model with state: {state}")
         model = self.model_instance
-        reflection_model = self.reflection_model
-        messages = [{"role": "system", "content": self.instructions}] + state["messages"]
+        # Find the last script and its output in the message history
+        previous_script = state.get("script", "")
+        sandbox_output = state.get("sandbox_output", "")
+        logger.debug(f"Previous script: {previous_script}")
+        logger.debug(f"Sandbox output: {sandbox_output}")
+        prompt_messages = [
+            {"role": "system", "content": self.instructions},
+            *state["messages"],
+        ]
+        if previous_script:
+            feedback_message = (
+                f"Here is the script you generated in the last turn:\n\n```python\n{previous_script}\n```\n\n"
+            )
+            if sandbox_output:
+                feedback_message += (
+                    f"When executed, it produced the following output:\n\n```\n{sandbox_output}\n```\n\n"
+                )
+            feedback_message += "Based on this, please generate a new, improved script to continue the task. Remember to replace the old script entirely."
+            prompt_messages.append({"role": "user", "content": feedback_message})
+        logger.debug(f"Prompt messages: {prompt_messages}")
-        response = await model.ainvoke(messages)
+        response = await model.ainvoke(prompt_messages)
+        logger.debug(f"Model response: {response}")
         text_content = self._extract_content(response)
         if not isinstance(text_content, str):
             raise ValueError(f"Content is not a string: {text_content}")
         code = extract_and_combine_codeblocks(text_content)
-        logger.debug(f"Code: {code}")
-        if self.max_reflections > 0 and code:
-            reflection_count = 0
-            while reflection_count < self.max_reflections:
-                conversation_history = "\n".join(
-                    [
-                        f'<message role="{("user" if m.type == "human" else "assistant")}">\n{m.content}\n</message>'
-                        for m in state["messages"]
-                    ]
-                )
-                conversation_history += f'\n<message role="assistant">\n{response.content}\n</message>'
-                formatted_prompt = REFLECTION_PROMPT.format(conversation_history=conversation_history)
-                reflection_messages = [
-                    {"role": "system", "content": self.reflection_prompt},
-                    {"role": "user", "content": formatted_prompt},
-                ]
-                reflection_result = await reflection_model.ainvoke(reflection_messages)
-                if "NONE" in reflection_result.content:
-                    break
-                retry_prompt = RETRY_PROMPT.format(reflection_result=reflection_result.content)
-                regeneration_messages = [
-                    {"role": "system", "content": self.instructions},
-                    *state["messages"],
-                    {"role": "assistant", "content": response.content},
-                    {"role": "user", "content": retry_prompt},
-                ]
-                response = await model.ainvoke(regeneration_messages)
-                code = extract_and_combine_codeblocks(response.content)
-                if not code:
-                    break
-                reflection_count += 1
+        logger.debug(f"Extracted code: {code}")
         return {"messages": [response], "script": code}
     async def sandbox(self, state: CodeActState) -> dict:
-        output, new_vars = await self.eval_fn(state["script"], self.context, timeout=self.sandbox_timeout)
-        self.context = {**self.context, **new_vars}
+        logger.debug(f"Running sandbox with state: {state}")
+        tools_context = {}
+        for tool in self.processed_tools:
+            safe_name = make_safe_function_name(tool.name)
+            tool_callable = tool.coroutine if hasattr(tool, "coroutine") and tool.coroutine is not None else tool.func
+            tools_context[safe_name] = tool_callable
+        output, _ = await self.eval_fn(state["script"], tools_context, self.sandbox_timeout)
+        logger.debug(f"Sandbox output: {output}")
         return {
             "messages": [AIMessageChunk(content=output.strip())],
             "script": None,
+            "sandbox_output": output.strip(),
         }

universal_mcp_agents-0.1.11/src/universal_mcp/agents/codeact/prompts.py ADDED Viewed

@@ -0,0 +1,82 @@
+import inspect
+import re
+from collections.abc import Sequence
+from langchain_core.tools import StructuredTool
+def make_safe_function_name(name: str) -> str:
+    """Convert a tool name to a valid Python function name."""
+    # Replace non-alphanumeric characters with underscores
+    safe_name = re.sub(r"[^a-zA-Z0-9_]", "_", name)
+    # Ensure the name doesn't start with a digit
+    if safe_name and safe_name[0].isdigit():
+        safe_name = f"tool_{safe_name}"
+    # Handle empty name edge case
+    if not safe_name:
+        safe_name = "unnamed_tool"
+    return safe_name
+def create_default_prompt(
+    tools: Sequence[StructuredTool],
+    base_prompt: str | None = None,
+):
+    """Create default prompt for the CodeAct agent."""
+    prompt = f"{base_prompt}\n\n" if base_prompt else ""
+    prompt += """You are a Python programmer. You will be given a task to perform.
+Your goal is to write a self-contained Python script to accomplish the task.
+In each turn, you will generate a complete Python script. The script will be executed in a fresh, stateless environment.
+You will be given the previous script you generated and the output it produced.
+Your task is to analyze the output to find errors or opportunities for improvement, and then generate a new, improved script.
+You must take the previous script as a starting point and replace it with a new one that moves closer to the final solution.
+Your final script must be a single, complete piece of code that can be executed independently.
+The script must follow this structure:
+1. All necessary imports at the top.
+2. An `async def main():` function containing the core logic.
+3. Do NOT include any code outside of the `async def main()` function, and do NOT call it. The execution environment handles this.
+Any output you want to see from the code should be printed to the console from within the `main` function.
+Code should be output in a fenced code block (e.g. ```python ... ```).
+If you need to ask for more information or provide the final answer, you can output text to be shown directly to the user.
+In addition to the Python Standard Library, you can use the following functions:"""
+    for tool in tools:
+        # Use coroutine if it exists, otherwise use func
+        tool_callable = tool.coroutine if hasattr(tool, "coroutine") and tool.coroutine is not None else tool.func
+        # Create a safe function name
+        safe_name = make_safe_function_name(tool.name)
+        # Determine if it's an async function
+        is_async = inspect.iscoroutinefunction(tool_callable)
+        # Add appropriate function definition
+        prompt += f'''\n{"async " if is_async else ""}def {safe_name}{str(inspect.signature(tool_callable))}:
+    """{tool.description}"""
+    ...
+'''
+    prompt += """\n\n\nAlways use print() statements to explore data structures and function outputs. Simply returning values will not display them back to you for inspection. For example, use print(result) instead of just 'result'.
+As you don't know the output schema of the additional Python functions you have access to, start from exploring their contents before building a final solution.
+IMPORTANT CODING STRATEGY:
+1. All your code must be inside an `async def main()` function.
+2. Do NOT import `asyncio` or call `main()`. The execution environment handles this.
+3. Since many of the provided tools are async, you must use `await` to call them from within `main()`.
+4. Write code up to the point where you make an API call/tool usage with an output.
+5. Print the type/shape and a sample entry of this output, and using that knowledge proceed to write the further code.
+This means:
+- Write code that makes the API call or tool usage
+- Print the result with type information: print(f"Type: {type(result)}")
+- Print the shape/structure: print(f"Shape/Keys: {result.keys() if isinstance(result, dict) else len(result) if isinstance(result, (list, tuple)) else 'N/A'}")
+- Print a sample entry: print(f"Sample: {result[0] if isinstance(result, (list, tuple)) and len(result) > 0 else result}")
+- Then, based on this knowledge, write the code to process/use this data
+Reminder: use Python code snippets to call tools
+When you have completely finished the task, present the final result from your script to the user in a clean and readable Markdown format. Do not just summarize what you did; provide the actual output. For example, if you were asked to find unsubscribe links and your script found them, your final response should be a Markdown-formatted list of those links. After you have provided the final output, you MUST end your response with the exact phrase "TASK_COMPLETE"."""
+    return prompt

universal_mcp_agents-0.1.11/src/universal_mcp/agents/codeact/sandbox.py ADDED Viewed

@@ -0,0 +1,39 @@
+import asyncio
+import builtins
+import contextlib
+import io
+from typing import Any
+from loguru import logger
+async def eval_unsafe(code: str, _locals: dict[str, Any], timeout: int = 10) -> tuple[str, dict[str, Any]]:
+    """Executes a string of Python code in a sandboxed environment."""
+    # Store original keys before execution
+    original_keys = set(_locals.keys())
+    result = f"Executing code...\n{code}\n\nOutput:\n"
+    result += "=" * 50 + "\n"
+    try:
+        logger.debug(f"Executing code with timeout {timeout}")
+        with contextlib.redirect_stdout(io.StringIO()) as f:
+            # Execute the code in the provided locals context
+            # This should define an async function `main`
+            exec(code, builtins.__dict__, _locals)
+            if "main" in _locals and asyncio.iscoroutinefunction(_locals["main"]):
+                # Run the main async function
+                await asyncio.wait_for(_locals["main"](), timeout=timeout)
+            else:
+                result += "\nError: No `async def main()` function found in the script."
+        output = f.getvalue()
+        result += output
+        if not output:
+            result += "<code ran, no output printed to stdout>"
+    except Exception as e:
+        result += f"Error during execution: {repr(e)}"
+    # Determine new variables created during execution
+    new_keys = set(_locals.keys()) - original_keys
+    new_vars = {key: _locals[key] for key in new_keys}
+    return result, new_vars

universal_mcp_agents-0.1.11/src/universal_mcp/agents/codeact/state.py ADDED Viewed

@@ -0,0 +1,9 @@
+from langgraph.graph import MessagesState
+from pydantic import Field
+class CodeActState(MessagesState):
+    """State for CodeAct agent."""
+    script: str | None = Field(default=None, description="The Python code script to be executed.")
+    sandbox_output: str | None = Field(default=None, description="The output of the Python code script execution.")

{universal_mcp_agents-0.1.10 → universal_mcp_agents-0.1.11}/uv.lock RENAMED Viewed

@@ -1574,7 +1574,7 @@ name = "importlib-metadata"
 version = "8.7.0"
 source = { registry = "https://pypi.org/simple" }
 dependencies = [
-    { name = "zipp", marker = "python_full_version < '3.13'" },
+    { name = "zipp", marker = "python_full_version < '3.12'" },
 ]
 sdist = { url = "https://files.pythonhosted.org/packages/76/66/650a33bd90f786193e4de4b3ad86ea60b53c89b669a5c7be931fac31cdb0/importlib_metadata-8.7.0.tar.gz", hash = "sha256:d13b81ad223b890aa16c5471f2ac3056cf76c5f10f82d6f9292f0b415f389000", size = 56641, upload-time = "2025-04-27T15:29:01.736Z" }
 wheels = [
@@ -4389,7 +4389,7 @@ wheels = [
 [[package]]
 name = "universal-mcp-agents"
-version = "0.1.9"
+version = "0.1.10"
 source = { editable = "." }
 dependencies = [
     { name = "langchain-anthropic" },

universal_mcp_agents-0.1.10/src/universal_mcp/agents/codeact/prompts.py DELETED Viewed

@@ -1,91 +0,0 @@
-import inspect
-import re
-from collections.abc import Sequence
-from langchain_core.tools import StructuredTool
-def make_safe_function_name(name: str) -> str:
-    """Convert a tool name to a valid Python function name."""
-    # Replace non-alphanumeric characters with underscores
-    safe_name = re.sub(r"[^a-zA-Z0-9_]", "_", name)
-    # Ensure the name doesn't start with a digit
-    if safe_name and safe_name[0].isdigit():
-        safe_name = f"tool_{safe_name}"
-    # Handle empty name edge case
-    if not safe_name:
-        safe_name = "unnamed_tool"
-    return safe_name
-def create_default_prompt(
-    tools: Sequence[StructuredTool],
-    base_prompt: str | None = None,
-):
-    """Create default prompt for the CodeAct agent."""
-    prompt = f"{base_prompt}\n\n" if base_prompt else ""
-    prompt += """You will be given a task to perform. You should output either
-- a Python code snippet that provides the solution to the task, or a step towards the solution. Any output you want to extract from the code should be printed to the console. Code should be output in a fenced code block.
-- text to be shown directly to the user, if you want to ask for more information or provide the final answer.
-In addition to the Python Standard Library, you can use the following functions:"""
-    for tool in tools:
-        # Use coroutine if it exists, otherwise use func
-        tool_callable = tool.coroutine if hasattr(tool, "coroutine") and tool.coroutine is not None else tool.func
-        # Create a safe function name
-        safe_name = make_safe_function_name(tool.name)
-        # Determine if it's an async function
-        is_async = inspect.iscoroutinefunction(tool_callable)
-        # Add appropriate function definition
-        prompt += f'''\n{"async " if is_async else ""}def {safe_name}{str(inspect.signature(tool_callable))}:
-    """{tool.description}"""
-    ...
-'''
-    prompt += """
-Variables defined at the top level of previous code snippets can be referenced in your code.
-Always use print() statements to explore data structures and function outputs. Simply returning values will not display them back to you for inspection. For example, use print(result) instead of just 'result'.
-As you don't know the output schema of the additional Python functions you have access to, start from exploring their contents before building a final solution.
-IMPORTANT CODING STRATEGY:
-1. Only write code up to the point where you make an API call/tool usage with an output
-2. Print the type/shape and a sample entry of this output, and using that knowledge proceed to write the further code
-This means:
-- Write code that makes the API call or tool usage
-- Print the result with type information: print(f"Type: {type(result)}")
-- Print the shape/structure: print(f"Shape/Keys: {result.keys() if isinstance(result, dict) else len(result) if isinstance(result, (list, tuple)) else 'N/A'}")
-- Print a sample entry: print(f"Sample: {result[0] if isinstance(result, (list, tuple)) and len(result) > 0 else result}")
-- Then, based on this knowledge, write the code to process/use this data
-Reminder: use Python code snippets to call tools
-When you have completely finished the task and provided the final answer, you MUST end your response with the exact phrase "TASK_COMPLETE".
-"""
-    return prompt
-REFLECTION_PROMPT = """
-Review the assistant's latest code for as per the quality rules:
-<conversation_history>
-{conversation_history}
-</conversation_history>
-If you find ANY of these issues, describe the problem briefly and clearly.
-If NO issues are found, respond with EXACTLY: "NONE"
-"""
-RETRY_PROMPT = """
-I need you to completely regenerate your previous response based on this feedback:
-'''
-{reflection_result}
-'''
-DO NOT reference the feedback directly. Instead, provide a completely new response that addresses the issues.
-"""

universal_mcp_agents-0.1.10/src/universal_mcp/agents/codeact/sandbox.py DELETED Viewed

@@ -1,51 +0,0 @@
-import asyncio
-import builtins
-import contextlib
-import io
-from typing import Any
-async def eval_unsafe(code: str, _locals: dict[str, Any], timeout: int = 10) -> tuple[str, dict[str, Any]]:
-    """
-    Execute code in a non-blocking way and return the output and changed variables.
-    """
-    result = f"Executing code...\n{code}\n\nOutput:\n"
-    result += "=" * 50 + "\n"
-    # Create a combined globals/locals environment that includes builtins
-    # and the provided context. This allows nested functions to access tools.
-    execution_env = {**builtins.__dict__, **_locals}
-    def sync_eval_in_thread():
-        """Synchronously execute code and capture output."""
-        try:
-            with contextlib.redirect_stdout(io.StringIO()) as f:
-                exec(code, execution_env)
-            output = f.getvalue()
-            if not output:
-                output = "<code ran, no output printed to stdout>"
-            return output
-        except Exception as e:
-            return f"Error during execution: {repr(e)}"
-    # Run the synchronous exec in a separate thread to avoid blocking the event loop.
-    try:
-        output = await asyncio.wait_for(asyncio.to_thread(sync_eval_in_thread), timeout=timeout)
-    except asyncio.TimeoutError:
-        output = f"Error: Code execution timed out after {timeout} seconds."
-    result += output
-    # Identify all variables that are not part of the original builtins
-    # and were not in the initial _locals, or were changed.
-    changed_vars = {}
-    builtin_keys = set(builtins.__dict__.keys())
-    for key, value in execution_env.items():
-        if key in builtin_keys:
-            continue  # Skip builtins
-        # Check if the key is new or if the value has changed
-        if key not in _locals or _locals[key] is not value:
-            changed_vars[key] = value
-    return result, changed_vars

universal_mcp_agents-0.1.10/src/universal_mcp/agents/codeact/state.py DELETED Viewed

@@ -1,10 +0,0 @@
-from typing import Any
-from langgraph.graph import MessagesState
-class CodeActState(MessagesState):
-    """State for CodeAct agent."""
-    script: str | None
-    """The Python code script to be executed."""