PyPI - tactus - Versions diffs - 0.33.0__py3-none-any.whl → 0.34.1__py3-none-any.whl - Mend

tactus: tactus-0.33.0-py3-none-any.whl → tactus-0.34.1-py3-none-any.whl

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (100)

tactus/__init__.py +1 -1
tactus/adapters/__init__.py +18 -1
tactus/adapters/broker_log.py +127 -34
tactus/adapters/channels/__init__.py +153 -0
tactus/adapters/channels/base.py +174 -0
tactus/adapters/channels/broker.py +179 -0
tactus/adapters/channels/cli.py +448 -0
tactus/adapters/channels/host.py +225 -0
tactus/adapters/channels/ipc.py +297 -0
tactus/adapters/channels/sse.py +305 -0
tactus/adapters/cli_hitl.py +223 -1
tactus/adapters/control_loop.py +879 -0
tactus/adapters/file_storage.py +35 -2
tactus/adapters/ide_log.py +7 -1
tactus/backends/http_backend.py +0 -1
tactus/broker/client.py +31 -1
tactus/broker/server.py +416 -92
tactus/cli/app.py +270 -7
tactus/cli/control.py +393 -0
tactus/core/config_manager.py +33 -6
tactus/core/dsl_stubs.py +102 -18
tactus/core/execution_context.py +265 -8
tactus/core/lua_sandbox.py +8 -9
tactus/core/registry.py +19 -2
tactus/core/runtime.py +235 -27
tactus/docker/Dockerfile.pypi +49 -0
tactus/docs/__init__.py +33 -0
tactus/docs/extractor.py +326 -0
tactus/docs/html_renderer.py +72 -0
tactus/docs/models.py +121 -0
tactus/docs/templates/base.html +204 -0
tactus/docs/templates/index.html +58 -0
tactus/docs/templates/module.html +96 -0
tactus/dspy/agent.py +382 -22
tactus/dspy/broker_lm.py +57 -6
tactus/dspy/config.py +14 -3
tactus/dspy/history.py +2 -1
tactus/dspy/module.py +136 -11
tactus/dspy/signature.py +0 -1
tactus/ide/server.py +300 -9
tactus/primitives/human.py +619 -47
tactus/primitives/system.py +0 -1
tactus/protocols/__init__.py +25 -0
tactus/protocols/control.py +427 -0
tactus/protocols/notification.py +207 -0
tactus/sandbox/container_runner.py +79 -11
tactus/sandbox/docker_manager.py +23 -0
tactus/sandbox/entrypoint.py +26 -0
tactus/sandbox/protocol.py +3 -0
tactus/stdlib/README.md +77 -0
tactus/stdlib/__init__.py +27 -1
tactus/stdlib/classify/__init__.py +165 -0
tactus/stdlib/classify/classify.spec.tac +195 -0
tactus/stdlib/classify/classify.tac +257 -0
tactus/stdlib/classify/fuzzy.py +282 -0
tactus/stdlib/classify/llm.py +319 -0
tactus/stdlib/classify/primitive.py +287 -0
tactus/stdlib/core/__init__.py +57 -0
tactus/stdlib/core/base.py +320 -0
tactus/stdlib/core/confidence.py +211 -0
tactus/stdlib/core/models.py +161 -0
tactus/stdlib/core/retry.py +171 -0
tactus/stdlib/core/validation.py +274 -0
tactus/stdlib/extract/__init__.py +125 -0
tactus/stdlib/extract/llm.py +330 -0
tactus/stdlib/extract/primitive.py +256 -0
tactus/stdlib/tac/tactus/classify/base.tac +51 -0
tactus/stdlib/tac/tactus/classify/fuzzy.tac +87 -0
tactus/stdlib/tac/tactus/classify/index.md +77 -0
tactus/stdlib/tac/tactus/classify/init.tac +29 -0
tactus/stdlib/tac/tactus/classify/llm.tac +150 -0
tactus/stdlib/tac/tactus/classify.spec.tac +191 -0
tactus/stdlib/tac/tactus/extract/base.tac +138 -0
tactus/stdlib/tac/tactus/extract/index.md +96 -0
tactus/stdlib/tac/tactus/extract/init.tac +27 -0
tactus/stdlib/tac/tactus/extract/llm.tac +201 -0
tactus/stdlib/tac/tactus/extract.spec.tac +153 -0
tactus/stdlib/tac/tactus/generate/base.tac +142 -0
tactus/stdlib/tac/tactus/generate/index.md +195 -0
tactus/stdlib/tac/tactus/generate/init.tac +28 -0
tactus/stdlib/tac/tactus/generate/llm.tac +169 -0
tactus/stdlib/tac/tactus/generate.spec.tac +210 -0
tactus/testing/behave_integration.py +171 -7
tactus/testing/context.py +0 -1
tactus/testing/evaluation_runner.py +0 -1
tactus/testing/gherkin_parser.py +0 -1
tactus/testing/mock_hitl.py +0 -1
tactus/testing/mock_tools.py +0 -1
tactus/testing/models.py +0 -1
tactus/testing/steps/builtin.py +0 -1
tactus/testing/steps/custom.py +81 -22
tactus/testing/steps/registry.py +0 -1
tactus/testing/test_runner.py +7 -1
tactus/validation/semantic_visitor.py +11 -5
tactus/validation/validator.py +0 -1
{tactus-0.33.0.dist-info → tactus-0.34.1.dist-info}/METADATA +14 -2
{tactus-0.33.0.dist-info → tactus-0.34.1.dist-info}/RECORD +100 -49
{tactus-0.33.0.dist-info → tactus-0.34.1.dist-info}/WHEEL +0 -0
{tactus-0.33.0.dist-info → tactus-0.34.1.dist-info}/entry_points.txt +0 -0
{tactus-0.33.0.dist-info → tactus-0.34.1.dist-info}/licenses/LICENSE +0 -0

tactus/dspy/agent.py CHANGED Viewed

@@ -12,6 +12,8 @@ The Agent uses:
 - Unified mocking via Mocks {} primitive
 """
+import asyncio
+import json
 import logging
 from typing import Any, Dict, List, Optional
@@ -61,6 +63,7 @@ class DSPyAgentHandle:
         mock_manager: Any = None,
         log_handler: Any = None,
         disable_streaming: bool = False,
+        execution_context: Any = None,
         **kwargs: Any,
     ):
         """
@@ -87,6 +90,7 @@ class DSPyAgentHandle:
             mock_manager: Optional MockManager instance for checking mocks
             log_handler: Optional log handler for emitting streaming events
             disable_streaming: If True, disable streaming even when log_handler is present
+            execution_context: Optional ExecutionContext for checkpointing agent calls
             **kwargs: Additional configuration
         """
         self.name = name
@@ -95,6 +99,8 @@ class DSPyAgentHandle:
         self.provider = provider
         self.tools = tools or []
         self.toolsets = toolsets or []
+        self.execution_context = execution_context
+        self._dspy_tools_cache = None  # Cache for converted DSPy tools
         # Default input schema: {message: string}
         self.input_schema = input_schema or {"message": {"type": "string", "required": False}}
         # Default output schema: {response: string}
@@ -108,8 +114,18 @@ class DSPyAgentHandle:
         self.mock_manager = mock_manager
         self.log_handler = log_handler
         self.disable_streaming = disable_streaming
+        self.tool_choice = kwargs.get("tool_choice")  # Extract tool_choice from kwargs
         self.kwargs = kwargs
+        # CRITICAL DEBUG: Log handler state at initialization
+        logger.info(
+            f"[AGENT_INIT] Agent '{self.name}' initialized with log_handler={log_handler is not None}, "
+            f"disable_streaming={disable_streaming}, "
+            f"log_handler_type={type(log_handler).__name__ if log_handler else 'None'}, "
+            f"tool_choice={self.tool_choice}, "
+            f"kwargs_keys={list(kwargs.keys())}"
+        )
         # Initialize conversation history
         self._history = create_history()
@@ -306,16 +322,173 @@ class DSPyAgentHandle:
             raise ValueError(f"Unknown module '{module}'. Supported: {list(mapping.keys())}")
         return strategy
+    def _convert_toolsets_to_dspy_tools_sync(self) -> list:
+        """
+        Convert Pydantic AI toolsets to DSPy Tool objects (synchronous version).
+        DSPy uses dspy.adapters.types.tool.Tool for native function calling.
+        Pydantic AI toolsets expose tools via .get_tools(ctx) method.
+        Returns:
+            List of DSPy Tool objects
+        """
+        try:
+            from dspy.adapters.types.tool import Tool as DSPyTool
+        except ImportError:
+            logger.error("Cannot import DSPyTool - DSPy installation may be incomplete")
+            return []
+        logger.info(f"Agent '{self.name}' has {len(self.toolsets)} toolsets to convert")
+        dspy_tools = []
+        # Convert toolsets to DSPy Tools
+        for idx, toolset in enumerate(self.toolsets):
+            logger.info(f"Agent '{self.name}' processing toolset {idx}: {type(toolset).__name__}")
+            try:
+                # Pydantic AI FunctionToolset has a .tools dict attribute that's directly accessible
+                # This avoids the need for async get_tools() call and RunContext
+                if hasattr(toolset, "tools") and isinstance(toolset.tools, dict):
+                    pydantic_tools = list(toolset.tools.values())
+                    logger.info(
+                        f"Agent '{self.name}' toolset {idx} has {len(pydantic_tools)} tools (from .tools attribute)"
+                    )
+                else:
+                    logger.warning(
+                        f"Toolset {toolset} doesn't have accessible .tools dict, skipping"
+                    )
+                    continue
+                for pydantic_tool in pydantic_tools:
+                    # Pydantic AI Tool has: name, description, function_schema.json_schema, function
+                    logger.info(
+                        f"Agent '{self.name}' converting tool: name={pydantic_tool.name}, desc={pydantic_tool.description[:50] if pydantic_tool.description else 'N/A'}..."
+                    )
+                    # Extract parameter schema from Pydantic AI tool
+                    tool_args = None
+                    if hasattr(pydantic_tool, "function_schema") and hasattr(
+                        pydantic_tool.function_schema, "json_schema"
+                    ):
+                        json_schema = pydantic_tool.function_schema.json_schema
+                        if "properties" in json_schema:
+                            # Convert JSON schema properties to DSPy's expected format
+                            tool_args = json_schema["properties"]
+                            logger.info(
+                                f"Extracted parameter schema for '{pydantic_tool.name}': {tool_args}"
+                            )
+                    dspy_tool = DSPyTool(
+                        func=pydantic_tool.function,
+                        name=pydantic_tool.name,
+                        desc=pydantic_tool.description,
+                        args=tool_args,  # Pass the parameter schema
+                    )
+                    dspy_tools.append(dspy_tool)
+                    logger.info(
+                        f"Converted tool '{pydantic_tool.name}' to DSPy Tool with args={tool_args}"
+                    )
+            except Exception as e:
+                import traceback
+                logger.error(f"Failed to convert toolset {toolset} to DSPy Tools: {e}")
+                logger.error(f"Traceback: {traceback.format_exc()}")
+        logger.info(f"Agent '{self.name}' converted {len(dspy_tools)} tools to DSPy format")
+        return dspy_tools
+    def _execute_tool(self, tool_name: str, tool_args: Dict[str, Any]) -> Any:
+        """
+        Execute a tool call using the available toolsets.
+        Args:
+            tool_name: Name of the tool to execute
+            tool_args: Arguments to pass to the tool
+        Returns:
+            Tool execution result
+        """
+        logger.info(f"[TOOL_EXEC] Executing tool '{tool_name}' with args: {tool_args}")
+        # Find the tool in our toolsets
+        for toolset in self.toolsets:
+            if hasattr(toolset, "tools") and isinstance(toolset.tools, dict):
+                for pydantic_tool in toolset.tools.values():
+                    if pydantic_tool.name == tool_name:
+                        logger.info(f"[TOOL_EXEC] Found tool '{tool_name}' in toolset")
+                        try:
+                            # Call the Pydantic AI tool function
+                            # The tool function might be async (wrapped Lua tools are)
+                            import asyncio
+                            import inspect
+                            # Check if the function is async before calling it
+                            if inspect.iscoroutinefunction(pydantic_tool.function):
+                                logger.info(
+                                    f"[TOOL_EXEC] Tool '{tool_name}' is async, running with nest_asyncio"
+                                )
+                                # Use nest_asyncio to allow running async code from sync context
+                                # even when there's already an event loop running
+                                try:
+                                    import nest_asyncio
+                                    nest_asyncio.apply()
+                                except ImportError:
+                                    logger.warning(
+                                        "[TOOL_EXEC] nest_asyncio not available, trying asyncio.run()"
+                                    )
+                                # Get the current event loop or create new one
+                                try:
+                                    loop = asyncio.get_event_loop()
+                                    if loop.is_running():
+                                        logger.info(
+                                            "[TOOL_EXEC] Loop is running, using run_until_complete with nest_asyncio"
+                                        )
+                                        # nest_asyncio allows this even though loop is running
+                                        coro = pydantic_tool.function(**tool_args)
+                                        result = loop.run_until_complete(coro)
+                                    else:
+                                        logger.info(
+                                            "[TOOL_EXEC] Loop not running, using run_until_complete"
+                                        )
+                                        coro = pydantic_tool.function(**tool_args)
+                                        result = loop.run_until_complete(coro)
+                                except RuntimeError:
+                                    # No loop at all
+                                    logger.info("[TOOL_EXEC] No event loop, using asyncio.run()")
+                                    result = asyncio.run(pydantic_tool.function(**tool_args))
+                            else:
+                                # Function is sync - just call it
+                                logger.info(
+                                    f"[TOOL_EXEC] Tool '{tool_name}' is sync, calling directly"
+                                )
+                                result = pydantic_tool.function(**tool_args)
+                            logger.info(f"[TOOL_EXEC] Tool '{tool_name}' returned: {result}")
+                            return result
+                        except Exception as e:
+                            logger.error(
+                                f"[TOOL_EXEC] Tool '{tool_name}' execution failed: {e}",
+                                exc_info=True,
+                            )
+                            return {"error": str(e)}
+        logger.warning(f"[TOOL_EXEC] Tool '{tool_name}' not found in any toolset")
+        return {"error": f"Tool '{tool_name}' not found"}
     def _build_module(self) -> TactusModule:
         """Build the internal DSPy module for this agent."""
         # Create a signature for agent turns
-        # Input: system_prompt, history, user_message, available_tools
+        # Input: system_prompt, history, user_message
+        # If tools available: also include tools as structured list[dspy.Tool]
         # Output: response and tool_calls (if tools are needed)
-        # Include tools in the signature if they're available
+        # Use DSPy's native function calling with structured tool input
+        # See: dspy/adapters/base.py - adapter preprocesses tools field
         if self.tools or self.toolsets:
-            signature = (
-                "system_prompt, history, user_message, available_tools -> response, tool_calls"
-            )
+            signature = "system_prompt, history, user_message, tools: list[dspy.Tool] -> response, tool_calls: dspy.ToolCalls"
         else:
             signature = "system_prompt, history, user_message -> response"
@@ -340,22 +513,29 @@ class DSPyAgentHandle:
         Returns:
             True if streaming should be enabled
         """
+        # CRITICAL DEBUG: Always log entry
+        logger.info(f"[STREAMING] Agent '{self.name}': _should_stream() called")
         # Must have log_handler to emit streaming events
         if self.log_handler is None:
-            logger.debug(f"[STREAMING] Agent '{self.name}': no log_handler, streaming disabled")
+            logger.info(f"[STREAMING] Agent '{self.name}': no log_handler, streaming disabled")
             return False
         # Allow log handlers to opt out of streaming (e.g., cost-only collectors)
         supports_streaming = getattr(self.log_handler, "supports_streaming", True)
+        logger.info(
+            f"[STREAMING] Agent '{self.name}': log_handler.supports_streaming={supports_streaming}"
+        )
         if not supports_streaming:
-            logger.debug(
+            logger.info(
                 f"[STREAMING] Agent '{self.name}': log_handler supports_streaming=False, streaming disabled"
             )
             return False
         # Respect explicit disable flag
+        logger.info(f"[STREAMING] Agent '{self.name}': disable_streaming={self.disable_streaming}")
         if self.disable_streaming:
-            logger.debug(
+            logger.info(
                 f"[STREAMING] Agent '{self.name}': disable_streaming=True, streaming disabled"
             )
             return False
@@ -480,7 +660,6 @@ class DSPyAgentHandle:
         Returns:
             TactusResult with value, usage, and cost_stats
         """
-        import asyncio
         import threading
         import queue
         from tactus.protocols.models import AgentTurnEvent, AgentStreamChunkEvent
@@ -644,9 +823,112 @@ class DSPyAgentHandle:
         # Add assistant response to new_messages
         if hasattr(result_holder["result"], "response"):
             assistant_msg = {"role": "assistant", "content": result_holder["result"].response}
+            # Include tool calls in the message if present (before wrapping)
+            has_tc = hasattr(result_holder["result"], "tool_calls")
+            tc_value = getattr(result_holder["result"], "tool_calls", None)
+            logger.info(
+                f"[ASYNC_STREAMING] Agent '{self.name}' result: has_tool_calls={has_tc}, tool_calls={tc_value}"
+            )
+            if (
+                hasattr(result_holder["result"], "tool_calls")
+                and result_holder["result"].tool_calls
+            ):
+                # Convert tool calls to JSON-serializable format
+                logger.info("[ASYNC_STREAMING] Converting tool_calls to dict format")
+                tool_calls_list = []
+                tc_obj = result_holder["result"].tool_calls
+                has_tc_attr = hasattr(tc_obj, "tool_calls")
+                logger.info(
+                    f"[ASYNC_STREAMING] tool_calls object: type={type(tc_obj)}, has_tool_calls_attr={has_tc_attr}"
+                )
+                for tc in (
+                    result_holder["result"].tool_calls.tool_calls
+                    if hasattr(result_holder["result"].tool_calls, "tool_calls")
+                    else []
+                ):
+                    logger.info(
+                        f"[ASYNC_STREAMING] Processing tool call: name={tc.name} args={tc.args}"
+                    )
+                    tool_calls_list.append(
+                        {
+                            "id": f"call_{tc.name}",  # Generate a simple ID
+                            "type": "function",
+                            "function": {
+                                "name": tc.name,
+                                "arguments": (
+                                    json.dumps(tc.args) if isinstance(tc.args, dict) else tc.args
+                                ),
+                            },
+                        }
+                    )
+                logger.info(
+                    f"[ASYNC_STREAMING] Built tool_calls_list with {len(tool_calls_list)} items"
+                )
+                if tool_calls_list:
+                    assistant_msg["tool_calls"] = tool_calls_list
+                    logger.info("[ASYNC_STREAMING] Added tool_calls to assistant_msg")
             new_messages.append(assistant_msg)
             self._history.add(assistant_msg)
+            # Execute tool calls and add tool result messages to history
+            if assistant_msg.get("tool_calls"):
+                logger.info(
+                    f"[ASYNC_STREAMING] Agent '{self.name}' executing {len(assistant_msg['tool_calls'])} tool calls"
+                )
+                for tc in assistant_msg["tool_calls"]:
+                    tool_name = tc["function"]["name"]
+                    tool_args_str = tc["function"]["arguments"]
+                    tool_args = (
+                        json.loads(tool_args_str)
+                        if isinstance(tool_args_str, str)
+                        else tool_args_str
+                    )
+                    tool_id = tc["id"]
+                    logger.info(
+                        f"[ASYNC_STREAMING] Executing tool: {tool_name} with args: {tool_args}"
+                    )
+                    # Execute the tool using toolsets
+                    tool_result = self._execute_tool(tool_name, tool_args)
+                    logger.info(f"[ASYNC_STREAMING] Tool executed successfully: {tool_result}")
+                    # Record the tool call so Lua can check if it was called
+                    tool_primitive = getattr(self, "_tool_primitive", None)
+                    if tool_primitive:
+                        # Remove agent name prefix from tool name if present
+                        # Tool names are stored as "agent_name_tool_name" in the primitive
+                        clean_tool_name = tool_name.replace(f"{self.name}_", "")
+                        tool_primitive.record_call(
+                            clean_tool_name, tool_args, tool_result, agent_name=self.name
+                        )
+                        logger.info(f"[ASYNC_STREAMING] Recorded tool call: {clean_tool_name}")
+                    # Add tool result to history in OpenAI's expected format
+                    # OpenAI requires: role="tool", tool_call_id=<id>, content=<result>
+                    tool_result_str = (
+                        json.dumps(tool_result)
+                        if isinstance(tool_result, dict)
+                        else str(tool_result)
+                    )
+                    tool_result_msg = {
+                        "role": "tool",
+                        "tool_call_id": tool_id,
+                        "name": tool_name,
+                        "content": tool_result_str,
+                    }
+                    logger.info(f"[ASYNC_STREAMING] Created tool result message: {tool_result_msg}")
+                    new_messages.append(tool_result_msg)
+                    logger.info(
+                        f"[ASYNC_STREAMING] Added tool result to new_messages, count={len(new_messages)}"
+                    )
+                    self._history.add(tool_result_msg)
+                    logger.info(
+                        f"[ASYNC_STREAMING] Added tool result to history for tool_call_id={tool_id}, history size={len(self._history)}"
+                    )
         # Wrap the result with message tracking
         wrapped_result = wrap_prediction(
             result_holder["result"],
@@ -726,6 +1008,38 @@ class DSPyAgentHandle:
         # Add assistant response to new_messages
         if hasattr(dspy_result, "response"):
             assistant_msg = {"role": "assistant", "content": dspy_result.response}
+            # Include tool calls in the message if present (before wrapping)
+            has_tc = hasattr(dspy_result, "tool_calls")
+            tc_value = getattr(dspy_result, "tool_calls", None)
+            logger.info(
+                f"Agent '{self.name}' dspy_result: has_tool_calls={has_tc}, tool_calls={tc_value}"
+            )
+            if hasattr(dspy_result, "tool_calls") and dspy_result.tool_calls:
+                # Convert tool calls to JSON-serializable format
+                tool_calls_list = []
+                for tc in (
+                    dspy_result.tool_calls.tool_calls
+                    if hasattr(dspy_result.tool_calls, "tool_calls")
+                    else []
+                ):
+                    tool_calls_list.append(
+                        {
+                            "id": f"call_{tc['name']}",  # Generate a simple ID
+                            "type": "function",
+                            "function": {
+                                "name": tc["name"],
+                                "arguments": (
+                                    json.dumps(tc["args"])
+                                    if isinstance(tc["args"], dict)
+                                    else tc["args"]
+                                ),
+                            },
+                        }
+                    )
+                if tool_calls_list:
+                    assistant_msg["tool_calls"] = tool_calls_list
             new_messages.append(assistant_msg)
             self._history.add(assistant_msg)
@@ -819,6 +1133,54 @@ class DSPyAgentHandle:
         if context:
             opts["context"] = context
+        # If execution_context is available, wrap in checkpoint for transparent durability
+        if self.execution_context:
+            def checkpoint_fn():
+                return self._execute_turn(opts)
+            result = self.execution_context.checkpoint(checkpoint_fn, f"agent_{self.name}_turn")
+        else:
+            # No checkpointing - execute directly
+            result = self._execute_turn(opts)
+        # Mirror AgentHandle convenience for Lua patterns like `agent(); return agent.output`.
+        output_text = None
+        if result is not None:
+            for attr in ("response", "message"):
+                try:
+                    value = getattr(result, attr, None)
+                except Exception:
+                    value = None
+                if isinstance(value, str):
+                    output_text = value
+                    break
+            if output_text is None and isinstance(result, dict):
+                for key in ("response", "message"):
+                    value = result.get(key)
+                    if isinstance(value, str):
+                        output_text = value
+                        break
+            if output_text is None:
+                output_text = str(result)
+        self.output = output_text
+        return result
+    def _execute_turn(self, opts: Dict[str, Any]) -> Any:
+        """
+        Execute a single agent turn (internal method for checkpointing).
+        This method contains the core agent execution logic that gets checkpointed.
+        Args:
+            opts: Turn options with message, context, and per-turn overrides
+        Returns:
+            Result object with response and other fields
+        """
         # Execute the turn (inlined from old turn() method)
         self._turn_count += 1
         logger.debug(f"Agent '{self.name}' turn {self._turn_count}")
@@ -848,6 +1210,9 @@ class DSPyAgentHandle:
                 config_kwargs["max_tokens"] = self.max_tokens
             if self.model_type is not None:
                 config_kwargs["model_type"] = self.model_type
+            if self.tool_choice is not None and (self.tools or self.toolsets):
+                config_kwargs["tool_choice"] = self.tool_choice
+                logger.info(f"Configuring LM with tool_choice={self.tool_choice}")
             configure_lm(model_for_litellm, **config_kwargs)
@@ -867,20 +1232,12 @@ class DSPyAgentHandle:
             "user_message": user_message or "",
         }
-        # Add available tools if agent has them
+        # Add tools as structured DSPy Tool objects if agent has them
+        # DSPy's adapter will convert these to OpenAI function call format
         if self.tools or self.toolsets:
-            # Format tools for the prompt
-            tool_descriptions = []
-            if self.toolsets:
-                # Convert toolsets to strings if they're not already
-                toolset_names = [str(ts) if not isinstance(ts, str) else ts for ts in self.toolsets]
-                tool_descriptions.append(f"Available toolsets: {', '.join(toolset_names)}")
-                tool_descriptions.append(
-                    "Use the 'done' tool with a 'reason' parameter to complete the task."
-                )
-            prompt_context["available_tools"] = (
-                "\n".join(tool_descriptions) if tool_descriptions else "No tools available"
-            )
+            dspy_tools = self._convert_toolsets_to_dspy_tools_sync()
+            prompt_context["tools"] = dspy_tools
+            logger.info(f"Agent '{self.name}' passing {len(dspy_tools)} DSPy tools to module")
         # Add any injected context (user_message is already in prompt_context)
         if context:
@@ -1094,6 +1451,7 @@ def create_dspy_agent(
     config: Dict[str, Any],
     registry: Any = None,
     mock_manager: Any = None,
+    execution_context: Any = None,
 ) -> DSPyAgentHandle:
     """
     Create a DSPy-based Agent from configuration.
@@ -1111,6 +1469,7 @@ def create_dspy_agent(
             - Other optional configuration
         registry: Optional Registry instance for accessing mocks
         mock_manager: Optional MockManager instance for checking mocks
+        execution_context: Optional ExecutionContext for checkpointing agent calls
     Returns:
         A DSPyAgentHandle instance
@@ -1141,6 +1500,7 @@ def create_dspy_agent(
         mock_manager=mock_manager,
         log_handler=config.get("log_handler"),
         disable_streaming=config.get("disable_streaming", False),
+        execution_context=execution_context,
         **{
             k: v
             for k, v in config.items()

tactus/dspy/broker_lm.py CHANGED Viewed

@@ -10,6 +10,7 @@ while still supporting streaming via DSPy's `streamify()` mechanism.
 from __future__ import annotations
+import logging
 from typing import Any
 import dspy
@@ -19,6 +20,8 @@ from litellm import ModelResponse, ModelResponseStream
 from tactus.broker.client import BrokerClient
+logger = logging.getLogger(__name__)
 def _split_provider_model(model: str) -> tuple[str, str]:
     if "/" not in model:
@@ -99,8 +102,16 @@ class BrokeredLM(dspy.BaseLM):
         caller_predict = dspy.settings.caller_predict
         caller_predict_id = id(caller_predict) if caller_predict else None
+        # Extract tools and tool_choice from kwargs
+        tools = merged_kwargs.get("tools")
+        tool_choice = merged_kwargs.get("tool_choice")
+        logger.debug(
+            f"[BROKER_LM] Calling LM with streaming={send_stream is not None}, tools={len(tools) if tools else 0}"
+        )
         if send_stream is not None:
             chunks: list[ModelResponseStream] = []
+            tool_calls_data = None
             async for event in self._client.llm_chat(
                 provider="openai",
                 model=model_id,
@@ -108,6 +119,8 @@ class BrokeredLM(dspy.BaseLM):
                 temperature=temperature,
                 max_tokens=max_tokens,
                 stream=True,
+                tools=tools,
+                tool_choice=tool_choice,
             ):
                 event_type = event.get("event")
                 if event_type == "delta":
@@ -125,23 +138,51 @@ class BrokeredLM(dspy.BaseLM):
                     continue
                 if event_type == "done":
+                    # Capture tool calls from done event
+                    data = event.get("data") or {}
+                    tool_calls_data = data.get("tool_calls")
+                    logger.debug(
+                        f"[BROKER_LM] Stream complete with {len(tool_calls_data) if tool_calls_data else 0} tool calls"
+                    )
                     break
                 if event_type == "error":
                     err = event.get("error") or {}
                     raise RuntimeError(err.get("message") or "Broker LLM error")
+            # Build response manually to ensure tool_calls stay as plain dicts
+            # (stream_chunk_builder might convert them to typed objects)
+            full_text = ""
             if chunks:
-                return litellm.stream_chunk_builder(chunks)
+                final_response = litellm.stream_chunk_builder(chunks)
+                if final_response.choices:
+                    message = (
+                        final_response.choices[0].get("message")
+                        if isinstance(final_response.choices[0], dict)
+                        else getattr(final_response.choices[0], "message", None)
+                    )
+                    if message:
+                        full_text = (
+                            message.get("content")
+                            if isinstance(message, dict)
+                            else getattr(message, "content", "") or ""
+                        )
+            message_data = {"role": "assistant", "content": full_text}
+            finish_reason = "stop"
+            if tool_calls_data:
+                # Keep tool calls as plain dictionaries (already in OpenAI format from broker)
+                message_data["tool_calls"] = tool_calls_data
+                finish_reason = "tool_calls"
-            # No streamed chunks; return an empty completion.
             return ModelResponse(
                 model=model_id,
                 choices=[
                     {
                         "index": 0,
-                        "finish_reason": "stop",
-                        "message": {"role": "assistant", "content": ""},
+                        "finish_reason": finish_reason,
+                        "message": message_data,
                     }
                 ],
                 usage={"prompt_tokens": 0, "completion_tokens": 0, "total_tokens": 0},
@@ -149,6 +190,7 @@ class BrokeredLM(dspy.BaseLM):
         # Non-streaming path
         final_text = ""
+        tool_calls_data = None
         usage = {"prompt_tokens": 0, "completion_tokens": 0, "total_tokens": 0}
         async for event in self._client.llm_chat(
             provider="openai",
@@ -157,24 +199,33 @@ class BrokeredLM(dspy.BaseLM):
             temperature=temperature,
             max_tokens=max_tokens,
             stream=False,
+            tools=tools,
+            tool_choice=tool_choice,
         ):
             event_type = event.get("event")
             if event_type == "done":
                 data = event.get("data") or {}
                 final_text = data.get("text") or ""
+                tool_calls_data = data.get("tool_calls")
                 usage = data.get("usage") or usage
                 break
             if event_type == "error":
                 err = event.get("error") or {}
                 raise RuntimeError(err.get("message") or "Broker LLM error")
+        # Build message response with tool calls if present
+        message_data = {"role": "assistant", "content": final_text}
+        if tool_calls_data:
+            # Keep tool calls as plain dictionaries (already in OpenAI format from broker)
+            message_data["tool_calls"] = tool_calls_data
         return ModelResponse(
             model=model_id,
             choices=[
                 {
                     "index": 0,
-                    "finish_reason": "stop",
-                    "message": {"role": "assistant", "content": final_text},
+                    "finish_reason": "tool_calls" if tool_calls_data else "stop",
+                    "message": message_data,
                 }
             ],
             usage=usage,

tactus 0.33.0__py3-none-any.whl → 0.34.1__py3-none-any.whl

tactus 0.33.0__py3-none-any.whl → 0.34.1__py3-none-any.whl