kailash 0.1.3__py3-none-any.whl → 0.1.4__py3-none-any.whl

@@ -0,0 +1,478 @@
+"""MCP (Model Context Protocol) integration for Kailash workflows.
+
+This module provides integration between MCP servers and Kailash workflows,
+allowing workflows to access MCP tools and resources.
+
+Design Philosophy:
+    MCP servers provide tools and context that can be used by workflows.
+    This integration allows workflows to discover and use MCP tools dynamically,
+    bridging the gap between workflow automation and AI-powered tools.
+
+Example:
+    Basic MCP integration:
+
+    >>> from kailash.api.mcp_integration import MCPIntegration
+    >>> # from kailash.workflow import Workflow # doctest: +SKIP
+    >>> # Create MCP integration
+    >>> mcp = MCPIntegration("tools_server")
+    >>> # Add tools
+    >>> # mcp.add_tool("search", search_function) # doctest: +SKIP
+    >>> # mcp.add_tool("calculate", calculator_function) # doctest: +SKIP
+    >>> # Use in workflow
+    >>> # workflow = Workflow("mcp_workflow") # doctest: +SKIP
+    >>> # workflow.register_mcp_server(mcp) # doctest: +SKIP
+    >>> # Nodes can now access MCP tools
+    >>> # node = MCPToolNode(tool_name="search") # doctest: +SKIP
+    >>> # workflow.add_node("search_data", node) # doctest: +SKIP
+"""
+
+import asyncio
+import logging
+from typing import Any, Callable, Dict, List, Optional, Union
+
+from pydantic import BaseModel, Field
+
+from ..nodes.base_async import AsyncNode
+
+logger = logging.getLogger(__name__)
+
+
+class MCPTool(BaseModel):
+    """Definition of an MCP tool."""
+
+    name: str
+    description: str
+    parameters: Dict[str, Any] = Field(default_factory=dict)
+    function: Optional[Callable] = None
+    async_function: Optional[Callable] = None
+    metadata: Dict[str, Any] = Field(default_factory=dict)
+
+
+class MCPResource(BaseModel):
+    """Definition of an MCP resource."""
+
+    name: str
+    uri: str
+    description: str
+    mime_type: str = "text/plain"
+    metadata: Dict[str, Any] = Field(default_factory=dict)
+
+
+class MCPIntegration:
+    """MCP server integration for Kailash workflows.
+
+    Provides:
+    - Tool registration and discovery
+    - Resource management
+    - Async/sync tool execution
+    - Context sharing between workflows and MCP
+
+    Attributes:
+        name: MCP server name
+        tools: Registry of available tools
+        resources: Registry of available resources
+    """
+
+    def __init__(
+        self, name: str, description: str = "", capabilities: List[str] = None
+    ):
+        """Initialize MCP integration.
+
+        Args:
+            name: MCP server name
+            description: Server description
+            capabilities: List of server capabilities
+        """
+        self.name = name
+        self.description = description
+        self.capabilities = capabilities or ["tools", "resources"]
+        self.tools: Dict[str, MCPTool] = {}
+        self.resources: Dict[str, MCPResource] = {}
+        self._context: Dict[str, Any] = {}
+
+    def add_tool(
+        self,
+        name: str,
+        function: Union[Callable, Callable[..., asyncio.Future]],
+        description: str = "",
+        parameters: Dict[str, Any] = None,
+    ):
+        """Add a tool to the MCP server.
+
+        Args:
+            name: Tool name
+            function: Tool implementation (sync or async)
+            description: Tool description
+            parameters: Tool parameter schema
+        """
+        tool = MCPTool(
+            name=name,
+            description=description,
+            parameters=parameters or {},
+            function=function if not asyncio.iscoroutinefunction(function) else None,
+            async_function=function if asyncio.iscoroutinefunction(function) else None,
+        )
+
+        self.tools[name] = tool
+        logger.info(f"Added tool '{name}' to MCP server '{self.name}'")
+
+    def add_resource(
+        self, name: str, uri: str, description: str = "", mime_type: str = "text/plain"
+    ):
+        """Add a resource to the MCP server.
+
+        Args:
+            name: Resource name
+            uri: Resource URI
+            description: Resource description
+            mime_type: MIME type of the resource
+        """
+        resource = MCPResource(
+            name=name, uri=uri, description=description, mime_type=mime_type
+        )
+
+        self.resources[name] = resource
+        logger.info(f"Added resource '{name}' to MCP server '{self.name}'")
+
+    async def execute_tool(self, tool_name: str, parameters: Dict[str, Any]) -> Any:
+        """Execute a tool asynchronously.
+
+        Args:
+            tool_name: Name of the tool to execute
+            parameters: Tool parameters
+
+        Returns:
+            Tool execution result
+        """
+        tool = self.tools.get(tool_name)
+        if not tool:
+            raise ValueError(f"Tool '{tool_name}' not found")
+
+        # Add context to parameters only if function accepts it
+        import inspect
+
+        if tool.async_function:
+            sig = inspect.signature(tool.async_function)
+        else:
+            sig = inspect.signature(tool.function)
+
+        if "_context" in sig.parameters:
+            params = {**parameters, "_context": self._context}
+        else:
+            params = parameters
+
+        if tool.async_function:
+            return await tool.async_function(**params)
+        elif tool.function:
+            # Run sync function in executor
+            loop = asyncio.get_event_loop()
+            from functools import partial
+
+            func = partial(tool.function, **params)
+            return await loop.run_in_executor(None, func)
+        else:
+            raise ValueError(f"Tool '{tool_name}' has no implementation")
+
+    def execute_tool_sync(self, tool_name: str, parameters: Dict[str, Any]) -> Any:
+        """Execute a tool synchronously.
+
+        Args:
+            tool_name: Name of the tool to execute
+            parameters: Tool parameters
+
+        Returns:
+            Tool execution result
+        """
+        tool = self.tools.get(tool_name)
+        if not tool:
+            raise ValueError(f"Tool '{tool_name}' not found")
+
+        if tool.function:
+            # Check if function accepts _context parameter
+            import inspect
+
+            sig = inspect.signature(tool.function)
+            if "_context" in sig.parameters:
+                params = {**parameters, "_context": self._context}
+            else:
+                params = parameters
+            return tool.function(**params)
+        else:
+            raise ValueError(f"Tool '{tool_name}' requires async execution")
+
+    def get_resource(self, resource_name: str) -> Optional[MCPResource]:
+        """Get a resource by name.
+
+        Args:
+            resource_name: Resource name
+
+        Returns:
+            Resource if found
+        """
+        return self.resources.get(resource_name)
+
+    def set_context(self, key: str, value: Any):
+        """Set context value.
+
+        Args:
+            key: Context key
+            value: Context value
+        """
+        self._context[key] = value
+
+    def get_context(self, key: str) -> Any:
+        """Get context value.
+
+        Args:
+            key: Context key
+
+        Returns:
+            Context value
+        """
+        return self._context.get(key)
+
+    def list_tools(self) -> List[Dict[str, Any]]:
+        """List all available tools.
+
+        Returns:
+            List of tool definitions
+        """
+        return [
+            {
+                "name": tool.name,
+                "description": tool.description,
+                "parameters": tool.parameters,
+            }
+            for tool in self.tools.values()
+        ]
+
+    def list_resources(self) -> List[Dict[str, Any]]:
+        """List all available resources.
+
+        Returns:
+            List of resource definitions
+        """
+        return [
+            {
+                "name": resource.name,
+                "uri": resource.uri,
+                "description": resource.description,
+                "mime_type": resource.mime_type,
+            }
+            for resource in self.resources.values()
+        ]
+
+    def to_mcp_protocol(self) -> Dict[str, Any]:
+        """Convert to MCP protocol format.
+
+        Returns:
+            MCP server definition
+        """
+        return {
+            "name": self.name,
+            "description": self.description,
+            "capabilities": self.capabilities,
+            "tools": self.list_tools(),
+            "resources": self.list_resources(),
+        }
+
+
+class MCPToolNode(AsyncNode):
+    """Node that executes MCP tools within a workflow.
+
+    This node allows workflows to use tools provided by MCP servers,
+    bridging the gap between workflow automation and AI-powered tools.
+
+    Example:
+        Using an MCP tool in a workflow:
+
+        >>> # Create node for specific tool
+        >>> search_node = MCPToolNode(
+        ...     mcp_server="tools",
+        ...     tool_name="web_search"
+        ... )
+        >>> # Add to workflow
+        >>> # workflow.add_node("search", search_node) # doctest: +SKIP
+        >>> # Execute with parameters
+        >>> # result = workflow.run({"search": {"query": "Kailash SDK documentation"}}) # doctest: +SKIP
+    """
+
+    def __init__(
+        self, mcp_server: str, tool_name: str, parameter_mapping: Dict[str, str] = None
+    ):
+        """Initialize MCP tool node.
+
+        Args:
+            mcp_server: Name of the MCP server
+            tool_name: Name of the tool to execute
+            parameter_mapping: Map input keys to tool parameters
+        """
+        super().__init__()
+        self.mcp_server = mcp_server
+        self.tool_name = tool_name
+        self.parameter_mapping = parameter_mapping or {}
+        self._mcp_integration: Optional[MCPIntegration] = None
+
+    def set_mcp_integration(self, mcp: MCPIntegration):
+        """Set the MCP integration instance."""
+        self._mcp_integration = mcp
+
+    def get_parameters(self) -> Dict[str, Any]:
+        """Get node parameters.
+
+        Returns:
+            Dictionary of parameters
+        """
+        # For MCP tools, parameters are dynamic based on the tool
+        return {}
+
+    def validate_inputs(self, **kwargs) -> Dict[str, Any]:
+        """Validate runtime inputs.
+
+        For MCPToolNode, we accept any inputs since the parameters
+        are dynamic based on the MCP tool being used.
+
+        Args:
+            **kwargs: Runtime inputs
+
+        Returns:
+            All inputs as-is
+        """
+        # For MCP tools, pass through all inputs without validation
+        # The actual validation happens in the MCP tool itself
+        return kwargs
+
+    def run(self, **kwargs) -> Any:
+        """Run the node synchronously.
+
+        Args:
+            **kwargs: Input parameters
+
+        Returns:
+            Execution result
+        """
+        if not self._mcp_integration:
+            raise RuntimeError("MCP integration not set")
+
+        # Map parameters if needed
+        tool_params = {}
+        for input_key, tool_key in self.parameter_mapping.items():
+            if input_key in kwargs:
+                tool_params[tool_key] = kwargs[input_key]
+
+        # Add unmapped parameters
+        for key, value in kwargs.items():
+            if key not in self.parameter_mapping:
+                tool_params[key] = value
+
+        # Use synchronous execution
+        result = self._mcp_integration.execute_tool_sync(self.tool_name, tool_params)
+
+        # Ensure result is wrapped in a dict for consistency
+        if not isinstance(result, dict):
+            return {"result": result}
+        return result
+
+    async def async_run(self, **kwargs) -> Dict[str, Any]:
+        """Run the node asynchronously.
+
+        Args:
+            **kwargs: Input parameters
+
+        Returns:
+            Dictionary of outputs
+        """
+        if not self._mcp_integration:
+            raise RuntimeError("MCP integration not set")
+
+        # Map parameters if needed
+        tool_params = {}
+        for input_key, tool_key in self.parameter_mapping.items():
+            if input_key in kwargs:
+                tool_params[tool_key] = kwargs[input_key]
+
+        # Add unmapped parameters
+        for key, value in kwargs.items():
+            if key not in self.parameter_mapping:
+                tool_params[key] = value
+
+        # Execute tool asynchronously
+        result = await self._mcp_integration.execute_tool(self.tool_name, tool_params)
+
+        # Ensure result is wrapped in a dict for consistency
+        if not isinstance(result, dict):
+            return {"result": result}
+        return result
+
+
+def create_example_mcp_server() -> MCPIntegration:
+    """Create an example MCP server with common tools."""
+
+    mcp = MCPIntegration("example_tools", "Example MCP server with utility tools")
+
+    # Add search tool
+    async def web_search(query: str, max_results: int = 10, **kwargs):
+        """Simulate web search."""
+        return {
+            "query": query,
+            "results": [
+                {"title": f"Result {i}", "url": f"https://example.com/{i}"}
+                for i in range(max_results)
+            ],
+        }
+
+    mcp.add_tool(
+        "web_search",
+        web_search,
+        "Search the web",
+        {
+            "query": {"type": "string", "required": True},
+            "max_results": {"type": "integer", "default": 10},
+        },
+    )
+
+    # Add calculator tool
+    def calculate(expression: str, **kwargs):
+        """Evaluate mathematical expression."""
+        try:
+            # Safe evaluation of mathematical expressions
+            import ast
+            import operator as op
+
+            # Operators would be used for safe eval implementation
+            # Currently using simple eval for the expression
+            _ = {
+                ast.Add: op.add,
+                ast.Sub: op.sub,
+                ast.Mult: op.mul,
+                ast.Div: op.truediv,
+                ast.Pow: op.pow,
+            }
+
+            def eval_expr(expr):
+                return eval(expr, {"__builtins__": {}}, {})
+
+            result = eval_expr(expression)
+            return {"expression": expression, "result": result}
+        except Exception as e:
+            return {"error": str(e)}
+
+    mcp.add_tool(
+        "calculate",
+        calculate,
+        "Evaluate mathematical expressions",
+        {"expression": {"type": "string", "required": True}},
+    )
+
+    # Add resources
+    mcp.add_resource(
+        "documentation", "https://docs.kailash.io", "Kailash SDK documentation"
+    )
+
+    mcp.add_resource(
+        "examples",
+        "https://github.com/kailash/examples",
+        "Example workflows and patterns",
+    )
+
+    return mcp
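
As a quick orientation to the new module above, the sketch below wires the bundled example server to an MCPToolNode and calls the node directly. In a real workflow the node would be driven by the Kailash runtime rather than by calling run() by hand, and the printed values are illustrative only.

    from kailash.api.mcp_integration import MCPToolNode, create_example_mcp_server

    # Build the example server shipped in this module (web_search + calculate tools)
    mcp = create_example_mcp_server()
    print(mcp.list_tools())  # [{'name': 'web_search', ...}, {'name': 'calculate', ...}]

    # Bind a node to the synchronous "calculate" tool and invoke it directly
    node = MCPToolNode(mcp_server="example_tools", tool_name="calculate")
    node.set_mcp_integration(mcp)
    print(node.run(expression="2 + 3"))  # {'expression': '2 + 3', 'result': 5}
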
@@ -116,7 +116,7 @@ class WorkflowAPI:
         """Setup API routes dynamically based on workflow."""
 
         # Main execution endpoint
-        @self.app.post("/execute", response_model=WorkflowResponse)
+        @self.app.post("/execute")
         async def execute_workflow(
             request: WorkflowRequest, background_tasks: BackgroundTasks
         ):
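
Dropping response_model=WorkflowResponse means FastAPI no longer validates or filters the handler's return value against that schema; the raw dict is serialized as-is. A minimal sketch of the difference, using a standalone FastAPI app with hypothetical handler contents:

    from fastapi import FastAPI

    app = FastAPI()

    # With response_model=SomeModel, FastAPI coerces and filters the return value.
    # Without it, whatever dict the handler returns is sent back unchanged:
    @app.post("/execute")
    async def execute_workflow(payload: dict) -> dict:
        return {"status": "ok", "outputs": payload}
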
@@ -143,18 +143,34 @@ class WorkflowAPI:
         @self.app.get("/workflow/info")
         async def get_workflow_info():
             """Get workflow metadata and structure."""
-            graph_data = self.workflow_graph
+            workflow = self.workflow_graph
+
+            # Get node information
+            nodes = []
+            for node_id, node_instance in workflow.nodes.items():
+                nodes.append({"id": node_id, "type": node_instance.node_type})
+
+            # Get edge information
+            edges = []
+            for conn in workflow.connections:
+                edges.append(
+                    {
+                        "source": conn.source_node,
+                        "target": conn.target_node,
+                        "source_output": conn.source_output,
+                        "target_input": conn.target_input,
+                    }
+                )
+
             return {
-                "id": self.workflow_id,
-                "version": self.version,
-                "nodes": list(graph_data.nodes()),
-                "edges": list(graph_data.edges()),
-                "input_nodes": [
-                    n for n in graph_data.nodes() if graph_data.in_degree(n) == 0
-                ],
-                "output_nodes": [
-                    n for n in graph_data.nodes() if graph_data.out_degree(n) == 0
-                ],
+                "workflow_id": workflow.workflow_id,
+                "name": workflow.name,
+                "description": workflow.description,
+                "version": workflow.version,
+                "nodes": nodes,
+                "edges": edges,
+                "node_count": len(nodes),
+                "edge_count": len(edges),
             }
 
         # Health check
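
Based on the new handler, /workflow/info now returns explicit node and edge records plus counts instead of raw graph data. A sketch of the response shape (the keys match the code above; the values are illustrative):

    {
        "workflow_id": "wf-001",
        "name": "example_workflow",
        "description": "Example description",
        "version": "1.0",
        "nodes": [{"id": "reader", "type": "CSVReaderNode"}],
        "edges": [
            {
                "source": "reader",
                "target": "writer",
                "source_output": "data",
                "target_input": "data",
            }
        ],
        "node_count": 1,
        "edge_count": 1,
    }
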
@@ -179,7 +195,7 @@ class WorkflowAPI:
 
             # Execute workflow with inputs
             results = await asyncio.to_thread(
-                self.runtime.execute, self.workflow_graph, request.inputs
+                self.runtime.execute, self.workflow_graph, parameters=request.inputs
             )
 
             # Handle tuple return from runtime
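
The API server now passes workflow inputs to runtime.execute through the parameters keyword rather than positionally, which suggests the runtime expects inputs under that keyword. A minimal sketch mirroring the call above, with runtime, workflow, and inputs assumed to exist already (names are illustrative):

    # 0.1.3-style call (positional):
    # results = runtime.execute(workflow, inputs)

    # 0.1.4-style call (keyword argument):
    results = runtime.execute(workflow, parameters=inputs)
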
@@ -13,8 +13,8 @@ from .ai_providers import (
     get_available_providers,
     get_provider,
 )
-from .embedding_generator import EmbeddingGenerator
-from .llm_agent import LLMAgent
+from .embedding_generator import EmbeddingGeneratorNode
+from .llm_agent import LLMAgentNode
 from .models import (
     ModelPredictor,
     NamedEntityRecognizer,
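
The agent and embedding classes are re-exported under Node-suffixed names, so downstream imports need the same rename. A sketch of the before/after imports, assuming this __init__ belongs to the kailash.nodes.ai package; the package path is inferred from the relative imports above, not stated in the diff:

    # 0.1.3
    # from kailash.nodes.ai import LLMAgent, EmbeddingGenerator

    # 0.1.4
    from kailash.nodes.ai import LLMAgentNode, EmbeddingGeneratorNode
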
@@ -30,9 +30,9 @@ __all__ = [
     "RetrievalAgent",
     "FunctionCallingAgent",
     "PlanningAgent",
-    "LLMAgent",
+    "LLMAgentNode",
     # Embedding and Vector Operations
-    "EmbeddingGenerator",
+    "EmbeddingGeneratorNode",
     # Provider Infrastructure
     "LLMProvider",
     "OllamaProvider",
@@ -333,7 +333,7 @@ class PlanningAgent(Node):
             # Data processing workflow
             potential_steps = [
                 {
-                    "tool": "CSVReader",
+                    "tool": "CSVReaderNode",
                     "description": "Read input data",
                     "parameters": {"file_path": "input.csv"},
                 },
@@ -348,7 +348,7 @@ class PlanningAgent(Node):
                     "parameters": {"group_by": "category", "operation": "sum"},
                 },
                 {
-                    "tool": "CSVWriter",
+                    "tool": "CSVWriterNode",
                     "description": "Write results",
                     "parameters": {"file_path": "output.csv"},
                 },
@@ -357,7 +357,7 @@ class PlanningAgent(Node):
             # Text analysis workflow
             potential_steps = [
                 {
-                    "tool": "TextReader",
+                    "tool": "TextReaderNode",
                     "description": "Read text data",
                     "parameters": {"file_path": "text.txt"},
                 },
@@ -372,7 +372,7 @@ class PlanningAgent(Node):
                     "parameters": {"max_length": 200},
                 },
                 {
-                    "tool": "JSONWriter",
+                    "tool": "JSONWriterNode",
                     "description": "Save analysis results",
                     "parameters": {"file_path": "analysis.json"},
                 },
@@ -1159,18 +1159,17 @@ def get_provider(
         ValueError: If the provider name is not recognized or doesn't support the requested type.
 
     Examples:
-
-        Get any provider::
-
-            provider = get_provider("openai")
-            if provider.supports_chat():
-                # Use for chat
-            if provider.supports_embeddings():
-                # Use for embeddings
-
-        Get chat-only provider:
-
-            chat_provider = get_provider("anthropic", "chat")
+        >>> # Get any provider
+        >>> provider = get_provider("openai")
+        >>> if provider.supports_chat():
+        ...     # Use for chat
+        ...     pass
+        >>> if provider.supports_embeddings():
+        ...     # Use for embeddings
+        ...     pass
+
+        >>> # Get chat-only provider
+        >>> chat_provider = get_provider("anthropic", "chat")
             response = chat_provider.chat(messages, model="claude-3-sonnet")
 
         Get embedding-only provider:
@@ -1223,18 +1222,15 @@ def get_available_providers(
         Dict mapping provider names to their availability and capabilities.
 
     Examples:
+        >>> # Get all providers
+        >>> all_providers = get_available_providers()
+        >>> for name, info in all_providers.items():
+        ...     print(f"{name}: Available={info['available']}, Chat={info['chat']}, Embeddings={info['embeddings']}")
 
-        Get all providers::
-
-            all_providers = get_available_providers()
-            for name, info in all_providers.items():
-                print(f"{name}: Available={info['available']}, Chat={info['chat']}, Embeddings={info['embeddings']}")
-
-        Get only chat providers:
-
-            chat_providers = get_available_providers("chat")
+        >>> # Get only chat providers
+        >>> chat_providers = get_available_providers("chat")
 
-        Get only embedding providers:
+        >>> # Get only embedding providers
 
             embed_providers = get_available_providers("embeddings")
     """