kailash 0.1.2__py3-none-any.whl → 0.1.4__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- kailash/__init__.py +1 -1
- kailash/api/__init__.py +17 -0
- kailash/api/gateway.py +394 -0
- kailash/api/mcp_integration.py +478 -0
- kailash/api/workflow_api.py +399 -0
- kailash/nodes/ai/__init__.py +4 -4
- kailash/nodes/ai/agents.py +4 -4
- kailash/nodes/ai/ai_providers.py +18 -22
- kailash/nodes/ai/embedding_generator.py +34 -38
- kailash/nodes/ai/llm_agent.py +351 -356
- kailash/nodes/api/http.py +0 -4
- kailash/nodes/api/rest.py +1 -1
- kailash/nodes/base.py +60 -64
- kailash/nodes/code/python.py +61 -42
- kailash/nodes/data/__init__.py +10 -10
- kailash/nodes/data/readers.py +27 -29
- kailash/nodes/data/retrieval.py +1 -1
- kailash/nodes/data/sharepoint_graph.py +23 -25
- kailash/nodes/data/sql.py +27 -29
- kailash/nodes/data/vector_db.py +2 -2
- kailash/nodes/data/writers.py +41 -44
- kailash/nodes/logic/__init__.py +10 -3
- kailash/nodes/logic/async_operations.py +14 -14
- kailash/nodes/logic/operations.py +18 -22
- kailash/nodes/logic/workflow.py +439 -0
- kailash/nodes/mcp/client.py +29 -33
- kailash/nodes/mcp/resource.py +1 -1
- kailash/nodes/mcp/server.py +10 -4
- kailash/nodes/transform/formatters.py +1 -1
- kailash/nodes/transform/processors.py +5 -3
- kailash/runtime/docker.py +2 -0
- kailash/tracking/metrics_collector.py +6 -7
- kailash/tracking/models.py +0 -20
- kailash/tracking/storage/database.py +4 -4
- kailash/tracking/storage/filesystem.py +0 -1
- kailash/utils/export.py +2 -2
- kailash/utils/templates.py +16 -16
- kailash/visualization/performance.py +7 -7
- kailash/visualization/reports.py +1 -1
- kailash/workflow/graph.py +4 -4
- kailash/workflow/mock_registry.py +1 -1
- {kailash-0.1.2.dist-info → kailash-0.1.4.dist-info}/METADATA +198 -27
- kailash-0.1.4.dist-info/RECORD +85 -0
- kailash-0.1.2.dist-info/RECORD +0 -80
- {kailash-0.1.2.dist-info → kailash-0.1.4.dist-info}/WHEEL +0 -0
- {kailash-0.1.2.dist-info → kailash-0.1.4.dist-info}/entry_points.txt +0 -0
- {kailash-0.1.2.dist-info → kailash-0.1.4.dist-info}/licenses/LICENSE +0 -0
- {kailash-0.1.2.dist-info → kailash-0.1.4.dist-info}/top_level.txt +0 -0
kailash/api/workflow_api.py
ADDED
@@ -0,0 +1,399 @@
+"""
+Lean API wrapper for Kailash workflows using FastAPI.
+
+This module provides a general-purpose API wrapper that can expose any Kailash
+workflow as a REST API with minimal configuration.
+"""
+
+import asyncio
+from contextlib import asynccontextmanager
+from enum import Enum
+from typing import Any, Dict, List, Optional, Union
+
+import uvicorn
+from fastapi import BackgroundTasks, FastAPI, HTTPException
+from fastapi.responses import StreamingResponse
+from pydantic import BaseModel, Field
+
+from kailash.runtime.local import LocalRuntime
+from kailash.workflow.builder import WorkflowBuilder
+from kailash.workflow.graph import Workflow
+
+
+class ExecutionMode(str, Enum):
+    """Execution modes for workflow API."""
+
+    SYNC = "sync"
+    ASYNC = "async"
+    STREAM = "stream"
+
+
+class WorkflowRequest(BaseModel):
+    """Base request model for workflow execution."""
+
+    inputs: Dict[str, Any] = Field(..., description="Input data for workflow nodes")
+    config: Optional[Dict[str, Any]] = Field(
+        None, description="Node configuration overrides"
+    )
+    mode: ExecutionMode = Field(ExecutionMode.SYNC, description="Execution mode")
+
+
+class WorkflowResponse(BaseModel):
+    """Base response model for workflow execution."""
+
+    outputs: Dict[str, Any] = Field(..., description="Output data from workflow nodes")
+    execution_time: float = Field(..., description="Execution time in seconds")
+    workflow_id: str = Field(..., description="Workflow identifier")
+    version: str = Field(..., description="Workflow version")
+
+
+class WorkflowAPI:
+    """
+    Lean API wrapper for Kailash workflows.
+
+    This class provides a minimal, efficient way to expose any Kailash workflow
+    as a REST API with support for synchronous, asynchronous, and streaming execution.
+
+    Example:
+        >>> # For any workflow
+        >>> from my_workflows import rag_workflow
+        >>> api = WorkflowAPI(rag_workflow)
+        >>> api.run(port=8000)
+    """
+
+    def __init__(
+        self,
+        workflow: Union[WorkflowBuilder, Workflow],
+        app_name: str = "Kailash Workflow API",
+        version: str = "1.0.0",
+        description: str = "API wrapper for Kailash workflow execution",
+    ):
+        """
+        Initialize the API wrapper.
+
+        Args:
+            workflow: The WorkflowBuilder or Workflow instance to expose
+            app_name: Name of the API application
+            version: API version
+            description: API description
+        """
+        if isinstance(workflow, WorkflowBuilder):
+            self.workflow = workflow
+            self.workflow_graph = workflow.build()
+            self.workflow_id = getattr(workflow, "workflow_id", "unnamed")
+            self.version = getattr(workflow, "version", "1.0.0")
+        else:  # Workflow instance
+            self.workflow = workflow
+            self.workflow_graph = workflow
+            self.workflow_id = workflow.workflow_id
+            self.version = workflow.version
+
+        self.runtime = LocalRuntime()
+
+        # Create FastAPI app with lifespan management
+        self.app = FastAPI(
+            title=app_name,
+            version=version,
+            description=description,
+            lifespan=self._lifespan,
+        )
+
+        # Setup routes
+        self._setup_routes()
+
+        # Cache for async executions
+        self._execution_cache: Dict[str, Dict[str, Any]] = {}
+
+    @asynccontextmanager
+    async def _lifespan(self, app: FastAPI):
+        """Manage app lifecycle."""
+        # Startup
+        yield
+        # Shutdown - cleanup cache
+        self._execution_cache.clear()
+
+    def _setup_routes(self):
+        """Setup API routes dynamically based on workflow."""
+
+        # Main execution endpoint
+        @self.app.post("/execute")
+        async def execute_workflow(
+            request: WorkflowRequest, background_tasks: BackgroundTasks
+        ):
+            """Execute the workflow with provided inputs."""
+
+            if request.mode == ExecutionMode.SYNC:
+                return await self._execute_sync(request)
+            elif request.mode == ExecutionMode.ASYNC:
+                return await self._execute_async(request, background_tasks)
+            else:  # STREAM
+                return StreamingResponse(
+                    self._execute_stream(request), media_type="application/json"
+                )
+
+        # Status endpoint for async executions
+        @self.app.get("/status/{execution_id}")
+        async def get_execution_status(execution_id: str):
+            """Get status of async execution."""
+            if execution_id not in self._execution_cache:
+                raise HTTPException(status_code=404, detail="Execution not found")
+            return self._execution_cache[execution_id]
+
+        # Workflow metadata endpoint
+        @self.app.get("/workflow/info")
+        async def get_workflow_info():
+            """Get workflow metadata and structure."""
+            workflow = self.workflow_graph
+
+            # Get node information
+            nodes = []
+            for node_id, node_instance in workflow.nodes.items():
+                nodes.append({"id": node_id, "type": node_instance.node_type})
+
+            # Get edge information
+            edges = []
+            for conn in workflow.connections:
+                edges.append(
+                    {
+                        "source": conn.source_node,
+                        "target": conn.target_node,
+                        "source_output": conn.source_output,
+                        "target_input": conn.target_input,
+                    }
+                )
+
+            return {
+                "workflow_id": workflow.workflow_id,
+                "name": workflow.name,
+                "description": workflow.description,
+                "version": workflow.version,
+                "nodes": nodes,
+                "edges": edges,
+                "node_count": len(nodes),
+                "edge_count": len(edges),
+            }
+
+        # Health check
+        @self.app.get("/health")
+        async def health_check():
+            """Check API health."""
+            return {"status": "healthy", "workflow": self.workflow_id}
+
+    async def _execute_sync(self, request: WorkflowRequest) -> WorkflowResponse:
+        """Execute workflow synchronously."""
+        import time
+
+        start_time = time.time()
+
+        try:
+            # Apply configuration overrides if provided
+            if request.config:
+                for node_id, config in request.config.items():
+                    # This would need workflow builder enhancement to support
+                    # dynamic config updates
+                    pass
+
+            # Execute workflow with inputs
+            results = await asyncio.to_thread(
+                self.runtime.execute, self.workflow_graph, parameters=request.inputs
+            )
+
+            # Handle tuple return from runtime
+            if isinstance(results, tuple):
+                results = results[0] if results else {}
+
+            execution_time = time.time() - start_time
+
+            return WorkflowResponse(
+                outputs=results,
+                execution_time=execution_time,
+                workflow_id=self.workflow_id,
+                version=self.version,
+            )
+
+        except Exception as e:
+            raise HTTPException(status_code=500, detail=str(e))
+
+    async def _execute_async(
+        self, request: WorkflowRequest, background_tasks: BackgroundTasks
+    ):
+        """Execute workflow asynchronously."""
+        import uuid
+
+        execution_id = str(uuid.uuid4())
+
+        # Initialize cache entry
+        self._execution_cache[execution_id] = {
+            "status": "pending",
+            "workflow_id": self.workflow_id,
+            "version": self.version,
+        }
+
+        # Schedule background execution
+        background_tasks.add_task(self._run_async_execution, execution_id, request)
+
+        return {
+            "execution_id": execution_id,
+            "status": "pending",
+            "message": f"Execution started. Check status at /status/{execution_id}",
+        }
+
+    async def _run_async_execution(self, execution_id: str, request: WorkflowRequest):
+        """Run async execution in background."""
+        try:
+            self._execution_cache[execution_id]["status"] = "running"
+
+            result = await self._execute_sync(request)
+
+            self._execution_cache[execution_id].update(
+                {"status": "completed", "result": result.dict()}
+            )
+
+        except Exception as e:
+            self._execution_cache[execution_id].update(
+                {"status": "failed", "error": str(e)}
+            )
+
+    async def _execute_stream(self, request: WorkflowRequest):
+        """Execute workflow with streaming response."""
+        import json
+        import time
+
+        try:
+            # For streaming, we'd need workflow runner enhancement
+            # to support progress callbacks. For now, simulate with
+            # start/end events
+
+            yield json.dumps(
+                {
+                    "event": "start",
+                    "workflow_id": self.workflow_id,
+                    "timestamp": time.time(),
+                }
+            ) + "\n"
+
+            result = await self._execute_sync(request)
+
+            yield json.dumps(
+                {"event": "complete", "result": result.dict(), "timestamp": time.time()}
+            ) + "\n"
+
+        except Exception as e:
+            yield json.dumps(
+                {"event": "error", "error": str(e), "timestamp": time.time()}
+            ) + "\n"
+
+    def run(self, host: str = "0.0.0.0", port: int = 8000, **kwargs):
+        """Run the API server."""
+        uvicorn.run(self.app, host=host, port=port, **kwargs)
+
+
+# Specialized API wrapper for Hierarchical RAG workflows
+class HierarchicalRAGAPI(WorkflowAPI):
+    """
+    Specialized API wrapper for Hierarchical RAG workflows.
+
+    Provides RAG-specific endpoints and models for better developer experience.
+    """
+
+    def __init__(self, workflow: WorkflowBuilder, **kwargs):
+        super().__init__(workflow, **kwargs)
+        self._setup_rag_routes()
+
+    def _setup_rag_routes(self):
+        """Setup RAG-specific routes."""
+
+        class Document(BaseModel):
+            id: str
+            title: str
+            content: str
+
+        class RAGQuery(BaseModel):
+            query: str
+            top_k: int = 3
+            similarity_method: str = "cosine"
+            temperature: float = 0.7
+            max_tokens: int = 500
+
+        class RAGResponse(BaseModel):
+            answer: str
+            sources: List[Dict[str, Any]]
+            query: str
+            execution_time: float
+
+        @self.app.post("/documents")
+        async def add_documents(documents: List[Document]):
+            """Add documents to the knowledge base."""
+            # This would integrate with document storage
+            return {"message": f"Added {len(documents)} documents"}
+
+        @self.app.post("/query", response_model=RAGResponse)
+        async def query_rag(request: RAGQuery):
+            """Query the RAG system."""
+            import time
+
+            start_time = time.time()
+
+            # Transform to workflow format
+            workflow_request = WorkflowRequest(
+                inputs={
+                    "query": request.query,
+                    "config": {
+                        "relevance_scorer": {
+                            "top_k": request.top_k,
+                            "similarity_method": request.similarity_method,
+                        },
+                        "llm_agent": {
+                            "temperature": request.temperature,
+                            "max_tokens": request.max_tokens,
+                        },
+                    },
+                }
+            )
+
+            result = await self._execute_sync(workflow_request)
+
+            # Extract RAG-specific outputs
+            outputs = result.outputs
+            answer = (
+                outputs.get("llm_response", {})
+                .get("choices", [{}])[0]
+                .get("message", {})
+                .get("content", "")
+            )
+            sources = outputs.get("relevant_chunks", [])
+
+            return RAGResponse(
+                answer=answer,
+                sources=sources,
+                query=request.query,
+                execution_time=time.time() - start_time,
+            )
+
+
+# Factory function for creating API wrappers
+def create_workflow_api(
+    workflow: WorkflowBuilder, api_type: str = "generic", **kwargs
+) -> WorkflowAPI:
+    """
+    Factory function to create appropriate API wrapper.
+
+    Args:
+        workflow: The workflow to wrap
+        api_type: Type of API wrapper ("generic", "rag", etc.)
+        **kwargs: Additional arguments for API initialization
+
+    Returns:
+        Configured WorkflowAPI instance
+
+    Example:
+        >>> api = create_workflow_api(my_workflow, api_type="rag")
+        >>> api.run(port=8000)
+    """
+    api_classes = {
+        "generic": WorkflowAPI,
+        "rag": HierarchicalRAGAPI,
+    }
+
+    api_class = api_classes.get(api_type, WorkflowAPI)
+    return api_class(workflow, **kwargs)
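Taken together, the new module exposes four routes: POST /execute (with "mode" selecting sync, async, or stream), GET /status/{execution_id}, GET /workflow/info, and GET /health. A minimal client-side sketch of driving a server started with api.run(port=8000); the requests library and the input payload keys are illustrative, since inputs depend on the wrapped workflow's nodes:

import requests

BASE = "http://localhost:8000"

# Synchronous execution: blocks until the workflow finishes, then returns
# outputs, execution_time, workflow_id, and version.
resp = requests.post(
    f"{BASE}/execute",
    json={"inputs": {"reader": {"file_path": "input.csv"}}, "mode": "sync"},
)
print(resp.json()["outputs"])

# Asynchronous execution: returns an execution_id to poll via /status.
resp = requests.post(f"{BASE}/execute", json={"inputs": {}, "mode": "async"})
execution_id = resp.json()["execution_id"]
status = requests.get(f"{BASE}/status/{execution_id}").json()
print(status["status"])  # "pending", "running", "completed", or "failed"

Note that async results live in an in-process dict (_execution_cache) that is cleared on shutdown, so they neither survive a restart nor are shared across multiple workers.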
kailash/nodes/ai/__init__.py
CHANGED
@@ -13,8 +13,8 @@ from .ai_providers import (
     get_available_providers,
     get_provider,
 )
-from .embedding_generator import EmbeddingGenerator
-from .llm_agent import LLMAgent
+from .embedding_generator import EmbeddingGeneratorNode
+from .llm_agent import LLMAgentNode
 from .models import (
     ModelPredictor,
     NamedEntityRecognizer,
@@ -30,9 +30,9 @@ __all__ = [
     "RetrievalAgent",
     "FunctionCallingAgent",
     "PlanningAgent",
-    "LLMAgent",
+    "LLMAgentNode",
     # Embedding and Vector Operations
-    "EmbeddingGenerator",
+    "EmbeddingGeneratorNode",
     # Provider Infrastructure
     "LLMProvider",
     "OllamaProvider",
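The practical effect of this hunk is a rename of the module's public exports. The removed identifiers are truncated in the diff; EmbeddingGenerator is confirmed by the class hunk in embedding_generator.py below, and LLMAgent is inferred from the same Node-suffix rename pattern. A migration sketch:

# 0.1.2 imports now fail with ImportError:
# from kailash.nodes.ai import EmbeddingGenerator, LLMAgent

# 0.1.4 equivalents:
from kailash.nodes.ai import EmbeddingGeneratorNode, LLMAgentNode

embedder = EmbeddingGeneratorNode()
agent = LLMAgentNode()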
kailash/nodes/ai/agents.py
CHANGED
@@ -333,7 +333,7 @@ class PlanningAgent(Node):
         # Data processing workflow
         potential_steps = [
             {
-                "tool": "CSVReader",
+                "tool": "CSVReaderNode",
                 "description": "Read input data",
                 "parameters": {"file_path": "input.csv"},
             },
@@ -348,7 +348,7 @@ class PlanningAgent(Node):
                 "parameters": {"group_by": "category", "operation": "sum"},
             },
             {
-                "tool": "CSVWriter",
+                "tool": "CSVWriterNode",
                 "description": "Write results",
                 "parameters": {"file_path": "output.csv"},
             },
@@ -357,7 +357,7 @@ class PlanningAgent(Node):
         # Text analysis workflow
         potential_steps = [
             {
-                "tool": "TextReader",
+                "tool": "TextReaderNode",
                 "description": "Read text data",
                 "parameters": {"file_path": "text.txt"},
             },
@@ -372,7 +372,7 @@ class PlanningAgent(Node):
                 "parameters": {"max_length": 200},
             },
             {
-                "tool": "JSONWriter",
+                "tool": "JSONWriterNode",
                 "description": "Save analysis results",
                 "parameters": {"file_path": "analysis.json"},
             },
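The same Node-suffix rename applies to the tool names in the candidate plans PlanningAgent builds (the truncated removed values are inferred from that pattern). A sketch of a 0.1.4-style data-processing plan using the values visible in the hunks; the aggregation step between reader and writer is elided by the diff context and omitted here:

# Candidate plan steps under 0.1.4 tool naming (plain dicts, as in the source).
potential_steps = [
    {
        "tool": "CSVReaderNode",
        "description": "Read input data",
        "parameters": {"file_path": "input.csv"},
    },
    {
        "tool": "CSVWriterNode",
        "description": "Write results",
        "parameters": {"file_path": "output.csv"},
    },
]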
kailash/nodes/ai/ai_providers.py
CHANGED
@@ -1159,18 +1159,17 @@ def get_provider(
         ValueError: If the provider name is not recognized or doesn't support the requested type.
 
     Examples:
-
-
-
-
-
-
-
-
-
-        Get chat-only provider
-
-        chat_provider = get_provider("anthropic", "chat")
+        >>> # Get any provider
+        >>> provider = get_provider("openai")
+        >>> if provider.supports_chat():
+        ...     # Use for chat
+        ...     pass
+        >>> if provider.supports_embeddings():
+        ...     # Use for embeddings
+        ...     pass
+
+        >>> # Get chat-only provider
+        >>> chat_provider = get_provider("anthropic", "chat")
         response = chat_provider.chat(messages, model="claude-3-sonnet")
 
     Get embedding-only provider:
@@ -1223,18 +1222,15 @@ def get_available_providers(
         Dict mapping provider names to their availability and capabilities.
 
     Examples:
+        >>> # Get all providers
+        >>> all_providers = get_available_providers()
+        >>> for name, info in all_providers.items():
+        ...     print(f"{name}: Available={info['available']}, Chat={info['chat']}, Embeddings={info['embeddings']}")
 
-        Get all providers:
-
-        all_providers = get_available_providers()
-        for name, info in all_providers.items():
-            print(f"{name}: Available={info['available']}, Chat={info['chat']}, Embeddings={info['embeddings']}")
-
-        Get only chat providers:
-
-        chat_providers = get_available_providers("chat")
+        >>> # Get only chat providers
+        >>> chat_providers = get_available_providers("chat")
 
-        Get only embedding providers
+        >>> # Get only embedding providers
 
         embed_providers = get_available_providers("embeddings")
     """
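Read together, the reworked docstrings suggest a capability-aware lookup: filter get_available_providers() by capability, then fetch a typed provider with get_provider(). A sketch assuming the documented signatures; the assumption that the filtered call returns the same info mapping (with an "available" flag), plus the message content and model name, are illustrative:

from kailash.nodes.ai.ai_providers import get_available_providers, get_provider

# Names of installed providers that support chat.
chat_ready = [
    name
    for name, info in get_available_providers("chat").items()
    if info["available"]
]

if chat_ready:
    provider = get_provider(chat_ready[0], "chat")
    # chat(messages, model=...) follows the docstring example above.
    response = provider.chat(
        [{"role": "user", "content": "Summarize this document."}],
        model="claude-3-sonnet",
    )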
kailash/nodes/ai/embedding_generator.py
CHANGED
@@ -7,7 +7,7 @@ from kailash.nodes.base import Node, NodeParameter, register_node
 
 
 @register_node()
-class EmbeddingGenerator(Node):
+class EmbeddingGeneratorNode(Node):
     """
     Vector embedding generator for RAG systems and semantic similarity operations.
 
@@ -61,46 +61,42 @@ class EmbeddingGenerator(Node):
     - Updates usage statistics and cost tracking
 
     Examples:
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-        )
-
-
-
-
-
-
-            embedding_1=[0.1, 0.2, 0.3, ...],
-            embedding_2=[0.15, 0.25, 0.35, ...],
-            similarity_metric="cosine"
-        )
+        >>> # Single text embedding
+        >>> embedder = EmbeddingGeneratorNode()
+        >>> result = embedder.run(
+        ...     provider="openai",
+        ...     model="text-embedding-3-large",
+        ...     input_text="This is a sample document to embed",
+        ...     operation="embed_text"
+        ... )
+
+        >>> # Batch document embedding
+        >>> batch_embedder = EmbeddingGeneratorNode()
+        >>> result = batch_embedder.run(
+        ...     provider="huggingface",
+        ...     model="sentence-transformers/all-MiniLM-L6-v2",
+        ...     input_texts=[
+        ...         "First document content...",
+        ...         "Second document content...",
+        ...         "Third document content..."
+        ...     ],
+        ...     operation="embed_batch",
+        ...     batch_size=32,
+        ...     cache_enabled=True
+        ... )
+
+        >>> # Similarity calculation
+        >>> similarity = EmbeddingGeneratorNode()
+        >>> result = similarity.run(
+        ...     operation="calculate_similarity",
+        ...     embedding_1=[0.1, 0.2, 0.3],  # ... removed for doctest
+        ...     embedding_2=[0.15, 0.25, 0.35],  # ... removed for doctest
+        ...     similarity_metric="cosine"
+        ... )
 
     Cached embedding with MCP integration:
 
-        mcp_embedder = EmbeddingGenerator()
+        mcp_embedder = EmbeddingGeneratorNode()
         result = mcp_embedder.run(
             provider="azure",
             model="text-embedding-3-small",
|