PyPI - kailash - Versions diffs - 0.1.0__py3-none-any.whl - Mend

kailash 0.1.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (69) hide show

kailash/__init__.py +31 -0
kailash/__main__.py +11 -0
kailash/cli/__init__.py +5 -0
kailash/cli/commands.py +563 -0
kailash/manifest.py +778 -0
kailash/nodes/__init__.py +23 -0
kailash/nodes/ai/__init__.py +26 -0
kailash/nodes/ai/agents.py +417 -0
kailash/nodes/ai/models.py +488 -0
kailash/nodes/api/__init__.py +52 -0
kailash/nodes/api/auth.py +567 -0
kailash/nodes/api/graphql.py +480 -0
kailash/nodes/api/http.py +598 -0
kailash/nodes/api/rate_limiting.py +572 -0
kailash/nodes/api/rest.py +665 -0
kailash/nodes/base.py +1032 -0
kailash/nodes/base_async.py +128 -0
kailash/nodes/code/__init__.py +32 -0
kailash/nodes/code/python.py +1021 -0
kailash/nodes/data/__init__.py +125 -0
kailash/nodes/data/readers.py +496 -0
kailash/nodes/data/sharepoint_graph.py +623 -0
kailash/nodes/data/sql.py +380 -0
kailash/nodes/data/streaming.py +1168 -0
kailash/nodes/data/vector_db.py +964 -0
kailash/nodes/data/writers.py +529 -0
kailash/nodes/logic/__init__.py +6 -0
kailash/nodes/logic/async_operations.py +702 -0
kailash/nodes/logic/operations.py +551 -0
kailash/nodes/transform/__init__.py +5 -0
kailash/nodes/transform/processors.py +379 -0
kailash/runtime/__init__.py +6 -0
kailash/runtime/async_local.py +356 -0
kailash/runtime/docker.py +697 -0
kailash/runtime/local.py +434 -0
kailash/runtime/parallel.py +557 -0
kailash/runtime/runner.py +110 -0
kailash/runtime/testing.py +347 -0
kailash/sdk_exceptions.py +307 -0
kailash/tracking/__init__.py +7 -0
kailash/tracking/manager.py +885 -0
kailash/tracking/metrics_collector.py +342 -0
kailash/tracking/models.py +535 -0
kailash/tracking/storage/__init__.py +0 -0
kailash/tracking/storage/base.py +113 -0
kailash/tracking/storage/database.py +619 -0
kailash/tracking/storage/filesystem.py +543 -0
kailash/utils/__init__.py +0 -0
kailash/utils/export.py +924 -0
kailash/utils/templates.py +680 -0
kailash/visualization/__init__.py +62 -0
kailash/visualization/api.py +732 -0
kailash/visualization/dashboard.py +951 -0
kailash/visualization/performance.py +808 -0
kailash/visualization/reports.py +1471 -0
kailash/workflow/__init__.py +15 -0
kailash/workflow/builder.py +245 -0
kailash/workflow/graph.py +827 -0
kailash/workflow/mermaid_visualizer.py +628 -0
kailash/workflow/mock_registry.py +63 -0
kailash/workflow/runner.py +302 -0
kailash/workflow/state.py +238 -0
kailash/workflow/visualization.py +588 -0
kailash-0.1.0.dist-info/METADATA +710 -0
kailash-0.1.0.dist-info/RECORD +69 -0
kailash-0.1.0.dist-info/WHEEL +5 -0
kailash-0.1.0.dist-info/entry_points.txt +2 -0
kailash-0.1.0.dist-info/licenses/LICENSE +21 -0
kailash-0.1.0.dist-info/top_level.txt +1 -0

kailash/nodes/api/http.py ADDED Viewed

@@ -0,0 +1,598 @@
+"""HTTP client nodes for making requests to external APIs.
+This module provides nodes for making HTTP requests to external services.
+Both synchronous and asynchronous versions are provided to support different workflow
+execution modes.
+Key Components:
+- HTTPRequestNode: Synchronous HTTP client node
+- AsyncHTTPRequestNode: Asynchronous HTTP client node
+- HTTPMethod, ResponseFormat, HTTPResponse: Supporting enums and response model
+"""
+import asyncio
+from enum import Enum
+from typing import Any, Dict, Optional
+import aiohttp
+import requests
+from pydantic import BaseModel
+from kailash.nodes.base import Node, NodeParameter, register_node
+from kailash.nodes.base_async import AsyncNode
+from kailash.sdk_exceptions import NodeExecutionError, NodeValidationError
+class HTTPMethod(str, Enum):
+    """HTTP methods supported by the HTTPRequestNode.
+    Members also subclass ``str``, so each one compares equal to its
+    upper-case verb (e.g. ``HTTPMethod.GET == "GET"``). The request nodes
+    upper-case the caller-supplied method and look it up in this enum; a
+    value that is not listed here is rejected with a NodeValidationError.
+    """
+    GET = "GET"
+    POST = "POST"
+    PUT = "PUT"
+    PATCH = "PATCH"
+    DELETE = "DELETE"
+    HEAD = "HEAD"
+    OPTIONS = "OPTIONS"
+class ResponseFormat(str, Enum):
+    """Response formats supported by the HTTPRequestNode.
+    Selects how the request nodes turn the response body into ``content``:
+    JSON is parsed, TEXT is decoded to ``str``, BINARY is returned as raw
+    bytes. AUTO picks one of those three from the Content-Type header
+    ("application/json" -> JSON, "text/..." -> TEXT, anything else -> BINARY).
+    """
+    JSON = "json"
+    TEXT = "text"
+    BINARY = "binary"
+    AUTO = "auto"  # Determine based on Content-Type header
+class HTTPResponse(BaseModel):
+    """Model for HTTP response data.
+    This model provides a consistent structure for HTTP responses
+    returned by the HTTPRequestNode. The nodes build one instance per
+    request and immediately convert it to a plain dict with ``model_dump()``.
+    """
+    # Numeric HTTP status code of the response
+    status_code: int
+    # Response headers copied into a plain dict
+    headers: Dict[str, str]
+    # Raw Content-Type header value; the nodes pass "" when the header is absent
+    content_type: Optional[str] = None
+    content: Any  # Can be dict, str, bytes depending on response format
+    # Time spent in the request call, in milliseconds
+    response_time_ms: float
+    # URL as reported by the response object
+    url: str
+@register_node(alias="HTTPRequest")
+class HTTPRequestNode(Node):
+    """Node for making HTTP requests to external APIs.
+    This node provides a flexible interface for making HTTP requests with support for:
+    - All common HTTP methods (GET, POST, PUT, PATCH, DELETE, HEAD, OPTIONS)
+    - Request bodies passed through as ``data`` or serialized as JSON (``json_data``)
+    - Custom headers and query parameters
+    - Response parsing (JSON, text, binary, or auto-detected from Content-Type)
+    - Retries with exponential backoff when the request itself fails
+    Requests are sent through a ``requests.Session`` created in ``__init__``.
+    Call ``close()`` or use the node in a ``with`` block to release it.
+    Design Purpose:
+    - Enable workflow integration with external HTTP APIs
+    - Provide a consistent interface for HTTP operations
+    - Support common authentication patterns
+    - Handle response parsing and error handling
+    Upstream Usage:
+    - Workflow: Creates and configures node for API integration
+    - Specialized API nodes: May extend this node for specific APIs
+    Downstream Consumers:
+    - Data processing nodes: Consume API response data
+    - Decision nodes: Route workflow based on API responses
+    - Custom nodes: Process API-specific data formats
+    """
+    def __init__(self, **kwargs):
+        """Initialize the HTTP request node.
+        All keyword arguments are forwarded unchanged to the base Node
+        constructor. The request parameters themselves (url, method, headers,
+        params, data, json_data, response_format, timeout, verify_ssl,
+        retry_count, retry_backoff) are described by ``get_parameters()`` and
+        read by ``run()``.
+        Args:
+            **kwargs: Parameters passed to base Node
+        """
+        super().__init__(**kwargs)
+        # One session per node, reused by every run() call on this instance.
+        self.session = requests.Session()
+    def close(self) -> None:
+        """Close the underlying requests.Session."""
+        self.session.close()
+    def __enter__(self):
+        """Context manager support for 'with' statements."""
+        return self
+    def __exit__(self, exc_type, exc_val, exc_tb):
+        """Close the session when exiting the context."""
+        self.close()
+    def get_parameters(self) -> Dict[str, NodeParameter]:
+        """Define the parameters this node accepts.
+        Returns:
+            Dictionary of parameter definitions
+        """
+        return {
+            "url": NodeParameter(
+                name="url",
+                type=str,
+                required=True,
+                description="URL to send the request to",
+            ),
+            # NOTE(review): marked required although a default exists and run()
+            # falls back to "GET" - confirm how the base Node treats this combination.
+            "method": NodeParameter(
+                name="method",
+                type=str,
+                required=True,
+                default="GET",
+                description="HTTP method (GET, POST, PUT, PATCH, DELETE)",
+            ),
+            "headers": NodeParameter(
+                name="headers",
+                type=dict,
+                required=False,
+                default={},
+                description="HTTP headers to include in the request",
+            ),
+            "params": NodeParameter(
+                name="params",
+                type=dict,
+                required=False,
+                default={},
+                description="Query parameters to include in the URL",
+            ),
+            "data": NodeParameter(
+                name="data",
+                type=Any,
+                required=False,
+                default=None,
+                description="Request body data (for POST, PUT, etc.)",
+            ),
+            "json_data": NodeParameter(
+                name="json_data",
+                type=dict,
+                required=False,
+                default=None,
+                description="JSON data to send (automatically sets Content-Type)",
+            ),
+            "response_format": NodeParameter(
+                name="response_format",
+                type=str,
+                required=False,
+                default="auto",
+                description="Format to parse response as (json, text, binary, auto)",
+            ),
+            "timeout": NodeParameter(
+                name="timeout",
+                type=int,
+                required=False,
+                default=30,
+                description="Request timeout in seconds",
+            ),
+            "verify_ssl": NodeParameter(
+                name="verify_ssl",
+                type=bool,
+                required=False,
+                default=True,
+                description="Whether to verify SSL certificates",
+            ),
+            "retry_count": NodeParameter(
+                name="retry_count",
+                type=int,
+                required=False,
+                default=0,
+                description="Number of times to retry failed requests",
+            ),
+            "retry_backoff": NodeParameter(
+                name="retry_backoff",
+                type=float,
+                required=False,
+                default=0.5,
+                description="Backoff factor for retries",
+            ),
+        }
+    def get_output_schema(self) -> Dict[str, NodeParameter]:
+        """Define the output schema for this node.
+        Returns:
+            Dictionary of output parameter definitions
+        """
+        return {
+            "response": NodeParameter(
+                name="response",
+                type=dict,
+                required=True,
+                description="HTTP response data including status, headers, and content",
+            ),
+            "status_code": NodeParameter(
+                name="status_code",
+                type=int,
+                required=True,
+                description="HTTP status code",
+            ),
+            "success": NodeParameter(
+                name="success",
+                type=bool,
+                required=True,
+                description="Whether the request was successful (status code 200-299)",
+            ),
+        }
+    def run(self, **kwargs) -> Dict[str, Any]:
+        """Execute an HTTP request.
+        Args:
+            url (str): The URL to send the request to
+            method (str): HTTP method to use (case-insensitive, defaults to GET)
+            headers (dict, optional): HTTP headers
+            params (dict, optional): Query parameters
+            data (dict/str, optional): Request body data; ignored when json_data is given
+            json_data (dict, optional): JSON data to send
+            response_format (str, optional): Format to parse response as
+            timeout (int, optional): Request timeout in seconds
+            verify_ssl (bool, optional): Whether to verify SSL certificates
+            retry_count (int, optional): Number of times to retry failed requests;
+                None or a negative value means no retries
+            retry_backoff (float, optional): Backoff factor for retries; the wait
+                before retry k is retry_backoff * 2 ** (k - 1) seconds
+        Returns:
+            Dictionary containing:
+                response: Dict form of HTTPResponse (status_code, headers,
+                    content_type, content, response_time_ms, url)
+                status_code: HTTP status code
+                success: True when the status code is in the 200-299 range
+        Raises:
+            NodeValidationError: If the method or response format is not supported
+            NodeExecutionError: If the request still fails with a
+                requests.RequestException after the last attempt. HTTP error
+                statuses (4xx/5xx) do not raise; they are reported through
+                ``success=False``.
+        """
+        import time
+        url = kwargs.get("url")
+        # "or" also covers an explicit None, which would otherwise crash on .upper()
+        method = (kwargs.get("method") or "GET").upper()
+        headers = kwargs.get("headers", {})
+        params = kwargs.get("params", {})
+        data = kwargs.get("data")
+        json_data = kwargs.get("json_data")
+        response_format = kwargs.get("response_format", "auto")
+        timeout = kwargs.get("timeout", 30)
+        verify_ssl = kwargs.get("verify_ssl", True)
+        # Clamp so that at least one attempt is always made; a negative count
+        # used to skip the loop entirely and crash on the missing response.
+        retry_count = max(0, kwargs.get("retry_count") or 0)
+        retry_backoff = kwargs.get("retry_backoff", 0.5)
+        # Validate method
+        try:
+            method = HTTPMethod(method)
+        except ValueError:
+            raise NodeValidationError(
+                f"Invalid HTTP method: {method}. "
+                f"Supported methods: {', '.join([m.value for m in HTTPMethod])}"
+            )
+        # Validate response format
+        try:
+            response_format = ResponseFormat(response_format)
+        except ValueError:
+            raise NodeValidationError(
+                f"Invalid response format: {response_format}. "
+                f"Supported formats: {', '.join([f.value for f in ResponseFormat])}"
+            )
+        # Prepare request kwargs
+        request_kwargs = {
+            "url": url,
+            "headers": headers,
+            "params": params,
+            "timeout": timeout,
+            "verify": verify_ssl,
+        }
+        # Add data or json based on what was provided (json_data wins)
+        if json_data is not None:
+            request_kwargs["json"] = json_data
+        elif data is not None:
+            request_kwargs["data"] = data
+        # Execute request with retries.
+        # .value keeps the log at e.g. "GET" however the interpreter formats
+        # str-mixin Enum members in f-strings.
+        self.logger.info(f"Making {method.value} request to {url}")
+        for attempt in range(retry_count + 1):
+            if attempt > 0:
+                wait_time = retry_backoff * (2 ** (attempt - 1))
+                self.logger.info(
+                    f"Retry attempt {attempt}/{retry_count} after {wait_time:.2f}s"
+                )
+                time.sleep(wait_time)
+            try:
+                # perf_counter is monotonic, so the elapsed time cannot be
+                # skewed by wall-clock adjustments.
+                start_time = time.perf_counter()
+                response = self.session.request(method=method.value, **request_kwargs)
+                response_time = (time.perf_counter() - start_time) * 1000  # Convert to ms
+                # Success, break the retry loop
+                break
+            except requests.RequestException as e:
+                self.logger.warning(f"Request failed: {str(e)}")
+                # Last attempt, no more retries
+                if attempt == retry_count:
+                    raise NodeExecutionError(
+                        f"HTTP request failed after {retry_count + 1} attempts: {str(e)}"
+                    ) from e
+        # Parse response based on format
+        content_type = response.headers.get("Content-Type", "")
+        if response_format == ResponseFormat.AUTO:
+            # Media types are case-insensitive, so compare in lower case
+            media_type = content_type.lower()
+            if "application/json" in media_type:
+                response_format = ResponseFormat.JSON
+            elif "text/" in media_type:
+                response_format = ResponseFormat.TEXT
+            else:
+                response_format = ResponseFormat.BINARY
+        try:
+            if response_format == ResponseFormat.JSON:
+                content = response.json()
+            elif response_format == ResponseFormat.TEXT:
+                content = response.text
+            elif response_format == ResponseFormat.BINARY:
+                content = response.content
+            else:
+                content = response.text  # Fallback to text
+        except Exception as e:
+            # Best effort: a body that does not match the requested format is
+            # still returned to the caller, as text.
+            self.logger.warning(
+                f"Failed to parse response as {response_format.value}: {str(e)}"
+            )
+            content = response.text  # Fallback to text
+        # Create response object
+        http_response = HTTPResponse(
+            status_code=response.status_code,
+            headers=dict(response.headers),
+            content_type=content_type,
+            content=content,
+            response_time_ms=response_time,
+            url=response.url,
+        ).model_dump()
+        # Return results
+        success = 200 <= response.status_code < 300
+        return {
+            "response": http_response,
+            "status_code": response.status_code,
+            "success": success,
+        }
+@register_node(alias="AsyncHTTPRequest")
+class AsyncHTTPRequestNode(AsyncNode):
+    """Asynchronous node for making HTTP requests to external APIs.
+    This node provides the same functionality as HTTPRequestNode but uses
+    asynchronous I/O (aiohttp) for better performance, especially for
+    concurrent requests.
+    The aiohttp session is created on first use and kept for later calls.
+    Use the node in an ``async with`` block, or await ``close()``, to release it.
+    Design Purpose:
+    - Enable efficient, non-blocking HTTP operations in workflows
+    - Provide the same interface as HTTPRequestNode but with async execution
+    - Support high-throughput API integrations with minimal overhead
+    Upstream Usage:
+    - AsyncLocalRuntime: Executes workflow with async support
+    - Specialized async API nodes: May extend this node
+    Downstream Consumers:
+    - Data processing nodes: Consume API response data
+    - Decision nodes: Route workflow based on API responses
+    """
+    def __init__(self, **kwargs):
+        """Initialize the async HTTP request node.
+        Args:
+            Same as HTTPRequestNode
+        """
+        super().__init__(**kwargs)
+        self._session = None  # aiohttp.ClientSession, created when first needed
+    def _get_session(self):
+        """Return the node's aiohttp session, creating it if missing or closed."""
+        if self._session is None or self._session.closed:
+            self._session = aiohttp.ClientSession()
+        return self._session
+    def get_parameters(self) -> Dict[str, NodeParameter]:
+        """Define the parameters this node accepts.
+        Returns:
+            Dictionary of parameter definitions
+        """
+        # Same parameters as the synchronous version. That method does not
+        # touch instance state, so it is called unbound instead of building a
+        # throwaway HTTPRequestNode (and its requests.Session).
+        return HTTPRequestNode.get_parameters(self)
+    def get_output_schema(self) -> Dict[str, NodeParameter]:
+        """Define the output schema for this node.
+        Returns:
+            Dictionary of output parameter definitions
+        """
+        # Same output schema as the synchronous version (see get_parameters)
+        return HTTPRequestNode.get_output_schema(self)
+    def run(self, **kwargs) -> Dict[str, Any]:
+        """Synchronous version of the request, for compatibility.
+        This is implemented for compatibility but users should use the
+        async_run method for better performance. The call is delegated to a
+        temporary HTTPRequestNode built from this node's config.
+        Args:
+            Same as HTTPRequestNode.run()
+        Returns:
+            Same as HTTPRequestNode.run()
+        Raises:
+            Same as HTTPRequestNode.run()
+        """
+        http_node = HTTPRequestNode(**self.config)
+        try:
+            return http_node.run(**kwargs)
+        finally:
+            # The helper node is single-use; release its requests.Session
+            http_node.session.close()
+    async def async_run(self, **kwargs) -> Dict[str, Any]:
+        """Execute an HTTP request asynchronously.
+        Args:
+            url (str): The URL to send the request to
+            method (str): HTTP method to use (case-insensitive, defaults to GET)
+            headers (dict, optional): HTTP headers
+            params (dict, optional): Query parameters
+            data (dict/str, optional): Request body data; ignored when json_data is given
+            json_data (dict, optional): JSON data to send
+            response_format (str, optional): Format to parse response as
+            timeout (int, optional): Total request timeout in seconds
+            verify_ssl (bool, optional): Whether to verify SSL certificates
+            retry_count (int, optional): Number of times to retry failed requests;
+                None or a negative value means no retries
+            retry_backoff (float, optional): Backoff factor for retries; the wait
+                before retry k is retry_backoff * 2 ** (k - 1) seconds
+        Returns:
+            Dictionary containing:
+                response: Dict form of HTTPResponse (status_code, headers,
+                    content_type, content, response_time_ms, url)
+                status_code: HTTP status code
+                success: True when the status code is in the 200-299 range
+        Raises:
+            NodeValidationError: If the method or response format is not supported
+            NodeExecutionError: If the request still fails with an
+                aiohttp.ClientError or a timeout after the last attempt. HTTP
+                error statuses (4xx/5xx) do not raise; they are reported
+                through ``success=False``.
+        """
+        import time
+        url = kwargs.get("url")
+        # "or" also covers an explicit None, which would otherwise crash on .upper()
+        method = (kwargs.get("method") or "GET").upper()
+        headers = kwargs.get("headers", {})
+        params = kwargs.get("params", {})
+        data = kwargs.get("data")
+        json_data = kwargs.get("json_data")
+        response_format = kwargs.get("response_format", "auto")
+        timeout = kwargs.get("timeout", 30)
+        verify_ssl = kwargs.get("verify_ssl", True)
+        # Clamp so that at least one attempt is always made
+        retry_count = max(0, kwargs.get("retry_count") or 0)
+        retry_backoff = kwargs.get("retry_backoff", 0.5)
+        # Validate method
+        try:
+            method = HTTPMethod(method)
+        except ValueError:
+            raise NodeValidationError(
+                f"Invalid HTTP method: {method}. "
+                f"Supported methods: {', '.join([m.value for m in HTTPMethod])}"
+            )
+        # Validate response format
+        try:
+            response_format = ResponseFormat(response_format)
+        except ValueError:
+            raise NodeValidationError(
+                f"Invalid response format: {response_format}. "
+                f"Supported formats: {', '.join([f.value for f in ResponseFormat])}"
+            )
+        # Create session if needed
+        session = self._get_session()
+        # Prepare request kwargs
+        request_kwargs = {
+            "url": url,
+            "headers": headers,
+            "params": params,
+            "timeout": aiohttp.ClientTimeout(total=timeout),
+        }
+        # Only override aiohttp's "ssl" option when verification is not simply
+        # "on". Leaving it unset keeps the library's default certificate checks;
+        # passing True is not treated as "verify" by every aiohttp release
+        # (NOTE(review): older releases appear to handle any non-None,
+        # non-SSLContext value as "do not verify" - confirm against the
+        # aiohttp versions this package supports).
+        if verify_ssl is not True:
+            request_kwargs["ssl"] = verify_ssl
+        # Add data or json based on what was provided (json_data wins)
+        if json_data is not None:
+            request_kwargs["json"] = json_data
+        elif data is not None:
+            request_kwargs["data"] = data
+        # Execute request with retries.
+        # .value keeps the log at e.g. "GET" however the interpreter formats
+        # str-mixin Enum members in f-strings.
+        self.logger.info(f"Making async {method.value} request to {url}")
+        for attempt in range(retry_count + 1):
+            if attempt > 0:
+                wait_time = retry_backoff * (2 ** (attempt - 1))
+                self.logger.info(
+                    f"Retry attempt {attempt}/{retry_count} after {wait_time:.2f}s"
+                )
+                await asyncio.sleep(wait_time)
+            try:
+                # perf_counter is monotonic, so the elapsed time cannot be
+                # skewed by wall-clock adjustments.
+                start_time = time.perf_counter()
+                async with session.request(
+                    method=method.value, **request_kwargs
+                ) as response:
+                    response_time = (time.perf_counter() - start_time) * 1000  # Convert to ms
+                    # Get content type
+                    content_type = response.headers.get("Content-Type", "")
+                    # Determine response format
+                    actual_format = response_format
+                    if actual_format == ResponseFormat.AUTO:
+                        # Media types are case-insensitive, so compare in lower case
+                        media_type = content_type.lower()
+                        if "application/json" in media_type:
+                            actual_format = ResponseFormat.JSON
+                        elif "text/" in media_type:
+                            actual_format = ResponseFormat.TEXT
+                        else:
+                            actual_format = ResponseFormat.BINARY
+                    # Parse response
+                    try:
+                        if actual_format == ResponseFormat.JSON:
+                            content = await response.json()
+                        elif actual_format == ResponseFormat.TEXT:
+                            content = await response.text()
+                        elif actual_format == ResponseFormat.BINARY:
+                            content = await response.read()
+                        else:
+                            content = await response.text()  # Fallback to text
+                    except Exception as e:
+                        # Best effort: a body that does not match the requested
+                        # format is still returned to the caller, as text.
+                        self.logger.warning(
+                            f"Failed to parse response as {actual_format.value}: {str(e)}"
+                        )
+                        content = await response.text()  # Fallback to text
+                    # Create response object
+                    http_response = HTTPResponse(
+                        status_code=response.status,
+                        headers=dict(response.headers),
+                        content_type=content_type,
+                        content=content,
+                        response_time_ms=response_time,
+                        url=str(response.url),
+                    ).model_dump()
+                    # Return results
+                    success = 200 <= response.status < 300
+                    return {
+                        "response": http_response,
+                        "status_code": response.status,
+                        "success": success,
+                    }
+            except (aiohttp.ClientError, asyncio.TimeoutError) as e:
+                self.logger.warning(f"Async request failed: {str(e)}")
+                # Last attempt, no more retries
+                if attempt == retry_count:
+                    raise NodeExecutionError(
+                        f"Async HTTP request failed after {retry_count + 1} attempts: {str(e)}"
+                    ) from e
+        # Defensive: every iteration above either returns or, on the last
+        # attempt, raises, so this line should not be reached.
+        raise NodeExecutionError(
+            f"Async HTTP request failed after {retry_count + 1} attempts."
+        )
+    async def close(self) -> None:
+        """Close the aiohttp session, if one was created."""
+        if self._session is not None:
+            await self._session.close()
+            self._session = None
+    async def __aenter__(self):
+        """Context manager support for 'async with' statements."""
+        self._get_session()
+        return self
+    async def __aexit__(self, exc_type, exc_val, exc_tb):
+        """Clean up session when exiting context."""
+        await self.close()