PyPI - ragaai-catalyst - Versions diffs - 2.2.4b5__py3-none-any.whl → 2.2.5b2__py3-none-any.whl - Mend

ragaai-catalyst 2.2.4b5__py3-none-any.whl → 2.2.5b2__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (45) hide show

ragaai_catalyst/tracers/agentic_tracing/tracers/tool_tracer.py DELETED Viewed

@@ -1,557 +0,0 @@
-import os
-import uuid
-from datetime import datetime
-from langchain_core.tools import tool
-import psutil
-import functools
-from typing import Optional, Any, Dict, List
-from pydantic import tools
-from .base import BaseTracer
-from ..utils.unique_decorator import generate_unique_hash_simple
-import contextvars
-import asyncio
-from ..utils.file_name_tracker import TrackName
-from ..utils.span_attributes import SpanAttributes
-import logging
-import wrapt
-import time
-import inspect
-logger = logging.getLogger(__name__)
-logging_level = (
-    logger.setLevel(logging.DEBUG)
-    if os.getenv("DEBUG")
-    else logger.setLevel(logging.INFO)
-)
-class ToolTracerMixin:
-    def __init__(self, *args, **kwargs):
-        super().__init__(*args, **kwargs)
-        self.file_tracker = TrackName()
-        self.current_tool_name = contextvars.ContextVar("tool_name", default=None)
-        self.current_tool_id = contextvars.ContextVar("tool_id", default=None)
-        self.component_network_calls = {}
-        self.component_user_interaction = {}
-        self.gt = None
-        # add auto_instrument option
-        self.auto_instrument_tool = False
-        self.auto_instrument_user_interaction = False
-        self.auto_instrument_file_io = False
-        self.auto_instrument_network = False
-        self._instrumented_tools = set()  # Track which tools we've instrumented
-        self._method_usage = {}  # Track which methods are actually used
-        self._active_tool_calls = set()  # Track active tool calls to prevent duplicates
-    # take care of auto_instrument
-    def instrument_tool_calls(self):
-        """Enable tool instrumentation"""
-        self.auto_instrument_tool = True
-        # Handle modules that are already imported
-        import sys
-        if "langchain_community.tools" in sys.modules:
-            self.patch_langchain_tools(sys.modules["langchain_community.tools"])
-        if "langchain.tools" in sys.modules:
-            self.patch_langchain_tools(sys.modules["langchain.tools"])
-        if "langchain_core.tools" in sys.modules:
-            self.patch_langchain_core_tools(sys.modules["langchain_core.tools"])
-        # Register hooks for future imports
-        wrapt.register_post_import_hook(
-            self.patch_langchain_tools, "langchain_community.tools"
-        )
-        wrapt.register_post_import_hook(
-            self.patch_langchain_tools, "langchain.tools"
-        )
-        wrapt.register_post_import_hook(
-            self.patch_langchain_core_tools, "langchain_core.tools"
-        )
-    def patch_langchain_core_tools(self, module):
-        """Patch langchain tool methods"""
-        from langchain_core.tools import BaseTool, StructuredTool, Tool
-        # Process tool classes in order of inheritance (base class first)
-        tool_classes = [BaseTool]  # Start with base class
-        # Add derived classes that don't inherit from already processed classes
-        for tool_class in [StructuredTool, Tool]:
-            if not any(issubclass(tool_class, processed) for processed in tool_classes):
-                tool_classes.append(tool_class)
-        for tool_class in tool_classes:
-            if tool_class in self._instrumented_tools:
-                continue
-            # Create proxy instead of directly wrapping methods
-            self.ToolMethodProxy(self, tool_class, tool_class.__name__)
-            self._instrumented_tools.add(tool_class)
-    def patch_langchain_tools(self, module):
-        """Patch langchain tool methods"""
-        for directory in dir(module):
-            dir_class = getattr(module, directory)
-            tools = getattr(dir_class, "__all__", None)
-            if tools is None:
-                continue
-            for tool in tools:
-                tool_class = getattr(dir_class, tool)
-                # Skip if already instrumented
-                if tool_class in self._instrumented_tools:
-                    continue
-                # Create proxy instead of directly wrapping methods
-                self.ToolMethodProxy(self, tool_class, tool)
-                self._instrumented_tools.add(tool_class)
-    class ToolMethodProxy:
-        def __init__(self, tracer, tool_class, tool_name):
-            self.tracer = tracer
-            self.tool_class = tool_class
-            self.tool_name = tool_name
-            self._original_methods = {}
-            self._wrapped = False
-            # Store original methods
-            for method in ['run', 'arun', 'invoke', 'ainvoke']:
-                if hasattr(tool_class, method):
-                    self._original_methods[method] = getattr(tool_class, method)
-                    setattr(tool_class, method, self._create_proxy_method(method))
-        def _create_proxy_method(self, method_name):
-            original_method = self._original_methods[method_name]
-            async def async_proxy_method(*args, **kwargs):
-                if not self._wrapped:
-                    self._cleanup_proxy()
-                    self.tracer._wrap_specific_method(self.tool_class, method_name, self.tool_name)
-                    self._wrapped = True
-                # Get the now-wrapped method
-                wrapped_method = getattr(self.tool_class, method_name)
-                return await wrapped_method(*args, **kwargs)
-            def sync_proxy_method(*args, **kwargs):
-                if not self._wrapped:
-                    self._cleanup_proxy()
-                    self.tracer._wrap_specific_method(self.tool_class, method_name, self.tool_name)
-                    self._wrapped = True
-                # Get the now-wrapped method
-                wrapped_method = getattr(self.tool_class, method_name)
-                return wrapped_method(*args, **kwargs)
-            # Use appropriate proxy based on whether original method is async
-            proxy_method = async_proxy_method if asyncio.iscoroutinefunction(original_method) else sync_proxy_method
-            proxy_method.__name__ = method_name
-            return proxy_method
-        def _cleanup_proxy(self):
-            # Restore all original methods except the one that was called
-            for method, original in self._original_methods.items():
-                if not self._wrapped:
-                    setattr(self.tool_class, method, original)
-    def _wrap_specific_method(self, tool_class, method_name, tool_name):
-        """Wrap only the specific method that is being used"""
-        original_method = getattr(tool_class, method_name)
-        async def async_wrapper(*args, **kwargs):
-            tool_call_id = kwargs.get('tool_call_id', None)
-            if tool_call_id and tool_call_id in self._active_tool_calls:
-                # Skip tracing if this tool call is already being traced
-                return await original_method(*args, **kwargs)
-            if tool_call_id:
-                self._active_tool_calls.add(tool_call_id)
-            try:
-                name = tool_name
-                tool_type = "langchain"
-                version = None
-                return await self._trace_tool_execution(original_method, name, tool_type, version, *args, **kwargs)
-            finally:
-                if tool_call_id:
-                    self._active_tool_calls.remove(tool_call_id)
-        def sync_wrapper(*args, **kwargs):
-            tool_call_id = kwargs.get('tool_call_id', None)
-            if tool_call_id and tool_call_id in self._active_tool_calls:
-                # Skip tracing if this tool call is already being traced
-                return original_method(*args, **kwargs)
-            if tool_call_id:
-                self._active_tool_calls.add(tool_call_id)
-            try:
-                name = tool_name
-                tool_type = "langchain"
-                version = None
-                return self._trace_sync_tool_execution(original_method, name, tool_type, version, *args, **kwargs)
-            finally:
-                if tool_call_id:
-                    self._active_tool_calls.remove(tool_call_id)
-        wrapper = async_wrapper if asyncio.iscoroutinefunction(original_method) else sync_wrapper
-        wrapper.__name__ = method_name
-        setattr(tool_class, method_name, wrapper)
-    def instrument_user_interaction_calls(self):
-        self.auto_instrument_user_interaction = True
-    def instrument_file_io_calls(self):
-        self.auto_instrument_file_io = True
-    def instrument_network_calls(self):
-        self.auto_instrument_network = True
-    def trace_tool(
-        self,
-        name: str,
-        tool_type: str = "generic",
-        version: str = "1.0.0",
-        tags: List[str] = [],
-        metadata: Dict[str, Any] = {},
-        metrics: List[Dict[str, Any]] = [],
-        feedback: Optional[Any] = None,
-    ):
-        if name not in self.span_attributes_dict:
-            self.span_attributes_dict[name] = SpanAttributes(name)
-        if tags:
-            self.span(name).add_tags(tags)
-        if metadata:
-            self.span(name).add_metadata(metadata)
-        if metrics:
-            if isinstance(metrics, dict):
-                metrics = [metrics]
-            try:
-                for metric in metrics:
-                    self.span(name).add_metrics(
-                        name=metric["name"],
-                        score=metric["score"],
-                        reasoning=metric.get("reasoning", ""),
-                        cost=metric.get("cost", None),
-                        latency=metric.get("latency", None),
-                        metadata=metric.get("metadata", {}),
-                        config=metric.get("config", {}),
-                    )
-            except ValueError as e:
-                    logger.error(f"Validation Error: {e}")
-            except Exception as e:
-                logger.error(f"Error adding metric: {e}")
-        if feedback:
-            self.span(name).add_feedback(feedback)
-        def decorator(func):
-            # Add metadata attribute to the function
-            metadata = {
-                "name": name,
-                "tool_type": tool_type,
-                "version": version,
-                "is_active": self.is_active,
-            }
-            # Check if the function is async
-            is_async = asyncio.iscoroutinefunction(func)
-            @functools.wraps(func)
-            async def async_wrapper(*args, **kwargs):
-                async_wrapper.metadata = metadata
-                gt = kwargs.get("gt") if kwargs else None
-                if gt is not None:
-                    span = self.span(name)
-                    span.add_gt(gt)
-                return await self._trace_tool_execution(
-                    func, name, tool_type, version, *args, **kwargs
-                )
-            @functools.wraps(func)
-            def sync_wrapper(*args, **kwargs):
-                sync_wrapper.metadata = metadata
-                gt = kwargs.get("gt") if kwargs else None
-                if gt is not None:
-                    span = self.span(name)
-                    span.add_gt(gt)
-                return self._trace_sync_tool_execution(
-                    func, name, tool_type, version, *args, **kwargs
-                )
-            wrapper = async_wrapper if is_async else sync_wrapper
-            wrapper.metadata = metadata
-            return wrapper
-        return decorator
-    def _trace_sync_tool_execution(
-        self, func, name, tool_type, version, *args, **kwargs
-    ):
-        """Synchronous version of tool tracing"""
-        if not self.is_active:
-            return func(*args, **kwargs)
-        if not self.auto_instrument_tool:
-            return func(*args, **kwargs)
-        start_time = datetime.now().astimezone()
-        start_memory = psutil.Process().memory_info().rss
-        component_id = str(uuid.uuid4())
-        hash_id = generate_unique_hash_simple(func)
-        # Set current tool name and store the token
-        name_token = self.current_tool_name.set(name)
-        id_token = self.current_tool_id.set(component_id)
-        # Start tracking network calls for this component
-        self.start_component(component_id)
-        try:
-            # Execute the tool
-            result = func(*args, **kwargs)
-            # Calculate resource usage
-            end_memory = psutil.Process().memory_info().rss
-            memory_used = max(0, end_memory - start_memory)
-            # End tracking network calls for this component
-            self.end_component(component_id)
-            # Create tool component
-            tool_component = self.create_tool_component(
-                component_id=component_id,
-                hash_id=hash_id,
-                name=name,
-                tool_type=tool_type,
-                version=version,
-                memory_used=memory_used,
-                start_time=start_time,
-                input_data=self._sanitize_input(args, kwargs),
-                output_data=self._sanitize_output(result),
-            )
-            self.add_component(tool_component)
-            return result
-        except Exception as e:
-            error_component = {
-                "code": 500,
-                "type": type(e).__name__,
-                "message": str(e),
-                "details": {},
-            }
-            # End tracking network calls for this component
-            self.end_component(component_id)
-            tool_component = self.create_tool_component(
-                component_id=component_id,
-                hash_id=hash_id,
-                name=name,
-                tool_type=tool_type,
-                version=version,
-                memory_used=0,
-                start_time=start_time,
-                input_data=self._sanitize_input(args, kwargs),
-                output_data=None,
-                error=error_component,
-            )
-            self.add_component(tool_component, is_error=True)
-            raise
-        finally:
-            # Reset the tool name and id context
-            if name_token:
-                self.current_tool_name.reset(name_token)
-            if id_token:
-                self.current_tool_id.reset(id_token)
-    async def _trace_tool_execution(
-        self, func, name, tool_type, version, *args, **kwargs
-    ):
-        """Asynchronous version of tool tracing"""
-        if not self.is_active:
-            return await func(*args, **kwargs)
-        if not self.auto_instrument_tool:
-            return await func(*args, **kwargs)
-        start_time = datetime.now().astimezone()
-        start_memory = psutil.Process().memory_info().rss
-        component_id = str(uuid.uuid4())
-        hash_id = generate_unique_hash_simple(func)
-        # Set current tool name and store the token
-        name_token = self.current_tool_name.set(name)
-        id_token = self.current_tool_id.set(component_id)
-        self.start_component(component_id)
-        try:
-            # Execute the tool
-            result = await func(*args, **kwargs)
-            # Calculate resource usage
-            end_memory = psutil.Process().memory_info().rss
-            memory_used = max(0, end_memory - start_memory)
-            self.end_component(component_id)
-            # Create tool component
-            tool_component = self.create_tool_component(
-                component_id=component_id,
-                hash_id=hash_id,
-                name=name,
-                tool_type=tool_type,
-                version=version,
-                start_time=start_time,
-                memory_used=memory_used,
-                input_data=self._sanitize_input(args, kwargs),
-                output_data=self._sanitize_output(result),
-            )
-            self.add_component(tool_component)
-            return result
-        except Exception as e:
-            error_component = {
-                "code": 500,
-                "type": type(e).__name__,
-                "message": str(e),
-                "details": {},
-            }
-            tool_component = self.create_tool_component(
-                component_id=component_id,
-                hash_id=hash_id,
-                name=name,
-                tool_type=tool_type,
-                version=version,
-                start_time=start_time,
-                memory_used=0,
-                input_data=self._sanitize_input(args, kwargs),
-                output_data=None,
-                error=error_component,
-            )
-            self.add_component(tool_component, is_error=True)
-            raise
-        finally:
-            # Reset the tool name and id context
-            if name_token:
-                self.current_tool_name.reset(name_token)
-            if id_token:
-                self.current_tool_id.reset(id_token)
-    def create_tool_component(self, **kwargs):
-        """Create a tool component according to the data structure"""
-        network_calls = []
-        if self.auto_instrument_network:
-            network_calls = self.component_network_calls.get(kwargs["component_id"], [])
-        interactions = []
-        if self.auto_instrument_user_interaction:
-            input_output_interactions = []
-            for interaction in self.component_user_interaction.get(kwargs["component_id"], []):
-                if interaction["interaction_type"] in ["input", "output"]:
-                    input_output_interactions.append(interaction)
-            if input_output_interactions!=[]:
-                interactions.extend(input_output_interactions)
-        if self.auto_instrument_file_io:
-            file_io_interactions = []
-            for interaction in self.component_user_interaction.get(kwargs["component_id"], []):
-                if interaction["interaction_type"] in ["file_read", "file_write"]:
-                    file_io_interactions.append(interaction)
-            if file_io_interactions!=[]:
-                interactions.extend(file_io_interactions)
-        # Get tags, metrics
-        name = kwargs["name"]
-        # tags
-        tags = []
-        if name in self.span_attributes_dict:
-            tags = self.span_attributes_dict[name].tags or []
-        # metrics
-        metrics = []
-        if name in self.span_attributes_dict:
-            raw_metrics = self.span_attributes_dict[name].metrics or []
-            for metric in raw_metrics:
-                base_metric_name = metric["name"]
-                counter = sum(1 for x in self.visited_metrics if x.startswith(base_metric_name))
-                metric_name = f'{base_metric_name}_{counter}' if counter > 0 else base_metric_name
-                self.visited_metrics.append(metric_name)
-                metric["name"] = metric_name
-                metrics.append(metric)
-        formatted_metrics = BaseTracer.get_formatted_metric(self.span_attributes_dict, self.project_id, name)
-        if formatted_metrics:
-            metrics.extend(formatted_metrics)
-        start_time = kwargs["start_time"]
-        component = {
-            "id": kwargs["component_id"],
-            "hash_id": kwargs["hash_id"],
-            "source_hash_id": None,
-            "type": "tool",
-            "name": kwargs["name"],
-            "start_time": start_time.isoformat(),
-            "end_time": datetime.now().astimezone().isoformat(),
-            "error": kwargs.get("error"),
-            "parent_id": self.current_agent_id.get(),
-            "info": {
-                "tool_type": kwargs["tool_type"],
-                "version": kwargs["version"],
-                "memory_used": kwargs["memory_used"],
-                "tags": tags,
-            },
-            "data": {
-                "input": kwargs["input_data"],
-                "output": kwargs["output_data"],
-                "memory_used": kwargs["memory_used"],
-            },
-            "metrics": metrics,
-            "network_calls": network_calls,
-            "interactions": interactions,
-        }
-        if name in self.span_attributes_dict:
-            span_gt = self.span_attributes_dict[name].gt
-            if span_gt is not None:
-                component["data"]["gt"] = span_gt
-            span_context = self.span_attributes_dict[name].context
-            if span_context:
-                component["data"]["context"] = span_context
-        # Reset the SpanAttributes context variable
-        self.span_attributes_dict[kwargs["name"]] = SpanAttributes(kwargs["name"])
-        return component
-    def start_component(self, component_id):
-        self.component_network_calls[component_id] = []
-    def end_component(self, component_id):
-        pass
-    def _sanitize_input(self, args: tuple, kwargs: dict) -> dict:
-        """Sanitize and format input data, including handling of nested lists and dictionaries."""
-        def sanitize_value(value):
-            if isinstance(value, (int, float, bool, str)):
-                return value
-            elif isinstance(value, list):
-                return [sanitize_value(item) for item in value]
-            elif isinstance(value, dict):
-                return {key: sanitize_value(val) for key, val in value.items()}
-            else:
-                return str(value)  # Convert non-standard types to string
-        return {
-            "args": [sanitize_value(arg) for arg in args],
-            "kwargs": {key: sanitize_value(val) for key, val in kwargs.items()},
-        }
-    def _sanitize_output(self, output: Any) -> Any:
-        """Sanitize and format output data"""
-        if isinstance(output, (int, float, bool, str, list, dict)):
-            return output
-        return str(output)

ragaai_catalyst/tracers/agentic_tracing/tracers/user_interaction_tracer.py DELETED Viewed

@@ -1,129 +0,0 @@
-import builtins
-from datetime import datetime
-import contextvars
-import inspect
-import uuid
-from typing import Optional, Any
-class TracedFile:
-    def __init__(self, file_obj, file_path: str, tracer):
-        self._file = file_obj
-        self._file_path = file_path
-        self._tracer = tracer
-    def write(self, content: str) -> int:
-        self._tracer.trace_file_operation("write", self._file_path, content=content)
-        return self._file.write(content)
-    def read(self, size: Optional[int] = None) -> str:
-        content = self._file.read() if size is None else self._file.read(size)
-        self._tracer.trace_file_operation("read", self._file_path, content=content)
-        return content
-    def close(self) -> None:
-        return self._file.close()
-    def __enter__(self):
-        return self
-    def __exit__(self, exc_type, exc_val, exc_tb):
-        self.close()
-        return None
-    def __getattr__(self, name: str) -> Any:
-        return getattr(self._file, name)
-class UserInteractionTracer:
-    def __init__(self, *args, **kwargs):
-        self.project_id = contextvars.ContextVar("project_id", default=None)
-        self.trace_id = contextvars.ContextVar("trace_id", default=None)
-        self.tracer = contextvars.ContextVar("tracer", default=None)
-        self.component_id = contextvars.ContextVar("component_id", default=None)
-        self.original_input = builtins.input
-        self.original_print = builtins.print
-        self.original_open = builtins.open
-        self.interactions = []
-    def traced_input(self, prompt=""):
-        # Get caller information
-        if prompt:
-            self.traced_print(prompt, end="")
-        try:
-            content = self.original_input()
-        except EOFError:
-            content = ""  # Return empty string on EOF
-        self.interactions.append({
-            "id": str(uuid.uuid4()),
-            "component_id": self.component_id.get(),
-            "interaction_type": "input",
-            "content": content,
-            "timestamp": datetime.now().astimezone().isoformat()
-        })
-        return content
-    def traced_print(self, *args, **kwargs):
-        content = " ".join(str(arg) for arg in args)
-        self.interactions.append({
-            "id": str(uuid.uuid4()),
-            "component_id": self.component_id.get(),
-            "interaction_type": "output",
-            "content": content,
-            "timestamp": datetime.now().astimezone().isoformat()
-        })
-        return self.original_print(*args, **kwargs)
-    def traced_open(self, file: str, mode: str = 'r', *args, **kwargs):
-        # Skip tracing for system and virtual environment paths
-        system_paths = [
-            'site-packages',
-            'dist-packages',
-            '/proc/',
-            '/sys/',
-            '/var/lib/',
-            '/usr/lib/',
-            '/System/Library'
-        ]
-        file_str = str(file)
-        if any(path in file_str for path in system_paths):
-            return self.original_open(file, mode, *args, **kwargs)
-        file_obj = self.original_open(file, mode, *args, **kwargs)
-        return TracedFile(file_obj, file, self)
-    def trace_file_operation(self, operation: str, file_path: str, **kwargs):
-        interaction_type = f"file_{operation}"
-        # Check for existing interaction with same file_path and operation
-        for existing in reversed(self.interactions):
-            if (existing.get("file_path") == file_path and
-                existing.get("interaction_type") == interaction_type):
-                # Merge content if it exists
-                if "content" in kwargs and "content" in existing:
-                    existing["content"] += kwargs["content"]
-                    return
-                break
-        # If no matching interaction found or couldn't merge, create new one
-        interaction = {
-            "id": str(uuid.uuid4()),
-            "component_id": self.component_id.get(),
-            "interaction_type": interaction_type,
-            "file_path": file_path,
-            "timestamp": datetime.now().astimezone().isoformat()
-        }
-        interaction.update(kwargs)
-        self.interactions.append(interaction)
-    def __enter__(self):
-        builtins.input = self.traced_input
-        builtins.print = self.traced_print
-        builtins.open = self.traced_open
-        return self
-    def __exit__(self, exc_type, exc_val, exc_tb):
-        builtins.input = self.original_input
-        builtins.print = self.original_print
-        builtins.open = self.original_open

ragaai-catalyst 2.2.4b5__py3-none-any.whl → 2.2.5b2__py3-none-any.whl

ragaai-catalyst 2.2.4b5__py3-none-any.whl → 2.2.5b2__py3-none-any.whl