PyPI - interactiveai - Versions diffs - 0.0.1__py3-none-any.whl - Mend

interactiveai 0.0.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (6) hide show

interactiveai/__init__.py +16 -0
interactiveai/interactive.py +471 -0
interactiveai-0.0.1.dist-info/METADATA +16 -0
interactiveai-0.0.1.dist-info/RECORD +6 -0
interactiveai-0.0.1.dist-info/WHEEL +5 -0
interactiveai-0.0.1.dist-info/top_level.txt +1 -0

interactiveai/__init__.py ADDED Viewed

@@ -0,0 +1,16 @@
+"""
+Interactive Language Processing Package
+A comprehensive package for managing Langfuse utilities including initialization,
+observation, scoring, dataset management, and parallel processing.
+"""
+from .interactive import Interactive, CallbackHandler
+__version__ = "1.0.0"
+__author__ = "Your Name"
+__email__ = "your.email@example.com"
+__all__ = ["Interactive", "CallbackHandler"]

interactiveai/interactive.py ADDED Viewed

@@ -0,0 +1,471 @@
+import time
+import uuid
+from typing import Dict, Any, List, Optional, Callable, Tuple, Union
+from concurrent.futures import ThreadPoolExecutor, as_completed
+from langfuse import Langfuse
+from langchain_core.prompts import ChatPromptTemplate
+from langfuse.langchain import CallbackHandler
+from loguru import logger
+from schemas import Evaluator
+class Interactive(Langfuse):
+    """
+    A comprehensive manager class for InteractiveAI utilities including initialization,
+    observation, scoring, dataset management, and parallel processing.
+    """
+    def __init__(self,
+                 public_key: str,
+                 secret_key: str,
+                 host: Optional[str] = "https://app.interactiveai.com",
+                 **kwargs):
+        """
+        Initialize the InteractiveAI Client
+        To get your keys go to https://app.interactiveai.com/settings/api-keys
+        Args:
+            public_key: InteractiveAI public key
+            secret_key: InteractiveAI secret key
+            host: InteractiveAI host (defaults to https://app.interactiveai.com)
+        """
+        # Initialize Langfuse client
+        super().__init__(
+            public_key=public_key,
+            secret_key=secret_key,
+            host=host,
+            **kwargs
+        )
+    def generate_thread_id(self) -> str:
+        """Generate a unique thread ID"""
+        thread_id = f"thread_{int(time.time() * 1000)}"
+        logger.debug(f"Generated thread ID: {thread_id}")
+        return thread_id
+    def get_prompt(self, name: str, version: Optional[int] = None, label: Optional[str] = None) -> ChatPromptTemplate:
+        prompt = self.get_prompt(name=name, version=version, label=label)
+        return ChatPromptTemplate.from_template(
+            prompt.get_langchain_prompt(),
+            metadata={"langfuse_prompt": prompt},
+        )
+    def create_or_get_dataset(self, dataset_name: str, description: str = "") -> Any:
+        """
+        Create a dataset or get existing one
+        Args:
+            dataset_name: Name of the dataset
+            description: Dataset description
+        Returns:
+            Dataset object
+        """
+        try:
+            logger.debug(f"Attempting to retrieve dataset: {dataset_name}")
+            dataset = self.get_dataset(dataset_name)
+            logger.info(f"Retrieved existing dataset: {dataset_name}")
+            return dataset
+        except Exception as e:
+            logger.info(f"Dataset '{dataset_name}' not found, creating new one")
+            try:
+                dataset = self.create_dataset(
+                    name=dataset_name,
+                    description=description or "Dataset for response evaluation",
+                )
+                logger.success(f"Successfully created dataset: {dataset_name}")
+                return dataset
+            except Exception as create_error:
+                logger.error(f"Error creating dataset '{dataset_name}': {create_error}")
+                raise
+    def add_dataset_item(self, dataset_name: str, item_id: str, input_data: Dict[str, Any],
+                        expected_output: Dict[str, Any], metadata: Dict[str, Any]):
+        """
+        Add an item to a dataset
+        Args:
+            dataset_name: Name of the dataset
+            item_id: Unique identifier for the item
+            input_data: Input data
+            expected_output: Expected output
+            metadata: Additional metadata
+        """
+        try:
+            logger.debug(f"Adding item to dataset '{dataset_name}'")
+            self.create_dataset_item(
+                dataset_name=dataset_name,
+                input=input_data,
+                expected_output=expected_output,
+                metadata=metadata,
+                id=item_id
+            )
+            logger.debug(f"Successfully added item to dataset {dataset_name}")
+        except Exception as e:
+            logger.error(f"Error adding dataset item to '{dataset_name}': {e}")
+            raise
+    def add_dataset_items_parallel(self, dataset_name: str, data: List[tuple[str, Any]], max_workers: int = 4):
+        """
+        Add multiple items to a dataset in parallel
+        Args:
+            dataset_name: Name of the dataset
+            data: List of tuples containing (item_id, input_data, expected_output, metadata)
+            max_workers: Maximum number of parallel workers (default: 4)
+        """
+        try:
+            logger.debug(f"Adding {len(data)} items to dataset '{dataset_name}' in parallel")
+            with ThreadPoolExecutor(max_workers=max_workers) as executor:
+                futures = []
+                for item_id, input_data, expected_output, metadata in data:
+                    futures.append(
+                        executor.submit(
+                            self.add_dataset_item,
+                            dataset_name,
+                            item_id,
+                            input_data,
+                            expected_output,
+                            metadata
+                        )
+                    )
+                for future in as_completed(futures):
+                    future.result()  # Wait for all tasks to complete
+            logger.success(f"Successfully added {len(data)} items to dataset '{dataset_name}'")
+        except Exception as e:
+            logger.error(f"Error adding dataset items to '{dataset_name}': {e}")
+            raise
+    def process_single_item(
+            self,
+            idx: int,
+            item: Any,
+            experiment_name: str,
+            handler: CallbackHandler,
+            workflow: Any,
+            evaluations: List[Evaluator]
+    ) -> Dict[str, Union[str, Dict[str, Any]]]:
+        """Process a single dataset item through the workflow and evaluate results.
+        Args:
+            idx: Index of the item in the dataset
+            item: Dataset item containing input and expected output
+            experiment_name: Name of the experiment for tracking
+            handler: Langfuse callback handler for logging
+            workflow: The workflow/model to process the item
+            evaluations: List of evaluation functions to apply
+        Returns:
+            Dictionary containing processing status and results or error information
+        """
+        logger.debug(f"Processing item {idx} for experiment '{experiment_name}'")
+        try:
+            # Create a separate trace for each item using the item.run() context manager
+            with item.run(run_name=experiment_name) as root_span:
+                logger.debug(f"Invoking workflow for item {idx}")
+                # Process the item through the workflow
+                output = workflow.invoke(
+                    state=item.input,
+                    config={
+                        "callbacks": [handler],
+                        "configurable": {"thread_id": idx}  # Use idx as thread_id for uniqueness
+                    }
+                )
+                # Update the trace with input/output information
+                root_span.update_trace(
+                    name=f"{experiment_name}_{idx}",
+                    input=item.input,
+                    output=output,
+                    tags=[experiment_name],
+                    metadata=item.metadata
+                )
+                logger.debug(f"Running {len(evaluations)} evaluations for item {idx}")
+                # Apply all evaluation functions to the output
+                for evaluation in evaluations:
+                    try:
+                        evaluation_result = evaluation.function(output, item.expected_output)
+                        root_span.score_trace(
+                            name=evaluation.name,
+                            value=evaluation_result.score,
+                            data_type=evaluation.data_type,
+                            comment=evaluation_result.reasoning
+                        )
+                        logger.debug(
+                            f"Evaluation '{evaluation.name}' completed for item {idx}: {evaluation_result.score}")
+                    except Exception as eval_error:
+                        logger.warning(f"Evaluation '{evaluation.name}' failed for item {idx}: {eval_error}")
+                        # Continue with other evaluations even if one fails
+                logger.debug(f"Successfully processed item {idx}")
+                return {"status": "success", "output": output}
+        except Exception as e:
+            logger.error(f"Error processing item {idx}: {str(e)}")
+            return {"status": "error", "error": str(e)}
+    def run_langchain_experiment_multi(
+            self,
+            experiment_name: str,
+            dataset: Any,
+            workflow: Any,
+            evaluations: List[Evaluator],
+            max_workers: int = 4,
+            start_index: int = 0,
+            end_index: Optional[int] = None,
+            process_single_item_func: Optional[Callable] = None
+    ) -> List[Dict[str, Union[str, Dict[str, Any]]]]:
+        """Run an experiment with parallel processing using ThreadPool.
+        This function processes multiple dataset items in parallel, applies evaluations,
+        and tracks results using Langfuse for monitoring and analysis.
+        Args:
+            experiment_name: Name of the experiment for tracking and logging
+            dataset: Dataset containing items to process
+            workflow: The workflow/model to process items
+            evaluations: List of evaluation functions to apply to results
+            max_workers: Maximum number of parallel workers (default: 4)
+            start_index: Index to start processing from (default: 0)
+            end_index: Index to stop processing at (default: None for all items)
+            process_single_item_func: Optional custom processing function (default: None)
+        Returns:
+            List of result dictionaries containing status and output/error information
+        Raises:
+            ValueError: If start_index >= end_index or if indices are out of bounds
+        """
+        # Set end_index to dataset length if not provided
+        if end_index is None:
+            end_index = len(dataset.items)
+        # Validate indices
+        if start_index >= end_index:
+            raise ValueError(f"start_index ({start_index}) must be less than end_index ({end_index})")
+        if start_index < 0 or end_index > len(dataset.items):
+            raise ValueError(f"Indices out of bounds: dataset has {len(dataset.items)} items")
+        # Use provided processing function or default
+        if process_single_item_func:
+            processing_func = process_single_item_func
+        else:
+            processing_func = self.process_single_item
+            logger.warning(f" Using default processing function: {self.process_single_item.__name__}")
+        # Calculate actual number of items to process
+        items_to_process = end_index - start_index
+        logger.info(f"Starting experiment '{experiment_name}'")
+        logger.info(f"Processing {items_to_process} items (indices {start_index} to {end_index - 1})")
+        logger.info(f"Using {max_workers} parallel workers")
+        logger.info(f"Applying {len(evaluations)} evaluation metrics")
+        # Initialize Langfuse handler for tracking
+        handler = CallbackHandler()
+        # Process items in parallel using ThreadPoolExecutor
+        with ThreadPoolExecutor(max_workers=max_workers) as executor:
+            logger.debug(f"Creating thread pool with {max_workers} workers")
+            # Prepare arguments for each item to process
+            process_args = [
+                (idx, item, experiment_name, handler, workflow, evaluations)
+                for idx, item in enumerate(dataset.items[start_index:end_index], start=start_index)
+            ]
+            # Submit all tasks to the executor
+            future_to_args = {
+                executor.submit(processing_func, *args): args
+                for args in process_args
+            }
+            logger.info(f"Submitted {len(future_to_args)} tasks to thread pool")
+            # Collect results as they complete
+            results: List[Dict[str, Union[str, Dict[str, Any]]]] = []
+            completed_count = 0
+            for future in as_completed(future_to_args):
+                args = future_to_args[future]
+                item_idx = args[0]  # First argument is the index
+                try:
+                    result = future.result()
+                    results.append(result)
+                    completed_count += 1
+                    # Log progress with appropriate level based on result
+                    if result["status"] == "success":
+                        logger.success(f"Item {item_idx} processed successfully ({completed_count}/{items_to_process})")
+                    else:
+                        logger.warning(
+                            f"Item {item_idx} failed ({completed_count}/{items_to_process}): {result.get('error', 'Unknown error')}")
+                except Exception as e:
+                    logger.error(
+                        f"Exception processing item {item_idx} ({completed_count + 1}/{items_to_process}): {str(e)}")
+                    results.append({"status": "exception", "error": str(e)})
+                    completed_count += 1
+        # Calculate and log summary statistics
+        successful = sum(1 for r in results if r["status"] == "success")
+        failed = len(results) - successful
+        success_rate = (successful / len(results)) * 100 if results else 0
+        logger.info(f" Experiment '{experiment_name}' completed!")
+        logger.info(f" Results Summary:")
+        logger.info(f"   • Total items processed: {len(results)}")
+        logger.info(f"   • Successful: {successful}")
+        logger.info(f"   • Failed: {failed}")
+        logger.info(f"   • Success rate: {success_rate:.1f}%")
+        if failed > 0:
+            logger.warning(f"{failed} items failed processing - check logs for details")
+        return results
+    def run_langchain_experiment_sequential(
+            self,
+            experiment_name: str,
+            dataset: Any,
+            workflow: Any,
+            evaluations: List[Evaluator],
+            start_index: int = 0,
+            end_index: Optional[int] = None,
+            process_single_item_func: Optional[Callable] = None
+    ) -> List[Dict[str, Union[str, Dict[str, Any]]]]:
+        """Run an experiment with sequential processing (no parallel processing).
+        This function processes multiple dataset items sequentially, applies evaluations,
+        and tracks results using Langfuse for monitoring and analysis.
+        Args:
+            experiment_name: Name of the experiment for tracking and logging
+            dataset: Dataset containing items to process
+            workflow: The workflow/model to process items
+            evaluations: List of evaluation functions to apply to results
+            start_index: Index to start processing from (default: 0)
+            end_index: Index to stop processing at (default: None for all items)
+            process_single_item_func: Optional custom processing function (default: None)
+        Returns:
+            List of result dictionaries containing status and output/error information
+        Raises:
+            ValueError: If start_index >= end_index or if indices are out of bounds
+        """
+        # Set end_index to dataset length if not provided
+        if end_index is None:
+            end_index = len(dataset.items)
+        # Validate indices
+        if start_index >= end_index:
+            raise ValueError(f"start_index ({start_index}) must be less than end_index ({end_index})")
+        if start_index < 0 or end_index > len(dataset.items):
+            raise ValueError(f"Indices out of bounds: dataset has {len(dataset.items)} items")
+        # Use provided processing function or default
+        if process_single_item_func:
+            processing_func = process_single_item_func
+        else:
+            processing_func = self.process_single_item
+            logger.warning(f" Using default processing function: {self.process_single_item.__name__}")
+        # Calculate actual number of items to process
+        items_to_process = end_index - start_index
+        logger.info(f"Starting experiment '{experiment_name}'")
+        logger.info(f"Processing {items_to_process} items (indices {start_index} to {end_index - 1})")
+        logger.info(f"Processing sequentially (max_workers parameter ignored)")
+        logger.info(f"Applying {len(evaluations)} evaluation metrics")
+        # Initialize Langfuse handler for tracking
+        handler = CallbackHandler()
+        # Process items sequentially
+        results: List[Dict[str, Union[str, Dict[str, Any]]]] = []
+        completed_count = 0
+        for idx, item in enumerate(dataset.items[start_index:end_index], start=start_index):
+            logger.debug(f"Processing item {idx} sequentially")
+            try:
+                result = processing_func(idx, item, experiment_name, handler, workflow, evaluations)
+                results.append(result)
+                completed_count += 1
+                # Log progress with appropriate level based on result
+                if result["status"] == "success":
+                    logger.success(f"Item {idx} processed successfully ({completed_count}/{items_to_process})")
+                else:
+                    logger.warning(
+                        f"Item {idx} failed ({completed_count}/{items_to_process}): {result.get('error', 'Unknown error')}")
+            except Exception as e:
+                logger.error(
+                    f"Exception processing item {idx} ({completed_count + 1}/{items_to_process}): {str(e)}")
+                results.append({"status": "exception", "error": str(e)})
+                completed_count += 1
+        # Calculate and log summary statistics
+        successful = sum(1 for r in results if r["status"] == "success")
+        failed = len(results) - successful
+        success_rate = (successful / len(results)) * 100 if results else 0
+        logger.info(f" Experiment '{experiment_name}' completed!")
+        logger.info(f" Results Summary:")
+        logger.info(f"   • Total items processed: {len(results)}")
+        logger.info(f"   • Successful: {successful}")
+        logger.info(f"   • Failed: {failed}")
+        logger.info(f"   • Success rate: {success_rate:.1f}%")
+        if failed > 0:
+            logger.warning(f"{failed} items failed processing - check logs for details")
+        return results
+    def flush(self):
+        """Flush any pending Langfuse operations"""
+        try:
+            logger.debug("Flushing Langfuse operations...")
+            self.flush()
+            logger.success("Langfuse operations flushed successfully")
+        except Exception as e:
+            logger.error(f"Error flushing Langfuse operations: {e}")
+    def __enter__(self):
+        """Context manager entry: return this client so it can be bound with ``as``"""
+        return self
+    def __exit__(self, exc_type, exc_val, exc_tb):
+        """
+        Context manager exit - flush operations
+        Logs the exception, if one ended the ``with`` block, then flushes.
+        Nothing is returned, so the exception itself is not suppressed.
+        Args:
+            exc_type: Exception class raised inside the block, or None
+            exc_val: Exception instance raised inside the block, or None
+            exc_tb: Traceback of that exception, or None
+        """
+        if exc_type:
+            logger.error(f"Exiting context manager due to exception: {exc_type.__name__}: {exc_val}")
+        self.flush()

interactiveai-0.0.1.dist-info/METADATA ADDED Viewed

@@ -0,0 +1,16 @@
+Metadata-Version: 2.4
+Name: interactiveai
+Version: 0.0.1
+Summary: InteractiveAI client package
+Author: InteractiveAI
+License: MIT License
+Project-URL: Homepage, https://interactive.ai
+Project-URL: App, https://app.interactive.ai
+Project-URL: Repository, https://github.com/Interactive-AI-Labs/interactiveai-sdk
+Classifier: Programming Language :: Python :: 3
+Classifier: Operating System :: OS Independent
+Requires-Python: >=3.8
+Description-Content-Type: text/markdown
+# interactive-sdk
+InteractiveAI platform SDK

interactiveai-0.0.1.dist-info/RECORD ADDED Viewed

@@ -0,0 +1,6 @@
+interactiveai/__init__.py,sha256=0c4BSy0x0awPyM1uE0dIPVxikx-zOsIOaEB9C5HIDCQ,386
+interactiveai/interactive.py,sha256=ouiqdM-fKscyIUbfr2qkZYT5XvD-kNkZQpPKRXstqcM,19274
+interactiveai-0.0.1.dist-info/METADATA,sha256=QrRGF41Ofq1KzEh1KVIS7EDQBF_oCsreye-0859TuFU,515
+interactiveai-0.0.1.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
+interactiveai-0.0.1.dist-info/top_level.txt,sha256=GkGPBUGTyN4pdleSXMxvlfNHKNsQZpn6YBabTx-2sao,14
+interactiveai-0.0.1.dist-info/RECORD,,

interactiveai-0.0.1.dist-info/WHEEL ADDED Viewed

@@ -0,0 +1,5 @@
+Wheel-Version: 1.0
+Generator: setuptools (80.9.0)
+Root-Is-Purelib: true
+Tag: py3-none-any

interactiveai-0.0.1.dist-info/top_level.txt ADDED Viewed

	@@ -0,0 +1 @@
1	+ interactiveai