local-deep-research 0.3.12__py3-none-any.whl → 0.4.0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- local_deep_research/__version__.py +1 -1
- local_deep_research/advanced_search_system/filters/base_filter.py +2 -3
- local_deep_research/advanced_search_system/filters/cross_engine_filter.py +4 -5
- local_deep_research/advanced_search_system/filters/journal_reputation_filter.py +298 -0
- local_deep_research/advanced_search_system/findings/repository.py +0 -3
- local_deep_research/advanced_search_system/strategies/base_strategy.py +1 -2
- local_deep_research/advanced_search_system/strategies/iterdrag_strategy.py +14 -18
- local_deep_research/advanced_search_system/strategies/parallel_search_strategy.py +4 -8
- local_deep_research/advanced_search_system/strategies/rapid_search_strategy.py +5 -6
- local_deep_research/advanced_search_system/strategies/source_based_strategy.py +2 -2
- local_deep_research/advanced_search_system/strategies/standard_strategy.py +9 -7
- local_deep_research/api/benchmark_functions.py +288 -0
- local_deep_research/api/research_functions.py +8 -4
- local_deep_research/benchmarks/README.md +162 -0
- local_deep_research/benchmarks/__init__.py +51 -0
- local_deep_research/benchmarks/benchmark_functions.py +353 -0
- local_deep_research/benchmarks/cli/__init__.py +16 -0
- local_deep_research/benchmarks/cli/benchmark_commands.py +338 -0
- local_deep_research/benchmarks/cli.py +347 -0
- local_deep_research/benchmarks/comparison/__init__.py +12 -0
- local_deep_research/benchmarks/comparison/evaluator.py +768 -0
- local_deep_research/benchmarks/datasets/__init__.py +53 -0
- local_deep_research/benchmarks/datasets/base.py +295 -0
- local_deep_research/benchmarks/datasets/browsecomp.py +116 -0
- local_deep_research/benchmarks/datasets/custom_dataset_template.py +98 -0
- local_deep_research/benchmarks/datasets/simpleqa.py +74 -0
- local_deep_research/benchmarks/datasets/utils.py +116 -0
- local_deep_research/benchmarks/datasets.py +31 -0
- local_deep_research/benchmarks/efficiency/__init__.py +14 -0
- local_deep_research/benchmarks/efficiency/resource_monitor.py +367 -0
- local_deep_research/benchmarks/efficiency/speed_profiler.py +214 -0
- local_deep_research/benchmarks/evaluators/__init__.py +18 -0
- local_deep_research/benchmarks/evaluators/base.py +74 -0
- local_deep_research/benchmarks/evaluators/browsecomp.py +83 -0
- local_deep_research/benchmarks/evaluators/composite.py +121 -0
- local_deep_research/benchmarks/evaluators/simpleqa.py +271 -0
- local_deep_research/benchmarks/graders.py +410 -0
- local_deep_research/benchmarks/metrics/README.md +80 -0
- local_deep_research/benchmarks/metrics/__init__.py +24 -0
- local_deep_research/benchmarks/metrics/calculation.py +385 -0
- local_deep_research/benchmarks/metrics/reporting.py +155 -0
- local_deep_research/benchmarks/metrics/visualization.py +205 -0
- local_deep_research/benchmarks/metrics.py +11 -0
- local_deep_research/benchmarks/optimization/__init__.py +32 -0
- local_deep_research/benchmarks/optimization/api.py +274 -0
- local_deep_research/benchmarks/optimization/metrics.py +20 -0
- local_deep_research/benchmarks/optimization/optuna_optimizer.py +1163 -0
- local_deep_research/benchmarks/runners.py +434 -0
- local_deep_research/benchmarks/templates.py +65 -0
- local_deep_research/config/llm_config.py +26 -23
- local_deep_research/config/search_config.py +1 -5
- local_deep_research/defaults/default_settings.json +108 -7
- local_deep_research/search_system.py +16 -8
- local_deep_research/utilities/db_utils.py +3 -6
- local_deep_research/utilities/es_utils.py +441 -0
- local_deep_research/utilities/log_utils.py +36 -0
- local_deep_research/utilities/search_utilities.py +8 -9
- local_deep_research/web/app.py +7 -9
- local_deep_research/web/app_factory.py +9 -12
- local_deep_research/web/database/migrations.py +8 -5
- local_deep_research/web/database/models.py +20 -0
- local_deep_research/web/database/schema_upgrade.py +5 -8
- local_deep_research/web/models/database.py +15 -18
- local_deep_research/web/routes/benchmark_routes.py +427 -0
- local_deep_research/web/routes/research_routes.py +13 -17
- local_deep_research/web/routes/settings_routes.py +264 -67
- local_deep_research/web/services/research_service.py +47 -57
- local_deep_research/web/services/settings_manager.py +1 -4
- local_deep_research/web/services/settings_service.py +4 -6
- local_deep_research/web/static/css/styles.css +12 -0
- local_deep_research/web/static/js/components/logpanel.js +164 -155
- local_deep_research/web/static/js/components/research.js +44 -3
- local_deep_research/web/static/js/components/settings.js +27 -0
- local_deep_research/web/static/js/services/socket.js +47 -0
- local_deep_research/web_search_engines/default_search_engines.py +38 -0
- local_deep_research/web_search_engines/engines/meta_search_engine.py +100 -33
- local_deep_research/web_search_engines/engines/search_engine_arxiv.py +31 -17
- local_deep_research/web_search_engines/engines/search_engine_brave.py +8 -3
- local_deep_research/web_search_engines/engines/search_engine_elasticsearch.py +343 -0
- local_deep_research/web_search_engines/engines/search_engine_google_pse.py +14 -6
- local_deep_research/web_search_engines/engines/search_engine_local.py +19 -23
- local_deep_research/web_search_engines/engines/search_engine_local_all.py +9 -12
- local_deep_research/web_search_engines/engines/search_engine_searxng.py +12 -17
- local_deep_research/web_search_engines/engines/search_engine_serpapi.py +8 -4
- local_deep_research/web_search_engines/search_engine_base.py +22 -5
- local_deep_research/web_search_engines/search_engine_factory.py +32 -11
- local_deep_research/web_search_engines/search_engines_config.py +14 -1
- {local_deep_research-0.3.12.dist-info → local_deep_research-0.4.0.dist-info}/METADATA +10 -2
- {local_deep_research-0.3.12.dist-info → local_deep_research-0.4.0.dist-info}/RECORD +92 -49
- {local_deep_research-0.3.12.dist-info → local_deep_research-0.4.0.dist-info}/WHEEL +0 -0
- {local_deep_research-0.3.12.dist-info → local_deep_research-0.4.0.dist-info}/entry_points.txt +0 -0
- {local_deep_research-0.3.12.dist-info → local_deep_research-0.4.0.dist-info}/licenses/LICENSE +0 -0
@@ -0,0 +1,116 @@
|
|
1
|
+
"""
|
2
|
+
Utility functions for dataset handling.
|
3
|
+
|
4
|
+
This module provides utility functions for common dataset operations like
|
5
|
+
decryption, encoding detection, etc.
|
6
|
+
"""
|
7
|
+
|
8
|
+
import base64
|
9
|
+
import hashlib
|
10
|
+
import logging
|
11
|
+
from typing import Dict, Any
|
12
|
+
|
13
|
+
logger = logging.getLogger(__name__)
|
14
|
+
|
15
|
+
|
16
|
+
def derive_key(password: str, length: int) -> bytes:
    """Derive a fixed-length key from the password using SHA256.

    The SHA256 digest of the password is tiled — repeated whole and then
    truncated — until exactly ``length`` bytes are produced.

    Args:
        password: Source string for the key material.
        length: Desired key length in bytes.

    Returns:
        ``length`` bytes of key material.
    """
    digest = hashlib.sha256(password.encode()).digest()
    repeats, remainder = divmod(length, len(digest))
    return digest * repeats + digest[:remainder]
|
22
|
+
|
23
|
+
|
24
|
+
# Characters permitted in a base64-encoded payload; anything else means the
# input is plain text and should be returned untouched.
_BASE64_ALPHABET = frozenset(
    "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789+/="
)


def _looks_like_text(result: str) -> bool:
    """Heuristic success check for a decryption attempt.

    A decryption is considered successful when the first 50 characters are
    all printable ASCII and contain at least one space.
    """
    head = result[:50]
    return all(32 <= ord(c) < 127 for c in head) and " " in head


def _attempt_xor_decrypt(ciphertext_b64: str, key_source: str):
    """Try one XOR decryption of *ciphertext_b64* keyed on *key_source*.

    Returns the plaintext string when the result passes the plausibility
    heuristic, otherwise ``None``. All errors are swallowed (logged at
    debug level) so callers can simply try the next candidate key.
    """
    try:
        encrypted = base64.b64decode(ciphertext_b64)
        key = derive_key(key_source, len(encrypted))
        result = bytes(a ^ b for a, b in zip(encrypted, key)).decode(
            "utf-8", errors="replace"
        )
        if _looks_like_text(result):
            return result
    except Exception as e:
        logger.debug(f"Decryption attempt failed: {str(e)}")
    return None


def decrypt(ciphertext_b64: str, password: str) -> str:
    """
    Decrypt base64-encoded ciphertext with XOR.

    Tries several candidate keys in order (the full password, its first
    word, the GUID portion of the canary string, and a known hardcoded
    key) to handle the different encoding formats seen in benchmark
    datasets. If every attempt fails, the original string is returned
    unchanged.

    Args:
        ciphertext_b64: Candidate base64-encoded ciphertext.
        password: Canary/password string used to derive candidate keys.

    Returns:
        The decrypted plaintext, or *ciphertext_b64* itself when the
        input does not look encrypted or no attempt succeeds.
    """
    # Skip decryption for non-encoded strings
    if not isinstance(ciphertext_b64, str) or len(ciphertext_b64) < 8:
        return ciphertext_b64

    # Skip if the string doesn't look like base64
    if not all(c in _BASE64_ALPHABET for c in ciphertext_b64):
        return ciphertext_b64

    # Candidate keys, in the same priority order as the original
    # one-attempt-per-block implementation.
    candidate_keys = [password]
    if len(password) > 30 and password.split():
        candidate_keys.append(password.split()[0])  # first word of the canary
    if "GUID" in password:
        candidate_keys.append(password.split("GUID")[1].strip())  # GUID part
    candidate_keys.append("MHGGF2022!")  # Known key for BrowseComp dataset

    for key_source in candidate_keys:
        result = _attempt_xor_decrypt(ciphertext_b64, key_source)
        if result is not None:
            logger.debug(f"Successfully decrypted: {result[:50]}...")
            return result

    # If all attempts fail, return the original
    logger.debug(f"All decryption attempts failed for: {ciphertext_b64[:20]}...")
    return ciphertext_b64
|
100
|
+
|
101
|
+
|
102
|
+
def get_known_answer_map() -> Dict[str, str]:
    """Get a mapping of known encrypted answers to their decrypted values.

    Maintains a catalog of known encrypted strings that could not be
    automatically decrypted, together with their verified plaintext
    values.

    Returns:
        Dictionary mapping encrypted strings to their plaintext values.
    """
    known_answers: Dict[str, str] = {}
    known_answers["dFoTn+K+bcdyWg=="] = "Tooth Rock"
    known_answers["ERFIwA=="] = "1945"
    # Add more mappings as they are discovered during benchmark runs
    return known_answers
|
@@ -0,0 +1,31 @@
|
|
1
|
+
"""
|
2
|
+
Dataset handling for benchmarks.
|
3
|
+
|
4
|
+
This is a legacy module that provides backwards compatibility with the old
|
5
|
+
dataset handling functions. New code should use the classes in the datasets
|
6
|
+
package directly.
|
7
|
+
|
8
|
+
Notes on BrowseComp dataset:
|
9
|
+
- BrowseComp data is encrypted with the canary string used as the decryption key
|
10
|
+
- The decrypt() function handles decrypting both problems and answers
|
11
|
+
- For some examples where standard decryption doesn't work, we use additional methods:
|
12
|
+
1. Try using various parts of the canary string as the key
|
13
|
+
2. Try using hardcoded keys that are known to work
|
14
|
+
3. Use a manual mapping for specific encrypted strings that have been verified
|
15
|
+
"""
|
16
|
+
|
17
|
+
import logging
|
18
|
+
from typing import Any, Dict, List, Optional
|
19
|
+
|
20
|
+
from .datasets import DatasetRegistry, load_dataset
|
21
|
+
|
22
|
+
logger = logging.getLogger(__name__)
|
23
|
+
|
24
|
+
# Re-export the default dataset URLs
|
25
|
+
from .datasets import DEFAULT_DATASET_URLS
|
26
|
+
|
27
|
+
# Re-export the get_available_datasets function
|
28
|
+
from .datasets import get_available_datasets
|
29
|
+
|
30
|
+
# Re-export the load_dataset function
|
31
|
+
__all__ = ['DEFAULT_DATASET_URLS', 'get_available_datasets', 'load_dataset']
|
@@ -0,0 +1,14 @@
|
|
1
|
+
"""
|
2
|
+
Efficiency submodule for speed and resource monitoring in Local Deep Research.
|
3
|
+
|
4
|
+
This module provides tools for measuring and optimizing execution speed
|
5
|
+
and resource usage of the research system.
|
6
|
+
"""
|
7
|
+
|
8
|
+
from local_deep_research.benchmarks.efficiency.speed_profiler import SpeedProfiler
|
9
|
+
from local_deep_research.benchmarks.efficiency.resource_monitor import ResourceMonitor
|
10
|
+
|
11
|
+
__all__ = [
|
12
|
+
'SpeedProfiler',
|
13
|
+
'ResourceMonitor',
|
14
|
+
]
|
@@ -0,0 +1,367 @@
|
|
1
|
+
"""
|
2
|
+
Resource monitoring tools for Local Deep Research.
|
3
|
+
|
4
|
+
This module provides functionality for tracking CPU, memory and other
|
5
|
+
system resource usage during the research process.
|
6
|
+
"""
|
7
|
+
|
8
|
+
import logging
|
9
|
+
import threading
|
10
|
+
import time
|
11
|
+
from contextlib import contextmanager
|
12
|
+
from typing import Dict, List, Optional, Any, Callable, Tuple
|
13
|
+
|
14
|
+
logger = logging.getLogger(__name__)
|
15
|
+
|
16
|
+
# Try to import psutil, but don't fail if not available
|
17
|
+
try:
|
18
|
+
import psutil
|
19
|
+
PSUTIL_AVAILABLE = True
|
20
|
+
except ImportError:
|
21
|
+
PSUTIL_AVAILABLE = False
|
22
|
+
logger.warning("psutil not available, resource monitoring will be limited")
|
23
|
+
|
24
|
+
|
25
|
+
class ResourceMonitor:
|
26
|
+
"""
|
27
|
+
Monitor system resource usage during research.
|
28
|
+
|
29
|
+
This class provides methods for tracking CPU, memory, and disk usage
|
30
|
+
during system execution. It can be used to identify resource bottlenecks
|
31
|
+
and optimize configurations for different hardware environments.
|
32
|
+
"""
|
33
|
+
|
34
|
+
def __init__(self,
|
35
|
+
sampling_interval: float = 1.0,
|
36
|
+
track_process: bool = True,
|
37
|
+
track_system: bool = True):
|
38
|
+
"""
|
39
|
+
Initialize the resource monitor.
|
40
|
+
|
41
|
+
Args:
|
42
|
+
sampling_interval: Seconds between resource usage measurements
|
43
|
+
track_process: Whether to track this process's resource usage
|
44
|
+
track_system: Whether to track overall system resource usage
|
45
|
+
"""
|
46
|
+
self.sampling_interval = sampling_interval
|
47
|
+
self.track_process = track_process
|
48
|
+
self.track_system = track_system
|
49
|
+
|
50
|
+
self.monitoring = False
|
51
|
+
self.monitor_thread = None
|
52
|
+
|
53
|
+
# Resource usage data
|
54
|
+
self.process_data = []
|
55
|
+
self.system_data = []
|
56
|
+
self.start_time = None
|
57
|
+
self.end_time = None
|
58
|
+
|
59
|
+
# Check if we can monitor resources
|
60
|
+
self.can_monitor = PSUTIL_AVAILABLE
|
61
|
+
if not self.can_monitor:
|
62
|
+
logger.warning("Resource monitoring requires psutil. Install with: pip install psutil")
|
63
|
+
|
64
|
+
def start(self):
|
65
|
+
"""Start monitoring resource usage."""
|
66
|
+
if not self.can_monitor:
|
67
|
+
logger.warning("Resource monitoring not available (psutil not installed)")
|
68
|
+
return
|
69
|
+
|
70
|
+
if self.monitoring:
|
71
|
+
logger.warning("Resource monitoring already started")
|
72
|
+
return
|
73
|
+
|
74
|
+
self.process_data = []
|
75
|
+
self.system_data = []
|
76
|
+
self.start_time = time.time()
|
77
|
+
self.monitoring = True
|
78
|
+
|
79
|
+
# Start monitoring in a background thread
|
80
|
+
self.monitor_thread = threading.Thread(
|
81
|
+
target=self._monitor_resources,
|
82
|
+
daemon=True
|
83
|
+
)
|
84
|
+
self.monitor_thread.start()
|
85
|
+
|
86
|
+
logger.info(f"Resource monitoring started with {self.sampling_interval}s interval")
|
87
|
+
|
88
|
+
def stop(self):
|
89
|
+
"""Stop monitoring resource usage."""
|
90
|
+
if not self.monitoring:
|
91
|
+
return
|
92
|
+
|
93
|
+
self.monitoring = False
|
94
|
+
self.end_time = time.time()
|
95
|
+
|
96
|
+
# Wait for the monitoring thread to finish
|
97
|
+
if self.monitor_thread:
|
98
|
+
self.monitor_thread.join(timeout=2.0)
|
99
|
+
self.monitor_thread = None
|
100
|
+
|
101
|
+
logger.info("Resource monitoring stopped")
|
102
|
+
|
103
|
+
def _monitor_resources(self):
|
104
|
+
"""Background thread that collects resource usage data."""
|
105
|
+
if not PSUTIL_AVAILABLE:
|
106
|
+
return
|
107
|
+
|
108
|
+
# Get this process
|
109
|
+
current_process = psutil.Process()
|
110
|
+
|
111
|
+
while self.monitoring:
|
112
|
+
timestamp = time.time()
|
113
|
+
|
114
|
+
try:
|
115
|
+
# Monitor this process
|
116
|
+
if self.track_process:
|
117
|
+
process_cpu = current_process.cpu_percent(interval=None)
|
118
|
+
process_memory = current_process.memory_info()
|
119
|
+
|
120
|
+
self.process_data.append({
|
121
|
+
'timestamp': timestamp,
|
122
|
+
'cpu_percent': process_cpu,
|
123
|
+
'memory_rss': process_memory.rss, # Resident Set Size in bytes
|
124
|
+
'memory_vms': process_memory.vms, # Virtual Memory Size in bytes
|
125
|
+
'memory_shared': getattr(process_memory, 'shared', 0),
|
126
|
+
'num_threads': current_process.num_threads(),
|
127
|
+
'open_files': len(current_process.open_files()),
|
128
|
+
'status': current_process.status()
|
129
|
+
})
|
130
|
+
|
131
|
+
# Monitor overall system
|
132
|
+
if self.track_system:
|
133
|
+
system_cpu = psutil.cpu_percent(interval=None)
|
134
|
+
system_memory = psutil.virtual_memory()
|
135
|
+
system_disk = psutil.disk_usage('/')
|
136
|
+
|
137
|
+
self.system_data.append({
|
138
|
+
'timestamp': timestamp,
|
139
|
+
'cpu_percent': system_cpu,
|
140
|
+
'memory_total': system_memory.total,
|
141
|
+
'memory_available': system_memory.available,
|
142
|
+
'memory_used': system_memory.used,
|
143
|
+
'memory_percent': system_memory.percent,
|
144
|
+
'disk_total': system_disk.total,
|
145
|
+
'disk_used': system_disk.used,
|
146
|
+
'disk_percent': system_disk.percent
|
147
|
+
})
|
148
|
+
|
149
|
+
except Exception as e:
|
150
|
+
logger.error(f"Error monitoring resources: {str(e)}")
|
151
|
+
|
152
|
+
# Sleep until next sampling interval
|
153
|
+
time.sleep(self.sampling_interval)
|
154
|
+
|
155
|
+
@contextmanager
|
156
|
+
def monitor(self):
|
157
|
+
"""
|
158
|
+
Context manager for monitoring resources during a block of code.
|
159
|
+
|
160
|
+
Example:
|
161
|
+
with resource_monitor.monitor():
|
162
|
+
# Code to monitor
|
163
|
+
do_something_resource_intensive()
|
164
|
+
"""
|
165
|
+
self.start()
|
166
|
+
try:
|
167
|
+
yield
|
168
|
+
finally:
|
169
|
+
self.stop()
|
170
|
+
|
171
|
+
def get_process_stats(self) -> Dict[str, Any]:
|
172
|
+
"""
|
173
|
+
Get statistics about this process's resource usage.
|
174
|
+
|
175
|
+
Returns:
|
176
|
+
Dictionary with process resource usage statistics
|
177
|
+
"""
|
178
|
+
if not self.process_data:
|
179
|
+
return {}
|
180
|
+
|
181
|
+
# Extract data series
|
182
|
+
timestamps = [d['timestamp'] for d in self.process_data]
|
183
|
+
cpu_values = [d['cpu_percent'] for d in self.process_data]
|
184
|
+
memory_values = [d['memory_rss'] / (1024 * 1024) for d in self.process_data] # Convert to MB
|
185
|
+
|
186
|
+
# Calculate statistics
|
187
|
+
stats = {
|
188
|
+
'start_time': self.start_time,
|
189
|
+
'end_time': self.end_time,
|
190
|
+
'duration': self.end_time - self.start_time if self.end_time else None,
|
191
|
+
'sample_count': len(self.process_data),
|
192
|
+
'cpu_min': min(cpu_values) if cpu_values else None,
|
193
|
+
'cpu_max': max(cpu_values) if cpu_values else None,
|
194
|
+
'cpu_avg': sum(cpu_values) / len(cpu_values) if cpu_values else None,
|
195
|
+
'memory_min_mb': min(memory_values) if memory_values else None,
|
196
|
+
'memory_max_mb': max(memory_values) if memory_values else None,
|
197
|
+
'memory_avg_mb': sum(memory_values) / len(memory_values) if memory_values else None,
|
198
|
+
'thread_max': max(d['num_threads'] for d in self.process_data) if self.process_data else None,
|
199
|
+
}
|
200
|
+
|
201
|
+
return stats
|
202
|
+
|
203
|
+
def get_system_stats(self) -> Dict[str, Any]:
|
204
|
+
"""
|
205
|
+
Get statistics about overall system resource usage.
|
206
|
+
|
207
|
+
Returns:
|
208
|
+
Dictionary with system resource usage statistics
|
209
|
+
"""
|
210
|
+
if not self.system_data:
|
211
|
+
return {}
|
212
|
+
|
213
|
+
# Extract data series
|
214
|
+
timestamps = [d['timestamp'] for d in self.system_data]
|
215
|
+
cpu_values = [d['cpu_percent'] for d in self.system_data]
|
216
|
+
memory_values = [d['memory_percent'] for d in self.system_data]
|
217
|
+
disk_values = [d['disk_percent'] for d in self.system_data]
|
218
|
+
|
219
|
+
# Calculate statistics
|
220
|
+
stats = {
|
221
|
+
'start_time': self.start_time,
|
222
|
+
'end_time': self.end_time,
|
223
|
+
'duration': self.end_time - self.start_time if self.end_time else None,
|
224
|
+
'sample_count': len(self.system_data),
|
225
|
+
'cpu_min': min(cpu_values) if cpu_values else None,
|
226
|
+
'cpu_max': max(cpu_values) if cpu_values else None,
|
227
|
+
'cpu_avg': sum(cpu_values) / len(cpu_values) if cpu_values else None,
|
228
|
+
'memory_min_percent': min(memory_values) if memory_values else None,
|
229
|
+
'memory_max_percent': max(memory_values) if memory_values else None,
|
230
|
+
'memory_avg_percent': sum(memory_values) / len(memory_values) if memory_values else None,
|
231
|
+
'disk_min_percent': min(disk_values) if disk_values else None,
|
232
|
+
'disk_max_percent': max(disk_values) if disk_values else None,
|
233
|
+
'disk_avg_percent': sum(disk_values) / len(disk_values) if disk_values else None,
|
234
|
+
'memory_total_gb': self.system_data[0]['memory_total'] / (1024**3) if self.system_data else None,
|
235
|
+
'disk_total_gb': self.system_data[0]['disk_total'] / (1024**3) if self.system_data else None,
|
236
|
+
}
|
237
|
+
|
238
|
+
return stats
|
239
|
+
|
240
|
+
def get_combined_stats(self) -> Dict[str, Any]:
|
241
|
+
"""
|
242
|
+
Get combined resource usage statistics.
|
243
|
+
|
244
|
+
Returns:
|
245
|
+
Dictionary with both process and system statistics
|
246
|
+
"""
|
247
|
+
process_stats = self.get_process_stats()
|
248
|
+
system_stats = self.get_system_stats()
|
249
|
+
|
250
|
+
# Combine stats
|
251
|
+
stats = {
|
252
|
+
'start_time': self.start_time,
|
253
|
+
'end_time': self.end_time,
|
254
|
+
'duration': self.end_time - self.start_time if self.end_time else None,
|
255
|
+
}
|
256
|
+
|
257
|
+
# Add process stats with 'process_' prefix
|
258
|
+
for key, value in process_stats.items():
|
259
|
+
if key not in ['start_time', 'end_time', 'duration']:
|
260
|
+
stats[f'process_{key}'] = value
|
261
|
+
|
262
|
+
# Add system stats with 'system_' prefix
|
263
|
+
for key, value in system_stats.items():
|
264
|
+
if key not in ['start_time', 'end_time', 'duration']:
|
265
|
+
stats[f'system_{key}'] = value
|
266
|
+
|
267
|
+
# Calculate derived metrics
|
268
|
+
if (process_stats.get('memory_max_mb') is not None and
|
269
|
+
system_stats.get('memory_total_gb') is not None):
|
270
|
+
|
271
|
+
# Process memory as percentage of total system memory
|
272
|
+
system_memory_mb = system_stats['memory_total_gb'] * 1024
|
273
|
+
stats['process_memory_percent'] = (
|
274
|
+
(process_stats['memory_max_mb'] / system_memory_mb) * 100
|
275
|
+
if system_memory_mb > 0 else 0
|
276
|
+
)
|
277
|
+
|
278
|
+
return stats
|
279
|
+
|
280
|
+
def print_summary(self):
|
281
|
+
"""Print a formatted summary of resource usage."""
|
282
|
+
process_stats = self.get_process_stats()
|
283
|
+
system_stats = self.get_system_stats()
|
284
|
+
|
285
|
+
print("\n===== RESOURCE USAGE SUMMARY =====")
|
286
|
+
|
287
|
+
if process_stats:
|
288
|
+
print("\n--- Process Resources ---")
|
289
|
+
print(f"CPU usage: {process_stats.get('cpu_avg', 0):.1f}% avg, "
|
290
|
+
f"{process_stats.get('cpu_max', 0):.1f}% peak")
|
291
|
+
print(f"Memory usage: {process_stats.get('memory_avg_mb', 0):.1f} MB avg, "
|
292
|
+
f"{process_stats.get('memory_max_mb', 0):.1f} MB peak")
|
293
|
+
print(f"Threads: {process_stats.get('thread_max', 0)} max")
|
294
|
+
|
295
|
+
if system_stats:
|
296
|
+
print("\n--- System Resources ---")
|
297
|
+
print(f"CPU usage: {system_stats.get('cpu_avg', 0):.1f}% avg, "
|
298
|
+
f"{system_stats.get('cpu_max', 0):.1f}% peak")
|
299
|
+
print(f"Memory usage: {system_stats.get('memory_avg_percent', 0):.1f}% avg, "
|
300
|
+
f"{system_stats.get('memory_max_percent', 0):.1f}% peak "
|
301
|
+
f"(Total: {system_stats.get('memory_total_gb', 0):.1f} GB)")
|
302
|
+
print(f"Disk usage: {system_stats.get('disk_avg_percent', 0):.1f}% avg "
|
303
|
+
f"(Total: {system_stats.get('disk_total_gb', 0):.1f} GB)")
|
304
|
+
|
305
|
+
print("\n===================================")
|
306
|
+
|
307
|
+
def export_data(self) -> Dict[str, Any]:
|
308
|
+
"""
|
309
|
+
Export all collected data.
|
310
|
+
|
311
|
+
Returns:
|
312
|
+
Dictionary with all collected resource usage data
|
313
|
+
"""
|
314
|
+
return {
|
315
|
+
'start_time': self.start_time,
|
316
|
+
'end_time': self.end_time,
|
317
|
+
'sampling_interval': self.sampling_interval,
|
318
|
+
'process_data': self.process_data,
|
319
|
+
'system_data': self.system_data
|
320
|
+
}
|
321
|
+
|
322
|
+
|
323
|
+
def check_system_resources() -> Dict[str, Any]:
    """
    Check current system resources.

    Takes a one-shot snapshot of CPU, memory, and disk usage via psutil.

    Returns:
        Dictionary with current resource usage information. Contains
        ``'available': False`` and an ``'error'`` message when psutil is
        missing or the snapshot fails.
    """
    if not PSUTIL_AVAILABLE:
        return {
            'error': 'psutil not available',
            'available': False
        }

    gib = 1024**3
    try:
        memory = psutil.virtual_memory()
        disk = psutil.disk_usage('/')

        return {
            'available': True,
            'cpu_count': psutil.cpu_count(logical=True),
            'cpu_physical': psutil.cpu_count(logical=False),
            'cpu_percent': psutil.cpu_percent(interval=0.1),
            'memory_total_gb': memory.total / gib,
            'memory_available_gb': memory.available / gib,
            'memory_used_gb': memory.used / gib,
            'memory_percent': memory.percent,
            'disk_total_gb': disk.total / gib,
            'disk_free_gb': disk.free / gib,
            'disk_percent': disk.percent
        }
    except Exception as e:
        logger.error(f"Error checking system resources: {str(e)}")
        return {
            'error': str(e),
            'available': False
        }
|