remdb 0.3.118-py3-none-any.whl → 0.3.146-py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of remdb might be problematic.
- rem/agentic/agents/sse_simulator.py +2 -0
- rem/agentic/context.py +23 -3
- rem/agentic/mcp/tool_wrapper.py +126 -15
- rem/agentic/otel/setup.py +1 -0
- rem/agentic/providers/phoenix.py +371 -108
- rem/agentic/providers/pydantic_ai.py +122 -43
- rem/agentic/schema.py +4 -1
- rem/api/mcp_router/tools.py +13 -2
- rem/api/routers/chat/completions.py +250 -4
- rem/api/routers/chat/models.py +81 -7
- rem/api/routers/chat/otel_utils.py +33 -0
- rem/api/routers/chat/sse_events.py +17 -1
- rem/api/routers/chat/streaming.py +35 -1
- rem/api/routers/feedback.py +134 -14
- rem/auth/middleware.py +66 -1
- rem/cli/commands/cluster.py +590 -82
- rem/cli/commands/configure.py +3 -4
- rem/cli/commands/experiments.py +468 -76
- rem/cli/commands/session.py +336 -0
- rem/cli/dreaming.py +2 -2
- rem/cli/main.py +2 -0
- rem/config.py +8 -1
- rem/models/core/experiment.py +58 -14
- rem/models/entities/ontology.py +1 -1
- rem/models/entities/ontology_config.py +1 -1
- rem/schemas/agents/examples/contract-analyzer.yaml +1 -1
- rem/schemas/agents/examples/contract-extractor.yaml +1 -1
- rem/schemas/agents/examples/cv-parser.yaml +1 -1
- rem/services/phoenix/client.py +59 -18
- rem/services/postgres/pydantic_to_sqlalchemy.py +9 -12
- rem/services/session/compression.py +7 -0
- rem/settings.py +260 -17
- rem/sql/migrations/002_install_models.sql +91 -91
- rem/sql/migrations/004_cache_system.sql +1 -1
- rem/utils/README.md +45 -0
- rem/utils/files.py +157 -1
- rem/utils/schema_loader.py +94 -3
- rem/utils/vision.py +1 -1
- rem/workers/__init__.py +2 -1
- rem/workers/db_listener.py +579 -0
- {remdb-0.3.118.dist-info → remdb-0.3.146.dist-info}/METADATA +161 -147
- {remdb-0.3.118.dist-info → remdb-0.3.146.dist-info}/RECORD +44 -41
- {remdb-0.3.118.dist-info → remdb-0.3.146.dist-info}/WHEEL +0 -0
- {remdb-0.3.118.dist-info → remdb-0.3.146.dist-info}/entry_points.txt +0 -0
rem/utils/files.py
CHANGED
@@ -3,13 +3,18 @@ File utilities for consistent file handling throughout REM.
 
 Provides context managers and helpers for temporary file operations,
 ensuring proper cleanup and consistent patterns.
+
+Also provides DataFrame I/O utilities using Polars with automatic
+format detection based on file extension.
 """
 
 import tempfile
 from contextlib import contextmanager
+from io import BytesIO
 from pathlib import Path
-from typing import Generator, Optional
+from typing import Generator, Optional, Union
 
+import polars as pl
 from loguru import logger
 
 
@@ -165,3 +170,154 @@ def safe_delete(path: Path) -> bool:
     except Exception as e:
         logger.warning(f"Failed to delete {path}: {e}")
         return False
+
+
+# Extension to Polars reader mapping
+_EXTENSION_READERS = {
+    ".csv": pl.read_csv,
+    ".tsv": lambda p, **kw: pl.read_csv(p, separator="\t", **kw),
+    ".parquet": pl.read_parquet,
+    ".pq": pl.read_parquet,
+    ".json": pl.read_json,
+    ".jsonl": pl.read_ndjson,
+    ".ndjson": pl.read_ndjson,
+    ".avro": pl.read_avro,
+    ".xlsx": pl.read_excel,
+    ".xls": pl.read_excel,
+    ".ods": pl.read_ods,
+    ".ipc": pl.read_ipc,
+    ".arrow": pl.read_ipc,
+    ".feather": pl.read_ipc,
+}
+
+# Extension to Polars writer mapping
+_EXTENSION_WRITERS = {
+    ".csv": "write_csv",
+    ".tsv": "write_csv",  # with separator="\t"
+    ".parquet": "write_parquet",
+    ".pq": "write_parquet",
+    ".json": "write_json",
+    ".jsonl": "write_ndjson",
+    ".ndjson": "write_ndjson",
+    ".avro": "write_avro",
+    ".xlsx": "write_excel",
+    ".ipc": "write_ipc",
+    ".arrow": "write_ipc",
+    ".feather": "write_ipc",
+}
+
+
+def read_dataframe(
+    source: Union[str, Path, bytes],
+    filename: Optional[str] = None,
+    **kwargs,
+) -> pl.DataFrame:
+    """
+    Read a DataFrame from a file, inferring format from extension.
+
+    Supports all Polars-compatible formats:
+    - CSV (.csv), TSV (.tsv)
+    - Parquet (.parquet, .pq)
+    - JSON (.json), JSONL/NDJSON (.jsonl, .ndjson)
+    - Avro (.avro)
+    - Excel (.xlsx, .xls)
+    - OpenDocument (.ods)
+    - Arrow IPC (.ipc, .arrow, .feather)
+
+    Args:
+        source: File path (str/Path) or bytes content
+        filename: Required when source is bytes, to determine format
+        **kwargs: Additional arguments passed to the Polars reader
+
+    Returns:
+        Polars DataFrame
+
+    Raises:
+        ValueError: If format cannot be determined or is unsupported
+
+    Examples:
+        >>> df = read_dataframe("data.csv")
+        >>> df = read_dataframe("data.parquet")
+        >>> df = read_dataframe(csv_bytes, filename="data.csv")
+    """
+    # Determine the file extension
+    if isinstance(source, bytes):
+        if not filename:
+            raise ValueError("filename is required when source is bytes")
+        ext = Path(filename).suffix.lower()
+        # For bytes, we need to wrap in BytesIO
+        file_like = BytesIO(source)
+    else:
+        path = Path(source)
+        ext = path.suffix.lower()
+        file_like = path
+
+    # Get the appropriate reader
+    reader = _EXTENSION_READERS.get(ext)
+    if reader is None:
+        supported = ", ".join(sorted(_EXTENSION_READERS.keys()))
+        raise ValueError(
+            f"Unsupported file format: {ext}. "
+            f"Supported formats: {supported}"
+        )
+
+    try:
+        return reader(file_like, **kwargs)
+    except Exception as e:
+        logger.error(f"Failed to read DataFrame from {ext} format: {e}")
+        raise
+
+
+def write_dataframe(
+    df: pl.DataFrame,
+    dest: Union[str, Path],
+    **kwargs,
+) -> None:
+    """
+    Write a DataFrame to a file, inferring format from extension.
+
+    Supports most Polars-writable formats:
+    - CSV (.csv), TSV (.tsv)
+    - Parquet (.parquet, .pq)
+    - JSON (.json), JSONL/NDJSON (.jsonl, .ndjson)
+    - Avro (.avro)
+    - Excel (.xlsx)
+    - Arrow IPC (.ipc, .arrow, .feather)
+
+    Args:
+        df: Polars DataFrame to write
+        dest: Destination file path
+        **kwargs: Additional arguments passed to the Polars writer
+
+    Raises:
+        ValueError: If format cannot be determined or is unsupported
+
+    Examples:
+        >>> write_dataframe(df, "output.csv")
+        >>> write_dataframe(df, "output.parquet")
+        >>> write_dataframe(df, "output.jsonl")
+    """
+    path = Path(dest)
+    ext = path.suffix.lower()
+
+    writer_method = _EXTENSION_WRITERS.get(ext)
+    if writer_method is None:
+        supported = ", ".join(sorted(_EXTENSION_WRITERS.keys()))
+        raise ValueError(
+            f"Unsupported file format for writing: {ext}. "
+            f"Supported formats: {supported}"
+        )
+
+    # Ensure parent directory exists
+    ensure_parent_exists(path)
+
+    # Handle TSV special case
+    if ext == ".tsv":
+        kwargs.setdefault("separator", "\t")
+
+    try:
+        writer = getattr(df, writer_method)
+        writer(path, **kwargs)
+    except Exception as e:
+        logger.error(f"Failed to write DataFrame to {ext} format: {e}")
+        raise
rem/utils/schema_loader.py
CHANGED
@@ -195,7 +195,7 @@ def load_agent_schema(
     """
     Load agent schema from YAML file with unified search logic and caching.
 
-    Schema names are case-invariant - "
+    Schema names are case-invariant - "Rem", "rem", "REM" all resolve to the same schema.
 
     Filesystem schemas are cached indefinitely (immutable, versioned with code).
     Database schemas (future) will be cached with TTL for invalidation.
@@ -271,10 +271,20 @@ def load_agent_schema(
     # 2. Normalize name for package resource search (lowercase)
     base_name = cache_key
 
-    # 3. Try custom schema paths (from registry + SCHEMA__PATHS env var)
+    # 3. Try custom schema paths (from registry + SCHEMA__PATHS env var + auto-detected)
     from ..registry import get_schema_paths
 
     custom_paths = get_schema_paths()
+
+    # Auto-detect local folders if they exist (convention over configuration)
+    auto_detect_folders = ["./agents", "./schemas", "./evaluators"]
+    for auto_folder in auto_detect_folders:
+        auto_path = Path(auto_folder)
+        if auto_path.exists() and auto_path.is_dir():
+            resolved = str(auto_path.resolve())
+            if resolved not in custom_paths:
+                custom_paths.insert(0, resolved)
+                logger.debug(f"Auto-detected schema directory: {auto_folder}")
     for custom_dir in custom_paths:
         # Try various patterns within each custom directory
         for pattern in [
@@ -400,9 +410,20 @@ async def load_agent_schema_async(
 
     base_name = cache_key
 
-    # Try custom schema paths
+    # Try custom schema paths (from registry + SCHEMA__PATHS env var + auto-detected)
     from ..registry import get_schema_paths
     custom_paths = get_schema_paths()
+
+    # Auto-detect local folders if they exist (convention over configuration)
+    auto_detect_folders = ["./agents", "./schemas", "./evaluators"]
+    for auto_folder in auto_detect_folders:
+        auto_path = Path(auto_folder)
+        if auto_path.exists() and auto_path.is_dir():
+            resolved = str(auto_path.resolve())
+            if resolved not in custom_paths:
+                custom_paths.insert(0, resolved)
+                logger.debug(f"Auto-detected schema directory: {auto_folder}")
+
     for custom_dir in custom_paths:
         for pattern in [f"{base_name}.yaml", f"{base_name}.yml", f"agents/{base_name}.yaml"]:
             custom_path = Path(custom_dir) / pattern
@@ -490,3 +511,73 @@ def validate_agent_schema(schema: dict[str, Any]) -> bool:
 
     logger.debug("Schema validation passed")
     return True
+
+
+def get_evaluator_schema_path(evaluator_name: str) -> Path | None:
+    """
+    Find the file path to an evaluator schema.
+
+    Searches standard locations for the evaluator schema YAML file:
+    - ./evaluators/{name}.yaml (local project)
+    - Custom schema paths from registry
+    - Package resources: schemas/evaluators/{name}.yaml
+
+    Args:
+        evaluator_name: Name of the evaluator (e.g., "mental-health-classifier")
+
+    Returns:
+        Path to the evaluator schema file, or None if not found
+
+    Example:
+        >>> path = get_evaluator_schema_path("mental-health-classifier")
+        >>> if path:
+        ...     print(f"Found evaluator at: {path}")
+    """
+    from ..registry import get_schema_paths
+
+    base_name = evaluator_name.lower().replace('.yaml', '').replace('.yml', '')
+
+    # 1. Try custom schema paths (from registry + auto-detected)
+    custom_paths = get_schema_paths()
+
+    # Auto-detect local folders
+    auto_detect_folders = ["./evaluators", "./schemas", "./agents"]
+    for auto_folder in auto_detect_folders:
+        auto_path = Path(auto_folder)
+        if auto_path.exists() and auto_path.is_dir():
+            resolved = str(auto_path.resolve())
+            if resolved not in custom_paths:
+                custom_paths.insert(0, resolved)
+
+    for custom_dir in custom_paths:
+        # Try various patterns within each custom directory
+        for pattern in [
+            f"{base_name}.yaml",
+            f"{base_name}.yml",
+            f"evaluators/{base_name}.yaml",
+        ]:
+            custom_path = Path(custom_dir) / pattern
+            if custom_path.exists():
+                logger.debug(f"Found evaluator schema: {custom_path}")
+                return custom_path
+
+    # 2. Try package resources
+    evaluator_search_paths = [
+        f"schemas/evaluators/{base_name}.yaml",
+        f"schemas/evaluators/rem/{base_name}.yaml",
+    ]
+
+    for search_path in evaluator_search_paths:
+        try:
+            schema_ref = importlib.resources.files("rem") / search_path
+            schema_path = Path(str(schema_ref))
+
+            if schema_path.exists():
+                logger.debug(f"Found evaluator schema in package: {schema_path}")
+                return schema_path
+        except Exception as e:
+            logger.debug(f"Could not check {search_path}: {e}")
+            continue
+
+    logger.warning(f"Evaluator schema not found: {evaluator_name}")
+    return None
rem/utils/vision.py
CHANGED
rem/workers/__init__.py
CHANGED
@@ -1,6 +1,7 @@
 """Background workers for processing tasks."""
 
+from .db_listener import DBListener
 from .sqs_file_processor import SQSFileProcessor
 from .unlogged_maintainer import UnloggedMaintainer
 
-__all__ = ["SQSFileProcessor", "UnloggedMaintainer"]
+__all__ = ["DBListener", "SQSFileProcessor", "UnloggedMaintainer"]