PyPI - remdb - Versions diffs - 0.2.6__py3-none-any.whl - Mend

remdb 0.2.6__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of remdb might be problematic. Click here for more details.

Files changed (187) hide show

rem/__init__.py +2 -0
rem/agentic/README.md +650 -0
rem/agentic/__init__.py +39 -0
rem/agentic/agents/README.md +155 -0
rem/agentic/agents/__init__.py +8 -0
rem/agentic/context.py +148 -0
rem/agentic/context_builder.py +329 -0
rem/agentic/mcp/__init__.py +0 -0
rem/agentic/mcp/tool_wrapper.py +107 -0
rem/agentic/otel/__init__.py +5 -0
rem/agentic/otel/setup.py +151 -0
rem/agentic/providers/phoenix.py +674 -0
rem/agentic/providers/pydantic_ai.py +572 -0
rem/agentic/query.py +117 -0
rem/agentic/query_helper.py +89 -0
rem/agentic/schema.py +396 -0
rem/agentic/serialization.py +245 -0
rem/agentic/tools/__init__.py +5 -0
rem/agentic/tools/rem_tools.py +231 -0
rem/api/README.md +420 -0
rem/api/main.py +324 -0
rem/api/mcp_router/prompts.py +182 -0
rem/api/mcp_router/resources.py +536 -0
rem/api/mcp_router/server.py +213 -0
rem/api/mcp_router/tools.py +584 -0
rem/api/routers/auth.py +229 -0
rem/api/routers/chat/__init__.py +5 -0
rem/api/routers/chat/completions.py +281 -0
rem/api/routers/chat/json_utils.py +76 -0
rem/api/routers/chat/models.py +124 -0
rem/api/routers/chat/streaming.py +185 -0
rem/auth/README.md +258 -0
rem/auth/__init__.py +26 -0
rem/auth/middleware.py +100 -0
rem/auth/providers/__init__.py +13 -0
rem/auth/providers/base.py +376 -0
rem/auth/providers/google.py +163 -0
rem/auth/providers/microsoft.py +237 -0
rem/cli/README.md +455 -0
rem/cli/__init__.py +8 -0
rem/cli/commands/README.md +126 -0
rem/cli/commands/__init__.py +3 -0
rem/cli/commands/ask.py +565 -0
rem/cli/commands/configure.py +423 -0
rem/cli/commands/db.py +493 -0
rem/cli/commands/dreaming.py +324 -0
rem/cli/commands/experiments.py +1124 -0
rem/cli/commands/mcp.py +66 -0
rem/cli/commands/process.py +245 -0
rem/cli/commands/schema.py +183 -0
rem/cli/commands/serve.py +106 -0
rem/cli/dreaming.py +363 -0
rem/cli/main.py +88 -0
rem/config.py +237 -0
rem/mcp_server.py +41 -0
rem/models/core/__init__.py +49 -0
rem/models/core/core_model.py +64 -0
rem/models/core/engram.py +333 -0
rem/models/core/experiment.py +628 -0
rem/models/core/inline_edge.py +132 -0
rem/models/core/rem_query.py +243 -0
rem/models/entities/__init__.py +43 -0
rem/models/entities/file.py +57 -0
rem/models/entities/image_resource.py +88 -0
rem/models/entities/message.py +35 -0
rem/models/entities/moment.py +123 -0
rem/models/entities/ontology.py +191 -0
rem/models/entities/ontology_config.py +131 -0
rem/models/entities/resource.py +95 -0
rem/models/entities/schema.py +87 -0
rem/models/entities/user.py +85 -0
rem/py.typed +0 -0
rem/schemas/README.md +507 -0
rem/schemas/__init__.py +6 -0
rem/schemas/agents/README.md +92 -0
rem/schemas/agents/core/moment-builder.yaml +178 -0
rem/schemas/agents/core/rem-query-agent.yaml +226 -0
rem/schemas/agents/core/resource-affinity-assessor.yaml +99 -0
rem/schemas/agents/core/simple-assistant.yaml +19 -0
rem/schemas/agents/core/user-profile-builder.yaml +163 -0
rem/schemas/agents/examples/contract-analyzer.yaml +317 -0
rem/schemas/agents/examples/contract-extractor.yaml +134 -0
rem/schemas/agents/examples/cv-parser.yaml +263 -0
rem/schemas/agents/examples/hello-world.yaml +37 -0
rem/schemas/agents/examples/query.yaml +54 -0
rem/schemas/agents/examples/simple.yaml +21 -0
rem/schemas/agents/examples/test.yaml +29 -0
rem/schemas/agents/rem.yaml +128 -0
rem/schemas/evaluators/hello-world/default.yaml +77 -0
rem/schemas/evaluators/rem/faithfulness.yaml +219 -0
rem/schemas/evaluators/rem/lookup-correctness.yaml +182 -0
rem/schemas/evaluators/rem/retrieval-precision.yaml +199 -0
rem/schemas/evaluators/rem/retrieval-recall.yaml +211 -0
rem/schemas/evaluators/rem/search-correctness.yaml +192 -0
rem/services/__init__.py +16 -0
rem/services/audio/INTEGRATION.md +308 -0
rem/services/audio/README.md +376 -0
rem/services/audio/__init__.py +15 -0
rem/services/audio/chunker.py +354 -0
rem/services/audio/transcriber.py +259 -0
rem/services/content/README.md +1269 -0
rem/services/content/__init__.py +5 -0
rem/services/content/providers.py +806 -0
rem/services/content/service.py +657 -0
rem/services/dreaming/README.md +230 -0
rem/services/dreaming/__init__.py +53 -0
rem/services/dreaming/affinity_service.py +336 -0
rem/services/dreaming/moment_service.py +264 -0
rem/services/dreaming/ontology_service.py +54 -0
rem/services/dreaming/user_model_service.py +297 -0
rem/services/dreaming/utils.py +39 -0
rem/services/embeddings/__init__.py +11 -0
rem/services/embeddings/api.py +120 -0
rem/services/embeddings/worker.py +421 -0
rem/services/fs/README.md +662 -0
rem/services/fs/__init__.py +62 -0
rem/services/fs/examples.py +206 -0
rem/services/fs/examples_paths.py +204 -0
rem/services/fs/git_provider.py +935 -0
rem/services/fs/local_provider.py +760 -0
rem/services/fs/parsing-hooks-examples.md +172 -0
rem/services/fs/paths.py +276 -0
rem/services/fs/provider.py +460 -0
rem/services/fs/s3_provider.py +1042 -0
rem/services/fs/service.py +186 -0
rem/services/git/README.md +1075 -0
rem/services/git/__init__.py +17 -0
rem/services/git/service.py +469 -0
rem/services/phoenix/EXPERIMENT_DESIGN.md +1146 -0
rem/services/phoenix/README.md +453 -0
rem/services/phoenix/__init__.py +46 -0
rem/services/phoenix/client.py +686 -0
rem/services/phoenix/config.py +88 -0
rem/services/phoenix/prompt_labels.py +477 -0
rem/services/postgres/README.md +575 -0
rem/services/postgres/__init__.py +23 -0
rem/services/postgres/migration_service.py +427 -0
rem/services/postgres/pydantic_to_sqlalchemy.py +232 -0
rem/services/postgres/register_type.py +352 -0
rem/services/postgres/repository.py +337 -0
rem/services/postgres/schema_generator.py +379 -0
rem/services/postgres/service.py +802 -0
rem/services/postgres/sql_builder.py +354 -0
rem/services/rem/README.md +304 -0
rem/services/rem/__init__.py +23 -0
rem/services/rem/exceptions.py +71 -0
rem/services/rem/executor.py +293 -0
rem/services/rem/parser.py +145 -0
rem/services/rem/queries.py +196 -0
rem/services/rem/query.py +371 -0
rem/services/rem/service.py +527 -0
rem/services/session/README.md +374 -0
rem/services/session/__init__.py +6 -0
rem/services/session/compression.py +360 -0
rem/services/session/reload.py +77 -0
rem/settings.py +1235 -0
rem/sql/002_install_models.sql +1068 -0
rem/sql/background_indexes.sql +42 -0
rem/sql/install_models.sql +1038 -0
rem/sql/migrations/001_install.sql +503 -0
rem/sql/migrations/002_install_models.sql +1202 -0
rem/utils/AGENTIC_CHUNKING.md +597 -0
rem/utils/README.md +583 -0
rem/utils/__init__.py +43 -0
rem/utils/agentic_chunking.py +622 -0
rem/utils/batch_ops.py +343 -0
rem/utils/chunking.py +108 -0
rem/utils/clip_embeddings.py +276 -0
rem/utils/dict_utils.py +98 -0
rem/utils/embeddings.py +423 -0
rem/utils/examples/embeddings_example.py +305 -0
rem/utils/examples/sql_types_example.py +202 -0
rem/utils/markdown.py +16 -0
rem/utils/model_helpers.py +236 -0
rem/utils/schema_loader.py +229 -0
rem/utils/sql_types.py +348 -0
rem/utils/user_id.py +81 -0
rem/utils/vision.py +330 -0
rem/workers/README.md +506 -0
rem/workers/__init__.py +5 -0
rem/workers/dreaming.py +502 -0
rem/workers/engram_processor.py +312 -0
rem/workers/sqs_file_processor.py +193 -0
remdb-0.2.6.dist-info/METADATA +1191 -0
remdb-0.2.6.dist-info/RECORD +187 -0
remdb-0.2.6.dist-info/WHEEL +4 -0
remdb-0.2.6.dist-info/entry_points.txt +2 -0

rem/cli/dreaming.py ADDED Viewed

@@ -0,0 +1,363 @@
+"""
+REM Dreaming CLI - Memory indexing and insight extraction.
+Command-line interface for running dreaming workers to build the
+REM knowledge graph through user model updates, moment construction,
+and resource affinity operations.
+Commands:
+- user-model: Update user profiles from activity
+- moments: Extract temporal narratives from resources
+- affinity: Build semantic relationships between resources
+- custom: Run custom extractors on user's resources/sessions (listed here, but no `custom` command is defined in this module)
+- full: Run complete dreaming workflow (all operations)
+Usage Examples:
+```bash
+# Update user model for specific user
+rem-dreaming user-model --user-id=user-123
+# Extract moments with custom lookback
+rem-dreaming moments --user-id=user-123 --lookback-hours=48
+# Build resource affinity (semantic mode, fast)
+rem-dreaming affinity --user-id=user-123
+# Build resource affinity (LLM mode, intelligent but expensive)
+rem-dreaming affinity --user-id=user-123 --use-llm --limit=100
+# Run custom extractor on user's data
+rem-dreaming custom --user-id=user-123 --extractor cv-parser-v1
+rem-dreaming custom --user-id=user-123 --extractor contract-analyzer-v1 --lookback-hours=168
+# Run full workflow for user
+rem-dreaming full --user-id=user-123
+# Process all active users (daily cron)
+rem-dreaming full --all-users
+# Process with custom REM API endpoint
+rem-dreaming full --user-id=user-123 --rem-api-url=http://localhost:8000
+```
+Environment Variables:
+- REM_API_URL: REM API endpoint (default: http://rem-api:8000)
+- REM_EMBEDDING_PROVIDER: Embedding provider (default: text-embedding-3-small)
+- REM_DEFAULT_MODEL: LLM model (default: gpt-4o)
+- REM_LOOKBACK_HOURS: Default lookback window (default: 24)
+- OPENAI_API_KEY: OpenAI API key
+Exit Codes:
+- 0: Success
+- 1: Validation error (missing required args)
+- 2: Execution error (worker failed)
+"""
+import asyncio
+import os
+import sys
+from typing import Optional
+import typer
+from rich.console import Console
+from rich.progress import Progress, SpinnerColumn, TextColumn
+from rem.workers.dreaming import (
+    AffinityMode,
+    DreamingWorker,
+    TaskType,
+)
+app = typer.Typer(
+    name="rem-dreaming",
+    help="REM dreaming worker for memory indexing",
+    add_completion=False,
+)
+console = Console()
+def get_worker() -> DreamingWorker:
+    """Create dreaming worker from environment."""
+    return DreamingWorker(
+        rem_api_url=os.getenv("REM_API_URL", "http://rem-api:8000"),
+        embedding_provider=os.getenv(
+            "REM_EMBEDDING_PROVIDER", "text-embedding-3-small"
+        ),
+        default_model=os.getenv("REM_DEFAULT_MODEL", "gpt-4o"),
+        lookback_hours=int(os.getenv("REM_LOOKBACK_HOURS", "24")),
+    )
+@app.command()
+def user_model(
+    user_id: str = typer.Option(..., help="User ID to process"),
+    max_sessions: int = typer.Option(100, help="Max sessions to analyze"),
+    max_moments: int = typer.Option(20, help="Max moments to include"),
+    max_resources: int = typer.Option(20, help="Max resources to include"),
+):
+    """
+    Update user model from recent activity.
+    Reads recent sessions, moments, and resources to generate
+    a comprehensive user profile summary using LLM analysis.
+    """
+    async def run():
+        worker = get_worker()
+        try:
+            with Progress(
+                SpinnerColumn(),
+                TextColumn("[progress.description]{task.description}"),
+                console=console,
+            ) as progress:
+                task = progress.add_task(
+                    f"Updating user model for {user_id}...", total=None
+                )
+                result = await worker.update_user_model(
+                    user_id=user_id,
+                    max_sessions=max_sessions,
+                    max_moments=max_moments,
+                    max_resources=max_resources,
+                )
+                progress.update(task, completed=True)
+                console.print(f"[green]✓[/green] User model updated")
+                console.print(result)
+        except Exception as e:
+            console.print(f"[red]✗[/red] Failed: {e}", style="red")
+            sys.exit(2)
+        finally:
+            await worker.close()
+    asyncio.run(run())
+@app.command()
+def moments(
+    user_id: str = typer.Option(..., help="User ID to process"),
+    lookback_hours: Optional[int] = typer.Option(
+        None, help="Hours to look back (default: from env)"
+    ),
+    limit: Optional[int] = typer.Option(None, help="Max resources to process"),
+):
+    """
+    Extract moments from resources.
+    Analyzes recent resources to identify temporal narratives
+    (meetings, coding sessions, conversations) and creates
+    Moment entities with temporal boundaries and metadata.
+    """
+    async def run():
+        worker = get_worker()
+        try:
+            with Progress(
+                SpinnerColumn(),
+                TextColumn("[progress.description]{task.description}"),
+                console=console,
+            ) as progress:
+                task = progress.add_task(
+                    f"Constructing moments for {user_id}...", total=None
+                )
+                result = await worker.construct_moments(
+                    user_id=user_id,
+                    lookback_hours=lookback_hours,
+                    limit=limit,
+                )
+                progress.update(task, completed=True)
+                console.print(f"[green]✓[/green] Moments constructed")
+                console.print(result)
+        except Exception as e:
+            console.print(f"[red]✗[/red] Failed: {e}", style="red")
+            sys.exit(2)
+        finally:
+            await worker.close()
+    asyncio.run(run())
+@app.command()
+def affinity(
+    user_id: str = typer.Option(..., help="User ID to process"),
+    use_llm: bool = typer.Option(
+        False, "--use-llm", help="Use LLM mode (expensive, use --limit)"
+    ),
+    lookback_hours: Optional[int] = typer.Option(
+        None, help="Hours to look back (default: from env)"
+    ),
+    limit: Optional[int] = typer.Option(
+        None, help="Max resources to process (REQUIRED for LLM mode)"
+    ),
+):
+    """
+    Build resource affinity graph.
+    Creates semantic relationships between resources using either
+    vector similarity (fast, default) or LLM analysis (intelligent but expensive).
+    Semantic Mode (default):
+    - Fast vector similarity search
+    - No LLM calls, just embedding cosine similarity
+    - Good for frequent updates
+    LLM Mode (--use-llm):
+    - Intelligent relationship assessment
+    - Expensive: ALWAYS use --limit to control costs
+    - Good for deep analysis (weekly or monthly)
+    Example:
+        # Semantic mode (fast, cheap)
+        rem-dreaming affinity --user-id=user-123
+        # LLM mode (intelligent, expensive)
+        rem-dreaming affinity --user-id=user-123 --use-llm --limit=100
+    """
+    if use_llm and not limit:
+        console.print(
+            "[red]Error:[/red] --limit is REQUIRED when using --use-llm to control costs",
+            style="red",
+        )
+        sys.exit(1)
+    async def run():
+        worker = get_worker()
+        try:
+            mode = AffinityMode.LLM if use_llm else AffinityMode.SEMANTIC
+            mode_str = "LLM" if use_llm else "semantic"
+            with Progress(
+                SpinnerColumn(),
+                TextColumn("[progress.description]{task.description}"),
+                console=console,
+            ) as progress:
+                task = progress.add_task(
+                    f"Building {mode_str} affinity for {user_id}...", total=None
+                )
+                result = await worker.build_affinity(
+                    user_id=user_id,
+                    mode=mode,
+                    lookback_hours=lookback_hours,
+                    limit=limit,
+                )
+                progress.update(task, completed=True)
+                console.print(f"[green]✓[/green] Resource affinity built ({mode_str} mode)")
+                console.print(result)
+        except Exception as e:
+            console.print(f"[red]✗[/red] Failed: {e}", style="red")
+            sys.exit(2)
+        finally:
+            await worker.close()
+    asyncio.run(run())
+@app.command()
+def full(
+    user_id: Optional[str] = typer.Option(None, help="User ID (or --all-users)"),
+    all_users: bool = typer.Option(
+        False, "--all-users", help="Process all active users"
+    ),
+    use_llm_affinity: bool = typer.Option(
+        False, "--use-llm-affinity", help="Use LLM mode for affinity (expensive)"
+    ),
+    lookback_hours: Optional[int] = typer.Option(
+        None, help="Hours to look back (default: from env)"
+    ),
+):
+    """
+    Run complete dreaming workflow.
+    Executes all dreaming operations in sequence:
+    1. Update user model
+    2. Construct moments
+    3. Build resource affinity
+    Recommended for daily cron execution.
+    Examples:
+        # Process single user
+        rem-dreaming full --user-id=user-123
+        # Process all active users (daily cron)
+        rem-dreaming full --all-users
+        # Use LLM affinity mode (expensive)
+        rem-dreaming full --user-id=user-123 --use-llm-affinity
+    """
+    if not user_id and not all_users:
+        console.print(
+            "[red]Error:[/red] Either --user-id or --all-users is required",
+            style="red",
+        )
+        sys.exit(1)
+    if user_id and all_users:
+        console.print(
+            "[red]Error:[/red] Cannot use both --user-id and --all-users",
+            style="red",
+        )
+        sys.exit(1)
+    async def run():
+        worker = get_worker()
+        try:
+            if all_users:
+                with Progress(
+                    SpinnerColumn(),
+                    TextColumn("[progress.description]{task.description}"),
+                    console=console,
+                ) as progress:
+                    task = progress.add_task("Processing all users...", total=None)
+                    results = await worker.process_all_users(
+                        task_type=TaskType.FULL,
+                        use_llm_affinity=use_llm_affinity,
+                        lookback_hours=lookback_hours,
+                    )
+                    progress.update(task, completed=True)
+                    console.print(
+                        f"[green]✓[/green] Processed {len(results)} users"
+                    )
+                    for result in results:
+                        console.print(result)
+            else:
+                with Progress(
+                    SpinnerColumn(),
+                    TextColumn("[progress.description]{task.description}"),
+                    console=console,
+                ) as progress:
+                    task = progress.add_task(
+                        f"Running full workflow for {user_id}...", total=None
+                    )
+                    result = await worker.process_full(
+                        user_id=user_id,
+                        use_llm_affinity=use_llm_affinity,
+                        lookback_hours=lookback_hours,
+                    )
+                    progress.update(task, completed=True)
+                    console.print(f"[green]✓[/green] Full workflow completed")
+                    console.print(result)
+        except Exception as e:
+            console.print(f"[red]✗[/red] Failed: {e}", style="red")
+            sys.exit(2)
+        finally:
+            await worker.close()
+    asyncio.run(run())
+def main():
+    """Entry point."""
+    app()
+if __name__ == "__main__":
+    main()

rem/cli/main.py ADDED Viewed

@@ -0,0 +1,88 @@
+"""
+REM CLI entry point.
+Usage:
+    rem db schema generate --models src/rem/models/entities
+    rem db schema validate
+    rem db migrate up
+    rem dev run-server
+"""
+import sys
+from pathlib import Path
+import click
+from loguru import logger
+@click.group()
+@click.option("--verbose", "-v", is_flag=True, help="Enable verbose logging")
+def cli(verbose: bool):
+    """REM - Resources Entities Moments system CLI."""
+    if verbose:
+        logger.remove()
+        logger.add(sys.stderr, level="DEBUG")
+    else:
+        logger.remove()
+        logger.add(sys.stderr, level="INFO")
+@cli.group()
+def db():
+    """Database operations (schema, migrate, status, etc.)."""
+    pass
+@db.group()
+def schema():
+    """Database schema management commands."""
+    pass
+@cli.group()
+def dev():
+    """Development utilities."""
+    pass
+@cli.group()
+def process():
+    """File processing commands."""
+    pass
+@cli.group()
+def dreaming():
+    """Memory indexing and knowledge extraction."""
+    pass
+# Register commands
+# These imports sit below the group definitions rather than at the top of the file.
+# NOTE(review): presumably this avoids circular imports with the command modules - confirm.
+from .commands.schema import register_commands as register_schema_commands
+from .commands.db import register_commands as register_db_commands
+from .commands.process import register_commands as register_process_commands
+from .commands.ask import register_command as register_ask_command
+from .commands.dreaming import register_commands as register_dreaming_commands
+from .commands.experiments import experiments as experiments_group
+from .commands.configure import register_command as register_configure_command
+from .commands.serve import register_command as register_serve_command
+from .commands.mcp import register_command as register_mcp_command
+# Each sub-group defined above is handed to its module's register_commands().
+register_schema_commands(schema)
+register_db_commands(db)
+register_process_commands(process)
+register_dreaming_commands(dreaming)
+# These modules receive the root `cli` group itself.
+register_ask_command(cli)
+register_configure_command(cli)
+register_serve_command(cli)
+register_mcp_command(cli)
+# `experiments` is imported as a ready-made object and added to the root group directly.
+cli.add_command(experiments_group)
+def main():
+    """Main entry point for CLI."""
+    cli()
+if __name__ == "__main__":
+    main()

rem/config.py ADDED Viewed

@@ -0,0 +1,237 @@
+"""
+REM Configuration Management.
+Provides persistent configuration in ~/.rem/config.yaml with environment variable overrides.
+Configuration Precedence (highest to lowest):
+1. Environment variables (POSTGRES__CONNECTION_STRING, etc.)
+2. ~/.rem/config.yaml (user configuration)
+3. Default values (from settings.py)
+File Format (~/.rem/config.yaml):
+    postgres:
+      connection_string: postgresql://user:pass@localhost:5432/rem
+      pool_min_size: 5
+      pool_max_size: 20
+    llm:
+      default_model: anthropic:claude-sonnet-4-5-20250929
+      openai_api_key: sk-...
+      anthropic_api_key: sk-ant-...
+    s3:
+      bucket_name: rem-storage
+      region: us-east-1
+      endpoint_url: http://localhost:9000
+    # Additional custom environment variables
+    env:
+      MY_CUSTOM_VAR: value
+Usage:
+    from rem.config import load_config, get_config_path, ensure_config_dir
+    # Load configuration and merge with environment
+    config = load_config()
+    # Get configuration file path
+    config_path = get_config_path()
+    # Ensure ~/.rem directory exists
+    ensure_config_dir()
+"""
+import os
+from pathlib import Path
+from typing import Any
+import yaml
+from loguru import logger
+def get_rem_home() -> Path:
+    """
+    Get REM home directory (~/.rem).
+    Returns:
+        Path to ~/.rem directory
+    """
+    return Path.home() / ".rem"
+def ensure_config_dir() -> Path:
+    """
+    Ensure ~/.rem directory exists.
+    Returns:
+        Path to ~/.rem directory
+    """
+    rem_home = get_rem_home()
+    rem_home.mkdir(exist_ok=True, mode=0o700)  # User-only permissions
+    return rem_home
+def get_config_path() -> Path:
+    """
+    Get path to configuration file (~/.rem/config.yaml).
+    Returns:
+        Path to configuration file
+    """
+    return get_rem_home() / "config.yaml"
+def config_exists() -> bool:
+    """
+    Check if configuration file exists.
+    Returns:
+        True if ~/.rem/config.yaml exists
+    """
+    return get_config_path().exists()
+def load_config() -> dict[str, Any]:
+    """
+    Load configuration from ~/.rem/config.yaml.
+    Returns:
+        Configuration dictionary (empty if file doesn't exist)
+    """
+    config_path = get_config_path()
+    if not config_path.exists():
+        logger.debug(f"Configuration file not found: {config_path}")
+        return {}
+    try:
+        with open(config_path, "r") as f:
+            config = yaml.safe_load(f) or {}
+            logger.debug(f"Loaded configuration from {config_path}")
+            return config
+    except Exception as e:
+        logger.warning(f"Failed to load configuration from {config_path}: {e}")
+        return {}
+def save_config(config: dict[str, Any]) -> None:
+    """
+    Save configuration to ~/.rem/config.yaml.
+    Args:
+        config: Configuration dictionary to save
+    """
+    ensure_config_dir()
+    config_path = get_config_path()
+    try:
+        with open(config_path, "w") as f:
+            yaml.dump(config, f, default_flow_style=False, sort_keys=False)
+            logger.info(f"Configuration saved to {config_path}")
+    except Exception as e:
+        logger.error(f"Failed to save configuration to {config_path}: {e}")
+        raise
+def merge_config_to_env(config: dict[str, Any]) -> None:
+    """
+    Merge configuration file into environment variables.
+    This allows Pydantic Settings to pick up values from the config file
+    by setting environment variables before settings initialization.
+    Precedence:
+    - Existing environment variables are NOT overwritten
+    - Only sets env vars if they don't already exist
+    Args:
+        config: Configuration dictionary from ~/.rem/config.yaml
+    Example:
+        config = {"postgres": {"connection_string": "postgresql://..."}}
+        merge_config_to_env(config)
+        # Sets POSTGRES__CONNECTION_STRING if not already set
+    """
+    # Handle custom env vars first
+    if "env" in config:
+        for key, value in config["env"].items():
+            if key not in os.environ:
+                os.environ[key] = str(value)
+                logger.debug(f"Set env var from config: {key}")
+    # Convert nested config to environment variables
+    for section, values in config.items():
+        if section == "env":
+            continue  # Already handled
+        if not isinstance(values, dict):
+            continue
+        for key, value in values.items():
+            # Convert to environment variable format (SECTION__KEY)
+            env_key = f"{section.upper()}__{key.upper()}"
+            # Only set if not already in environment
+            if env_key not in os.environ:
+                os.environ[env_key] = str(value)
+                logger.debug(f"Set env var from config: {env_key}")
+def validate_config(config: dict[str, Any]) -> list[str]:
+    """
+    Validate configuration for required fields.
+    Args:
+        config: Configuration dictionary
+    Returns:
+        List of validation error messages (empty if valid)
+    """
+    errors = []
+    # Postgres connection is required
+    postgres = config.get("postgres", {})
+    if not postgres.get("connection_string"):
+        errors.append("PostgreSQL connection string is required (postgres.connection_string)")
+    # Validate connection string format
+    conn_str = postgres.get("connection_string", "")
+    if conn_str and not conn_str.startswith("postgresql://"):
+        errors.append("PostgreSQL connection string must start with 'postgresql://'")
+    return errors
+def get_default_config() -> dict[str, Any]:
+    """
+    Get default configuration template for new installations.
+    Returns:
+        Default configuration dictionary
+    """
+    return {
+        "postgres": {
+            "connection_string": "postgresql://rem:rem@localhost:5432/rem",
+            "pool_min_size": 5,
+            "pool_max_size": 20,
+        },
+        "llm": {
+            "default_model": "anthropic:claude-sonnet-4-5-20250929",
+            "default_temperature": 0.5,
+            # API keys will be prompted for in wizard
+            # "openai_api_key": "",
+            # "anthropic_api_key": "",
+        },
+        "s3": {
+            "bucket_name": "rem-storage",
+            "region": "us-east-1",
+            # Optional fields
+            # "endpoint_url": "http://localhost:9000",  # For MinIO
+            # "access_key_id": "",
+            # "secret_access_key": "",
+        },
+        "env": {
+            # Custom environment variables
+            # "MY_VAR": "value",
+        },
+    }