PyPI - remdb - Versions diffs - 0.2.6__py3-none-any.whl - Mend

remdb 0.2.6__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of remdb might be problematic. Click here for more details.

Files changed (187) hide show

rem/__init__.py +2 -0
rem/agentic/README.md +650 -0
rem/agentic/__init__.py +39 -0
rem/agentic/agents/README.md +155 -0
rem/agentic/agents/__init__.py +8 -0
rem/agentic/context.py +148 -0
rem/agentic/context_builder.py +329 -0
rem/agentic/mcp/__init__.py +0 -0
rem/agentic/mcp/tool_wrapper.py +107 -0
rem/agentic/otel/__init__.py +5 -0
rem/agentic/otel/setup.py +151 -0
rem/agentic/providers/phoenix.py +674 -0
rem/agentic/providers/pydantic_ai.py +572 -0
rem/agentic/query.py +117 -0
rem/agentic/query_helper.py +89 -0
rem/agentic/schema.py +396 -0
rem/agentic/serialization.py +245 -0
rem/agentic/tools/__init__.py +5 -0
rem/agentic/tools/rem_tools.py +231 -0
rem/api/README.md +420 -0
rem/api/main.py +324 -0
rem/api/mcp_router/prompts.py +182 -0
rem/api/mcp_router/resources.py +536 -0
rem/api/mcp_router/server.py +213 -0
rem/api/mcp_router/tools.py +584 -0
rem/api/routers/auth.py +229 -0
rem/api/routers/chat/__init__.py +5 -0
rem/api/routers/chat/completions.py +281 -0
rem/api/routers/chat/json_utils.py +76 -0
rem/api/routers/chat/models.py +124 -0
rem/api/routers/chat/streaming.py +185 -0
rem/auth/README.md +258 -0
rem/auth/__init__.py +26 -0
rem/auth/middleware.py +100 -0
rem/auth/providers/__init__.py +13 -0
rem/auth/providers/base.py +376 -0
rem/auth/providers/google.py +163 -0
rem/auth/providers/microsoft.py +237 -0
rem/cli/README.md +455 -0
rem/cli/__init__.py +8 -0
rem/cli/commands/README.md +126 -0
rem/cli/commands/__init__.py +3 -0
rem/cli/commands/ask.py +565 -0
rem/cli/commands/configure.py +423 -0
rem/cli/commands/db.py +493 -0
rem/cli/commands/dreaming.py +324 -0
rem/cli/commands/experiments.py +1124 -0
rem/cli/commands/mcp.py +66 -0
rem/cli/commands/process.py +245 -0
rem/cli/commands/schema.py +183 -0
rem/cli/commands/serve.py +106 -0
rem/cli/dreaming.py +363 -0
rem/cli/main.py +88 -0
rem/config.py +237 -0
rem/mcp_server.py +41 -0
rem/models/core/__init__.py +49 -0
rem/models/core/core_model.py +64 -0
rem/models/core/engram.py +333 -0
rem/models/core/experiment.py +628 -0
rem/models/core/inline_edge.py +132 -0
rem/models/core/rem_query.py +243 -0
rem/models/entities/__init__.py +43 -0
rem/models/entities/file.py +57 -0
rem/models/entities/image_resource.py +88 -0
rem/models/entities/message.py +35 -0
rem/models/entities/moment.py +123 -0
rem/models/entities/ontology.py +191 -0
rem/models/entities/ontology_config.py +131 -0
rem/models/entities/resource.py +95 -0
rem/models/entities/schema.py +87 -0
rem/models/entities/user.py +85 -0
rem/py.typed +0 -0
rem/schemas/README.md +507 -0
rem/schemas/__init__.py +6 -0
rem/schemas/agents/README.md +92 -0
rem/schemas/agents/core/moment-builder.yaml +178 -0
rem/schemas/agents/core/rem-query-agent.yaml +226 -0
rem/schemas/agents/core/resource-affinity-assessor.yaml +99 -0
rem/schemas/agents/core/simple-assistant.yaml +19 -0
rem/schemas/agents/core/user-profile-builder.yaml +163 -0
rem/schemas/agents/examples/contract-analyzer.yaml +317 -0
rem/schemas/agents/examples/contract-extractor.yaml +134 -0
rem/schemas/agents/examples/cv-parser.yaml +263 -0
rem/schemas/agents/examples/hello-world.yaml +37 -0
rem/schemas/agents/examples/query.yaml +54 -0
rem/schemas/agents/examples/simple.yaml +21 -0
rem/schemas/agents/examples/test.yaml +29 -0
rem/schemas/agents/rem.yaml +128 -0
rem/schemas/evaluators/hello-world/default.yaml +77 -0
rem/schemas/evaluators/rem/faithfulness.yaml +219 -0
rem/schemas/evaluators/rem/lookup-correctness.yaml +182 -0
rem/schemas/evaluators/rem/retrieval-precision.yaml +199 -0
rem/schemas/evaluators/rem/retrieval-recall.yaml +211 -0
rem/schemas/evaluators/rem/search-correctness.yaml +192 -0
rem/services/__init__.py +16 -0
rem/services/audio/INTEGRATION.md +308 -0
rem/services/audio/README.md +376 -0
rem/services/audio/__init__.py +15 -0
rem/services/audio/chunker.py +354 -0
rem/services/audio/transcriber.py +259 -0
rem/services/content/README.md +1269 -0
rem/services/content/__init__.py +5 -0
rem/services/content/providers.py +806 -0
rem/services/content/service.py +657 -0
rem/services/dreaming/README.md +230 -0
rem/services/dreaming/__init__.py +53 -0
rem/services/dreaming/affinity_service.py +336 -0
rem/services/dreaming/moment_service.py +264 -0
rem/services/dreaming/ontology_service.py +54 -0
rem/services/dreaming/user_model_service.py +297 -0
rem/services/dreaming/utils.py +39 -0
rem/services/embeddings/__init__.py +11 -0
rem/services/embeddings/api.py +120 -0
rem/services/embeddings/worker.py +421 -0
rem/services/fs/README.md +662 -0
rem/services/fs/__init__.py +62 -0
rem/services/fs/examples.py +206 -0
rem/services/fs/examples_paths.py +204 -0
rem/services/fs/git_provider.py +935 -0
rem/services/fs/local_provider.py +760 -0
rem/services/fs/parsing-hooks-examples.md +172 -0
rem/services/fs/paths.py +276 -0
rem/services/fs/provider.py +460 -0
rem/services/fs/s3_provider.py +1042 -0
rem/services/fs/service.py +186 -0
rem/services/git/README.md +1075 -0
rem/services/git/__init__.py +17 -0
rem/services/git/service.py +469 -0
rem/services/phoenix/EXPERIMENT_DESIGN.md +1146 -0
rem/services/phoenix/README.md +453 -0
rem/services/phoenix/__init__.py +46 -0
rem/services/phoenix/client.py +686 -0
rem/services/phoenix/config.py +88 -0
rem/services/phoenix/prompt_labels.py +477 -0
rem/services/postgres/README.md +575 -0
rem/services/postgres/__init__.py +23 -0
rem/services/postgres/migration_service.py +427 -0
rem/services/postgres/pydantic_to_sqlalchemy.py +232 -0
rem/services/postgres/register_type.py +352 -0
rem/services/postgres/repository.py +337 -0
rem/services/postgres/schema_generator.py +379 -0
rem/services/postgres/service.py +802 -0
rem/services/postgres/sql_builder.py +354 -0
rem/services/rem/README.md +304 -0
rem/services/rem/__init__.py +23 -0
rem/services/rem/exceptions.py +71 -0
rem/services/rem/executor.py +293 -0
rem/services/rem/parser.py +145 -0
rem/services/rem/queries.py +196 -0
rem/services/rem/query.py +371 -0
rem/services/rem/service.py +527 -0
rem/services/session/README.md +374 -0
rem/services/session/__init__.py +6 -0
rem/services/session/compression.py +360 -0
rem/services/session/reload.py +77 -0
rem/settings.py +1235 -0
rem/sql/002_install_models.sql +1068 -0
rem/sql/background_indexes.sql +42 -0
rem/sql/install_models.sql +1038 -0
rem/sql/migrations/001_install.sql +503 -0
rem/sql/migrations/002_install_models.sql +1202 -0
rem/utils/AGENTIC_CHUNKING.md +597 -0
rem/utils/README.md +583 -0
rem/utils/__init__.py +43 -0
rem/utils/agentic_chunking.py +622 -0
rem/utils/batch_ops.py +343 -0
rem/utils/chunking.py +108 -0
rem/utils/clip_embeddings.py +276 -0
rem/utils/dict_utils.py +98 -0
rem/utils/embeddings.py +423 -0
rem/utils/examples/embeddings_example.py +305 -0
rem/utils/examples/sql_types_example.py +202 -0
rem/utils/markdown.py +16 -0
rem/utils/model_helpers.py +236 -0
rem/utils/schema_loader.py +229 -0
rem/utils/sql_types.py +348 -0
rem/utils/user_id.py +81 -0
rem/utils/vision.py +330 -0
rem/workers/README.md +506 -0
rem/workers/__init__.py +5 -0
rem/workers/dreaming.py +502 -0
rem/workers/engram_processor.py +312 -0
rem/workers/sqs_file_processor.py +193 -0
remdb-0.2.6.dist-info/METADATA +1191 -0
remdb-0.2.6.dist-info/RECORD +187 -0
remdb-0.2.6.dist-info/WHEEL +4 -0
remdb-0.2.6.dist-info/entry_points.txt +2 -0

rem/cli/commands/README.md ADDED Viewed

@@ -0,0 +1,126 @@
+# REM CLI Commands
+## Configuration (`rem configure`)
+Interactive configuration wizard for REM setup.
+### Quick Start
+```bash
+# Basic configuration (creates ~/.rem/config.yaml)
+rem configure
+# Configure + install database tables
+rem configure --install
+# Configure + install + register with Claude Desktop
+rem configure --install --claude-desktop
+```
+### Managing Configuration
+```bash
+# View current configuration
+rem configure --show
+# Edit configuration file
+rem configure --edit  # Opens in $EDITOR (defaults to vim)
+# Or edit manually
+vim ~/.rem/config.yaml
+```
+### Configuration File Structure
+`~/.rem/config.yaml`:
+```yaml
+postgres:
+  connection_string: postgresql://user:pass@localhost:5432/rem
+  pool_min_size: 5
+  pool_max_size: 20
+llm:
+  default_model: anthropic:claude-sonnet-4-5-20250929
+  default_temperature: 0.5
+  openai_api_key: sk-...
+  anthropic_api_key: sk-ant-...
+s3:
+  bucket_name: rem-storage
+  region: us-east-1
+  # Optional: for MinIO/LocalStack
+  endpoint_url: http://localhost:9000
+  access_key_id: minioadmin
+  secret_access_key: minioadmin
+```
+### Environment Variables
+All configuration can be overridden via environment variables, using a double underscore (`__`) as the delimiter between the section name and the setting name:
+```bash
+# Postgres
+export POSTGRES__CONNECTION_STRING=postgresql://user:pass@host:5432/db
+export POSTGRES__POOL_MIN_SIZE=5
+export POSTGRES__POOL_MAX_SIZE=20
+# LLM
+export LLM__DEFAULT_MODEL=anthropic:claude-sonnet-4-5-20250929
+export LLM__OPENAI_API_KEY=sk-...
+export LLM__ANTHROPIC_API_KEY=sk-ant-...
+# S3
+export S3__BUCKET_NAME=rem-storage
+export S3__REGION=us-east-1
+```
+### Configuration Precedence
+1. **Environment variables** (highest priority)
+2. **Configuration file** (`~/.rem/config.yaml`)
+3. **Default values** (from `rem/settings.py`)
+### Docker/Kubernetes
+In containerized environments, use environment variables exclusively:
+```yaml
+# docker-compose.yml
+services:
+  rem-api:
+    image: rem:latest
+    environment:
+      POSTGRES__CONNECTION_STRING: postgresql://rem:rem@postgres:5432/rem
+      LLM__OPENAI_API_KEY: ${OPENAI_API_KEY}
+```
+```yaml
+# Kubernetes ConfigMap/Secret
+apiVersion: v1
+kind: Secret
+metadata:
+  name: rem-secrets
+stringData:
+  POSTGRES__CONNECTION_STRING: postgresql://rem:rem@postgres:5432/rem
+  LLM__OPENAI_API_KEY: sk-...
+```
+## Other Commands
+- **`rem ask`** - Interactive chat with REM memory
+- **`rem serve`** - Start FastAPI server
+- **`rem db`** - Database management (migrate, seed, etc.)
+- **`rem schema`** - Schema generation and validation
+- **`rem mcp`** - MCP server commands
+- **`rem dreaming`** - Background knowledge processing
+- **`rem process`** - File processing utilities
+- **`rem experiments`** - Experiment management (datasets, prompts, traces, runs)
+Run `rem COMMAND --help` for detailed usage of each command.
+## See Also
+- [README.md](../../../../../README.md) - Main documentation
+- [CLAUDE.md](../../../../../CLAUDE.md) - Architecture overview
+- [settings.py](../../settings.py) - All available settings

rem/cli/commands/__init__.py ADDED Viewed

@@ -0,0 +1,3 @@
+"""
+CLI commands for REM.
+"""

rem/cli/commands/ask.py ADDED Viewed

@@ -0,0 +1,565 @@
+"""
+CLI command for testing Pydantic AI agents.
+Usage:
+    rem ask query-agent "Find all documents by Sarah" --model anthropic:claude-sonnet-4-5-20250929
+    rem ask schemas/query-agent.yaml "What is the weather?" --temperature 0.7 --max-turns 5
+    rem ask my-agent "Hello" --stream --version 1.2.0
+"""
+import asyncio
+import json
+import sys
+from pathlib import Path
+from typing import Any
+import click
+from loguru import logger
+from ...agentic.context import AgentContext
+from ...agentic.providers.pydantic_ai import create_agent
+from ...agentic.query import AgentQuery
+from ...settings import settings
+from ...utils.schema_loader import load_agent_schema
+async def load_schema_from_registry(
+    name: str, version: str | None = None
+) -> dict[str, Any]:
+    """
+    Load agent schema from registry (database or cache).
+    TODO: Implement schema registry with:
+    - Database table: agent_schemas (name, version, schema_json, created_at)
+    - Cache layer: Redis/in-memory for fast lookups
+    - Versioning: semantic versioning with latest fallback
+    Args:
+        name: Schema name (e.g., "query-agent", "rem-agents-query-agent")
+        version: Optional version (e.g., "1.2.0", defaults to latest)
+    Returns:
+        Agent schema as dictionary
+    Example:
+        schema = await load_schema_from_registry("query-agent", version="1.0.0")
+    """
+    # TODO: Implement database/cache lookup
+    # from ...db import get_db_pool
+    # async with get_db_pool() as pool:
+    #     if version:
+    #         query = "SELECT schema_json FROM agent_schemas WHERE name = $1 AND version = $2"
+    #         row = await pool.fetchrow(query, name, version)
+    #     else:
+    #         query = "SELECT schema_json FROM agent_schemas WHERE name = $1 ORDER BY created_at DESC LIMIT 1"
+    #         row = await pool.fetchrow(query, name)
+    #
+    #     if not row:
+    #         raise ValueError(f"Schema not found: {name} (version: {version or 'latest'})")
+    #
+    #     return json.loads(row["schema_json"])
+    raise NotImplementedError(
+        f"Schema registry not implemented yet. Please use a file path instead.\n"
+        f"Attempted to load: {name} (version: {version or 'latest'})"
+    )
+async def run_agent_streaming(
+    agent,
+    prompt: str,
+    max_turns: int = 10,
+    context: AgentContext | None = None,
+    max_iterations: int | None = None,
+) -> None:
+    """
+    Run agent in streaming mode using agent.iter() with usage limits.
+    Design Pattern (from carrier):
+    - Use agent.iter() for complete execution with tool call visibility
+    - run_stream() stops after first output, missing tool calls
+    - Stream tool call markers: [Calling: tool_name]
+    - Stream text content deltas as they arrive
+    - Show final structured result
+    Args:
+        agent: Pydantic AI agent
+        prompt: Complete prompt (includes system context + history + query)
+        max_turns: Maximum turns for agent execution (not used in current API)
+        context: Optional AgentContext for session persistence
+        max_iterations: Maximum iterations/requests (from agent schema or settings)
+    """
+    from datetime import datetime, timezone
+    from pydantic_ai import UsageLimits
+    logger.info("Running agent in streaming mode...")
+    try:
+        # Import event types for streaming
+        from pydantic_ai import Agent as PydanticAgent
+        from pydantic_ai.messages import PartStartEvent, PartDeltaEvent, TextPartDelta, ToolCallPart
+        # Accumulate assistant response for session persistence
+        assistant_response_parts = []
+        # Use agent.iter() to get complete execution with tool calls
+        usage_limits = UsageLimits(request_limit=max_iterations) if max_iterations else None
+        async with agent.iter(prompt, usage_limits=usage_limits) as agent_run:
+            async for node in agent_run:
+                # Check if this is a model request node (includes tool calls and text)
+                if PydanticAgent.is_model_request_node(node):
+                    # Stream events from model request
+                    request_stream: Any
+                    async with node.stream(agent_run.ctx) as request_stream:
+                        async for event in request_stream:
+                            # Tool call start event
+                            if isinstance(event, PartStartEvent) and isinstance(
+                                event.part, ToolCallPart
+                            ):
+                                tool_marker = f"\n[Calling: {event.part.tool_name}]"
+                                print(tool_marker, flush=True)
+                                assistant_response_parts.append(tool_marker)
+                            # Text content delta
+                            elif isinstance(event, PartDeltaEvent) and isinstance(
+                                event.delta, TextPartDelta
+                            ):
+                                print(event.delta.content_delta, end="", flush=True)
+                                assistant_response_parts.append(event.delta.content_delta)
+        print("\n")  # Final newline after streaming
+        # Get final result from agent_run
+        result = agent_run.result
+        if hasattr(result, "output"):
+            logger.info("Final structured result:")
+            output = result.output
+            from rem.agentic.serialization import serialize_agent_result
+            output_json = json.dumps(serialize_agent_result(output), indent=2)
+            print(output_json)
+            assistant_response_parts.append(f"\n{output_json}")
+        # Save session messages (if session_id provided and postgres enabled)
+        if context and context.session_id and settings.postgres.enabled:
+            from ...services.session.compression import SessionMessageStore
+            # Extract just the user query from prompt
+            # Prompt format from ContextBuilder: system + history + user message
+            # We need to extract the last user message
+            user_message_content = prompt.split("\n\n")[-1] if "\n\n" in prompt else prompt
+            user_message = {
+                "role": "user",
+                "content": user_message_content,
+                "timestamp": datetime.now(timezone.utc).isoformat(),
+            }
+            assistant_message = {
+                "role": "assistant",
+                "content": "".join(assistant_response_parts),
+                "timestamp": datetime.now(timezone.utc).isoformat(),
+            }
+            # Store messages with compression
+            store = SessionMessageStore(user_id=context.user_id or settings.test.effective_user_id)
+            await store.store_session_messages(
+                session_id=context.session_id,
+                messages=[user_message, assistant_message],
+                user_id=context.user_id,
+                compress=True,
+            )
+            logger.debug(f"Saved conversation to session {context.session_id}")
+    except Exception as e:
+        logger.error(f"Agent execution failed: {e}")
+        raise
+async def run_agent_non_streaming(
+    agent,
+    prompt: str,
+    max_turns: int = 10,
+    output_file: Path | None = None,
+    context: AgentContext | None = None,
+    plan: bool = False,
+    max_iterations: int | None = None,
+) -> dict[str, Any] | None:
+    """
+    Run agent in non-streaming mode using agent.run() with usage limits.
+    Args:
+        agent: Pydantic AI agent
+        prompt: Complete prompt (includes system context + history + query)
+        max_turns: Maximum turns for agent execution (not used in current API)
+        output_file: Optional path to save output
+        context: Optional AgentContext for session persistence
+        plan: If True, output only the generated query (for query-agent)
+        max_iterations: Maximum iterations/requests (from agent schema or settings)
+    Returns:
+        Output data if successful, None otherwise
+    """
+    from datetime import datetime, timezone
+    from pydantic_ai import UsageLimits
+    logger.info("Running agent in non-streaming mode...")
+    try:
+        # Run agent and get complete result with usage limits
+        usage_limits = UsageLimits(request_limit=max_iterations) if max_iterations else None
+        result = await agent.run(prompt, usage_limits=usage_limits)
+        # Extract output data
+        output_data = None
+        assistant_content = None
+        if hasattr(result, "output"):
+            output = result.output
+            from rem.agentic.serialization import serialize_agent_result
+            output_data = serialize_agent_result(output)
+            if plan and isinstance(output_data, dict) and "query" in output_data:
+                # Plan mode: Output only the query
+                # Use sql formatting if possible or just raw string
+                assistant_content = output_data["query"]
+                print(assistant_content)
+            else:
+                # Normal mode
+                assistant_content = json.dumps(output_data, indent=2)
+                print(assistant_content)
+        else:
+            # Fallback for text-only results
+            assistant_content = str(result)
+            print(assistant_content)
+        # Save to file if requested
+        if output_file and output_data:
+            await _save_output_file(output_file, output_data)
+        # Save session messages (if session_id provided and postgres enabled)
+        if context and context.session_id and settings.postgres.enabled:
+            from ...services.session.compression import SessionMessageStore
+            # Extract just the user query from prompt
+            # Prompt format from ContextBuilder: system + history + user message
+            # We need to extract the last user message
+            user_message_content = prompt.split("\n\n")[-1] if "\n\n" in prompt else prompt
+            user_message = {
+                "role": "user",
+                "content": user_message_content,
+                "timestamp": datetime.now(timezone.utc).isoformat(),
+            }
+            assistant_message = {
+                "role": "assistant",
+                "content": assistant_content,
+                "timestamp": datetime.now(timezone.utc).isoformat(),
+            }
+            # Store messages with compression
+            store = SessionMessageStore(user_id=context.user_id or settings.test.effective_user_id)
+            await store.store_session_messages(
+                session_id=context.session_id,
+                messages=[user_message, assistant_message],
+                user_id=context.user_id,
+                compress=True,
+            )
+            logger.debug(f"Saved conversation to session {context.session_id}")
+        return output_data
+    except Exception as e:
+        logger.error(f"Agent execution failed: {e}")
+        raise
+async def _load_input_file(
+    file_path: Path, user_id: str | None = None
+) -> str:
+    """
+    Load content from input file using ContentService.
+    Simple parse operation - just extracts content without creating Resources.
+    Args:
+        file_path: Path to input file
+        user_id: Optional user ID (not used for simple parse)
+    Returns:
+        Parsed file content as string (markdown format)
+    """
+    from ...services.content import ContentService
+    # Create ContentService instance
+    content_service = ContentService()
+    # Parse file (read-only, no database writes)
+    logger.info(f"Parsing file: {file_path}")
+    result = content_service.process_uri(str(file_path))
+    content = result["content"]
+    logger.info(
+        f"Loaded {len(content)} characters from {file_path.suffix} file using {result['provider']}"
+    )
+    return content
+async def _save_output_file(file_path: Path, data: dict[str, Any]) -> None:
+    """
+    Save output data to file in YAML format.
+    Args:
+        file_path: Path to output file
+        data: Data to save
+    """
+    import yaml
+    with open(file_path, "w", encoding="utf-8") as f:
+        yaml.safe_dump(data, f, default_flow_style=False, allow_unicode=True, sort_keys=False)
+    logger.success(f"Output saved to: {file_path}")
+@click.command()
+@click.argument("name_or_query")
+@click.argument("query", required=False)
+@click.option(
+    "--model",
+    "-m",
+    default=None,
+    help=f"LLM model (default: {settings.llm.default_model})",
+)
+@click.option(
+    "--temperature",
+    "-t",
+    type=float,
+    default=None,
+    help=f"Temperature for generation (default: {settings.llm.default_temperature})",
+)
+@click.option(
+    "--max-turns",
+    type=int,
+    default=10,
+    help="Maximum turns for agent execution (default: 10)",
+)
+@click.option(
+    "--version",
+    "-v",
+    default=None,
+    help="Schema version (for registry lookup, defaults to latest)",
+)
+@click.option(
+    "--stream/--no-stream",
+    default=False,
+    help="Enable streaming mode (default: disabled)",
+)
+@click.option(
+    "--user-id",
+    default="test-user",
+    help="User ID for context (default: test-user)",
+)
+@click.option(
+    "--session-id",
+    default=None,
+    help="Session ID for context (default: auto-generated)",
+)
+@click.option(
+    "--input-file",
+    "-i",
+    type=click.Path(exists=True, path_type=Path),
+    default=None,
+    help="Read input from file instead of QUERY argument (supports PDF, TXT, Markdown)",
+)
+@click.option(
+    "--output-file",
+    "-o",
+    type=click.Path(path_type=Path),
+    default=None,
+    help="Write output to file (YAML format)",
+)
+@click.option(
+    "--plan",
+    is_flag=True,
+    default=False,
+    help="Output only the generated plan/query (useful for query-agent)",
+)
+def ask(
+    name_or_query: str,
+    query: str | None,
+    model: str | None,
+    temperature: float | None,
+    max_turns: int,
+    version: str | None,
+    stream: bool,
+    user_id: str,
+    session_id: str | None,
+    input_file: Path | None,
+    output_file: Path | None,
+    plan: bool,
+):
+    """
+    Run an agent with a query or file input.
+    Arguments:
+        NAME_OR_QUERY: Agent schema name OR query string.
+        QUERY: Query string (if first arg is agent name).
+    Examples:
+        # Simple query (uses default 'rem' agent)
+        rem ask "What documents did I upload?"
+        # Explicit agent
+        rem ask contract-analyzer "Analyze this contract"
+        # Process file
+        rem ask contract-analyzer -i contract.pdf -o output.yaml
+    """
+    # Smart argument handling
+    name = "rem"  # Default agent
+    if query is None and not input_file:
+        # Single argument provided
+        # Heuristic: If it looks like a schema file or known agent, treat as name
+        # Otherwise treat as query
+        if name_or_query.endswith((".yaml", ".yml", ".json")) or name_or_query in ["rem", "query-agent", "rem-query-agent"]:
+             # It's an agent name, query is missing (unless input_file)
+             name = name_or_query
+             # Query remains None, _ask_async will check input_file
+        else:
+             # It's a query, use default agent
+             query = name_or_query
+    elif query is not None:
+        # Two arguments provided
+        name = name_or_query
+    asyncio.run(
+        _ask_async(
+            name=name,
+            query=query,
+            model=model,
+            temperature=temperature,
+            max_turns=max_turns,
+            version=version,
+            stream=stream,
+            user_id=user_id,
+            session_id=session_id,
+            input_file=input_file,
+            output_file=output_file,
+            plan=plan,
+        )
+    )
+async def _ask_async(
+    name: str,
+    query: str | None,
+    model: str | None,
+    temperature: float | None,
+    max_turns: int,
+    version: str | None,
+    stream: bool,
+    user_id: str,
+    session_id: str | None,
+    input_file: Path | None,
+    output_file: Path | None,
+    plan: bool,
+):
+    """Async implementation of ask command."""
+    import uuid
+    from ...agentic.context_builder import ContextBuilder
+    # Validate input arguments
+    if not query and not input_file:
+        logger.error("Either QUERY argument or --input-file must be provided")
+        sys.exit(1)
+    if query and input_file:
+        logger.error("Cannot use both QUERY argument and --input-file")
+        sys.exit(1)
+    # Load input from file if specified
+    if input_file:
+        logger.info(f"Loading input from file: {input_file}")
+        query = await _load_input_file(input_file, user_id=user_id)
+    # Load schema using centralized utility
+    # Handles both file paths and schema names automatically
+    logger.info(f"Loading schema: {name} (version: {version or 'latest'})")
+    try:
+        schema = load_agent_schema(name)
+    except FileNotFoundError as e:
+        logger.error(str(e))
+        sys.exit(1)
+    # Generate session ID if not provided
+    if not session_id:
+        session_id = str(uuid.uuid4())
+        logger.info(f"Generated session ID: {session_id}")
+    # Build context with session history using ContextBuilder
+    # This provides:
+    # - System context message with date and user profile hints
+    # - Compressed session history (if session exists)
+    # - Proper message structure for agent
+    logger.info(f"Building context for user {user_id}, session {session_id}")
+    # Prepare new message for ContextBuilder
+    new_messages = [{"role": "user", "content": query}]
+    # Build context with session history
+    context, messages = await ContextBuilder.build_from_headers(
+        headers={
+            "X-User-Id": user_id,
+            "X-Session-Id": session_id,
+        },
+        new_messages=new_messages,
+    )
+    # Override model if specified via CLI flag
+    if model:
+        context.default_model = model
+    logger.info(
+        f"Creating agent: model={context.default_model}, stream={stream}, max_turns={max_turns}, messages={len(messages)}"
+    )
+    # Create agent
+    agent = await create_agent(
+        context=context,
+        agent_schema_override=schema,
+        model_override=model,
+    )
+    # Temperature is now handled in agent factory (schema override or settings default)
+    if temperature is not None:
+        logger.warning(
+            f"CLI temperature override ({temperature}) not yet supported. "
+            "Use agent schema 'override_temperature' field or LLM__DEFAULT_TEMPERATURE setting."
+        )
+    # Combine messages into single prompt
+    # ContextBuilder already assembled: system context + history + new message
+    prompt = "\n\n".join(msg.content for msg in messages)
+    # Run agent with session persistence
+    if stream:
+        await run_agent_streaming(agent, prompt, max_turns=max_turns, context=context)
+    else:
+        await run_agent_non_streaming(
+            agent,
+            prompt,
+            max_turns=max_turns,
+            output_file=output_file,
+            context=context,
+            plan=plan,
+        )
+    # Log session ID for reuse
+    logger.success(f"Session ID: {session_id} (use --session-id to continue this conversation)")
+def register_command(parent_group):
+    """
+    Register ask command with parent CLI group.
+    Args:
+        parent_group: Object exposing ``add_command``; the ``ask`` command is
+            added to it (presumably a click group - confirm against the caller)
+    """
+    parent_group.add_command(ask)