PyPI - remdb - Versions diffs - 0.3.7__py3-none-any.whl - Mend

remdb 0.3.7__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (187) hide show

rem/__init__.py +2 -0
rem/agentic/README.md +650 -0
rem/agentic/__init__.py +39 -0
rem/agentic/agents/README.md +155 -0
rem/agentic/agents/__init__.py +8 -0
rem/agentic/context.py +148 -0
rem/agentic/context_builder.py +329 -0
rem/agentic/mcp/__init__.py +0 -0
rem/agentic/mcp/tool_wrapper.py +107 -0
rem/agentic/otel/__init__.py +5 -0
rem/agentic/otel/setup.py +151 -0
rem/agentic/providers/phoenix.py +674 -0
rem/agentic/providers/pydantic_ai.py +572 -0
rem/agentic/query.py +117 -0
rem/agentic/query_helper.py +89 -0
rem/agentic/schema.py +396 -0
rem/agentic/serialization.py +245 -0
rem/agentic/tools/__init__.py +5 -0
rem/agentic/tools/rem_tools.py +231 -0
rem/api/README.md +420 -0
rem/api/main.py +324 -0
rem/api/mcp_router/prompts.py +182 -0
rem/api/mcp_router/resources.py +536 -0
rem/api/mcp_router/server.py +213 -0
rem/api/mcp_router/tools.py +584 -0
rem/api/routers/auth.py +229 -0
rem/api/routers/chat/__init__.py +5 -0
rem/api/routers/chat/completions.py +281 -0
rem/api/routers/chat/json_utils.py +76 -0
rem/api/routers/chat/models.py +124 -0
rem/api/routers/chat/streaming.py +185 -0
rem/auth/README.md +258 -0
rem/auth/__init__.py +26 -0
rem/auth/middleware.py +100 -0
rem/auth/providers/__init__.py +13 -0
rem/auth/providers/base.py +376 -0
rem/auth/providers/google.py +163 -0
rem/auth/providers/microsoft.py +237 -0
rem/cli/README.md +455 -0
rem/cli/__init__.py +8 -0
rem/cli/commands/README.md +126 -0
rem/cli/commands/__init__.py +3 -0
rem/cli/commands/ask.py +566 -0
rem/cli/commands/configure.py +497 -0
rem/cli/commands/db.py +493 -0
rem/cli/commands/dreaming.py +324 -0
rem/cli/commands/experiments.py +1302 -0
rem/cli/commands/mcp.py +66 -0
rem/cli/commands/process.py +245 -0
rem/cli/commands/schema.py +183 -0
rem/cli/commands/serve.py +106 -0
rem/cli/dreaming.py +363 -0
rem/cli/main.py +96 -0
rem/config.py +237 -0
rem/mcp_server.py +41 -0
rem/models/core/__init__.py +49 -0
rem/models/core/core_model.py +64 -0
rem/models/core/engram.py +333 -0
rem/models/core/experiment.py +628 -0
rem/models/core/inline_edge.py +132 -0
rem/models/core/rem_query.py +243 -0
rem/models/entities/__init__.py +43 -0
rem/models/entities/file.py +57 -0
rem/models/entities/image_resource.py +88 -0
rem/models/entities/message.py +35 -0
rem/models/entities/moment.py +123 -0
rem/models/entities/ontology.py +191 -0
rem/models/entities/ontology_config.py +131 -0
rem/models/entities/resource.py +95 -0
rem/models/entities/schema.py +87 -0
rem/models/entities/user.py +85 -0
rem/py.typed +0 -0
rem/schemas/README.md +507 -0
rem/schemas/__init__.py +6 -0
rem/schemas/agents/README.md +92 -0
rem/schemas/agents/core/moment-builder.yaml +178 -0
rem/schemas/agents/core/rem-query-agent.yaml +226 -0
rem/schemas/agents/core/resource-affinity-assessor.yaml +99 -0
rem/schemas/agents/core/simple-assistant.yaml +19 -0
rem/schemas/agents/core/user-profile-builder.yaml +163 -0
rem/schemas/agents/examples/contract-analyzer.yaml +317 -0
rem/schemas/agents/examples/contract-extractor.yaml +134 -0
rem/schemas/agents/examples/cv-parser.yaml +263 -0
rem/schemas/agents/examples/hello-world.yaml +37 -0
rem/schemas/agents/examples/query.yaml +54 -0
rem/schemas/agents/examples/simple.yaml +21 -0
rem/schemas/agents/examples/test.yaml +29 -0
rem/schemas/agents/rem.yaml +128 -0
rem/schemas/evaluators/hello-world/default.yaml +77 -0
rem/schemas/evaluators/rem/faithfulness.yaml +219 -0
rem/schemas/evaluators/rem/lookup-correctness.yaml +182 -0
rem/schemas/evaluators/rem/retrieval-precision.yaml +199 -0
rem/schemas/evaluators/rem/retrieval-recall.yaml +211 -0
rem/schemas/evaluators/rem/search-correctness.yaml +192 -0
rem/services/__init__.py +16 -0
rem/services/audio/INTEGRATION.md +308 -0
rem/services/audio/README.md +376 -0
rem/services/audio/__init__.py +15 -0
rem/services/audio/chunker.py +354 -0
rem/services/audio/transcriber.py +259 -0
rem/services/content/README.md +1269 -0
rem/services/content/__init__.py +5 -0
rem/services/content/providers.py +801 -0
rem/services/content/service.py +676 -0
rem/services/dreaming/README.md +230 -0
rem/services/dreaming/__init__.py +53 -0
rem/services/dreaming/affinity_service.py +336 -0
rem/services/dreaming/moment_service.py +264 -0
rem/services/dreaming/ontology_service.py +54 -0
rem/services/dreaming/user_model_service.py +297 -0
rem/services/dreaming/utils.py +39 -0
rem/services/embeddings/__init__.py +11 -0
rem/services/embeddings/api.py +120 -0
rem/services/embeddings/worker.py +421 -0
rem/services/fs/README.md +662 -0
rem/services/fs/__init__.py +62 -0
rem/services/fs/examples.py +206 -0
rem/services/fs/examples_paths.py +204 -0
rem/services/fs/git_provider.py +935 -0
rem/services/fs/local_provider.py +760 -0
rem/services/fs/parsing-hooks-examples.md +172 -0
rem/services/fs/paths.py +276 -0
rem/services/fs/provider.py +460 -0
rem/services/fs/s3_provider.py +1042 -0
rem/services/fs/service.py +186 -0
rem/services/git/README.md +1075 -0
rem/services/git/__init__.py +17 -0
rem/services/git/service.py +469 -0
rem/services/phoenix/EXPERIMENT_DESIGN.md +1146 -0
rem/services/phoenix/README.md +453 -0
rem/services/phoenix/__init__.py +46 -0
rem/services/phoenix/client.py +686 -0
rem/services/phoenix/config.py +88 -0
rem/services/phoenix/prompt_labels.py +477 -0
rem/services/postgres/README.md +575 -0
rem/services/postgres/__init__.py +23 -0
rem/services/postgres/migration_service.py +427 -0
rem/services/postgres/pydantic_to_sqlalchemy.py +232 -0
rem/services/postgres/register_type.py +352 -0
rem/services/postgres/repository.py +337 -0
rem/services/postgres/schema_generator.py +379 -0
rem/services/postgres/service.py +802 -0
rem/services/postgres/sql_builder.py +354 -0
rem/services/rem/README.md +304 -0
rem/services/rem/__init__.py +23 -0
rem/services/rem/exceptions.py +71 -0
rem/services/rem/executor.py +293 -0
rem/services/rem/parser.py +145 -0
rem/services/rem/queries.py +196 -0
rem/services/rem/query.py +371 -0
rem/services/rem/service.py +527 -0
rem/services/session/README.md +374 -0
rem/services/session/__init__.py +6 -0
rem/services/session/compression.py +360 -0
rem/services/session/reload.py +77 -0
rem/settings.py +1235 -0
rem/sql/002_install_models.sql +1068 -0
rem/sql/background_indexes.sql +42 -0
rem/sql/install_models.sql +1038 -0
rem/sql/migrations/001_install.sql +503 -0
rem/sql/migrations/002_install_models.sql +1202 -0
rem/utils/AGENTIC_CHUNKING.md +597 -0
rem/utils/README.md +583 -0
rem/utils/__init__.py +43 -0
rem/utils/agentic_chunking.py +622 -0
rem/utils/batch_ops.py +343 -0
rem/utils/chunking.py +108 -0
rem/utils/clip_embeddings.py +276 -0
rem/utils/dict_utils.py +98 -0
rem/utils/embeddings.py +423 -0
rem/utils/examples/embeddings_example.py +305 -0
rem/utils/examples/sql_types_example.py +202 -0
rem/utils/markdown.py +16 -0
rem/utils/model_helpers.py +236 -0
rem/utils/schema_loader.py +336 -0
rem/utils/sql_types.py +348 -0
rem/utils/user_id.py +81 -0
rem/utils/vision.py +330 -0
rem/workers/README.md +506 -0
rem/workers/__init__.py +5 -0
rem/workers/dreaming.py +502 -0
rem/workers/engram_processor.py +312 -0
rem/workers/sqs_file_processor.py +193 -0
remdb-0.3.7.dist-info/METADATA +1473 -0
remdb-0.3.7.dist-info/RECORD +187 -0
remdb-0.3.7.dist-info/WHEEL +4 -0
remdb-0.3.7.dist-info/entry_points.txt +2 -0

rem/agentic/providers/pydantic_ai.py ADDED Viewed

@@ -0,0 +1,572 @@
+"""
+Pydantic AI agent factory with dynamic JsonSchema to Pydantic model conversion.
+AgentRuntime Pattern:
+    The create_agent() factory returns an AgentRuntime object containing:
+    - agent: The Pydantic AI Agent instance
+    - temperature: Resolved temperature (schema override or settings default)
+    - max_iterations: Resolved max iterations (schema override or settings default)
+    This ensures runtime configuration is determined once at agent creation,
+    not re-computed at every call site.
+Known Issues:
+    1. Cerebras Qwen Strict Mode Incompatibility
+       - Cerebras qwen-3-32b requires additionalProperties=false for all object fields
+       - Cannot use dict[str, Any] for flexible parameters (breaks Qwen compatibility)
+       - Cannot use minimum/maximum constraints on number fields (Qwen rejects these)
+       - Workaround: Use cerebras:llama-3.3-70b instead (fully compatible)
+       - Future fix: Redesign REM agent to use discriminated union instead of dict
+Key Design Pattern:
+    1. JsonSchema → Pydantic Model (json-schema-to-pydantic library)
+    2. Agent schema contains both system prompt AND output schema
+    3. MCP tools loaded dynamically from schema metadata
+    4. Result type can be stripped of description to avoid duplication with system prompt
+    5. OTEL instrumentation conditional based on settings
+Unique Design:
+    - Agent schemas are JSON Schema with embedded metadata:
+      - description: System prompt for agent
+      - properties: Output schema fields
+      - json_schema_extra.tools: MCP tool configurations
+      - json_schema_extra.resources: MCP resource configurations
+    - Dynamic model creation from schema using json-schema-to-pydantic
+    - Tools and resources loaded from MCP servers via schema config
+    - Stripped descriptions to avoid LLM schema bloat
+TODO:
+    Model Cache Implementation (Critical for Production Scale)
+    Current bottleneck: Every agent.run() call creates a new Agent instance with
+    model initialization overhead. At scale (100+ requests/sec), this becomes expensive.
+    Need two-tier caching strategy:
+    1. Schema Cache (see rem/utils/schema_loader.py TODO):
+       - Filesystem schemas: LRU cache, no TTL (immutable)
+       - Database schemas: TTL cache (5-15 min)
+       - Reduces disk I/O and DB queries
+    2. Model Instance Cache (THIS TODO):
+       - Cache Pydantic AI Model() instances (connection pools, tokenizers)
+       - Key: (provider, model_name) → Model instance
+       - Benefits:
+         * Reuse HTTP connection pools (httpx.AsyncClient)
+         * Reuse tokenizer instances
+         * Faster model initialization
+         * Lower memory footprint
+       - Implementation:
+         ```python
+         _model_cache: dict[tuple[str, str], Model] = {}
+         def get_or_create_model(model_name: str) -> Model:
+             cache_key = _parse_model_name(model_name)  # ("anthropic", "claude-3-5-sonnet")
+             if cache_key not in _model_cache:
+                 _model_cache[cache_key] = Model(model_name)
+             return _model_cache[cache_key]
+         ```
+       - Considerations:
+         * Max cache size (LRU eviction, e.g., 20 models)
+         * Thread safety (asyncio.Lock for cache access)
+         * Model warmup on server startup for hot paths
+         * Clear cache on model config changes
+    3. Agent Instance Caching (Advanced):
+       - Cache complete Agent instances (model + schema + tools)
+       - Key: (schema_name, model_name) → Agent instance
+       - Benefits:
+         * Skip schema parsing and model creation entirely
+         * Fastest possible agent.run() latency
+       - Challenges:
+         * Agent state management (stateless required)
+         * Tool/resource updates (cache invalidation)
+         * Memory usage (agents are heavier than models)
+       - Recommendation: Start with Model cache, add Agent cache if profiling shows benefit
+    Profiling Targets (measure before optimizing):
+    - schema_loader.load_agent_schema() calls per request
+    - create_agent() execution time (model init overhead)
+    - Model() instance creation time by provider
+    - Agent.run() total latency breakdown
+    Related Files:
+    - rem/utils/schema_loader.py (schema caching TODO)
+    - rem/agentic/providers/pydantic_ai.py:339 (create_agent - this file)
+    - rem/services/schema_repository.py (database schema loading)
+    Priority: HIGH (blocks production scaling beyond 50 req/sec)
+Example Agent Schema:
+{
+  "type": "object",
+  "description": "Agent that answers REM queries...",
+  "properties": {
+    "answer": {"type": "string", "description": "Query answer"},
+    "confidence": {"type": "number"}
+  },
+  "required": ["answer", "confidence"],
+  "json_schema_extra": {
+    "kind": "agent",
+    "name": "query-agent",
+    "tools": [
+      {"name": "search_knowledge_base", "mcp_server": "rem"}
+    ],
+    "resources": [
+      {"uri_pattern": "cda://.*", "mcp_server": "rem"}
+    ]
+  }
+}
+"""
+from typing import Any
+from loguru import logger
+from pydantic import BaseModel
+from pydantic_ai import Agent
+from pydantic_ai.models import KnownModelName, Model
+try:
+    from json_schema_to_pydantic import PydanticModelBuilder
+    JSON_SCHEMA_TO_PYDANTIC_AVAILABLE = True
+except ImportError:
+    JSON_SCHEMA_TO_PYDANTIC_AVAILABLE = False
+    logger.warning(
+        "json-schema-to-pydantic not installed. "
+        "Install with: pip install 'rem[schema]' or pip install json-schema-to-pydantic"
+    )
+from ..context import AgentContext
+from ...settings import settings
+class AgentRuntime:
+    """
+    Agent runtime configuration bundle with delegation pattern.
+    Contains the agent instance and its resolved runtime parameters
+    (temperature, max_iterations) determined from schema overrides + settings defaults.
+    Delegates run() and iter() calls to the inner agent with automatic UsageLimits.
+    This allows callers to use AgentRuntime as a drop-in replacement for Agent.
+    """
+    def __init__(self, agent: Agent[None, Any], temperature: float, max_iterations: int):
+        self.agent = agent
+        self.temperature = temperature
+        self.max_iterations = max_iterations
+    async def run(self, *args, **kwargs):
+        """Delegate to agent.run() with automatic UsageLimits."""
+        from pydantic_ai import UsageLimits
+        # Only apply usage_limits if not already provided
+        if "usage_limits" not in kwargs:
+            kwargs["usage_limits"] = UsageLimits(request_limit=self.max_iterations)
+        return await self.agent.run(*args, **kwargs)
+    def iter(self, *args, **kwargs):
+        """Delegate to agent.iter() with automatic UsageLimits."""
+        from pydantic_ai import UsageLimits
+        # Only apply usage_limits if not already provided
+        if "usage_limits" not in kwargs:
+            kwargs["usage_limits"] = UsageLimits(request_limit=self.max_iterations)
+        return self.agent.iter(*args, **kwargs)
+def _create_model_from_schema(agent_schema: dict[str, Any]) -> type[BaseModel]:
+    """
+    Create Pydantic model dynamically from JSON Schema.
+    Uses json-schema-to-pydantic library for robust conversion of:
+    - Nested objects
+    - Arrays
+    - Required fields
+    - Validation constraints
+    Args:
+        agent_schema: JSON Schema dict with agent output structure
+    Returns:
+        Dynamically created Pydantic BaseModel class
+    Example:
+        schema = {
+            "type": "object",
+            "properties": {
+                "answer": {"type": "string"},
+                "confidence": {"type": "number", "minimum": 0, "maximum": 1}
+            },
+            "required": ["answer", "confidence"]
+        }
+        Model = _create_model_from_schema(schema)
+        # Model is now a Pydantic class with answer: str and confidence: float fields
+    """
+    if not JSON_SCHEMA_TO_PYDANTIC_AVAILABLE:
+        raise ImportError(
+            "json-schema-to-pydantic is required for dynamic schema conversion. "
+            "Install with: pip install 'rem[schema]' or pip install json-schema-to-pydantic"
+        )
+    # Create Pydantic model from JSON Schema
+    builder = PydanticModelBuilder()
+    model = builder.create_pydantic_model(agent_schema, root_schema=agent_schema)
+    # Override model name with schema name if available
+    json_extra = agent_schema.get("json_schema_extra", {})
+    schema_name = json_extra.get("name")
+    if schema_name:
+        # Convert kebab-case to PascalCase for class name
+        class_name = "".join(word.capitalize() for word in schema_name.split("-"))
+        model.__name__ = class_name
+        model.__qualname__ = class_name
+    logger.debug(
+        f"Created Pydantic model '{model.__name__}' from JSON Schema with fields: "
+        f"{list(model.model_fields.keys())}"
+    )
+    return model
+def _prepare_schema_for_qwen(schema: dict[str, Any]) -> dict[str, Any]:
+    """
+    Prepare JSON schema for Cerebras Qwen strict mode compatibility.
+    Cerebras Qwen strict mode requirements:
+    1. additionalProperties MUST be false (this is mandatory in strict mode)
+    2. All object types must have explicit properties field
+    3. Cannot use minimum/maximum constraints (Pydantic ge/le works fine)
+    This function transforms schemas to meet these requirements:
+    - Changes additionalProperties from true to false
+    - Adds empty properties {} to objects that don't have it
+    - Preserves all other schema features
+    IMPORTANT: This breaks dict[str, Any] flexibility!
+    - dict[str, Any] generates {"type": "object", "additionalProperties": true}
+    - Qwen requires additionalProperties: false
+    - Result: Empty dict {} becomes the only valid value
+    Recommendation: Don't use dict[str, Any] with Qwen. Use explicit Pydantic models instead.
+    Args:
+        schema: JSON schema dict (typically from model.model_json_schema())
+    Returns:
+        Modified schema compatible with Cerebras Qwen strict mode
+    Example:
+        # Pydantic generates for dict[str, Any]:
+        {"type": "object", "additionalProperties": true}
+        # Qwen requires:
+        {"type": "object", "properties": {}, "additionalProperties": false}
+        # This means dict can only be {}
+    """
+    def fix_object_properties(obj: dict[str, Any]) -> None:
+        """Recursively fix object schemas for Qwen strict mode."""
+        if isinstance(obj, dict):
+            # Fix current object if it's type=object
+            if obj.get("type") == "object":
+                # Add empty properties if missing
+                if "properties" not in obj and "anyOf" not in obj and "oneOf" not in obj:
+                    obj["properties"] = {}
+                # Force additionalProperties to false (required by Qwen strict mode)
+                if "additionalProperties" in obj:
+                    obj["additionalProperties"] = False
+            # Remove minimum/maximum from number fields (Qwen rejects these)
+            if obj.get("type") == "number":
+                if "minimum" in obj or "maximum" in obj:
+                    logger.warning(f"Stripping min/max from number field in Qwen schema: {obj.keys()}")
+                obj.pop("minimum", None)
+                obj.pop("maximum", None)
+            # Recursively fix nested schemas
+            for key, value in obj.items():
+                if isinstance(value, dict):
+                    fix_object_properties(value)
+                elif isinstance(value, list):
+                    for item in value:
+                        if isinstance(item, dict):
+                            fix_object_properties(item)
+    # Work on a copy to avoid mutating original
+    import copy
+    schema_copy = copy.deepcopy(schema)
+    fix_object_properties(schema_copy)
+    return schema_copy
+def _create_schema_wrapper(
+    result_type: type[BaseModel], strip_description: bool = True
+) -> type[BaseModel]:
+    """
+    Create wrapper model that customizes schema generation.
+    Prevents redundant descriptions in LLM schema while keeping
+    docstrings in Python code for documentation.
+    Design Pattern
+    - Agent schema.description contains full system prompt
+    - Output model description would duplicate this
+    - Stripping description reduces token usage without losing information
+    Args:
+        result_type: Original Pydantic model with docstring
+        strip_description: If True, removes model-level description from schema
+    Returns:
+        Wrapper model that generates schema without description field
+    Example:
+        class AgentOutput(BaseModel):
+            \"\"\"Agent output with answer and confidence.\"\"\"
+            answer: str
+            confidence: float
+        Wrapped = _create_schema_wrapper(AgentOutput, strip_description=True)
+        # Wrapped.model_json_schema() excludes top-level description
+    """
+    if not strip_description:
+        return result_type
+    # Create model that overrides schema generation
+    class SchemaWrapper(result_type):  # type: ignore
+        @classmethod
+        def model_json_schema(cls, **kwargs):
+            schema = super().model_json_schema(**kwargs)
+            # Remove model-level description to avoid duplication with system prompt
+            schema.pop("description", None)
+            # Prepare schema for Qwen compatibility
+            schema = _prepare_schema_for_qwen(schema)
+            return schema
+    # Preserve original model name for debugging
+    SchemaWrapper.__name__ = result_type.__name__
+    return SchemaWrapper
+async def create_agent_from_schema_file(
+    schema_name_or_path: str,
+    context: AgentContext | None = None,
+    model_override: KnownModelName | Model | None = None,
+) -> Agent:
+    """
+    Create agent from schema file (YAML/JSON).
+    Handles path resolution automatically:
+    - "contract-analyzer" → searches schemas/agents/examples/contract-analyzer.yaml
+    - "moment-builder" → searches schemas/agents/core/moment-builder.yaml
+    - "rem" → searches schemas/agents/rem.yaml
+    - "/absolute/path.yaml" → loads directly
+    - "relative/path.yaml" → loads relative to cwd
+    Args:
+        schema_name_or_path: Schema name or file path
+        context: Optional agent context
+        model_override: Optional model override
+    Returns:
+        Configured Agent instance
+    Example:
+        # Load by name (searches package schemas)
+        agent = await create_agent_from_schema_file("contract-analyzer")
+        # Load from custom path
+        agent = await create_agent_from_schema_file("./my-agent.yaml")
+    """
+    from ...utils.schema_loader import load_agent_schema
+    # Load schema using centralized utility
+    agent_schema = load_agent_schema(schema_name_or_path)
+    # Create agent using existing factory
+    return await create_agent(
+        context=context,
+        agent_schema_override=agent_schema,
+        model_override=model_override,
+    )
+async def create_agent(
+    context: AgentContext | None = None,
+    agent_schema_override: dict[str, Any] | None = None,
+    model_override: KnownModelName | Model | None = None,
+    result_type: type[BaseModel] | None = None,
+    strip_model_description: bool = True,
+) -> AgentRuntime:
+    """
+    Create agent from context with dynamic schema loading.
+    Provider-agnostic interface - currently implemented with Pydantic AI.
+    Design Pattern:
+    1. Load agent schema from context.agent_schema_uri or use override
+    2. Extract system prompt from schema.description
+    3. Create dynamic Pydantic model from schema.properties
+    4. Load MCP tools from schema.json_schema_extra.tools
+    5. Create agent with model, prompt, output_type, and tools
+    6. Enable OTEL instrumentation conditionally
+    All configuration comes from context unless explicitly overridden.
+    MCP server URLs resolved from environment variables (MCP_SERVER_{NAME}).
+    Args:
+        context: AgentContext with schema URI, model, session info
+        agent_schema_override: Optional explicit schema (bypasses context.agent_schema_uri)
+        model_override: Optional explicit model (bypasses context.default_model)
+        result_type: Optional Pydantic model for structured output
+        strip_model_description: If True, removes model docstring from LLM schema
+    Returns:
+        Configured Pydantic.AI Agent with MCP tools
+    Example:
+        # From context with schema URI
+        context = AgentContext(
+            user_id="user123",
+            tenant_id="acme-corp",
+            agent_schema_uri="rem-agents-query-agent"
+        )
+        agent = await create_agent(context)
+        # With explicit schema and result type
+        schema = {...}  # JSON Schema
+        class Output(BaseModel):
+            answer: str
+            confidence: float
+        agent = await create_agent(
+            agent_schema_override=schema,
+            result_type=Output
+        )
+    """
+    # Initialize OTEL instrumentation if enabled (idempotent)
+    if settings.otel.enabled:
+        from ..otel import setup_instrumentation
+        setup_instrumentation()
+    # Load agent schema from context or use override
+    agent_schema = agent_schema_override
+    if agent_schema is None and context and context.agent_schema_uri:
+        # TODO: Load schema from schema registry or file
+        # from ..schema import load_agent_schema
+        # agent_schema = load_agent_schema(context.agent_schema_uri)
+        pass
+    # Determine model: override > context.default_model > settings
+    model = (
+        model_override or (context.default_model if context else settings.llm.default_model)
+    )
+    # Extract schema fields
+    system_prompt = agent_schema.get("description", "") if agent_schema else ""
+    metadata = agent_schema.get("json_schema_extra", {}) if agent_schema else {}
+    mcp_server_configs = metadata.get("mcp_servers", [])
+    resource_configs = metadata.get("resources", [])
+    # Extract temperature and max_iterations from schema metadata (with fallback to settings defaults)
+    temperature = metadata.get("override_temperature", settings.llm.default_temperature)
+    max_iterations = metadata.get("override_max_iterations", settings.llm.default_max_iterations)
+    logger.info(
+        f"Creating agent: model={model}, mcp_servers={len(mcp_server_configs)}, resources={len(resource_configs)}"
+    )
+    # Set agent resource attributes for OTEL (before creating agent)
+    if settings.otel.enabled and agent_schema:
+        from ..otel import set_agent_resource_attributes
+        set_agent_resource_attributes(agent_schema=agent_schema)
+    # Build list of tools from MCP server (in-process, no subprocess)
+    tools = []
+    if mcp_server_configs:
+        for server_config in mcp_server_configs:
+            server_type = server_config.get("type")
+            server_id = server_config.get("id", "mcp-server")
+            if server_type == "local":
+                # Import MCP server directly (in-process)
+                module_path = server_config.get("module", "rem.mcp_server")
+                try:
+                    # Dynamic import of MCP server module
+                    import importlib
+                    mcp_module = importlib.import_module(module_path)
+                    mcp_server = mcp_module.mcp
+                    # Extract tools from MCP server (get_tools is async)
+                    from ..mcp.tool_wrapper import create_mcp_tool_wrapper
+                    # Await async get_tools() call
+                    mcp_tools_dict = await mcp_server.get_tools()
+                    for tool_name, tool_func in mcp_tools_dict.items():
+                        wrapped_tool = create_mcp_tool_wrapper(tool_name, tool_func, user_id=context.user_id if context else None)
+                        tools.append(wrapped_tool)
+                        logger.debug(f"Loaded MCP tool: {tool_name}")
+                    logger.info(f"Loaded {len(mcp_tools_dict)} tools from MCP server: {server_id} (in-process)")
+                except Exception as e:
+                    logger.error(f"Failed to load MCP server {server_id}: {e}", exc_info=True)
+            else:
+                logger.warning(f"Unsupported MCP server type: {server_type}")
+    if resource_configs:
+        # TODO: Convert resources to tools (MCP convenience syntax)
+        pass
+    # Create dynamic result_type from schema if not provided
+    if result_type is None and agent_schema and "properties" in agent_schema:
+        # Pre-process schema for Qwen compatibility (strips min/max, sets additionalProperties=False)
+        # This ensures the generated Pydantic model doesn't have incompatible constraints
+        sanitized_schema = _prepare_schema_for_qwen(agent_schema)
+        result_type = _create_model_from_schema(sanitized_schema)
+        logger.debug(f"Created dynamic Pydantic model: {result_type.__name__}")
+        logger.debug(f"Created dynamic Pydantic model: {result_type.__name__}")
+    # Create agent with optional output_type for structured output and tools
+    if result_type:
+        # Wrap result_type to strip description if needed
+        wrapped_result_type = _create_schema_wrapper(
+            result_type, strip_description=strip_model_description
+        )
+        agent = Agent(
+            model=model,
+            system_prompt=system_prompt,
+            output_type=wrapped_result_type,
+            tools=tools,
+            instrument=settings.otel.enabled,  # Conditional OTEL instrumentation
+            model_settings={"temperature": temperature},
+            retries=settings.llm.max_retries,
+        )
+    else:
+        agent = Agent(
+            model=model,
+            system_prompt=system_prompt,
+            tools=tools,
+            instrument=settings.otel.enabled,
+            model_settings={"temperature": temperature},
+            retries=settings.llm.max_retries,
+        )
+    # TODO: Set agent context attributes for OTEL spans
+    # if context:
+    #     from ..otel import set_agent_context_attributes
+    #     set_agent_context_attributes(context)
+    return AgentRuntime(
+        agent=agent,
+        temperature=temperature,
+        max_iterations=max_iterations,
+    )

rem/agentic/query.py ADDED Viewed

@@ -0,0 +1,117 @@
+"""
+Agent query model for structured agent input.
+Design pattern for standardized agent query structure with:
+- Primary query (user question/task)
+- Knowledge context (retrieved context, documentation)
+- Scratchpad (working memory, session state)
+Key Design Pattern
+- Separates query from retrieval (query is what user asks, knowledge is what we retrieve)
+- Scratchpad enables multi-turn reasoning and state tracking
+- Supports markdown + fenced JSON for structured data
+- Converts to single prompt string for agent consumption
+"""
+from typing import Any
+from pydantic import BaseModel, Field
+class AgentQuery(BaseModel):
+    """
+    Standard query structure for agent execution.
+    Provides consistent structure for queries, knowledge context, and
+    working memory across all agent types.
+    Design Pattern
+    - query: User's question/task (markdown + fenced JSON)
+    - knowledge: Retrieved context from REM queries (markdown + fenced JSON)
+    - scratchpad: Working memory for multi-turn reasoning (JSON or markdown)
+    Example:
+        query = AgentQuery(
+            query="Find all documents Sarah authored",
+            knowledge=\"\"\"
+            # Entity Information
+            Sarah Chen (person/employee)
+            - Role: Senior Engineer
+            - Projects: [Project Alpha, TiDB Migration]
+            \"\"\",
+            scratchpad={"current_case": "TAP-1234", "stage": "entity_lookup"}
+        )
+        prompt = query.to_prompt()
+        result = await agent.run(prompt)
+    """
+    query: str = Field(
+        ...,
+        description="Primary user query or task (markdown format, may include fenced JSON)",
+        examples=[
+            "Find all documents Sarah authored",
+            "What happened in Q4 retrospective?",
+            "TRAVERSE manages WITH LOOKUP sarah-chen DEPTH 2",
+        ],
+    )
+    knowledge: str = Field(
+        default="",
+        description="Background knowledge and context (markdown, may include fenced JSON/code)",
+        examples=[
+            "# Entity: sarah-chen\nType: person/employee\nRole: Senior Engineer",
+            "Retrieved resources:\n```json\n[{...}]\n```",
+        ],
+    )
+    scratchpad: str | dict[str, Any] = Field(
+        default="",
+        description="Working memory for session state (JSON object or markdown with fenced JSON)",
+        examples=[
+            {"stage": "lookup", "visited_entities": ["sarah-chen"]},
+            "# Session State\n\nStage: TRAVERSE depth 1\n\n```json\n{\"nodes\": [...]}\n```",
+        ],
+    )
+    def to_prompt(self) -> str:
+        """
+        Convert query components to single prompt string.
+        Combines query, knowledge, and scratchpad into formatted prompt
+        for agent consumption.
+        Returns:
+            Formatted prompt string with sections
+        Example:
+            # Query
+            Find all documents Sarah authored
+            # Knowledge
+            Entity: sarah-chen
+            Type: person/employee
+            # Scratchpad
+            ```json
+            {"stage": "lookup"}
+            ```
+        """
+        parts = [f"# Query\n\n{self.query}"]
+        if self.knowledge:
+            parts.append(f"\n# Knowledge\n\n{self.knowledge}")
+        if self.scratchpad:
+            if isinstance(self.scratchpad, dict):
+                import json
+                scratchpad_str = json.dumps(self.scratchpad, indent=2)
+                parts.append(f"\n# Scratchpad\n\n```json\n{scratchpad_str}\n```")
+            else:
+                parts.append(f"\n# Scratchpad\n\n{self.scratchpad}")
+        return "\n".join(parts)