PyPI - remdb - Versions diffs - 0.3.118__py3-none-any.whl → 0.3.146__py3-none-any.whl - Mend

remdb 0.3.118py3-none-any.whl → 0.3.146py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of remdb might be problematic. Click here for more details.

Files changed (44) hide show

rem/agentic/agents/sse_simulator.py +2 -0
rem/agentic/context.py +23 -3
rem/agentic/mcp/tool_wrapper.py +126 -15
rem/agentic/otel/setup.py +1 -0
rem/agentic/providers/phoenix.py +371 -108
rem/agentic/providers/pydantic_ai.py +122 -43
rem/agentic/schema.py +4 -1
rem/api/mcp_router/tools.py +13 -2
rem/api/routers/chat/completions.py +250 -4
rem/api/routers/chat/models.py +81 -7
rem/api/routers/chat/otel_utils.py +33 -0
rem/api/routers/chat/sse_events.py +17 -1
rem/api/routers/chat/streaming.py +35 -1
rem/api/routers/feedback.py +134 -14
rem/auth/middleware.py +66 -1
rem/cli/commands/cluster.py +590 -82
rem/cli/commands/configure.py +3 -4
rem/cli/commands/experiments.py +468 -76
rem/cli/commands/session.py +336 -0
rem/cli/dreaming.py +2 -2
rem/cli/main.py +2 -0
rem/config.py +8 -1
rem/models/core/experiment.py +58 -14
rem/models/entities/ontology.py +1 -1
rem/models/entities/ontology_config.py +1 -1
rem/schemas/agents/examples/contract-analyzer.yaml +1 -1
rem/schemas/agents/examples/contract-extractor.yaml +1 -1
rem/schemas/agents/examples/cv-parser.yaml +1 -1
rem/services/phoenix/client.py +59 -18
rem/services/postgres/pydantic_to_sqlalchemy.py +9 -12
rem/services/session/compression.py +7 -0
rem/settings.py +260 -17
rem/sql/migrations/002_install_models.sql +91 -91
rem/sql/migrations/004_cache_system.sql +1 -1
rem/utils/README.md +45 -0
rem/utils/files.py +157 -1
rem/utils/schema_loader.py +94 -3
rem/utils/vision.py +1 -1
rem/workers/__init__.py +2 -1
rem/workers/db_listener.py +579 -0
{remdb-0.3.118.dist-info → remdb-0.3.146.dist-info}/METADATA +161 -147
{remdb-0.3.118.dist-info → remdb-0.3.146.dist-info}/RECORD +44 -41
{remdb-0.3.118.dist-info → remdb-0.3.146.dist-info}/WHEEL +0 -0
{remdb-0.3.118.dist-info → remdb-0.3.146.dist-info}/entry_points.txt +0 -0

rem/sql/migrations/002_install_models.sql CHANGED Viewed

@@ -56,11 +56,11 @@ CREATE TABLE IF NOT EXISTS feedbacks (
     tags TEXT[] DEFAULT ARRAY[]::TEXT[]
 );
-CREATE INDEX idx_feedbacks_tenant ON feedbacks (tenant_id);
-CREATE INDEX idx_feedbacks_user ON feedbacks (user_id);
-CREATE INDEX idx_feedbacks_graph_edges ON feedbacks USING GIN (graph_edges);
-CREATE INDEX idx_feedbacks_metadata ON feedbacks USING GIN (metadata);
-CREATE INDEX idx_feedbacks_tags ON feedbacks USING GIN (tags);
+CREATE INDEX IF NOT EXISTS idx_feedbacks_tenant ON feedbacks (tenant_id);
+CREATE INDEX IF NOT EXISTS idx_feedbacks_user ON feedbacks (user_id);
+CREATE INDEX IF NOT EXISTS idx_feedbacks_graph_edges ON feedbacks USING GIN (graph_edges);
+CREATE INDEX IF NOT EXISTS idx_feedbacks_metadata ON feedbacks USING GIN (metadata);
+CREATE INDEX IF NOT EXISTS idx_feedbacks_tags ON feedbacks USING GIN (tags);
 -- KV_STORE trigger for feedbacks
 -- Trigger function to maintain KV_STORE for feedbacks
@@ -135,11 +135,11 @@ CREATE TABLE IF NOT EXISTS files (
     tags TEXT[] DEFAULT ARRAY[]::TEXT[]
 );
-CREATE INDEX idx_files_tenant ON files (tenant_id);
-CREATE INDEX idx_files_user ON files (user_id);
-CREATE INDEX idx_files_graph_edges ON files USING GIN (graph_edges);
-CREATE INDEX idx_files_metadata ON files USING GIN (metadata);
-CREATE INDEX idx_files_tags ON files USING GIN (tags);
+CREATE INDEX IF NOT EXISTS idx_files_tenant ON files (tenant_id);
+CREATE INDEX IF NOT EXISTS idx_files_user ON files (user_id);
+CREATE INDEX IF NOT EXISTS idx_files_graph_edges ON files USING GIN (graph_edges);
+CREATE INDEX IF NOT EXISTS idx_files_metadata ON files USING GIN (metadata);
+CREATE INDEX IF NOT EXISTS idx_files_tags ON files USING GIN (tags);
 -- Embeddings for files
 CREATE TABLE IF NOT EXISTS embeddings_files (
@@ -157,14 +157,14 @@ CREATE TABLE IF NOT EXISTS embeddings_files (
 );
 -- Index for entity lookup (get all embeddings for entity)
-CREATE INDEX idx_embeddings_files_entity ON embeddings_files (entity_id);
+CREATE INDEX IF NOT EXISTS idx_embeddings_files_entity ON embeddings_files (entity_id);
 -- Index for field + provider lookup
-CREATE INDEX idx_embeddings_files_field_provider ON embeddings_files (field_name, provider);
+CREATE INDEX IF NOT EXISTS idx_embeddings_files_field_provider ON embeddings_files (field_name, provider);
 -- HNSW index for vector similarity search (created in background)
 -- Note: This will be created by background thread after data load
--- CREATE INDEX idx_embeddings_files_vector_hnsw ON embeddings_files
+-- CREATE INDEX IF NOT EXISTS idx_embeddings_files_vector_hnsw ON embeddings_files
 -- USING hnsw (embedding vector_cosine_ops);
 -- KV_STORE trigger for files
@@ -248,11 +248,11 @@ CREATE TABLE IF NOT EXISTS image_resources (
     tags TEXT[] DEFAULT ARRAY[]::TEXT[]
 );
-CREATE INDEX idx_image_resources_tenant ON image_resources (tenant_id);
-CREATE INDEX idx_image_resources_user ON image_resources (user_id);
-CREATE INDEX idx_image_resources_graph_edges ON image_resources USING GIN (graph_edges);
-CREATE INDEX idx_image_resources_metadata ON image_resources USING GIN (metadata);
-CREATE INDEX idx_image_resources_tags ON image_resources USING GIN (tags);
+CREATE INDEX IF NOT EXISTS idx_image_resources_tenant ON image_resources (tenant_id);
+CREATE INDEX IF NOT EXISTS idx_image_resources_user ON image_resources (user_id);
+CREATE INDEX IF NOT EXISTS idx_image_resources_graph_edges ON image_resources USING GIN (graph_edges);
+CREATE INDEX IF NOT EXISTS idx_image_resources_metadata ON image_resources USING GIN (metadata);
+CREATE INDEX IF NOT EXISTS idx_image_resources_tags ON image_resources USING GIN (tags);
 -- Embeddings for image_resources
 CREATE TABLE IF NOT EXISTS embeddings_image_resources (
@@ -270,14 +270,14 @@ CREATE TABLE IF NOT EXISTS embeddings_image_resources (
 );
 -- Index for entity lookup (get all embeddings for entity)
-CREATE INDEX idx_embeddings_image_resources_entity ON embeddings_image_resources (entity_id);
+CREATE INDEX IF NOT EXISTS idx_embeddings_image_resources_entity ON embeddings_image_resources (entity_id);
 -- Index for field + provider lookup
-CREATE INDEX idx_embeddings_image_resources_field_provider ON embeddings_image_resources (field_name, provider);
+CREATE INDEX IF NOT EXISTS idx_embeddings_image_resources_field_provider ON embeddings_image_resources (field_name, provider);
 -- HNSW index for vector similarity search (created in background)
 -- Note: This will be created by background thread after data load
--- CREATE INDEX idx_embeddings_image_resources_vector_hnsw ON embeddings_image_resources
+-- CREATE INDEX IF NOT EXISTS idx_embeddings_image_resources_vector_hnsw ON embeddings_image_resources
 -- USING hnsw (embedding vector_cosine_ops);
 -- KV_STORE trigger for image_resources
@@ -354,11 +354,11 @@ CREATE TABLE IF NOT EXISTS messages (
     tags TEXT[] DEFAULT ARRAY[]::TEXT[]
 );
-CREATE INDEX idx_messages_tenant ON messages (tenant_id);
-CREATE INDEX idx_messages_user ON messages (user_id);
-CREATE INDEX idx_messages_graph_edges ON messages USING GIN (graph_edges);
-CREATE INDEX idx_messages_metadata ON messages USING GIN (metadata);
-CREATE INDEX idx_messages_tags ON messages USING GIN (tags);
+CREATE INDEX IF NOT EXISTS idx_messages_tenant ON messages (tenant_id);
+CREATE INDEX IF NOT EXISTS idx_messages_user ON messages (user_id);
+CREATE INDEX IF NOT EXISTS idx_messages_graph_edges ON messages USING GIN (graph_edges);
+CREATE INDEX IF NOT EXISTS idx_messages_metadata ON messages USING GIN (metadata);
+CREATE INDEX IF NOT EXISTS idx_messages_tags ON messages USING GIN (tags);
 -- Embeddings for messages
 CREATE TABLE IF NOT EXISTS embeddings_messages (
@@ -376,14 +376,14 @@ CREATE TABLE IF NOT EXISTS embeddings_messages (
 );
 -- Index for entity lookup (get all embeddings for entity)
-CREATE INDEX idx_embeddings_messages_entity ON embeddings_messages (entity_id);
+CREATE INDEX IF NOT EXISTS idx_embeddings_messages_entity ON embeddings_messages (entity_id);
 -- Index for field + provider lookup
-CREATE INDEX idx_embeddings_messages_field_provider ON embeddings_messages (field_name, provider);
+CREATE INDEX IF NOT EXISTS idx_embeddings_messages_field_provider ON embeddings_messages (field_name, provider);
 -- HNSW index for vector similarity search (created in background)
 -- Note: This will be created by background thread after data load
--- CREATE INDEX idx_embeddings_messages_vector_hnsw ON embeddings_messages
+-- CREATE INDEX IF NOT EXISTS idx_embeddings_messages_vector_hnsw ON embeddings_messages
 -- USING hnsw (embedding vector_cosine_ops);
 -- KV_STORE trigger for messages
@@ -462,11 +462,11 @@ CREATE TABLE IF NOT EXISTS moments (
     tags TEXT[] DEFAULT ARRAY[]::TEXT[]
 );
-CREATE INDEX idx_moments_tenant ON moments (tenant_id);
-CREATE INDEX idx_moments_user ON moments (user_id);
-CREATE INDEX idx_moments_graph_edges ON moments USING GIN (graph_edges);
-CREATE INDEX idx_moments_metadata ON moments USING GIN (metadata);
-CREATE INDEX idx_moments_tags ON moments USING GIN (tags);
+CREATE INDEX IF NOT EXISTS idx_moments_tenant ON moments (tenant_id);
+CREATE INDEX IF NOT EXISTS idx_moments_user ON moments (user_id);
+CREATE INDEX IF NOT EXISTS idx_moments_graph_edges ON moments USING GIN (graph_edges);
+CREATE INDEX IF NOT EXISTS idx_moments_metadata ON moments USING GIN (metadata);
+CREATE INDEX IF NOT EXISTS idx_moments_tags ON moments USING GIN (tags);
 -- Embeddings for moments
 CREATE TABLE IF NOT EXISTS embeddings_moments (
@@ -484,14 +484,14 @@ CREATE TABLE IF NOT EXISTS embeddings_moments (
 );
 -- Index for entity lookup (get all embeddings for entity)
-CREATE INDEX idx_embeddings_moments_entity ON embeddings_moments (entity_id);
+CREATE INDEX IF NOT EXISTS idx_embeddings_moments_entity ON embeddings_moments (entity_id);
 -- Index for field + provider lookup
-CREATE INDEX idx_embeddings_moments_field_provider ON embeddings_moments (field_name, provider);
+CREATE INDEX IF NOT EXISTS idx_embeddings_moments_field_provider ON embeddings_moments (field_name, provider);
 -- HNSW index for vector similarity search (created in background)
 -- Note: This will be created by background thread after data load
--- CREATE INDEX idx_embeddings_moments_vector_hnsw ON embeddings_moments
+-- CREATE INDEX IF NOT EXISTS idx_embeddings_moments_vector_hnsw ON embeddings_moments
 -- USING hnsw (embedding vector_cosine_ops);
 -- KV_STORE trigger for moments
@@ -569,11 +569,11 @@ CREATE TABLE IF NOT EXISTS ontologies (
     tags TEXT[] DEFAULT ARRAY[]::TEXT[]
 );
-CREATE INDEX idx_ontologies_tenant ON ontologies (tenant_id);
-CREATE INDEX idx_ontologies_user ON ontologies (user_id);
-CREATE INDEX idx_ontologies_graph_edges ON ontologies USING GIN (graph_edges);
-CREATE INDEX idx_ontologies_metadata ON ontologies USING GIN (metadata);
-CREATE INDEX idx_ontologies_tags ON ontologies USING GIN (tags);
+CREATE INDEX IF NOT EXISTS idx_ontologies_tenant ON ontologies (tenant_id);
+CREATE INDEX IF NOT EXISTS idx_ontologies_user ON ontologies (user_id);
+CREATE INDEX IF NOT EXISTS idx_ontologies_graph_edges ON ontologies USING GIN (graph_edges);
+CREATE INDEX IF NOT EXISTS idx_ontologies_metadata ON ontologies USING GIN (metadata);
+CREATE INDEX IF NOT EXISTS idx_ontologies_tags ON ontologies USING GIN (tags);
 -- KV_STORE trigger for ontologies
 -- Trigger function to maintain KV_STORE for ontologies
@@ -651,11 +651,11 @@ CREATE TABLE IF NOT EXISTS ontology_configs (
     tags TEXT[] DEFAULT ARRAY[]::TEXT[]
 );
-CREATE INDEX idx_ontology_configs_tenant ON ontology_configs (tenant_id);
-CREATE INDEX idx_ontology_configs_user ON ontology_configs (user_id);
-CREATE INDEX idx_ontology_configs_graph_edges ON ontology_configs USING GIN (graph_edges);
-CREATE INDEX idx_ontology_configs_metadata ON ontology_configs USING GIN (metadata);
-CREATE INDEX idx_ontology_configs_tags ON ontology_configs USING GIN (tags);
+CREATE INDEX IF NOT EXISTS idx_ontology_configs_tenant ON ontology_configs (tenant_id);
+CREATE INDEX IF NOT EXISTS idx_ontology_configs_user ON ontology_configs (user_id);
+CREATE INDEX IF NOT EXISTS idx_ontology_configs_graph_edges ON ontology_configs USING GIN (graph_edges);
+CREATE INDEX IF NOT EXISTS idx_ontology_configs_metadata ON ontology_configs USING GIN (metadata);
+CREATE INDEX IF NOT EXISTS idx_ontology_configs_tags ON ontology_configs USING GIN (tags);
 -- Embeddings for ontology_configs
 CREATE TABLE IF NOT EXISTS embeddings_ontology_configs (
@@ -673,14 +673,14 @@ CREATE TABLE IF NOT EXISTS embeddings_ontology_configs (
 );
 -- Index for entity lookup (get all embeddings for entity)
-CREATE INDEX idx_embeddings_ontology_configs_entity ON embeddings_ontology_configs (entity_id);
+CREATE INDEX IF NOT EXISTS idx_embeddings_ontology_configs_entity ON embeddings_ontology_configs (entity_id);
 -- Index for field + provider lookup
-CREATE INDEX idx_embeddings_ontology_configs_field_provider ON embeddings_ontology_configs (field_name, provider);
+CREATE INDEX IF NOT EXISTS idx_embeddings_ontology_configs_field_provider ON embeddings_ontology_configs (field_name, provider);
 -- HNSW index for vector similarity search (created in background)
 -- Note: This will be created by background thread after data load
--- CREATE INDEX idx_embeddings_ontology_configs_vector_hnsw ON embeddings_ontology_configs
+-- CREATE INDEX IF NOT EXISTS idx_embeddings_ontology_configs_vector_hnsw ON embeddings_ontology_configs
 -- USING hnsw (embedding vector_cosine_ops);
 -- KV_STORE trigger for ontology_configs
@@ -756,11 +756,11 @@ CREATE TABLE IF NOT EXISTS resources (
     tags TEXT[] DEFAULT ARRAY[]::TEXT[]
 );
-CREATE INDEX idx_resources_tenant ON resources (tenant_id);
-CREATE INDEX idx_resources_user ON resources (user_id);
-CREATE INDEX idx_resources_graph_edges ON resources USING GIN (graph_edges);
-CREATE INDEX idx_resources_metadata ON resources USING GIN (metadata);
-CREATE INDEX idx_resources_tags ON resources USING GIN (tags);
+CREATE INDEX IF NOT EXISTS idx_resources_tenant ON resources (tenant_id);
+CREATE INDEX IF NOT EXISTS idx_resources_user ON resources (user_id);
+CREATE INDEX IF NOT EXISTS idx_resources_graph_edges ON resources USING GIN (graph_edges);
+CREATE INDEX IF NOT EXISTS idx_resources_metadata ON resources USING GIN (metadata);
+CREATE INDEX IF NOT EXISTS idx_resources_tags ON resources USING GIN (tags);
 -- Embeddings for resources
 CREATE TABLE IF NOT EXISTS embeddings_resources (
@@ -778,14 +778,14 @@ CREATE TABLE IF NOT EXISTS embeddings_resources (
 );
 -- Index for entity lookup (get all embeddings for entity)
-CREATE INDEX idx_embeddings_resources_entity ON embeddings_resources (entity_id);
+CREATE INDEX IF NOT EXISTS idx_embeddings_resources_entity ON embeddings_resources (entity_id);
 -- Index for field + provider lookup
-CREATE INDEX idx_embeddings_resources_field_provider ON embeddings_resources (field_name, provider);
+CREATE INDEX IF NOT EXISTS idx_embeddings_resources_field_provider ON embeddings_resources (field_name, provider);
 -- HNSW index for vector similarity search (created in background)
 -- Note: This will be created by background thread after data load
--- CREATE INDEX idx_embeddings_resources_vector_hnsw ON embeddings_resources
+-- CREATE INDEX IF NOT EXISTS idx_embeddings_resources_vector_hnsw ON embeddings_resources
 -- USING hnsw (embedding vector_cosine_ops);
 -- KV_STORE trigger for resources
@@ -860,11 +860,11 @@ CREATE TABLE IF NOT EXISTS schemas (
     tags TEXT[] DEFAULT ARRAY[]::TEXT[]
 );
-CREATE INDEX idx_schemas_tenant ON schemas (tenant_id);
-CREATE INDEX idx_schemas_user ON schemas (user_id);
-CREATE INDEX idx_schemas_graph_edges ON schemas USING GIN (graph_edges);
-CREATE INDEX idx_schemas_metadata ON schemas USING GIN (metadata);
-CREATE INDEX idx_schemas_tags ON schemas USING GIN (tags);
+CREATE INDEX IF NOT EXISTS idx_schemas_tenant ON schemas (tenant_id);
+CREATE INDEX IF NOT EXISTS idx_schemas_user ON schemas (user_id);
+CREATE INDEX IF NOT EXISTS idx_schemas_graph_edges ON schemas USING GIN (graph_edges);
+CREATE INDEX IF NOT EXISTS idx_schemas_metadata ON schemas USING GIN (metadata);
+CREATE INDEX IF NOT EXISTS idx_schemas_tags ON schemas USING GIN (tags);
 -- Embeddings for schemas
 CREATE TABLE IF NOT EXISTS embeddings_schemas (
@@ -882,14 +882,14 @@ CREATE TABLE IF NOT EXISTS embeddings_schemas (
 );
 -- Index for entity lookup (get all embeddings for entity)
-CREATE INDEX idx_embeddings_schemas_entity ON embeddings_schemas (entity_id);
+CREATE INDEX IF NOT EXISTS idx_embeddings_schemas_entity ON embeddings_schemas (entity_id);
 -- Index for field + provider lookup
-CREATE INDEX idx_embeddings_schemas_field_provider ON embeddings_schemas (field_name, provider);
+CREATE INDEX IF NOT EXISTS idx_embeddings_schemas_field_provider ON embeddings_schemas (field_name, provider);
 -- HNSW index for vector similarity search (created in background)
 -- Note: This will be created by background thread after data load
--- CREATE INDEX idx_embeddings_schemas_vector_hnsw ON embeddings_schemas
+-- CREATE INDEX IF NOT EXISTS idx_embeddings_schemas_vector_hnsw ON embeddings_schemas
 -- USING hnsw (embedding vector_cosine_ops);
 -- KV_STORE trigger for schemas
@@ -967,11 +967,11 @@ CREATE TABLE IF NOT EXISTS sessions (
     tags TEXT[] DEFAULT ARRAY[]::TEXT[]
 );
-CREATE INDEX idx_sessions_tenant ON sessions (tenant_id);
-CREATE INDEX idx_sessions_user ON sessions (user_id);
-CREATE INDEX idx_sessions_graph_edges ON sessions USING GIN (graph_edges);
-CREATE INDEX idx_sessions_metadata ON sessions USING GIN (metadata);
-CREATE INDEX idx_sessions_tags ON sessions USING GIN (tags);
+CREATE INDEX IF NOT EXISTS idx_sessions_tenant ON sessions (tenant_id);
+CREATE INDEX IF NOT EXISTS idx_sessions_user ON sessions (user_id);
+CREATE INDEX IF NOT EXISTS idx_sessions_graph_edges ON sessions USING GIN (graph_edges);
+CREATE INDEX IF NOT EXISTS idx_sessions_metadata ON sessions USING GIN (metadata);
+CREATE INDEX IF NOT EXISTS idx_sessions_tags ON sessions USING GIN (tags);
 -- Embeddings for sessions
 CREATE TABLE IF NOT EXISTS embeddings_sessions (
@@ -989,14 +989,14 @@ CREATE TABLE IF NOT EXISTS embeddings_sessions (
 );
 -- Index for entity lookup (get all embeddings for entity)
-CREATE INDEX idx_embeddings_sessions_entity ON embeddings_sessions (entity_id);
+CREATE INDEX IF NOT EXISTS idx_embeddings_sessions_entity ON embeddings_sessions (entity_id);
 -- Index for field + provider lookup
-CREATE INDEX idx_embeddings_sessions_field_provider ON embeddings_sessions (field_name, provider);
+CREATE INDEX IF NOT EXISTS idx_embeddings_sessions_field_provider ON embeddings_sessions (field_name, provider);
 -- HNSW index for vector similarity search (created in background)
 -- Note: This will be created by background thread after data load
--- CREATE INDEX idx_embeddings_sessions_vector_hnsw ON embeddings_sessions
+-- CREATE INDEX IF NOT EXISTS idx_embeddings_sessions_vector_hnsw ON embeddings_sessions
 -- USING hnsw (embedding vector_cosine_ops);
 -- KV_STORE trigger for sessions
@@ -1068,11 +1068,11 @@ CREATE TABLE IF NOT EXISTS shared_sessions (
     tags TEXT[] DEFAULT ARRAY[]::TEXT[]
 );
-CREATE INDEX idx_shared_sessions_tenant ON shared_sessions (tenant_id);
-CREATE INDEX idx_shared_sessions_user ON shared_sessions (user_id);
-CREATE INDEX idx_shared_sessions_graph_edges ON shared_sessions USING GIN (graph_edges);
-CREATE INDEX idx_shared_sessions_metadata ON shared_sessions USING GIN (metadata);
-CREATE INDEX idx_shared_sessions_tags ON shared_sessions USING GIN (tags);
+CREATE INDEX IF NOT EXISTS idx_shared_sessions_tenant ON shared_sessions (tenant_id);
+CREATE INDEX IF NOT EXISTS idx_shared_sessions_user ON shared_sessions (user_id);
+CREATE INDEX IF NOT EXISTS idx_shared_sessions_graph_edges ON shared_sessions USING GIN (graph_edges);
+CREATE INDEX IF NOT EXISTS idx_shared_sessions_metadata ON shared_sessions USING GIN (metadata);
+CREATE INDEX IF NOT EXISTS idx_shared_sessions_tags ON shared_sessions USING GIN (tags);
 -- KV_STORE trigger for shared_sessions
 -- Trigger function to maintain KV_STORE for shared_sessions
@@ -1151,11 +1151,11 @@ CREATE TABLE IF NOT EXISTS users (
     tags TEXT[] DEFAULT ARRAY[]::TEXT[]
 );
-CREATE INDEX idx_users_tenant ON users (tenant_id);
-CREATE INDEX idx_users_user ON users (user_id);
-CREATE INDEX idx_users_graph_edges ON users USING GIN (graph_edges);
-CREATE INDEX idx_users_metadata ON users USING GIN (metadata);
-CREATE INDEX idx_users_tags ON users USING GIN (tags);
+CREATE INDEX IF NOT EXISTS idx_users_tenant ON users (tenant_id);
+CREATE INDEX IF NOT EXISTS idx_users_user ON users (user_id);
+CREATE INDEX IF NOT EXISTS idx_users_graph_edges ON users USING GIN (graph_edges);
+CREATE INDEX IF NOT EXISTS idx_users_metadata ON users USING GIN (metadata);
+CREATE INDEX IF NOT EXISTS idx_users_tags ON users USING GIN (tags);
 -- Embeddings for users
 CREATE TABLE IF NOT EXISTS embeddings_users (
@@ -1173,14 +1173,14 @@ CREATE TABLE IF NOT EXISTS embeddings_users (
 );
 -- Index for entity lookup (get all embeddings for entity)
-CREATE INDEX idx_embeddings_users_entity ON embeddings_users (entity_id);
+CREATE INDEX IF NOT EXISTS idx_embeddings_users_entity ON embeddings_users (entity_id);
 -- Index for field + provider lookup
-CREATE INDEX idx_embeddings_users_field_provider ON embeddings_users (field_name, provider);
+CREATE INDEX IF NOT EXISTS idx_embeddings_users_field_provider ON embeddings_users (field_name, provider);
 -- HNSW index for vector similarity search (created in background)
 -- Note: This will be created by background thread after data load
--- CREATE INDEX idx_embeddings_users_vector_hnsw ON embeddings_users
+-- CREATE INDEX IF NOT EXISTS idx_embeddings_users_vector_hnsw ON embeddings_users
 -- USING hnsw (embedding vector_cosine_ops);
 -- KV_STORE trigger for users
@@ -2067,7 +2067,7 @@ Domain-specific knowledge extracted from files using custom agents.
             file_id="file-uuid-456",
             agent_schema_id="contract-parser-v2",
             provider_name="openai",
-            model_name="gpt-4o",
+            model_name="gpt-4.1",
             extracted_data={
                 "contract_type": "supplier_agreement",
                 "parties": [
@@ -2197,7 +2197,7 @@ This schema includes the `search_rem` tool which supports:
 - **Optional**
 ',
-    '{"type": "object", "description": "Domain-specific knowledge extracted from files using custom agents.\n\n    Attributes:\n        name: Human-readable label for this ontology instance\n        file_id: Foreign key to File entity that was processed\n        agent_schema_id: Foreign key to Schema entity that performed extraction\n        provider_name: LLM provider used for extraction (e.g., \"anthropic\", \"openai\")\n        model_name: Specific model used (e.g., \"claude-sonnet-4-5\")\n        extracted_data: Structured data extracted by agent (arbitrary JSON)\n        confidence_score: Optional confidence score from extraction (0.0-1.0)\n        extraction_timestamp: When extraction was performed\n        embedding_text: Text used for generating embedding (derived from extracted_data)\n\n    Inherited from CoreModel:\n        id: UUID or string identifier\n        created_at: Entity creation timestamp\n        updated_at: Last update timestamp\n        deleted_at: Soft deletion timestamp\n        tenant_id: Multi-tenancy isolation\n        user_id: Ownership\n        graph_edges: Relationships to other entities\n        metadata: Flexible metadata storage\n        tags: Classification tags\n        column: Database schema metadata\n\n    Example Usage:\n        # CV extraction\n        cv_ontology = Ontology(\n            name=\"john-doe-cv-2024\",\n            file_id=\"file-uuid-123\",\n            agent_schema_id=\"cv-parser-v1\",\n            provider_name=\"anthropic\",\n            model_name=\"claude-sonnet-4-5-20250929\",\n            extracted_data={\n                \"candidate_name\": \"John Doe\",\n                \"email\": \"john@example.com\",\n                \"skills\": [\"Python\", \"PostgreSQL\", \"Kubernetes\"],\n                \"experience\": [\n                    {\n                        \"company\": \"TechCorp\",\n                        \"role\": \"Senior Engineer\",\n                        \"years\": 3,\n                        \"achievements\": [\"Led migration to k8s\", \"Reduced costs 40%\"]\n                    }\n                ],\n                \"education\": [\n                    {\"degree\": \"BS Computer Science\", \"institution\": \"MIT\", \"year\": 2018}\n                ]\n            },\n            confidence_score=0.95,\n            tags=[\"cv\", \"engineering\", \"senior-level\"]\n        )\n\n        # Contract extraction\n        contract_ontology = Ontology(\n            name=\"acme-supplier-agreement-2024\",\n            file_id=\"file-uuid-456\",\n            agent_schema_id=\"contract-parser-v2\",\n            provider_name=\"openai\",\n            model_name=\"gpt-4o\",\n            extracted_data={\n                \"contract_type\": \"supplier_agreement\",\n                \"parties\": [\n                    {\"name\": \"ACME Corp\", \"role\": \"buyer\"},\n                    {\"name\": \"SupplyChain Inc\", \"role\": \"supplier\"}\n                ],\n                \"effective_date\": \"2024-01-01\",\n                \"termination_date\": \"2026-12-31\",\n                \"payment_terms\": {\n                    \"amount\": 500000,\n                    \"currency\": \"USD\",\n                    \"frequency\": \"quarterly\"\n                },\n                \"key_obligations\": [\n                    \"Supplier must deliver within 30 days\",\n                    \"Buyer must pay within 60 days of invoice\"\n                ]\n            },\n            confidence_score=0.92,\n            tags=[\"contract\", \"supplier\", \"procurement\"]\n        )\n    \n\nThis agent can search the `ontologies` table using the `search_rem` tool. Use REM query syntax: LOOKUP for exact match, FUZZY for typo-tolerant search, SEARCH for semantic similarity, or SQL for complex queries.", "properties": {"id": {"anyOf": [{"format": "uuid", "type": "string"}, {"type": "string"}, {"type": "null"}], "default": null, "description": "Unique identifier (UUID or string, generated per model type). Generated automatically if not provided.", "title": "Id"}, "created_at": {"description": "Entity creation timestamp", "format": "date-time", "title": "Created At", "type": "string"}, "updated_at": {"description": "Last update timestamp", "format": "date-time", "title": "Updated At", "type": "string"}, "deleted_at": {"anyOf": [{"format": "date-time", "type": "string"}, {"type": "null"}], "default": null, "description": "Soft deletion timestamp", "title": "Deleted At"}, "tenant_id": {"anyOf": [{"type": "string"}, {"type": "null"}], "default": null, "description": "Tenant identifier for multi-tenancy isolation", "title": "Tenant Id"}, "user_id": {"anyOf": [{"type": "string"}, {"type": "null"}], "default": null, "description": "Owner user identifier (tenant-scoped). This is a VARCHAR(256), not a UUID, to allow flexibility for external identity providers. Typically generated as a hash of the user''s email address. In future, other strong unique claims (e.g., OAuth sub, verified phone) could also be used for generation.", "title": "User Id"}, "graph_edges": {"description": "Knowledge graph edges stored as InlineEdge dicts", "items": {"additionalProperties": true, "type": "object"}, "title": "Graph Edges", "type": "array"}, "metadata": {"additionalProperties": true, "description": "Flexible metadata storage", "title": "Metadata", "type": "object"}, "tags": {"description": "Entity tags", "items": {"type": "string"}, "title": "Tags", "type": "array"}, "name": {"title": "Name", "type": "string"}, "file_id": {"anyOf": [{"format": "uuid", "type": "string"}, {"type": "string"}], "title": "File Id"}, "agent_schema_id": {"title": "Agent Schema Id", "type": "string"}, "provider_name": {"title": "Provider Name", "type": "string"}, "model_name": {"title": "Model Name", "type": "string"}, "extracted_data": {"additionalProperties": true, "title": "Extracted Data", "type": "object"}, "confidence_score": {"anyOf": [{"type": "number"}, {"type": "null"}], "default": null, "title": "Confidence Score"}, "extraction_timestamp": {"anyOf": [{"type": "string"}, {"type": "null"}], "default": null, "title": "Extraction Timestamp"}, "embedding_text": {"anyOf": [{"type": "string"}, {"type": "null"}], "default": null, "title": "Embedding Text"}}, "required": ["name", "file_id", "agent_schema_id", "provider_name", "model_name", "extracted_data"], "json_schema_extra": {"table_name": "ontologies", "entity_key_field": "id", "embedding_fields": [], "fully_qualified_name": "rem.models.entities.ontology.Ontology", "tools": ["search_rem"], "default_search_table": "ontologies", "has_embeddings": false}}'::jsonb,
+    '{"type": "object", "description": "Domain-specific knowledge extracted from files using custom agents.\n\n    Attributes:\n        name: Human-readable label for this ontology instance\n        file_id: Foreign key to File entity that was processed\n        agent_schema_id: Foreign key to Schema entity that performed extraction\n        provider_name: LLM provider used for extraction (e.g., \"anthropic\", \"openai\")\n        model_name: Specific model used (e.g., \"claude-sonnet-4-5\")\n        extracted_data: Structured data extracted by agent (arbitrary JSON)\n        confidence_score: Optional confidence score from extraction (0.0-1.0)\n        extraction_timestamp: When extraction was performed\n        embedding_text: Text used for generating embedding (derived from extracted_data)\n\n    Inherited from CoreModel:\n        id: UUID or string identifier\n        created_at: Entity creation timestamp\n        updated_at: Last update timestamp\n        deleted_at: Soft deletion timestamp\n        tenant_id: Multi-tenancy isolation\n        user_id: Ownership\n        graph_edges: Relationships to other entities\n        metadata: Flexible metadata storage\n        tags: Classification tags\n        column: Database schema metadata\n\n    Example Usage:\n        # CV extraction\n        cv_ontology = Ontology(\n            name=\"john-doe-cv-2024\",\n            file_id=\"file-uuid-123\",\n            agent_schema_id=\"cv-parser-v1\",\n            provider_name=\"anthropic\",\n            model_name=\"claude-sonnet-4-5-20250929\",\n            extracted_data={\n                \"candidate_name\": \"John Doe\",\n                \"email\": \"john@example.com\",\n                \"skills\": [\"Python\", \"PostgreSQL\", \"Kubernetes\"],\n                \"experience\": [\n                    {\n                        \"company\": \"TechCorp\",\n                        \"role\": \"Senior Engineer\",\n                        \"years\": 3,\n                        \"achievements\": [\"Led migration to k8s\", \"Reduced costs 40%\"]\n                    }\n                ],\n                \"education\": [\n                    {\"degree\": \"BS Computer Science\", \"institution\": \"MIT\", \"year\": 2018}\n                ]\n            },\n            confidence_score=0.95,\n            tags=[\"cv\", \"engineering\", \"senior-level\"]\n        )\n\n        # Contract extraction\n        contract_ontology = Ontology(\n            name=\"acme-supplier-agreement-2024\",\n            file_id=\"file-uuid-456\",\n            agent_schema_id=\"contract-parser-v2\",\n            provider_name=\"openai\",\n            model_name=\"gpt-4.1\",\n            extracted_data={\n                \"contract_type\": \"supplier_agreement\",\n                \"parties\": [\n                    {\"name\": \"ACME Corp\", \"role\": \"buyer\"},\n                    {\"name\": \"SupplyChain Inc\", \"role\": \"supplier\"}\n                ],\n                \"effective_date\": \"2024-01-01\",\n                \"termination_date\": \"2026-12-31\",\n                \"payment_terms\": {\n                    \"amount\": 500000,\n                    \"currency\": \"USD\",\n                    \"frequency\": \"quarterly\"\n                },\n                \"key_obligations\": [\n                    \"Supplier must deliver within 30 days\",\n                    \"Buyer must pay within 60 days of invoice\"\n                ]\n            },\n            confidence_score=0.92,\n            tags=[\"contract\", \"supplier\", \"procurement\"]\n        )\n    \n\nThis agent can search the `ontologies` table using the `search_rem` tool. Use REM query syntax: LOOKUP for exact match, FUZZY for typo-tolerant search, SEARCH for semantic similarity, or SQL for complex queries.", "properties": {"id": {"anyOf": [{"format": "uuid", "type": "string"}, {"type": "string"}, {"type": "null"}], "default": null, "description": "Unique identifier (UUID or string, generated per model type). Generated automatically if not provided.", "title": "Id"}, "created_at": {"description": "Entity creation timestamp", "format": "date-time", "title": "Created At", "type": "string"}, "updated_at": {"description": "Last update timestamp", "format": "date-time", "title": "Updated At", "type": "string"}, "deleted_at": {"anyOf": [{"format": "date-time", "type": "string"}, {"type": "null"}], "default": null, "description": "Soft deletion timestamp", "title": "Deleted At"}, "tenant_id": {"anyOf": [{"type": "string"}, {"type": "null"}], "default": null, "description": "Tenant identifier for multi-tenancy isolation", "title": "Tenant Id"}, "user_id": {"anyOf": [{"type": "string"}, {"type": "null"}], "default": null, "description": "Owner user identifier (tenant-scoped). This is a VARCHAR(256), not a UUID, to allow flexibility for external identity providers. Typically generated as a hash of the user''s email address. In future, other strong unique claims (e.g., OAuth sub, verified phone) could also be used for generation.", "title": "User Id"}, "graph_edges": {"description": "Knowledge graph edges stored as InlineEdge dicts", "items": {"additionalProperties": true, "type": "object"}, "title": "Graph Edges", "type": "array"}, "metadata": {"additionalProperties": true, "description": "Flexible metadata storage", "title": "Metadata", "type": "object"}, "tags": {"description": "Entity tags", "items": {"type": "string"}, "title": "Tags", "type": "array"}, "name": {"title": "Name", "type": "string"}, "file_id": {"anyOf": [{"format": "uuid", "type": "string"}, {"type": "string"}], "title": "File Id"}, "agent_schema_id": {"title": "Agent Schema Id", "type": "string"}, "provider_name": {"title": "Provider Name", "type": "string"}, "model_name": {"title": "Model Name", "type": "string"}, "extracted_data": {"additionalProperties": true, "title": "Extracted Data", "type": "object"}, "confidence_score": {"anyOf": [{"type": "number"}, {"type": "null"}], "default": null, "title": "Confidence Score"}, "extraction_timestamp": {"anyOf": [{"type": "string"}, {"type": "null"}], "default": null, "title": "Extraction Timestamp"}, "embedding_text": {"anyOf": [{"type": "string"}, {"type": "null"}], "default": null, "title": "Embedding Text"}}, "required": ["name", "file_id", "agent_schema_id", "provider_name", "model_name", "extracted_data"], "json_schema_extra": {"table_name": "ontologies", "entity_key_field": "id", "embedding_fields": [], "fully_qualified_name": "rem.models.entities.ontology.Ontology", "tools": ["search_rem"], "default_search_table": "ontologies", "has_embeddings": false}}'::jsonb,
     'entity',
     '{"table_name": "ontologies", "entity_key_field": "id", "embedding_fields": [], "fqn": "rem.models.entities.ontology.Ontology"}'::jsonb
 )
@@ -2266,7 +2266,7 @@ User configuration for automatic ontology extraction.
             priority=200,  # Higher priority = runs first
             enabled=True,
             provider_name="openai",  # Override default provider
-            model_name="gpt-4o",
+            model_name="gpt-4.1",
             tenant_id="acme-corp",
             tags=["legal", "procurement"]
         )
@@ -2395,7 +2395,7 @@ This schema includes the `search_rem` tool which supports:
 - **Optional**
 ',
-    '{"type": "object", "description": "User configuration for automatic ontology extraction.\n\n    Attributes:\n        name: Human-readable config name\n        agent_schema_id: Foreign key to Schema entity to use for extraction\n        description: Purpose and scope of this config\n\n        # File matching rules (ANY matching rule triggers extraction)\n        mime_type_pattern: Regex pattern for file MIME types (e.g., \"application/pdf\")\n        uri_pattern: Regex pattern for file URIs (e.g., \"s3://bucket/resumes/.*\")\n        tag_filter: List of tags (file must have ALL tags to match)\n\n        # Execution control\n        priority: Execution order (higher = earlier, default 100)\n        enabled: Whether this config is active (default True)\n\n        # LLM provider configuration\n        provider_name: Optional LLM provider override (defaults to settings)\n        model_name: Optional model override (defaults to settings)\n\n    Inherited from CoreModel:\n        id, created_at, updated_at, deleted_at, tenant_id, user_id,\n        graph_edges, metadata, tags, column\n\n    Example Usage:\n        # CV extraction for recruitment\n        cv_config = OntologyConfig(\n            name=\"recruitment-cv-parser\",\n            agent_schema_id=\"cv-parser-v1\",\n            description=\"Extract candidate information from resumes\",\n            mime_type_pattern=\"application/pdf\",\n            uri_pattern=\".*/resumes/.*\",\n            tag_filter=[\"cv\", \"candidate\"],\n            priority=100,\n            enabled=True,\n            tenant_id=\"acme-corp\",\n            tags=[\"recruitment\", \"hr\"]\n        )\n\n        # Contract analysis for legal team\n        contract_config = OntologyConfig(\n            name=\"legal-contract-analyzer\",\n            agent_schema_id=\"contract-parser-v2\",\n            description=\"Extract key terms from supplier contracts\",\n            mime_type_pattern=\"application/(pdf|msword|vnd.openxmlformats.*)\",\n            tag_filter=[\"legal\", \"contract\"],\n            priority=200,  # Higher priority = runs first\n            enabled=True,\n            provider_name=\"openai\",  # Override default provider\n            model_name=\"gpt-4o\",\n            tenant_id=\"acme-corp\",\n            tags=[\"legal\", \"procurement\"]\n        )\n\n        # Medical records for healthcare\n        medical_config = OntologyConfig(\n            name=\"medical-records-extractor\",\n            agent_schema_id=\"medical-parser-v1\",\n            description=\"Extract diagnoses and treatments from medical records\",\n            mime_type_pattern=\"application/pdf\",\n            tag_filter=[\"medical\", \"patient-record\"],\n            priority=50,\n            enabled=True,\n            tenant_id=\"healthsystem\",\n            tags=[\"medical\", \"hipaa-compliant\"]\n        )\n    \n\nThis agent can search the `ontology_configs` table using the `search_rem` tool. Use REM query syntax: LOOKUP for exact match, FUZZY for typo-tolerant search, SEARCH for semantic similarity, or SQL for complex queries.", "properties": {"id": {"anyOf": [{"format": "uuid", "type": "string"}, {"type": "string"}, {"type": "null"}], "default": null, "description": "Unique identifier (UUID or string, generated per model type). Generated automatically if not provided.", "title": "Id"}, "created_at": {"description": "Entity creation timestamp", "format": "date-time", "title": "Created At", "type": "string"}, "updated_at": {"description": "Last update timestamp", "format": "date-time", "title": "Updated At", "type": "string"}, "deleted_at": {"anyOf": [{"format": "date-time", "type": "string"}, {"type": "null"}], "default": null, "description": "Soft deletion timestamp", "title": "Deleted At"}, "tenant_id": {"anyOf": [{"type": "string"}, {"type": "null"}], "default": null, "description": "Tenant identifier for multi-tenancy isolation", "title": "Tenant Id"}, "user_id": {"anyOf": [{"type": "string"}, {"type": "null"}], "default": null, "description": "Owner user identifier (tenant-scoped). This is a VARCHAR(256), not a UUID, to allow flexibility for external identity providers. Typically generated as a hash of the user''s email address. In future, other strong unique claims (e.g., OAuth sub, verified phone) could also be used for generation.", "title": "User Id"}, "graph_edges": {"description": "Knowledge graph edges stored as InlineEdge dicts", "items": {"additionalProperties": true, "type": "object"}, "title": "Graph Edges", "type": "array"}, "metadata": {"additionalProperties": true, "description": "Flexible metadata storage", "title": "Metadata", "type": "object"}, "tags": {"description": "Entity tags", "items": {"type": "string"}, "title": "Tags", "type": "array"}, "name": {"title": "Name", "type": "string"}, "agent_schema_id": {"title": "Agent Schema Id", "type": "string"}, "description": {"anyOf": [{"type": "string"}, {"type": "null"}], "default": null, "title": "Description"}, "mime_type_pattern": {"anyOf": [{"type": "string"}, {"type": "null"}], "default": null, "title": "Mime Type Pattern"}, "uri_pattern": {"anyOf": [{"type": "string"}, {"type": "null"}], "default": null, "title": "Uri Pattern"}, "tag_filter": {"default": [], "items": {"type": "string"}, "title": "Tag Filter", "type": "array"}, "priority": {"default": 100, "title": "Priority", "type": "integer"}, "enabled": {"default": true, "title": "Enabled", "type": "boolean"}, "provider_name": {"anyOf": [{"type": "string"}, {"type": "null"}], "default": null, "title": "Provider Name"}, "model_name": {"anyOf": [{"type": "string"}, {"type": "null"}], "default": null, "title": "Model Name"}}, "required": ["name", "agent_schema_id"], "json_schema_extra": {"table_name": "ontology_configs", "entity_key_field": "id", "embedding_fields": ["description"], "fully_qualified_name": "rem.models.entities.ontology_config.OntologyConfig", "tools": ["search_rem"], "default_search_table": "ontology_configs", "has_embeddings": true}}'::jsonb,
+    '{"type": "object", "description": "User configuration for automatic ontology extraction.\n\n    Attributes:\n        name: Human-readable config name\n        agent_schema_id: Foreign key to Schema entity to use for extraction\n        description: Purpose and scope of this config\n\n        # File matching rules (ANY matching rule triggers extraction)\n        mime_type_pattern: Regex pattern for file MIME types (e.g., \"application/pdf\")\n        uri_pattern: Regex pattern for file URIs (e.g., \"s3://bucket/resumes/.*\")\n        tag_filter: List of tags (file must have ALL tags to match)\n\n        # Execution control\n        priority: Execution order (higher = earlier, default 100)\n        enabled: Whether this config is active (default True)\n\n        # LLM provider configuration\n        provider_name: Optional LLM provider override (defaults to settings)\n        model_name: Optional model override (defaults to settings)\n\n    Inherited from CoreModel:\n        id, created_at, updated_at, deleted_at, tenant_id, user_id,\n        graph_edges, metadata, tags, column\n\n    Example Usage:\n        # CV extraction for recruitment\n        cv_config = OntologyConfig(\n            name=\"recruitment-cv-parser\",\n            agent_schema_id=\"cv-parser-v1\",\n            description=\"Extract candidate information from resumes\",\n            mime_type_pattern=\"application/pdf\",\n            uri_pattern=\".*/resumes/.*\",\n            tag_filter=[\"cv\", \"candidate\"],\n            priority=100,\n            enabled=True,\n            tenant_id=\"acme-corp\",\n            tags=[\"recruitment\", \"hr\"]\n        )\n\n        # Contract analysis for legal team\n        contract_config = OntologyConfig(\n            name=\"legal-contract-analyzer\",\n            agent_schema_id=\"contract-parser-v2\",\n            description=\"Extract key terms from supplier contracts\",\n            mime_type_pattern=\"application/(pdf|msword|vnd.openxmlformats.*)\",\n            tag_filter=[\"legal\", \"contract\"],\n            priority=200,  # Higher priority = runs first\n            enabled=True,\n            provider_name=\"openai\",  # Override default provider\n            model_name=\"gpt-4.1\",\n            tenant_id=\"acme-corp\",\n            tags=[\"legal\", \"procurement\"]\n        )\n\n        # Medical records for healthcare\n        medical_config = OntologyConfig(\n            name=\"medical-records-extractor\",\n            agent_schema_id=\"medical-parser-v1\",\n            description=\"Extract diagnoses and treatments from medical records\",\n            mime_type_pattern=\"application/pdf\",\n            tag_filter=[\"medical\", \"patient-record\"],\n            priority=50,\n            enabled=True,\n            tenant_id=\"healthsystem\",\n            tags=[\"medical\", \"hipaa-compliant\"]\n        )\n    \n\nThis agent can search the `ontology_configs` table using the `search_rem` tool. Use REM query syntax: LOOKUP for exact match, FUZZY for typo-tolerant search, SEARCH for semantic similarity, or SQL for complex queries.", "properties": {"id": {"anyOf": [{"format": "uuid", "type": "string"}, {"type": "string"}, {"type": "null"}], "default": null, "description": "Unique identifier (UUID or string, generated per model type). Generated automatically if not provided.", "title": "Id"}, "created_at": {"description": "Entity creation timestamp", "format": "date-time", "title": "Created At", "type": "string"}, "updated_at": {"description": "Last update timestamp", "format": "date-time", "title": "Updated At", "type": "string"}, "deleted_at": {"anyOf": [{"format": "date-time", "type": "string"}, {"type": "null"}], "default": null, "description": "Soft deletion timestamp", "title": "Deleted At"}, "tenant_id": {"anyOf": [{"type": "string"}, {"type": "null"}], "default": null, "description": "Tenant identifier for multi-tenancy isolation", "title": "Tenant Id"}, "user_id": {"anyOf": [{"type": "string"}, {"type": "null"}], "default": null, "description": "Owner user identifier (tenant-scoped). This is a VARCHAR(256), not a UUID, to allow flexibility for external identity providers. Typically generated as a hash of the user''s email address. In future, other strong unique claims (e.g., OAuth sub, verified phone) could also be used for generation.", "title": "User Id"}, "graph_edges": {"description": "Knowledge graph edges stored as InlineEdge dicts", "items": {"additionalProperties": true, "type": "object"}, "title": "Graph Edges", "type": "array"}, "metadata": {"additionalProperties": true, "description": "Flexible metadata storage", "title": "Metadata", "type": "object"}, "tags": {"description": "Entity tags", "items": {"type": "string"}, "title": "Tags", "type": "array"}, "name": {"title": "Name", "type": "string"}, "agent_schema_id": {"title": "Agent Schema Id", "type": "string"}, "description": {"anyOf": [{"type": "string"}, {"type": "null"}], "default": null, "title": "Description"}, "mime_type_pattern": {"anyOf": [{"type": "string"}, {"type": "null"}], "default": null, "title": "Mime Type Pattern"}, "uri_pattern": {"anyOf": [{"type": "string"}, {"type": "null"}], "default": null, "title": "Uri Pattern"}, "tag_filter": {"default": [], "items": {"type": "string"}, "title": "Tag Filter", "type": "array"}, "priority": {"default": 100, "title": "Priority", "type": "integer"}, "enabled": {"default": true, "title": "Enabled", "type": "boolean"}, "provider_name": {"anyOf": [{"type": "string"}, {"type": "null"}], "default": null, "title": "Provider Name"}, "model_name": {"anyOf": [{"type": "string"}, {"type": "null"}], "default": null, "title": "Model Name"}}, "required": ["name", "agent_schema_id"], "json_schema_extra": {"table_name": "ontology_configs", "entity_key_field": "id", "embedding_fields": ["description"], "fully_qualified_name": "rem.models.entities.ontology_config.OntologyConfig", "tools": ["search_rem"], "default_search_table": "ontology_configs", "has_embeddings": true}}'::jsonb,
     'entity',
     '{"table_name": "ontology_configs", "entity_key_field": "id", "embedding_fields": ["description"], "fqn": "rem.models.entities.ontology_config.OntologyConfig"}'::jsonb
 )

rem/sql/migrations/004_cache_system.sql CHANGED Viewed

@@ -91,7 +91,7 @@ DECLARE
     v_last_trigger TIMESTAMPTZ;
     v_api_secret TEXT;
     v_debounce_seconds CONSTANT INTEGER := 30;
-    v_api_url TEXT := 'http://rem-api.siggy.svc.cluster.local:8000/api/admin/internal/rebuild-kv';
+    v_api_url TEXT := 'http://rem-api.rem.svc.cluster.local:8000/api/admin/internal/rebuild-kv';
     v_request_id BIGINT;
 BEGIN
     -- Quick check: is kv_store actually empty for this user?

rem/utils/README.md CHANGED Viewed

@@ -4,6 +4,7 @@
 1. [SQL Types](#sql-types-sql_typespy) - Pydantic to PostgreSQL type mapping
 2. [Embeddings](#embeddings-embeddingspy) - Vector embeddings generation
+3. [Files](#files-filespy) - File utilities and DataFrame I/O
 ## SQL Types (`sql_types.py`)
@@ -581,3 +582,47 @@ This will demonstrate:
 - `sql_types.py` - Use `embedding_provider` in json_schema_extra for TEXT fields
 - OpenAI Embeddings API: https://platform.openai.com/docs/api-reference/embeddings
 - pgvector Documentation: https://github.com/pgvector/pgvector
+---
+## Files (`files.py`)
+File utilities including temporary file handling and DataFrame I/O with automatic format detection.
+### DataFrame I/O
+Read and write DataFrames with format auto-detected from file extension:
+```python
+from rem.utils.files import read_dataframe, write_dataframe
+# Read - format inferred from extension
+df = read_dataframe("data.csv")
+df = read_dataframe("data.parquet")
+df = read_dataframe("data.xlsx")
+# Read from bytes (e.g., from S3)
+df = read_dataframe(content_bytes, filename="data.csv")
+# Write - format inferred from extension
+write_dataframe(df, "output.parquet")
+```
+**Supported formats**: `.csv`, `.tsv`, `.parquet`, `.json`, `.jsonl`, `.avro`, `.xlsx`, `.xls`, `.ods`, `.ipc`, `.arrow`, `.feather`
+Note: Some formats require optional dependencies (e.g., `fastexcel` for Excel).
+### Temporary File Utilities
+```python
+from rem.utils.files import temp_file_from_bytes, temp_directory
+# Create temp file from bytes, auto-cleanup
+with temp_file_from_bytes(pdf_bytes, suffix=".pdf") as tmp_path:
+    result = process_pdf(tmp_path)
+# Create temp directory, auto-cleanup
+with temp_directory() as tmp_dir:
+    # Work with files in tmp_dir
+    pass
+```

remdb 0.3.118__py3-none-any.whl → 0.3.146__py3-none-any.whl

Potentially problematic release.

remdb 0.3.118py3-none-any.whl → 0.3.146py3-none-any.whl