PyPI - basic-memory - Versions diffs - 0.7.0__py3-none-any.whl → 0.17.4__py3-none-any.whl - Mend

basic-memory 0.7.0__py3-none-any.whl → 0.17.4__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of basic-memory might be problematic. Click here for more details.

Files changed (195) hide show

basic_memory/__init__.py +5 -1
basic_memory/alembic/alembic.ini +119 -0
basic_memory/alembic/env.py +130 -20
basic_memory/alembic/migrations.py +4 -9
basic_memory/alembic/versions/314f1ea54dc4_add_postgres_full_text_search_support_.py +131 -0
basic_memory/alembic/versions/502b60eaa905_remove_required_from_entity_permalink.py +51 -0
basic_memory/alembic/versions/5fe1ab1ccebe_add_projects_table.py +120 -0
basic_memory/alembic/versions/647e7a75e2cd_project_constraint_fix.py +112 -0
basic_memory/alembic/versions/6830751f5fb6_merge_multiple_heads.py +24 -0
basic_memory/alembic/versions/9d9c1cb7d8f5_add_mtime_and_size_columns_to_entity_.py +49 -0
basic_memory/alembic/versions/a1b2c3d4e5f6_fix_project_foreign_keys.py +49 -0
basic_memory/alembic/versions/a2b3c4d5e6f7_add_search_index_entity_cascade.py +56 -0
basic_memory/alembic/versions/b3c3938bacdb_relation_to_name_unique_index.py +44 -0
basic_memory/alembic/versions/cc7172b46608_update_search_index_schema.py +113 -0
basic_memory/alembic/versions/e7e1f4367280_add_scan_watermark_tracking_to_project.py +37 -0
basic_memory/alembic/versions/f8a9b2c3d4e5_add_pg_trgm_for_fuzzy_link_resolution.py +239 -0
basic_memory/alembic/versions/g9a0b3c4d5e6_add_external_id_to_project_and_entity.py +173 -0
basic_memory/api/app.py +87 -20
basic_memory/api/container.py +133 -0
basic_memory/api/routers/__init__.py +4 -1
basic_memory/api/routers/directory_router.py +84 -0
basic_memory/api/routers/importer_router.py +152 -0
basic_memory/api/routers/knowledge_router.py +180 -23
basic_memory/api/routers/management_router.py +80 -0
basic_memory/api/routers/memory_router.py +9 -64
basic_memory/api/routers/project_router.py +460 -0
basic_memory/api/routers/prompt_router.py +260 -0
basic_memory/api/routers/resource_router.py +136 -11
basic_memory/api/routers/search_router.py +5 -5
basic_memory/api/routers/utils.py +169 -0
basic_memory/api/template_loader.py +292 -0
basic_memory/api/v2/__init__.py +35 -0
basic_memory/api/v2/routers/__init__.py +21 -0
basic_memory/api/v2/routers/directory_router.py +93 -0
basic_memory/api/v2/routers/importer_router.py +181 -0
basic_memory/api/v2/routers/knowledge_router.py +427 -0
basic_memory/api/v2/routers/memory_router.py +130 -0
basic_memory/api/v2/routers/project_router.py +359 -0
basic_memory/api/v2/routers/prompt_router.py +269 -0
basic_memory/api/v2/routers/resource_router.py +286 -0
basic_memory/api/v2/routers/search_router.py +73 -0
basic_memory/cli/app.py +80 -10
basic_memory/cli/auth.py +300 -0
basic_memory/cli/commands/__init__.py +15 -2
basic_memory/cli/commands/cloud/__init__.py +6 -0
basic_memory/cli/commands/cloud/api_client.py +127 -0
basic_memory/cli/commands/cloud/bisync_commands.py +110 -0
basic_memory/cli/commands/cloud/cloud_utils.py +108 -0
basic_memory/cli/commands/cloud/core_commands.py +195 -0
basic_memory/cli/commands/cloud/rclone_commands.py +397 -0
basic_memory/cli/commands/cloud/rclone_config.py +110 -0
basic_memory/cli/commands/cloud/rclone_installer.py +263 -0
basic_memory/cli/commands/cloud/upload.py +240 -0
basic_memory/cli/commands/cloud/upload_command.py +124 -0
basic_memory/cli/commands/command_utils.py +99 -0
basic_memory/cli/commands/db.py +87 -12
basic_memory/cli/commands/format.py +198 -0
basic_memory/cli/commands/import_chatgpt.py +47 -223
basic_memory/cli/commands/import_claude_conversations.py +48 -171
basic_memory/cli/commands/import_claude_projects.py +53 -160
basic_memory/cli/commands/import_memory_json.py +55 -111
basic_memory/cli/commands/mcp.py +67 -11
basic_memory/cli/commands/project.py +889 -0
basic_memory/cli/commands/status.py +52 -34
basic_memory/cli/commands/telemetry.py +81 -0
basic_memory/cli/commands/tool.py +341 -0
basic_memory/cli/container.py +84 -0
basic_memory/cli/main.py +14 -6
basic_memory/config.py +580 -26
basic_memory/db.py +285 -28
basic_memory/deps/__init__.py +293 -0
basic_memory/deps/config.py +26 -0
basic_memory/deps/db.py +56 -0
basic_memory/deps/importers.py +200 -0
basic_memory/deps/projects.py +238 -0
basic_memory/deps/repositories.py +179 -0
basic_memory/deps/services.py +480 -0
basic_memory/deps.py +16 -185
basic_memory/file_utils.py +318 -54
basic_memory/ignore_utils.py +297 -0
basic_memory/importers/__init__.py +27 -0
basic_memory/importers/base.py +100 -0
basic_memory/importers/chatgpt_importer.py +245 -0
basic_memory/importers/claude_conversations_importer.py +192 -0
basic_memory/importers/claude_projects_importer.py +184 -0
basic_memory/importers/memory_json_importer.py +128 -0
basic_memory/importers/utils.py +61 -0
basic_memory/markdown/entity_parser.py +182 -23
basic_memory/markdown/markdown_processor.py +70 -7
basic_memory/markdown/plugins.py +43 -23
basic_memory/markdown/schemas.py +1 -1
basic_memory/markdown/utils.py +38 -14
basic_memory/mcp/async_client.py +135 -4
basic_memory/mcp/clients/__init__.py +28 -0
basic_memory/mcp/clients/directory.py +70 -0
basic_memory/mcp/clients/knowledge.py +176 -0
basic_memory/mcp/clients/memory.py +120 -0
basic_memory/mcp/clients/project.py +89 -0
basic_memory/mcp/clients/resource.py +71 -0
basic_memory/mcp/clients/search.py +65 -0
basic_memory/mcp/container.py +110 -0
basic_memory/mcp/project_context.py +155 -0
basic_memory/mcp/prompts/__init__.py +19 -0
basic_memory/mcp/prompts/ai_assistant_guide.py +70 -0
basic_memory/mcp/prompts/continue_conversation.py +62 -0
basic_memory/mcp/prompts/recent_activity.py +188 -0
basic_memory/mcp/prompts/search.py +57 -0
basic_memory/mcp/prompts/utils.py +162 -0
basic_memory/mcp/resources/ai_assistant_guide.md +283 -0
basic_memory/mcp/resources/project_info.py +71 -0
basic_memory/mcp/server.py +61 -9
basic_memory/mcp/tools/__init__.py +33 -21
basic_memory/mcp/tools/build_context.py +120 -0
basic_memory/mcp/tools/canvas.py +152 -0
basic_memory/mcp/tools/chatgpt_tools.py +190 -0
basic_memory/mcp/tools/delete_note.py +249 -0
basic_memory/mcp/tools/edit_note.py +325 -0
basic_memory/mcp/tools/list_directory.py +157 -0
basic_memory/mcp/tools/move_note.py +549 -0
basic_memory/mcp/tools/project_management.py +204 -0
basic_memory/mcp/tools/read_content.py +281 -0
basic_memory/mcp/tools/read_note.py +265 -0
basic_memory/mcp/tools/recent_activity.py +528 -0
basic_memory/mcp/tools/search.py +377 -24
basic_memory/mcp/tools/utils.py +402 -16
basic_memory/mcp/tools/view_note.py +78 -0
basic_memory/mcp/tools/write_note.py +230 -0
basic_memory/models/__init__.py +3 -2
basic_memory/models/knowledge.py +82 -17
basic_memory/models/project.py +93 -0
basic_memory/models/search.py +68 -8
basic_memory/project_resolver.py +222 -0
basic_memory/repository/__init__.py +2 -0
basic_memory/repository/entity_repository.py +437 -8
basic_memory/repository/observation_repository.py +36 -3
basic_memory/repository/postgres_search_repository.py +451 -0
basic_memory/repository/project_info_repository.py +10 -0
basic_memory/repository/project_repository.py +140 -0
basic_memory/repository/relation_repository.py +79 -4
basic_memory/repository/repository.py +148 -29
basic_memory/repository/search_index_row.py +95 -0
basic_memory/repository/search_repository.py +79 -268
basic_memory/repository/search_repository_base.py +241 -0
basic_memory/repository/sqlite_search_repository.py +437 -0
basic_memory/runtime.py +61 -0
basic_memory/schemas/__init__.py +22 -9
basic_memory/schemas/base.py +131 -12
basic_memory/schemas/cloud.py +50 -0
basic_memory/schemas/directory.py +31 -0
basic_memory/schemas/importer.py +35 -0
basic_memory/schemas/memory.py +194 -25
basic_memory/schemas/project_info.py +213 -0
basic_memory/schemas/prompt.py +90 -0
basic_memory/schemas/request.py +56 -2
basic_memory/schemas/response.py +85 -28
basic_memory/schemas/search.py +36 -35
basic_memory/schemas/sync_report.py +72 -0
basic_memory/schemas/v2/__init__.py +27 -0
basic_memory/schemas/v2/entity.py +133 -0
basic_memory/schemas/v2/resource.py +47 -0
basic_memory/services/__init__.py +2 -1
basic_memory/services/context_service.py +451 -138
basic_memory/services/directory_service.py +310 -0
basic_memory/services/entity_service.py +636 -71
basic_memory/services/exceptions.py +21 -0
basic_memory/services/file_service.py +402 -33
basic_memory/services/initialization.py +216 -0
basic_memory/services/link_resolver.py +50 -56
basic_memory/services/project_service.py +888 -0
basic_memory/services/search_service.py +232 -37
basic_memory/sync/__init__.py +4 -2
basic_memory/sync/background_sync.py +26 -0
basic_memory/sync/coordinator.py +160 -0
basic_memory/sync/sync_service.py +1200 -109
basic_memory/sync/watch_service.py +432 -135
basic_memory/telemetry.py +249 -0
basic_memory/templates/prompts/continue_conversation.hbs +110 -0
basic_memory/templates/prompts/search.hbs +101 -0
basic_memory/utils.py +407 -54
basic_memory-0.17.4.dist-info/METADATA +617 -0
basic_memory-0.17.4.dist-info/RECORD +193 -0
{basic_memory-0.7.0.dist-info → basic_memory-0.17.4.dist-info}/WHEEL +1 -1
{basic_memory-0.7.0.dist-info → basic_memory-0.17.4.dist-info}/entry_points.txt +1 -0
basic_memory/alembic/README +0 -1
basic_memory/cli/commands/sync.py +0 -206
basic_memory/cli/commands/tools.py +0 -157
basic_memory/mcp/tools/knowledge.py +0 -68
basic_memory/mcp/tools/memory.py +0 -170
basic_memory/mcp/tools/notes.py +0 -202
basic_memory/schemas/discovery.py +0 -28
basic_memory/sync/file_change_scanner.py +0 -158
basic_memory/sync/utils.py +0 -31
basic_memory-0.7.0.dist-info/METADATA +0 -378
basic_memory-0.7.0.dist-info/RECORD +0 -82
{basic_memory-0.7.0.dist-info → basic_memory-0.17.4.dist-info}/licenses/LICENSE +0 -0

basic_memory/repository/postgres_search_repository.py ADDED Viewed

@@ -0,0 +1,451 @@
+"""PostgreSQL tsvector-based search repository implementation."""
+import json
+import re
+from datetime import datetime
+from typing import List, Optional
+from loguru import logger
+from sqlalchemy import text
+from basic_memory import db
+from basic_memory.repository.search_index_row import SearchIndexRow
+from basic_memory.repository.search_repository_base import SearchRepositoryBase
+from basic_memory.schemas.search import SearchItemType
+class PostgresSearchRepository(SearchRepositoryBase):
+    """PostgreSQL tsvector implementation of search repository.
+    Uses PostgreSQL's full-text search capabilities with:
+    - tsvector for document representation
+    - tsquery for query representation
+    - GIN indexes for performance
+    - ts_rank() function for relevance scoring
+    - JSONB containment operators for metadata search
+    Note: This implementation uses UPSERT patterns (INSERT ... ON CONFLICT) instead of
+    delete-then-insert to handle race conditions during parallel entity indexing.
+    The partial unique index uix_search_index_permalink_project prevents duplicate
+    permalinks per project.
+    """
+    async def init_search_index(self):
+        """Create Postgres table with tsvector column and GIN indexes.
+        Note: This is handled by Alembic migrations. This method is a no-op
+        for Postgres as the schema is created via migrations.
+        """
+        logger.info("PostgreSQL search index initialization handled by migrations")
+        # Table creation is done via Alembic migrations
+        # This includes:
+        # - CREATE TABLE search_index (...)
+        # - ADD COLUMN textsearchable_index_col tsvector GENERATED ALWAYS AS (...)
+        # - CREATE INDEX USING GIN on textsearchable_index_col
+        # - CREATE INDEX USING GIN on metadata jsonb_path_ops
+        pass
+    async def index_item(self, search_index_row: SearchIndexRow) -> None:
+        """Insert one search row, or update the existing row with the same permalink.
+        The statement is an INSERT ... ON CONFLICT (permalink, project_id)
+        WHERE permalink IS NOT NULL DO UPDATE, which targets the partial unique
+        index uix_search_index_permalink_project. A row whose permalink is
+        already indexed for this project is overwritten column by column; a row
+        with a NULL permalink never conflicts on that index and is inserted.
+        Args:
+            search_index_row: The row to index. Its project_id is overridden
+                with this repository's project_id before the statement runs.
+        """
+        async with db.scoped_session(self.session_maker) as session:
+            # Raw SQL needs JSON fields as strings, so ask the row to serialize them
+            insert_data = search_index_row.to_insert(serialize_json=True)
+            # The repository's project always wins over whatever the row carried
+            insert_data["project_id"] = self.project_id
+            # Upsert instead of delete-then-insert so parallel indexing of the same
+            # permalink cannot fail on the unique index.
+            # The conflict target must repeat the index predicate
+            # (WHERE permalink IS NOT NULL) for Postgres to pick the partial index.
+            # permalink and project_id are the conflict key and are therefore not
+            # part of the SET list.
+            await session.execute(
+                text("""
+                    INSERT INTO search_index (
+                        id, title, content_stems, content_snippet, permalink, file_path, type, metadata,
+                        from_id, to_id, relation_type,
+                        entity_id, category,
+                        created_at, updated_at,
+                        project_id
+                    ) VALUES (
+                        :id, :title, :content_stems, :content_snippet, :permalink, :file_path, :type, :metadata,
+                        :from_id, :to_id, :relation_type,
+                        :entity_id, :category,
+                        :created_at, :updated_at,
+                        :project_id
+                    )
+                    ON CONFLICT (permalink, project_id) WHERE permalink IS NOT NULL DO UPDATE SET
+                        id = EXCLUDED.id,
+                        title = EXCLUDED.title,
+                        content_stems = EXCLUDED.content_stems,
+                        content_snippet = EXCLUDED.content_snippet,
+                        file_path = EXCLUDED.file_path,
+                        type = EXCLUDED.type,
+                        metadata = EXCLUDED.metadata,
+                        from_id = EXCLUDED.from_id,
+                        to_id = EXCLUDED.to_id,
+                        relation_type = EXCLUDED.relation_type,
+                        entity_id = EXCLUDED.entity_id,
+                        category = EXCLUDED.category,
+                        created_at = EXCLUDED.created_at,
+                        updated_at = EXCLUDED.updated_at
+                """),
+                insert_data,
+            )
+            # Logged after the statement succeeds but before the commit below
+            logger.debug(f"indexed row {search_index_row}")
+            await session.commit()
+    def _prepare_search_term(self, term: str, is_prefix: bool = True) -> str:
+        """Prepare a search term for tsquery format.
+        Args:
+            term: The search term to prepare
+            is_prefix: Whether to add prefix search capability (:* operator)
+        Returns:
+            Formatted search term for tsquery
+        For Postgres:
+        - Boolean operators are converted to tsquery format (&, |, !)
+        - Prefix matching uses the :* operator
+        - Terms are sanitized to prevent tsquery syntax errors
+        """
+        # Check for explicit boolean operators
+        boolean_operators = [" AND ", " OR ", " NOT "]
+        if any(op in f" {term} " for op in boolean_operators):
+            return self._prepare_boolean_query(term)
+        # For non-Boolean queries, prepare single term
+        return self._prepare_single_term(term, is_prefix)
+    def _prepare_boolean_query(self, query: str) -> str:
+        """Convert Boolean query to tsquery format.
+        Args:
+            query: A Boolean query like "coffee AND brewing" or "(pour OR french) AND press"
+        Returns:
+            tsquery-formatted string with & (AND), | (OR), ! (NOT) operators
+        Examples:
+            "coffee AND brewing" -> "coffee & brewing"
+            "(pour OR french) AND press" -> "(pour | french) & press"
+            "coffee NOT decaf" -> "coffee & !decaf"
+        """
+        # Replace Boolean operators with tsquery operators
+        # Keep parentheses for grouping
+        result = query
+        result = re.sub(r"\bAND\b", "&", result)
+        result = re.sub(r"\bOR\b", "|", result)
+        # NOT must be converted to "& !" and the ! must be attached to the following term
+        # "Python NOT Django" -> "Python & !Django"
+        result = re.sub(r"\bNOT\s+", "& !", result)
+        return result
+    def _prepare_single_term(self, term: str, is_prefix: bool = True) -> str:
+        """Prepare a single search term for tsquery.
+        Args:
+            term: A single search term
+            is_prefix: Whether to add prefix search capability (:* suffix)
+        Returns:
+            A properly formatted single term for tsquery
+        For Postgres tsquery:
+        - Multi-word queries become "word1 & word2"
+        - Prefix matching uses ":*" suffix (e.g., "coff:*")
+        - Special characters that need escaping: & | ! ( ) :
+        """
+        if not term or not term.strip():
+            return term
+        term = term.strip()
+        # Check if term is already a wildcard pattern
+        if "*" in term:
+            # Replace * with :* for Postgres prefix matching
+            return term.replace("*", ":*")
+        # Remove tsquery special characters from the search term
+        # These characters have special meaning in tsquery and cause syntax errors
+        # if not used as operators
+        special_chars = ["&", "|", "!", "(", ")", ":"]
+        cleaned_term = term
+        for char in special_chars:
+            cleaned_term = cleaned_term.replace(char, " ")
+        # Handle multi-word queries
+        if " " in cleaned_term:
+            words = [w for w in cleaned_term.split() if w.strip()]
+            if not words:
+                # All characters were special chars, search won't match anything
+                # Return a safe search term that won't cause syntax errors
+                return "NOSPECIALCHARS:*"
+            if is_prefix:
+                # Add prefix matching to each word
+                prepared_words = [f"{word}:*" for word in words]
+            else:
+                prepared_words = words
+            # Join with AND operator
+            return " & ".join(prepared_words)
+        # Single word
+        cleaned_term = cleaned_term.strip()
+        if is_prefix:
+            return f"{cleaned_term}:*"
+        else:
+            return cleaned_term
+    async def search(
+        self,
+        search_text: Optional[str] = None,
+        permalink: Optional[str] = None,
+        permalink_match: Optional[str] = None,
+        title: Optional[str] = None,
+        types: Optional[List[str]] = None,
+        after_date: Optional[datetime] = None,
+        search_item_types: Optional[List[SearchItemType]] = None,
+        limit: int = 10,
+        offset: int = 0,
+    ) -> List[SearchIndexRow]:
+        """Search across all indexed content using PostgreSQL tsvector."""
+        conditions = []
+        params = {}
+        order_by_clause = ""
+        # Handle text search for title and content using tsvector
+        if search_text:
+            if search_text.strip() == "*" or search_text.strip() == "":
+                # For wildcard searches, don't add any text conditions
+                pass
+            else:
+                # Prepare search term for tsquery
+                processed_text = self._prepare_search_term(search_text.strip())
+                params["text"] = processed_text
+                # Use @@ operator for tsvector matching
+                conditions.append("textsearchable_index_col @@ to_tsquery('english', :text)")
+        # Handle title search
+        if title:
+            title_text = self._prepare_search_term(title.strip(), is_prefix=False)
+            params["title_text"] = title_text
+            conditions.append("to_tsvector('english', title) @@ to_tsquery('english', :title_text)")
+        # Handle permalink exact search
+        if permalink:
+            params["permalink"] = permalink
+            conditions.append("permalink = :permalink")
+        # Handle permalink pattern match
+        if permalink_match:
+            permalink_text = permalink_match.lower().strip()
+            params["permalink"] = permalink_text
+            if "*" in permalink_match:
+                # Use LIKE for pattern matching in Postgres
+                # Convert * to % for SQL LIKE
+                permalink_pattern = permalink_text.replace("*", "%")
+                params["permalink"] = permalink_pattern
+                conditions.append("permalink LIKE :permalink")
+            else:
+                conditions.append("permalink = :permalink")
+        # Handle search item type filter
+        if search_item_types:
+            type_list = ", ".join(f"'{t.value}'" for t in search_item_types)
+            conditions.append(f"type IN ({type_list})")
+        # Handle entity type filter using JSONB containment
+        if types:
+            # Use JSONB @> operator for efficient containment queries
+            type_conditions = []
+            for entity_type in types:
+                # Create JSONB containment condition for each type
+                type_conditions.append(f'metadata @> \'{{"entity_type": "{entity_type}"}}\'')
+            conditions.append(f"({' OR '.join(type_conditions)})")
+        # Handle date filter
+        if after_date:
+            params["after_date"] = after_date
+            conditions.append("created_at > :after_date")
+            # order by most recent first
+            order_by_clause = ", updated_at DESC"
+        # Always filter by project_id
+        params["project_id"] = self.project_id
+        conditions.append("project_id = :project_id")
+        # set limit and offset
+        params["limit"] = limit
+        params["offset"] = offset
+        # Build WHERE clause
+        where_clause = " AND ".join(conditions) if conditions else "1=1"
+        # Build SQL with ts_rank() for scoring
+        # Note: If no text search, score will be NULL, so we use COALESCE to default to 0
+        if search_text and search_text.strip() and search_text.strip() != "*":
+            score_expr = "ts_rank(textsearchable_index_col, to_tsquery('english', :text))"
+        else:
+            score_expr = "0"
+        sql = f"""
+            SELECT
+                project_id,
+                id,
+                title,
+                permalink,
+                file_path,
+                type,
+                metadata,
+                from_id,
+                to_id,
+                relation_type,
+                entity_id,
+                content_snippet,
+                category,
+                created_at,
+                updated_at,
+                {score_expr} as score
+            FROM search_index
+            WHERE {where_clause}
+            ORDER BY score DESC, id ASC {order_by_clause}
+            LIMIT :limit
+            OFFSET :offset
+        """
+        logger.trace(f"Search {sql} params: {params}")
+        try:
+            async with db.scoped_session(self.session_maker) as session:
+                result = await session.execute(text(sql), params)
+                rows = result.fetchall()
+        except Exception as e:
+            # Handle tsquery syntax errors (and only those).
+            #
+            # Important: Postgres errors for other failures (e.g. missing table) will still mention
+            # `to_tsquery(...)` in the SQL text, so checking for the substring "tsquery" is too broad.
+            msg = str(e).lower()
+            if (
+                "syntax error in tsquery" in msg
+                or "invalid input syntax for type tsquery" in msg
+                or "no operand in tsquery" in msg
+                or "no operator in tsquery" in msg
+            ):
+                logger.warning(f"tsquery syntax error for search term: {search_text}, error: {e}")
+                return []
+            # Re-raise other database errors
+            logger.error(f"Database error during search: {e}")
+            raise
+        results = [
+            SearchIndexRow(
+                project_id=self.project_id,
+                id=row.id,
+                title=row.title,
+                permalink=row.permalink,
+                file_path=row.file_path,
+                type=row.type,
+                score=float(row.score) if row.score else 0.0,
+                metadata=(
+                    row.metadata
+                    if isinstance(row.metadata, dict)
+                    else (json.loads(row.metadata) if row.metadata else {})
+                ),
+                from_id=row.from_id,
+                to_id=row.to_id,
+                relation_type=row.relation_type,
+                entity_id=row.entity_id,
+                content_snippet=row.content_snippet,
+                category=row.category,
+                created_at=row.created_at,
+                updated_at=row.updated_at,
+            )
+            for row in rows
+        ]
+        logger.trace(f"Found {len(results)} search results")
+        for r in results:
+            logger.trace(
+                f"Search result: project_id: {r.project_id} type:{r.type} title: {r.title} permalink: {r.permalink} score: {r.score}"
+            )
+        return results
+    async def bulk_index_items(self, search_index_rows: List[SearchIndexRow]) -> None:
+        """Index multiple items in a single batch operation using UPSERT.
+        Runs the same INSERT ... ON CONFLICT statement as index_item, once per
+        row, by passing a list of parameter dictionaries to a single execute
+        call, followed by one commit. The partial unique index
+        uix_search_index_permalink_project on (permalink, project_id)
+        WHERE permalink IS NOT NULL is the conflict target.
+        For rows with non-null permalinks (entities), conflicts are resolved by
+        updating the existing row. For rows with null permalinks (observations,
+        relations), the partial index doesn't apply and they are inserted directly.
+        Args:
+            search_index_rows: List of SearchIndexRow objects to index. An empty
+                list returns immediately without opening a session.
+        """
+        if not search_index_rows:
+            return
+        async with db.scoped_session(self.session_maker) as session:
+            # Raw text() SQL receives JSON fields as strings; the metadata value
+            # is therefore serialized by the row before it is bound.
+            insert_data_list = []
+            for row in search_index_rows:
+                insert_data = row.to_insert(serialize_json=True)
+                # Every row is stored under this repository's project
+                insert_data["project_id"] = self.project_id
+                insert_data_list.append(insert_data)
+            # Use upsert to handle race conditions during parallel indexing
+            # ON CONFLICT (permalink, project_id) matches the partial unique index
+            # uix_search_index_permalink_project WHERE permalink IS NOT NULL
+            # For rows with NULL permalinks (observations, relations), no conflict occurs
+            await session.execute(
+                text("""
+                    INSERT INTO search_index (
+                        id, title, content_stems, content_snippet, permalink, file_path, type, metadata,
+                        from_id, to_id, relation_type,
+                        entity_id, category,
+                        created_at, updated_at,
+                        project_id
+                    ) VALUES (
+                        :id, :title, :content_stems, :content_snippet, :permalink, :file_path, :type, :metadata,
+                        :from_id, :to_id, :relation_type,
+                        :entity_id, :category,
+                        :created_at, :updated_at,
+                        :project_id
+                    )
+                    ON CONFLICT (permalink, project_id) WHERE permalink IS NOT NULL DO UPDATE SET
+                        id = EXCLUDED.id,
+                        title = EXCLUDED.title,
+                        content_stems = EXCLUDED.content_stems,
+                        content_snippet = EXCLUDED.content_snippet,
+                        file_path = EXCLUDED.file_path,
+                        type = EXCLUDED.type,
+                        metadata = EXCLUDED.metadata,
+                        from_id = EXCLUDED.from_id,
+                        to_id = EXCLUDED.to_id,
+                        relation_type = EXCLUDED.relation_type,
+                        entity_id = EXCLUDED.entity_id,
+                        category = EXCLUDED.category,
+                        created_at = EXCLUDED.created_at,
+                        updated_at = EXCLUDED.updated_at
+                """),
+                insert_data_list,
+            )
+            # Logged after the batch succeeds but before the commit below
+            logger.debug(f"Bulk indexed {len(search_index_rows)} rows")
+            await session.commit()

basic_memory/repository/project_info_repository.py ADDED Viewed

@@ -0,0 +1,10 @@
+from basic_memory.repository.repository import Repository
+from basic_memory.models.project import Project
+class ProjectInfoRepository(Repository):
+    """Repository for statistics queries."""
+    def __init__(self, session_maker):
+        # Initialize with Project model as a reference
+        super().__init__(session_maker, Project)

basic_memory/repository/project_repository.py ADDED Viewed

@@ -0,0 +1,140 @@
+"""Repository for managing projects in Basic Memory."""
+from pathlib import Path
+from typing import Optional, Sequence, Union
+from sqlalchemy import text
+from sqlalchemy.ext.asyncio import AsyncSession, async_sessionmaker
+from basic_memory import db
+from basic_memory.models.project import Project
+from basic_memory.repository.repository import Repository
+class ProjectRepository(Repository[Project]):
+    """Repository for Project model.
+    Projects represent collections of knowledge entities grouped together.
+    Each entity, observation, and relation belongs to a specific project.
+    """
+    def __init__(self, session_maker: async_sessionmaker[AsyncSession]):
+        """Initialize with session maker."""
+        super().__init__(session_maker, Project)
+    async def get_by_name(self, name: str) -> Optional[Project]:
+        """Get project by name (exact match).
+        Args:
+            name: Unique name of the project
+        """
+        query = self.select().where(Project.name == name)
+        return await self.find_one(query)
+    async def get_by_name_case_insensitive(self, name: str) -> Optional[Project]:
+        """Get project by name (case-insensitive match).
+        Args:
+            name: Project name (case-insensitive)
+        Returns:
+            Project if found, None otherwise
+        """
+        query = self.select().where(Project.name.ilike(name))
+        return await self.find_one(query)
+    async def get_by_permalink(self, permalink: str) -> Optional[Project]:
+        """Get project by permalink.
+        Args:
+            permalink: URL-friendly identifier for the project
+        """
+        query = self.select().where(Project.permalink == permalink)
+        return await self.find_one(query)
+    async def get_by_path(self, path: Union[Path, str]) -> Optional[Project]:
+        """Get project by filesystem path.
+        Args:
+            path: Path to the project directory (will be converted to string internally)
+        """
+        query = self.select().where(Project.path == Path(path).as_posix())
+        return await self.find_one(query)
+    async def get_by_id(self, project_id: int) -> Optional[Project]:
+        """Get project by numeric ID.
+        Args:
+            project_id: Numeric project ID
+        Returns:
+            Project if found, None otherwise
+        """
+        async with db.scoped_session(self.session_maker) as session:
+            return await self.select_by_id(session, project_id)
+    async def get_by_external_id(self, external_id: str) -> Optional[Project]:
+        """Get project by external UUID.
+        Args:
+            external_id: External UUID identifier
+        Returns:
+            Project if found, None otherwise
+        """
+        query = self.select().where(Project.external_id == external_id)
+        return await self.find_one(query)
+    async def get_default_project(self) -> Optional[Project]:
+        """Get the default project (the one marked as is_default=True)."""
+        query = self.select().where(Project.is_default.is_not(None))
+        return await self.find_one(query)
+    async def get_active_projects(self) -> Sequence[Project]:
+        """Get all active projects."""
+        query = self.select().where(Project.is_active == True)  # noqa: E712
+        result = await self.execute_query(query)
+        return list(result.scalars().all())
+    async def set_as_default(self, project_id: int) -> Optional[Project]:
+        """Set a project as the default and unset previous default.
+        Args:
+            project_id: ID of the project to set as default
+        Returns:
+            The updated project if found, None otherwise
+        """
+        async with db.scoped_session(self.session_maker) as session:
+            # First, clear the default flag for all projects using direct SQL
+            await session.execute(
+                text("UPDATE project SET is_default = NULL WHERE is_default IS NOT NULL")
+            )
+            await session.flush()
+            # Set the new default project
+            target_project = await self.select_by_id(session, project_id)
+            if target_project:
+                target_project.is_default = True
+                await session.flush()
+                return target_project
+            return None  # pragma: no cover
+    async def update_path(self, project_id: int, new_path: str) -> Optional[Project]:
+        """Update project path.
+        Args:
+            project_id: ID of the project to update
+            new_path: New filesystem path for the project
+        Returns:
+            The updated project if found, None otherwise
+        """
+        async with db.scoped_session(self.session_maker) as session:
+            project = await self.select_by_id(session, project_id)
+            if project:
+                project.path = new_path
+                await session.flush()
+                return project
+            return None

basic-memory 0.7.0__py3-none-any.whl → 0.17.4__py3-none-any.whl

Potentially problematic release.

basic-memory 0.7.0__py3-none-any.whl → 0.17.4__py3-none-any.whl