PyPI - gnosisllm-knowledge - Versions diffs - 0.2.0__py3-none-any.whl → 0.3.0__py3-none-any.whl - Mend

gnosisllm-knowledge 0.2.0__py3-none-any.whl → 0.3.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (44)

gnosisllm_knowledge/__init__.py +91 -39
gnosisllm_knowledge/api/__init__.py +3 -2
gnosisllm_knowledge/api/knowledge.py +287 -7
gnosisllm_knowledge/api/memory.py +966 -0
gnosisllm_knowledge/backends/__init__.py +14 -5
gnosisllm_knowledge/backends/opensearch/agentic.py +341 -39
gnosisllm_knowledge/backends/opensearch/config.py +49 -28
gnosisllm_knowledge/backends/opensearch/indexer.py +1 -0
gnosisllm_knowledge/backends/opensearch/mappings.py +2 -1
gnosisllm_knowledge/backends/opensearch/memory/__init__.py +12 -0
gnosisllm_knowledge/backends/opensearch/memory/client.py +1380 -0
gnosisllm_knowledge/backends/opensearch/memory/config.py +127 -0
gnosisllm_knowledge/backends/opensearch/memory/setup.py +322 -0
gnosisllm_knowledge/backends/opensearch/searcher.py +235 -0
gnosisllm_knowledge/backends/opensearch/setup.py +308 -148
gnosisllm_knowledge/cli/app.py +378 -12
gnosisllm_knowledge/cli/commands/agentic.py +11 -0
gnosisllm_knowledge/cli/commands/memory.py +723 -0
gnosisllm_knowledge/cli/commands/setup.py +24 -22
gnosisllm_knowledge/cli/display/service.py +43 -0
gnosisllm_knowledge/cli/utils/config.py +58 -0
gnosisllm_knowledge/core/domain/__init__.py +41 -0
gnosisllm_knowledge/core/domain/document.py +5 -0
gnosisllm_knowledge/core/domain/memory.py +440 -0
gnosisllm_knowledge/core/domain/result.py +11 -3
gnosisllm_knowledge/core/domain/search.py +2 -0
gnosisllm_knowledge/core/events/types.py +76 -0
gnosisllm_knowledge/core/exceptions.py +134 -0
gnosisllm_knowledge/core/interfaces/__init__.py +17 -0
gnosisllm_knowledge/core/interfaces/memory.py +524 -0
gnosisllm_knowledge/core/interfaces/streaming.py +127 -0
gnosisllm_knowledge/core/streaming/__init__.py +36 -0
gnosisllm_knowledge/core/streaming/pipeline.py +228 -0
gnosisllm_knowledge/loaders/base.py +3 -4
gnosisllm_knowledge/loaders/sitemap.py +129 -1
gnosisllm_knowledge/loaders/sitemap_streaming.py +258 -0
gnosisllm_knowledge/services/indexing.py +67 -75
gnosisllm_knowledge/services/search.py +47 -11
gnosisllm_knowledge/services/streaming_pipeline.py +302 -0
{gnosisllm_knowledge-0.2.0.dist-info → gnosisllm_knowledge-0.3.0.dist-info}/METADATA +44 -1
gnosisllm_knowledge-0.3.0.dist-info/RECORD +77 -0
gnosisllm_knowledge-0.2.0.dist-info/RECORD +0 -64
{gnosisllm_knowledge-0.2.0.dist-info → gnosisllm_knowledge-0.3.0.dist-info}/WHEEL +0 -0
{gnosisllm_knowledge-0.2.0.dist-info → gnosisllm_knowledge-0.3.0.dist-info}/entry_points.txt +0 -0

gnosisllm_knowledge/cli/commands/setup.py CHANGED Viewed

@@ -26,12 +26,12 @@ if TYPE_CHECKING:
 async def setup_command(
     display: RichDisplayService,
-    host: str = "localhost",
-    port: int = 9200,
+    host: str | None = None,
+    port: int | None = None,
     username: str | None = None,
     password: str | None = None,
-    use_ssl: bool = False,
-    verify_certs: bool = False,
+    use_ssl: bool | None = None,
+    verify_certs: bool | None = None,
     force: bool = False,
     no_sample_data: bool = False,
     no_hybrid: bool = False,
@@ -40,24 +40,26 @@ async def setup_command(
     Args:
         display: Display service for output.
-        host: OpenSearch host.
-        port: OpenSearch port.
-        username: OpenSearch username.
-        password: OpenSearch password.
-        use_ssl: Enable SSL.
-        verify_certs: Verify SSL certificates.
+        host: OpenSearch host (overrides env).
+        port: OpenSearch port (overrides env).
+        username: OpenSearch username (overrides env).
+        password: OpenSearch password (overrides env).
+        use_ssl: Enable SSL (overrides env).
+        verify_certs: Verify SSL certificates (overrides env).
         force: Clean up existing resources first.
         no_sample_data: Skip sample data ingestion.
         no_hybrid: Skip hybrid search pipeline.
     """
-    # Load configuration
+    # Load configuration from environment
     cli_config = CliConfig.from_env()
-    # Override with CLI arguments
-    final_host = host or cli_config.opensearch_host
-    final_port = port or cli_config.opensearch_port
-    final_username = username or cli_config.opensearch_username
-    final_password = password or cli_config.opensearch_password
+    # CLI arguments override environment variables (only if explicitly provided)
+    final_host = host if host is not None else cli_config.opensearch_host
+    final_port = port if port is not None else cli_config.opensearch_port
+    final_username = username if username is not None else cli_config.opensearch_username
+    final_password = password if password is not None else cli_config.opensearch_password
+    final_use_ssl = use_ssl if use_ssl is not None else cli_config.opensearch_use_ssl
+    final_verify_certs = verify_certs if verify_certs is not None else cli_config.opensearch_verify_certs
     # Validate required config
     if not cli_config.openai_api_key:
@@ -79,7 +81,7 @@ async def setup_command(
         "Configuration",
         [
             ("Host", f"{final_host}:{final_port}"),
-            ("SSL", "Enabled" if use_ssl else "Disabled"),
+            ("SSL", "Enabled" if final_use_ssl else "Disabled"),
             ("Auth", "Configured" if final_username else "None"),
             ("Hybrid Search", "Disabled" if no_hybrid else "Enabled"),
             ("Force Recreate", "Yes" if force else "No"),
@@ -94,8 +96,8 @@ async def setup_command(
         port=final_port,
         username=final_username,
         password=final_password,
-        use_ssl=use_ssl,
-        verify_certs=verify_certs,
+        use_ssl=final_use_ssl,
+        verify_certs=final_verify_certs,
         openai_api_key=cli_config.openai_api_key,
         embedding_model=cli_config.openai_embedding_model,
         embedding_dimension=cli_config.openai_embedding_dimension,
@@ -109,8 +111,8 @@ async def setup_command(
     client = AsyncOpenSearch(
         hosts=[{"host": final_host, "port": final_port}],
         http_auth=http_auth,
-        use_ssl=use_ssl,
-        verify_certs=verify_certs,
+        use_ssl=final_use_ssl,
+        verify_certs=final_verify_certs,
         ssl_show_warn=False,
     )
@@ -124,7 +126,7 @@ async def setup_command(
             display.format_error_with_suggestion(
                 error=f"Cannot connect to OpenSearch at {final_host}:{final_port}",
                 suggestion="Ensure OpenSearch is running and accessible.",
-                command=f"curl http{'s' if use_ssl else ''}://{final_host}:{final_port}",
+                command=f"curl http{'s' if final_use_ssl else ''}://{final_host}:{final_port}",
             )
             sys.exit(1)

gnosisllm_knowledge/cli/display/service.py CHANGED Viewed

@@ -553,3 +553,46 @@ class RichDisplayService:
                 suggestion="Run agentic setup to create agents.",
                 command="gnosisllm-knowledge agentic setup",
             )
+    def memory_status(
+        self,
+        llm_model_id: str | None,
+        embedding_model_id: str | None,
+        llm_model: str = "gpt-4o",
+        embedding_model: str = "text-embedding-3-small",
+    ) -> None:
+        """Display agentic memory configuration status.
+        Args:
+            llm_model_id: LLM model ID if configured.
+            embedding_model_id: Embedding model ID if configured.
+            llm_model: LLM model name for fact extraction.
+            embedding_model: Embedding model name.
+        """
+        status_rows = []
+        # LLM Model
+        if llm_model_id:
+            status_rows.append(("LLM Model", "[green]Configured[/green]"))
+            status_rows.append(("  ID", f"[dim]{llm_model_id}[/dim]"))
+            status_rows.append(("  Model", llm_model))
+        else:
+            status_rows.append(("LLM Model", "[red]Not configured[/red]"))
+        # Embedding Model
+        if embedding_model_id:
+            status_rows.append(("Embedding Model", "[green]Configured[/green]"))
+            status_rows.append(("  ID", f"[dim]{embedding_model_id}[/dim]"))
+            status_rows.append(("  Model", embedding_model))
+        else:
+            status_rows.append(("Embedding Model", "[red]Not configured[/red]"))
+        self.table("Agentic Memory Configuration", status_rows)
+        if not llm_model_id or not embedding_model_id:
+            self.newline()
+            self.format_error_with_suggestion(
+                error="Memory models not configured.",
+                suggestion="Run memory setup to create connectors and models.",
+                command="gnosisllm-knowledge memory setup --openai-key sk-...",
+            )

gnosisllm_knowledge/cli/utils/config.py CHANGED Viewed

@@ -42,6 +42,13 @@ class CliConfig:
     agentic_max_iterations: int = 5
     agentic_timeout_seconds: int = 60
+    # Agentic Memory
+    memory_llm_model_id: str | None = None
+    memory_embedding_model_id: str | None = None
+    memory_llm_model: str = "gpt-4o"
+    memory_embedding_model: str = "text-embedding-3-small"
+    memory_embedding_dimension: int = 1536
     # Neoreader
     neoreader_host: str = "https://api.neoreader.dev"
@@ -86,6 +93,12 @@ class CliConfig:
             agentic_llm_model=os.getenv("AGENTIC_LLM_MODEL", "gpt-4o"),
             agentic_max_iterations=int(os.getenv("AGENTIC_MAX_ITERATIONS", "5")),
             agentic_timeout_seconds=int(os.getenv("AGENTIC_TIMEOUT_SECONDS", "60")),
+            # Agentic Memory configuration
+            memory_llm_model_id=os.getenv("OPENSEARCH_MEMORY_LLM_MODEL_ID"),
+            memory_embedding_model_id=os.getenv("OPENSEARCH_MEMORY_EMBEDDING_MODEL_ID"),
+            memory_llm_model=os.getenv("MEMORY_LLM_MODEL", "gpt-4o"),
+            memory_embedding_model=os.getenv("MEMORY_EMBEDDING_MODEL", "text-embedding-3-small"),
+            memory_embedding_dimension=int(os.getenv("MEMORY_EMBEDDING_DIMENSION", "1536")),
             neoreader_host=os.getenv("NEOREADER_HOST", "https://api.neoreader.dev"),
         )
@@ -205,3 +218,48 @@ class CliConfig:
     def has_conversational_agent(self) -> bool:
         """Check if conversational agent is configured."""
         return bool(self.opensearch_conversational_agent_id)
+    # === Memory Configuration ===
+    def validate_for_memory(self) -> list[str]:
+        """Validate configuration for memory commands.
+        Returns:
+            List of validation errors (empty if valid).
+        """
+        errors = []
+        if not self.memory_llm_model_id:
+            errors.append(
+                "OPENSEARCH_MEMORY_LLM_MODEL_ID is required for memory operations. "
+                "Run 'gnosisllm-knowledge memory setup' first."
+            )
+        if not self.memory_embedding_model_id:
+            errors.append(
+                "OPENSEARCH_MEMORY_EMBEDDING_MODEL_ID is required for memory operations. "
+                "Run 'gnosisllm-knowledge memory setup' first."
+            )
+        return errors
+    def validate_for_memory_setup(self) -> list[str]:
+        """Validate configuration for memory setup command.
+        Returns:
+            List of validation errors (empty if valid).
+        """
+        errors = []
+        if not self.openai_api_key:
+            errors.append(
+                "OPENAI_API_KEY is required for memory setup. "
+                "Use --openai-key or set the environment variable."
+            )
+        return errors
+    @property
+    def has_memory_models(self) -> bool:
+        """Check if memory models are configured."""
+        return bool(self.memory_llm_model_id and self.memory_embedding_model_id)
+    @property
+    def memory_is_configured(self) -> bool:
+        """Check if memory is fully configured for operations."""
+        return self.has_memory_models

gnosisllm_knowledge/core/domain/__init__.py CHANGED Viewed

@@ -1,6 +1,27 @@
 """Domain models - Value objects and entities."""
 from gnosisllm_knowledge.core.domain.document import Document, DocumentStatus, TextChunk
+from gnosisllm_knowledge.core.domain.memory import (
+    ContainerConfig,
+    ContainerIndexSettings,
+    ContainerInfo,
+    EmbeddingModelType,
+    HistoryAction,
+    HistoryEntry,
+    IndexSettings,
+    MemoryEntry,
+    MemoryStats,
+    MemoryStrategy,
+    MemoryType,
+    Message,
+    Namespace,
+    PayloadType,
+    RecallResult,
+    SessionInfo,
+    StoreRequest,
+    StoreResult,
+    StrategyConfig,
+)
 from gnosisllm_knowledge.core.domain.result import (
     BatchResult,
     IndexResult,
@@ -24,6 +45,26 @@ __all__ = [
     "Document",
     "DocumentStatus",
     "TextChunk",
+    # Memory
+    "MemoryStrategy",
+    "MemoryType",
+    "PayloadType",
+    "EmbeddingModelType",
+    "HistoryAction",
+    "StrategyConfig",
+    "IndexSettings",
+    "ContainerIndexSettings",
+    "ContainerConfig",
+    "ContainerInfo",
+    "Message",
+    "Namespace",
+    "StoreRequest",
+    "StoreResult",
+    "MemoryEntry",
+    "RecallResult",
+    "SessionInfo",
+    "HistoryEntry",
+    "MemoryStats",
     # Result
     "LoadResult",
     "IndexResult",

gnosisllm_knowledge/core/domain/document.py CHANGED Viewed

@@ -73,6 +73,7 @@ class Document:
     # Multi-tenancy fields
     account_id: str | None = None
     collection_id: str | None = None
+    collection_name: str | None = None  # For display in aggregations
     source_id: str | None = None
     # Chunking info
@@ -140,6 +141,7 @@ class Document:
             metadata=self.metadata.copy(),
             account_id=self.account_id,
             collection_id=self.collection_id,
+            collection_name=self.collection_name,
             source_id=self.source_id,
             chunk_index=chunk_index,
             total_chunks=total_chunks,
@@ -156,6 +158,7 @@ class Document:
         self,
         account_id: str,
         collection_id: str | None = None,
+        collection_name: str | None = None,
         source_id: str | None = None,
     ) -> Document:
         """Create a new document with tenant information.
@@ -163,6 +166,7 @@ class Document:
         Args:
             account_id: Account/tenant identifier.
             collection_id: Collection identifier.
+            collection_name: Collection name for display.
             source_id: Source identifier.
         Returns:
@@ -177,6 +181,7 @@ class Document:
             metadata=self.metadata.copy(),
             account_id=account_id,
             collection_id=collection_id or self.collection_id,
+            collection_name=collection_name or self.collection_name,
             source_id=source_id or self.source_id,
             chunk_index=self.chunk_index,
             total_chunks=self.total_chunks,

gnosisllm-knowledge 0.2.0__py3-none-any.whl → 0.3.0__py3-none-any.whl

gnosisllm-knowledge 0.2.0__py3-none-any.whl → 0.3.0__py3-none-any.whl