cognee 0.3.2__py3-none-any.whl → 0.3.3__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- cognee/api/v1/notebooks/routers/get_notebooks_router.py +2 -1
- cognee/infrastructure/databases/relational/sqlalchemy/SqlAlchemyAdapter.py +2 -2
- cognee/infrastructure/databases/vector/config.py +1 -1
- cognee/infrastructure/utils/run_async.py +9 -4
- cognee/infrastructure/utils/run_sync.py +4 -3
- cognee/modules/notebooks/methods/create_tutorial_notebook.py +92 -0
- cognee/modules/notebooks/methods/get_notebook.py +2 -2
- cognee/modules/notebooks/methods/update_notebook.py +0 -1
- cognee/modules/notebooks/operations/run_in_local_sandbox.py +8 -5
- cognee/modules/retrieval/graph_completion_context_extension_retriever.py +1 -1
- cognee/modules/retrieval/graph_completion_cot_retriever.py +1 -1
- cognee/modules/retrieval/graph_completion_retriever.py +1 -1
- cognee/modules/retrieval/temporal_retriever.py +1 -1
- cognee/modules/retrieval/user_qa_feedback.py +1 -1
- cognee/modules/search/utils/prepare_search_result.py +4 -4
- {cognee-0.3.2.dist-info → cognee-0.3.3.dist-info}/METADATA +1 -1
- {cognee-0.3.2.dist-info → cognee-0.3.3.dist-info}/RECORD +21 -22
- cognee-0.3.3.dist-info/entry_points.txt +2 -0
- cognee/api/v1/save/save.py +0 -335
- cognee/tests/test_save_export_path.py +0 -116
- cognee-0.3.2.dist-info/entry_points.txt +0 -2
- {cognee-0.3.2.dist-info → cognee-0.3.3.dist-info}/WHEEL +0 -0
- {cognee-0.3.2.dist-info → cognee-0.3.3.dist-info}/licenses/LICENSE +0 -0
- {cognee-0.3.2.dist-info → cognee-0.3.3.dist-info}/licenses/NOTICE.md +0 -0
cognee/api/v1/notebooks/routers/get_notebooks_router.py

@@ -31,7 +31,8 @@ def get_notebooks_router():
 
     @router.get("")
     async def get_notebooks_endpoint(user: User = Depends(get_authenticated_user)):
-
+        async with get_async_session() as session:
+            return await get_notebooks(user.id, session)
 
     @router.post("")
     async def create_notebook_endpoint(
cognee/infrastructure/databases/vector/config.py

@@ -39,7 +39,7 @@ class VectorConfig(BaseSettings):
             values.vector_db_url = ensure_absolute_path(
                 values.vector_db_url,
             )
-
+        elif not values.vector_db_url:
             # Default path
             databases_directory_path = os.path.join(base_config.system_root_directory, "databases")
             values.vector_db_url = os.path.join(databases_directory_path, "cognee.lancedb")
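When no URL is configured, the new `elif` branch defaults the vector store to `<system_root_directory>/databases/cognee.lancedb`. A minimal sketch of overriding that default, assuming the `vector_db_url` field follows the usual pydantic-settings mapping to a `VECTOR_DB_URL` environment variable (an assumption; the variable name is not shown in this diff):

```python
import os

# Hypothetical override: point cognee's LanceDB file at a custom location
# before any cognee settings objects are created.
os.environ["VECTOR_DB_URL"] = "/srv/cognee/databases/my_project.lancedb"

import cognee  # noqa: E402  # imported only after the environment variable is set
```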
cognee/infrastructure/utils/run_async.py

@@ -1,13 +1,18 @@
 import asyncio
 from functools import partial
+import inspect
 
 
 async def run_async(func, *args, loop=None, executor=None, **kwargs):
     if loop is None:
         try:
-
+            loop = asyncio.get_running_loop()
         except RuntimeError:
-
+            loop = asyncio.get_event_loop()
 
-
-
+    if "loop" in inspect.signature(func).parameters:
+        pfunc = partial(func, *args, loop=loop, **kwargs)
+    else:
+        pfunc = partial(func, *args, **kwargs)
+
+    return await loop.run_in_executor(executor, pfunc)
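A minimal usage sketch of the reworked helper, assuming cognee 0.3.3 is installed; `blocking_work` is a hypothetical callable. Because its signature declares a `loop` parameter, `run_async` now injects the running loop before dispatching the call to the executor:

```python
import asyncio

from cognee.infrastructure.utils.run_async import run_async


def blocking_work(x, loop=None):
    # Runs on an executor thread; `loop` is injected because the signature
    # declares it, so the callee can schedule work back onto that loop.
    return x * 2, loop is not None


async def main():
    doubled, received_loop = await run_async(blocking_work, 21)
    print(doubled, received_loop)  # 42 True


asyncio.run(main())
```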
cognee/infrastructure/utils/run_sync.py

@@ -2,16 +2,17 @@ import asyncio
 import threading
 
 
-def run_sync(coro, timeout=None):
+def run_sync(coro, running_loop=None, timeout=None):
     result = None
     exception = None
 
     def runner():
-        nonlocal result, exception
+        nonlocal result, exception, running_loop
 
         try:
             try:
-
+                if not running_loop:
+                    running_loop = asyncio.get_running_loop()
 
                 result = asyncio.run_coroutine_threadsafe(coro, running_loop).result(timeout)
             except RuntimeError:
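A sketch of the new `running_loop` parameter in use, again assuming cognee 0.3.3. The caller is synchronous code on a worker thread; passing the loop explicitly lets `run_sync` schedule the coroutine onto the already running loop instead of trying to discover one from inside its runner thread:

```python
import asyncio

from cognee.infrastructure.utils.run_sync import run_sync


async def fetch_value():
    await asyncio.sleep(0.1)
    return 42


async def main():
    loop = asyncio.get_running_loop()

    def worker():
        # Plain synchronous code; the coroutine executes on `loop`, which keeps
        # running because this worker sits on its own thread.
        return run_sync(fetch_value(), loop, timeout=5)

    print(await asyncio.to_thread(worker))  # 42


asyncio.run(main())
```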
cognee/modules/notebooks/methods/create_tutorial_notebook.py

@@ -0,0 +1,92 @@
+
+from uuid import UUID, uuid4
+from sqlalchemy.ext.asyncio import AsyncSession
+
+from ..models import NotebookCell
+from .create_notebook import create_notebook
+
+
+async def create_tutorial_notebook(user_id: UUID, session: AsyncSession):
+    await create_notebook(
+        user_id=user_id,
+        notebook_name="Welcome to cognee 🧠",
+        cells=[
+            NotebookCell(
+                id=uuid4(),
+                name="Welcome",
+                content="Cognee is your toolkit for turning text into a structured knowledge graph, optionally enhanced by ontologies, and then querying it with advanced retrieval techniques. This notebook will guide you through a simple example.",
+                type="markdown",
+            ),
+            NotebookCell(
+                id=uuid4(),
+                name="Example",
+                content="",
+                type="markdown",
+            ),
+        ],
+        deletable=False,
+        session=session,
+    )
+
+    cell_content = [
+        """
+# Using Cognee with Python Development Data
+
+Unite authoritative Python practice (Guido van Rossum's own contributions!), normative guidance (Zen/PEP 8), and your lived context (rules + conversations) into one *AI memory* that produces answers that are relevant, explainable, and consistent.
+""",
+
+        """
+## What You'll Learn
+
+In this comprehensive tutorial, you'll discover how to transform scattered development data into an intelligent knowledge system that enhances your coding workflow. By the end, you'll have:
+- Connected disparate data sources (Guido's CPython contributions, mypy development, PEP discussions, your Python projects) into a unified AI memory graph
+- Built a memory layer that understands Python design philosophy, best-practice coding patterns, and your preferences and experience
+- Learned how to use intelligent search capabilities that combine the diverse context
+- Integrated everything with your coding environment through MCP (Model Context Protocol)
+
+This tutorial demonstrates the power of **knowledge graphs** and **retrieval-augmented generation (RAG)** for software development, showing you how to build systems that learn from Python's creator and improve your own Python development.
+""",
+
+        """
+## Cognee and its core operations
+
+Before we dive in, let's understand the core Cognee operations we'll be working with:
+- `cognee.add()` - Ingests raw data (files, text, APIs) into the system
+- `cognee.cognify()` - Processes and structures data into a knowledge graph using AI
+- `cognee.search()` - Queries the knowledge graph with natural language or Cypher
+- `cognee.memify()` - Cognee's \"secret sauce\" that infers implicit connections and rules from your data
+""",
+
+        """
+## Data used in this tutorial
+
+Cognee can ingest many types of sources. In this tutorial, we use a small, concrete set of files that cover different perspectives:
+- `guido_contributions.json` — Authoritative exemplars. Real PRs and commits from Guido van Rossum (mypy, CPython). These show how Python's creator solved problems and provide concrete anchors for patterns.
+- `pep_style_guide.md` — Norms. Encodes community style and typing conventions (PEP 8 and related). Ensures that search results and inferred rules align with widely accepted standards.
+- `zen_principles.md` — Philosophy. The Zen of Python. Grounds design trade-offs (simplicity, explicitness, readability) beyond syntax or mechanics.
+- `my_developer_rules.md` — Local constraints. Your house rules, conventions, and project-specific requirements (scope, privacy, Spec.md). Keeps recommendations relevant to your actual workflow.
+- `copilot_conversations.json` — Personal history. Transcripts of real assistant conversations, including your questions, code snippets, and discussion topics. Captures "how you code" and connects it to "how Guido codes."
+""",
+
+        """
+# Preliminaries
+
+To strike the balance between speed, cost, and quality, we recommend using OpenAI's `gpt-4o-mini` model; make sure your `.env` file contains this line:
+`
+LLM_MODEL="gpt-4o-mini"
+`
+""",
+
+        """
+import cognee
+
+result = await cognee.add(
+    "file://data/guido_contributions.json",
+    node_set=["guido_data"]
+)
+
+await cognee.cognify(temporal_cognify=True)
+
+results = await cognee.search("Show me commits")
+"""
+    ]
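Pulling the tutorial cells together, a slightly fuller sketch of the same add → cognify → search flow. It assumes cognee 0.3.3 with `LLM_MODEL` and API credentials configured in `.env`, the tutorial's data files on disk, and keyword names taken from the `search()` calls visible elsewhere in this diff:

```python
import asyncio

import cognee
from cognee.modules.search.types import SearchType


async def main():
    # Ingest one tutorial file into a tagged node set.
    await cognee.add("file://data/guido_contributions.json", node_set=["guido_data"])

    # Build the knowledge graph; temporal_cognify also extracts time information.
    await cognee.cognify(temporal_cognify=True)

    # Plain natural-language search, exactly as in the tutorial cell.
    print(await cognee.search("Show me commits"))

    # A typed search through one of the retrievers touched by this release.
    answers = await cognee.search(
        query_text="What did Guido change in mypy?",
        query_type=SearchType.GRAPH_COMPLETION,
        top_k=5,
    )
    for answer in answers:
        print(answer)


asyncio.run(main())
```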
cognee/modules/notebooks/methods/get_notebook.py

@@ -1,6 +1,6 @@
 from uuid import UUID
 from typing import Optional
-from sqlalchemy import select
+from sqlalchemy import and_, select
 from sqlalchemy.ext.asyncio import AsyncSession
 
 from cognee.infrastructure.databases.relational import with_async_session

@@ -15,7 +15,7 @@ async def get_notebook(
     session: AsyncSession,
 ) -> Optional[Notebook]:
     result = await session.execute(
-        select(Notebook).where(Notebook.owner_id == user_id
+        select(Notebook).where(and_(Notebook.owner_id == user_id, Notebook.id == notebook_id))
     )
 
     return result.scalar()
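The old query effectively filtered on the owner alone; the fixed one requires both the owner and the notebook id. A self-contained sketch of that filter shape with a hypothetical stand-in model (not cognee's actual `Notebook` class):

```python
from uuid import uuid4

from sqlalchemy import and_, select
from sqlalchemy.orm import DeclarativeBase, Mapped, mapped_column


class Base(DeclarativeBase):
    pass


class Notebook(Base):  # stand-in model, columns chosen to mirror the query
    __tablename__ = "notebooks"
    id: Mapped[str] = mapped_column(primary_key=True)
    owner_id: Mapped[str] = mapped_column()


user_id, notebook_id = str(uuid4()), str(uuid4())

# Both conditions are combined explicitly, as in the fixed query above.
stmt = select(Notebook).where(and_(Notebook.owner_id == user_id, Notebook.id == notebook_id))
print(stmt)
```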
cognee/modules/notebooks/operations/run_in_local_sandbox.py

@@ -5,16 +5,18 @@ import traceback
 
 def wrap_in_async_handler(user_code: str) -> str:
     return (
-        "
-        "
+        "import asyncio\n"
+        + "asyncio.set_event_loop(running_loop)\n\n"
+        + "from cognee.infrastructure.utils.run_sync import run_sync\n\n"
+        + "async def __user_main__():\n"
         + "\n".join("    " + line for line in user_code.strip().split("\n"))
         + "\n"
-        "    globals().update(locals())\n\n"
-        "run_sync(__user_main__())\n"
+        + "    globals().update(locals())\n\n"
+        + "run_sync(__user_main__(), running_loop)\n"
     )
 
 
-def run_in_local_sandbox(code, environment=None):
+def run_in_local_sandbox(code, environment=None, loop=None):
     environment = environment or {}
     code = wrap_in_async_handler(code.replace("\xa0", "\n"))
 

@@ -31,6 +33,7 @@ def run_in_local_sandbox(code, environment=None):
         printOutput.append(output)
 
     environment["print"] = customPrintFunction
+    environment["running_loop"] = loop
 
     try:
         exec(code, environment)
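These pieces fit together with the `run_async` change above: the router can run a notebook cell on an executor thread, and because `run_in_local_sandbox` now declares a `loop` parameter, the running loop is forwarded so that the wrapped `__user_main__()` coroutine is scheduled back onto it. A rough sketch, assuming cognee 0.3.3; what the call returns is not shown in this diff, and `print` output is captured by the sandbox's replacement print function:

```python
import asyncio

from cognee.infrastructure.utils.run_async import run_async
from cognee.modules.notebooks.operations.run_in_local_sandbox import run_in_local_sandbox


async def main():
    # Executed on a worker thread; the `loop` kwarg is injected automatically
    # because run_in_local_sandbox declares it, so awaits inside the user code
    # land back on this (still running) event loop.
    await run_async(run_in_local_sandbox, "result = 40 + 2\nprint(result)")


asyncio.run(main())
```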
cognee/modules/retrieval/graph_completion_context_extension_retriever.py

@@ -48,7 +48,7 @@ class GraphCompletionContextExtensionRetriever(GraphCompletionRetriever):
         query: str,
         context: Optional[List[Edge]] = None,
         context_extension_rounds=4,
-    ) -> str:
+    ) -> List[str]:
         """
         Extends the context for a given query by retrieving related triplets and generating new
         completions based on them.
cognee/modules/retrieval/temporal_retriever.py

@@ -136,7 +136,7 @@ class TemporalRetriever(GraphCompletionRetriever):
 
         return self.descriptions_to_string(top_k_events)
 
-    async def get_completion(self, query: str, context: Optional[str] = None) -> str:
+    async def get_completion(self, query: str, context: Optional[str] = None) -> List[str]:
         """Generates a response using the query and optional context."""
         if not context:
             context = await self.get_context(query=query)
cognee/modules/search/utils/prepare_search_result.py

@@ -6,7 +6,7 @@ from cognee.modules.search.utils.transform_context_to_graph import transform_context_to_graph
 
 
 async def prepare_search_result(search_result):
-
+    results, context, datasets = search_result
 
     graphs = None
     result_graph = None

@@ -30,11 +30,11 @@ async def prepare_search_result(search_result):
             "*": "\n".join(cast(List[str], context)),
         }
 
-    if isinstance(
-    result_graph = transform_context_to_graph(
+    if isinstance(results, List) and len(results) > 0 and isinstance(results[0], Edge):
+        result_graph = transform_context_to_graph(results)
 
     return {
-        "result": result_graph or
+        "result": result_graph or results[0] if len(results) == 1 else results,
         "graphs": graphs,
         "context": context_texts,
         "datasets": datasets,
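A pure-Python sketch (no cognee needed, stand-in values) of how that new `"result"` expression evaluates; because `or` binds tighter than the conditional expression, a single result is unwrapped while multiple results pass through as a list:

```python
result_graph = None

results = ["only answer"]
result = result_graph or results[0] if len(results) == 1 else results
print(result)  # only answer

results = ["first", "second"]
result = result_graph or results[0] if len(results) == 1 else results
print(result)  # ['first', 'second']
```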
{cognee-0.3.2.dist-info → cognee-0.3.3.dist-info}/METADATA

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: cognee
-Version: 0.3.2
+Version: 0.3.3
 Summary: Cognee - is a library for enriching LLM context with a semantic layer for better understanding and reasoning.
 Project-URL: Homepage, https://www.cognee.ai
 Project-URL: Repository, https://github.com/topoteretes/cognee
{cognee-0.3.2.dist-info → cognee-0.3.3.dist-info}/RECORD

@@ -41,7 +41,7 @@ cognee/api/v1/memify/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hS
 cognee/api/v1/memify/routers/__init__.py,sha256=Uv25PVGhfjnNi1NYWOmOLIlzaeTlyMYF9m7BEfdu45Q,49
 cognee/api/v1/memify/routers/get_memify_router.py,sha256=C1Cjt9D5TxhqBPmXZGNrCS4lJqPVXIJYgxZFtWVjZNs,4599
 cognee/api/v1/notebooks/routers/__init__.py,sha256=TvQz6caluaMoXNvjbE1p_C8savypgs8rAyP5lQ8jlpc,55
-cognee/api/v1/notebooks/routers/get_notebooks_router.py,sha256=
+cognee/api/v1/notebooks/routers/get_notebooks_router.py,sha256=m8OH3Kw1UHF8aTP4yNuSpv7gNThE4HxmLIrUnvECYGA,3484
 cognee/api/v1/permissions/routers/__init__.py,sha256=ljE3YnrzlMcVfThmkR5GSIxkm7sQVyibaLNtYQL4HO0,59
 cognee/api/v1/permissions/routers/get_permissions_router.py,sha256=tqd-J__UBlstTWnQocesdjVM9JnYO5rtJhhFj-Zv1_o,8316
 cognee/api/v1/prune/__init__.py,sha256=FEr5tTlX7wf3X4aFff6NPlVhNrPyqx7RBoJ71bJN1cY,25

@@ -53,7 +53,6 @@ cognee/api/v1/responses/models.py,sha256=MylzSnK-QB0kXe7nS-Mu4XRKZa-uBw8qP7Ke9On
 cognee/api/v1/responses/routers/__init__.py,sha256=X2qishwGRVFXawnvkZ5bv420PuPRLvknaFO2jdfiR10,122
 cognee/api/v1/responses/routers/default_tools.py,sha256=9qqzEZhrt3_YMKzUA06ke8P-2WeLXhYpKgVW6mLHlzw,3004
 cognee/api/v1/responses/routers/get_responses_router.py,sha256=ggbLhY9IXaInCgIs5TUuOCkFW64xmTKZQsc2ENq2Ocs,5979
-cognee/api/v1/save/save.py,sha256=xRthVNANIsrVJlLa5QKrdSiwCSckr7HBLmoeVJ_gEdE,12639
 cognee/api/v1/search/__init__.py,sha256=Sqw60DcOj4Bnvt-EWFknT31sPcvROIRKCWLr5pbkFr4,39
 cognee/api/v1/search/search.py,sha256=YQicNVi9q4FteAmt_EtY75I_EuNZ9ZjGE73wg-NcDwY,8824
 cognee/api/v1/search/routers/__init__.py,sha256=6RebeLX_2NTRxIMPH_mGuLztPxnGnMJK1y_O93CtRm8,49

@@ -182,12 +181,12 @@ cognee/infrastructure/databases/relational/get_async_session.py,sha256=qfiXSsTAA
 cognee/infrastructure/databases/relational/get_migration_relational_engine.py,sha256=5RtH281iIQo3vqgwmKT0nuiJp9jNd7vw6xRUjc5xIDM,1070
 cognee/infrastructure/databases/relational/get_relational_engine.py,sha256=De51ieg9eFhRLX08k9oNc-oszvt_9J5DHebqI1qI8_U,741
 cognee/infrastructure/databases/relational/with_async_session.py,sha256=UgQeJOvgeM6yhyNDwWdGULtTjZosTnjDlr267Losnfs,803
-cognee/infrastructure/databases/relational/sqlalchemy/SqlAlchemyAdapter.py,sha256=
+cognee/infrastructure/databases/relational/sqlalchemy/SqlAlchemyAdapter.py,sha256=j4mnqNJAO-U-Qfveam6NgjIH5lt7WjSMLVlemBrdpYU,27540
 cognee/infrastructure/databases/relational/sqlalchemy/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 cognee/infrastructure/databases/utils/__init__.py,sha256=4C0ncZG-O6bOFJpKgscCHu6D5vodLWRIKpe-WT4Ijbs,75
 cognee/infrastructure/databases/utils/get_or_create_dataset_database.py,sha256=wn7pRgeX-BU0L191_6pgT9P54uhVQlGMPqxQdvIlv4Y,2101
 cognee/infrastructure/databases/vector/__init__.py,sha256=7MdGJ3Mxdh2RyDq39rcjD99liIa-yGXxDUzq--1qQZs,291
-cognee/infrastructure/databases/vector/config.py,sha256=
+cognee/infrastructure/databases/vector/config.py,sha256=4HOmqZOEfVNmAhjxRNePMU9haTVeR35R2XbhPTcMqFg,2952
 cognee/infrastructure/databases/vector/create_vector_engine.py,sha256=ECtICkIW5QM_lX9465ZTxVXC5MCRo_h219q3GyFXxpc,4716
 cognee/infrastructure/databases/vector/get_vector_engine.py,sha256=y4TMWJ6B6DxwKF9PMfjB6WqujPnVhf0oR2j35Q-KhvA,272
 cognee/infrastructure/databases/vector/supported_databases.py,sha256=0UIYcQ15p7-rq5y_2A-E9ydcXyP6frdg8T5e5ECDDMI,25

@@ -366,8 +365,8 @@ cognee/infrastructure/loaders/external/pypdf_loader.py,sha256=nFa_h3LURBPoguRIID
 cognee/infrastructure/loaders/external/unstructured_loader.py,sha256=XCRVHwpM5XmcjRmL4Pr9ELzBU_qYDPhX_Ahn5K8w0AU,4603
 cognee/infrastructure/loaders/utils/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 cognee/infrastructure/utils/calculate_backoff.py,sha256=O6h4MCe357BKaECmLZPLGYpffrMol65LwQCklBj4sh4,935
-cognee/infrastructure/utils/run_async.py,sha256=
-cognee/infrastructure/utils/run_sync.py,sha256=
+cognee/infrastructure/utils/run_async.py,sha256=gZY8ZLG_86O9YVK8hciduIoDONHaEEnGOILh3EeD9LA,510
+cognee/infrastructure/utils/run_sync.py,sha256=9pAXc-EmjtV03exnUMOVSC-IJq_KCslX05z62MHQjlQ,800
 cognee/modules/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 cognee/modules/chunking/Chunker.py,sha256=KezN4WBiV0KNJtx6daMg4g1-a-_oJxn_l_iQT94T1lQ,343
 cognee/modules/chunking/LangchainChunker.py,sha256=Yo9Jza-t3x3V8I8PWbxUu48vlVVdvJKxwzL2gManwDc,2351

@@ -483,14 +482,15 @@ cognee/modules/metrics/operations/__init__.py,sha256=MZ3xbVdfEKqfLct8WnbyFVyZmkB
 cognee/modules/metrics/operations/get_pipeline_run_metrics.py,sha256=upIWnzKeJT1_XbL_ABdGxW-Ai7mO3AqMK35BNmItIQQ,2434
 cognee/modules/notebooks/methods/__init__.py,sha256=IhY4fUVPJbuvS83QESsWzjZRC6oC1I-kJi5gr3kPTLk,215
 cognee/modules/notebooks/methods/create_notebook.py,sha256=S41H3Rha0pj9dEKFy1nBG9atTGHhUdOmDZgr0ckUA6M,633
+cognee/modules/notebooks/methods/create_tutorial_notebook.py,sha256=8YPoDcMUZSNhEWSKxUcPOM61y0St2Z1Y-PC1HFRmlbk,4248
 cognee/modules/notebooks/methods/delete_notebook.py,sha256=BKxoRlPzkwXvTYh5WcF-zo_iVmaXqEiptS42JwB0KQU,309
-cognee/modules/notebooks/methods/get_notebook.py,sha256=
+cognee/modules/notebooks/methods/get_notebook.py,sha256=IP4imsdt9X6GYd6i6WF6PlVhotGNH0i7XZpPqbtqMwo,554
 cognee/modules/notebooks/methods/get_notebooks.py,sha256=ee40ALHvebVORuwZVkQ271qAj260rrYy6eVGxAmfo8c,483
-cognee/modules/notebooks/methods/update_notebook.py,sha256=
+cognee/modules/notebooks/methods/update_notebook.py,sha256=MnZbfh-WfEfH3ImNvyQNhDeNwpYeS7p8FPVwnmBvZVg,361
 cognee/modules/notebooks/models/Notebook.py,sha256=Jth47QxJQ2-VGPyIcS0ul3bS8bgGrk9vCGoJVagxanw,1690
 cognee/modules/notebooks/models/__init__.py,sha256=jldsDjwRvFMreGpe4wxxr5TlFXTZuU7rbsRkGQvTO5s,45
 cognee/modules/notebooks/operations/__init__.py,sha256=VR_2w_d0lEiJ5Xw7_mboo2qWUv0umrR_Bp58MaMoE6w,55
-cognee/modules/notebooks/operations/run_in_local_sandbox.py,sha256=
+cognee/modules/notebooks/operations/run_in_local_sandbox.py,sha256=17hMEQC3LZTfPvbRUrPN9SzDeJPWSTq_BAhtwRZiqT8,1338
 cognee/modules/observability/get_observe.py,sha256=chRw4jmpmrwEvDecF9sgApm23IOzVgCbwkKEAyz1_AI,264
 cognee/modules/observability/observers.py,sha256=SKQSWWyGDG0QY2_bqsFgfpLUb7OUL4WFf8tDZYe5JMM,157
 cognee/modules/ontology/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0

@@ -550,15 +550,15 @@ cognee/modules/retrieval/code_retriever.py,sha256=cnOjgfCATzz0-XZGFrIIkuVZLc6HBh
 cognee/modules/retrieval/coding_rules_retriever.py,sha256=3GU259jTbGLqmp_A8sUdE4fyf0td06SKuxBJVW-npIQ,1134
 cognee/modules/retrieval/completion_retriever.py,sha256=Lw5sxN_UrtmWSOtcSS7Yj50Gw9p4nNBmW3dr2kV9JJ0,3754
 cognee/modules/retrieval/cypher_search_retriever.py,sha256=_3rZJ23hSZpDa8kVyOSWN3fwjMI_aLF2m5p-FtBek8k,2440
-cognee/modules/retrieval/graph_completion_context_extension_retriever.py,sha256
-cognee/modules/retrieval/graph_completion_cot_retriever.py,sha256=
-cognee/modules/retrieval/graph_completion_retriever.py,sha256=
+cognee/modules/retrieval/graph_completion_context_extension_retriever.py,sha256=-6yN8gpRlDue8d28rk-Ly-gq0T8BW-i1-Jgbp1x-Zsg,4532
+cognee/modules/retrieval/graph_completion_cot_retriever.py,sha256=JU-FkikaU68v8fT8VAmG6jojwhwroKYW2RUxdlJ1R-k,6140
+cognee/modules/retrieval/graph_completion_retriever.py,sha256=VnrFD4xUQewIO83mfmIUcPLA_HBGdUlDVRyA2Pm4ARo,8822
 cognee/modules/retrieval/graph_summary_completion_retriever.py,sha256=3AMisk3fObk2Vh1heY4veHkDjLsHgSSUc_ChZseJUYw,2456
 cognee/modules/retrieval/insights_retriever.py,sha256=1pcYd34EfKk85MSPFQ8b-ZbSARmnauks8TxXfNOxvOw,4953
 cognee/modules/retrieval/natural_language_retriever.py,sha256=zJz35zRmBP8-pRlkoxxSxn3-jtG2lUW0xcu58bq9Ebs,5761
 cognee/modules/retrieval/summaries_retriever.py,sha256=joXYphypACm2JiCjbC8nBS61m1q2oYkzyIt9bdgALNw,3384
-cognee/modules/retrieval/temporal_retriever.py,sha256=
-cognee/modules/retrieval/user_qa_feedback.py,sha256
+cognee/modules/retrieval/temporal_retriever.py,sha256=EUEYN94LpoWfbPjsToe_pC3rFsUUTIPA5K6wNjv8Nds,5685
+cognee/modules/retrieval/user_qa_feedback.py,sha256=-VEOsE_t0FiTy00OpOMWAYv12YSLPieAcMsu82vm7h4,3366
 cognee/modules/retrieval/context_providers/DummyContextProvider.py,sha256=9GsvINc7ekRyRWO5IefFGyytRYqsSlhpwAOw6Q691cA,419
 cognee/modules/retrieval/context_providers/SummarizedTripletSearchContextProvider.py,sha256=ypO6yWLxvmRsj_5dyYdvXTbztJmB_ioLrgyG6bF5WGA,894
 cognee/modules/retrieval/context_providers/TripletSearchContextProvider.py,sha256=8PzksHAtRw7tZarP3nZuxhi0cd1EYEDHOT4Q74mNEvc,3656

@@ -593,7 +593,7 @@ cognee/modules/search/types/SearchResult.py,sha256=blEean6PRFKcDRQugsojZPfH-Wohx
 cognee/modules/search/types/SearchType.py,sha256=-lT4bLKKunV4cL4FfF3tjNbdN7X4AsRMLpTkReNwXZM,594
 cognee/modules/search/types/__init__.py,sha256=8k6OjVrL70W1Jh-ClTbG2ETYIhOtSk3tfqjzYgEdPzA,117
 cognee/modules/search/utils/__init__.py,sha256=86mRtCN-B5-2NNChdQoU5x8_8hqTczGZjBoKVE9O7hA,124
-cognee/modules/search/utils/prepare_search_result.py,sha256=
+cognee/modules/search/utils/prepare_search_result.py,sha256=FTM-tVlprL8EswIcwOy8jO1bRmKG61GZqFfM8FNJUJg,1336
 cognee/modules/search/utils/transform_context_to_graph.py,sha256=rUQeEH-Z-GqAzAZTCetRVpwgrOHlNe3mUBRLwRb0478,1238
 cognee/modules/settings/__init__.py,sha256=_SZQgCQnnnIHLJuKOMO9uWzXNBQxwYHHMUSBp0qa2uQ,210
 cognee/modules/settings/get_current_settings.py,sha256=R2lOusG5Q2PMa2-2vDndh3Lm7nXyZVkdzTV7vQHT81Y,1642

@@ -789,7 +789,6 @@ cognee/tests/test_remote_kuzu.py,sha256=2GG05MtGuhOo6ST82OxjdVDetBS0GWHvKKmmmEtQ
 cognee/tests/test_remote_kuzu_stress.py,sha256=5vgnu4Uz_NoKKqFZJeVceHwb2zNhvdTVBgpN3NjhfAE,5304
 cognee/tests/test_s3.py,sha256=rY2UDK15cdyywlyVrR8N2DRtVXWYIW5REaaz99gaQeE,2694
 cognee/tests/test_s3_file_storage.py,sha256=62tvIFyh_uTP0TFF9Ck4Y-sxWPW-cwJKYEJUJI1atPI,5654
-cognee/tests/test_save_export_path.py,sha256=z07oQao82INzldg2mesS3ZGt7fl7rcjKx15JwoGT5tI,3898
 cognee/tests/test_search_db.py,sha256=4GpLx8ZJoMjkp-XqQ-LCrkf3NhAM4j_rMmlOFgmDO-A,13420
 cognee/tests/test_starter_pipelines.py,sha256=X1J8RDD0bFMKnRETyi5nyaF4TYdmUIu0EuD3WQwShNs,2475
 cognee/tests/test_telemetry.py,sha256=FIneuVofSKWFYqxNC88sT_P5GPzgfjVyqDCf2TYBE2E,4130

@@ -890,9 +889,9 @@ distributed/tasks/queued_add_edges.py,sha256=kz1DHE05y-kNHORQJjYWHUi6Q1QWUp_v3Dl
 distributed/tasks/queued_add_nodes.py,sha256=aqK4Ij--ADwUWknxYpiwbYrpa6CcvFfqHWbUZW4Kh3A,452
 distributed/workers/data_point_saving_worker.py,sha256=jFmA0-P_0Ru2IUDrSug0wML-5goAKrGtlBm5BA5Ryw4,3229
 distributed/workers/graph_saving_worker.py,sha256=oUYl99CdhlrPAIsUOHbHnS3d4XhGoV0_OIbCO8wYzRg,3648
-cognee-0.3.
-cognee-0.3.
-cognee-0.3.
-cognee-0.3.
-cognee-0.3.
-cognee-0.3.
+cognee-0.3.3.dist-info/METADATA,sha256=MofBzxb-pUo59hyKjasnooG9SDbuVPsvy5UK6sjXluA,14753
+cognee-0.3.3.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
+cognee-0.3.3.dist-info/entry_points.txt,sha256=GCCTsNg8gzOJkolq7dR7OK1VlIAO202dGDnMI8nm8oQ,55
+cognee-0.3.3.dist-info/licenses/LICENSE,sha256=pHHjSQj1DD8SDppW88MMs04TPk7eAanL1c5xj8NY7NQ,11344
+cognee-0.3.3.dist-info/licenses/NOTICE.md,sha256=6L3saP3kSpcingOxDh-SGjMS8GY79Rlh2dBNLaO0o5c,339
+cognee-0.3.3.dist-info/RECORD,,
cognee/api/v1/save/save.py
DELETED

@@ -1,335 +0,0 @@
import os
import asyncio
import json
from typing import Optional, Union, List, Dict
from uuid import UUID

from pydantic import BaseModel

from cognee.base_config import get_base_config
from cognee.modules.users.models import User
from cognee.modules.users.methods import get_default_user
from cognee.modules.data.methods import get_authorized_existing_datasets, get_dataset_data
from cognee.infrastructure.files.utils.get_data_file_path import get_data_file_path
from cognee.infrastructure.llm.LLMGateway import LLMGateway
from cognee.shared.logging_utils import get_logger
from cognee.api.v1.search import search
from cognee.modules.search.types import SearchType


logger = get_logger("save")


class QuestionsModel(BaseModel):
    questions: List[str]


def _sanitize_filename(name: str) -> str:
    safe = "".join(c if c.isalnum() or c in ("-", "_", ".", " ") else "_" for c in name)
    return safe.strip().replace(" ", "_")


def _dataset_dir_name(dataset) -> str:
    # Prefer readable dataset name when available, fallback to id
    if getattr(dataset, "name", None):
        return _sanitize_filename(str(dataset.name))
    return str(dataset.id)


def _file_markdown_name(data_item, used_names: set[str]) -> str:
    # Use original file name if present, else data.name
    name = getattr(data_item, "name", None) or "file"
    base = _sanitize_filename(str(name))
    filename = f"{base}.md"
    if filename in used_names:
        short_id = str(getattr(data_item, "id", ""))[:8]
        filename = f"{base}__{short_id}.md"
    used_names.add(filename)
    return filename


def _ascii_path_tree(path_str: str) -> str:
    if not path_str:
        return "(no path)"

    # Normalize special schemes but keep segments readable
    try:
        normalized = get_data_file_path(path_str)
    except Exception:
        normalized = path_str

    # Keep the path compact – show last 5 segments
    parts = [p for p in normalized.replace("\\", "/").split("/") if p]
    if len(parts) > 6:
        display = ["…"] + parts[-5:]
    else:
        display = parts

    # Render a single-branch tree
    lines = []
    for idx, seg in enumerate(display):
        prefix = "└── " if idx == 0 else (" " * idx + "└── ")
        lines.append(f"{prefix}{seg}")
    return "\n".join(lines)


async def _get_summary_via_summaries(query_text: str, dataset_id: UUID, top_k: int) -> str:
    try:
        results = await search(
            query_text=query_text,
            query_type=SearchType.SUMMARIES,
            dataset_ids=[dataset_id],
            top_k=top_k,
        )
        if not results:
            return ""
        texts: List[str] = []
        for r in results[:top_k]:
            texts.append(str(r))
        return "\n\n".join(texts)
    except Exception as e:
        logger.error(
            "SUMMARIES search failed for '%s' in dataset %s: %s",
            query_text,
            str(dataset_id),
            str(e),
        )
        return ""


async def _generate_questions(file_name: str, summary_text: str) -> List[str]:
    prompt = (
        "You are an expert analyst. Given a file and its summary, propose 10 diverse, high-signal "
        "questions to further explore the file's content, implications, relationships, and gaps. "
        "Avoid duplicates; vary depth and angle (overview, details, cross-references, temporal, quality).\n\n"
        f"File: {file_name}\n\nSummary:\n{summary_text[:4000]}"
    )

    model = await LLMGateway.acreate_structured_output(
        text_input=prompt,
        system_prompt="Return strictly a JSON with key 'questions' and value as an array of 10 concise strings.",
        response_model=QuestionsModel,
    )

    # model can be either pydantic model or dict-like, normalize
    try:
        questions = list(getattr(model, "questions", []))
    except Exception:
        questions = []

    # Fallback if the tool returned a dict-like
    if not questions and isinstance(model, dict):
        questions = list(model.get("questions", []) or [])

    # Enforce 10 max
    return questions[:10]


async def _run_searches_for_question(
    question: str, dataset_id: UUID, search_types: List[SearchType], top_k: int
) -> Dict[str, Union[str, List[dict], List[str]]]:
    async def run_one(st: SearchType):
        try:
            result = await search(
                query_text=question,
                query_type=st,
                dataset_ids=[dataset_id],
                top_k=top_k,
            )
            return st.value, result
        except Exception as e:
            logger.error("Search failed for type %s: %s", st.value, str(e))
            return st.value, [f"Error: {str(e)}"]

    pairs = await asyncio.gather(*[run_one(st) for st in search_types])
    return {k: v for k, v in pairs}


def _format_results_md(results: Dict[str, Union[str, List[dict], List[str]]]) -> str:
    lines: List[str] = []
    for st, payload in results.items():
        lines.append(f"#### {st}")
        if isinstance(payload, list):
            # Printed as bullet items; stringify dicts
            for item in payload[:5]:
                if isinstance(item, dict):
                    # compact representation
                    snippet = json.dumps(item, ensure_ascii=False)[:800]
                    lines.append(f"- {snippet}")
                else:
                    text = str(item)
                    lines.append(f"- {text[:800]}")
        else:
            lines.append(str(payload))
        lines.append("")
    return "\n".join(lines)


async def save(
    datasets: Optional[Union[List[str], List[UUID]]] = None,
    export_root_directory: Optional[str] = None,
    user: Optional[User] = None,
    # Configurable knobs
    max_questions: int = 10,
    search_types: Optional[List[Union[str, SearchType]]] = None,
    top_k: int = 5,
    include_summary: bool = True,
    include_ascii_tree: bool = True,
    concurrency: int = 4,
    timeout: Optional[float] = None,
) -> Dict[str, str]:
    """
    Export per-dataset markdown summaries and search insights for each ingested file.

    For every dataset the user can read:
    - Create a folder under export_root_directory (or data_root_directory/exports)
    - For each data item (file), create a .md containing:
      - Summary of the file (from existing TextSummary nodes)
      - A small ASCII path tree showing its folder position
      - Up to N LLM-generated question ideas (configurable)
      - Results of configured Cognee searches per question
    Also creates an index.md per dataset with links to files and an optional dataset summary.

    Returns a mapping of dataset_id -> export_directory path.
    """
    base_config = get_base_config()
    export_root = export_root_directory or os.path.join(
        base_config.data_root_directory, "memory_export"
    )
    os.makedirs(export_root, exist_ok=True)

    if user is None:
        user = await get_default_user()

    datasets_list = await get_authorized_existing_datasets(datasets, "read", user)
    results: Dict[str, str] = {}

    for dataset in datasets_list:
        ds_dir = os.path.join(export_root, _dataset_dir_name(dataset))
        os.makedirs(ds_dir, exist_ok=True)
        results[str(dataset.id)] = ds_dir

        data_items = await get_dataset_data(dataset.id)

        # Normalize search types
        if not search_types:
            effective_search_types = [
                SearchType.GRAPH_COMPLETION,
                SearchType.INSIGHTS,
                SearchType.CHUNKS,
            ]
        else:
            effective_search_types = []
            for st in search_types:
                if isinstance(st, SearchType):
                    effective_search_types.append(st)
                else:
                    try:
                        effective_search_types.append(SearchType[str(st)])
                    except Exception:
                        logger.warning("Unknown search type '%s', skipping", str(st))

        sem = asyncio.Semaphore(max(1, int(concurrency)))
        used_names: set[str] = set()
        index_entries: List[tuple[str, str]] = []

        async def process_one(data_item):
            async with sem:
                file_label = getattr(data_item, "name", str(data_item.id))
                original_path = getattr(data_item, "original_data_location", None)

                ascii_tree = (
                    _ascii_path_tree(original_path or file_label) if include_ascii_tree else ""
                )

                summary_text = ""
                if include_summary:
                    # Use SUMMARIES search scoped to dataset to derive file summary
                    file_query = getattr(data_item, "name", str(data_item.id)) or "file"
                    summary_text = await _get_summary_via_summaries(file_query, dataset.id, top_k)
                    if not summary_text:
                        summary_text = "Summary not available."

                if max_questions == 0:
                    questions = []
                else:
                    questions = await _generate_questions(file_label, summary_text)
                    if max_questions is not None and max_questions >= 0:
                        questions = questions[:max_questions]

                async def searches_for_question(q: str):
                    return await _run_searches_for_question(
                        q, dataset.id, effective_search_types, top_k
                    )

                # Run per-question searches concurrently
                per_q_results = await asyncio.gather(*[searches_for_question(q) for q in questions])

                # Build markdown content
                md_lines = [f"# {file_label}", ""]
                if include_ascii_tree:
                    md_lines.extend(["## Location", "", "```", ascii_tree, "```", ""])
                if include_summary:
                    md_lines.extend(["## Summary", "", summary_text, ""])

                md_lines.append("## Question ideas")
                for idx, q in enumerate(questions, start=1):
                    md_lines.append(f"- {idx}. {q}")
                md_lines.append("")

                md_lines.append("## Searches")
                md_lines.append("")
                for q, per_type in zip(questions, per_q_results):
                    md_lines.append(f"### Q: {q}")
                    md_lines.append(_format_results_md(per_type))
                    md_lines.append("")

                # Write to file (collision-safe)
                md_filename = _file_markdown_name(data_item, used_names)
                export_path = os.path.join(ds_dir, md_filename)
                tmp_path = export_path + ".tmp"
                with open(tmp_path, "w", encoding="utf-8") as f:
                    f.write("\n".join(md_lines))
                os.replace(tmp_path, export_path)

                index_entries.append((file_label, md_filename))

        tasks = [asyncio.create_task(process_one(item)) for item in data_items]

        if timeout and timeout > 0:
            try:
                await asyncio.wait_for(asyncio.gather(*tasks, return_exceptions=True), timeout)
            except asyncio.TimeoutError:
                logger.error("Save timed out for dataset %s", str(dataset.id))
        else:
            await asyncio.gather(*tasks, return_exceptions=True)

        # Build dataset index.md with TOC and optional dataset summary via SUMMARIES
        try:
            index_lines = [f"# Dataset: {_dataset_dir_name(dataset)}", "", "## Files", ""]
            for display, fname in sorted(index_entries, key=lambda x: x[0].lower()):
                index_lines.append(f"- [{display}]({fname})")

            # Dataset summary section
            try:
                summaries = await search(
                    query_text="dataset overview",
                    query_type=SearchType.SUMMARIES,
                    dataset_ids=[dataset.id],
                    top_k=top_k,
                )
            except Exception as e:
                logger.error("Dataset summary search failed: %s", str(e))
                summaries = []

            if summaries:
                index_lines.extend(["", "## Dataset summary (top summaries)", ""])
                for s in summaries[:top_k]:
                    index_lines.append(f"- {str(s)[:800]}")

            with open(os.path.join(ds_dir, "index.md"), "w", encoding="utf-8") as f:
                f.write("\n".join(index_lines))
        except Exception as e:
            logger.error("Failed to write dataset index for %s: %s", str(dataset.id), str(e))

    return results
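For reference, the removed `save()` entry point was called roughly like this in 0.3.2 (a sketch based on the signature above and on the deleted test below; the API is gone in 0.3.3):

```python
import asyncio

from cognee.api.v1.save.save import save  # removed in 0.3.3


async def main():
    exports = await save(
        datasets=None,  # all datasets readable by the resolved user
        export_root_directory="./memory_export",
        max_questions=3,
        search_types=["GRAPH_COMPLETION", "INSIGHTS", "CHUNKS"],
        top_k=2,
    )
    print(exports)  # {dataset_id: export_directory, ...}


asyncio.run(main())
```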
cognee/tests/test_save_export_path.py
DELETED

@@ -1,116 +0,0 @@
import os
import asyncio
from uuid import uuid4

import pytest


@pytest.mark.asyncio
async def test_save_uses_custom_export_path(tmp_path, monkeypatch):
    # Import target after tmp fixtures are ready
    from cognee.api.v1.save import save as save_mod

    # Prepare two mock datasets
    class Dataset:
        def __init__(self, id_, name):
            self.id = id_
            self.name = name

    ds1 = Dataset(uuid4(), "dataset_alpha")
    ds2 = Dataset(uuid4(), "dataset_beta")

    # Mock dataset discovery
    async def mock_get_authorized_existing_datasets(datasets, permission_type, user):
        return [ds1, ds2]

    monkeypatch.setattr(
        save_mod, "get_authorized_existing_datasets", mock_get_authorized_existing_datasets
    )

    # Mock data items (with filename collision in ds1)
    class DataItem:
        def __init__(self, id_, name, original_path=None):
            self.id = id_
            self.name = name
            self.original_data_location = original_path

    ds1_items = [
        DataItem(uuid4(), "report.txt", "/root/a/report.txt"),
        DataItem(uuid4(), "report.txt", "/root/b/report.txt"),  # collision
    ]
    ds2_items = [
        DataItem(uuid4(), "notes.md", "/root/x/notes.md"),
    ]

    async def mock_get_dataset_data(dataset_id):
        if dataset_id == ds1.id:
            return ds1_items
        if dataset_id == ds2.id:
            return ds2_items
        return []

    monkeypatch.setattr(save_mod, "get_dataset_data", mock_get_dataset_data)

    # Mock summary retrieval
    async def mock_get_document_summaries_text(data_id: str) -> str:
        return "This is a summary."

    monkeypatch.setattr(save_mod, "_get_document_summaries_text", mock_get_document_summaries_text)

    # Mock questions
    async def mock_generate_questions(file_name: str, summary_text: str):
        return ["Q1?", "Q2?", "Q3?"]

    monkeypatch.setattr(save_mod, "_generate_questions", mock_generate_questions)

    # Mock searches per question
    async def mock_run_searches_for_question(question, dataset_id, search_types, top_k):
        return {st.value: [f"{question} -> ok"] for st in search_types}

    monkeypatch.setattr(save_mod, "_run_searches_for_question", mock_run_searches_for_question)

    # Use custom export path
    export_dir = tmp_path / "my_exports"
    export_dir_str = str(export_dir)

    # Run
    result = await save_mod.save(
        datasets=None,
        export_root_directory=export_dir_str,
        max_questions=3,
        search_types=["GRAPH_COMPLETION", "INSIGHTS", "CHUNKS"],
        top_k=2,
        include_summary=True,
        include_ascii_tree=True,
        concurrency=2,
        timeout=None,
    )

    # Verify returned mapping points to our custom path
    assert str(ds1.id) in result and str(ds2.id) in result
    assert result[str(ds1.id)].startswith(export_dir_str)
    assert result[str(ds2.id)].startswith(export_dir_str)

    # Verify directories and files exist
    ds1_dir = result[str(ds1.id)]
    ds2_dir = result[str(ds2.id)]

    assert os.path.isdir(ds1_dir)
    assert os.path.isdir(ds2_dir)

    # index.md present
    assert os.path.isfile(os.path.join(ds1_dir, "index.md"))
    assert os.path.isfile(os.path.join(ds2_dir, "index.md"))

    # File markdowns exist; collision handling: two files with similar base
    ds1_files = [f for f in os.listdir(ds1_dir) if f.endswith(".md") and f != "index.md"]
    assert len(ds1_files) == 2
    assert any(f == "report.txt.md" for f in ds1_files)
    assert any(f.startswith("report.txt__") and f.endswith(".md") for f in ds1_files)

    # Content sanity: ensure question headers exist in one file
    sample_md_path = os.path.join(ds1_dir, ds1_files[0])
    with open(sample_md_path, "r", encoding="utf-8") as fh:
        content = fh.read()
    assert "## Question ideas" in content
    assert "## Searches" in content
{cognee-0.3.2.dist-info → cognee-0.3.3.dist-info}/WHEEL: file without changes
{cognee-0.3.2.dist-info → cognee-0.3.3.dist-info}/licenses/LICENSE: file without changes
{cognee-0.3.2.dist-info → cognee-0.3.3.dist-info}/licenses/NOTICE.md: file without changes