cognee 0.2.3.dev1__py3-none-any.whl → 0.3.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (252) hide show
  1. cognee/__init__.py +2 -0
  2. cognee/__main__.py +4 -0
  3. cognee/api/client.py +28 -3
  4. cognee/api/health.py +10 -13
  5. cognee/api/v1/add/add.py +20 -6
  6. cognee/api/v1/add/routers/get_add_router.py +12 -37
  7. cognee/api/v1/cloud/routers/__init__.py +1 -0
  8. cognee/api/v1/cloud/routers/get_checks_router.py +23 -0
  9. cognee/api/v1/cognify/code_graph_pipeline.py +14 -3
  10. cognee/api/v1/cognify/cognify.py +67 -105
  11. cognee/api/v1/cognify/routers/get_cognify_router.py +11 -3
  12. cognee/api/v1/datasets/routers/get_datasets_router.py +16 -5
  13. cognee/api/v1/memify/routers/__init__.py +1 -0
  14. cognee/api/v1/memify/routers/get_memify_router.py +100 -0
  15. cognee/api/v1/notebooks/routers/__init__.py +1 -0
  16. cognee/api/v1/notebooks/routers/get_notebooks_router.py +96 -0
  17. cognee/api/v1/responses/default_tools.py +4 -0
  18. cognee/api/v1/responses/dispatch_function.py +6 -1
  19. cognee/api/v1/responses/models.py +1 -1
  20. cognee/api/v1/search/routers/get_search_router.py +20 -1
  21. cognee/api/v1/search/search.py +17 -4
  22. cognee/api/v1/sync/__init__.py +17 -0
  23. cognee/api/v1/sync/routers/__init__.py +3 -0
  24. cognee/api/v1/sync/routers/get_sync_router.py +241 -0
  25. cognee/api/v1/sync/sync.py +877 -0
  26. cognee/api/v1/ui/__init__.py +1 -0
  27. cognee/api/v1/ui/ui.py +529 -0
  28. cognee/api/v1/users/routers/get_auth_router.py +13 -1
  29. cognee/base_config.py +10 -1
  30. cognee/cli/__init__.py +10 -0
  31. cognee/cli/_cognee.py +273 -0
  32. cognee/cli/commands/__init__.py +1 -0
  33. cognee/cli/commands/add_command.py +80 -0
  34. cognee/cli/commands/cognify_command.py +128 -0
  35. cognee/cli/commands/config_command.py +225 -0
  36. cognee/cli/commands/delete_command.py +80 -0
  37. cognee/cli/commands/search_command.py +149 -0
  38. cognee/cli/config.py +33 -0
  39. cognee/cli/debug.py +21 -0
  40. cognee/cli/echo.py +45 -0
  41. cognee/cli/exceptions.py +23 -0
  42. cognee/cli/minimal_cli.py +97 -0
  43. cognee/cli/reference.py +26 -0
  44. cognee/cli/suppress_logging.py +12 -0
  45. cognee/eval_framework/corpus_builder/corpus_builder_executor.py +2 -2
  46. cognee/eval_framework/eval_config.py +1 -1
  47. cognee/infrastructure/databases/graph/config.py +10 -4
  48. cognee/infrastructure/databases/graph/get_graph_engine.py +4 -9
  49. cognee/infrastructure/databases/graph/kuzu/adapter.py +199 -2
  50. cognee/infrastructure/databases/graph/neo4j_driver/adapter.py +138 -0
  51. cognee/infrastructure/databases/relational/__init__.py +2 -0
  52. cognee/infrastructure/databases/relational/get_async_session.py +15 -0
  53. cognee/infrastructure/databases/relational/sqlalchemy/SqlAlchemyAdapter.py +6 -1
  54. cognee/infrastructure/databases/relational/with_async_session.py +25 -0
  55. cognee/infrastructure/databases/vector/chromadb/ChromaDBAdapter.py +1 -1
  56. cognee/infrastructure/databases/vector/config.py +13 -6
  57. cognee/infrastructure/databases/vector/embeddings/FastembedEmbeddingEngine.py +6 -4
  58. cognee/infrastructure/databases/vector/embeddings/LiteLLMEmbeddingEngine.py +16 -7
  59. cognee/infrastructure/databases/vector/embeddings/OllamaEmbeddingEngine.py +5 -5
  60. cognee/infrastructure/databases/vector/embeddings/config.py +2 -2
  61. cognee/infrastructure/databases/vector/embeddings/embedding_rate_limiter.py +2 -6
  62. cognee/infrastructure/databases/vector/embeddings/get_embedding_engine.py +10 -7
  63. cognee/infrastructure/files/storage/LocalFileStorage.py +9 -0
  64. cognee/infrastructure/files/storage/S3FileStorage.py +5 -0
  65. cognee/infrastructure/files/storage/StorageManager.py +7 -1
  66. cognee/infrastructure/files/storage/storage.py +16 -0
  67. cognee/infrastructure/files/utils/get_data_file_path.py +14 -9
  68. cognee/infrastructure/files/utils/get_file_metadata.py +2 -1
  69. cognee/infrastructure/llm/LLMGateway.py +32 -5
  70. cognee/infrastructure/llm/config.py +6 -4
  71. cognee/infrastructure/llm/prompts/extract_query_time.txt +15 -0
  72. cognee/infrastructure/llm/prompts/generate_event_entity_prompt.txt +25 -0
  73. cognee/infrastructure/llm/prompts/generate_event_graph_prompt.txt +30 -0
  74. cognee/infrastructure/llm/structured_output_framework/baml/baml_src/extraction/knowledge_graph/extract_content_graph.py +16 -5
  75. cognee/infrastructure/llm/structured_output_framework/litellm_instructor/extraction/__init__.py +2 -0
  76. cognee/infrastructure/llm/structured_output_framework/litellm_instructor/extraction/extract_event_entities.py +44 -0
  77. cognee/infrastructure/llm/structured_output_framework/litellm_instructor/extraction/knowledge_graph/__init__.py +1 -0
  78. cognee/infrastructure/llm/structured_output_framework/litellm_instructor/extraction/knowledge_graph/extract_content_graph.py +19 -15
  79. cognee/infrastructure/llm/structured_output_framework/litellm_instructor/extraction/knowledge_graph/extract_event_graph.py +46 -0
  80. cognee/infrastructure/llm/structured_output_framework/litellm_instructor/llm/anthropic/adapter.py +3 -3
  81. cognee/infrastructure/llm/structured_output_framework/litellm_instructor/llm/gemini/adapter.py +3 -3
  82. cognee/infrastructure/llm/structured_output_framework/litellm_instructor/llm/generic_llm_api/adapter.py +2 -2
  83. cognee/infrastructure/llm/structured_output_framework/litellm_instructor/llm/get_llm_client.py +14 -8
  84. cognee/infrastructure/llm/structured_output_framework/litellm_instructor/llm/ollama/adapter.py +6 -4
  85. cognee/infrastructure/llm/structured_output_framework/litellm_instructor/llm/openai/adapter.py +28 -4
  86. cognee/infrastructure/llm/tokenizer/Gemini/adapter.py +2 -2
  87. cognee/infrastructure/llm/tokenizer/HuggingFace/adapter.py +3 -3
  88. cognee/infrastructure/llm/tokenizer/Mistral/adapter.py +3 -3
  89. cognee/infrastructure/llm/tokenizer/TikToken/adapter.py +6 -6
  90. cognee/infrastructure/llm/utils.py +7 -7
  91. cognee/infrastructure/utils/run_sync.py +8 -1
  92. cognee/modules/chunking/models/DocumentChunk.py +4 -3
  93. cognee/modules/cloud/exceptions/CloudApiKeyMissingError.py +15 -0
  94. cognee/modules/cloud/exceptions/CloudConnectionError.py +15 -0
  95. cognee/modules/cloud/exceptions/__init__.py +2 -0
  96. cognee/modules/cloud/operations/__init__.py +1 -0
  97. cognee/modules/cloud/operations/check_api_key.py +25 -0
  98. cognee/modules/data/deletion/prune_system.py +1 -1
  99. cognee/modules/data/methods/__init__.py +2 -0
  100. cognee/modules/data/methods/check_dataset_name.py +1 -1
  101. cognee/modules/data/methods/create_authorized_dataset.py +19 -0
  102. cognee/modules/data/methods/get_authorized_dataset.py +11 -5
  103. cognee/modules/data/methods/get_authorized_dataset_by_name.py +16 -0
  104. cognee/modules/data/methods/get_dataset_data.py +1 -1
  105. cognee/modules/data/methods/load_or_create_datasets.py +2 -20
  106. cognee/modules/engine/models/Event.py +16 -0
  107. cognee/modules/engine/models/Interval.py +8 -0
  108. cognee/modules/engine/models/Timestamp.py +13 -0
  109. cognee/modules/engine/models/__init__.py +3 -0
  110. cognee/modules/engine/utils/__init__.py +2 -0
  111. cognee/modules/engine/utils/generate_event_datapoint.py +46 -0
  112. cognee/modules/engine/utils/generate_timestamp_datapoint.py +51 -0
  113. cognee/modules/graph/cognee_graph/CogneeGraph.py +2 -2
  114. cognee/modules/graph/methods/get_formatted_graph_data.py +3 -2
  115. cognee/modules/graph/utils/__init__.py +1 -0
  116. cognee/modules/graph/utils/resolve_edges_to_text.py +71 -0
  117. cognee/modules/memify/__init__.py +1 -0
  118. cognee/modules/memify/memify.py +118 -0
  119. cognee/modules/notebooks/methods/__init__.py +5 -0
  120. cognee/modules/notebooks/methods/create_notebook.py +26 -0
  121. cognee/modules/notebooks/methods/delete_notebook.py +13 -0
  122. cognee/modules/notebooks/methods/get_notebook.py +21 -0
  123. cognee/modules/notebooks/methods/get_notebooks.py +18 -0
  124. cognee/modules/notebooks/methods/update_notebook.py +17 -0
  125. cognee/modules/notebooks/models/Notebook.py +53 -0
  126. cognee/modules/notebooks/models/__init__.py +1 -0
  127. cognee/modules/notebooks/operations/__init__.py +1 -0
  128. cognee/modules/notebooks/operations/run_in_local_sandbox.py +55 -0
  129. cognee/modules/pipelines/__init__.py +1 -1
  130. cognee/modules/pipelines/exceptions/tasks.py +18 -0
  131. cognee/modules/pipelines/layers/__init__.py +1 -0
  132. cognee/modules/pipelines/layers/check_pipeline_run_qualification.py +59 -0
  133. cognee/modules/pipelines/layers/pipeline_execution_mode.py +127 -0
  134. cognee/modules/pipelines/layers/reset_dataset_pipeline_run_status.py +28 -0
  135. cognee/modules/pipelines/layers/resolve_authorized_user_dataset.py +34 -0
  136. cognee/modules/pipelines/layers/resolve_authorized_user_datasets.py +55 -0
  137. cognee/modules/pipelines/layers/setup_and_check_environment.py +41 -0
  138. cognee/modules/pipelines/layers/validate_pipeline_tasks.py +20 -0
  139. cognee/modules/pipelines/methods/__init__.py +2 -0
  140. cognee/modules/pipelines/methods/get_pipeline_runs_by_dataset.py +34 -0
  141. cognee/modules/pipelines/methods/reset_pipeline_run_status.py +16 -0
  142. cognee/modules/pipelines/operations/__init__.py +0 -1
  143. cognee/modules/pipelines/operations/log_pipeline_run_initiated.py +1 -1
  144. cognee/modules/pipelines/operations/pipeline.py +24 -138
  145. cognee/modules/pipelines/operations/run_tasks.py +17 -41
  146. cognee/modules/retrieval/base_feedback.py +11 -0
  147. cognee/modules/retrieval/base_graph_retriever.py +18 -0
  148. cognee/modules/retrieval/base_retriever.py +1 -1
  149. cognee/modules/retrieval/code_retriever.py +8 -0
  150. cognee/modules/retrieval/coding_rules_retriever.py +31 -0
  151. cognee/modules/retrieval/completion_retriever.py +9 -3
  152. cognee/modules/retrieval/context_providers/TripletSearchContextProvider.py +1 -0
  153. cognee/modules/retrieval/cypher_search_retriever.py +1 -9
  154. cognee/modules/retrieval/graph_completion_context_extension_retriever.py +29 -13
  155. cognee/modules/retrieval/graph_completion_cot_retriever.py +30 -13
  156. cognee/modules/retrieval/graph_completion_retriever.py +107 -56
  157. cognee/modules/retrieval/graph_summary_completion_retriever.py +5 -1
  158. cognee/modules/retrieval/insights_retriever.py +14 -3
  159. cognee/modules/retrieval/natural_language_retriever.py +0 -4
  160. cognee/modules/retrieval/summaries_retriever.py +1 -1
  161. cognee/modules/retrieval/temporal_retriever.py +152 -0
  162. cognee/modules/retrieval/user_qa_feedback.py +83 -0
  163. cognee/modules/retrieval/utils/brute_force_triplet_search.py +7 -32
  164. cognee/modules/retrieval/utils/completion.py +10 -3
  165. cognee/modules/retrieval/utils/extract_uuid_from_node.py +18 -0
  166. cognee/modules/retrieval/utils/models.py +40 -0
  167. cognee/modules/search/methods/get_search_type_tools.py +168 -0
  168. cognee/modules/search/methods/no_access_control_search.py +47 -0
  169. cognee/modules/search/methods/search.py +239 -118
  170. cognee/modules/search/types/SearchResult.py +21 -0
  171. cognee/modules/search/types/SearchType.py +3 -0
  172. cognee/modules/search/types/__init__.py +1 -0
  173. cognee/modules/search/utils/__init__.py +2 -0
  174. cognee/modules/search/utils/prepare_search_result.py +41 -0
  175. cognee/modules/search/utils/transform_context_to_graph.py +38 -0
  176. cognee/modules/settings/get_settings.py +2 -2
  177. cognee/modules/sync/__init__.py +1 -0
  178. cognee/modules/sync/methods/__init__.py +23 -0
  179. cognee/modules/sync/methods/create_sync_operation.py +53 -0
  180. cognee/modules/sync/methods/get_sync_operation.py +107 -0
  181. cognee/modules/sync/methods/update_sync_operation.py +248 -0
  182. cognee/modules/sync/models/SyncOperation.py +142 -0
  183. cognee/modules/sync/models/__init__.py +3 -0
  184. cognee/modules/users/__init__.py +0 -1
  185. cognee/modules/users/methods/__init__.py +4 -1
  186. cognee/modules/users/methods/create_user.py +26 -1
  187. cognee/modules/users/methods/get_authenticated_user.py +36 -42
  188. cognee/modules/users/methods/get_default_user.py +3 -1
  189. cognee/modules/users/permissions/methods/get_specific_user_permission_datasets.py +2 -1
  190. cognee/root_dir.py +19 -0
  191. cognee/shared/CodeGraphEntities.py +1 -0
  192. cognee/shared/logging_utils.py +143 -32
  193. cognee/shared/utils.py +0 -1
  194. cognee/tasks/codingagents/coding_rule_associations.py +127 -0
  195. cognee/tasks/graph/extract_graph_from_data.py +6 -2
  196. cognee/tasks/ingestion/save_data_item_to_storage.py +23 -0
  197. cognee/tasks/memify/__init__.py +2 -0
  198. cognee/tasks/memify/extract_subgraph.py +7 -0
  199. cognee/tasks/memify/extract_subgraph_chunks.py +11 -0
  200. cognee/tasks/repo_processor/get_local_dependencies.py +2 -0
  201. cognee/tasks/repo_processor/get_repo_file_dependencies.py +144 -47
  202. cognee/tasks/storage/add_data_points.py +33 -3
  203. cognee/tasks/temporal_graph/__init__.py +1 -0
  204. cognee/tasks/temporal_graph/add_entities_to_event.py +85 -0
  205. cognee/tasks/temporal_graph/enrich_events.py +34 -0
  206. cognee/tasks/temporal_graph/extract_events_and_entities.py +32 -0
  207. cognee/tasks/temporal_graph/extract_knowledge_graph_from_events.py +41 -0
  208. cognee/tasks/temporal_graph/models.py +49 -0
  209. cognee/tests/integration/cli/__init__.py +3 -0
  210. cognee/tests/integration/cli/test_cli_integration.py +331 -0
  211. cognee/tests/integration/documents/PdfDocument_test.py +2 -2
  212. cognee/tests/integration/documents/TextDocument_test.py +2 -4
  213. cognee/tests/integration/documents/UnstructuredDocument_test.py +5 -8
  214. cognee/tests/{test_deletion.py → test_delete_hard.py} +0 -37
  215. cognee/tests/test_delete_soft.py +85 -0
  216. cognee/tests/test_kuzu.py +2 -2
  217. cognee/tests/test_neo4j.py +2 -2
  218. cognee/tests/test_permissions.py +3 -3
  219. cognee/tests/test_relational_db_migration.py +7 -5
  220. cognee/tests/test_search_db.py +136 -23
  221. cognee/tests/test_temporal_graph.py +167 -0
  222. cognee/tests/unit/api/__init__.py +1 -0
  223. cognee/tests/unit/api/test_conditional_authentication_endpoints.py +246 -0
  224. cognee/tests/unit/cli/__init__.py +3 -0
  225. cognee/tests/unit/cli/test_cli_commands.py +483 -0
  226. cognee/tests/unit/cli/test_cli_edge_cases.py +625 -0
  227. cognee/tests/unit/cli/test_cli_main.py +173 -0
  228. cognee/tests/unit/cli/test_cli_runner.py +62 -0
  229. cognee/tests/unit/cli/test_cli_utils.py +127 -0
  230. cognee/tests/unit/modules/retrieval/chunks_retriever_test.py +18 -2
  231. cognee/tests/unit/modules/retrieval/graph_completion_retriever_context_extension_test.py +12 -15
  232. cognee/tests/unit/modules/retrieval/graph_completion_retriever_cot_test.py +10 -15
  233. cognee/tests/unit/modules/retrieval/graph_completion_retriever_test.py +4 -3
  234. cognee/tests/unit/modules/retrieval/insights_retriever_test.py +4 -2
  235. cognee/tests/unit/modules/retrieval/rag_completion_retriever_test.py +18 -2
  236. cognee/tests/unit/modules/retrieval/temporal_retriever_test.py +225 -0
  237. cognee/tests/unit/modules/users/__init__.py +1 -0
  238. cognee/tests/unit/modules/users/test_conditional_authentication.py +277 -0
  239. cognee/tests/unit/processing/utils/utils_test.py +20 -1
  240. {cognee-0.2.3.dev1.dist-info → cognee-0.3.0.dist-info}/METADATA +13 -9
  241. {cognee-0.2.3.dev1.dist-info → cognee-0.3.0.dist-info}/RECORD +247 -135
  242. cognee-0.3.0.dist-info/entry_points.txt +2 -0
  243. cognee/infrastructure/databases/graph/networkx/adapter.py +0 -1017
  244. cognee/infrastructure/pipeline/models/Operation.py +0 -60
  245. cognee/notebooks/github_analysis_step_by_step.ipynb +0 -37
  246. cognee/tests/tasks/descriptive_metrics/networkx_metrics_test.py +0 -7
  247. cognee/tests/unit/modules/search/search_methods_test.py +0 -223
  248. /cognee/{infrastructure/databases/graph/networkx → api/v1/memify}/__init__.py +0 -0
  249. /cognee/{infrastructure/pipeline/models → tasks/codingagents}/__init__.py +0 -0
  250. {cognee-0.2.3.dev1.dist-info → cognee-0.3.0.dist-info}/WHEEL +0 -0
  251. {cognee-0.2.3.dev1.dist-info → cognee-0.3.0.dist-info}/licenses/LICENSE +0 -0
  252. {cognee-0.2.3.dev1.dist-info → cognee-0.3.0.dist-info}/licenses/NOTICE.md +0 -0
@@ -1,19 +1,25 @@
1
1
  from typing import Any, Optional, Type, List
2
- from collections import Counter
3
- import string
2
+ from uuid import NAMESPACE_OID, uuid5
4
3
 
5
4
  from cognee.infrastructure.engine import DataPoint
5
+ from cognee.modules.graph.cognee_graph.CogneeGraphElements import Edge
6
+ from cognee.modules.users.methods import get_default_user
7
+ from cognee.tasks.storage import add_data_points
8
+ from cognee.modules.graph.utils import resolve_edges_to_text
6
9
  from cognee.modules.graph.utils.convert_node_to_data_point import get_all_subclasses
7
- from cognee.modules.retrieval.base_retriever import BaseRetriever
10
+ from cognee.modules.retrieval.base_graph_retriever import BaseGraphRetriever
8
11
  from cognee.modules.retrieval.utils.brute_force_triplet_search import brute_force_triplet_search
9
12
  from cognee.modules.retrieval.utils.completion import generate_completion
10
- from cognee.modules.retrieval.utils.stop_words import DEFAULT_STOP_WORDS
11
13
  from cognee.shared.logging_utils import get_logger
14
+ from cognee.modules.retrieval.utils.extract_uuid_from_node import extract_uuid_from_node
15
+ from cognee.modules.retrieval.utils.models import CogneeUserInteraction
16
+ from cognee.modules.engine.models.node_set import NodeSet
17
+ from cognee.infrastructure.databases.graph import get_graph_engine
12
18
 
13
19
  logger = get_logger("GraphCompletionRetriever")
14
20
 
15
21
 
16
- class GraphCompletionRetriever(BaseRetriever):
22
+ class GraphCompletionRetriever(BaseGraphRetriever):
17
23
  """
18
24
  Retriever for handling graph-based completion searches.
19
25
 
@@ -30,33 +36,21 @@ class GraphCompletionRetriever(BaseRetriever):
30
36
  self,
31
37
  user_prompt_path: str = "graph_context_for_question.txt",
32
38
  system_prompt_path: str = "answer_simple_question.txt",
39
+ system_prompt: Optional[str] = None,
33
40
  top_k: Optional[int] = 5,
34
41
  node_type: Optional[Type] = None,
35
42
  node_name: Optional[List[str]] = None,
43
+ save_interaction: bool = False,
36
44
  ):
37
45
  """Initialize retriever with prompt paths and search parameters."""
46
+ self.save_interaction = save_interaction
38
47
  self.user_prompt_path = user_prompt_path
39
48
  self.system_prompt_path = system_prompt_path
49
+ self.system_prompt = system_prompt
40
50
  self.top_k = top_k if top_k is not None else 5
41
51
  self.node_type = node_type
42
52
  self.node_name = node_name
43
53
 
44
- def _get_nodes(self, retrieved_edges: list) -> dict:
45
- """Creates a dictionary of nodes with their names and content."""
46
- nodes = {}
47
- for edge in retrieved_edges:
48
- for node in (edge.node1, edge.node2):
49
- if node.id not in nodes:
50
- text = node.attributes.get("text")
51
- if text:
52
- name = self._get_title(text)
53
- content = text
54
- else:
55
- name = node.attributes.get("name", "Unnamed Node")
56
- content = node.attributes.get("description", name)
57
- nodes[node.id] = {"node": node, "name": name, "content": content}
58
- return nodes
59
-
60
54
  async def resolve_edges_to_text(self, retrieved_edges: list) -> str:
61
55
  """
62
56
  Converts retrieved graph edges into a human-readable string format.
@@ -71,18 +65,9 @@ class GraphCompletionRetriever(BaseRetriever):
71
65
 
72
66
  - str: A formatted string representation of the nodes and their connections.
73
67
  """
74
- nodes = self._get_nodes(retrieved_edges)
75
- node_section = "\n".join(
76
- f"Node: {info['name']}\n__node_content_start__\n{info['content']}\n__node_content_end__\n"
77
- for info in nodes.values()
78
- )
79
- connection_section = "\n".join(
80
- f"{nodes[edge.node1.id]['name']} --[{edge.attributes['relationship_type']}]--> {nodes[edge.node2.id]['name']}"
81
- for edge in retrieved_edges
82
- )
83
- return f"Nodes:\n{node_section}\n\nConnections:\n{connection_section}"
68
+ return await resolve_edges_to_text(retrieved_edges)
84
69
 
85
- async def get_triplets(self, query: str) -> list:
70
+ async def get_triplets(self, query: str) -> List[Edge]:
86
71
  """
87
72
  Retrieves relevant graph triplets based on a query string.
88
73
 
@@ -97,7 +82,7 @@ class GraphCompletionRetriever(BaseRetriever):
97
82
  - list: A list of found triplets that match the query.
98
83
  """
99
84
  subclasses = get_all_subclasses(DataPoint)
100
- vector_index_collections = []
85
+ vector_index_collections: List[str] = []
101
86
 
102
87
  for subclass in subclasses:
103
88
  if "metadata" in subclass.model_fields:
@@ -108,8 +93,11 @@ class GraphCompletionRetriever(BaseRetriever):
108
93
  for field_name in index_fields:
109
94
  vector_index_collections.append(f"{subclass.__name__}_{field_name}")
110
95
 
96
+ user = await get_default_user()
97
+
111
98
  found_triplets = await brute_force_triplet_search(
112
99
  query,
100
+ user=user,
113
101
  top_k=self.top_k,
114
102
  collections=vector_index_collections or None,
115
103
  node_type=self.node_type,
@@ -118,7 +106,7 @@ class GraphCompletionRetriever(BaseRetriever):
118
106
 
119
107
  return found_triplets
120
108
 
121
- async def get_context(self, query: str) -> str:
109
+ async def get_context(self, query: str) -> List[Edge]:
122
110
  """
123
111
  Retrieves and resolves graph triplets into context based on a query.
124
112
 
@@ -137,11 +125,17 @@ class GraphCompletionRetriever(BaseRetriever):
137
125
 
138
126
  if len(triplets) == 0:
139
127
  logger.warning("Empty context was provided to the completion")
140
- return ""
128
+ return []
129
+
130
+ # context = await self.resolve_edges_to_text(triplets)
141
131
 
142
- return await self.resolve_edges_to_text(triplets)
132
+ return triplets
143
133
 
144
- async def get_completion(self, query: str, context: Optional[Any] = None) -> Any:
134
+ async def get_completion(
135
+ self,
136
+ query: str,
137
+ context: Optional[List[Edge]] = None,
138
+ ) -> Any:
145
139
  """
146
140
  Generates a completion using graph connections context based on a query.
147
141
 
@@ -157,33 +151,90 @@ class GraphCompletionRetriever(BaseRetriever):
157
151
 
158
152
  - Any: A generated completion based on the query and context provided.
159
153
  """
160
- if context is None:
161
- context = await self.get_context(query)
154
+ triplets = context
155
+
156
+ if triplets is None:
157
+ triplets = await self.get_context(query)
158
+
159
+ context_text = await resolve_edges_to_text(triplets)
162
160
 
163
161
  completion = await generate_completion(
164
162
  query=query,
165
- context=context,
163
+ context=context_text,
166
164
  user_prompt_path=self.user_prompt_path,
167
165
  system_prompt_path=self.system_prompt_path,
166
+ system_prompt=self.system_prompt,
168
167
  )
169
- return [completion]
170
168
 
171
- def _top_n_words(self, text, stop_words=None, top_n=3, separator=", "):
172
- """Concatenates the top N frequent words in text."""
173
- if stop_words is None:
174
- stop_words = DEFAULT_STOP_WORDS
169
+ if self.save_interaction and context and triplets and completion:
170
+ await self.save_qa(
171
+ question=query, answer=completion, context=context_text, triplets=triplets
172
+ )
175
173
 
176
- words = [word.lower().strip(string.punctuation) for word in text.split()]
174
+ return completion
177
175
 
178
- if stop_words:
179
- words = [word for word in words if word and word not in stop_words]
180
-
181
- top_words = [word for word, freq in Counter(words).most_common(top_n)]
176
+ async def save_qa(self, question: str, answer: str, context: str, triplets: List) -> None:
177
+ """
178
+ Saves a question and answer pair for later analysis or storage.
179
+ Parameters:
180
+ -----------
181
+ - question (str): The question text.
182
+ - answer (str): The answer text.
183
+ - context (str): The context text.
184
+ - triplets (List): A list of triples retrieved from the graph.
185
+ """
186
+ nodeset_name = "Interactions"
187
+ interactions_node_set = NodeSet(
188
+ id=uuid5(NAMESPACE_OID, name=nodeset_name), name=nodeset_name
189
+ )
190
+ source_id = uuid5(NAMESPACE_OID, name=(question + answer + context))
182
191
 
183
- return separator.join(top_words)
192
+ cognee_user_interaction = CogneeUserInteraction(
193
+ id=source_id,
194
+ question=question,
195
+ answer=answer,
196
+ context=context,
197
+ belongs_to_set=interactions_node_set,
198
+ )
184
199
 
185
- def _get_title(self, text: str, first_n_words: int = 7, top_n_words: int = 3) -> str:
186
- """Creates a title, by combining first words with most frequent words from the text."""
187
- first_n_words = text.split()[:first_n_words]
188
- top_n_words = self._top_n_words(text, top_n=top_n_words)
189
- return f"{' '.join(first_n_words)}... [{top_n_words}]"
200
+ await add_data_points(data_points=[cognee_user_interaction], update_edge_collection=False)
201
+
202
+ relationships = []
203
+ relationship_name = "used_graph_element_to_answer"
204
+ for triplet in triplets:
205
+ target_id_1 = extract_uuid_from_node(triplet.node1)
206
+ target_id_2 = extract_uuid_from_node(triplet.node2)
207
+ if target_id_1 and target_id_2:
208
+ relationships.append(
209
+ (
210
+ source_id,
211
+ target_id_1,
212
+ relationship_name,
213
+ {
214
+ "relationship_name": relationship_name,
215
+ "source_node_id": source_id,
216
+ "target_node_id": target_id_1,
217
+ "ontology_valid": False,
218
+ "feedback_weight": 0,
219
+ },
220
+ )
221
+ )
222
+
223
+ relationships.append(
224
+ (
225
+ source_id,
226
+ target_id_2,
227
+ relationship_name,
228
+ {
229
+ "relationship_name": relationship_name,
230
+ "source_node_id": source_id,
231
+ "target_node_id": target_id_2,
232
+ "ontology_valid": False,
233
+ "feedback_weight": 0,
234
+ },
235
+ )
236
+ )
237
+
238
+ if len(relationships) > 0:
239
+ graph_engine = await get_graph_engine()
240
+ await graph_engine.add_edges(relationships)
@@ -21,9 +21,11 @@ class GraphSummaryCompletionRetriever(GraphCompletionRetriever):
21
21
  user_prompt_path: str = "graph_context_for_question.txt",
22
22
  system_prompt_path: str = "answer_simple_question.txt",
23
23
  summarize_prompt_path: str = "summarize_search_results.txt",
24
+ system_prompt: Optional[str] = None,
24
25
  top_k: Optional[int] = 5,
25
26
  node_type: Optional[Type] = None,
26
27
  node_name: Optional[List[str]] = None,
28
+ save_interaction: bool = False,
27
29
  ):
28
30
  """Initialize retriever with default prompt paths and search parameters."""
29
31
  super().__init__(
@@ -32,6 +34,8 @@ class GraphSummaryCompletionRetriever(GraphCompletionRetriever):
32
34
  top_k=top_k,
33
35
  node_type=node_type,
34
36
  node_name=node_name,
37
+ save_interaction=save_interaction,
38
+ system_prompt=system_prompt,
35
39
  )
36
40
  self.summarize_prompt_path = summarize_prompt_path
37
41
 
@@ -55,4 +59,4 @@ class GraphSummaryCompletionRetriever(GraphCompletionRetriever):
55
59
  - str: A summary string representing the content of the retrieved edges.
56
60
  """
57
61
  direct_text = await super().resolve_edges_to_text(retrieved_edges)
58
- return await summarize_text(direct_text, self.summarize_prompt_path)
62
+ return await summarize_text(direct_text, self.summarize_prompt_path, self.system_prompt)
@@ -1,17 +1,18 @@
1
1
  import asyncio
2
2
  from typing import Any, Optional
3
3
 
4
+ from cognee.modules.graph.cognee_graph.CogneeGraphElements import Edge, Node
5
+ from cognee.modules.retrieval.base_graph_retriever import BaseGraphRetriever
4
6
  from cognee.shared.logging_utils import get_logger
5
7
  from cognee.infrastructure.databases.graph import get_graph_engine
6
8
  from cognee.infrastructure.databases.vector import get_vector_engine
7
- from cognee.modules.retrieval.base_retriever import BaseRetriever
8
9
  from cognee.modules.retrieval.exceptions.exceptions import NoDataError
9
10
  from cognee.infrastructure.databases.vector.exceptions.exceptions import CollectionNotFoundError
10
11
 
11
12
  logger = get_logger("InsightsRetriever")
12
13
 
13
14
 
14
- class InsightsRetriever(BaseRetriever):
15
+ class InsightsRetriever(BaseGraphRetriever):
15
16
  """
16
17
  Retriever for handling graph connection-based insights.
17
18
 
@@ -95,7 +96,17 @@ class InsightsRetriever(BaseRetriever):
95
96
  unique_node_connections_map[unique_id] = True
96
97
  unique_node_connections.append(node_connection)
97
98
 
98
- return unique_node_connections
99
+ return [
100
+ Edge(
101
+ node1=Node(node_id=connection[0]["id"], attributes=connection[0]),
102
+ node2=Node(node_id=connection[2]["id"], attributes=connection[2]),
103
+ attributes={
104
+ **connection[1],
105
+ "relationship_type": connection[1]["relationship_name"],
106
+ },
107
+ )
108
+ for connection in unique_node_connections
109
+ ]
99
110
 
100
111
  async def get_completion(self, query: str, context: Optional[Any] = None) -> Any:
101
112
  """
@@ -1,7 +1,6 @@
1
1
  from typing import Any, Optional
2
2
  from cognee.shared.logging_utils import get_logger
3
3
  from cognee.infrastructure.databases.graph import get_graph_engine
4
- from cognee.infrastructure.databases.graph.networkx.adapter import NetworkXAdapter
5
4
  from cognee.infrastructure.llm.LLMGateway import LLMGateway
6
5
  from cognee.modules.retrieval.base_retriever import BaseRetriever
7
6
  from cognee.modules.retrieval.exceptions import SearchTypeNotSupported
@@ -123,9 +122,6 @@ class NaturalLanguageRetriever(BaseRetriever):
123
122
  """
124
123
  graph_engine = await get_graph_engine()
125
124
 
126
- if isinstance(graph_engine, (NetworkXAdapter)):
127
- raise SearchTypeNotSupported("Natural language search type not supported.")
128
-
129
125
  return await self._execute_cypher_query(query, graph_engine)
130
126
 
131
127
  async def get_completion(self, query: str, context: Optional[Any] = None) -> Any:
@@ -62,7 +62,7 @@ class SummariesRetriever(BaseRetriever):
62
62
  logger.info(f"Returning {len(summary_payloads)} summary payloads")
63
63
  return summary_payloads
64
64
 
65
- async def get_completion(self, query: str, context: Optional[Any] = None) -> Any:
65
+ async def get_completion(self, query: str, context: Optional[Any] = None, **kwargs) -> Any:
66
66
  """
67
67
  Generates a completion using summaries context.
68
68
 
@@ -0,0 +1,152 @@
1
+ import os
2
+ from typing import Any, Optional, List, Type
3
+
4
+
5
+ from operator import itemgetter
6
+ from cognee.infrastructure.databases.vector import get_vector_engine
7
+ from cognee.modules.retrieval.utils.completion import generate_completion
8
+ from cognee.infrastructure.databases.graph import get_graph_engine
9
+ from cognee.infrastructure.llm import LLMGateway
10
+ from cognee.modules.retrieval.graph_completion_retriever import GraphCompletionRetriever
11
+ from cognee.shared.logging_utils import get_logger
12
+
13
+
14
+ from cognee.tasks.temporal_graph.models import QueryInterval
15
+
16
+ logger = get_logger()
17
+
18
+
19
class TemporalRetriever(GraphCompletionRetriever):
    """
    Retriever that narrows the graph to events inside the time interval mentioned
    in the query before generating an answer.

    The flow implemented here is:

    1. Ask the LLM to extract a ``QueryInterval`` (``starts_at`` / ``ends_at``) from
       the query.
    2. Collect the matching timestamp ids and their events from the graph engine.
    3. Score the events with a vector search over the ``Event_name`` collection and
       keep the ``top_k`` events with the lowest scores.
    4. When no interval or no matching timestamp is found, fall back to the triplet
       search inherited from GraphCompletionRetriever.

    Public methods:

    - get_context
    - get_completion

    Instance variables include:
    - user_prompt_path
    - system_prompt_path
    - time_extraction_prompt_path
    - top_k
    - node_type
    - node_name
    """

    def __init__(
        self,
        user_prompt_path: str = "graph_context_for_question.txt",
        system_prompt_path: str = "answer_simple_question.txt",
        time_extraction_prompt_path: str = "extract_query_time.txt",
        top_k: Optional[int] = 5,
        node_type: Optional[Type] = None,
        node_name: Optional[List[str]] = None,
    ):
        """
        Configure prompts and search limits.

        Parameters:
        -----------

            - user_prompt_path (str): Prompt template used for the user message.
            - system_prompt_path (str): Prompt template used for the system message.
            - time_extraction_prompt_path (str): Prompt template used to extract the
              time interval from the query; may be an absolute path.
            - top_k (Optional[int]): Maximum number of events to keep; None means 5.
            - node_type (Optional[Type]): Forwarded to GraphCompletionRetriever.
            - node_name (Optional[List[str]]): Forwarded to GraphCompletionRetriever.
        """
        super().__init__(
            user_prompt_path=user_prompt_path,
            system_prompt_path=system_prompt_path,
            top_k=top_k,
            node_type=node_type,
            node_name=node_name,
        )
        # Set explicitly as well, so this class does not depend on which attributes
        # the parent constructor happens to store.
        self.user_prompt_path = user_prompt_path
        self.system_prompt_path = system_prompt_path
        self.time_extraction_prompt_path = time_extraction_prompt_path
        self.top_k = top_k if top_k is not None else 5
        self.node_type = node_type
        self.node_name = node_name

    def descriptions_to_string(self, results):
        """
        Join the non-empty ``description`` values of the given entries.

        Entries without a description (missing or empty) are skipped; the remaining
        descriptions are stripped and separated by a line of ``#`` characters.
        """
        descriptions = [
            entry["description"].strip() for entry in results if entry.get("description")
        ]
        return "\n#####################\n".join(descriptions)

    async def extract_time_from_query(self, query: str):
        """
        Ask the LLM for the time interval referenced by the query.

        Returns:
        --------

            - tuple: ``(starts_at, ends_at)`` of the extracted QueryInterval.
        """
        prompt_path = self.time_extraction_prompt_path

        # An absolute path is split into directory + file name so the prompt can be
        # rendered from a custom base directory.
        if os.path.isabs(prompt_path):
            base_directory = os.path.dirname(prompt_path)
            prompt_path = os.path.basename(prompt_path)
        else:
            base_directory = None

        system_prompt = LLMGateway.render_prompt(prompt_path, {}, base_directory=base_directory)

        interval = await LLMGateway.acreate_structured_output(query, system_prompt, QueryInterval)

        return interval.starts_at, interval.ends_at

    async def filter_top_k_events(self, relevant_events, scored_results):
        """
        Attach vector search scores to the events and keep the best ``top_k``.

        Events are sorted by ascending score; events that have no entry in
        ``scored_results`` get an infinite score and therefore sort last.

        Returns:
        --------

            - list: At most ``self.top_k`` event dicts, each with an added "score" key.
        """
        # Nothing to rank when the graph returned no event groups.
        if not relevant_events:
            return []

        # Build a score lookup from vector search results
        score_lookup = {res.payload["id"]: res.score for res in scored_results}

        events_with_scores = [
            {**event, "score": score_lookup.get(event["id"], float("inf"))}
            for event in relevant_events[0]["events"]
        ]
        events_with_scores.sort(key=itemgetter("score"))

        return events_with_scores[: self.top_k]

    async def _triplet_search_context(self, query: str) -> Any:
        """Fallback context: triplet search of the parent retriever rendered as text."""
        # Must not call self.get_context here: that is the caller and would recurse
        # forever, repeating the time extraction LLM call on every level.
        triplets = await self.get_triplets(query)
        return await self.resolve_edges_to_text(triplets)

    async def get_context(self, query: str) -> Any:
        """
        Retrieves context based on the query.

        Uses events that fall inside the time interval extracted from the query. When
        no interval is found, or no timestamps match it, falls back to the triplet
        search context.
        """
        time_from, time_to = await self.extract_time_from_query(query)

        graph_engine = await get_graph_engine()

        # Only pass the bounds that were actually extracted.
        time_bounds = {
            name: value
            for name, value in (("time_from", time_from), ("time_to", time_to))
            if value
        }

        if not time_bounds:
            logger.info(
                "No timestamps identified based on the query, performing retrieval using triplet search on events and entities."
            )
            return await self._triplet_search_context(query)

        ids = await graph_engine.collect_time_ids(**time_bounds)

        if not ids:
            logger.info(
                "No events identified based on timestamp filtering, performing retrieval using triplet search on events and entities."
            )
            return await self._triplet_search_context(query)

        relevant_events = await graph_engine.collect_events(ids=ids)

        vector_engine = get_vector_engine()
        query_vector = (await vector_engine.embedding_engine.embed_text([query]))[0]

        # NOTE(review): limit=0 presumably means "no limit" for the vector engine, so
        # that every event can receive a score - confirm against the adapter.
        vector_search_results = await vector_engine.search(
            collection_name="Event_name", query_vector=query_vector, limit=0
        )

        top_k_events = await self.filter_top_k_events(relevant_events, vector_search_results)

        return self.descriptions_to_string(top_k_events)

    async def get_completion(self, query: str, context: Optional[str] = None) -> str:
        """
        Generates a response using the query and optional context.

        When no context is passed it is retrieved with get_context. If the context
        is still empty, no LLM call is made and an empty string is returned.
        """
        if not context:
            context = await self.get_context(query=query)

        if not context:
            # Previously this path hit an unbound local variable.
            logger.info("No context available for the query, returning an empty completion.")
            return ""

        return await generate_completion(
            query=query,
            context=context,
            user_prompt_path=self.user_prompt_path,
            system_prompt_path=self.system_prompt_path,
        )
@@ -0,0 +1,83 @@
1
+ from typing import Any, Optional, List
2
+
3
+ from uuid import NAMESPACE_OID, uuid5, UUID
4
+ from cognee.infrastructure.databases.graph import get_graph_engine
5
+ from cognee.infrastructure.llm import LLMGateway
6
+ from cognee.modules.engine.models import NodeSet
7
+ from cognee.shared.logging_utils import get_logger
8
+ from cognee.modules.retrieval.base_feedback import BaseFeedback
9
+ from cognee.modules.retrieval.utils.models import CogneeUserFeedback
10
+ from cognee.modules.retrieval.utils.models import UserFeedbackEvaluation
11
+ from cognee.tasks.storage import add_data_points
12
+
13
+ logger = get_logger("CompletionRetriever")
14
+
15
+
16
+ class UserQAFeedback(BaseFeedback):
17
+ """
18
+ Interface for handling user feedback queries.
19
+ Public methods:
20
+ - get_context(query: str) -> str
21
+ - get_completion(query: str, context: Optional[Any] = None) -> Any
22
+ """
23
+
24
+ def __init__(self, last_k: Optional[int] = 1) -> None:
25
+ """Initialize retriever with optional custom prompt paths."""
26
+ self.last_k = last_k
27
+
28
+ async def add_feedback(self, feedback_text: str) -> List[str]:
29
+ feedback_sentiment = await LLMGateway.acreate_structured_output(
30
+ text_input=feedback_text,
31
+ system_prompt="You are a sentiment analysis assistant. For each piece of user feedback you receive, return exactly one of: Positive, Negative, or Neutral classification and a corresponding score from -5 (worst negative) to 5 (best positive)",
32
+ response_model=UserFeedbackEvaluation,
33
+ )
34
+
35
+ graph_engine = await get_graph_engine()
36
+ last_interaction_ids = await graph_engine.get_last_user_interaction_ids(limit=self.last_k)
37
+
38
+ nodeset_name = "UserQAFeedbacks"
39
+ feedbacks_node_set = NodeSet(id=uuid5(NAMESPACE_OID, name=nodeset_name), name=nodeset_name)
40
+ feedback_id = uuid5(NAMESPACE_OID, name=feedback_text)
41
+
42
+ cognee_user_feedback = CogneeUserFeedback(
43
+ id=feedback_id,
44
+ feedback=feedback_text,
45
+ sentiment=feedback_sentiment.evaluation.value,
46
+ score=feedback_sentiment.score,
47
+ belongs_to_set=feedbacks_node_set,
48
+ )
49
+
50
+ await add_data_points(data_points=[cognee_user_feedback], update_edge_collection=False)
51
+
52
+ relationships = []
53
+ relationship_name = "gives_feedback_to"
54
+ to_node_ids = []
55
+
56
+ for interaction_id in last_interaction_ids:
57
+ target_id_1 = feedback_id
58
+ target_id_2 = UUID(interaction_id)
59
+
60
+ if target_id_1 and target_id_2:
61
+ relationships.append(
62
+ (
63
+ target_id_1,
64
+ target_id_2,
65
+ relationship_name,
66
+ {
67
+ "relationship_name": relationship_name,
68
+ "source_node_id": target_id_1,
69
+ "target_node_id": target_id_2,
70
+ "ontology_valid": False,
71
+ },
72
+ )
73
+ )
74
+ to_node_ids.append(str(target_id_2))
75
+
76
+ if len(relationships) > 0:
77
+ graph_engine = await get_graph_engine()
78
+ await graph_engine.add_edges(relationships)
79
+ await graph_engine.apply_feedback_weight(
80
+ node_ids=to_node_ids, weight=feedback_sentiment.score
81
+ )
82
+
83
+ return [feedback_text]
@@ -8,7 +8,7 @@ from cognee.infrastructure.databases.vector.exceptions import CollectionNotFound
8
8
  from cognee.infrastructure.databases.graph import get_graph_engine
9
9
  from cognee.infrastructure.databases.vector import get_vector_engine
10
10
  from cognee.modules.graph.cognee_graph.CogneeGraph import CogneeGraph
11
- from cognee.modules.users.methods import get_default_user
11
+ from cognee.modules.graph.cognee_graph.CogneeGraphElements import Edge
12
12
  from cognee.modules.users.models import User
13
13
  from cognee.shared.utils import send_telemetry
14
14
 
@@ -63,9 +63,10 @@ async def get_memory_fragment(
63
63
  if properties_to_project is None:
64
64
  properties_to_project = ["id", "description", "name", "type", "text"]
65
65
 
66
+ memory_fragment = CogneeGraph()
67
+
66
68
  try:
67
69
  graph_engine = await get_graph_engine()
68
- memory_fragment = CogneeGraph()
69
70
 
70
71
  await memory_fragment.project_graph_from_db(
71
72
  graph_engine,
@@ -87,41 +88,15 @@ async def get_memory_fragment(
87
88
 
88
89
 
89
90
  async def brute_force_triplet_search(
90
- query: str,
91
- user: User = None,
92
- top_k: int = 5,
93
- collections: List[str] = None,
94
- properties_to_project: List[str] = None,
95
- memory_fragment: Optional[CogneeGraph] = None,
96
- node_type: Optional[Type] = None,
97
- node_name: Optional[List[str]] = None,
98
- ) -> list:
99
- if user is None:
100
- user = await get_default_user()
101
-
102
- retrieved_results = await brute_force_search(
103
- query,
104
- user,
105
- top_k,
106
- collections=collections,
107
- properties_to_project=properties_to_project,
108
- memory_fragment=memory_fragment,
109
- node_type=node_type,
110
- node_name=node_name,
111
- )
112
- return retrieved_results
113
-
114
-
115
- async def brute_force_search(
116
91
  query: str,
117
92
  user: User,
118
- top_k: int,
119
- collections: List[str] = None,
120
- properties_to_project: List[str] = None,
93
+ top_k: int = 5,
94
+ collections: Optional[List[str]] = None,
95
+ properties_to_project: Optional[List[str]] = None,
121
96
  memory_fragment: Optional[CogneeGraph] = None,
122
97
  node_type: Optional[Type] = None,
123
98
  node_name: Optional[List[str]] = None,
124
- ) -> list:
99
+ ) -> List[Edge]:
125
100
  """
126
101
  Performs a brute force search to retrieve the top triplets from the graph.
127
102