cognee 0.5.0__py3-none-any.whl → 0.5.0.dev0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- cognee/api/client.py +5 -1
- cognee/api/v1/add/add.py +1 -2
- cognee/api/v1/cognify/code_graph_pipeline.py +119 -0
- cognee/api/v1/cognify/cognify.py +16 -24
- cognee/api/v1/cognify/routers/__init__.py +1 -0
- cognee/api/v1/cognify/routers/get_code_pipeline_router.py +90 -0
- cognee/api/v1/cognify/routers/get_cognify_router.py +1 -3
- cognee/api/v1/datasets/routers/get_datasets_router.py +3 -3
- cognee/api/v1/ontologies/ontologies.py +37 -12
- cognee/api/v1/ontologies/routers/get_ontology_router.py +25 -27
- cognee/api/v1/search/search.py +0 -4
- cognee/api/v1/ui/ui.py +68 -38
- cognee/context_global_variables.py +16 -61
- cognee/eval_framework/answer_generation/answer_generation_executor.py +0 -10
- cognee/eval_framework/answer_generation/run_question_answering_module.py +1 -1
- cognee/eval_framework/corpus_builder/task_getters/get_cascade_graph_tasks.py +2 -0
- cognee/eval_framework/corpus_builder/task_getters/get_default_tasks_by_indices.py +4 -4
- cognee/eval_framework/eval_config.py +2 -2
- cognee/eval_framework/modal_run_eval.py +28 -16
- cognee/infrastructure/databases/graph/config.py +0 -3
- cognee/infrastructure/databases/graph/get_graph_engine.py +0 -1
- cognee/infrastructure/databases/graph/graph_db_interface.py +0 -15
- cognee/infrastructure/databases/graph/kuzu/adapter.py +0 -228
- cognee/infrastructure/databases/graph/neo4j_driver/adapter.py +1 -80
- cognee/infrastructure/databases/utils/__init__.py +0 -3
- cognee/infrastructure/databases/utils/get_or_create_dataset_database.py +48 -62
- cognee/infrastructure/databases/vector/config.py +0 -2
- cognee/infrastructure/databases/vector/create_vector_engine.py +0 -1
- cognee/infrastructure/databases/vector/embeddings/FastembedEmbeddingEngine.py +6 -8
- cognee/infrastructure/databases/vector/embeddings/LiteLLMEmbeddingEngine.py +7 -9
- cognee/infrastructure/databases/vector/embeddings/OllamaEmbeddingEngine.py +10 -11
- cognee/infrastructure/databases/vector/embeddings/embedding_rate_limiter.py +544 -0
- cognee/infrastructure/databases/vector/lancedb/LanceDBAdapter.py +0 -2
- cognee/infrastructure/databases/vector/vector_db_interface.py +0 -35
- cognee/infrastructure/files/storage/s3_config.py +0 -2
- cognee/infrastructure/llm/LLMGateway.py +2 -5
- cognee/infrastructure/llm/config.py +0 -35
- cognee/infrastructure/llm/extraction/knowledge_graph/extract_content_graph.py +2 -2
- cognee/infrastructure/llm/structured_output_framework/baml/baml_src/extraction/acreate_structured_output.py +8 -23
- cognee/infrastructure/llm/structured_output_framework/litellm_instructor/llm/anthropic/adapter.py +16 -17
- cognee/infrastructure/llm/structured_output_framework/litellm_instructor/llm/gemini/adapter.py +37 -40
- cognee/infrastructure/llm/structured_output_framework/litellm_instructor/llm/generic_llm_api/adapter.py +36 -39
- cognee/infrastructure/llm/structured_output_framework/litellm_instructor/llm/get_llm_client.py +1 -19
- cognee/infrastructure/llm/structured_output_framework/litellm_instructor/llm/mistral/adapter.py +9 -11
- cognee/infrastructure/llm/structured_output_framework/litellm_instructor/llm/ollama/adapter.py +21 -23
- cognee/infrastructure/llm/structured_output_framework/litellm_instructor/llm/openai/adapter.py +34 -42
- cognee/modules/cognify/config.py +0 -2
- cognee/modules/data/deletion/prune_system.py +2 -52
- cognee/modules/data/methods/delete_dataset.py +0 -26
- cognee/modules/engine/models/__init__.py +0 -1
- cognee/modules/graph/cognee_graph/CogneeGraph.py +37 -85
- cognee/modules/graph/cognee_graph/CogneeGraphElements.py +3 -8
- cognee/modules/memify/memify.py +7 -1
- cognee/modules/pipelines/operations/pipeline.py +2 -18
- cognee/modules/retrieval/__init__.py +1 -1
- cognee/modules/retrieval/code_retriever.py +232 -0
- cognee/modules/retrieval/graph_completion_context_extension_retriever.py +0 -4
- cognee/modules/retrieval/graph_completion_cot_retriever.py +0 -4
- cognee/modules/retrieval/graph_completion_retriever.py +0 -10
- cognee/modules/retrieval/graph_summary_completion_retriever.py +0 -4
- cognee/modules/retrieval/temporal_retriever.py +0 -4
- cognee/modules/retrieval/utils/brute_force_triplet_search.py +10 -42
- cognee/modules/run_custom_pipeline/run_custom_pipeline.py +1 -8
- cognee/modules/search/methods/get_search_type_tools.py +8 -54
- cognee/modules/search/methods/no_access_control_search.py +0 -4
- cognee/modules/search/methods/search.py +0 -21
- cognee/modules/search/types/SearchType.py +1 -1
- cognee/modules/settings/get_settings.py +0 -19
- cognee/modules/users/methods/get_authenticated_user.py +2 -2
- cognee/modules/users/models/DatasetDatabase.py +3 -15
- cognee/shared/logging_utils.py +0 -4
- cognee/tasks/code/enrich_dependency_graph_checker.py +35 -0
- cognee/tasks/code/get_local_dependencies_checker.py +20 -0
- cognee/tasks/code/get_repo_dependency_graph_checker.py +35 -0
- cognee/tasks/documents/__init__.py +1 -0
- cognee/tasks/documents/check_permissions_on_dataset.py +26 -0
- cognee/tasks/graph/extract_graph_from_data.py +10 -9
- cognee/tasks/repo_processor/__init__.py +2 -0
- cognee/tasks/repo_processor/get_local_dependencies.py +335 -0
- cognee/tasks/repo_processor/get_non_code_files.py +158 -0
- cognee/tasks/repo_processor/get_repo_file_dependencies.py +243 -0
- cognee/tasks/storage/add_data_points.py +2 -142
- cognee/tests/test_cognee_server_start.py +4 -2
- cognee/tests/test_conversation_history.py +1 -23
- cognee/tests/test_delete_bmw_example.py +60 -0
- cognee/tests/test_search_db.py +1 -37
- cognee/tests/unit/api/test_ontology_endpoint.py +89 -77
- cognee/tests/unit/infrastructure/mock_embedding_engine.py +7 -3
- cognee/tests/unit/infrastructure/test_embedding_rate_limiting_realistic.py +5 -0
- cognee/tests/unit/modules/graph/cognee_graph_elements_test.py +2 -2
- cognee/tests/unit/modules/graph/cognee_graph_test.py +0 -406
- {cognee-0.5.0.dist-info → cognee-0.5.0.dev0.dist-info}/METADATA +89 -76
- {cognee-0.5.0.dist-info → cognee-0.5.0.dev0.dist-info}/RECORD +97 -118
- {cognee-0.5.0.dist-info → cognee-0.5.0.dev0.dist-info}/WHEEL +1 -1
- cognee/api/v1/ui/node_setup.py +0 -360
- cognee/api/v1/ui/npm_utils.py +0 -50
- cognee/eval_framework/Dockerfile +0 -29
- cognee/infrastructure/databases/dataset_database_handler/__init__.py +0 -3
- cognee/infrastructure/databases/dataset_database_handler/dataset_database_handler_interface.py +0 -80
- cognee/infrastructure/databases/dataset_database_handler/supported_dataset_database_handlers.py +0 -18
- cognee/infrastructure/databases/dataset_database_handler/use_dataset_database_handler.py +0 -10
- cognee/infrastructure/databases/graph/kuzu/KuzuDatasetDatabaseHandler.py +0 -81
- cognee/infrastructure/databases/graph/neo4j_driver/Neo4jAuraDevDatasetDatabaseHandler.py +0 -168
- cognee/infrastructure/databases/utils/get_graph_dataset_database_handler.py +0 -10
- cognee/infrastructure/databases/utils/get_vector_dataset_database_handler.py +0 -10
- cognee/infrastructure/databases/utils/resolve_dataset_database_connection_info.py +0 -30
- cognee/infrastructure/databases/vector/lancedb/LanceDBDatasetDatabaseHandler.py +0 -50
- cognee/infrastructure/llm/structured_output_framework/litellm_instructor/llm/bedrock/__init__.py +0 -5
- cognee/infrastructure/llm/structured_output_framework/litellm_instructor/llm/bedrock/adapter.py +0 -153
- cognee/memify_pipelines/create_triplet_embeddings.py +0 -53
- cognee/modules/engine/models/Triplet.py +0 -9
- cognee/modules/retrieval/register_retriever.py +0 -10
- cognee/modules/retrieval/registered_community_retrievers.py +0 -1
- cognee/modules/retrieval/triplet_retriever.py +0 -182
- cognee/shared/rate_limiting.py +0 -30
- cognee/tasks/memify/get_triplet_datapoints.py +0 -289
- cognee/tests/integration/retrieval/test_triplet_retriever.py +0 -84
- cognee/tests/integration/tasks/test_add_data_points.py +0 -139
- cognee/tests/integration/tasks/test_get_triplet_datapoints.py +0 -69
- cognee/tests/test_dataset_database_handler.py +0 -137
- cognee/tests/test_dataset_delete.py +0 -76
- cognee/tests/test_edge_centered_payload.py +0 -170
- cognee/tests/test_pipeline_cache.py +0 -164
- cognee/tests/unit/infrastructure/llm/test_llm_config.py +0 -46
- cognee/tests/unit/modules/memify_tasks/test_get_triplet_datapoints.py +0 -214
- cognee/tests/unit/modules/retrieval/test_brute_force_triplet_search.py +0 -608
- cognee/tests/unit/modules/retrieval/triplet_retriever_test.py +0 -83
- cognee/tests/unit/tasks/storage/test_add_data_points.py +0 -288
- {cognee-0.5.0.dist-info → cognee-0.5.0.dev0.dist-info}/entry_points.txt +0 -0
- {cognee-0.5.0.dist-info → cognee-0.5.0.dev0.dist-info}/licenses/LICENSE +0 -0
- {cognee-0.5.0.dist-info → cognee-0.5.0.dev0.dist-info}/licenses/NOTICE.md +0 -0
|
@@ -1,5 +1,4 @@
|
|
|
1
1
|
import pytest
|
|
2
|
-
from unittest.mock import AsyncMock
|
|
3
2
|
|
|
4
3
|
from cognee.modules.graph.exceptions import EntityNotFoundError, EntityAlreadyExistsError
|
|
5
4
|
from cognee.modules.graph.cognee_graph.CogneeGraph import CogneeGraph
|
|
@@ -12,30 +11,6 @@ def setup_graph():
|
|
|
12
11
|
return CogneeGraph()
|
|
13
12
|
|
|
14
13
|
|
|
15
|
-
@pytest.fixture
|
|
16
|
-
def mock_adapter():
|
|
17
|
-
"""Fixture to create a mock adapter for database operations."""
|
|
18
|
-
adapter = AsyncMock()
|
|
19
|
-
return adapter
|
|
20
|
-
|
|
21
|
-
|
|
22
|
-
@pytest.fixture
|
|
23
|
-
def mock_vector_engine():
|
|
24
|
-
"""Fixture to create a mock vector engine."""
|
|
25
|
-
engine = AsyncMock()
|
|
26
|
-
engine.search = AsyncMock()
|
|
27
|
-
return engine
|
|
28
|
-
|
|
29
|
-
|
|
30
|
-
class MockScoredResult:
|
|
31
|
-
"""Mock class for vector search results."""
|
|
32
|
-
|
|
33
|
-
def __init__(self, id, score, payload=None):
|
|
34
|
-
self.id = id
|
|
35
|
-
self.score = score
|
|
36
|
-
self.payload = payload or {}
|
|
37
|
-
|
|
38
|
-
|
|
39
14
|
def test_add_node_success(setup_graph):
|
|
40
15
|
"""Test successful addition of a node."""
|
|
41
16
|
graph = setup_graph
|
|
@@ -98,384 +73,3 @@ def test_get_edges_nonexistent_node(setup_graph):
|
|
|
98
73
|
graph = setup_graph
|
|
99
74
|
with pytest.raises(EntityNotFoundError, match="Node with id nonexistent does not exist."):
|
|
100
75
|
graph.get_edges_from_node("nonexistent")
|
|
101
|
-
|
|
102
|
-
|
|
103
|
-
@pytest.mark.asyncio
|
|
104
|
-
async def test_project_graph_from_db_full_graph(setup_graph, mock_adapter):
|
|
105
|
-
"""Test projecting a full graph from database."""
|
|
106
|
-
graph = setup_graph
|
|
107
|
-
|
|
108
|
-
nodes_data = [
|
|
109
|
-
("1", {"name": "Node1", "description": "First node"}),
|
|
110
|
-
("2", {"name": "Node2", "description": "Second node"}),
|
|
111
|
-
]
|
|
112
|
-
edges_data = [
|
|
113
|
-
("1", "2", "CONNECTS_TO", {"relationship_name": "connects"}),
|
|
114
|
-
]
|
|
115
|
-
|
|
116
|
-
mock_adapter.get_graph_data = AsyncMock(return_value=(nodes_data, edges_data))
|
|
117
|
-
|
|
118
|
-
await graph.project_graph_from_db(
|
|
119
|
-
adapter=mock_adapter,
|
|
120
|
-
node_properties_to_project=["name", "description"],
|
|
121
|
-
edge_properties_to_project=["relationship_name"],
|
|
122
|
-
)
|
|
123
|
-
|
|
124
|
-
assert len(graph.nodes) == 2
|
|
125
|
-
assert len(graph.edges) == 1
|
|
126
|
-
assert graph.get_node("1") is not None
|
|
127
|
-
assert graph.get_node("2") is not None
|
|
128
|
-
assert graph.edges[0].node1.id == "1"
|
|
129
|
-
assert graph.edges[0].node2.id == "2"
|
|
130
|
-
|
|
131
|
-
|
|
132
|
-
@pytest.mark.asyncio
|
|
133
|
-
async def test_project_graph_from_db_id_filtered(setup_graph, mock_adapter):
|
|
134
|
-
"""Test projecting an ID-filtered graph from database."""
|
|
135
|
-
graph = setup_graph
|
|
136
|
-
|
|
137
|
-
nodes_data = [
|
|
138
|
-
("1", {"name": "Node1"}),
|
|
139
|
-
("2", {"name": "Node2"}),
|
|
140
|
-
]
|
|
141
|
-
edges_data = [
|
|
142
|
-
("1", "2", "CONNECTS_TO", {"relationship_name": "connects"}),
|
|
143
|
-
]
|
|
144
|
-
|
|
145
|
-
mock_adapter.get_id_filtered_graph_data = AsyncMock(return_value=(nodes_data, edges_data))
|
|
146
|
-
|
|
147
|
-
await graph.project_graph_from_db(
|
|
148
|
-
adapter=mock_adapter,
|
|
149
|
-
node_properties_to_project=["name"],
|
|
150
|
-
edge_properties_to_project=["relationship_name"],
|
|
151
|
-
relevant_ids_to_filter=["1", "2"],
|
|
152
|
-
)
|
|
153
|
-
|
|
154
|
-
assert len(graph.nodes) == 2
|
|
155
|
-
assert len(graph.edges) == 1
|
|
156
|
-
mock_adapter.get_id_filtered_graph_data.assert_called_once()
|
|
157
|
-
|
|
158
|
-
|
|
159
|
-
@pytest.mark.asyncio
|
|
160
|
-
async def test_project_graph_from_db_nodeset_subgraph(setup_graph, mock_adapter):
|
|
161
|
-
"""Test projecting a nodeset subgraph filtered by node type and name."""
|
|
162
|
-
graph = setup_graph
|
|
163
|
-
|
|
164
|
-
nodes_data = [
|
|
165
|
-
("1", {"name": "Alice", "type": "Person"}),
|
|
166
|
-
("2", {"name": "Bob", "type": "Person"}),
|
|
167
|
-
]
|
|
168
|
-
edges_data = [
|
|
169
|
-
("1", "2", "KNOWS", {"relationship_name": "knows"}),
|
|
170
|
-
]
|
|
171
|
-
|
|
172
|
-
mock_adapter.get_nodeset_subgraph = AsyncMock(return_value=(nodes_data, edges_data))
|
|
173
|
-
|
|
174
|
-
await graph.project_graph_from_db(
|
|
175
|
-
adapter=mock_adapter,
|
|
176
|
-
node_properties_to_project=["name", "type"],
|
|
177
|
-
edge_properties_to_project=["relationship_name"],
|
|
178
|
-
node_type="Person",
|
|
179
|
-
node_name=["Alice"],
|
|
180
|
-
)
|
|
181
|
-
|
|
182
|
-
assert len(graph.nodes) == 2
|
|
183
|
-
assert graph.get_node("1") is not None
|
|
184
|
-
assert len(graph.edges) == 1
|
|
185
|
-
mock_adapter.get_nodeset_subgraph.assert_called_once()
|
|
186
|
-
|
|
187
|
-
|
|
188
|
-
@pytest.mark.asyncio
|
|
189
|
-
async def test_project_graph_from_db_empty_graph(setup_graph, mock_adapter):
|
|
190
|
-
"""Test projecting empty graph raises EntityNotFoundError."""
|
|
191
|
-
graph = setup_graph
|
|
192
|
-
|
|
193
|
-
mock_adapter.get_graph_data = AsyncMock(return_value=([], []))
|
|
194
|
-
|
|
195
|
-
with pytest.raises(EntityNotFoundError, match="Empty graph projected from the database."):
|
|
196
|
-
await graph.project_graph_from_db(
|
|
197
|
-
adapter=mock_adapter,
|
|
198
|
-
node_properties_to_project=["name"],
|
|
199
|
-
edge_properties_to_project=[],
|
|
200
|
-
)
|
|
201
|
-
|
|
202
|
-
|
|
203
|
-
@pytest.mark.asyncio
|
|
204
|
-
async def test_project_graph_from_db_missing_nodes(setup_graph, mock_adapter):
|
|
205
|
-
"""Test that edges referencing missing nodes raise error."""
|
|
206
|
-
graph = setup_graph
|
|
207
|
-
|
|
208
|
-
nodes_data = [
|
|
209
|
-
("1", {"name": "Node1"}),
|
|
210
|
-
]
|
|
211
|
-
edges_data = [
|
|
212
|
-
("1", "999", "CONNECTS_TO", {"relationship_name": "connects"}),
|
|
213
|
-
]
|
|
214
|
-
|
|
215
|
-
mock_adapter.get_graph_data = AsyncMock(return_value=(nodes_data, edges_data))
|
|
216
|
-
|
|
217
|
-
with pytest.raises(EntityNotFoundError, match="Edge references nonexistent nodes"):
|
|
218
|
-
await graph.project_graph_from_db(
|
|
219
|
-
adapter=mock_adapter,
|
|
220
|
-
node_properties_to_project=["name"],
|
|
221
|
-
edge_properties_to_project=["relationship_name"],
|
|
222
|
-
)
|
|
223
|
-
|
|
224
|
-
|
|
225
|
-
@pytest.mark.asyncio
|
|
226
|
-
async def test_map_vector_distances_to_graph_nodes(setup_graph):
|
|
227
|
-
"""Test mapping vector distances to graph nodes."""
|
|
228
|
-
graph = setup_graph
|
|
229
|
-
|
|
230
|
-
node1 = Node("1", {"name": "Node1"})
|
|
231
|
-
node2 = Node("2", {"name": "Node2"})
|
|
232
|
-
graph.add_node(node1)
|
|
233
|
-
graph.add_node(node2)
|
|
234
|
-
|
|
235
|
-
node_distances = {
|
|
236
|
-
"Entity_name": [
|
|
237
|
-
MockScoredResult("1", 0.95),
|
|
238
|
-
MockScoredResult("2", 0.87),
|
|
239
|
-
]
|
|
240
|
-
}
|
|
241
|
-
|
|
242
|
-
await graph.map_vector_distances_to_graph_nodes(node_distances)
|
|
243
|
-
|
|
244
|
-
assert graph.get_node("1").attributes.get("vector_distance") == 0.95
|
|
245
|
-
assert graph.get_node("2").attributes.get("vector_distance") == 0.87
|
|
246
|
-
|
|
247
|
-
|
|
248
|
-
@pytest.mark.asyncio
|
|
249
|
-
async def test_map_vector_distances_partial_node_coverage(setup_graph):
|
|
250
|
-
"""Test mapping vector distances when only some nodes have results."""
|
|
251
|
-
graph = setup_graph
|
|
252
|
-
|
|
253
|
-
node1 = Node("1", {"name": "Node1"})
|
|
254
|
-
node2 = Node("2", {"name": "Node2"})
|
|
255
|
-
node3 = Node("3", {"name": "Node3"})
|
|
256
|
-
graph.add_node(node1)
|
|
257
|
-
graph.add_node(node2)
|
|
258
|
-
graph.add_node(node3)
|
|
259
|
-
|
|
260
|
-
node_distances = {
|
|
261
|
-
"Entity_name": [
|
|
262
|
-
MockScoredResult("1", 0.95),
|
|
263
|
-
MockScoredResult("2", 0.87),
|
|
264
|
-
]
|
|
265
|
-
}
|
|
266
|
-
|
|
267
|
-
await graph.map_vector_distances_to_graph_nodes(node_distances)
|
|
268
|
-
|
|
269
|
-
assert graph.get_node("1").attributes.get("vector_distance") == 0.95
|
|
270
|
-
assert graph.get_node("2").attributes.get("vector_distance") == 0.87
|
|
271
|
-
assert graph.get_node("3").attributes.get("vector_distance") == 3.5
|
|
272
|
-
|
|
273
|
-
|
|
274
|
-
@pytest.mark.asyncio
|
|
275
|
-
async def test_map_vector_distances_multiple_categories(setup_graph):
|
|
276
|
-
"""Test mapping vector distances from multiple collection categories."""
|
|
277
|
-
graph = setup_graph
|
|
278
|
-
|
|
279
|
-
# Create nodes
|
|
280
|
-
node1 = Node("1")
|
|
281
|
-
node2 = Node("2")
|
|
282
|
-
node3 = Node("3")
|
|
283
|
-
node4 = Node("4")
|
|
284
|
-
graph.add_node(node1)
|
|
285
|
-
graph.add_node(node2)
|
|
286
|
-
graph.add_node(node3)
|
|
287
|
-
graph.add_node(node4)
|
|
288
|
-
|
|
289
|
-
node_distances = {
|
|
290
|
-
"Entity_name": [
|
|
291
|
-
MockScoredResult("1", 0.95),
|
|
292
|
-
MockScoredResult("2", 0.87),
|
|
293
|
-
],
|
|
294
|
-
"TextSummary_text": [
|
|
295
|
-
MockScoredResult("3", 0.92),
|
|
296
|
-
],
|
|
297
|
-
}
|
|
298
|
-
|
|
299
|
-
await graph.map_vector_distances_to_graph_nodes(node_distances)
|
|
300
|
-
|
|
301
|
-
assert graph.get_node("1").attributes.get("vector_distance") == 0.95
|
|
302
|
-
assert graph.get_node("2").attributes.get("vector_distance") == 0.87
|
|
303
|
-
assert graph.get_node("3").attributes.get("vector_distance") == 0.92
|
|
304
|
-
assert graph.get_node("4").attributes.get("vector_distance") == 3.5
|
|
305
|
-
|
|
306
|
-
|
|
307
|
-
@pytest.mark.asyncio
|
|
308
|
-
async def test_map_vector_distances_to_graph_edges_with_payload(setup_graph):
|
|
309
|
-
"""Test mapping vector distances to edges when edge_distances provided."""
|
|
310
|
-
graph = setup_graph
|
|
311
|
-
|
|
312
|
-
node1 = Node("1")
|
|
313
|
-
node2 = Node("2")
|
|
314
|
-
graph.add_node(node1)
|
|
315
|
-
graph.add_node(node2)
|
|
316
|
-
|
|
317
|
-
edge = Edge(
|
|
318
|
-
node1,
|
|
319
|
-
node2,
|
|
320
|
-
attributes={"edge_text": "CONNECTS_TO", "relationship_type": "connects"},
|
|
321
|
-
)
|
|
322
|
-
graph.add_edge(edge)
|
|
323
|
-
|
|
324
|
-
edge_distances = [
|
|
325
|
-
MockScoredResult("e1", 0.92, payload={"text": "CONNECTS_TO"}),
|
|
326
|
-
]
|
|
327
|
-
|
|
328
|
-
await graph.map_vector_distances_to_graph_edges(edge_distances=edge_distances)
|
|
329
|
-
|
|
330
|
-
assert graph.edges[0].attributes.get("vector_distance") == 0.92
|
|
331
|
-
|
|
332
|
-
|
|
333
|
-
@pytest.mark.asyncio
|
|
334
|
-
async def test_map_vector_distances_partial_edge_coverage(setup_graph):
|
|
335
|
-
"""Test mapping edge distances when only some edges have results."""
|
|
336
|
-
graph = setup_graph
|
|
337
|
-
|
|
338
|
-
node1 = Node("1")
|
|
339
|
-
node2 = Node("2")
|
|
340
|
-
node3 = Node("3")
|
|
341
|
-
graph.add_node(node1)
|
|
342
|
-
graph.add_node(node2)
|
|
343
|
-
graph.add_node(node3)
|
|
344
|
-
|
|
345
|
-
edge1 = Edge(node1, node2, attributes={"edge_text": "CONNECTS_TO"})
|
|
346
|
-
edge2 = Edge(node2, node3, attributes={"edge_text": "DEPENDS_ON"})
|
|
347
|
-
graph.add_edge(edge1)
|
|
348
|
-
graph.add_edge(edge2)
|
|
349
|
-
|
|
350
|
-
edge_distances = [
|
|
351
|
-
MockScoredResult("e1", 0.92, payload={"text": "CONNECTS_TO"}),
|
|
352
|
-
]
|
|
353
|
-
|
|
354
|
-
await graph.map_vector_distances_to_graph_edges(edge_distances=edge_distances)
|
|
355
|
-
|
|
356
|
-
assert graph.edges[0].attributes.get("vector_distance") == 0.92
|
|
357
|
-
assert graph.edges[1].attributes.get("vector_distance") == 3.5
|
|
358
|
-
|
|
359
|
-
|
|
360
|
-
@pytest.mark.asyncio
|
|
361
|
-
async def test_map_vector_distances_edges_fallback_to_relationship_type(setup_graph):
|
|
362
|
-
"""Test that edge mapping falls back to relationship_type when edge_text is missing."""
|
|
363
|
-
graph = setup_graph
|
|
364
|
-
|
|
365
|
-
node1 = Node("1")
|
|
366
|
-
node2 = Node("2")
|
|
367
|
-
graph.add_node(node1)
|
|
368
|
-
graph.add_node(node2)
|
|
369
|
-
|
|
370
|
-
edge = Edge(
|
|
371
|
-
node1,
|
|
372
|
-
node2,
|
|
373
|
-
attributes={"relationship_type": "KNOWS"},
|
|
374
|
-
)
|
|
375
|
-
graph.add_edge(edge)
|
|
376
|
-
|
|
377
|
-
edge_distances = [
|
|
378
|
-
MockScoredResult("e1", 0.85, payload={"text": "KNOWS"}),
|
|
379
|
-
]
|
|
380
|
-
|
|
381
|
-
await graph.map_vector_distances_to_graph_edges(edge_distances=edge_distances)
|
|
382
|
-
|
|
383
|
-
assert graph.edges[0].attributes.get("vector_distance") == 0.85
|
|
384
|
-
|
|
385
|
-
|
|
386
|
-
@pytest.mark.asyncio
|
|
387
|
-
async def test_map_vector_distances_no_edge_matches(setup_graph):
|
|
388
|
-
"""Test edge mapping when no edges match the distance results."""
|
|
389
|
-
graph = setup_graph
|
|
390
|
-
|
|
391
|
-
node1 = Node("1")
|
|
392
|
-
node2 = Node("2")
|
|
393
|
-
graph.add_node(node1)
|
|
394
|
-
graph.add_node(node2)
|
|
395
|
-
|
|
396
|
-
edge = Edge(
|
|
397
|
-
node1,
|
|
398
|
-
node2,
|
|
399
|
-
attributes={"edge_text": "CONNECTS_TO", "relationship_type": "connects"},
|
|
400
|
-
)
|
|
401
|
-
graph.add_edge(edge)
|
|
402
|
-
|
|
403
|
-
edge_distances = [
|
|
404
|
-
MockScoredResult("e1", 0.92, payload={"text": "SOME_OTHER_EDGE"}),
|
|
405
|
-
]
|
|
406
|
-
|
|
407
|
-
await graph.map_vector_distances_to_graph_edges(edge_distances=edge_distances)
|
|
408
|
-
|
|
409
|
-
assert graph.edges[0].attributes.get("vector_distance") == 3.5
|
|
410
|
-
|
|
411
|
-
|
|
412
|
-
@pytest.mark.asyncio
|
|
413
|
-
async def test_map_vector_distances_none_returns_early(setup_graph):
|
|
414
|
-
"""Test that edge_distances=None returns early without error."""
|
|
415
|
-
graph = setup_graph
|
|
416
|
-
graph.add_node(Node("1"))
|
|
417
|
-
graph.add_node(Node("2"))
|
|
418
|
-
graph.add_edge(Edge(graph.get_node("1"), graph.get_node("2")))
|
|
419
|
-
|
|
420
|
-
await graph.map_vector_distances_to_graph_edges(edge_distances=None)
|
|
421
|
-
|
|
422
|
-
assert graph.edges[0].attributes.get("vector_distance") == 3.5
|
|
423
|
-
|
|
424
|
-
|
|
425
|
-
@pytest.mark.asyncio
|
|
426
|
-
async def test_calculate_top_triplet_importances(setup_graph):
|
|
427
|
-
"""Test calculating top triplet importances by score."""
|
|
428
|
-
graph = setup_graph
|
|
429
|
-
|
|
430
|
-
node1 = Node("1")
|
|
431
|
-
node2 = Node("2")
|
|
432
|
-
node3 = Node("3")
|
|
433
|
-
node4 = Node("4")
|
|
434
|
-
|
|
435
|
-
node1.add_attribute("vector_distance", 0.9)
|
|
436
|
-
node2.add_attribute("vector_distance", 0.8)
|
|
437
|
-
node3.add_attribute("vector_distance", 0.7)
|
|
438
|
-
node4.add_attribute("vector_distance", 0.6)
|
|
439
|
-
|
|
440
|
-
graph.add_node(node1)
|
|
441
|
-
graph.add_node(node2)
|
|
442
|
-
graph.add_node(node3)
|
|
443
|
-
graph.add_node(node4)
|
|
444
|
-
|
|
445
|
-
edge1 = Edge(node1, node2)
|
|
446
|
-
edge2 = Edge(node2, node3)
|
|
447
|
-
edge3 = Edge(node3, node4)
|
|
448
|
-
|
|
449
|
-
edge1.add_attribute("vector_distance", 0.85)
|
|
450
|
-
edge2.add_attribute("vector_distance", 0.75)
|
|
451
|
-
edge3.add_attribute("vector_distance", 0.65)
|
|
452
|
-
|
|
453
|
-
graph.add_edge(edge1)
|
|
454
|
-
graph.add_edge(edge2)
|
|
455
|
-
graph.add_edge(edge3)
|
|
456
|
-
|
|
457
|
-
top_triplets = await graph.calculate_top_triplet_importances(k=2)
|
|
458
|
-
|
|
459
|
-
assert len(top_triplets) == 2
|
|
460
|
-
|
|
461
|
-
assert top_triplets[0] == edge3
|
|
462
|
-
assert top_triplets[1] == edge2
|
|
463
|
-
|
|
464
|
-
|
|
465
|
-
@pytest.mark.asyncio
|
|
466
|
-
async def test_calculate_top_triplet_importances_default_distances(setup_graph):
|
|
467
|
-
"""Test calculating importances when nodes/edges have no vector distances."""
|
|
468
|
-
graph = setup_graph
|
|
469
|
-
|
|
470
|
-
node1 = Node("1")
|
|
471
|
-
node2 = Node("2")
|
|
472
|
-
graph.add_node(node1)
|
|
473
|
-
graph.add_node(node2)
|
|
474
|
-
|
|
475
|
-
edge = Edge(node1, node2)
|
|
476
|
-
graph.add_edge(edge)
|
|
477
|
-
|
|
478
|
-
top_triplets = await graph.calculate_top_triplet_importances(k=1)
|
|
479
|
-
|
|
480
|
-
assert len(top_triplets) == 1
|
|
481
|
-
assert top_triplets[0] == edge
|