cognee 0.2.3.dev0__py3-none-any.whl → 0.2.4__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- cognee/__main__.py +4 -0
- cognee/api/v1/add/add.py +18 -11
- cognee/api/v1/cognify/code_graph_pipeline.py +7 -1
- cognee/api/v1/cognify/cognify.py +22 -115
- cognee/api/v1/cognify/routers/get_cognify_router.py +11 -3
- cognee/api/v1/config/config.py +5 -13
- cognee/api/v1/datasets/routers/get_datasets_router.py +2 -2
- cognee/api/v1/delete/delete.py +1 -1
- cognee/api/v1/exceptions/__init__.py +13 -0
- cognee/api/v1/{delete → exceptions}/exceptions.py +15 -12
- cognee/api/v1/responses/default_tools.py +4 -0
- cognee/api/v1/responses/dispatch_function.py +6 -1
- cognee/api/v1/responses/models.py +1 -1
- cognee/api/v1/search/search.py +6 -7
- cognee/cli/__init__.py +10 -0
- cognee/cli/_cognee.py +180 -0
- cognee/cli/commands/__init__.py +1 -0
- cognee/cli/commands/add_command.py +80 -0
- cognee/cli/commands/cognify_command.py +128 -0
- cognee/cli/commands/config_command.py +225 -0
- cognee/cli/commands/delete_command.py +80 -0
- cognee/cli/commands/search_command.py +149 -0
- cognee/cli/config.py +33 -0
- cognee/cli/debug.py +21 -0
- cognee/cli/echo.py +45 -0
- cognee/cli/exceptions.py +23 -0
- cognee/cli/minimal_cli.py +97 -0
- cognee/cli/reference.py +26 -0
- cognee/cli/suppress_logging.py +12 -0
- cognee/eval_framework/corpus_builder/corpus_builder_executor.py +2 -2
- cognee/eval_framework/eval_config.py +1 -1
- cognee/exceptions/__init__.py +5 -5
- cognee/exceptions/exceptions.py +37 -17
- cognee/infrastructure/data/exceptions/__init__.py +7 -0
- cognee/infrastructure/data/exceptions/exceptions.py +22 -0
- cognee/infrastructure/data/utils/extract_keywords.py +3 -3
- cognee/infrastructure/databases/exceptions/__init__.py +3 -0
- cognee/infrastructure/databases/exceptions/exceptions.py +57 -9
- cognee/infrastructure/databases/graph/get_graph_engine.py +4 -9
- cognee/infrastructure/databases/graph/kuzu/adapter.py +64 -2
- cognee/infrastructure/databases/graph/neo4j_driver/adapter.py +49 -0
- cognee/infrastructure/databases/graph/neptune_driver/exceptions.py +15 -10
- cognee/infrastructure/databases/hybrid/falkordb/FalkorDBAdapter.py +2 -2
- cognee/infrastructure/databases/hybrid/neptune_analytics/NeptuneAnalyticsAdapter.py +4 -5
- cognee/infrastructure/databases/vector/chromadb/ChromaDBAdapter.py +2 -2
- cognee/infrastructure/databases/vector/embeddings/FastembedEmbeddingEngine.py +5 -3
- cognee/infrastructure/databases/vector/embeddings/LiteLLMEmbeddingEngine.py +17 -8
- cognee/infrastructure/databases/vector/embeddings/OllamaEmbeddingEngine.py +5 -5
- cognee/infrastructure/databases/vector/embeddings/config.py +2 -2
- cognee/infrastructure/databases/vector/embeddings/get_embedding_engine.py +6 -6
- cognee/infrastructure/databases/vector/exceptions/exceptions.py +3 -3
- cognee/infrastructure/databases/vector/lancedb/LanceDBAdapter.py +2 -2
- cognee/infrastructure/databases/vector/pgvector/PGVectorAdapter.py +4 -3
- cognee/infrastructure/files/utils/get_data_file_path.py +14 -9
- cognee/infrastructure/files/utils/get_file_metadata.py +2 -1
- cognee/infrastructure/llm/LLMGateway.py +14 -5
- cognee/infrastructure/llm/config.py +5 -5
- cognee/infrastructure/llm/exceptions.py +30 -2
- cognee/infrastructure/llm/structured_output_framework/baml/baml_src/extraction/knowledge_graph/extract_content_graph.py +16 -5
- cognee/infrastructure/llm/structured_output_framework/litellm_instructor/extraction/knowledge_graph/extract_content_graph.py +19 -15
- cognee/infrastructure/llm/structured_output_framework/litellm_instructor/llm/anthropic/adapter.py +5 -5
- cognee/infrastructure/llm/structured_output_framework/litellm_instructor/llm/gemini/adapter.py +6 -6
- cognee/infrastructure/llm/structured_output_framework/litellm_instructor/llm/generic_llm_api/adapter.py +2 -2
- cognee/infrastructure/llm/structured_output_framework/litellm_instructor/llm/get_llm_client.py +24 -15
- cognee/infrastructure/llm/structured_output_framework/litellm_instructor/llm/ollama/adapter.py +6 -4
- cognee/infrastructure/llm/structured_output_framework/litellm_instructor/llm/openai/adapter.py +9 -7
- cognee/infrastructure/llm/tokenizer/Gemini/adapter.py +2 -2
- cognee/infrastructure/llm/tokenizer/HuggingFace/adapter.py +3 -3
- cognee/infrastructure/llm/tokenizer/Mistral/adapter.py +3 -3
- cognee/infrastructure/llm/tokenizer/TikToken/adapter.py +6 -6
- cognee/infrastructure/llm/utils.py +7 -7
- cognee/modules/data/exceptions/exceptions.py +18 -5
- cognee/modules/data/methods/__init__.py +2 -0
- cognee/modules/data/methods/create_authorized_dataset.py +19 -0
- cognee/modules/data/methods/delete_data.py +2 -4
- cognee/modules/data/methods/get_authorized_dataset.py +11 -5
- cognee/modules/data/methods/get_authorized_dataset_by_name.py +16 -0
- cognee/modules/data/methods/load_or_create_datasets.py +2 -20
- cognee/modules/data/processing/document_types/exceptions/exceptions.py +2 -2
- cognee/modules/graph/cognee_graph/CogneeGraph.py +6 -4
- cognee/modules/graph/cognee_graph/CogneeGraphElements.py +5 -10
- cognee/modules/graph/exceptions/__init__.py +2 -0
- cognee/modules/graph/exceptions/exceptions.py +25 -3
- cognee/modules/graph/methods/get_formatted_graph_data.py +3 -2
- cognee/modules/ingestion/exceptions/exceptions.py +2 -2
- cognee/modules/ontology/exceptions/exceptions.py +4 -4
- cognee/modules/pipelines/__init__.py +1 -1
- cognee/modules/pipelines/exceptions/exceptions.py +2 -2
- cognee/modules/pipelines/exceptions/tasks.py +18 -0
- cognee/modules/pipelines/layers/__init__.py +1 -0
- cognee/modules/pipelines/layers/check_pipeline_run_qualification.py +59 -0
- cognee/modules/pipelines/layers/pipeline_execution_mode.py +127 -0
- cognee/modules/pipelines/layers/reset_dataset_pipeline_run_status.py +12 -0
- cognee/modules/pipelines/layers/resolve_authorized_user_dataset.py +34 -0
- cognee/modules/pipelines/layers/resolve_authorized_user_datasets.py +55 -0
- cognee/modules/pipelines/layers/setup_and_check_environment.py +41 -0
- cognee/modules/pipelines/layers/validate_pipeline_tasks.py +20 -0
- cognee/modules/pipelines/methods/__init__.py +2 -0
- cognee/modules/pipelines/methods/get_pipeline_runs_by_dataset.py +34 -0
- cognee/modules/pipelines/methods/reset_pipeline_run_status.py +16 -0
- cognee/modules/pipelines/operations/__init__.py +0 -1
- cognee/modules/pipelines/operations/log_pipeline_run_initiated.py +1 -1
- cognee/modules/pipelines/operations/pipeline.py +23 -138
- cognee/modules/retrieval/base_feedback.py +11 -0
- cognee/modules/retrieval/cypher_search_retriever.py +1 -9
- cognee/modules/retrieval/exceptions/exceptions.py +12 -6
- cognee/modules/retrieval/graph_completion_context_extension_retriever.py +9 -2
- cognee/modules/retrieval/graph_completion_cot_retriever.py +13 -6
- cognee/modules/retrieval/graph_completion_retriever.py +89 -5
- cognee/modules/retrieval/graph_summary_completion_retriever.py +2 -0
- cognee/modules/retrieval/natural_language_retriever.py +0 -4
- cognee/modules/retrieval/user_qa_feedback.py +83 -0
- cognee/modules/retrieval/utils/extract_uuid_from_node.py +18 -0
- cognee/modules/retrieval/utils/models.py +40 -0
- cognee/modules/search/exceptions/__init__.py +7 -0
- cognee/modules/search/exceptions/exceptions.py +15 -0
- cognee/modules/search/methods/search.py +47 -7
- cognee/modules/search/types/SearchType.py +1 -0
- cognee/modules/settings/get_settings.py +2 -2
- cognee/modules/users/exceptions/exceptions.py +6 -6
- cognee/shared/CodeGraphEntities.py +1 -0
- cognee/shared/exceptions/exceptions.py +2 -2
- cognee/shared/logging_utils.py +142 -31
- cognee/shared/utils.py +0 -1
- cognee/tasks/completion/exceptions/exceptions.py +3 -3
- cognee/tasks/documents/classify_documents.py +4 -0
- cognee/tasks/documents/exceptions/__init__.py +11 -0
- cognee/tasks/documents/exceptions/exceptions.py +36 -0
- cognee/tasks/documents/extract_chunks_from_documents.py +8 -2
- cognee/tasks/graph/exceptions/__init__.py +12 -0
- cognee/tasks/graph/exceptions/exceptions.py +41 -0
- cognee/tasks/graph/extract_graph_from_data.py +34 -2
- cognee/tasks/ingestion/exceptions/__init__.py +8 -0
- cognee/tasks/ingestion/exceptions/exceptions.py +12 -0
- cognee/tasks/ingestion/resolve_data_directories.py +5 -0
- cognee/tasks/repo_processor/get_local_dependencies.py +2 -0
- cognee/tasks/repo_processor/get_repo_file_dependencies.py +120 -48
- cognee/tasks/storage/add_data_points.py +41 -3
- cognee/tasks/storage/exceptions/__init__.py +9 -0
- cognee/tasks/storage/exceptions/exceptions.py +13 -0
- cognee/tasks/storage/index_data_points.py +1 -1
- cognee/tasks/summarization/exceptions/__init__.py +9 -0
- cognee/tasks/summarization/exceptions/exceptions.py +14 -0
- cognee/tasks/summarization/summarize_text.py +8 -1
- cognee/tests/integration/cli/__init__.py +3 -0
- cognee/tests/integration/cli/test_cli_integration.py +331 -0
- cognee/tests/integration/documents/PdfDocument_test.py +2 -2
- cognee/tests/integration/documents/TextDocument_test.py +2 -4
- cognee/tests/integration/documents/UnstructuredDocument_test.py +5 -8
- cognee/tests/test_delete_by_id.py +1 -1
- cognee/tests/{test_deletion.py → test_delete_hard.py} +0 -37
- cognee/tests/test_delete_soft.py +85 -0
- cognee/tests/test_kuzu.py +2 -2
- cognee/tests/test_neo4j.py +2 -2
- cognee/tests/test_search_db.py +126 -7
- cognee/tests/unit/cli/__init__.py +3 -0
- cognee/tests/unit/cli/test_cli_commands.py +483 -0
- cognee/tests/unit/cli/test_cli_edge_cases.py +625 -0
- cognee/tests/unit/cli/test_cli_main.py +173 -0
- cognee/tests/unit/cli/test_cli_runner.py +62 -0
- cognee/tests/unit/cli/test_cli_utils.py +127 -0
- cognee/tests/unit/modules/graph/cognee_graph_elements_test.py +5 -5
- cognee/tests/unit/modules/retrieval/graph_completion_retriever_context_extension_test.py +3 -3
- cognee/tests/unit/modules/retrieval/graph_completion_retriever_cot_test.py +3 -3
- cognee/tests/unit/modules/retrieval/graph_completion_retriever_test.py +3 -3
- cognee/tests/unit/modules/search/search_methods_test.py +4 -2
- {cognee-0.2.3.dev0.dist-info → cognee-0.2.4.dist-info}/METADATA +7 -5
- {cognee-0.2.3.dev0.dist-info → cognee-0.2.4.dist-info}/RECORD +172 -121
- cognee-0.2.4.dist-info/entry_points.txt +2 -0
- cognee/infrastructure/databases/exceptions/EmbeddingException.py +0 -20
- cognee/infrastructure/databases/graph/networkx/__init__.py +0 -0
- cognee/infrastructure/databases/graph/networkx/adapter.py +0 -1017
- cognee/infrastructure/pipeline/models/Operation.py +0 -60
- cognee/infrastructure/pipeline/models/__init__.py +0 -0
- cognee/notebooks/github_analysis_step_by_step.ipynb +0 -37
- cognee/tests/tasks/descriptive_metrics/networkx_metrics_test.py +0 -7
- {cognee-0.2.3.dev0.dist-info → cognee-0.2.4.dist-info}/WHEEL +0 -0
- {cognee-0.2.3.dev0.dist-info → cognee-0.2.4.dist-info}/licenses/LICENSE +0 -0
- {cognee-0.2.3.dev0.dist-info → cognee-0.2.4.dist-info}/licenses/NOTICE.md +0 -0
|
@@ -0,0 +1,80 @@
|
|
|
1
|
+
import argparse
|
|
2
|
+
import asyncio
|
|
3
|
+
from typing import Optional
|
|
4
|
+
|
|
5
|
+
from cognee.cli.reference import SupportsCliCommand
|
|
6
|
+
from cognee.cli import DEFAULT_DOCS_URL
|
|
7
|
+
import cognee.cli.echo as fmt
|
|
8
|
+
from cognee.cli.exceptions import CliCommandException, CliCommandInnerException
|
|
9
|
+
|
|
10
|
+
|
|
11
|
+
class DeleteCommand(SupportsCliCommand):
    """CLI command ``cognee delete``: remove data from the knowledge base.

    The command accepts ``--dataset-name``, ``--user-id`` and ``--all`` to
    select what is deleted, and ``--force`` to skip the interactive
    confirmation prompt.
    """

    command_string = "delete"
    help_string = "Delete data from cognee knowledge base"
    docs_url = DEFAULT_DOCS_URL
    description = """
The `cognee delete` command removes data from your knowledge base.

You can delete:
- Specific datasets by name
- All data (with confirmation)
- Data for specific users

Be careful with deletion operations as they are irreversible.
"""

    def configure_parser(self, parser: argparse.ArgumentParser) -> None:
        """Register the selection flags and ``--force`` on *parser*."""
        parser.add_argument("--dataset-name", "-d", help="Specific dataset to delete")
        parser.add_argument("--user-id", "-u", help="User ID to delete data for")
        parser.add_argument(
            "--all", action="store_true", help="Delete all data (requires confirmation)"
        )
        parser.add_argument("--force", "-f", action="store_true", help="Skip confirmation prompts")

    def execute(self, args: argparse.Namespace) -> None:
        """Validate the arguments, confirm with the user, and run the deletion.

        Args:
            args: Parsed namespace carrying ``dataset_name``, ``user_id``,
                ``all`` and ``force`` as registered in ``configure_parser``.

        Raises:
            CliCommandException: With ``error_code=1`` when the deletion (or
                anything else in this method) fails. The triggering exception
                is attached as ``__cause__``.
        """
        try:
            # Import cognee here to avoid circular imports
            import cognee

            # Nothing selected: report and return normally (no exception is raised).
            if not any([args.dataset_name, args.user_id, args.all]):
                fmt.error("Please specify what to delete: --dataset-name, --user-id, or --all")
                return

            # Build the confirmation message; --all wins over --dataset-name,
            # which wins over --user-id.
            if args.all:
                confirm_msg = "Delete ALL data from cognee?"
                operation = "all data"
            elif args.dataset_name:
                confirm_msg = f"Delete dataset '{args.dataset_name}'?"
                operation = f"dataset '{args.dataset_name}'"
            elif args.user_id:
                confirm_msg = f"Delete all data for user '{args.user_id}'?"
                operation = f"data for user '{args.user_id}'"

            # Confirm deletion unless forced
            if not args.force:
                fmt.warning("This operation is irreversible!")
                if not fmt.confirm(confirm_msg):
                    fmt.echo("Deletion cancelled.")
                    return

            fmt.echo(f"Deleting {operation}...")

            # With --all the dataset filter is dropped; user_id is forwarded either way.
            dataset_name = None if args.all else args.dataset_name

            async def run_delete():
                try:
                    await cognee.delete(dataset_name=dataset_name, user_id=args.user_id)
                except Exception as e:
                    # Chain the cause so --debug tracebacks show the real failure.
                    raise CliCommandInnerException(f"Failed to delete: {str(e)}") from e

            asyncio.run(run_delete())
            fmt.success(f"Successfully deleted {operation}")

        except CliCommandInnerException as e:
            # Already carries a user-facing message; re-wrap without another prefix.
            raise CliCommandException(str(e), error_code=1) from e
        except Exception as e:
            raise CliCommandException(f"Error deleting data: {str(e)}", error_code=1) from e
|
|
@@ -0,0 +1,149 @@
|
|
|
1
|
+
import argparse
|
|
2
|
+
import asyncio
|
|
3
|
+
import json
|
|
4
|
+
from typing import Optional
|
|
5
|
+
|
|
6
|
+
from cognee.cli.reference import SupportsCliCommand
|
|
7
|
+
from cognee.cli import DEFAULT_DOCS_URL
|
|
8
|
+
from cognee.cli.config import SEARCH_TYPE_CHOICES, OUTPUT_FORMAT_CHOICES
|
|
9
|
+
import cognee.cli.echo as fmt
|
|
10
|
+
from cognee.cli.exceptions import CliCommandException, CliCommandInnerException
|
|
11
|
+
|
|
12
|
+
|
|
13
|
+
class SearchCommand(SupportsCliCommand):
    """CLI command ``cognee search``: query the knowledge graph and print results.

    The query is forwarded to ``cognee.search`` and the results are printed in
    one of the formats listed in ``OUTPUT_FORMAT_CHOICES``.
    """

    command_string = "search"
    help_string = "Search and query the knowledge graph for insights, information, and connections"
    docs_url = DEFAULT_DOCS_URL
    description = """
Search and query the knowledge graph for insights, information, and connections.

This is the final step in the Cognee workflow that retrieves information from the
processed knowledge graph. It supports multiple search modes optimized for different
use cases - from simple fact retrieval to complex reasoning and code analysis.

Search Types & Use Cases:

**GRAPH_COMPLETION** (Default - Recommended):
Natural language Q&A using full graph context and LLM reasoning.
Best for: Complex questions, analysis, summaries, insights.

**RAG_COMPLETION**:
Traditional RAG using document chunks without graph structure.
Best for: Direct document retrieval, specific fact-finding.

**INSIGHTS**:
Structured entity relationships and semantic connections.
Best for: Understanding concept relationships, knowledge mapping.

**CHUNKS**:
Raw text segments that match the query semantically.
Best for: Finding specific passages, citations, exact content.

**SUMMARIES**:
Pre-generated hierarchical summaries of content.
Best for: Quick overviews, document abstracts, topic summaries.

**CODE**:
Code-specific search with syntax and semantic understanding.
Best for: Finding functions, classes, implementation patterns.
"""

    def configure_parser(self, parser: argparse.ArgumentParser) -> None:
        """Register the positional query and the search options on *parser*."""
        parser.add_argument("query_text", help="Your question or search query in natural language")
        parser.add_argument(
            "--query-type",
            "-t",
            choices=SEARCH_TYPE_CHOICES,
            default="GRAPH_COMPLETION",
            help="Search mode (default: GRAPH_COMPLETION for conversational AI responses)",
        )
        parser.add_argument(
            "--datasets",
            "-d",
            nargs="*",
            help="Dataset name(s) to search within. Searches all accessible datasets if not specified",
        )
        parser.add_argument(
            "--top-k",
            "-k",
            type=int,
            default=10,
            help="Maximum number of results to return (default: 10, max: 100)",
        )
        parser.add_argument(
            "--system-prompt",
            help="Custom system prompt file for LLM-based search types (default: answer_simple_question.txt)",
        )
        parser.add_argument(
            "--output-format",
            "-f",
            choices=OUTPUT_FORMAT_CHOICES,
            default="pretty",
            help="Output format (default: pretty)",
        )

    def execute(self, args: argparse.Namespace) -> None:
        """Run the search described by *args* and print the results.

        Args:
            args: Parsed namespace carrying ``query_text``, ``query_type``,
                ``datasets``, ``top_k``, ``system_prompt`` and
                ``output_format`` as registered in ``configure_parser``.

        Raises:
            CliCommandException: With ``error_code=1`` when the search (or
                anything else in this method) fails. The triggering exception
                is attached as ``__cause__``.
        """
        try:
            # Import cognee here to avoid circular imports
            import cognee
            from cognee.modules.search.types import SearchType

            # Convert string to SearchType enum (lookup by member name)
            query_type = SearchType[args.query_type]

            datasets_msg = (
                f" in datasets {args.datasets}" if args.datasets else " across all datasets"
            )
            fmt.echo(f"Searching for: '{args.query_text}' (type: {args.query_type}){datasets_msg}")

            async def run_search():
                try:
                    return await cognee.search(
                        query_text=args.query_text,
                        query_type=query_type,
                        datasets=args.datasets,
                        system_prompt_path=args.system_prompt or "answer_simple_question.txt",
                        top_k=args.top_k,
                    )
                except Exception as e:
                    # Chain the cause so --debug tracebacks show the real failure.
                    raise CliCommandInnerException(f"Failed to search: {str(e)}") from e

            results = asyncio.run(run_search())

            # Format and display results
            if args.output_format == "json":
                # default=str stringifies any value json cannot serialize natively
                fmt.echo(json.dumps(results, indent=2, default=str))
            elif args.output_format == "simple":
                for i, result in enumerate(results, 1):
                    fmt.echo(f"{i}. {result}")
            else:  # pretty format
                if not results:
                    fmt.warning("No results found for your query.")
                    return

                fmt.echo(f"\nFound {len(results)} result(s) using {args.query_type}:")
                fmt.echo("=" * 60)

                if args.query_type in ["GRAPH_COMPLETION", "RAG_COMPLETION"]:
                    # These return conversational responses; separate them with a rule
                    for i, result in enumerate(results, 1):
                        fmt.echo(f"{fmt.bold('Response:')} {result}")
                        if i < len(results):
                            fmt.echo("-" * 40)
                else:
                    # CHUNKS and all other types share one layout, differing only in label
                    label = "Chunk" if args.query_type == "CHUNKS" else "Result"
                    for i, result in enumerate(results, 1):
                        fmt.echo(f"{fmt.bold(f'{label} {i}:')} {result}")
                        fmt.echo()

        except CliCommandInnerException as e:
            # Already carries a user-facing message; re-wrap without another prefix.
            raise CliCommandException(str(e), error_code=1) from e
        except Exception as e:
            raise CliCommandException(f"Error searching: {str(e)}", error_code=1) from e
|
cognee/cli/config.py
ADDED
|
@@ -0,0 +1,33 @@
|
|
|
1
|
+
"""
|
|
2
|
+
CLI configuration and constants to avoid hardcoded values
|
|
3
|
+
"""
|
|
4
|
+
|
|
5
|
+
# General CLI metadata
CLI_DESCRIPTION = "Cognee CLI - Manage your knowledge graphs and cognitive processing pipelines."
DEFAULT_DOCS_URL = "https://docs.cognee.ai"

# One-line help text per sub-command; keep in sync with the command classes.
COMMAND_DESCRIPTIONS = dict(
    add="Add data to Cognee for knowledge graph processing",
    search="Search and query the knowledge graph for insights, information, and connections",
    cognify="Transform ingested data into a structured knowledge graph",
    delete="Delete data from cognee knowledge base",
    config="Manage cognee configuration settings",
)

# Accepted values for the search command's --query-type option
SEARCH_TYPE_CHOICES = list(
    (
        "GRAPH_COMPLETION",
        "RAG_COMPLETION",
        "INSIGHTS",
        "CHUNKS",
        "SUMMARIES",
        "CODE",
        "CYPHER",
    )
)

# Accepted chunker names
CHUNKER_CHOICES = ["TextChunker", "LangchainChunker"]

# Accepted values for --output-format
OUTPUT_FORMAT_CHOICES = ["json", "pretty", "simple"]
|
cognee/cli/debug.py
ADDED
|
@@ -0,0 +1,21 @@
|
|
|
1
|
+
"""Provides a global debug setting for the CLI - following dlt patterns"""
|
|
2
|
+
|
|
3
|
+
# Module-wide switch; starts disabled and is flipped only by the helpers below.
_DEBUG_FLAG: bool = False


def enable_debug() -> None:
    """Enable debug mode for CLI"""
    global _DEBUG_FLAG
    _DEBUG_FLAG = True


def disable_debug() -> None:
    """Disable debug mode for CLI"""
    global _DEBUG_FLAG
    _DEBUG_FLAG = False


def is_debug_enabled() -> bool:
    """Check if debug mode is enabled"""
    # Read-only access needs no ``global`` declaration.
    return _DEBUG_FLAG
|
cognee/cli/echo.py
ADDED
|
@@ -0,0 +1,45 @@
|
|
|
1
|
+
"""CLI output formatting utilities"""
|
|
2
|
+
|
|
3
|
+
import sys
|
|
4
|
+
import click
|
|
5
|
+
from typing import Any
|
|
6
|
+
|
|
7
|
+
|
|
8
|
+
def echo(message: str = "", color: str = None, err: bool = False) -> None:
    """Print *message* via ``click.secho``.

    ``color`` is passed on as the foreground colour (``fg``) and ``err`` is
    passed on unchanged to select the error stream.
    """
    click.secho(message, err=err, fg=color)
|
|
11
|
+
|
|
12
|
+
|
|
13
|
+
def note(message: str) -> None:
    """Print *message* with a ``Note:`` prefix, coloured blue."""
    text = f"Note: {message}"
    echo(text, color="blue")
|
|
16
|
+
|
|
17
|
+
|
|
18
|
+
def warning(message: str) -> None:
    """Print *message* with a ``Warning:`` prefix, coloured yellow."""
    text = f"Warning: {message}"
    echo(text, color="yellow")
|
|
21
|
+
|
|
22
|
+
|
|
23
|
+
def error(message: str) -> None:
    """Print *message* with an ``Error:`` prefix, coloured red, with ``err=True``."""
    text = f"Error: {message}"
    echo(text, color="red", err=True)
|
|
26
|
+
|
|
27
|
+
|
|
28
|
+
def success(message: str) -> None:
    """Print *message* with a ``Success:`` prefix, coloured green."""
    text = f"Success: {message}"
    echo(text, color="green")
|
|
31
|
+
|
|
32
|
+
|
|
33
|
+
def bold(text: str) -> str:
    """Return *text* styled bold by ``click.style``; nothing is printed."""
    styled = click.style(text, bold=True)
    return styled
|
|
36
|
+
|
|
37
|
+
|
|
38
|
+
def confirm(message: str, default: bool = False) -> bool:
    """Ask a yes/no question through ``click.confirm`` and return the answer.

    ``default`` is forwarded to ``click.confirm`` unchanged.
    """
    answer = click.confirm(message, default=default)
    return answer
|
|
41
|
+
|
|
42
|
+
|
|
43
|
+
def prompt(message: str, default: Any = None) -> str:
    """Ask for free-form input through ``click.prompt`` and return the reply.

    ``default`` is forwarded to ``click.prompt`` unchanged.
    """
    reply = click.prompt(message, default=default)
    return reply
|
cognee/cli/exceptions.py
ADDED
|
@@ -0,0 +1,23 @@
|
|
|
1
|
+
from typing import Optional
|
|
2
|
+
|
|
3
|
+
|
|
4
|
+
class CliCommandException(Exception):
    """Error raised by a CLI command, carrying extra context for the caller.

    Attributes are stored exactly as passed to the constructor:

    * ``error_code`` - integer code, ``-1`` by default (presumably used as the
      process exit status; confirm in the CLI runner).
    * ``docs_url`` - optional documentation link for this failure.
    * ``raiseable_exception`` - optional exception object kept alongside the
      message (how it is consumed is not visible here).
    """

    def __init__(
        self,
        message: str,
        error_code: int = -1,
        docs_url: Optional[str] = None,
        raiseable_exception: Optional[Exception] = None,
    ) -> None:
        super().__init__(message)
        # Keep the context on the instance so handlers can inspect it.
        self.error_code, self.docs_url = error_code, docs_url
        self.raiseable_exception = raiseable_exception
|
|
18
|
+
|
|
19
|
+
|
|
20
|
+
class CliCommandInnerException(Exception):
    """Marker exception used inside CLI commands to wrap lower-level failures.

    It adds no behaviour of its own on top of ``Exception``.
    """
|
|
@@ -0,0 +1,97 @@
|
|
|
1
|
+
#!/usr/bin/env python3
|
|
2
|
+
"""
|
|
3
|
+
Minimal CLI entry point for cognee that avoids early initialization
|
|
4
|
+
"""
|
|
5
|
+
|
|
6
|
+
import sys
|
|
7
|
+
import os
|
|
8
|
+
from typing import Any, Sequence
|
|
9
|
+
|
|
10
|
+
# CRITICAL: these flags must be in the environment before any cognee import,
# otherwise verbose logging initialization is not prevented for CLI-only usage.
os.environ.update(
    {
        "COGNEE_MINIMAL_LOGGING": "true",
        "COGNEE_CLI_MODE": "true",
    }
)
|
|
14
|
+
|
|
15
|
+
|
|
16
|
+
def get_version() -> str:
    """Get cognee version without importing the main package.

    Lookup order:

    1. A ``pyproject.toml`` three directories above this file (development
       checkout). The first ``version = ...`` assignment found is returned
       with a ``-local`` suffix.
    2. The installed distribution metadata for ``cognee``.

    Returns:
        The version string, or ``"unknown"`` if any step raises.
    """
    try:
        # Try to get version from pyproject.toml first (for development)
        from pathlib import Path

        pyproject_path = Path(__file__).parent.parent.parent / "pyproject.toml"
        if pyproject_path.exists():
            with open(pyproject_path, encoding="utf-8") as f:
                for line in f:
                    # Require the key to be exactly "version" so that keys such as
                    # "version_file" are skipped, and split on the first "=" only.
                    key, sep, value = line.partition("=")
                    if not sep or key.strip() != "version":
                        continue
                    # Drop a trailing inline comment, then whitespace and quotes.
                    version = value.split("#", 1)[0].strip().strip("'\"")
                    return f"{version}-local"

        # Fallback to installed package version
        import importlib.metadata

        return importlib.metadata.version("cognee")
    except Exception:
        # Best-effort lookup: the version banner must never crash the CLI.
        return "unknown"
|
|
36
|
+
|
|
37
|
+
|
|
38
|
+
def get_command_info() -> dict:
    """Return a fresh mapping of sub-command name to one-line help text.

    The mapping is built from literals in this function, so no cognee module
    needs to be imported to produce it.
    """
    command_help = dict(
        add="Add data to Cognee for knowledge graph processing",
        search="Search and query the knowledge graph for insights, information, and connections",
        cognify="Transform ingested data into a structured knowledge graph",
        delete="Delete data from cognee knowledge base",
        config="Manage cognee configuration settings",
    )
    return command_help
|
|
47
|
+
|
|
48
|
+
|
|
49
|
+
def print_help() -> None:
    """Print the top-level help text with the command list from ``get_command_info``.

    The layout follows argparse conventions: option and command rows are
    indented and their descriptions start in an aligned column.
    """
    commands = get_command_info()
    # Precompute the joined names so the f-string below needs no nested quotes.
    usage_choices = "|".join(commands)
    listed_choices = ",".join(commands)
    command_list = "\n".join(f"    {cmd:<12} {desc}" for cmd, desc in commands.items())

    print(f"""
usage: cognee [-h] [--version] [--debug] {{{usage_choices}}} ...

Cognee CLI - Manage your knowledge graphs and cognitive processing pipelines.

options:
  -h, --help  show this help message and exit
  --version   show program's version number and exit
  --debug     Enable debug mode to show full stack traces on exceptions

Available commands:
  {{{listed_choices}}}
{command_list}

For more information on each command, use: cognee <command> --help
""")
|
|
70
|
+
|
|
71
|
+
|
|
72
|
+
def main() -> int:
    """Minimal CLI main function.

    Help (no arguments, ``-h`` or ``--help``) and ``--version`` are answered
    here; every other invocation is delegated to ``cognee.cli._cognee.main``,
    which is imported only at that point.

    Returns:
        ``0`` after printing help or the version, the delegated return value
        for real commands, or ``1`` if the import or the delegated call raised.

    Raises:
        Exception: Whatever the import or delegated call raised, re-raised
            unchanged when ``--debug`` is present in ``sys.argv``.
    """
    argv = sys.argv

    # Handle help and version without any imports - purely static
    if len(argv) == 1 or (len(argv) == 2 and argv[1] in ("-h", "--help")):
        print_help()
        return 0

    if len(argv) == 2 and argv[1] == "--version":
        print(f"cognee {get_version()}")
        return 0

    # For actual commands, import the full CLI with minimal logging
    try:
        from cognee.cli._cognee import main as full_main

        return full_main()
    except Exception as e:
        if "--debug" in argv:
            raise
        # Diagnostics go to stderr so they do not mix with command output.
        print(f"Error: {e}", file=sys.stderr)
        print("Use --debug for full stack trace", file=sys.stderr)
        return 1


if __name__ == "__main__":
    sys.exit(main())
|
cognee/cli/reference.py
ADDED
|
@@ -0,0 +1,26 @@
|
|
|
1
|
+
from abc import abstractmethod
|
|
2
|
+
from typing import Protocol, Optional
|
|
3
|
+
import argparse
|
|
4
|
+
|
|
5
|
+
|
|
6
|
+
class SupportsCliCommand(Protocol):
    """Structural interface that every cognee CLI command implements."""

    # name of the command
    command_string: str
    # the help string for argparse
    help_string: str
    # the more detailed description for argparse, may include markdown for the docs
    description: Optional[str]
    # the default docs url to be printed in case of an exception
    docs_url: Optional[str]

    @abstractmethod
    def configure_parser(self, parser: argparse.ArgumentParser) -> None:
        """Add this command's arguments to *parser*."""
        ...

    @abstractmethod
    def execute(self, args: argparse.Namespace) -> None:
        """Run the command using the parsed *args*."""
        ...
|
|
@@ -0,0 +1,12 @@
|
|
|
1
|
+
"""
|
|
2
|
+
Module to suppress verbose logging before any cognee imports.
|
|
3
|
+
This must be imported before any other cognee modules.
|
|
4
|
+
"""
|
|
5
|
+
|
|
6
|
+
import os
|
|
7
|
+
|
|
8
|
+
# Mark the process as running in CLI mode to suppress verbose logging, and
# additionally pin the log level to ERROR for extra safety.
os.environ.update(
    {
        "COGNEE_CLI_MODE": "true",
        "LOG_LEVEL": "ERROR",
    }
)
|
|
@@ -5,7 +5,7 @@ from typing import Optional, Tuple, List, Dict, Union, Any, Callable, Awaitable
|
|
|
5
5
|
from cognee.eval_framework.benchmark_adapters.benchmark_adapters import BenchmarkAdapter
|
|
6
6
|
from cognee.modules.chunking.TextChunker import TextChunker
|
|
7
7
|
from cognee.modules.pipelines.tasks.task import Task
|
|
8
|
-
from cognee.modules.pipelines import
|
|
8
|
+
from cognee.modules.pipelines import run_pipeline
|
|
9
9
|
|
|
10
10
|
logger = get_logger(level=ERROR)
|
|
11
11
|
|
|
@@ -61,7 +61,7 @@ class CorpusBuilderExecutor:
|
|
|
61
61
|
await cognee.add(self.raw_corpus)
|
|
62
62
|
|
|
63
63
|
tasks = await self.task_getter(chunk_size=chunk_size, chunker=chunker)
|
|
64
|
-
pipeline_run =
|
|
64
|
+
pipeline_run = run_pipeline(tasks=tasks)
|
|
65
65
|
|
|
66
66
|
async for run_info in pipeline_run:
|
|
67
67
|
print(run_info)
|
cognee/exceptions/__init__.py
CHANGED
|
@@ -2,13 +2,13 @@
|
|
|
2
2
|
Custom exceptions for the Cognee API.
|
|
3
3
|
|
|
4
4
|
This module defines a set of exceptions for handling various application errors,
|
|
5
|
-
such as
|
|
5
|
+
such as System, Validation, Configuration or TransientErrors
|
|
6
6
|
"""
|
|
7
7
|
|
|
8
8
|
from .exceptions import (
|
|
9
9
|
CogneeApiError,
|
|
10
|
-
|
|
11
|
-
|
|
12
|
-
|
|
13
|
-
|
|
10
|
+
CogneeSystemError,
|
|
11
|
+
CogneeValidationError,
|
|
12
|
+
CogneeConfigurationError,
|
|
13
|
+
CogneeTransientError,
|
|
14
14
|
)
|
cognee/exceptions/exceptions.py
CHANGED
|
@@ -35,37 +35,57 @@ class CogneeApiError(Exception):
|
|
|
35
35
|
return f"{self.name}: {self.message} (Status code: {self.status_code})"
|
|
36
36
|
|
|
37
37
|
|
|
38
|
-
class
|
|
39
|
-
"""
|
|
38
|
+
class CogneeSystemError(CogneeApiError):
|
|
39
|
+
"""System error"""
|
|
40
40
|
|
|
41
41
|
def __init__(
|
|
42
42
|
self,
|
|
43
|
-
message: str = "
|
|
44
|
-
name: str = "
|
|
45
|
-
status_code=status.
|
|
43
|
+
message: str = "A system error occurred.",
|
|
44
|
+
name: str = "CogneeSystemError",
|
|
45
|
+
status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
|
|
46
|
+
log=True,
|
|
47
|
+
log_level="ERROR",
|
|
46
48
|
):
|
|
47
|
-
super().__init__(message, name, status_code)
|
|
49
|
+
super().__init__(message, name, status_code, log, log_level)
|
|
50
|
+
|
|
48
51
|
|
|
52
|
+
class CogneeValidationError(CogneeApiError):
|
|
53
|
+
"""Validation error"""
|
|
49
54
|
|
|
50
|
-
class InvalidValueError(CogneeApiError):
|
|
51
55
|
def __init__(
|
|
52
56
|
self,
|
|
53
|
-
message: str = "
|
|
54
|
-
name: str = "
|
|
57
|
+
message: str = "A validation error occurred.",
|
|
58
|
+
name: str = "CogneeValidationError",
|
|
55
59
|
status_code=status.HTTP_422_UNPROCESSABLE_ENTITY,
|
|
60
|
+
log=True,
|
|
61
|
+
log_level="ERROR",
|
|
56
62
|
):
|
|
57
|
-
super().__init__(message, name, status_code)
|
|
63
|
+
super().__init__(message, name, status_code, log, log_level)
|
|
58
64
|
|
|
59
65
|
|
|
60
|
-
class
|
|
66
|
+
class CogneeConfigurationError(CogneeApiError):
|
|
67
|
+
"""Configuration error"""
|
|
68
|
+
|
|
61
69
|
def __init__(
|
|
62
70
|
self,
|
|
63
|
-
message: str = "
|
|
64
|
-
name: str = "
|
|
65
|
-
status_code=status.
|
|
71
|
+
message: str = "A system configuration error occurred.",
|
|
72
|
+
name: str = "CogneeConfigurationError",
|
|
73
|
+
status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
|
|
74
|
+
log=True,
|
|
75
|
+
log_level="ERROR",
|
|
66
76
|
):
|
|
67
|
-
super().__init__(message, name, status_code)
|
|
77
|
+
super().__init__(message, name, status_code, log, log_level)
|
|
68
78
|
|
|
69
79
|
|
|
70
|
-
class
|
|
71
|
-
|
|
80
|
+
class CogneeTransientError(CogneeApiError):
|
|
81
|
+
"""Transient error"""
|
|
82
|
+
|
|
83
|
+
def __init__(
|
|
84
|
+
self,
|
|
85
|
+
message: str = "A transient error occurred.",
|
|
86
|
+
name: str = "CogneeTransientError",
|
|
87
|
+
status_code=status.HTTP_503_SERVICE_UNAVAILABLE,
|
|
88
|
+
log=True,
|
|
89
|
+
log_level="ERROR",
|
|
90
|
+
):
|
|
91
|
+
super().__init__(message, name, status_code, log, log_level)
|
|
@@ -0,0 +1,22 @@
|
|
|
1
|
+
from cognee.exceptions import (
|
|
2
|
+
CogneeValidationError,
|
|
3
|
+
)
|
|
4
|
+
from fastapi import status
|
|
5
|
+
|
|
6
|
+
|
|
7
|
+
class KeywordExtractionError(CogneeValidationError):
|
|
8
|
+
"""
|
|
9
|
+
Raised when a provided value is syntactically valid but semantically unacceptable
|
|
10
|
+
for the given operation.
|
|
11
|
+
|
|
12
|
+
Example:
|
|
13
|
+
- Passing an empty string to a keyword extraction function.
|
|
14
|
+
"""
|
|
15
|
+
|
|
16
|
+
def __init__(
|
|
17
|
+
self,
|
|
18
|
+
message: str = "Extract_keywords cannot extract keywords from empty text.",
|
|
19
|
+
name: str = "KeywordExtractionError",
|
|
20
|
+
status_code: int = status.HTTP_400_BAD_REQUEST,
|
|
21
|
+
):
|
|
22
|
+
super().__init__(message, name, status_code)
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
from sklearn.feature_extraction.text import TfidfVectorizer
|
|
2
2
|
|
|
3
|
-
from cognee.exceptions import
|
|
3
|
+
from cognee.infrastructure.data.exceptions.exceptions import KeywordExtractionError
|
|
4
4
|
from cognee.shared.utils import extract_pos_tags
|
|
5
5
|
|
|
6
6
|
|
|
@@ -8,7 +8,7 @@ def extract_keywords(text: str) -> list[str]:
|
|
|
8
8
|
"""
|
|
9
9
|
Extract keywords from the provided text string.
|
|
10
10
|
|
|
11
|
-
This function raises an
|
|
11
|
+
This function raises a KeywordExtractionError if the input text is empty. It processes the
|
|
12
12
|
text to extract parts of speech, focusing on nouns, and uses TF-IDF to identify the most
|
|
13
13
|
relevant keywords based on their frequency. The function returns a list of up to 15
|
|
14
14
|
keywords, each having more than 3 characters.
|
|
@@ -25,7 +25,7 @@ def extract_keywords(text: str) -> list[str]:
|
|
|
25
25
|
with more than 3 characters.
|
|
26
26
|
"""
|
|
27
27
|
if len(text) == 0:
|
|
28
|
-
raise
|
|
28
|
+
raise KeywordExtractionError()
|
|
29
29
|
|
|
30
30
|
tags = extract_pos_tags(text)
|
|
31
31
|
nouns = [word for (word, tag) in tags if tag == "NN"]
|