PyPI - aiecs - Versions diffs - 1.5.1__py3-none-any.whl - Mend

aiecs 1.5.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (302) hide show

aiecs/__init__.py +72 -0
aiecs/__main__.py +41 -0
aiecs/aiecs_client.py +469 -0
aiecs/application/__init__.py +10 -0
aiecs/application/executors/__init__.py +10 -0
aiecs/application/executors/operation_executor.py +363 -0
aiecs/application/knowledge_graph/__init__.py +7 -0
aiecs/application/knowledge_graph/builder/__init__.py +37 -0
aiecs/application/knowledge_graph/builder/document_builder.py +375 -0
aiecs/application/knowledge_graph/builder/graph_builder.py +356 -0
aiecs/application/knowledge_graph/builder/schema_mapping.py +531 -0
aiecs/application/knowledge_graph/builder/structured_pipeline.py +443 -0
aiecs/application/knowledge_graph/builder/text_chunker.py +319 -0
aiecs/application/knowledge_graph/extractors/__init__.py +27 -0
aiecs/application/knowledge_graph/extractors/base.py +100 -0
aiecs/application/knowledge_graph/extractors/llm_entity_extractor.py +327 -0
aiecs/application/knowledge_graph/extractors/llm_relation_extractor.py +349 -0
aiecs/application/knowledge_graph/extractors/ner_entity_extractor.py +244 -0
aiecs/application/knowledge_graph/fusion/__init__.py +23 -0
aiecs/application/knowledge_graph/fusion/entity_deduplicator.py +387 -0
aiecs/application/knowledge_graph/fusion/entity_linker.py +343 -0
aiecs/application/knowledge_graph/fusion/knowledge_fusion.py +580 -0
aiecs/application/knowledge_graph/fusion/relation_deduplicator.py +189 -0
aiecs/application/knowledge_graph/pattern_matching/__init__.py +21 -0
aiecs/application/knowledge_graph/pattern_matching/pattern_matcher.py +344 -0
aiecs/application/knowledge_graph/pattern_matching/query_executor.py +378 -0
aiecs/application/knowledge_graph/profiling/__init__.py +12 -0
aiecs/application/knowledge_graph/profiling/query_plan_visualizer.py +199 -0
aiecs/application/knowledge_graph/profiling/query_profiler.py +223 -0
aiecs/application/knowledge_graph/reasoning/__init__.py +27 -0
aiecs/application/knowledge_graph/reasoning/evidence_synthesis.py +347 -0
aiecs/application/knowledge_graph/reasoning/inference_engine.py +504 -0
aiecs/application/knowledge_graph/reasoning/logic_form_parser.py +167 -0
aiecs/application/knowledge_graph/reasoning/logic_parser/__init__.py +79 -0
aiecs/application/knowledge_graph/reasoning/logic_parser/ast_builder.py +513 -0
aiecs/application/knowledge_graph/reasoning/logic_parser/ast_nodes.py +630 -0
aiecs/application/knowledge_graph/reasoning/logic_parser/ast_validator.py +654 -0
aiecs/application/knowledge_graph/reasoning/logic_parser/error_handler.py +477 -0
aiecs/application/knowledge_graph/reasoning/logic_parser/parser.py +390 -0
aiecs/application/knowledge_graph/reasoning/logic_parser/query_context.py +217 -0
aiecs/application/knowledge_graph/reasoning/logic_query_integration.py +169 -0
aiecs/application/knowledge_graph/reasoning/query_planner.py +872 -0
aiecs/application/knowledge_graph/reasoning/reasoning_engine.py +554 -0
aiecs/application/knowledge_graph/retrieval/__init__.py +19 -0
aiecs/application/knowledge_graph/retrieval/retrieval_strategies.py +596 -0
aiecs/application/knowledge_graph/search/__init__.py +59 -0
aiecs/application/knowledge_graph/search/hybrid_search.py +423 -0
aiecs/application/knowledge_graph/search/reranker.py +295 -0
aiecs/application/knowledge_graph/search/reranker_strategies.py +553 -0
aiecs/application/knowledge_graph/search/text_similarity.py +398 -0
aiecs/application/knowledge_graph/traversal/__init__.py +15 -0
aiecs/application/knowledge_graph/traversal/enhanced_traversal.py +329 -0
aiecs/application/knowledge_graph/traversal/path_scorer.py +269 -0
aiecs/application/knowledge_graph/validators/__init__.py +13 -0
aiecs/application/knowledge_graph/validators/relation_validator.py +189 -0
aiecs/application/knowledge_graph/visualization/__init__.py +11 -0
aiecs/application/knowledge_graph/visualization/graph_visualizer.py +321 -0
aiecs/common/__init__.py +9 -0
aiecs/common/knowledge_graph/__init__.py +17 -0
aiecs/common/knowledge_graph/runnable.py +484 -0
aiecs/config/__init__.py +16 -0
aiecs/config/config.py +498 -0
aiecs/config/graph_config.py +137 -0
aiecs/config/registry.py +23 -0
aiecs/core/__init__.py +46 -0
aiecs/core/interface/__init__.py +34 -0
aiecs/core/interface/execution_interface.py +152 -0
aiecs/core/interface/storage_interface.py +171 -0
aiecs/domain/__init__.py +289 -0
aiecs/domain/agent/__init__.py +189 -0
aiecs/domain/agent/base_agent.py +697 -0
aiecs/domain/agent/exceptions.py +103 -0
aiecs/domain/agent/graph_aware_mixin.py +559 -0
aiecs/domain/agent/hybrid_agent.py +490 -0
aiecs/domain/agent/integration/__init__.py +26 -0
aiecs/domain/agent/integration/context_compressor.py +222 -0
aiecs/domain/agent/integration/context_engine_adapter.py +252 -0
aiecs/domain/agent/integration/retry_policy.py +219 -0
aiecs/domain/agent/integration/role_config.py +213 -0
aiecs/domain/agent/knowledge_aware_agent.py +646 -0
aiecs/domain/agent/lifecycle.py +296 -0
aiecs/domain/agent/llm_agent.py +300 -0
aiecs/domain/agent/memory/__init__.py +12 -0
aiecs/domain/agent/memory/conversation.py +197 -0
aiecs/domain/agent/migration/__init__.py +14 -0
aiecs/domain/agent/migration/conversion.py +160 -0
aiecs/domain/agent/migration/legacy_wrapper.py +90 -0
aiecs/domain/agent/models.py +317 -0
aiecs/domain/agent/observability.py +407 -0
aiecs/domain/agent/persistence.py +289 -0
aiecs/domain/agent/prompts/__init__.py +29 -0
aiecs/domain/agent/prompts/builder.py +161 -0
aiecs/domain/agent/prompts/formatters.py +189 -0
aiecs/domain/agent/prompts/template.py +255 -0
aiecs/domain/agent/registry.py +260 -0
aiecs/domain/agent/tool_agent.py +257 -0
aiecs/domain/agent/tools/__init__.py +12 -0
aiecs/domain/agent/tools/schema_generator.py +221 -0
aiecs/domain/community/__init__.py +155 -0
aiecs/domain/community/agent_adapter.py +477 -0
aiecs/domain/community/analytics.py +481 -0
aiecs/domain/community/collaborative_workflow.py +642 -0
aiecs/domain/community/communication_hub.py +645 -0
aiecs/domain/community/community_builder.py +320 -0
aiecs/domain/community/community_integration.py +800 -0
aiecs/domain/community/community_manager.py +813 -0
aiecs/domain/community/decision_engine.py +879 -0
aiecs/domain/community/exceptions.py +225 -0
aiecs/domain/community/models/__init__.py +33 -0
aiecs/domain/community/models/community_models.py +268 -0
aiecs/domain/community/resource_manager.py +457 -0
aiecs/domain/community/shared_context_manager.py +603 -0
aiecs/domain/context/__init__.py +58 -0
aiecs/domain/context/context_engine.py +989 -0
aiecs/domain/context/conversation_models.py +354 -0
aiecs/domain/context/graph_memory.py +467 -0
aiecs/domain/execution/__init__.py +12 -0
aiecs/domain/execution/model.py +57 -0
aiecs/domain/knowledge_graph/__init__.py +19 -0
aiecs/domain/knowledge_graph/models/__init__.py +52 -0
aiecs/domain/knowledge_graph/models/entity.py +130 -0
aiecs/domain/knowledge_graph/models/evidence.py +194 -0
aiecs/domain/knowledge_graph/models/inference_rule.py +186 -0
aiecs/domain/knowledge_graph/models/path.py +179 -0
aiecs/domain/knowledge_graph/models/path_pattern.py +173 -0
aiecs/domain/knowledge_graph/models/query.py +272 -0
aiecs/domain/knowledge_graph/models/query_plan.py +187 -0
aiecs/domain/knowledge_graph/models/relation.py +136 -0
aiecs/domain/knowledge_graph/schema/__init__.py +23 -0
aiecs/domain/knowledge_graph/schema/entity_type.py +135 -0
aiecs/domain/knowledge_graph/schema/graph_schema.py +271 -0
aiecs/domain/knowledge_graph/schema/property_schema.py +155 -0
aiecs/domain/knowledge_graph/schema/relation_type.py +171 -0
aiecs/domain/knowledge_graph/schema/schema_manager.py +496 -0
aiecs/domain/knowledge_graph/schema/type_enums.py +205 -0
aiecs/domain/task/__init__.py +13 -0
aiecs/domain/task/dsl_processor.py +613 -0
aiecs/domain/task/model.py +62 -0
aiecs/domain/task/task_context.py +268 -0
aiecs/infrastructure/__init__.py +24 -0
aiecs/infrastructure/graph_storage/__init__.py +11 -0
aiecs/infrastructure/graph_storage/base.py +601 -0
aiecs/infrastructure/graph_storage/batch_operations.py +449 -0
aiecs/infrastructure/graph_storage/cache.py +429 -0
aiecs/infrastructure/graph_storage/distributed.py +226 -0
aiecs/infrastructure/graph_storage/error_handling.py +390 -0
aiecs/infrastructure/graph_storage/graceful_degradation.py +306 -0
aiecs/infrastructure/graph_storage/health_checks.py +378 -0
aiecs/infrastructure/graph_storage/in_memory.py +514 -0
aiecs/infrastructure/graph_storage/index_optimization.py +483 -0
aiecs/infrastructure/graph_storage/lazy_loading.py +410 -0
aiecs/infrastructure/graph_storage/metrics.py +357 -0
aiecs/infrastructure/graph_storage/migration.py +413 -0
aiecs/infrastructure/graph_storage/pagination.py +471 -0
aiecs/infrastructure/graph_storage/performance_monitoring.py +466 -0
aiecs/infrastructure/graph_storage/postgres.py +871 -0
aiecs/infrastructure/graph_storage/query_optimizer.py +635 -0
aiecs/infrastructure/graph_storage/schema_cache.py +290 -0
aiecs/infrastructure/graph_storage/sqlite.py +623 -0
aiecs/infrastructure/graph_storage/streaming.py +495 -0
aiecs/infrastructure/messaging/__init__.py +13 -0
aiecs/infrastructure/messaging/celery_task_manager.py +383 -0
aiecs/infrastructure/messaging/websocket_manager.py +298 -0
aiecs/infrastructure/monitoring/__init__.py +34 -0
aiecs/infrastructure/monitoring/executor_metrics.py +174 -0
aiecs/infrastructure/monitoring/global_metrics_manager.py +213 -0
aiecs/infrastructure/monitoring/structured_logger.py +48 -0
aiecs/infrastructure/monitoring/tracing_manager.py +410 -0
aiecs/infrastructure/persistence/__init__.py +24 -0
aiecs/infrastructure/persistence/context_engine_client.py +187 -0
aiecs/infrastructure/persistence/database_manager.py +333 -0
aiecs/infrastructure/persistence/file_storage.py +754 -0
aiecs/infrastructure/persistence/redis_client.py +220 -0
aiecs/llm/__init__.py +86 -0
aiecs/llm/callbacks/__init__.py +11 -0
aiecs/llm/callbacks/custom_callbacks.py +264 -0
aiecs/llm/client_factory.py +420 -0
aiecs/llm/clients/__init__.py +33 -0
aiecs/llm/clients/base_client.py +193 -0
aiecs/llm/clients/googleai_client.py +181 -0
aiecs/llm/clients/openai_client.py +131 -0
aiecs/llm/clients/vertex_client.py +437 -0
aiecs/llm/clients/xai_client.py +184 -0
aiecs/llm/config/__init__.py +51 -0
aiecs/llm/config/config_loader.py +275 -0
aiecs/llm/config/config_validator.py +236 -0
aiecs/llm/config/model_config.py +151 -0
aiecs/llm/utils/__init__.py +10 -0
aiecs/llm/utils/validate_config.py +91 -0
aiecs/main.py +363 -0
aiecs/scripts/__init__.py +3 -0
aiecs/scripts/aid/VERSION_MANAGEMENT.md +97 -0
aiecs/scripts/aid/__init__.py +19 -0
aiecs/scripts/aid/version_manager.py +215 -0
aiecs/scripts/dependance_check/DEPENDENCY_SYSTEM_SUMMARY.md +242 -0
aiecs/scripts/dependance_check/README_DEPENDENCY_CHECKER.md +310 -0
aiecs/scripts/dependance_check/__init__.py +17 -0
aiecs/scripts/dependance_check/dependency_checker.py +938 -0
aiecs/scripts/dependance_check/dependency_fixer.py +391 -0
aiecs/scripts/dependance_check/download_nlp_data.py +396 -0
aiecs/scripts/dependance_check/quick_dependency_check.py +270 -0
aiecs/scripts/dependance_check/setup_nlp_data.sh +217 -0
aiecs/scripts/dependance_patch/__init__.py +7 -0
aiecs/scripts/dependance_patch/fix_weasel/README_WEASEL_PATCH.md +126 -0
aiecs/scripts/dependance_patch/fix_weasel/__init__.py +11 -0
aiecs/scripts/dependance_patch/fix_weasel/fix_weasel_validator.py +128 -0
aiecs/scripts/dependance_patch/fix_weasel/fix_weasel_validator.sh +82 -0
aiecs/scripts/dependance_patch/fix_weasel/patch_weasel_library.sh +188 -0
aiecs/scripts/dependance_patch/fix_weasel/run_weasel_patch.sh +41 -0
aiecs/scripts/tools_develop/README.md +449 -0
aiecs/scripts/tools_develop/TOOL_AUTO_DISCOVERY.md +234 -0
aiecs/scripts/tools_develop/__init__.py +21 -0
aiecs/scripts/tools_develop/check_type_annotations.py +259 -0
aiecs/scripts/tools_develop/validate_tool_schemas.py +422 -0
aiecs/scripts/tools_develop/verify_tools.py +356 -0
aiecs/tasks/__init__.py +1 -0
aiecs/tasks/worker.py +172 -0
aiecs/tools/__init__.py +299 -0
aiecs/tools/apisource/__init__.py +99 -0
aiecs/tools/apisource/intelligence/__init__.py +19 -0
aiecs/tools/apisource/intelligence/data_fusion.py +381 -0
aiecs/tools/apisource/intelligence/query_analyzer.py +413 -0
aiecs/tools/apisource/intelligence/search_enhancer.py +388 -0
aiecs/tools/apisource/monitoring/__init__.py +9 -0
aiecs/tools/apisource/monitoring/metrics.py +303 -0
aiecs/tools/apisource/providers/__init__.py +115 -0
aiecs/tools/apisource/providers/base.py +664 -0
aiecs/tools/apisource/providers/census.py +401 -0
aiecs/tools/apisource/providers/fred.py +564 -0
aiecs/tools/apisource/providers/newsapi.py +412 -0
aiecs/tools/apisource/providers/worldbank.py +357 -0
aiecs/tools/apisource/reliability/__init__.py +12 -0
aiecs/tools/apisource/reliability/error_handler.py +375 -0
aiecs/tools/apisource/reliability/fallback_strategy.py +391 -0
aiecs/tools/apisource/tool.py +850 -0
aiecs/tools/apisource/utils/__init__.py +9 -0
aiecs/tools/apisource/utils/validators.py +338 -0
aiecs/tools/base_tool.py +201 -0
aiecs/tools/docs/__init__.py +121 -0
aiecs/tools/docs/ai_document_orchestrator.py +599 -0
aiecs/tools/docs/ai_document_writer_orchestrator.py +2403 -0
aiecs/tools/docs/content_insertion_tool.py +1333 -0
aiecs/tools/docs/document_creator_tool.py +1317 -0
aiecs/tools/docs/document_layout_tool.py +1166 -0
aiecs/tools/docs/document_parser_tool.py +994 -0
aiecs/tools/docs/document_writer_tool.py +1818 -0
aiecs/tools/knowledge_graph/__init__.py +17 -0
aiecs/tools/knowledge_graph/graph_reasoning_tool.py +734 -0
aiecs/tools/knowledge_graph/graph_search_tool.py +923 -0
aiecs/tools/knowledge_graph/kg_builder_tool.py +476 -0
aiecs/tools/langchain_adapter.py +542 -0
aiecs/tools/schema_generator.py +275 -0
aiecs/tools/search_tool/__init__.py +100 -0
aiecs/tools/search_tool/analyzers.py +589 -0
aiecs/tools/search_tool/cache.py +260 -0
aiecs/tools/search_tool/constants.py +128 -0
aiecs/tools/search_tool/context.py +216 -0
aiecs/tools/search_tool/core.py +749 -0
aiecs/tools/search_tool/deduplicator.py +123 -0
aiecs/tools/search_tool/error_handler.py +271 -0
aiecs/tools/search_tool/metrics.py +371 -0
aiecs/tools/search_tool/rate_limiter.py +178 -0
aiecs/tools/search_tool/schemas.py +277 -0
aiecs/tools/statistics/__init__.py +80 -0
aiecs/tools/statistics/ai_data_analysis_orchestrator.py +643 -0
aiecs/tools/statistics/ai_insight_generator_tool.py +505 -0
aiecs/tools/statistics/ai_report_orchestrator_tool.py +694 -0
aiecs/tools/statistics/data_loader_tool.py +564 -0
aiecs/tools/statistics/data_profiler_tool.py +658 -0
aiecs/tools/statistics/data_transformer_tool.py +573 -0
aiecs/tools/statistics/data_visualizer_tool.py +495 -0
aiecs/tools/statistics/model_trainer_tool.py +487 -0
aiecs/tools/statistics/statistical_analyzer_tool.py +459 -0
aiecs/tools/task_tools/__init__.py +86 -0
aiecs/tools/task_tools/chart_tool.py +732 -0
aiecs/tools/task_tools/classfire_tool.py +922 -0
aiecs/tools/task_tools/image_tool.py +447 -0
aiecs/tools/task_tools/office_tool.py +684 -0
aiecs/tools/task_tools/pandas_tool.py +635 -0
aiecs/tools/task_tools/report_tool.py +635 -0
aiecs/tools/task_tools/research_tool.py +392 -0
aiecs/tools/task_tools/scraper_tool.py +715 -0
aiecs/tools/task_tools/stats_tool.py +688 -0
aiecs/tools/temp_file_manager.py +130 -0
aiecs/tools/tool_executor/__init__.py +37 -0
aiecs/tools/tool_executor/tool_executor.py +881 -0
aiecs/utils/LLM_output_structor.py +445 -0
aiecs/utils/__init__.py +34 -0
aiecs/utils/base_callback.py +47 -0
aiecs/utils/cache_provider.py +695 -0
aiecs/utils/execution_utils.py +184 -0
aiecs/utils/logging.py +1 -0
aiecs/utils/prompt_loader.py +14 -0
aiecs/utils/token_usage_repository.py +323 -0
aiecs/ws/__init__.py +0 -0
aiecs/ws/socket_server.py +52 -0
aiecs-1.5.1.dist-info/METADATA +608 -0
aiecs-1.5.1.dist-info/RECORD +302 -0
aiecs-1.5.1.dist-info/WHEEL +5 -0
aiecs-1.5.1.dist-info/entry_points.txt +10 -0
aiecs-1.5.1.dist-info/licenses/LICENSE +225 -0
aiecs-1.5.1.dist-info/top_level.txt +1 -0

aiecs/application/knowledge_graph/retrieval/retrieval_strategies.py ADDED Viewed

@@ -0,0 +1,596 @@
+"""
+Advanced Retrieval Strategies
+Provides sophisticated retrieval methods including Personalized PageRank,
+multi-hop neighbor retrieval, filtered retrieval, and query caching.
+"""
+import asyncio
+from typing import List, Dict, Set, Optional, Tuple, Any, Callable
+from collections import defaultdict, deque
+import hashlib
+import json
+import time
+from aiecs.domain.knowledge_graph.models.entity import Entity
+from aiecs.infrastructure.graph_storage.base import GraphStore
class PersonalizedPageRank:
    """
    Personalized PageRank retrieval.

    Scores entities with a random walk with restart: at every step the
    walker either jumps back to one of the seed entities (probability
    ``alpha``) or follows an outgoing edge of the current entity chosen
    uniformly at random. Entities are returned ranked by their final score.

    Algorithm:
    1. Put the whole probability mass uniformly on the (de-duplicated) seeds
    2. Repeatedly redistribute the mass: ``alpha`` back to the seeds,
       ``1 - alpha`` along outgoing edges
    3. Stop when no score moves by more than ``convergence_threshold`` or
       after ``max_iterations`` rounds
    4. Return the best-scoring entities that exist in the store

    Example:
        ```python
        ppr = PersonalizedPageRank(graph_store)
        results = await ppr.retrieve(
            seed_entity_ids=["person_1"],
            max_results=10,
            alpha=0.15,  # restart probability
            max_iterations=100
        )
        for entity, score in results:
            print(f"{entity.id}: {score:.4f}")
        ```
    """

    def __init__(self, graph_store: "GraphStore"):
        """
        Initialize Personalized PageRank retrieval.

        Args:
            graph_store: Graph storage backend. Only its async
                ``get_neighbors`` and ``get_entity`` methods are used.
        """
        self.graph_store = graph_store

    async def retrieve(
        self,
        seed_entity_ids: List[str],
        max_results: int = 20,
        alpha: float = 0.15,
        max_iterations: int = 100,
        convergence_threshold: float = 1e-6,
    ) -> List[Tuple["Entity", float]]:
        """
        Retrieve entities using Personalized PageRank.

        Args:
            seed_entity_ids: Starting entities for the random walk.
                Duplicate ids are ignored.
            max_results: Maximum number of results to return. A value of
                zero or less yields an empty list.
            alpha: Restart probability (0.0-1.0).
            max_iterations: Maximum number of iterations.
            convergence_threshold: Stop once the largest per-entity score
                change in an iteration drops below this value.

        Returns:
            List of (entity, score) tuples sorted by score descending.
            Ids for which ``get_entity`` returns nothing are skipped.
        """
        if not seed_entity_ids or max_results <= 0:
            return []

        # De-duplicate while keeping caller order so that the initial
        # distribution always carries exactly unit mass.
        seeds = list(dict.fromkeys(seed_entity_ids))
        seed_share = 1.0 / len(seeds)
        scores: Dict[str, float] = {seed_id: seed_share for seed_id in seeds}

        # Outgoing neighbor ids per entity, fetched from the store only once.
        adjacency: Dict[str, List[str]] = {}

        for _ in range(max_iterations):
            new_scores: Dict[str, float] = defaultdict(float)

            # Restart step: mass `alpha` goes back to the seeds.
            for seed_id in seeds:
                new_scores[seed_id] += alpha * seed_share

            # Walk step: every entity forwards `1 - alpha` of its mass.
            for entity_id, score in scores.items():
                if score == 0:
                    continue

                neighbor_ids = adjacency.get(entity_id)
                if neighbor_ids is None:
                    neighbors = await self.graph_store.get_neighbors(
                        entity_id, direction="outgoing"
                    )
                    neighbor_ids = [neighbor.id for neighbor in neighbors]
                    adjacency[entity_id] = neighbor_ids

                walk_mass = (1 - alpha) * score
                if neighbor_ids:
                    share = walk_mass / len(neighbor_ids)
                    for neighbor_id in neighbor_ids:
                        new_scores[neighbor_id] += share
                else:
                    # Dangling entity (no outgoing edges): hand its mass
                    # back to the seeds so the total stays constant.
                    for seed_id in seeds:
                        new_scores[seed_id] += walk_mass * seed_share

            # Largest absolute change of any score in this iteration.
            max_delta = max(
                (
                    abs(new_scores.get(key, 0.0) - scores.get(key, 0.0))
                    for key in scores.keys() | new_scores.keys()
                ),
                default=0.0,
            )
            scores = new_scores
            if max_delta < convergence_threshold:
                break

        # Rank ids first, then fetch entities only until enough are found;
        # this avoids loading every reachable entity from the store.
        ranked = sorted(
            ((entity_id, score) for entity_id, score in scores.items() if score > 0),
            key=lambda item: item[1],
            reverse=True,
        )
        results: List[Tuple["Entity", float]] = []
        for entity_id, score in ranked:
            entity = await self.graph_store.get_entity(entity_id)
            if entity:
                results.append((entity, score))
                if len(results) >= max_results:
                    break
        return results
class MultiHopRetrieval:
    """
    Multi-hop neighbor retrieval.

    Expands breadth-first along outgoing edges from the seed entities and
    scores every reached entity by the hop distance at which it was first
    reached.

    Features:
    - Breadth-first expansion from seeds
    - Hop-distance based scoring (``score_decay ** hop``)
    - Relation type filtering
    - Entity deduplication (each entity keeps its first, i.e. best, score)

    Example:
        ```python
        retrieval = MultiHopRetrieval(graph_store)
        results = await retrieval.retrieve(
            seed_entity_ids=["entity_1"],
            max_hops=2,
            max_results=20,
            relation_types=["RELATED_TO"]  # Optional filter
        )
        ```
    """

    def __init__(self, graph_store: "GraphStore"):
        """
        Initialize multi-hop retrieval.

        Args:
            graph_store: Graph storage backend. Only its async
                ``get_neighbors`` and ``get_entity`` methods are used.
        """
        self.graph_store = graph_store

    async def _neighbor_ids(
        self, entity_id: str, relation_types: Optional[List[str]]
    ) -> List[str]:
        """Return de-duplicated outgoing neighbor ids, honoring the relation filter."""
        # An empty/None filter means "follow every relation type".
        wanted: List[Optional[str]] = (
            list(dict.fromkeys(relation_types)) if relation_types else [None]
        )
        found: Dict[str, None] = {}  # dict used as an insertion-ordered set
        for relation_type in wanted:
            # NOTE(review): the filter relies on the store honoring the
            # `relation_type` argument of get_neighbors - confirm for
            # custom GraphStore implementations.
            neighbors = await self.graph_store.get_neighbors(
                entity_id, relation_type=relation_type, direction="outgoing"
            )
            for neighbor in neighbors:
                found[neighbor.id] = None
        return list(found)

    async def retrieve(
        self,
        seed_entity_ids: List[str],
        max_hops: int = 2,
        max_results: int = 50,
        relation_types: Optional[List[str]] = None,
        score_decay: float = 0.5,
        include_seeds: bool = True,
    ) -> List[Tuple["Entity", float]]:
        """
        Retrieve entities within N hops from the seeds.

        Args:
            seed_entity_ids: Starting entities.
            max_hops: Maximum number of hops to expand.
            max_results: Maximum number of results. A value of zero or
                less yields an empty list.
            relation_types: Optional list of allowed relation types. When
                given, only edges of these types are followed; ``None`` or
                an empty list follows every edge.
            score_decay: Score decay factor per hop (0.0-1.0).
            include_seeds: Whether to include seed entities in results.

        Returns:
            List of (entity, score) tuples sorted by score descending.
            Ids for which ``get_entity`` returns nothing are skipped.
        """
        if not seed_entity_ids or max_results <= 0:
            return []

        # entity id -> score; membership doubles as the "visited" marker.
        # BFS guarantees the first visit is at the smallest hop distance,
        # so the first score assigned is already the best one.
        entity_scores: Dict[str, float] = {}

        # Ordered frontiers keep the ordering of equally scored results
        # deterministic (seed order, then discovery order).
        frontier: List[str] = list(dict.fromkeys(seed_entity_ids))
        for hop in range(max_hops + 1):
            if not frontier:
                break
            hop_score = score_decay**hop
            next_frontier: Dict[str, None] = {}
            for entity_id in frontier:
                if entity_id in entity_scores:
                    continue
                entity_scores[entity_id] = hop_score
                if hop < max_hops:
                    for neighbor_id in await self._neighbor_ids(entity_id, relation_types):
                        if neighbor_id not in entity_scores:
                            next_frontier[neighbor_id] = None
            frontier = list(next_frontier)

        if not include_seeds:
            for seed_id in seed_entity_ids:
                entity_scores.pop(seed_id, None)

        # Rank ids first so that entities are fetched only until enough
        # existing ones have been collected.
        ranked = sorted(entity_scores.items(), key=lambda item: item[1], reverse=True)
        results: List[Tuple["Entity", float]] = []
        for entity_id, score in ranked:
            entity = await self.graph_store.get_entity(entity_id)
            if entity:
                results.append((entity, score))
                if len(results) >= max_results:
                    break
        return results
class FilteredRetrieval:
    """
    Filtered retrieval strategy.

    Retrieves entities from the graph with flexible filtering by:
    - Entity type
    - Property values
    - Property existence
    - Custom filter functions

    All supplied criteria must match (strict AND semantics).

    Limitation: candidates are obtained through ``vector_search`` with a
    placeholder embedding and an entity type filter, because the store
    interface used here offers no direct entity scan. Consequently a call
    without ``entity_type`` returns no results.

    Example:
        ```python
        retrieval = FilteredRetrieval(graph_store)
        # Filter by entity type and property
        results = await retrieval.retrieve(
            entity_type="Person",
            property_filters={"role": "Engineer"},
            max_results=20
        )
        # Custom filter function
        results = await retrieval.retrieve(
            filter_fn=lambda e: e.properties.get("age", 0) > 30,
            max_results=10
        )
        ```
    """

    def __init__(
        self,
        graph_store: "GraphStore",
        embedding_dim: int = 128,
        candidate_limit: int = 1000,
    ):
        """
        Initialize filtered retrieval.

        Args:
            graph_store: Graph storage backend. Only its async
                ``vector_search`` method is used.
            embedding_dim: Length of the all-zero placeholder embedding
                passed to ``vector_search``.
                NOTE(review): presumably this should match the store's
                embedding dimension - confirm against the backend.
            candidate_limit: Maximum number of candidates requested from
                the store before filters are applied.
        """
        self.graph_store = graph_store
        self.embedding_dim = embedding_dim
        self.candidate_limit = candidate_limit

    @staticmethod
    def _matches(
        entity: "Entity",
        entity_type: Optional[str],
        property_filters: Optional[Dict[str, Any]],
        property_exists: Optional[List[str]],
        filter_fn: Optional[Callable[["Entity"], bool]],
    ) -> bool:
        """Return True when the entity satisfies every supplied criterion."""
        if entity_type and entity.entity_type != entity_type:
            return False
        if property_filters and not all(
            entity.properties.get(key) == expected
            for key, expected in property_filters.items()
        ):
            return False
        if property_exists and not all(
            key in entity.properties for key in property_exists
        ):
            return False
        if filter_fn:
            try:
                return bool(filter_fn(entity))
            except Exception:
                # Deliberate best effort: a user filter that raises on an
                # entity (e.g. a missing property) just rejects that entity.
                return False
        return True

    async def retrieve(
        self,
        entity_type: Optional[str] = None,
        property_filters: Optional[Dict[str, Any]] = None,
        property_exists: Optional[List[str]] = None,
        filter_fn: Optional[Callable[["Entity"], bool]] = None,
        max_results: int = 100,
        score_by_match_count: bool = False,
    ) -> List[Tuple["Entity", float]]:
        """
        Retrieve entities with flexible filtering.

        Args:
            entity_type: Filter by entity type. Required in practice:
                without it no candidates can be fetched and the result is
                empty.
            property_filters: Filter by property values (key: value).
            property_exists: Filter by property existence (list of keys).
            filter_fn: Custom filter function; entities for which it
                returns a falsy value or raises are dropped.
            max_results: Maximum number of results. A value of zero or
                less yields an empty list.
            score_by_match_count: Kept for interface compatibility. Since
                matching is strict, every returned entity matches all
                criteria, so the matched fraction - and thus the score -
                is 1.0 either way.

        Returns:
            List of (entity, 1.0) tuples in the order the store returned
            the candidates.
        """
        if not entity_type or max_results <= 0:
            return []

        # Workaround: a zero vector with score_threshold=0.0 is used to
        # list entities of the requested type through vector search.
        candidates = await self.graph_store.vector_search(
            query_embedding=[0.0] * self.embedding_dim,
            entity_type=entity_type,
            max_results=self.candidate_limit,
            score_threshold=0.0,
        )

        results: List[Tuple["Entity", float]] = []
        for entity, _ in candidates:
            if self._matches(
                entity, entity_type, property_filters, property_exists, filter_fn
            ):
                results.append((entity, 1.0))
                if len(results) >= max_results:
                    break
        # All scores are equal, so candidate order is already the final order.
        return results
class RetrievalCache:
    """
    Query caching for retrieval.

    Caches retrieval results to improve performance for frequent queries.
    Uses an LRU eviction policy and TTL-based expiration.

    Features:
    - LRU cache with configurable size
    - TTL-based expiration (checked lazily when a key is looked up)
    - Query fingerprinting
    - Cache statistics

    Example:
        ```python
        cache = RetrievalCache(max_size=100, ttl=300)  # 5 minutes TTL
        # Wrap retrieval operation
        results = await cache.get_or_compute(
            cache_key="query_1",
            compute_fn=lambda: retrieval.retrieve(...)
        )
        # Check cache statistics
        stats = cache.get_stats()
        print(f"Hit rate: {stats['hit_rate']:.2%}")
        ```
    """

    def __init__(self, max_size: int = 1000, ttl: int = 300):
        """
        Initialize retrieval cache.

        Args:
            max_size: Maximum number of cached entries.
            ttl: Time-to-live for cache entries in seconds.
        """
        self.max_size = max_size
        self.ttl = ttl
        # key -> (value, timestamp of insertion as returned by time.time())
        self._cache: Dict[str, Tuple[Any, float]] = {}
        # Keys ordered from least to most recently used.
        self._access_order: deque = deque()
        self._hits = 0
        self._misses = 0

    def _generate_key(self, **kwargs) -> str:
        """
        Generate a cache key from query parameters.

        Args:
            **kwargs: Query parameters; values must be JSON-serializable.

        Returns:
            Hex digest that is independent of keyword order.
        """
        # Sort so that the same parameters always hash to the same key.
        key_str = json.dumps(sorted(kwargs.items()), sort_keys=True)
        # MD5 serves only as a compact fingerprint here, not for security.
        return hashlib.md5(key_str.encode()).hexdigest()

    def _is_expired(self, timestamp: float) -> bool:
        """Return True when an entry stored at ``timestamp`` has outlived the TTL."""
        return (time.time() - timestamp) > self.ttl

    def _touch(self, cache_key: str) -> None:
        """Mark ``cache_key`` as most recently used, keeping it unique in the order."""
        try:
            self._access_order.remove(cache_key)
        except ValueError:
            pass  # key was not tracked yet
        self._access_order.append(cache_key)

    def _evict_lru(self):
        """Evict the least recently used entry that is still cached."""
        while self._access_order:
            lru_key = self._access_order.popleft()
            if lru_key in self._cache:
                del self._cache[lru_key]
                return
        # Order tracking ran dry while entries remain: drop the oldest
        # inserted entry so callers looping on the size always make progress.
        if self._cache:
            del self._cache[next(iter(self._cache))]

    async def get_or_compute(
        self,
        cache_key: Optional[str] = None,
        compute_fn: Optional[Callable] = None,
        **kwargs,
    ) -> Any:
        """
        Get a cached result, or compute and cache it.

        Args:
            cache_key: Optional explicit cache key.
            compute_fn: Zero-argument callable producing the result on a
                cache miss. It may be an async function, or a plain
                callable (e.g. a lambda) that returns an awaitable; in both
                cases the awaited value is what gets cached.
            **kwargs: Parameters for cache key generation when no explicit
                ``cache_key`` is given.

        Returns:
            Cached or computed result; ``None`` on a miss without
            ``compute_fn``.
        """
        # Local import keeps the module's top-level import block unchanged.
        import inspect

        if cache_key is None:
            cache_key = self._generate_key(**kwargs)

        cached = self._cache.get(cache_key)
        if cached is not None:
            result, timestamp = cached
            if not self._is_expired(timestamp):
                self._hits += 1
                self._touch(cache_key)
                return result
            # Expired entries are dropped on access and treated as a miss.
            self.invalidate(cache_key)

        self._misses += 1
        if compute_fn is None:
            return None

        result = compute_fn()
        # Covers async functions as well as sync callables returning a
        # coroutine/future; caching the un-awaited object would hand every
        # later hit a coroutine that cannot be awaited twice.
        if inspect.isawaitable(result):
            result = await result

        self._cache[cache_key] = (result, time.time())
        self._touch(cache_key)

        while self._cache and len(self._cache) > self.max_size:
            self._evict_lru()
        return result

    def invalidate(self, cache_key: str):
        """Invalidate a specific cache entry (no-op for unknown keys)."""
        if self._cache.pop(cache_key, None) is not None:
            try:
                self._access_order.remove(cache_key)
            except ValueError:
                pass

    def clear(self):
        """Clear all cache entries (hit/miss counters are kept)."""
        self._cache.clear()
        self._access_order.clear()

    def get_stats(self) -> Dict[str, Any]:
        """
        Get cache statistics.

        Returns:
            Dictionary with hits, misses, total_requests, hit_rate
            (0.0 when nothing was requested yet), cache_size, max_size
            and ttl.
        """
        total_requests = self._hits + self._misses
        hit_rate = self._hits / total_requests if total_requests > 0 else 0.0
        return {
            "hits": self._hits,
            "misses": self._misses,
            "total_requests": total_requests,
            "hit_rate": hit_rate,
            "cache_size": len(self._cache),
            "max_size": self.max_size,
            "ttl": self.ttl,
        }
+# NOTE: asyncio is imported with the other imports at the top of this module; no import is needed here.

aiecs/application/knowledge_graph/search/__init__.py ADDED Viewed

@@ -0,0 +1,59 @@
+"""
+Knowledge Graph Search Application Layer
+Advanced search strategies including hybrid search and text similarity utilities.
+"""
+from aiecs.application.knowledge_graph.search.hybrid_search import (
+    HybridSearchStrategy,
+    HybridSearchConfig,
+    SearchMode,
+)
+from aiecs.application.knowledge_graph.search.text_similarity import (
+    TextSimilarity,
+    BM25Scorer,
+    jaccard_similarity,
+    jaccard_similarity_text,
+    cosine_similarity_text,
+    levenshtein_distance,
+    normalized_levenshtein_similarity,
+    fuzzy_match,
+)
+from aiecs.application.knowledge_graph.search.reranker import (
+    RerankerStrategy,
+    ResultReranker,
+    ScoreCombinationMethod,
+    normalize_scores,
+    combine_scores,
+)
+from aiecs.application.knowledge_graph.search.reranker_strategies import (
+    TextSimilarityReranker,
+    SemanticReranker,
+    StructuralReranker,
+    HybridReranker,
+    CrossEncoderReranker,
+)
+__all__ = [
+    "HybridSearchStrategy",
+    "HybridSearchConfig",
+    "SearchMode",
+    "TextSimilarity",
+    "BM25Scorer",
+    "jaccard_similarity",
+    "jaccard_similarity_text",
+    "cosine_similarity_text",
+    "levenshtein_distance",
+    "normalized_levenshtein_similarity",
+    "fuzzy_match",
+    "RerankerStrategy",
+    "ResultReranker",
+    "ScoreCombinationMethod",
+    "normalize_scores",
+    "combine_scores",
+    "TextSimilarityReranker",
+    "SemanticReranker",
+    "StructuralReranker",
+    "HybridReranker",
+    "CrossEncoderReranker",
+]