PyPI - orchestrator-core - Versions diffs - 4.6.2__py3-none-any.whl → 4.6.3rc1__py3-none-any.whl - Mend

orchestrator-core 4.6.2__py3-none-any.whl → 4.6.3rc1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (42)

orchestrator/__init__.py +1 -1
orchestrator/api/api_v1/endpoints/search.py +44 -34
orchestrator/{search/retrieval/utils.py → cli/search/display.py} +4 -29
orchestrator/cli/search/search_explore.py +22 -24
orchestrator/cli/search/speedtest.py +11 -9
orchestrator/db/models.py +6 -6
orchestrator/log_config.py +2 -0
orchestrator/schemas/search.py +1 -1
orchestrator/schemas/search_requests.py +59 -0
orchestrator/search/agent/handlers.py +129 -0
orchestrator/search/agent/prompts.py +54 -33
orchestrator/search/agent/state.py +9 -24
orchestrator/search/agent/tools.py +223 -144
orchestrator/search/agent/validation.py +80 -0
orchestrator/search/{schemas → aggregations}/__init__.py +20 -0
orchestrator/search/aggregations/base.py +201 -0
orchestrator/search/core/types.py +3 -2
orchestrator/search/filters/__init__.py +4 -0
orchestrator/search/filters/definitions.py +22 -1
orchestrator/search/filters/numeric_filter.py +3 -3
orchestrator/search/llm_migration.py +2 -1
orchestrator/search/query/__init__.py +90 -0
orchestrator/search/query/builder.py +285 -0
orchestrator/search/query/engine.py +162 -0
orchestrator/search/{retrieval → query}/exceptions.py +38 -7
orchestrator/search/query/mixins.py +95 -0
orchestrator/search/query/queries.py +129 -0
orchestrator/search/query/results.py +252 -0
orchestrator/search/{retrieval/query_state.py → query/state.py} +31 -11
orchestrator/search/{retrieval → query}/validation.py +58 -1
orchestrator/search/retrieval/__init__.py +0 -5
orchestrator/search/retrieval/pagination.py +7 -8
orchestrator/search/retrieval/retrievers/base.py +9 -9
{orchestrator_core-4.6.2.dist-info → orchestrator_core-4.6.3rc1.dist-info}/METADATA +6 -6
{orchestrator_core-4.6.2.dist-info → orchestrator_core-4.6.3rc1.dist-info}/RECORD +38 -32
orchestrator/search/retrieval/builder.py +0 -127
orchestrator/search/retrieval/engine.py +0 -197
orchestrator/search/schemas/parameters.py +0 -133
orchestrator/search/schemas/results.py +0 -80
orchestrator/search/{export.py → query/export.py} +0 -0
{orchestrator_core-4.6.2.dist-info → orchestrator_core-4.6.3rc1.dist-info}/WHEEL +0 -0
{orchestrator_core-4.6.2.dist-info → orchestrator_core-4.6.3rc1.dist-info}/licenses/LICENSE +0 -0

orchestrator/search/agent/prompts.py CHANGED Viewed

@@ -19,6 +19,7 @@ from pydantic_ai import RunContext
 from pydantic_ai.ag_ui import StateDeps
 from orchestrator.search.agent.state import SearchState
+from orchestrator.search.core.types import ActionType
 logger = structlog.get_logger(__name__)
@@ -33,7 +34,6 @@ async def get_base_instructions() -> str:
         Your ultimate goal is to **find information** that answers the user's request.
-        To do this, you will perform either a broad search or a filtered search.
         For **filtered searches**, your primary method is to **construct a valid `FilterTree` object**.
         To do this correctly, you must infer the exact structure, operators, and nesting rules from the Pydantic schema of the `set_filter_tree` tool itself.
@@ -48,15 +48,19 @@ async def get_base_instructions() -> str:
         ---
         ### 3. Execution Workflow
-        Follow these steps in strict order:
+        Follow these steps:
-        1.  **Set Context**: If the user is asking for a NEW search, call `start_new_search`.
-        2.  **Analyze for Filters**: Based on the user's request, decide if specific filters are necessary.
-            - **If filters ARE required**, follow these sub-steps:
-                a. **Gather Intel**: Identify all needed field names, then call `discover_filter_paths` and `get_valid_operators` **once each** to get all required information.
-                b. **Construct FilterTree**: Build the `FilterTree` object.
-                c. **Set Filters**: Call `set_filter_tree`.
-        3.  **Execute**: Call `run_search`. This is done for both filtered and non-filtered searches.
+        1.  **Set Context**: Call `start_new_search` with appropriate entity_type and action
+        2.  **Set Filters** (if needed): Discover paths, build FilterTree, call `set_filter_tree`
+            - IMPORTANT: Temporal constraints like "in 2025", "in January", "between X and Y" require filters on datetime fields
+            - Filters restrict WHICH records to include; grouping controls HOW to aggregate them
+        3.  **Set Grouping/Aggregations** (for COUNT/AGGREGATE):
+            - For temporal grouping (per month, per year, per day, etc.): Use `set_temporal_grouping`
+            - For regular grouping (by status, by name, etc.): Use `set_grouping`
+            - For aggregations: Use `set_aggregations`
+        4.  **Execute**:
+            - For SELECT action: Call `run_search()`
+            - For COUNT/AGGREGATE actions: Call `run_aggregation()`
         After search execution, follow the dynamic instructions based on the current state.
@@ -73,31 +77,46 @@ async def get_base_instructions() -> str:
 async def get_dynamic_instructions(ctx: RunContext[StateDeps[SearchState]]) -> str:
     """Dynamically provides 'next step' coaching based on the current state."""
     state = ctx.deps.state
-    param_state_str = json.dumps(state.parameters, indent=2, default=str) if state.parameters else "Not set."
-    results_count = state.results_data.total_count if state.results_data else 0
+    query_state_str = json.dumps(state.query.model_dump(), indent=2, default=str) if state.query else "Not set."
+    results_count = state.results_count or 0
+    action = state.action or ActionType.SELECT
-    if state.export_data:
+    if not state.query:
         next_step_guidance = (
-            "INSTRUCTION: Export has been prepared successfully. "
-            "Simply confirm to the user that the export is ready for download. "
-            "DO NOT include or mention the download URL - the UI will display it automatically."
-        )
-    elif not state.parameters or not state.parameters.get("entity_type"):
-        next_step_guidance = (
-            "INSTRUCTION: The search context is not set. Your next action is to call `start_new_search`."
+            f"INSTRUCTION: The search context is not set. Your next action is to call `start_new_search`. "
+            f"For counting or aggregation queries, set action='{ActionType.COUNT.value}' or action='{ActionType.AGGREGATE.value}'."
         )
     elif results_count > 0:
-        next_step_guidance = dedent(
-            f"""
-            INSTRUCTION: Search completed successfully.
-            Found {results_count} results containing only: entity_id, title, score.
-            Choose your next action based on what the user requested:
-            1. **Broad/generic search** (e.g., 'show me subscriptions'): Confirm search completed and report count. Do nothing else.
-            2. **Question answerable with entity_id/title/score**: Answer directly using the current results.
-            3. **Question requiring other details**: Call `fetch_entity_details` first, then answer with the detailed data.
-            4. **Export request** (phrases like 'export', 'download', 'save as CSV'): Call `prepare_export` directly.
-            """
+        if action in (ActionType.COUNT, ActionType.AGGREGATE):
+            # Aggregation completed
+            next_step_guidance = (
+                "INSTRUCTION: Aggregation completed successfully. "
+                "The results are already displayed in the UI. "
+                "Simply confirm completion to the user in a brief sentence. "
+                "DO NOT repeat, summarize, or restate the aggregation data."
+            )
+        else:
+            # Search completed
+            next_step_guidance = dedent(
+                f"""
+                INSTRUCTION: Search completed successfully.
+                Found {results_count} results containing only: entity_id, title, score.
+                Choose your next action based on what the user requested:
+                1. **Broad/generic search** (e.g., 'show me subscriptions'): Confirm search completed and report count. Do not repeat the results.
+                2. **Question answerable with entity_id/title/score**: Answer directly using the current results.
+                3. **Question requiring other details**: Call `fetch_entity_details` first, then answer with the detailed data.
+                4. **Export request** (phrases like 'export', 'download', 'save as CSV'): Call `prepare_export` directly. Simply confirm the export is ready. Do not repeat the results.
+                """
+            )
+    elif action in (ActionType.COUNT, ActionType.AGGREGATE):
+        # COUNT or AGGREGATE action but no results yet
+        next_step_guidance = (
+            "INSTRUCTION: Aggregation context is set. "
+            "For temporal queries (per month, per year, over time): call `set_temporal_grouping` with datetime field and period. "
+            "For regular grouping: call `set_grouping` with paths to group by. "
+            f"For {ActionType.AGGREGATE.value.upper()}: call `set_aggregations` with aggregation specs. "
+            "Then call `run_aggregation`."
         )
     else:
         next_step_guidance = (
@@ -106,17 +125,19 @@ async def get_dynamic_instructions(ctx: RunContext[StateDeps[SearchState]]) -> s
             "If no specific filters are needed, you can proceed directly to `run_search`."
         )
+    status_summary = f"Results: {results_count}" if results_count > 0 else "No results yet"
     return dedent(
         f"""
         ---
         ## CURRENT STATE
-        **Current Search Parameters:**
+        **Current Query:**
         ```json
-        {param_state_str}
+        {query_state_str}
         ```
-        **Current Results Count:** {results_count}
+        **Status:** {status_summary}
         ---
         ## NEXT ACTION REQUIRED

orchestrator/search/agent/state.py CHANGED Viewed

@@ -11,37 +11,22 @@
 # See the License for the specific language governing permissions and
 # limitations under the License.
-from typing import Any
 from uuid import UUID
 from pydantic import BaseModel
-from orchestrator.search.schemas.results import SearchResult
+from orchestrator.search.core.types import ActionType
+from orchestrator.search.query.queries import Query
-class ExportData(BaseModel):
-    """Export metadata for download."""
-    action: str = "export"
-    query_id: str
-    download_url: str
-    message: str
-class SearchResultsData(BaseModel):
-    """Search results data for frontend display and agent context."""
-    action: str = "view_results"
-    query_id: str
-    results_url: str
-    total_count: int
-    message: str
-    results: list[SearchResult] = []
+class SearchState(BaseModel):
+    """Agent state for search operations.
+    Tracks the current search context and execution status.
+    """
-class SearchState(BaseModel):
     run_id: UUID | None = None
     query_id: UUID | None = None
-    parameters: dict[str, Any] | None = None
-    results_data: SearchResultsData | None = None
-    export_data: ExportData | None = None
+    action: ActionType | None = None
+    query: Query | None = None
+    results_count: int | None = None  # Number of results from last executed search/aggregation

orchestrator-core 4.6.2__py3-none-any.whl → 4.6.3rc1__py3-none-any.whl

orchestrator-core 4.6.2__py3-none-any.whl → 4.6.3rc1__py3-none-any.whl