holmesgpt 0.16.2a0__py3-none-any.whl → 0.18.4__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (162)
  1. holmes/__init__.py +3 -5
  2. holmes/clients/robusta_client.py +4 -3
  3. holmes/common/env_vars.py +18 -2
  4. holmes/common/openshift.py +1 -1
  5. holmes/config.py +11 -6
  6. holmes/core/conversations.py +30 -13
  7. holmes/core/investigation.py +21 -25
  8. holmes/core/investigation_structured_output.py +3 -3
  9. holmes/core/issue.py +1 -1
  10. holmes/core/llm.py +50 -31
  11. holmes/core/models.py +19 -17
  12. holmes/core/openai_formatting.py +1 -1
  13. holmes/core/prompt.py +47 -2
  14. holmes/core/runbooks.py +1 -0
  15. holmes/core/safeguards.py +4 -2
  16. holmes/core/supabase_dal.py +4 -2
  17. holmes/core/tool_calling_llm.py +102 -141
  18. holmes/core/tools.py +19 -28
  19. holmes/core/tools_utils/token_counting.py +9 -2
  20. holmes/core/tools_utils/tool_context_window_limiter.py +13 -30
  21. holmes/core/tools_utils/tool_executor.py +0 -18
  22. holmes/core/tools_utils/toolset_utils.py +1 -0
  23. holmes/core/toolset_manager.py +37 -2
  24. holmes/core/tracing.py +13 -2
  25. holmes/core/transformers/__init__.py +1 -1
  26. holmes/core/transformers/base.py +1 -0
  27. holmes/core/transformers/llm_summarize.py +3 -2
  28. holmes/core/transformers/registry.py +2 -1
  29. holmes/core/transformers/transformer.py +1 -0
  30. holmes/core/truncation/compaction.py +37 -2
  31. holmes/core/truncation/input_context_window_limiter.py +3 -2
  32. holmes/interactive.py +52 -8
  33. holmes/main.py +17 -37
  34. holmes/plugins/interfaces.py +2 -1
  35. holmes/plugins/prompts/__init__.py +2 -1
  36. holmes/plugins/prompts/_fetch_logs.jinja2 +5 -5
  37. holmes/plugins/prompts/_runbook_instructions.jinja2 +2 -1
  38. holmes/plugins/prompts/base_user_prompt.jinja2 +7 -0
  39. holmes/plugins/prompts/conversation_history_compaction.jinja2 +2 -1
  40. holmes/plugins/prompts/generic_ask.jinja2 +0 -2
  41. holmes/plugins/prompts/generic_ask_conversation.jinja2 +0 -2
  42. holmes/plugins/prompts/generic_ask_for_issue_conversation.jinja2 +0 -2
  43. holmes/plugins/prompts/generic_investigation.jinja2 +0 -2
  44. holmes/plugins/prompts/investigation_procedure.jinja2 +2 -1
  45. holmes/plugins/prompts/kubernetes_workload_ask.jinja2 +0 -2
  46. holmes/plugins/prompts/kubernetes_workload_chat.jinja2 +0 -2
  47. holmes/plugins/runbooks/__init__.py +32 -3
  48. holmes/plugins/sources/github/__init__.py +4 -2
  49. holmes/plugins/sources/prometheus/models.py +1 -0
  50. holmes/plugins/toolsets/__init__.py +30 -26
  51. holmes/plugins/toolsets/atlas_mongodb/mongodb_atlas.py +13 -12
  52. holmes/plugins/toolsets/azure_sql/apis/alert_monitoring_api.py +3 -2
  53. holmes/plugins/toolsets/azure_sql/apis/azure_sql_api.py +2 -1
  54. holmes/plugins/toolsets/azure_sql/apis/connection_failure_api.py +3 -2
  55. holmes/plugins/toolsets/azure_sql/apis/connection_monitoring_api.py +3 -1
  56. holmes/plugins/toolsets/azure_sql/apis/storage_analysis_api.py +3 -1
  57. holmes/plugins/toolsets/azure_sql/azure_sql_toolset.py +12 -12
  58. holmes/plugins/toolsets/azure_sql/tools/analyze_connection_failures.py +7 -7
  59. holmes/plugins/toolsets/azure_sql/tools/analyze_database_connections.py +7 -7
  60. holmes/plugins/toolsets/azure_sql/tools/analyze_database_health_status.py +3 -5
  61. holmes/plugins/toolsets/azure_sql/tools/analyze_database_performance.py +3 -3
  62. holmes/plugins/toolsets/azure_sql/tools/analyze_database_storage.py +7 -7
  63. holmes/plugins/toolsets/azure_sql/tools/get_active_alerts.py +6 -8
  64. holmes/plugins/toolsets/azure_sql/tools/get_slow_queries.py +3 -3
  65. holmes/plugins/toolsets/azure_sql/tools/get_top_cpu_queries.py +3 -3
  66. holmes/plugins/toolsets/azure_sql/tools/get_top_data_io_queries.py +3 -3
  67. holmes/plugins/toolsets/azure_sql/tools/get_top_log_io_queries.py +3 -3
  68. holmes/plugins/toolsets/azure_sql/utils.py +0 -32
  69. holmes/plugins/toolsets/bash/argocd/__init__.py +3 -3
  70. holmes/plugins/toolsets/bash/aws/__init__.py +4 -4
  71. holmes/plugins/toolsets/bash/azure/__init__.py +4 -4
  72. holmes/plugins/toolsets/bash/bash_toolset.py +2 -3
  73. holmes/plugins/toolsets/bash/common/bash.py +19 -9
  74. holmes/plugins/toolsets/bash/common/bash_command.py +1 -1
  75. holmes/plugins/toolsets/bash/common/stringify.py +1 -1
  76. holmes/plugins/toolsets/bash/kubectl/__init__.py +2 -1
  77. holmes/plugins/toolsets/bash/kubectl/constants.py +0 -1
  78. holmes/plugins/toolsets/bash/kubectl/kubectl_get.py +3 -4
  79. holmes/plugins/toolsets/bash/parse_command.py +12 -13
  80. holmes/plugins/toolsets/connectivity_check.py +124 -0
  81. holmes/plugins/toolsets/coralogix/api.py +132 -119
  82. holmes/plugins/toolsets/coralogix/coralogix.jinja2 +14 -0
  83. holmes/plugins/toolsets/coralogix/toolset_coralogix.py +219 -0
  84. holmes/plugins/toolsets/coralogix/utils.py +15 -79
  85. holmes/plugins/toolsets/datadog/datadog_api.py +36 -3
  86. holmes/plugins/toolsets/datadog/datadog_logs_instructions.jinja2 +34 -1
  87. holmes/plugins/toolsets/datadog/datadog_metrics_instructions.jinja2 +3 -3
  88. holmes/plugins/toolsets/datadog/datadog_models.py +59 -0
  89. holmes/plugins/toolsets/datadog/datadog_url_utils.py +213 -0
  90. holmes/plugins/toolsets/datadog/instructions_datadog_traces.jinja2 +165 -28
  91. holmes/plugins/toolsets/datadog/toolset_datadog_general.py +71 -28
  92. holmes/plugins/toolsets/datadog/toolset_datadog_logs.py +224 -375
  93. holmes/plugins/toolsets/datadog/toolset_datadog_metrics.py +67 -36
  94. holmes/plugins/toolsets/datadog/toolset_datadog_traces.py +360 -343
  95. holmes/plugins/toolsets/elasticsearch/__init__.py +6 -0
  96. holmes/plugins/toolsets/elasticsearch/elasticsearch.py +834 -0
  97. holmes/plugins/toolsets/git.py +7 -8
  98. holmes/plugins/toolsets/grafana/base_grafana_toolset.py +16 -4
  99. holmes/plugins/toolsets/grafana/common.py +2 -30
  100. holmes/plugins/toolsets/grafana/grafana_tempo_api.py +2 -1
  101. holmes/plugins/toolsets/grafana/loki/instructions.jinja2 +18 -2
  102. holmes/plugins/toolsets/grafana/loki/toolset_grafana_loki.py +92 -18
  103. holmes/plugins/toolsets/grafana/loki_api.py +4 -0
  104. holmes/plugins/toolsets/grafana/toolset_grafana.py +109 -25
  105. holmes/plugins/toolsets/grafana/toolset_grafana_dashboard.jinja2 +22 -0
  106. holmes/plugins/toolsets/grafana/toolset_grafana_tempo.py +201 -33
  107. holmes/plugins/toolsets/grafana/trace_parser.py +3 -2
  108. holmes/plugins/toolsets/internet/internet.py +10 -10
  109. holmes/plugins/toolsets/internet/notion.py +5 -6
  110. holmes/plugins/toolsets/investigator/core_investigation.py +3 -3
  111. holmes/plugins/toolsets/investigator/model.py +3 -1
  112. holmes/plugins/toolsets/json_filter_mixin.py +134 -0
  113. holmes/plugins/toolsets/kafka.py +12 -7
  114. holmes/plugins/toolsets/kubernetes.yaml +260 -30
  115. holmes/plugins/toolsets/kubernetes_logs.py +3 -3
  116. holmes/plugins/toolsets/logging_utils/logging_api.py +16 -6
  117. holmes/plugins/toolsets/mcp/toolset_mcp.py +88 -60
  118. holmes/plugins/toolsets/newrelic/new_relic_api.py +41 -1
  119. holmes/plugins/toolsets/newrelic/newrelic.jinja2 +24 -0
  120. holmes/plugins/toolsets/newrelic/newrelic.py +212 -55
  121. holmes/plugins/toolsets/prometheus/prometheus.py +358 -102
  122. holmes/plugins/toolsets/prometheus/prometheus_instructions.jinja2 +11 -3
  123. holmes/plugins/toolsets/rabbitmq/api.py +23 -4
  124. holmes/plugins/toolsets/rabbitmq/toolset_rabbitmq.py +5 -5
  125. holmes/plugins/toolsets/robusta/robusta.py +5 -5
  126. holmes/plugins/toolsets/runbook/runbook_fetcher.py +25 -6
  127. holmes/plugins/toolsets/servicenow_tables/servicenow_tables.py +1 -1
  128. holmes/plugins/toolsets/utils.py +1 -1
  129. holmes/utils/config_utils.py +1 -1
  130. holmes/utils/connection_utils.py +31 -0
  131. holmes/utils/console/result.py +10 -0
  132. holmes/utils/file_utils.py +2 -1
  133. holmes/utils/global_instructions.py +10 -26
  134. holmes/utils/holmes_status.py +4 -3
  135. holmes/utils/log.py +15 -0
  136. holmes/utils/markdown_utils.py +2 -3
  137. holmes/utils/memory_limit.py +58 -0
  138. holmes/utils/sentry_helper.py +23 -0
  139. holmes/utils/stream.py +12 -5
  140. holmes/utils/tags.py +4 -3
  141. holmes/version.py +3 -1
  142. {holmesgpt-0.16.2a0.dist-info → holmesgpt-0.18.4.dist-info}/METADATA +12 -10
  143. holmesgpt-0.18.4.dist-info/RECORD +258 -0
  144. holmes/plugins/toolsets/aws.yaml +0 -80
  145. holmes/plugins/toolsets/coralogix/toolset_coralogix_logs.py +0 -114
  146. holmes/plugins/toolsets/datadog/datadog_traces_formatter.py +0 -310
  147. holmes/plugins/toolsets/datadog/toolset_datadog_rds.py +0 -736
  148. holmes/plugins/toolsets/grafana/grafana_api.py +0 -64
  149. holmes/plugins/toolsets/opensearch/__init__.py +0 -0
  150. holmes/plugins/toolsets/opensearch/opensearch.py +0 -250
  151. holmes/plugins/toolsets/opensearch/opensearch_logs.py +0 -161
  152. holmes/plugins/toolsets/opensearch/opensearch_traces.py +0 -215
  153. holmes/plugins/toolsets/opensearch/opensearch_traces_instructions.jinja2 +0 -12
  154. holmes/plugins/toolsets/opensearch/opensearch_utils.py +0 -166
  155. holmes/utils/keygen_utils.py +0 -6
  156. holmesgpt-0.16.2a0.dist-info/RECORD +0 -258
  157. holmes/plugins/toolsets/{opensearch → elasticsearch}/opensearch_ppl_query_docs.jinja2 +0 -0
  158. holmes/plugins/toolsets/{opensearch → elasticsearch}/opensearch_query_assist.py +2 -2
  159. holmes/plugins/toolsets/{opensearch → elasticsearch}/opensearch_query_assist_instructions.jinja2 +0 -0
  160. {holmesgpt-0.16.2a0.dist-info → holmesgpt-0.18.4.dist-info}/LICENSE +0 -0
  161. {holmesgpt-0.16.2a0.dist-info → holmesgpt-0.18.4.dist-info}/WHEEL +0 -0
  162. {holmesgpt-0.16.2a0.dist-info → holmesgpt-0.18.4.dist-info}/entry_points.txt +0 -0
holmes/plugins/toolsets/datadog/toolset_datadog_traces.py
@@ -1,44 +1,47 @@
 """Datadog Traces toolset for HolmesGPT."""
 
+import copy
 import json
 import logging
 import os
-import time
+import re
 from typing import Any, Dict, Optional, Tuple
 
+from pydantic import AnyUrl
+
 from holmes.core.tools import (
     CallablePrerequisite,
+    StructuredToolResult,
+    StructuredToolResultStatus,
     Tool,
     ToolInvokeContext,
     ToolParameter,
     Toolset,
-    StructuredToolResult,
-    StructuredToolResultStatus,
     ToolsetTag,
 )
+from holmes.plugins.toolsets.consts import STANDARD_END_DATETIME_TOOL_PARAM_DESCRIPTION
 from holmes.plugins.toolsets.datadog.datadog_api import (
+    MAX_RETRY_COUNT_ON_RATE_LIMIT,
     DataDogRequestError,
-    DatadogBaseConfig,
     execute_datadog_http_request,
     get_headers,
-    MAX_RETRY_COUNT_ON_RATE_LIMIT,
 )
-from holmes.plugins.toolsets.utils import (
-    process_timestamps_to_int,
-    toolset_name_for_one_liner,
-)
-from holmes.plugins.toolsets.datadog.datadog_traces_formatter import (
-    format_traces_list,
-    format_trace_hierarchy,
-    format_spans_search,
+from holmes.plugins.toolsets.datadog.datadog_models import DatadogTracesConfig
+from holmes.plugins.toolsets.datadog.datadog_url_utils import (
+    generate_datadog_spans_analytics_url,
+    generate_datadog_spans_url,
 )
 from holmes.plugins.toolsets.logging_utils.logging_api import (
     DEFAULT_TIME_SPAN_SECONDS,
 )
+from holmes.plugins.toolsets.utils import (
+    process_timestamps_to_int,
+    standard_start_datetime_tool_param_description,
+    toolset_name_for_one_liner,
+)
 
-
-class DatadogTracesConfig(DatadogBaseConfig):
-    indexes: list[str] = ["*"]
+# Valid percentile aggregations supported by Datadog
+PERCENTILE_AGGREGATIONS = ["pc75", "pc90", "pc95", "pc98", "pc99"]
 
 
 class DatadogTracesToolset(Toolset):
@@ -54,22 +57,14 @@ class DatadogTracesToolset(Toolset):
             icon_url="https://imgix.datadoghq.com//img/about/presskit/DDlogo.jpg",
             prerequisites=[CallablePrerequisite(callable=self.prerequisites_callable)],
             tools=[
-                FetchDatadogTracesList(toolset=self),
-                FetchDatadogTraceById(toolset=self),
-                FetchDatadogSpansByFilter(toolset=self),
+                GetSpans(toolset=self),
+                AggregateSpans(toolset=self),
             ],
             tags=[ToolsetTag.CORE],
         )
-        self._reload_instructions()
-
-    def _reload_instructions(self):
-        """Load Datadog traces specific troubleshooting instructions."""
-        template_file_path = os.path.abspath(
-            os.path.join(
-                os.path.dirname(__file__), "instructions_datadog_traces.jinja2"
-            )
+        self._load_llm_instructions_from_file(
+            os.path.dirname(__file__), "instructions_datadog_traces.jinja2"
         )
-        self._load_llm_instructions(jinja_template=f"file://{template_file_path}")
 
     def prerequisites_callable(self, config: dict[str, Any]) -> Tuple[bool, str]:
         """Check prerequisites with configuration."""
@@ -136,13 +131,12 @@ class DatadogTracesToolset(Toolset):
             return False, f"Healthcheck failed with exception: {str(e)}"
 
     def get_example_config(self) -> Dict[str, Any]:
-        """Get example configuration for this toolset."""
-        return {
-            "dd_api_key": "<your_datadog_api_key>",
-            "dd_app_key": "<your_datadog_app_key>",
-            "site_api_url": "https://api.datadoghq.com",  # or https://api.datadoghq.eu for EU
-            "request_timeout": 60,
-        }
+        example_config = DatadogTracesConfig(
+            dd_api_key="<your_datadog_api_key>",
+            dd_app_key="<your_datadog_app_key>",
+            site_api_url=AnyUrl("https://api.datadoghq.com"),
+        )
+        return example_config.model_dump(mode="json")
 
 
 class BaseDatadogTracesTool(Tool):
@@ -151,68 +145,88 @@ class BaseDatadogTracesTool(Tool):
     toolset: "DatadogTracesToolset"
 
 
-class FetchDatadogTracesList(BaseDatadogTracesTool):
-    """Tool to fetch a list of traces from Datadog."""
+# Schema defines what fields to keep in compact mode
+COMPACT_SCHEMA = {
+    "custom": {
+        "duration": True,
+        "http": {"status_code": True, "host": True, "method": True, "url": True},
+    },
+    "status": True,
+    "start_timestamp": True,
+    "end_timestamp": True,
+    "error": True,
+    "single_span": True,
+    "span_id": True,
+    "trace_id": True,
+    "parent_id": True,
+    "service": True,
+    "resource_name": True,
+    "tags": {"_filter": "startswith", "_values": ["pod_name:"]},  # Generic array filter
+}
+
+
+class GetSpans(BaseDatadogTracesTool):
+    """Tool to search for spans with specific filters."""
 
     def __init__(self, toolset: "DatadogTracesToolset"):
         super().__init__(
-            name="fetch_datadog_traces",
-            description="[datadog/traces toolset] Fetch a list of traces from Datadog with optional filters",
+            name="fetch_datadog_spans",
+            description="Search for spans in Datadog using span syntax. "
+            "Supports wildcards (*) for pattern matching: @http.route:*payment*, resource_name:*user*, service:*api*. "
+            "Uses the DataDog api endpoint: POST /api/v2/spans/events/search with 'query' parameter.",
             parameters={
-                "service": ToolParameter(
-                    description="Filter by service name",
-                    type="string",
-                    required=False,
-                ),
-                "operation": ToolParameter(
-                    description="Filter by operation name",
+                "query": ToolParameter(
+                    description="The search query following span syntax. Supports wildcards (*) for pattern matching. Examples: @http.route:*payment*, resource_name:*user*, service:*api*. Default: *",
                     type="string",
                     required=False,
                 ),
-                "resource": ToolParameter(
-                    description="Filter by resource name",
+                "start_datetime": ToolParameter(
+                    description=standard_start_datetime_tool_param_description(
+                        DEFAULT_TIME_SPAN_SECONDS
+                    ),
                     type="string",
                     required=False,
                 ),
-                "min_duration": ToolParameter(
-                    description="Minimum duration (e.g., '5s', '500ms', '1m')",
+                "end_datetime": ToolParameter(
+                    description=STANDARD_END_DATETIME_TOOL_PARAM_DESCRIPTION,
                     type="string",
                     required=False,
                 ),
-                "start_datetime": ToolParameter(
-                    description="Start time in RFC3339 format or relative time in seconds (negative for past)",
+                "timezone": ToolParameter(
+                    description="The timezone can be specified as GMT, UTC, an offset from UTC (like UTC+1), or as a Timezone Database identifier (like America/New_York). default: UTC",
                    type="string",
                    required=False,
                ),
-                "end_datetime": ToolParameter(
-                    description="End time in RFC3339 format or relative time in seconds (negative for past)",
+                "cursor": ToolParameter(
+                    description="The returned paging point to use to get the next results. IMPORTANT: Cursors are single-use and stateful - never reuse the same cursor value multiple times or parallelize cursor-based calls. Each response provides a new cursor for the subsequent request.",
                     type="string",
                     required=False,
                 ),
                 "limit": ToolParameter(
-                    description="Maximum number of traces to return",
+                    description="Maximum number of spans to return. Default: 10. Warning: Using values higher than 10 may result in too much data and cause the tool call to fail.",
                     type="integer",
                     required=False,
                 ),
+                "sort_desc": ToolParameter(
+                    description="Get the results in descending order. default: true",
+                    type="boolean",
+                    required=False,
+                ),
+                "compact": ToolParameter(
+                    description="Return only essential fields to reduce output size. Use with higher limits (50-100) for initial exploration, then use compact=false with lower limits (5-10) for detailed investigation. Default: True",
+                    type="boolean",
+                    required=True,
+                ),
             },
             toolset=toolset,
         )
 
     def get_parameterized_one_liner(self, params: dict) -> str:
         """Get a one-liner description of the tool invocation."""
-        filters = []
-        if "service" in params:
-            filters.append(f"service={params['service']}")
-        if "operation" in params:
-            filters.append(f"operation={params['operation']}")
-        if "min_duration" in params:
-            filters.append(f"duration>{params['min_duration']}")
-
-        filter_str = ", ".join(filters) if filters else "all"
-        return f"{toolset_name_for_one_liner(self.toolset.name)}: Fetch Traces ({filter_str})"
+        return f"{toolset_name_for_one_liner(self.toolset.name)}: Search Spans ({params['query'] if 'query' in params else ''})"
 
     def _invoke(self, params: dict, context: ToolInvokeContext) -> StructuredToolResult:
-        """Execute the tool to fetch traces."""
+        """Execute the tool to search spans."""
         if not self.toolset.dd_config:
             return StructuredToolResult(
                 status=StructuredToolResultStatus.ERROR,
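
Note: for orientation, a call to the new fetch_datadog_spans tool might carry parameters like these. This is an illustrative sketch only — the parameter names come from the schema above, while the query and values are invented:

    # Hypothetical fetch_datadog_spans parameters (values invented for illustration)
    params = {
        "query": "service:*checkout* @http.status_code:>=500",
        "limit": 10,          # keep small; larger values risk oversized tool output
        "sort_desc": True,    # newest spans first
        "compact": True,      # required; trims each span to the COMPACT_SCHEMA fields
    }
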
@@ -221,7 +235,7 @@ class FetchDatadogTracesList(BaseDatadogTracesTool):
             )
 
         url = None
-        payload = None
+        payload: Optional[Dict[str, Any]] = None
 
         try:
             # Process timestamps
@@ -235,36 +249,14 @@ class FetchDatadogTracesList(BaseDatadogTracesTool):
             from_time_ms = from_time_int * 1000
             to_time_ms = to_time_int * 1000
 
-            # Build search query
-            query_parts = []
-
-            if params.get("service"):
-                query_parts.append(f"service:{params['service']}")
-
-            if params.get("operation"):
-                query_parts.append(f"operation_name:{params['operation']}")
-
-            if params.get("resource"):
-                query_parts.append(f"resource_name:{params['resource']}")
-
-            if params.get("min_duration"):
-                # Parse duration string (e.g., "5s", "500ms", "1m")
-                duration_str = params["min_duration"].lower()
-                if duration_str.endswith("ms"):
-                    duration_ns = int(float(duration_str[:-2]) * 1_000_000)
-                elif duration_str.endswith("s"):
-                    duration_ns = int(float(duration_str[:-1]) * 1_000_000_000)
-                elif duration_str.endswith("m"):
-                    duration_ns = int(float(duration_str[:-1]) * 60 * 1_000_000_000)
-                else:
-                    # Assume milliseconds if no unit
-                    duration_ns = int(float(duration_str) * 1_000_000)
-
-                query_parts.append(f"@duration:>{duration_ns}")
-
-            query = " ".join(query_parts) if query_parts else "*"
+            query: str = params.get("query") if params.get("query") else "*"  # type: ignore
+            limit = params.get("limit") if params.get("limit") else 10
+            if params.get("sort_desc") is not None:
+                sort = "-timestamp" if params.get("sort_desc") else "timestamp"
+            else:
+                sort = "-timestamp"
 
-            # Prepare API request - use POST search endpoint
+            # Use POST endpoint for more complex searches
             url = f"{self.toolset.dd_config.site_api_url}/api/v2/spans/events/search"
             headers = get_headers(self.toolset.dd_config)
 
@@ -278,12 +270,17 @@ class FetchDatadogTracesList(BaseDatadogTracesTool):
                         "to": str(to_time_ms),
                         "indexes": self.toolset.dd_config.indexes,
                     },
-                    "page": {"limit": params.get("limit", 50)},
-                    "sort": "-timestamp",
+                    "page": {
+                        "limit": limit,
+                    },
+                    "sort": sort,
                 },
             }
         }
 
+            if params.get("cursor"):
+                payload["data"]["attributes"]["page"]["cursor"] = params["cursor"]
+
             response = execute_datadog_http_request(
                 url=url,
                 headers=headers,
@@ -292,32 +289,28 @@ class FetchDatadogTracesList(BaseDatadogTracesTool):
                 method="POST",
             )
 
-            # Handle tuple response from POST requests
-            if isinstance(response, tuple):
-                spans, _ = response
-            elif response:
-                spans = response.get("data", [])
-            else:
-                spans = []
-
-            # Format the traces using the formatter
-            formatted_output = format_traces_list(spans, limit=params.get("limit", 50))
-            if not formatted_output:
-                return StructuredToolResult(
-                    status=StructuredToolResultStatus.NO_DATA,
-                    params=params,
-                    data="No matching traces found.",
-                )
+            # Apply compact filtering if requested
+            if params.get("compact", False) and "data" in response:
+                response["data"] = [
+                    self._filter_span_attributes(span) for span in response["data"]
+                ]
+
+            web_url = generate_datadog_spans_url(
+                self.toolset.dd_config,
+                query,
+                from_time_ms,
+                to_time_ms,
+            )
 
             return StructuredToolResult(
                 status=StructuredToolResultStatus.SUCCESS,
-                data=formatted_output,
+                data=response,
                 params=params,
+                url=web_url,
             )
 
         except DataDogRequestError as e:
             logging.exception(e, exc_info=True)
-
             if e.status_code == 429:
                 error_msg = f"Datadog API rate limit exceeded. Failed after {MAX_RETRY_COUNT_ON_RATE_LIMIT} retry attempts."
             elif e.status_code == 403:
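
Note: the cursor parameter above is meant to be threaded from one response into the next request, one page at a time. A hedged sketch — invoke_tool is a hypothetical stand-in for however the tool is called, and the meta.page.after path follows Datadog's v2 spans search response format:

    # Hypothetical two-page fetch honoring the single-use cursor contract
    first = invoke_tool("fetch_datadog_spans", {"query": "service:payments", "compact": True})
    cursor = first.get("meta", {}).get("page", {}).get("after")
    if cursor:
        # Never reuse a cursor; each response yields a fresh one
        second = invoke_tool(
            "fetch_datadog_spans",
            {"query": "service:payments", "compact": True, "cursor": cursor},
        )
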
@@ -352,212 +345,254 @@ class FetchDatadogTracesList(BaseDatadogTracesTool):
                 ),
             )
 
+    def _apply_compact_schema(self, source: dict, schema: dict) -> dict:
+        """Apply schema to filter fields from source dict."""
+        result: Dict[str, Any] = {}
+
+        for key, value in schema.items():
+            if key not in source:
+                continue
+
+            source_value = source[key]
+
+            if isinstance(value, dict):
+                # Check if it's a filter directive for arrays
+                if "_filter" in value and isinstance(source_value, list):
+                    filter_type = value["_filter"]
+                    filter_values = value.get("_values", [])
+
+                    if filter_type == "startswith":
+                        # Filter array items that start with any of the specified values
+                        filtered = [
+                            item
+                            for item in source_value
+                            if isinstance(item, str)
+                            and any(item.startswith(prefix) for prefix in filter_values)
+                        ]
+                        if filtered:
+                            result[key] = filtered
+
+                elif isinstance(source_value, dict):
+                    # Regular nested object - recurse
+                    nested_result = self._apply_compact_schema(source_value, value)
+                    if nested_result:
+                        result[key] = nested_result
+
+            elif value is True:
+                # Copy the field as-is
+                result[key] = source_value
+
+        return result
+
+    def _filter_span_attributes(self, span: dict) -> dict:
+        """Filter span to include only essential fields."""
+        filtered_span = {
+            "id": span.get("id"),
+            "type": span.get("type"),
+        }
 
-class FetchDatadogTraceById(BaseDatadogTracesTool):
-    """Tool to fetch detailed information about a specific trace."""
-
-    def __init__(self, toolset: "DatadogTracesToolset"):
-        super().__init__(
-            name="fetch_datadog_trace_by_id",
-            description="[datadog/traces toolset] Fetch detailed information about a specific trace by its ID",
-            parameters={
-                "trace_id": ToolParameter(
-                    description="The trace ID to fetch details for",
-                    type="string",
-                    required=True,
-                ),
-            },
-            toolset=toolset,
-        )
-
-    def get_parameterized_one_liner(self, params: dict) -> str:
-        """Get a one-liner description of the tool invocation."""
-        trace_id = params.get("trace_id", "unknown")
-        return f"{toolset_name_for_one_liner(self.toolset.name)}: Fetch Trace Details ({trace_id})"
-
-    def _invoke(self, params: dict, context: ToolInvokeContext) -> StructuredToolResult:
-        """Execute the tool to fetch trace details."""
-        if not self.toolset.dd_config:
-            return StructuredToolResult(
-                status=StructuredToolResultStatus.ERROR,
-                error="Datadog configuration not initialized",
-                params=params,
-            )
-
-        trace_id = params.get("trace_id")
-        if not trace_id:
-            return StructuredToolResult(
-                status=StructuredToolResultStatus.ERROR,
-                error="trace_id parameter is required",
-                params=params,
-            )
-
-        url = None
-        payload = None
-
-        try:
-            # For Datadog, we need to search for all spans with the given trace_id
-            # Using a reasonable time window (last 7 days by default)
-            current_time = int(time.time())
-            from_time_ms = (current_time - 604800) * 1000  # 7 days ago
-            to_time_ms = current_time * 1000
-
-            url = f"{self.toolset.dd_config.site_api_url}/api/v2/spans/events/search"
-            headers = get_headers(self.toolset.dd_config)
-
-            payload = {
-                "data": {
-                    "type": "search_request",
-                    "attributes": {
-                        "filter": {
-                            "query": f"trace_id:{trace_id}",
-                            "from": str(from_time_ms),
-                            "to": str(to_time_ms),
-                            "indexes": self.toolset.dd_config.indexes,
-                        },
-                        "page": {"limit": 1000},  # Get all spans for the trace
-                        "sort": "timestamp",
-                    },
-                }
-            }
-
-            response = execute_datadog_http_request(
-                url=url,
-                headers=headers,
-                payload_or_params=payload,
-                timeout=self.toolset.dd_config.request_timeout,
-                method="POST",
-            )
-
-            # Handle tuple response from POST requests
-            if isinstance(response, tuple):
-                spans, _ = response
-            elif response:
-                spans = response.get("data", [])
-            else:
-                spans = []
-
-            # Format the trace hierarchy using the formatter
-            formatted_output = format_trace_hierarchy(trace_id, spans)
-            if not formatted_output:
-                return StructuredToolResult(
-                    status=StructuredToolResultStatus.NO_DATA,
-                    params=params,
-                    data=f"No trace found for trace_id: {trace_id}",
-                )
-
-            return StructuredToolResult(
-                status=StructuredToolResultStatus.SUCCESS,
-                data=formatted_output,
-                params=params,
-            )
-
-        except DataDogRequestError as e:
-            logging.exception(e, exc_info=True)
-
-            if e.status_code == 429:
-                error_msg = f"Datadog API rate limit exceeded. Failed after {MAX_RETRY_COUNT_ON_RATE_LIMIT} retry attempts."
-            elif e.status_code == 403:
-                error_msg = (
-                    f"Permission denied. Ensure your Datadog Application Key has the 'apm_read' "
-                    f"permission. Error: {str(e)}"
-                )
-            else:
-                error_msg = f"Exception while querying Datadog: {str(e)}"
-
-            return StructuredToolResult(
-                status=StructuredToolResultStatus.ERROR,
-                error=error_msg,
-                params=params,
-                invocation=(
-                    json.dumps({"url": url, "payload": payload})
-                    if url and payload
-                    else None
-                ),
+        if "attributes" in span:
+            filtered_span["attributes"] = self._apply_compact_schema(
+                span["attributes"], COMPACT_SCHEMA
             )
 
-        except Exception as e:
-            logging.exception(e, exc_info=True)
-            return StructuredToolResult(
-                status=StructuredToolResultStatus.ERROR,
-                error=f"Unexpected error: {str(e)}",
-                params=params,
-                invocation=(
-                    json.dumps({"url": url, "payload": payload})
-                    if url and payload
-                    else None
-                ),
-            )
+        return filtered_span
 
 
-class FetchDatadogSpansByFilter(BaseDatadogTracesTool):
-    """Tool to search for spans with specific filters."""
+class AggregateSpans(BaseDatadogTracesTool):
+    """Tool to aggregate span data into buckets and compute metrics and timeseries."""
 
     def __init__(self, toolset: "DatadogTracesToolset"):
         super().__init__(
-            name="fetch_datadog_spans",
-            description="[datadog/traces toolset] Search for spans in Datadog with detailed filters",
+            name="aggregate_datadog_spans",
+            description="Aggregate spans into buckets and compute metrics and timeseries. "
+            "Uses the DataDog api endpoint: POST /api/v2/spans/analytics/aggregate",
             parameters={
                 "query": ToolParameter(
-                    description="Datadog search query (e.g., 'service:web-app @http.status_code:500')",
-                    type="string",
-                    required=False,
-                ),
-                "service": ToolParameter(
-                    description="Filter by service name",
+                    description="Search query following span syntax. Default: '*'",
                     type="string",
                     required=False,
                 ),
-                "operation": ToolParameter(
-                    description="Filter by operation name",
+                "start_datetime": ToolParameter(
+                    description=standard_start_datetime_tool_param_description(
+                        DEFAULT_TIME_SPAN_SECONDS
+                    ),
                     type="string",
                     required=False,
                 ),
-                "resource": ToolParameter(
-                    description="Filter by resource name",
+                "end_datetime": ToolParameter(
+                    description=STANDARD_END_DATETIME_TOOL_PARAM_DESCRIPTION,
                     type="string",
                     required=False,
                 ),
-                "tags": ToolParameter(
-                    description="Filter by tags (e.g., {'env': 'production', 'version': '1.2.3'})",
-                    type="object",
-                    required=False,
+                "compute": ToolParameter(
+                    description="List of metrics to compute from the matching spans. Supports up to 10 computes at the same time.",
+                    type="array",
+                    required=True,
+                    items=ToolParameter(
+                        type="object",
+                        properties={
+                            "aggregation": ToolParameter(
+                                type="string",
+                                required=True,
+                                enum=[
+                                    "count",
+                                    "cardinality",
+                                    "sum",
+                                    "min",
+                                    "max",
+                                    "avg",
+                                    "median",
+                                ]
+                                + PERCENTILE_AGGREGATIONS,
+                                description="The aggregation method.",
+                            ),
+                            "metric": ToolParameter(
+                                type="string",
+                                required=False,
+                                description="The span attribute to aggregate. Required for all non-count aggregations",
+                            ),
+                            "type": ToolParameter(
+                                type="string",
+                                required=False,
+                                enum=["total", "timeseries"],
+                                description="Compute type for the aggregation. Default: 'total'",
+                            ),
+                            "interval": ToolParameter(
+                                type="string",
+                                required=False,
+                                description="The time buckets' size for timeseries results (e.g., '5m', '1h'; only used for type=timeseries). Defaults to a resolution of 150 points.",
+                            ),
+                        },
+                    ),
                 ),
-                "start_datetime": ToolParameter(
-                    description="Start time in RFC3339 format or relative time in seconds (negative for past)",
-                    type="string",
+                "group_by": ToolParameter(
+                    description="List of facets to split the aggregate data by",
+                    type="array",
                     required=False,
+                    items=ToolParameter(
+                        type="object",
+                        properties={
+                            "facet": ToolParameter(
+                                type="string",
+                                required=True,
+                                description="The span attribute to split by",
+                            ),
+                            "limit": ToolParameter(
+                                type="integer",
+                                required=False,
+                                description="Maximum number of facet groups to return. Default: 10",
+                            ),
+                            "missing": ToolParameter(
+                                type="string",
+                                required=False,
+                                description="The value to use for spans that don't have the facet",
+                            ),
+                            "sort": ToolParameter(
+                                type="object",
+                                required=False,
+                                description="Sort configuration for the groups",
+                                properties={
+                                    # Not working correctly
+                                    # "aggregation": ToolParameter(
+                                    #     type="string",
+                                    #     required=True,
+                                    #     description="The aggregation method to sort by",
+                                    # ),
+                                    "metric": ToolParameter(
+                                        type="string",
+                                        required=False,
+                                        description="The metric to sort by when using a metric aggregation. (only used for type=measure).",
+                                    ),
+                                    "type": ToolParameter(
+                                        type="string",
+                                        required=False,
+                                        enum=["alphabetical", "measure"],
+                                        description="The type of sorting to use",
+                                    ),
+                                    "order": ToolParameter(
+                                        type="string",
+                                        required=False,
+                                        enum=["asc", "desc"],
+                                        description="The sort order. Default: 'desc'",
+                                    ),
+                                },
+                            ),
+                            "total": ToolParameter(
+                                type="boolean",
+                                required=False,
+                                description="Whether to include a 'total' group with all non-faceted results",
+                            ),
+                            "histogram": ToolParameter(
+                                type="object",
+                                required=False,
+                                description="Histogram configuration for numeric facets",
+                                properties={
+                                    "interval": ToolParameter(
+                                        type="number",
+                                        required=True,
+                                        description="The bin size for the histogram",
+                                    ),
+                                    "min": ToolParameter(
+                                        type="number",
+                                        required=False,
+                                        description="The minimum value for the histogram",
+                                    ),
+                                    "max": ToolParameter(
+                                        type="number",
+                                        required=False,
+                                        description="The maximum value for the histogram",
+                                    ),
+                                },
+                            ),
+                        },
+                    ),
                 ),
-                "end_datetime": ToolParameter(
-                    description="End time in RFC3339 format or relative time in seconds (negative for past)",
+                "timezone": ToolParameter(
+                    description="The timezone for time-based results (e.g., 'GMT', 'UTC', 'America/New_York'). Default: 'UTC'",
                     type="string",
                     required=False,
                 ),
-                "limit": ToolParameter(
-                    description="Maximum number of spans to return",
-                    type="integer",
-                    required=False,
-                ),
             },
             toolset=toolset,
         )
 
     def get_parameterized_one_liner(self, params: dict) -> str:
         """Get a one-liner description of the tool invocation."""
-        if "query" in params:
-            return f"{toolset_name_for_one_liner(self.toolset.name)}: Search Spans ({params['query']})"
-
-        filters = []
-        if "service" in params:
-            filters.append(f"service={params['service']}")
-        if "operation" in params:
-            filters.append(f"operation={params['operation']}")
-
-        filter_str = ", ".join(filters) if filters else "all"
-        return f"{toolset_name_for_one_liner(self.toolset.name)}: Search Spans ({filter_str})"
+        query = params.get("query", "*")
+        compute_info = ""
+        if params.get("compute"):
+            aggregations = [c.get("aggregation", "") for c in params["compute"]]
+            compute_info = f" (computing: {', '.join(aggregations)})"
+        return f"{toolset_name_for_one_liner(self.toolset.name)}: Aggregate Spans ({query}){compute_info}"
+
+    def _fix_percentile_aggregations(self, compute_params: list) -> list:
+        """Fix common percentile format mistakes that the LLM makes when choosing from the enum (e.g., p95 -> pc95).
+
+        Args:
+            compute_params: List of compute parameter dictionaries
+
+        Returns:
+            List of compute parameters with corrected aggregation values
+        """
+        # Deep copy the entire compute params to avoid modifying the original
+        processed_compute = copy.deepcopy(compute_params)
+
+        # Simple replacement for each known percentile
+        for compute_item in processed_compute:
+            if isinstance(compute_item, dict) and "aggregation" in compute_item:
+                agg_value = compute_item["aggregation"]
+                # Check if it matches p\d\d pattern (e.g., p95)
+                if re.match(r"^p\d{2}$", agg_value):
+                    # Convert to pc format and check if it's valid
+                    pc_version = "pc" + agg_value[1:]
+                    if pc_version in PERCENTILE_AGGREGATIONS:
+                        compute_item["aggregation"] = pc_version
+
+        return processed_compute
 
     def _invoke(self, params: dict, context: ToolInvokeContext) -> StructuredToolResult:
-        """Execute the tool to search spans."""
+        """Execute the tool to aggregate spans."""
         if not self.toolset.dd_config:
             return StructuredToolResult(
                 status=StructuredToolResultStatus.ERROR,
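
Note: the percentile fix-up above is mechanical string normalization. A minimal standalone sketch of the same logic (names copied from the diff, runnable outside the class):

    import copy
    import re

    PERCENTILE_AGGREGATIONS = ["pc75", "pc90", "pc95", "pc98", "pc99"]

    def fix_percentile_aggregations(compute_params: list) -> list:
        # Map LLM-style "p95" to Datadog's "pc95"; leave other values untouched.
        processed = copy.deepcopy(compute_params)
        for item in processed:
            if isinstance(item, dict) and "aggregation" in item:
                agg = item["aggregation"]
                if re.match(r"^p\d{2}$", agg) and "pc" + agg[1:] in PERCENTILE_AGGREGATIONS:
                    item["aggregation"] = "pc" + agg[1:]
        return processed

    # "p95" is corrected; "count" passes through untouched.
    fixed = fix_percentile_aggregations([{"aggregation": "p95"}, {"aggregation": "count"}])
    assert fixed[0]["aggregation"] == "pc95" and fixed[1]["aggregation"] == "count"
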
@@ -580,51 +615,42 @@ class FetchDatadogSpansByFilter(BaseDatadogTracesTool):
             from_time_ms = from_time_int * 1000
             to_time_ms = to_time_int * 1000
 
-            # Build search query
-            query_parts = []
+            query = params.get("query", "*")
 
-            # If a custom query is provided, use it as the base
-            if params.get("query"):
-                query_parts.append(params["query"])
-
-            # Add additional filters
-            if params.get("service"):
-                query_parts.append(f"service:{params['service']}")
-
-            if params.get("operation"):
-                query_parts.append(f"operation_name:{params['operation']}")
+            # Build the request payload
+            url = f"{self.toolset.dd_config.site_api_url}/api/v2/spans/analytics/aggregate"
+            headers = get_headers(self.toolset.dd_config)
 
-            if params.get("resource"):
-                query_parts.append(f"resource_name:{params['resource']}")
+            # Build payload attributes first
+            # Process compute parameter to fix common p95->pc95 style mistakes
+            compute_params = params.get("compute", [])
+            processed_compute = self._fix_percentile_aggregations(compute_params)
+
+            attributes: Dict[str, Any] = {
+                "filter": {
+                    "query": query,
+                    "from": str(from_time_ms),
+                    "to": str(to_time_ms),
+                },
+                "compute": processed_compute,
+            }
 
-            # Add tag filters
-            if params.get("tags"):
-                tags = params["tags"]
-                if isinstance(tags, dict):
-                    for key, value in tags.items():
-                        query_parts.append(f"@{key}:{value}")
+            # Add optional fields
+            if params.get("group_by"):
+                attributes["group_by"] = params["group_by"]
 
-            query = " ".join(query_parts) if query_parts else "*"
+            # Add options if timezone is specified
+            options: Dict[str, Any] = {}
+            if params.get("timezone"):
+                options["timezone"] = params["timezone"]
 
-            # Use POST endpoint for more complex searches
-            url = f"{self.toolset.dd_config.site_api_url}/api/v2/spans/events/search"
-            headers = get_headers(self.toolset.dd_config)
+            if options:
+                attributes["options"] = options
 
             payload = {
                 "data": {
-                    "type": "search_request",
-                    "attributes": {
-                        "filter": {
-                            "query": query,
-                            "from": str(from_time_ms),
-                            "to": str(to_time_ms),
-                            "indexes": self.toolset.dd_config.indexes,
-                        },
-                        "page": {
-                            "limit": params.get("limit", 100),
-                        },
-                        "sort": "-timestamp",
-                    },
+                    "type": "aggregate_request",
+                    "attributes": attributes,
                 }
             }
 
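
Note: assembled for a p95-latency-by-service aggregation, the payload built above would look roughly like this (values invented; structure mirrors the code in this hunk):

    # Illustrative aggregate_datadog_spans request body
    payload = {
        "data": {
            "type": "aggregate_request",
            "attributes": {
                "filter": {
                    "query": "service:checkout",
                    "from": "1700000000000",  # epoch milliseconds, sent as strings
                    "to": "1700003600000",
                },
                "compute": [{"aggregation": "pc95", "metric": "@duration"}],
                "group_by": [{"facet": "service", "limit": 10}],
                "options": {"timezone": "UTC"},
            },
        }
    }
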
@@ -636,27 +662,18 @@ class FetchDatadogSpansByFilter(BaseDatadogTracesTool):
                 method="POST",
             )
 
-            # Handle tuple response from POST requests
-            if isinstance(response, tuple):
-                spans, _ = response
-            elif response:
-                spans = response.get("data", [])
-            else:
-                spans = []
-
-            # Format the spans search results using the formatter
-            formatted_output = format_spans_search(spans)
-            if not formatted_output:
-                return StructuredToolResult(
-                    status=StructuredToolResultStatus.NO_DATA,
-                    params=params,
-                    data="No matching spans found.",
-                )
+            web_url = generate_datadog_spans_analytics_url(
+                self.toolset.dd_config,
+                query,
+                from_time_ms,
+                to_time_ms,
+            )
 
             return StructuredToolResult(
                 status=StructuredToolResultStatus.SUCCESS,
-                data=formatted_output,
+                data=response,
                 params=params,
+                url=web_url,
             )
 
         except DataDogRequestError as e: