holmesgpt 0.13.2__py3-none-any.whl → 0.16.2a0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- holmes/__init__.py +1 -1
- holmes/clients/robusta_client.py +17 -4
- holmes/common/env_vars.py +40 -1
- holmes/config.py +114 -144
- holmes/core/conversations.py +53 -14
- holmes/core/feedback.py +191 -0
- holmes/core/investigation.py +18 -22
- holmes/core/llm.py +489 -88
- holmes/core/models.py +103 -1
- holmes/core/openai_formatting.py +13 -0
- holmes/core/prompt.py +1 -1
- holmes/core/safeguards.py +4 -4
- holmes/core/supabase_dal.py +293 -100
- holmes/core/tool_calling_llm.py +423 -323
- holmes/core/tools.py +311 -33
- holmes/core/tools_utils/token_counting.py +14 -0
- holmes/core/tools_utils/tool_context_window_limiter.py +57 -0
- holmes/core/tools_utils/tool_executor.py +13 -8
- holmes/core/toolset_manager.py +155 -4
- holmes/core/tracing.py +6 -1
- holmes/core/transformers/__init__.py +23 -0
- holmes/core/transformers/base.py +62 -0
- holmes/core/transformers/llm_summarize.py +174 -0
- holmes/core/transformers/registry.py +122 -0
- holmes/core/transformers/transformer.py +31 -0
- holmes/core/truncation/compaction.py +59 -0
- holmes/core/truncation/dal_truncation_utils.py +23 -0
- holmes/core/truncation/input_context_window_limiter.py +218 -0
- holmes/interactive.py +177 -24
- holmes/main.py +7 -4
- holmes/plugins/prompts/_fetch_logs.jinja2 +26 -1
- holmes/plugins/prompts/_general_instructions.jinja2 +1 -2
- holmes/plugins/prompts/_runbook_instructions.jinja2 +23 -12
- holmes/plugins/prompts/conversation_history_compaction.jinja2 +88 -0
- holmes/plugins/prompts/generic_ask.jinja2 +2 -4
- holmes/plugins/prompts/generic_ask_conversation.jinja2 +2 -1
- holmes/plugins/prompts/generic_ask_for_issue_conversation.jinja2 +2 -1
- holmes/plugins/prompts/generic_investigation.jinja2 +2 -1
- holmes/plugins/prompts/investigation_procedure.jinja2 +48 -0
- holmes/plugins/prompts/kubernetes_workload_ask.jinja2 +2 -1
- holmes/plugins/prompts/kubernetes_workload_chat.jinja2 +2 -1
- holmes/plugins/runbooks/__init__.py +117 -18
- holmes/plugins/runbooks/catalog.json +2 -0
- holmes/plugins/toolsets/__init__.py +21 -8
- holmes/plugins/toolsets/aks-node-health.yaml +46 -0
- holmes/plugins/toolsets/aks.yaml +64 -0
- holmes/plugins/toolsets/atlas_mongodb/mongodb_atlas.py +26 -36
- holmes/plugins/toolsets/azure_sql/azure_sql_toolset.py +0 -1
- holmes/plugins/toolsets/azure_sql/tools/analyze_connection_failures.py +10 -7
- holmes/plugins/toolsets/azure_sql/tools/analyze_database_connections.py +9 -6
- holmes/plugins/toolsets/azure_sql/tools/analyze_database_health_status.py +8 -6
- holmes/plugins/toolsets/azure_sql/tools/analyze_database_performance.py +8 -6
- holmes/plugins/toolsets/azure_sql/tools/analyze_database_storage.py +9 -6
- holmes/plugins/toolsets/azure_sql/tools/get_active_alerts.py +9 -7
- holmes/plugins/toolsets/azure_sql/tools/get_slow_queries.py +9 -6
- holmes/plugins/toolsets/azure_sql/tools/get_top_cpu_queries.py +9 -6
- holmes/plugins/toolsets/azure_sql/tools/get_top_data_io_queries.py +9 -6
- holmes/plugins/toolsets/azure_sql/tools/get_top_log_io_queries.py +9 -6
- holmes/plugins/toolsets/bash/bash_toolset.py +10 -13
- holmes/plugins/toolsets/bash/common/bash.py +7 -7
- holmes/plugins/toolsets/cilium.yaml +284 -0
- holmes/plugins/toolsets/coralogix/toolset_coralogix_logs.py +5 -3
- holmes/plugins/toolsets/datadog/datadog_api.py +490 -24
- holmes/plugins/toolsets/datadog/datadog_logs_instructions.jinja2 +21 -10
- holmes/plugins/toolsets/datadog/toolset_datadog_general.py +349 -216
- holmes/plugins/toolsets/datadog/toolset_datadog_logs.py +190 -19
- holmes/plugins/toolsets/datadog/toolset_datadog_metrics.py +101 -44
- holmes/plugins/toolsets/datadog/toolset_datadog_rds.py +13 -16
- holmes/plugins/toolsets/datadog/toolset_datadog_traces.py +25 -31
- holmes/plugins/toolsets/git.py +51 -46
- holmes/plugins/toolsets/grafana/common.py +15 -3
- holmes/plugins/toolsets/grafana/grafana_api.py +46 -24
- holmes/plugins/toolsets/grafana/grafana_tempo_api.py +454 -0
- holmes/plugins/toolsets/grafana/loki/instructions.jinja2 +9 -0
- holmes/plugins/toolsets/grafana/loki/toolset_grafana_loki.py +117 -0
- holmes/plugins/toolsets/grafana/toolset_grafana.py +211 -91
- holmes/plugins/toolsets/grafana/toolset_grafana_dashboard.jinja2 +27 -0
- holmes/plugins/toolsets/grafana/toolset_grafana_tempo.jinja2 +246 -11
- holmes/plugins/toolsets/grafana/toolset_grafana_tempo.py +653 -293
- holmes/plugins/toolsets/grafana/trace_parser.py +1 -1
- holmes/plugins/toolsets/internet/internet.py +6 -7
- holmes/plugins/toolsets/internet/notion.py +5 -6
- holmes/plugins/toolsets/investigator/core_investigation.py +42 -34
- holmes/plugins/toolsets/kafka.py +25 -36
- holmes/plugins/toolsets/kubernetes.yaml +58 -84
- holmes/plugins/toolsets/kubernetes_logs.py +6 -6
- holmes/plugins/toolsets/kubernetes_logs.yaml +32 -0
- holmes/plugins/toolsets/logging_utils/logging_api.py +80 -4
- holmes/plugins/toolsets/mcp/toolset_mcp.py +181 -55
- holmes/plugins/toolsets/newrelic/__init__.py +0 -0
- holmes/plugins/toolsets/newrelic/new_relic_api.py +125 -0
- holmes/plugins/toolsets/newrelic/newrelic.jinja2 +41 -0
- holmes/plugins/toolsets/newrelic/newrelic.py +163 -0
- holmes/plugins/toolsets/opensearch/opensearch.py +10 -17
- holmes/plugins/toolsets/opensearch/opensearch_logs.py +7 -7
- holmes/plugins/toolsets/opensearch/opensearch_ppl_query_docs.jinja2 +1616 -0
- holmes/plugins/toolsets/opensearch/opensearch_query_assist.py +78 -0
- holmes/plugins/toolsets/opensearch/opensearch_query_assist_instructions.jinja2 +223 -0
- holmes/plugins/toolsets/opensearch/opensearch_traces.py +13 -16
- holmes/plugins/toolsets/openshift.yaml +283 -0
- holmes/plugins/toolsets/prometheus/prometheus.py +915 -390
- holmes/plugins/toolsets/prometheus/prometheus_instructions.jinja2 +43 -2
- holmes/plugins/toolsets/prometheus/utils.py +28 -0
- holmes/plugins/toolsets/rabbitmq/toolset_rabbitmq.py +9 -10
- holmes/plugins/toolsets/robusta/robusta.py +236 -65
- holmes/plugins/toolsets/robusta/robusta_instructions.jinja2 +26 -9
- holmes/plugins/toolsets/runbook/runbook_fetcher.py +137 -26
- holmes/plugins/toolsets/service_discovery.py +1 -1
- holmes/plugins/toolsets/servicenow_tables/instructions.jinja2 +83 -0
- holmes/plugins/toolsets/servicenow_tables/servicenow_tables.py +426 -0
- holmes/plugins/toolsets/utils.py +88 -0
- holmes/utils/config_utils.py +91 -0
- holmes/utils/default_toolset_installation_guide.jinja2 +1 -22
- holmes/utils/env.py +7 -0
- holmes/utils/global_instructions.py +75 -10
- holmes/utils/holmes_status.py +2 -1
- holmes/utils/holmes_sync_toolsets.py +0 -2
- holmes/utils/krr_utils.py +188 -0
- holmes/utils/sentry_helper.py +41 -0
- holmes/utils/stream.py +61 -7
- holmes/version.py +34 -14
- holmesgpt-0.16.2a0.dist-info/LICENSE +178 -0
- {holmesgpt-0.13.2.dist-info → holmesgpt-0.16.2a0.dist-info}/METADATA +29 -27
- {holmesgpt-0.13.2.dist-info → holmesgpt-0.16.2a0.dist-info}/RECORD +126 -102
- holmes/core/performance_timing.py +0 -72
- holmes/plugins/toolsets/grafana/tempo_api.py +0 -124
- holmes/plugins/toolsets/grafana/toolset_grafana_loki.py +0 -110
- holmes/plugins/toolsets/newrelic.py +0 -231
- holmes/plugins/toolsets/servicenow/install.md +0 -37
- holmes/plugins/toolsets/servicenow/instructions.jinja2 +0 -3
- holmes/plugins/toolsets/servicenow/servicenow.py +0 -219
- holmesgpt-0.13.2.dist-info/LICENSE.txt +0 -21
- {holmesgpt-0.13.2.dist-info → holmesgpt-0.16.2a0.dist-info}/WHEEL +0 -0
- {holmesgpt-0.13.2.dist-info → holmesgpt-0.16.2a0.dist-info}/entry_points.txt +0 -0

holmes/plugins/toolsets/kubernetes_logs.py:

```diff
@@ -10,7 +10,7 @@ from holmes.common.env_vars import KUBERNETES_LOGS_TIMEOUT_SECONDS
 from holmes.core.tools import (
     StaticPrerequisite,
     StructuredToolResult,
-
+    StructuredToolResultStatus,
     ToolsetTag,
 )
 from holmes.plugins.toolsets.logging_utils.logging_api import (
@@ -140,7 +140,7 @@ class KubernetesLogsToolset(BasePodLoggingToolset):
         # Ensure both results are not None (they should always be set by the loop)
         if current_logs_result is None or previous_logs_result is None:
             return StructuredToolResult(
-                status=
+                status=StructuredToolResultStatus.ERROR,
                 error="Internal error: Failed to fetch logs",
                 params=params.model_dump(),
             )
@@ -162,7 +162,7 @@ class KubernetesLogsToolset(BasePodLoggingToolset):
         ):
             # Both commands failed - return error from current logs
             return StructuredToolResult(
-                status=
+                status=StructuredToolResultStatus.ERROR,
                 error=current_logs_result.error,
                 params=params.model_dump(),
                 return_code=return_code,
@@ -206,7 +206,7 @@ class KubernetesLogsToolset(BasePodLoggingToolset):
         if len(filtered_logs) == 0:
             # Return NO_DATA status when there are no logs
             return StructuredToolResult(
-                status=
+                status=StructuredToolResultStatus.NO_DATA,
                 data="\n".join(
                     metadata_lines
                 ),  # Still include metadata for context
@@ -218,7 +218,7 @@ class KubernetesLogsToolset(BasePodLoggingToolset):
         response_data = formatted_logs + "\n" + "\n".join(metadata_lines)
 
         return StructuredToolResult(
-            status=
+            status=StructuredToolResultStatus.SUCCESS,
            data=response_data,
             params=params.model_dump(),
             return_code=return_code,
@@ -226,7 +226,7 @@ class KubernetesLogsToolset(BasePodLoggingToolset):
         except Exception as e:
             logging.exception(f"Error fetching logs for pod {params.pod_name}")
             return StructuredToolResult(
-                status=
+                status=StructuredToolResultStatus.ERROR,
                 error=f"Error fetching logs: {str(e)}",
                 params=params.model_dump(),
             )
```
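Each hunk above makes the same mechanical change: every return path now names an explicit `StructuredToolResultStatus` member. A minimal sketch of the result shape these tools build (field names come from the hunks above; the values are purely illustrative):

```python
# Illustrative only: field names are taken from the hunks above, values are made up.
from holmes.core.tools import StructuredToolResult, StructuredToolResultStatus

result = StructuredToolResult(
    status=StructuredToolResultStatus.NO_DATA,  # ERROR / NO_DATA / SUCCESS as above
    data="pod=my-pod namespace=default: no log lines matched",  # metadata kept for context
    params={"pod_name": "my-pod", "namespace": "default"},
)
```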
holmes/plugins/toolsets/kubernetes_logs.yaml:

```diff
@@ -8,6 +8,10 @@ toolsets:
     prerequisites:
       - command: "kubectl version --client"
 
+    # Note: Log tools use transformers with llm_summarize to automatically
+    # summarize large log outputs when a fast model is configured. This helps
+    # focus on errors, patterns, and key information while reducing context usage.
+
     tools:
       - name: "kubectl_previous_logs"
         description: "Run `kubectl logs --previous` on a single Kubernetes pod. Used to fetch logs for a pod that crashed and see logs from before the crash. Never give a deployment name or a resource that is not a pod."
@@ -24,10 +28,38 @@ toolsets:
       - name: "kubectl_logs"
         description: "Run `kubectl logs` on a single Kubernetes pod. Never give a deployment name or a resource that is not a pod."
         command: "kubectl logs {{pod_name}} -n {{ namespace }}"
+        transformers:
+          - name: llm_summarize
+            config:
+              input_threshold: 1000
+              prompt: |
+                Summarize these pod logs focusing on:
+                - Errors, exceptions, and warning messages
+                - Recent activity patterns and trends
+                - Any authentication, connection, or startup issues
+                - Performance indicators (response times, throughput)
+                - Group similar log entries together
+                - When possible, mention exact error codes or keywords for easier searching
+                - Be concise: aim for ≤ 50% of the original text; prioritize aggregates and actionable outliers
+                - Include grep-ready keys/values; avoid repeating entire logs or unchanged defaults
 
       - name: "kubectl_logs_all_containers"
         description: "Run `kubectl logs` on all containers within a single Kubernetes pod."
         command: "kubectl logs {{pod_name}} -n {{ namespace }} --all-containers"
+        transformers:
+          - name: llm_summarize
+            config:
+              input_threshold: 1000
+              prompt: |
+                Summarize these multi-container pod logs focusing on:
+                - Errors, exceptions, and warning messages by container
+                - Inter-container communication patterns
+                - Any authentication, connection, or startup issues
+                - Performance indicators and resource usage patterns
+                - Group similar log entries together by container
+                - When possible, mention exact error codes or keywords for easier searching
+                - Strive for ≤ 50% of the original size; keep results compact and grep-friendly (one line per aggregate)
+                - Prioritize aggregates and actionable outliers over comprehensive details
 
       - name: "kubectl_container_logs"
         description: "Run `kubectl logs` on a single container within a Kubernetes pod. This is to get the logs of a specific container in a multi-container pod."
```
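The `transformers` blocks attach an `llm_summarize` step to each log tool. The diff shown here doesn't include the transformer implementation (it lands in `holmes/core/transformers/llm_summarize.py`, per the file list), but the config implies a simple gate: below `input_threshold` the output passes through, above it the configured prompt is sent to the summarizing model. A rough sketch of that behavior, assuming the threshold applies to the raw output length; `summarize` here is a stand-in callable, not the package's actual API:

```python
# Rough sketch, not the package's actual transformer API.
# Assumes input_threshold is compared against the raw tool output length,
# and that `summarize` wraps the configured fast model.
from typing import Callable

def apply_llm_summarize(
    tool_output: str,
    input_threshold: int,
    prompt: str,
    summarize: Callable[[str], str],
) -> str:
    if len(tool_output) < input_threshold:
        return tool_output  # small outputs pass through untouched
    return summarize(f"{prompt}\n\n{tool_output}")
```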
holmes/plugins/toolsets/logging_utils/logging_api.py:

```diff
@@ -1,27 +1,36 @@
 from abc import ABC, abstractmethod
 from datetime import datetime, timedelta
 import logging
+from math import ceil
 from typing import Optional, Set
 from enum import Enum
 
 from pydantic import BaseModel, field_validator
 from datetime import timezone
+from holmes.core.llm import LLM
 from holmes.core.tools import (
     StructuredToolResult,
     Tool,
+    ToolInvokeContext,
     ToolParameter,
     Toolset,
 )
+from holmes.core.tools_utils.token_counting import count_tool_response_tokens
 from holmes.plugins.toolsets.utils import get_param_or_raise
 
 # Default values for log fetching
 DEFAULT_LOG_LIMIT = 100
 SECONDS_PER_DAY = 24 * 60 * 60
 DEFAULT_TIME_SPAN_SECONDS = 7 * SECONDS_PER_DAY  # 1 week in seconds
-DEFAULT_GRAPH_TIME_SPAN_SECONDS = 1 *
+DEFAULT_GRAPH_TIME_SPAN_SECONDS = 1 * 60 * 60  # 1 hour in seconds
 
 POD_LOGGING_TOOL_NAME = "fetch_pod_logs"
 
+TRUNCATION_PROMPT_PREFIX = "[... PREVIOUS LOGS ABOVE THIS LINE HAVE BEEN TRUNCATED]"
+MIN_NUMBER_OF_CHARACTERS_TO_TRUNCATE: int = (
+    50 + len(TRUNCATION_PROMPT_PREFIX)
+)  # prevents the truncation algorithm from going too slow once the actual token count gets close to the expected limit
+
 
 class LoggingCapability(str, Enum):
     """Optional advanced logging capabilities"""
```
```diff
@@ -74,6 +83,68 @@ class BasePodLoggingToolset(Toolset, ABC):
         return ""
 
 
+def truncate_logs(
+    logging_structured_tool_result: StructuredToolResult,
+    llm: LLM,
+    token_limit: int,
+    structured_params: FetchPodLogsParams,
+):
+    original_token_count = count_tool_response_tokens(
+        llm=llm, structured_tool_result=logging_structured_tool_result
+    )
+    token_count = original_token_count
+    text = None
+    while token_count > token_limit:
+        # Loop because we are counting tokens but trimming characters. This means we try to trim a number of
+        # characters proportional to the number of tokens but we may still have too many tokens
+        if not text:
+            text = logging_structured_tool_result.get_stringified_data()
+        if not text:
+            # Weird scenario where the result exceeds the token allowance but there is not data.
+            # Exit and do nothing because I don't know how to handle such scenario.
+            logging.warning(
+                f"The calculated token count for logs is {token_count} but the limit is {token_limit}. However the data field is empty so there are no logs to truncate."
+            )
+            return
+        ratio = token_count / token_limit
+        character_count = len(text)
+        number_of_characters_to_truncate = character_count - ceil(
+            character_count / ratio
+        )
+        number_of_characters_to_truncate = max(
+            MIN_NUMBER_OF_CHARACTERS_TO_TRUNCATE, number_of_characters_to_truncate
+        )
+
+        if len(text) <= number_of_characters_to_truncate:
+            logging.warning(
+                f"The calculated token count for logs is {token_count} (max allowed tokens={token_limit}) but the logs are only {len(text)} characters which is below the intended truncation of {number_of_characters_to_truncate} characters. Logs will no longer be truncated"
+            )
+            return
+        else:
+            linefeed_truncation_offset = max(
+                text[number_of_characters_to_truncate:].find("\n"), 0
+            )  # keep log lines atomic
+
+            # Tentatively add the truncation prefix.
+            # When counting tokens, we want to include the TRUNCATION_PROMPT_PREFIX because it will be part of the tool response.
+            # Because we're truncating based on character counts but ultimately checking tokens count,
+            # it is possible that the character truncation is incorrect and more need to be truncated.
+            # This will be caught in the next iteration and the truncation prefix will be truncated
+            # because MIN_NUMBER_OF_CHARACTERS_TO_TRUNCATE cannot be smaller than TRUNCATION_PROMPT_PREFIX
+            text = (
+                TRUNCATION_PROMPT_PREFIX
+                + text[number_of_characters_to_truncate + linefeed_truncation_offset :]
+            )
+            logging_structured_tool_result.data = text
+            token_count = count_tool_response_tokens(
+                llm=llm, structured_tool_result=logging_structured_tool_result
+            )
+    if token_count < original_token_count:
+        logging.info(
+            f"Logs for pod {structured_params.pod_name}/{structured_params.namespace} have been truncated from {original_token_count} tokens down to {token_count} tokens."
+        )
+
+
 class PodLoggingTool(Tool):
     """Common tool for fetching pod logs across different logging backends"""
```
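`truncate_logs` counts tokens but trims characters, so each pass removes a character count proportional to how far over budget the token count is, then re-measures. One iteration of that arithmetic with toy numbers:

```python
from math import ceil

# One pass of the proportional trim in truncate_logs, with toy numbers.
token_count, token_limit = 2000, 500  # 4x over the allowance
character_count = 8000                # length of the stringified logs
ratio = token_count / token_limit     # 4.0
number_of_characters_to_truncate = character_count - ceil(character_count / ratio)
# 8000 - 2000 = 6000: drop the oldest ~6000 characters (rounded forward to the
# next newline so log lines stay atomic), prepend TRUNCATION_PROMPT_PREFIX,
# then recount tokens; the while loop repeats if the estimate fell short.
print(number_of_characters_to_truncate)  # 6000
```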
```diff
@@ -175,9 +246,7 @@ If you hit the log limit and see lots of repetitive INFO logs, use exclude_filte
 
         return params
 
-    def _invoke(
-        self, params: dict, user_approved: bool = False
-    ) -> StructuredToolResult:
+    def _invoke(self, params: dict, context: ToolInvokeContext) -> StructuredToolResult:
         structured_params = FetchPodLogsParams(
             namespace=get_param_or_raise(params, "namespace"),
             pod_name=get_param_or_raise(params, "pod_name"),
@@ -192,6 +261,13 @@ If you hit the log limit and see lots of repetitive INFO logs, use exclude_filte
             params=structured_params,
         )
 
+        truncate_logs(
+            logging_structured_tool_result=result,
+            llm=context.llm,
+            token_limit=context.max_token_count,
+            structured_params=structured_params,
+        )
+
         return result
 
     def get_parameterized_one_liner(self, params: dict) -> str:
```
holmes/plugins/toolsets/mcp/toolset_mcp.py:

```diff
@@ -1,71 +1,139 @@
+import json
+
+from holmes.common.env_vars import SSE_READ_TIMEOUT
 from holmes.core.tools import (
+    ToolInvokeContext,
     Toolset,
     Tool,
     ToolParameter,
     StructuredToolResult,
-
+    StructuredToolResultStatus,
     CallablePrerequisite,
 )
 
 from typing import Dict, Any, List, Optional
 from mcp.client.session import ClientSession
 from mcp.client.sse import sse_client
+from mcp.client.streamable_http import streamablehttp_client
 
 from mcp.types import Tool as MCP_Tool
-from mcp.types import CallToolResult
 
 import asyncio
-from
+from contextlib import asynccontextmanager
+from pydantic import BaseModel, Field, AnyUrl, model_validator
 from typing import Tuple
 import logging
+from enum import Enum
+import threading
 
+# Lock per MCP server URL to serialize calls to the same server
+_server_locks: Dict[str, threading.Lock] = {}
+_locks_lock = threading.Lock()
 
-
-
+
+def get_server_lock(url: str) -> threading.Lock:
+    """Get or create a lock for a specific MCP server URL."""
+    with _locks_lock:
+        if url not in _server_locks:
+            _server_locks[url] = threading.Lock()
+        return _server_locks[url]
+
+
+class MCPMode(str, Enum):
+    SSE = "sse"
+    STREAMABLE_HTTP = "streamable-http"
+
+
+class MCPConfig(BaseModel):
+    url: AnyUrl
+    mode: MCPMode = MCPMode.SSE
     headers: Optional[Dict[str, str]] = None
 
-
-
-
+
+@asynccontextmanager
+async def get_initialized_mcp_session(
+    url: str, headers: Optional[Dict[str, str]], mode: MCPMode
+):
+    if mode == MCPMode.SSE:
+        async with sse_client(
+            url, headers=headers, sse_read_timeout=SSE_READ_TIMEOUT
+        ) as (
+            read_stream,
+            write_stream,
+        ):
+            async with ClientSession(read_stream, write_stream) as session:
+                _ = await session.initialize()
+                yield session
+    else:
+        async with streamablehttp_client(
+            url, headers=headers, sse_read_timeout=SSE_READ_TIMEOUT
+        ) as (
+            read_stream,
+            write_stream,
+            _,
+        ):
+            async with ClientSession(read_stream, write_stream) as session:
+                _ = await session.initialize()
+                yield session
+
+
+class RemoteMCPTool(Tool):
+    toolset: "RemoteMCPToolset" = Field(exclude=True)
+
+    def _invoke(self, params: dict, context: ToolInvokeContext) -> StructuredToolResult:
         try:
-
+            # Serialize calls to the same MCP server to prevent SSE conflicts
+            # Different servers can still run in parallel
+            if not self.toolset._mcp_config:
+                raise ValueError("MCP config not initialized")
+            lock = get_server_lock(str(self.toolset._mcp_config.url))
+            with lock:
+                return asyncio.run(self._invoke_async(params))
         except Exception as e:
             return StructuredToolResult(
-                status=
+                status=StructuredToolResultStatus.ERROR,
                 error=str(e.args),
                 params=params,
                 invocation=f"MCPtool {self.name} with params {params}",
             )
 
+    @staticmethod
+    def _is_content_error(content: str) -> bool:
+        try:  # aws mcp sometimes returns an error in content - status code != 200
+            json_content: dict = json.loads(content)
+            status_code = json_content.get("response", {}).get("status_code", 200)
+            return status_code >= 300
+        except Exception:
+            return False
+
     async def _invoke_async(self, params: Dict) -> StructuredToolResult:
-        async with
-
-
-
-
-
-        )
-
-
-
-
-
-            data=merged_text,
-            params=params,
-            invocation=f"MCPtool {self.name} with params {params}",
-        )
+        async with self.toolset.get_initialized_session() as session:
+            tool_result = await session.call_tool(self.name, params)
+
+        merged_text = " ".join(c.text for c in tool_result.content if c.type == "text")
+        return StructuredToolResult(
+            status=(
+                StructuredToolResultStatus.ERROR
+                if (tool_result.isError or self._is_content_error(merged_text))
+                else StructuredToolResultStatus.SUCCESS
+            ),
+            data=merged_text,
+            params=params,
+            invocation=f"MCPtool {self.name} with params {params}",
+        )
 
     @classmethod
-    def create(
+    def create(
+        cls,
+        tool: MCP_Tool,
+        toolset: "RemoteMCPToolset",
+    ):
         parameters = cls.parse_input_schema(tool.inputSchema)
         return cls(
-            url=url,
             name=tool.name,
             description=tool.description or "",
             parameters=parameters,
-
+            toolset=toolset,
         )
 
     @classmethod
```
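`get_server_lock` hands back one shared lock per server URL, so concurrent tool calls against the same MCP server serialize while calls to different servers still run in parallel. A quick check of that property (a sketch, assuming the helper is importable from the toolset module):

```python
# Same URL -> same lock object; different URL -> independent lock.
from holmes.plugins.toolsets.mcp.toolset_mcp import get_server_lock

lock_a1 = get_server_lock("http://mcp-a:8000/sse")
lock_a2 = get_server_lock("http://mcp-a:8000/sse")
lock_b = get_server_lock("http://mcp-b:8000/sse")
assert lock_a1 is lock_a2
assert lock_a1 is not lock_b
```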
```diff
@@ -85,53 +153,111 @@ class RemoteMCPTool(Tool):
         return parameters
 
     def get_parameterized_one_liner(self, params: Dict) -> str:
-
+        if params:
+            if params.get("cli_command"):  # Return AWS MCP cli command, if available
+                return f"{params.get('cli_command')}"
+
+        url = (
+            str(self.toolset._mcp_config.url) if self.toolset._mcp_config else "unknown"
+        )
+        return f"Call MCP Server ({url} - {self.name})"
 
 
 class RemoteMCPToolset(Toolset):
-    url: AnyUrl
     tools: List[RemoteMCPTool] = Field(default_factory=list)  # type: ignore
     icon_url: str = "https://registry.npmmirror.com/@lobehub/icons-static-png/1.46.0/files/light/mcp.png"
+    _mcp_config: Optional[MCPConfig] = None
 
     def model_post_init(self, __context: Any) -> None:
-        self.prerequisites = [
+        self.prerequisites = [
+            CallablePrerequisite(callable=self.prerequisites_callable)
+        ]
+
+    @model_validator(mode="before")
+    @classmethod
+    def migrate_url_to_config(cls, values: dict[str, Any]) -> dict[str, Any]:
+        """
+        Migrates url from field parameter to config object.
+        If url is passed as a parameter, it's moved to config (or config is created if it doesn't exist).
+        """
+        if not isinstance(values, dict) or "url" not in values:
+            return values
 
-
-
+        url_value = values.pop("url")
+        if url_value is None:
+            return values
 
-
-
-
-
-        return v
+        config = values.get("config")
+        if config is None:
+            config = {}
+            values["config"] = config
 
-
-
+        toolset_name = values.get("name", "unknown")
+        if "url" in config:
+            logging.warning(
+                f"Toolset {toolset_name}: has two urls defined, remove the 'url' field from the toolset configuration and keep the 'url' in the config section."
+            )
+            return values
+
+        logging.warning(
+            f"Toolset {toolset_name}: 'url' field has been migrated to config. "
+            "Please move 'url' to the config section."
+        )
+        config["url"] = url_value
+        return values
+
+    def prerequisites_callable(self, config) -> Tuple[bool, str]:
         try:
+            if not config:
+                return (False, f"Config is required for {self.name}")
+
+            if "mode" in config:
+                mode_value = config.get("mode")
+                allowed_modes = [e.value for e in MCPMode]
+                if mode_value not in allowed_modes:
+                    return (
+                        False,
+                        f'Invalid mode "{mode_value}", allowed modes are {", ".join(allowed_modes)}',
+                    )
+
+            self._mcp_config = MCPConfig(**config)
+
+            clean_url_str = str(self._mcp_config.url).rstrip("/")
+
+            if self._mcp_config.mode == MCPMode.SSE and not clean_url_str.endswith(
+                "/sse"
+            ):
+                self._mcp_config.url = AnyUrl(clean_url_str + "/sse")
+
             tools_result = asyncio.run(self._get_server_tools())
+
             self.tools = [
-                RemoteMCPTool.create(
-                for tool in tools_result.tools
+                RemoteMCPTool.create(tool, self) for tool in tools_result.tools
             ]
 
             if not self.tools:
                 logging.warning(f"mcp server {self.name} loaded 0 tools.")
+
             return (True, "")
         except Exception as e:
-            # using e.args, the asyncio wrapper could stack another exception this helps printing them all.
             return (
                 False,
-                f"Failed to load mcp server {self.name} {self.url} {str(e
+                f"Failed to load mcp server {self.name} {self._mcp_config.url if self._mcp_config else 'unknown'}: {str(e)}",
             )
 
     async def _get_server_tools(self):
-        async with
-
-
-
-
-
-
+        async with self.get_initialized_session() as session:
+            return await session.list_tools()
+
+    def get_initialized_session(self):
+        return get_initialized_mcp_session(
+            str(self._mcp_config.url), self._mcp_config.headers, self._mcp_config.mode
+        )
 
     def get_example_config(self) -> Dict[str, Any]:
-
+        example_config = MCPConfig(
+            url=AnyUrl("http://example.com:8000/mcp/messages"),
+            mode=MCPMode.STREAMABLE_HTTP,
+            headers={"Authorization": "Bearer YOUR_TOKEN"},
+        )
+        return example_config.model_dump()
```
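Putting the pieces together, a hedged usage sketch of the new config and session helper (the endpoint, token, and server reachability are assumptions; `mode` takes the two `MCPMode` values shown above, and the values mirror `get_example_config()`):

```python
import asyncio

from holmes.plugins.toolsets.mcp.toolset_mcp import (
    MCPConfig,
    MCPMode,
    get_initialized_mcp_session,
)

async def list_remote_tools() -> None:
    # Placeholder endpoint and token, mirroring get_example_config().
    config = MCPConfig(
        url="http://example.com:8000/mcp/messages",
        mode=MCPMode.STREAMABLE_HTTP,
        headers={"Authorization": "Bearer YOUR_TOKEN"},
    )
    async with get_initialized_mcp_session(
        str(config.url), config.headers, config.mode
    ) as session:
        tools = await session.list_tools()
        print([t.name for t in tools.tools])

asyncio.run(list_remote_tools())
```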
holmes/plugins/toolsets/newrelic/new_relic_api.py (new file):

```diff
@@ -0,0 +1,125 @@
+"""NewRelic API wrapper for executing NRQL queries via GraphQL."""
+
+import logging
+from typing import Any, Dict
+
+import requests  # type: ignore
+
+
+logger = logging.getLogger(__name__)
+
+
+class NewRelicAPI:
+    """Python wrapper for NewRelic GraphQL API.
+
+    This class provides a clean interface to execute NRQL queries via the NewRelic GraphQL API,
+    supporting both US and EU datacenters.
+    """
+
+    def __init__(self, api_key: str, account_id: str, is_eu_datacenter: bool = False):
+        """Initialize the NewRelic API wrapper.
+
+        Args:
+            api_key: NewRelic API key
+            account_id: NewRelic account ID
+            is_eu_datacenter: If True, use EU datacenter URL. Defaults to False (US).
+        """
+        self.api_key = api_key
+        # Validate account_id is numeric to prevent injection
+        try:
+            self.account_id = int(account_id)
+        except ValueError:
+            raise ValueError(f"Invalid account_id: must be numeric, got '{account_id}'")
+        self.is_eu_datacenter = is_eu_datacenter
+
+    def _get_api_url(self) -> str:
+        """Get the appropriate API URL based on datacenter location.
+
+        Returns:
+            str: The GraphQL API endpoint URL
+        """
+        if self.is_eu_datacenter:
+            return "https://api.eu.newrelic.com/graphql"
+        return "https://api.newrelic.com/graphql"
+
+    def _make_request(
+        self, graphql_query: Dict[str, Any], timeout: int = 30
+    ) -> Dict[str, Any]:
+        """Make HTTP POST request to NewRelic GraphQL API.
+
+        Args:
+            graphql_query: The GraphQL query as a dictionary
+            timeout: Request timeout in seconds
+
+        Returns:
+            JSON response from the API
+
+        Raises:
+            requests.exceptions.HTTPError: If the request fails
+            Exception: If GraphQL returns errors
+        """
+        url = self._get_api_url()
+        headers = {
+            "Content-Type": "application/json",
+            "Api-Key": self.api_key,
+        }
+
+        response = requests.post(
+            url,
+            headers=headers,
+            json=graphql_query,
+            timeout=timeout,
+        )
+        response.raise_for_status()
+
+        # Parse JSON response
+        data = response.json()
+
+        # Check for GraphQL errors even on 200 responses
+        if "errors" in data and data["errors"]:
+            error_msg = data["errors"][0].get("message", "Unknown GraphQL error")
+            raise Exception(f"NewRelic GraphQL error: {error_msg}")
+
+        return data
+
+    def execute_nrql_query(self, nrql_query: str) -> list:
+        """Execute an NRQL query via the NewRelic GraphQL API.
+
+        Args:
+            nrql_query: The NRQL query string to execute
+
+        Returns:
+            list: The query results from NewRelic (extracted from the nested response)
+
+        Raises:
+            requests.exceptions.HTTPError: If the API request fails
+            Exception: If GraphQL returns errors
+        """
+        # Build the GraphQL query using variables to prevent injection
+        # Note: New Relic's GraphQL API requires the account ID to be inline, but we can use variables for the NRQL query
+        graphql_query = {
+            "query": f"""
+            query ExecuteNRQL($nrqlQuery: Nrql!) {{
+                actor {{
+                    account(id: {self.account_id}) {{
+                        nrql(query: $nrqlQuery) {{
+                            results
+                        }}
+                    }}
+                }}
+            }}
+            """,
+            "variables": {"nrqlQuery": nrql_query},
+        }
+
+        logger.info(f"Executing NRQL query: {nrql_query}")
+        response = self._make_request(graphql_query)
+
+        # Extract just the results array from the nested response
+        try:
+            results = response["data"]["actor"]["account"]["nrql"]["results"]
+            return results
+        except (KeyError, TypeError) as e:
+            raise Exception(
+                f"Failed to extract results from NewRelic response: {e}"
+            ) from e
```
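A short usage sketch of the new wrapper; the API key, account ID, and NRQL below are placeholders:

```python
from holmes.plugins.toolsets.newrelic.new_relic_api import NewRelicAPI

# Placeholder credentials; account_id must be numeric or __init__ raises ValueError.
api = NewRelicAPI(api_key="NRAK-XXXX", account_id="1234567", is_eu_datacenter=False)

results = api.execute_nrql_query(
    "SELECT count(*) FROM Transaction SINCE 1 hour ago FACET appName"
)
for row in results:
    print(row)
```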