holmesgpt 0.16.2a0__py3-none-any.whl → 0.18.4__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (162)
  1. holmes/__init__.py +3 -5
  2. holmes/clients/robusta_client.py +4 -3
  3. holmes/common/env_vars.py +18 -2
  4. holmes/common/openshift.py +1 -1
  5. holmes/config.py +11 -6
  6. holmes/core/conversations.py +30 -13
  7. holmes/core/investigation.py +21 -25
  8. holmes/core/investigation_structured_output.py +3 -3
  9. holmes/core/issue.py +1 -1
  10. holmes/core/llm.py +50 -31
  11. holmes/core/models.py +19 -17
  12. holmes/core/openai_formatting.py +1 -1
  13. holmes/core/prompt.py +47 -2
  14. holmes/core/runbooks.py +1 -0
  15. holmes/core/safeguards.py +4 -2
  16. holmes/core/supabase_dal.py +4 -2
  17. holmes/core/tool_calling_llm.py +102 -141
  18. holmes/core/tools.py +19 -28
  19. holmes/core/tools_utils/token_counting.py +9 -2
  20. holmes/core/tools_utils/tool_context_window_limiter.py +13 -30
  21. holmes/core/tools_utils/tool_executor.py +0 -18
  22. holmes/core/tools_utils/toolset_utils.py +1 -0
  23. holmes/core/toolset_manager.py +37 -2
  24. holmes/core/tracing.py +13 -2
  25. holmes/core/transformers/__init__.py +1 -1
  26. holmes/core/transformers/base.py +1 -0
  27. holmes/core/transformers/llm_summarize.py +3 -2
  28. holmes/core/transformers/registry.py +2 -1
  29. holmes/core/transformers/transformer.py +1 -0
  30. holmes/core/truncation/compaction.py +37 -2
  31. holmes/core/truncation/input_context_window_limiter.py +3 -2
  32. holmes/interactive.py +52 -8
  33. holmes/main.py +17 -37
  34. holmes/plugins/interfaces.py +2 -1
  35. holmes/plugins/prompts/__init__.py +2 -1
  36. holmes/plugins/prompts/_fetch_logs.jinja2 +5 -5
  37. holmes/plugins/prompts/_runbook_instructions.jinja2 +2 -1
  38. holmes/plugins/prompts/base_user_prompt.jinja2 +7 -0
  39. holmes/plugins/prompts/conversation_history_compaction.jinja2 +2 -1
  40. holmes/plugins/prompts/generic_ask.jinja2 +0 -2
  41. holmes/plugins/prompts/generic_ask_conversation.jinja2 +0 -2
  42. holmes/plugins/prompts/generic_ask_for_issue_conversation.jinja2 +0 -2
  43. holmes/plugins/prompts/generic_investigation.jinja2 +0 -2
  44. holmes/plugins/prompts/investigation_procedure.jinja2 +2 -1
  45. holmes/plugins/prompts/kubernetes_workload_ask.jinja2 +0 -2
  46. holmes/plugins/prompts/kubernetes_workload_chat.jinja2 +0 -2
  47. holmes/plugins/runbooks/__init__.py +32 -3
  48. holmes/plugins/sources/github/__init__.py +4 -2
  49. holmes/plugins/sources/prometheus/models.py +1 -0
  50. holmes/plugins/toolsets/__init__.py +30 -26
  51. holmes/plugins/toolsets/atlas_mongodb/mongodb_atlas.py +13 -12
  52. holmes/plugins/toolsets/azure_sql/apis/alert_monitoring_api.py +3 -2
  53. holmes/plugins/toolsets/azure_sql/apis/azure_sql_api.py +2 -1
  54. holmes/plugins/toolsets/azure_sql/apis/connection_failure_api.py +3 -2
  55. holmes/plugins/toolsets/azure_sql/apis/connection_monitoring_api.py +3 -1
  56. holmes/plugins/toolsets/azure_sql/apis/storage_analysis_api.py +3 -1
  57. holmes/plugins/toolsets/azure_sql/azure_sql_toolset.py +12 -12
  58. holmes/plugins/toolsets/azure_sql/tools/analyze_connection_failures.py +7 -7
  59. holmes/plugins/toolsets/azure_sql/tools/analyze_database_connections.py +7 -7
  60. holmes/plugins/toolsets/azure_sql/tools/analyze_database_health_status.py +3 -5
  61. holmes/plugins/toolsets/azure_sql/tools/analyze_database_performance.py +3 -3
  62. holmes/plugins/toolsets/azure_sql/tools/analyze_database_storage.py +7 -7
  63. holmes/plugins/toolsets/azure_sql/tools/get_active_alerts.py +6 -8
  64. holmes/plugins/toolsets/azure_sql/tools/get_slow_queries.py +3 -3
  65. holmes/plugins/toolsets/azure_sql/tools/get_top_cpu_queries.py +3 -3
  66. holmes/plugins/toolsets/azure_sql/tools/get_top_data_io_queries.py +3 -3
  67. holmes/plugins/toolsets/azure_sql/tools/get_top_log_io_queries.py +3 -3
  68. holmes/plugins/toolsets/azure_sql/utils.py +0 -32
  69. holmes/plugins/toolsets/bash/argocd/__init__.py +3 -3
  70. holmes/plugins/toolsets/bash/aws/__init__.py +4 -4
  71. holmes/plugins/toolsets/bash/azure/__init__.py +4 -4
  72. holmes/plugins/toolsets/bash/bash_toolset.py +2 -3
  73. holmes/plugins/toolsets/bash/common/bash.py +19 -9
  74. holmes/plugins/toolsets/bash/common/bash_command.py +1 -1
  75. holmes/plugins/toolsets/bash/common/stringify.py +1 -1
  76. holmes/plugins/toolsets/bash/kubectl/__init__.py +2 -1
  77. holmes/plugins/toolsets/bash/kubectl/constants.py +0 -1
  78. holmes/plugins/toolsets/bash/kubectl/kubectl_get.py +3 -4
  79. holmes/plugins/toolsets/bash/parse_command.py +12 -13
  80. holmes/plugins/toolsets/connectivity_check.py +124 -0
  81. holmes/plugins/toolsets/coralogix/api.py +132 -119
  82. holmes/plugins/toolsets/coralogix/coralogix.jinja2 +14 -0
  83. holmes/plugins/toolsets/coralogix/toolset_coralogix.py +219 -0
  84. holmes/plugins/toolsets/coralogix/utils.py +15 -79
  85. holmes/plugins/toolsets/datadog/datadog_api.py +36 -3
  86. holmes/plugins/toolsets/datadog/datadog_logs_instructions.jinja2 +34 -1
  87. holmes/plugins/toolsets/datadog/datadog_metrics_instructions.jinja2 +3 -3
  88. holmes/plugins/toolsets/datadog/datadog_models.py +59 -0
  89. holmes/plugins/toolsets/datadog/datadog_url_utils.py +213 -0
  90. holmes/plugins/toolsets/datadog/instructions_datadog_traces.jinja2 +165 -28
  91. holmes/plugins/toolsets/datadog/toolset_datadog_general.py +71 -28
  92. holmes/plugins/toolsets/datadog/toolset_datadog_logs.py +224 -375
  93. holmes/plugins/toolsets/datadog/toolset_datadog_metrics.py +67 -36
  94. holmes/plugins/toolsets/datadog/toolset_datadog_traces.py +360 -343
  95. holmes/plugins/toolsets/elasticsearch/__init__.py +6 -0
  96. holmes/plugins/toolsets/elasticsearch/elasticsearch.py +834 -0
  97. holmes/plugins/toolsets/git.py +7 -8
  98. holmes/plugins/toolsets/grafana/base_grafana_toolset.py +16 -4
  99. holmes/plugins/toolsets/grafana/common.py +2 -30
  100. holmes/plugins/toolsets/grafana/grafana_tempo_api.py +2 -1
  101. holmes/plugins/toolsets/grafana/loki/instructions.jinja2 +18 -2
  102. holmes/plugins/toolsets/grafana/loki/toolset_grafana_loki.py +92 -18
  103. holmes/plugins/toolsets/grafana/loki_api.py +4 -0
  104. holmes/plugins/toolsets/grafana/toolset_grafana.py +109 -25
  105. holmes/plugins/toolsets/grafana/toolset_grafana_dashboard.jinja2 +22 -0
  106. holmes/plugins/toolsets/grafana/toolset_grafana_tempo.py +201 -33
  107. holmes/plugins/toolsets/grafana/trace_parser.py +3 -2
  108. holmes/plugins/toolsets/internet/internet.py +10 -10
  109. holmes/plugins/toolsets/internet/notion.py +5 -6
  110. holmes/plugins/toolsets/investigator/core_investigation.py +3 -3
  111. holmes/plugins/toolsets/investigator/model.py +3 -1
  112. holmes/plugins/toolsets/json_filter_mixin.py +134 -0
  113. holmes/plugins/toolsets/kafka.py +12 -7
  114. holmes/plugins/toolsets/kubernetes.yaml +260 -30
  115. holmes/plugins/toolsets/kubernetes_logs.py +3 -3
  116. holmes/plugins/toolsets/logging_utils/logging_api.py +16 -6
  117. holmes/plugins/toolsets/mcp/toolset_mcp.py +88 -60
  118. holmes/plugins/toolsets/newrelic/new_relic_api.py +41 -1
  119. holmes/plugins/toolsets/newrelic/newrelic.jinja2 +24 -0
  120. holmes/plugins/toolsets/newrelic/newrelic.py +212 -55
  121. holmes/plugins/toolsets/prometheus/prometheus.py +358 -102
  122. holmes/plugins/toolsets/prometheus/prometheus_instructions.jinja2 +11 -3
  123. holmes/plugins/toolsets/rabbitmq/api.py +23 -4
  124. holmes/plugins/toolsets/rabbitmq/toolset_rabbitmq.py +5 -5
  125. holmes/plugins/toolsets/robusta/robusta.py +5 -5
  126. holmes/plugins/toolsets/runbook/runbook_fetcher.py +25 -6
  127. holmes/plugins/toolsets/servicenow_tables/servicenow_tables.py +1 -1
  128. holmes/plugins/toolsets/utils.py +1 -1
  129. holmes/utils/config_utils.py +1 -1
  130. holmes/utils/connection_utils.py +31 -0
  131. holmes/utils/console/result.py +10 -0
  132. holmes/utils/file_utils.py +2 -1
  133. holmes/utils/global_instructions.py +10 -26
  134. holmes/utils/holmes_status.py +4 -3
  135. holmes/utils/log.py +15 -0
  136. holmes/utils/markdown_utils.py +2 -3
  137. holmes/utils/memory_limit.py +58 -0
  138. holmes/utils/sentry_helper.py +23 -0
  139. holmes/utils/stream.py +12 -5
  140. holmes/utils/tags.py +4 -3
  141. holmes/version.py +3 -1
  142. {holmesgpt-0.16.2a0.dist-info → holmesgpt-0.18.4.dist-info}/METADATA +12 -10
  143. holmesgpt-0.18.4.dist-info/RECORD +258 -0
  144. holmes/plugins/toolsets/aws.yaml +0 -80
  145. holmes/plugins/toolsets/coralogix/toolset_coralogix_logs.py +0 -114
  146. holmes/plugins/toolsets/datadog/datadog_traces_formatter.py +0 -310
  147. holmes/plugins/toolsets/datadog/toolset_datadog_rds.py +0 -736
  148. holmes/plugins/toolsets/grafana/grafana_api.py +0 -64
  149. holmes/plugins/toolsets/opensearch/__init__.py +0 -0
  150. holmes/plugins/toolsets/opensearch/opensearch.py +0 -250
  151. holmes/plugins/toolsets/opensearch/opensearch_logs.py +0 -161
  152. holmes/plugins/toolsets/opensearch/opensearch_traces.py +0 -215
  153. holmes/plugins/toolsets/opensearch/opensearch_traces_instructions.jinja2 +0 -12
  154. holmes/plugins/toolsets/opensearch/opensearch_utils.py +0 -166
  155. holmes/utils/keygen_utils.py +0 -6
  156. holmesgpt-0.16.2a0.dist-info/RECORD +0 -258
  157. holmes/plugins/toolsets/{opensearch → elasticsearch}/opensearch_ppl_query_docs.jinja2 +0 -0
  158. holmes/plugins/toolsets/{opensearch → elasticsearch}/opensearch_query_assist.py +2 -2
  159. /holmes/plugins/toolsets/{opensearch → elasticsearch}/opensearch_query_assist_instructions.jinja2 +0 -0
  160. {holmesgpt-0.16.2a0.dist-info → holmesgpt-0.18.4.dist-info}/LICENSE +0 -0
  161. {holmesgpt-0.16.2a0.dist-info → holmesgpt-0.18.4.dist-info}/WHEEL +0 -0
  162. {holmesgpt-0.16.2a0.dist-info → holmesgpt-0.18.4.dist-info}/entry_points.txt +0 -0

holmes/plugins/toolsets/kubernetes.yaml
@@ -89,12 +89,124 @@ toolsets:
  - name: "kubernetes_jq_query"
  user_description: "Query Kubernetes Resources: kubectl get {{kind}} --all-namespaces -o json | jq -r {{jq_expr}}"
  description: >
- Use kubectl to get json for all resources of a specific kind pipe the results to jq to filter them. Do not worry about escaping the jq_expr it will be done by the system on an unescaped expression that you give. e.g. give an expression like .items[] | .spec.containers[].image | select(test("^gcr.io/") | not)
- command: kubectl get {{ kind }} --all-namespaces -o json | jq -r {{ jq_expr }}
+ Use kubectl to get json for all resources of a specific kind and filter with jq.
+ IMPORTANT: The 'kind' parameter must be the plural form of the resource type
+ (e.g., use "pods" not "pod", "services" not "service", "jobs" not "job").
+ Do not worry about escaping the jq_expr - it will be done by the system.
+ Example: .items[] | .spec.containers[].image | select(test("^gcr.io/") | not)
+ script: |
+ #!/bin/bash
+
+ echo "Executing paginated query for {{ kind }} resources..."
+ echo "Expression: {{ jq_expr }}"
+ echo "---"
+
+ # Get the API path for the resource kind using kubectl
+ API_INFO=$(kubectl api-resources --no-headers | grep "^{{ kind }} " | head -1)
+
+ if [ -z "$API_INFO" ]; then
+ echo "Error: Unable to find resource kind '{{ kind }}'" >&2
+ exit 1
+ fi
+
+ # Extract NAMESPACED value
+ if [[ "$API_INFO" == *" true "* ]]; then
+ NAMESPACED="true"
+ PREFIX=$(echo "$API_INFO" | sed 's/ true .*//')
+ elif [[ "$API_INFO" == *" false "* ]]; then
+ NAMESPACED="false"
+ PREFIX=$(echo "$API_INFO" | sed 's/ false .*//')
+ else
+ echo "Error: Could not find NAMESPACED field (true/false) in API info" >&2
+ exit 1
+ fi
+
+ # Trim trailing spaces from prefix and collapse internal spaces
+ PREFIX=$(echo "$PREFIX" | sed 's/ *$//' | sed 's/ */ /g')
+
+ IFS=' ' read -ra PREFIX_FIELDS <<< "$PREFIX"
+ FIELD_COUNT=0
+ for field in "${PREFIX_FIELDS[@]}"; do
+ ((FIELD_COUNT++))
+ done
+
+ RESOURCE_NAME="${PREFIX_FIELDS[0]}"
+ if [ $FIELD_COUNT -ge 2 ]; then
+ API_VERSION="${PREFIX_FIELDS[$((FIELD_COUNT - 1))]}"
+ else
+ API_VERSION=""
+ fi
+
+ if [ -z "$API_VERSION" ] || [ -z "$RESOURCE_NAME" ]; then
+ echo "Error: Unable to parse API info for resource kind '{{ kind }}'" >&2
+ exit 1
+ fi
+
+ # Build API path
+ if [[ "$API_VERSION" == "v1" ]]; then
+ API_PATH="/api/v1/${RESOURCE_NAME}"
+ else
+ API_PATH="/apis/${API_VERSION}/${RESOURCE_NAME}"
+ fi
+
+ # Process resources in chunks using API pagination
+ LIMIT=500 # Process 500 items at a time
+ CONTINUE=""
+ PROCESSED=0
+ TOTAL_MATCHES=0
+
+ while true; do
+ # Build API query with limit and continue token
+ if [ -z "$CONTINUE" ]; then
+ # First request - get from all namespaces
+ QUERY="${API_PATH}?limit=${LIMIT}"
+ else
+ # Subsequent requests with continue token
+ QUERY="${API_PATH}?limit=${LIMIT}&continue=${CONTINUE}"
+ fi
+
+ OUTPUT=$(kubectl get --raw "$QUERY" 2>&1)
+ exit_code=$?
+
+ if [ $exit_code -ne 0 ]; then
+ echo "Error: $OUTPUT" >&2
+ exit $exit_code
+ fi
+
+ ITEMS_COUNT=$(echo "$OUTPUT" | jq '.items | length')
+
+ MATCHES=$(echo "$OUTPUT" | jq -r {{ jq_expr }} 2>&1)
+ jq_exit=$?
+ if [ $jq_exit -ne 0 ]; then
+ echo "Error: jq expression failed: $MATCHES" >&2
+ exit $jq_exit
+ fi
+
+ if [ "$ITEMS_COUNT" -gt 0 ]; then
+ if [ -n "$MATCHES" ]; then
+ echo "$MATCHES"
+ MATCH_COUNT=$(echo "$MATCHES" | grep -c . || true)
+ TOTAL_MATCHES=$((TOTAL_MATCHES + MATCH_COUNT))
+ fi
+
+ PROCESSED=$((PROCESSED + ITEMS_COUNT))
+
+ echo "Processed $PROCESSED items, found $TOTAL_MATCHES matches so far..." >&2
+ fi
+
+ CONTINUE=$(echo "$OUTPUT" | jq -r '.metadata.continue // empty')
+
+ if [ -z "$CONTINUE" ]; then
+ break
+ fi
+ done
+
+ echo "---" >&2
+ echo "Total items processed: $PROCESSED, matches found: $TOTAL_MATCHES" >&2
  transformers:
  - name: llm_summarize
  config:
- input_threshold: 1000
+ input_threshold: 10000
  prompt: |
  Summarize this jq query output focusing on:
  - Key patterns and commonalities in the data
@@ -106,52 +218,170 @@ toolsets:
  - Be concise: aim for ≤ 50% of the original text; prioritize aggregates and actionable outliers
  - Include grep-ready keys/values; avoid repeating entire objects or unchanged defaults

+ - name: "kubernetes_tabular_query"
+ user_description: "Tabular output of specific fields: kubectl get {{kind}} --all-namespaces -o custom-columns={{columns}}"
+ description: >
+ Extract specific fields from Kubernetes resources in tabular format with optional filtering.
+ Memory-efficient way to query large clusters - only requested fields are transmitted.
+ Column specification format: HEADER:FIELD_PATH,HEADER2:FIELD_PATH2,...
+
+ Optional filtering parameter:
+ - filter_pattern: Pattern to match in any column (supports grep regex)
+
+ Examples:
+ - Basic fields: NAME:.metadata.name,STATUS:.status.phase,NODE:.spec.nodeName
+ - Filter by status: filter_pattern="Running"
+ - Filter out lines with <none>: filter_pattern="-v '<none>'"
+ - Nested fields: CREATED:.metadata.creationTimestamp,IMAGE:.spec.containers[0].image
+ - Array fields: LABELS:.metadata.labels,PORTS:.spec.ports[*].port
+
+ Note: Output is tabular text with column headers. Filtering works on the entire line.
+ Note: not allowed characters are: ' / ; and newline
+ command: kubectl get {{ kind }} --all-namespaces -o custom-columns='{{ columns }}'{% if filter_pattern %} | (head -n 1; tail -n +2 | grep {{ filter_pattern }}){% endif %}
+ transformers:
+ - name: llm_summarize
+ config:
+ input_threshold: 10000
+ prompt: |
+ Summarize this tabular output focusing on:
+ - Key patterns and trends in the data
+ - Resources that need attention (errors, pending, failures)
+ - Group similar items into aggregate descriptions
+ - Highlight outliers or unusual values
+ - Mention specific resource names only for problematic items
+ - Provide counts and distributions where relevant
+ - Be concise: aim for ≤ 50% of the original size
+ - Keep output actionable and focused on anomalies
+
  - name: "kubernetes_count"
  user_description: "Count Kubernetes Resources: kubectl get {{kind}} --all-namespaces -o json | jq -c -r {{ jq_expr }}"
  description: >
  Use kubectl to get apply a jq filter and then count the results.
  Use this whenever asked to count kubernetes resources.
+ IMPORTANT: The 'kind' parameter must be the plural form of the resource type
+ (e.g., use "pods" not "pod", "services" not "service", "jobs" not "job").
  Use select() to filter objects before extracting properties, e.g. .items[] | select(.metadata.namespace == "test-1") | .metadata.name
  Do not worry about escaping the jq_expr it will be done by the system on an unescaped expression that you give.
  e.g. give an expression like .items[] | select(.spec.containers[].image | test("^gcr.io/") | not) | .metadata.name
  script: |
+ #!/bin/bash
+
  echo "Command executed: kubectl get {{ kind }} --all-namespaces -o json | jq -c -r {{ jq_expr }}"
  echo "---"

- # Execute the command and capture both stdout and stderr separately
- temp_error=$(mktemp)
- matches=$(kubectl get {{ kind }} --all-namespaces -o json 2>"$temp_error" | jq -c -r {{ jq_expr }} 2>>"$temp_error")
- exit_code=$?
- error_output=$(cat "$temp_error")
- rm -f "$temp_error"
-
- if [ $exit_code -ne 0 ]; then
- echo "Error executing command (exit code: $exit_code):"
- echo "$error_output"
- exit $exit_code
+ # Get the API path for the resource kind
+ API_INFO=$(kubectl api-resources --no-headers | grep "^{{ kind }} " | head -1)
+
+ if [ -z "$API_INFO" ]; then
+ echo "Error: Unable to find resource kind '{{ kind }}'" >&2
+ exit 1
+ fi
+
+ if [[ "$API_INFO" == *" true "* ]]; then
+ NAMESPACED="true"
+ PREFIX=$(echo "$API_INFO" | sed 's/ true .*//')
+ elif [[ "$API_INFO" == *" false "* ]]; then
+ NAMESPACED="false"
+ PREFIX=$(echo "$API_INFO" | sed 's/ false .*//')
  else
- # Show any stderr warnings even if command succeeded
- if [ -n "$error_output" ]; then
- echo "Warnings/stderr output:"
- echo "$error_output"
- echo "---"
- fi
+ echo "Error: Could not find NAMESPACED field (true/false) in API info" >&2
+ exit 1
+ fi
+
+ PREFIX=$(echo "$PREFIX" | sed 's/ *$//' | sed 's/ */ /g')
+
+ IFS=' ' read -ra PREFIX_FIELDS <<< "$PREFIX"
+ FIELD_COUNT=0
+ for field in "${PREFIX_FIELDS[@]}"; do
+ ((FIELD_COUNT++))
+ done
+ RESOURCE_NAME="${PREFIX_FIELDS[0]}"
+
+ if [ $FIELD_COUNT -ge 2 ]; then
+ API_VERSION="${PREFIX_FIELDS[$((FIELD_COUNT - 1))]}"
+ else
+ API_VERSION=""
+ fi
+
+ if [ -z "$API_VERSION" ] || [ -z "$RESOURCE_NAME" ]; then
+ echo "Error: Unable to parse API info for resource kind '{{ kind }}'" >&2
+ exit 1
+ fi

- # Filter out empty lines for accurate count
- filtered_matches=$(echo "$matches" | grep -v '^$' | grep -v '^null$')
- if [ -z "$filtered_matches" ]; then
- count=0
+ # Build API path
+ if [[ "$API_VERSION" == "v1" ]]; then
+ API_PATH="/api/v1/${RESOURCE_NAME}"
+ else
+ API_PATH="/apis/${API_VERSION}/${RESOURCE_NAME}"
+ fi
+
+ # Process resources in chunks using API pagination
+ LIMIT=500
+ CONTINUE=""
+ ALL_MATCHES=""
+ BATCH_NUM=0
+ TOTAL_PROCESSED=0
+
+ while true; do
+ BATCH_NUM=$((BATCH_NUM + 1))
+
+ if [ -z "$CONTINUE" ]; then
+ QUERY="${API_PATH}?limit=${LIMIT}"
  else
- count=$(echo "$filtered_matches" | wc -l)
+ QUERY="${API_PATH}?limit=${LIMIT}&continue=${CONTINUE}"
+ fi
+
+ OUTPUT=$(kubectl get --raw "$QUERY" 2>&1)
+ exit_code=$?
+
+ if [ $exit_code -ne 0 ]; then
+ echo "Error for query $QUERY: $OUTPUT" >&2
+ exit $exit_code
+ fi
+
+ ITEMS_COUNT=$(echo "$OUTPUT" | jq '.items | length')
+ TOTAL_PROCESSED=$((TOTAL_PROCESSED + ITEMS_COUNT))
+
+ BATCH_MATCHES=$(echo "$OUTPUT" | jq -c -r {{ jq_expr }} 2>&1)
+ jq_exit=$?
+ if [ $jq_exit -ne 0 ]; then
+ echo "Error: jq expression failed: $BATCH_MATCHES" >&2
+ exit $jq_exit
  fi
- preview=$(echo "$filtered_matches" | head -n 10 | cut -c 1-200 | nl)

- echo "$count results"
- echo "---"
- echo "A *preview* of results is shown below (up to 10 results, up to 200 chars):"
- echo "$preview"
+ if [ -n "$BATCH_MATCHES" ]; then
+ if [ -z "$ALL_MATCHES" ]; then
+ ALL_MATCHES="$BATCH_MATCHES"
+ else
+ ALL_MATCHES="$ALL_MATCHES"$'\n'"$BATCH_MATCHES"
+ fi
+ fi
+
+ CONTINUE=$(echo "$OUTPUT" | jq -r '.metadata.continue // empty')
+ if [ -z "$CONTINUE" ]; then
+ break
+ fi
+
+ echo "Processed batch $BATCH_NUM ($TOTAL_PROCESSED items so far)..." >&2
+ done
+
+ # Now process the collected matches
+ filtered_matches=$(echo "$ALL_MATCHES" | grep -v '^$' | grep -v '^null$')
+ if [ -z "$filtered_matches" ]; then
+ count=0
+ preview=""
+ else
+ count=$(echo "$filtered_matches" | wc -l)
+ preview=$(echo "$filtered_matches" | head -n 10 | cut -c 1-200 | nl)
  fi

+ echo "$count results"
+ echo "---"
+ echo "A *preview* of results is shown below (up to 10 results, up to 200 chars):"
+ echo "$preview"
+ echo "---"
+ echo "Total items processed: $TOTAL_PROCESSED" >&2
+
  # NOTE: this is only possible for probes with a healthz endpoint - we do this to avoid giving the LLM generic
  # http GET capabilities which are more powerful than we want to expose
  #- name: "check_liveness_probe"
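
Both rewritten scripts above replace a single kubectl get ... -o json call with chunked reads of the Kubernetes list API, using a limit parameter and the metadata.continue token via kubectl get --raw. A minimal Python sketch of the same pagination pattern, assuming kubectl is on PATH and pointed at the target cluster; the helper name and the pods example below are illustrative, not part of the package:

import json
import subprocess

def list_in_chunks(api_path: str, limit: int = 500):
    """Yield items from a Kubernetes list endpoint, following continue tokens."""
    token = ""
    while True:
        query = f"{api_path}?limit={limit}"
        if token:
            query += f"&continue={token}"
        raw = subprocess.run(
            ["kubectl", "get", "--raw", query],
            capture_output=True, text=True, check=True,
        ).stdout
        page = json.loads(raw)
        yield from page.get("items", [])
        token = (page.get("metadata") or {}).get("continue") or ""
        if not token:
            break

# e.g. count pods cluster-wide without holding the full list in memory
print(sum(1 for _ in list_in_chunks("/api/v1/pods")))

This is the same trade-off the new scripts make: each batch is filtered (or counted) and then discarded, so memory stays bounded on large clusters.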

holmes/plugins/toolsets/kubernetes_logs.py
@@ -3,7 +3,8 @@ import re
  import subprocess
  from concurrent.futures import ThreadPoolExecutor, as_completed
  from datetime import datetime, timezone
- from typing import Optional, List, Tuple, Set
+ from typing import List, Optional, Set, Tuple
+
  from pydantic import BaseModel

  from holmes.common.env_vars import KUBERNETES_LOGS_TIMEOUT_SECONDS
@@ -14,16 +15,15 @@ from holmes.core.tools import (
  ToolsetTag,
  )
  from holmes.plugins.toolsets.logging_utils.logging_api import (
+ DEFAULT_TIME_SPAN_SECONDS,
  BasePodLoggingToolset,
  FetchPodLogsParams,
  LoggingCapability,
  LoggingConfig,
  PodLoggingTool,
- DEFAULT_TIME_SPAN_SECONDS,
  )
  from holmes.plugins.toolsets.utils import process_timestamps_to_int, to_unix_ms

-
  # match ISO 8601 format (YYYY-MM-DDTHH:MM:SS[.fffffffff]Z) or (YYYY-MM-DDTHH:MM:SS[.fffffffff]+/-XX:XX)
  timestamp_pattern = re.compile(
  r"^(?P<ts>\d{4}-\d{2}-\d{2}T\d{2}:\d{2}:\d{2}(?:\.\d+)?(?:Z|[+-]\d{2}:\d{2}))"
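
For reference, the ISO 8601 prefix pattern kept as context above can be exercised on its own; the log line below is invented for illustration:

import re

timestamp_pattern = re.compile(
    r"^(?P<ts>\d{4}-\d{2}-\d{2}T\d{2}:\d{2}:\d{2}(?:\.\d+)?(?:Z|[+-]\d{2}:\d{2}))"
)

line = "2024-05-01T12:34:56.789Z starting container"  # hypothetical kubectl log line
match = timestamp_pattern.match(line)
if match:
    print(match.group("ts"))  # -> 2024-05-01T12:34:56.789Z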

holmes/plugins/toolsets/logging_utils/logging_api.py
@@ -1,12 +1,12 @@
- from abc import ABC, abstractmethod
- from datetime import datetime, timedelta
  import logging
+ from abc import ABC, abstractmethod
+ from datetime import datetime, timedelta, timezone
+ from enum import Enum
  from math import ceil
  from typing import Optional, Set
- from enum import Enum

  from pydantic import BaseModel, field_validator
- from datetime import timezone
+
  from holmes.core.llm import LLM
  from holmes.core.tools import (
  StructuredToolResult,
@@ -88,9 +88,14 @@ def truncate_logs(
  llm: LLM,
  token_limit: int,
  structured_params: FetchPodLogsParams,
+ tool_call_id: str,
+ tool_name: str,
  ):
  original_token_count = count_tool_response_tokens(
- llm=llm, structured_tool_result=logging_structured_tool_result
+ llm=llm,
+ structured_tool_result=logging_structured_tool_result,
+ tool_call_id=tool_call_id,
+ tool_name=tool_name,
  )
  token_count = original_token_count
  text = None
@@ -137,7 +142,10 @@
  )
  logging_structured_tool_result.data = text
  token_count = count_tool_response_tokens(
- llm=llm, structured_tool_result=logging_structured_tool_result
+ llm=llm,
+ structured_tool_result=logging_structured_tool_result,
+ tool_call_id=tool_call_id,
+ tool_name=tool_name,
  )
  if token_count < original_token_count:
  logging.info(
@@ -266,6 +274,8 @@ If you hit the log limit and see lots of repetitive INFO logs, use exclude_filte
  llm=context.llm,
  token_limit=context.max_token_count,
  structured_params=structured_params,
+ tool_call_id=context.tool_call_id,
+ tool_name=context.tool_name,
  )

  return result

holmes/plugins/toolsets/mcp/toolset_mcp.py
@@ -1,30 +1,28 @@
+ import asyncio
  import json
+ import logging
+ import threading
+ from contextlib import asynccontextmanager
+ from enum import Enum
+ from typing import Any, Dict, List, Optional, Tuple, Union

- from holmes.common.env_vars import SSE_READ_TIMEOUT
- from holmes.core.tools import (
- ToolInvokeContext,
- Toolset,
- Tool,
- ToolParameter,
- StructuredToolResult,
- StructuredToolResultStatus,
- CallablePrerequisite,
- )
-
- from typing import Dict, Any, List, Optional
  from mcp.client.session import ClientSession
  from mcp.client.sse import sse_client
+ from mcp.client.stdio import StdioServerParameters, stdio_client
  from mcp.client.streamable_http import streamablehttp_client
-
  from mcp.types import Tool as MCP_Tool
+ from pydantic import AnyUrl, BaseModel, Field, model_validator

- import asyncio
- from contextlib import asynccontextmanager
- from pydantic import BaseModel, Field, AnyUrl, model_validator
- from typing import Tuple
- import logging
- from enum import Enum
- import threading
+ from holmes.common.env_vars import SSE_READ_TIMEOUT
+ from holmes.core.tools import (
+ CallablePrerequisite,
+ StructuredToolResult,
+ StructuredToolResultStatus,
+ Tool,
+ ToolInvokeContext,
+ ToolParameter,
+ Toolset,
+ )

  # Lock per MCP server URL to serialize calls to the same server
  _server_locks: Dict[str, threading.Lock] = {}
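
The import reshuffle above sits on top of the per-server lock registry (_server_locks) used to serialize calls to the same MCP server. The body of get_server_lock is not shown in this diff, so the sketch below is only an assumption of the usual shape of such a lock-per-key helper:

import threading
from typing import Dict

_server_locks: Dict[str, threading.Lock] = {}
_registry_guard = threading.Lock()  # hypothetical guard for the registry itself

def get_server_lock(key: str) -> threading.Lock:
    # One lock per server key: calls to the same server run one at a time,
    # while different servers can still be called in parallel.
    with _registry_guard:
        return _server_locks.setdefault(key, threading.Lock())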
@@ -42,6 +40,7 @@ def get_server_lock(url: str) -> threading.Lock:
  class MCPMode(str, Enum):
  SSE = "sse"
  STREAMABLE_HTTP = "streamable-http"
+ STDIO = "stdio"


  class MCPConfig(BaseModel):
@@ -49,14 +48,42 @@ class MCPConfig(BaseModel):
  mode: MCPMode = MCPMode.SSE
  headers: Optional[Dict[str, str]] = None

+ def get_lock_string(self) -> str:
+ return str(self.url)
+
+
+ class StdioMCPConfig(BaseModel):
+ mode: MCPMode = MCPMode.STDIO
+ command: str
+ args: Optional[List[str]] = None
+ env: Optional[Dict[str, str]] = None
+
+ def get_lock_string(self) -> str:
+ return str(self.command)
+

  @asynccontextmanager
- async def get_initialized_mcp_session(
- url: str, headers: Optional[Dict[str, str]], mode: MCPMode
- ):
- if mode == MCPMode.SSE:
+ async def get_initialized_mcp_session(toolset: "RemoteMCPToolset"):
+ if toolset._mcp_config is None:
+ raise ValueError("MCP config is not initialized")
+
+ if isinstance(toolset._mcp_config, StdioMCPConfig):
+ server_params = StdioServerParameters(
+ command=toolset._mcp_config.command,
+ args=toolset._mcp_config.args or [],
+ env=toolset._mcp_config.env,
+ )
+ async with stdio_client(server_params) as (
+ read_stream,
+ write_stream,
+ ):
+ async with ClientSession(read_stream, write_stream) as session:
+ _ = await session.initialize()
+ yield session
+ elif toolset._mcp_config.mode == MCPMode.SSE:
+ url = str(toolset._mcp_config.url)
  async with sse_client(
- url, headers=headers, sse_read_timeout=SSE_READ_TIMEOUT
+ url, toolset._mcp_config.headers, sse_read_timeout=SSE_READ_TIMEOUT
  ) as (
  read_stream,
  write_stream,
@@ -65,8 +92,9 @@ async def get_initialized_mcp_session(
  _ = await session.initialize()
  yield session
  else:
+ url = str(toolset._mcp_config.url)
  async with streamablehttp_client(
- url, headers=headers, sse_read_timeout=SSE_READ_TIMEOUT
+ url, headers=toolset._mcp_config.headers, sse_read_timeout=SSE_READ_TIMEOUT
  ) as (
  read_stream,
  write_stream,
@@ -86,7 +114,8 @@ class RemoteMCPTool(Tool):
  # Different servers can still run in parallel
  if not self.toolset._mcp_config:
  raise ValueError("MCP config not initialized")
- lock = get_server_lock(str(self.toolset._mcp_config.url))
+
+ lock = get_server_lock(str(self.toolset._mcp_config.get_lock_string()))
  with lock:
  return asyncio.run(self._invoke_async(params))
  except Exception as e:
@@ -107,7 +136,7 @@ class RemoteMCPTool(Tool):
  return False

  async def _invoke_async(self, params: Dict) -> StructuredToolResult:
- async with self.toolset.get_initialized_session() as session:
+ async with get_initialized_mcp_session(self.toolset) as session:
  tool_result = await session.call_tool(self.name, params)

  merged_text = " ".join(c.text for c in tool_result.content if c.type == "text")
@@ -153,20 +182,23 @@ class RemoteMCPTool(Tool):
  return parameters

  def get_parameterized_one_liner(self, params: Dict) -> str:
- if params:
- if params.get("cli_command"): # Return AWS MCP cli command, if available
- return f"{params.get('cli_command')}"
+ # AWS MCP cli_command
+ if params and params.get("cli_command"):
+ return f"{params.get('cli_command')}"

- url = (
- str(self.toolset._mcp_config.url) if self.toolset._mcp_config else "unknown"
- )
- return f"Call MCP Server ({url} - {self.name})"
+ # gcloud MCP run_gcloud_command
+ if self.name == "run_gcloud_command" and params and "args" in params:
+ args = params.get("args", [])
+ if isinstance(args, list):
+ return f"gcloud {' '.join(str(arg) for arg in args)}"
+
+ return f"{self.toolset.name}: {self.name} {params}"


  class RemoteMCPToolset(Toolset):
  tools: List[RemoteMCPTool] = Field(default_factory=list) # type: ignore
  icon_url: str = "https://registry.npmmirror.com/@lobehub/icons-static-png/1.46.0/files/light/mcp.png"
- _mcp_config: Optional[MCPConfig] = None
+ _mcp_config: Optional[Union[MCPConfig, StdioMCPConfig]] = None
  def model_post_init(self, __context: Any) -> None:
  self.prerequisites = [
@@ -211,23 +243,24 @@ class RemoteMCPToolset(Toolset):
  if not config:
  return (False, f"Config is required for {self.name}")

- if "mode" in config:
- mode_value = config.get("mode")
- allowed_modes = [e.value for e in MCPMode]
- if mode_value not in allowed_modes:
- return (
- False,
- f'Invalid mode "{mode_value}", allowed modes are {", ".join(allowed_modes)}',
- )
-
- self._mcp_config = MCPConfig(**config)
-
- clean_url_str = str(self._mcp_config.url).rstrip("/")
-
- if self._mcp_config.mode == MCPMode.SSE and not clean_url_str.endswith(
- "/sse"
- ):
- self._mcp_config.url = AnyUrl(clean_url_str + "/sse")
+ mode_value = config.get("mode", MCPMode.SSE.value)
+ allowed_modes = [e.value for e in MCPMode]
+ if mode_value not in allowed_modes:
+ return (
+ False,
+ f'Invalid mode "{mode_value}", allowed modes are {", ".join(allowed_modes)}',
+ )
+
+ if mode_value == MCPMode.STDIO.value:
+ self._mcp_config = StdioMCPConfig(**config)
+ else:
+ self._mcp_config = MCPConfig(**config)
+ clean_url_str = str(self._mcp_config.url).rstrip("/")
+
+ if self._mcp_config.mode == MCPMode.SSE and not clean_url_str.endswith(
+ "/sse"
+ ):
+ self._mcp_config.url = AnyUrl(clean_url_str + "/sse")

  tools_result = asyncio.run(self._get_server_tools())

@@ -242,18 +275,13 @@ class RemoteMCPToolset(Toolset):
  except Exception as e:
  return (
  False,
- f"Failed to load mcp server {self.name} {self._mcp_config.url if self._mcp_config else 'unknown'}: {str(e)}",
+ f"Failed to load mcp server {self.name}: {str(e)}",
  )

  async def _get_server_tools(self):
- async with self.get_initialized_session() as session:
+ async with get_initialized_mcp_session(self) as session:
  return await session.list_tools()

- def get_initialized_session(self):
- return get_initialized_mcp_session(
- str(self._mcp_config.url), self._mcp_config.headers, self._mcp_config.mode
- )
-
  def get_example_config(self) -> Dict[str, Any]:
  example_config = MCPConfig(
  url=AnyUrl("http://example.com:8000/mcp/messages"),
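
Taken together, the MCP hunks add a stdio transport alongside sse and streamable-http. Based on the StdioMCPConfig fields shown in the diff (command, args, env), a toolset config for the new mode would look roughly like the sketch below; the executable, arguments, and environment values are placeholders, not taken from the package:

stdio_config = {
    "mode": "stdio",
    "command": "my-mcp-server",          # hypothetical executable run as a child process
    "args": ["--log-level", "warning"],  # hypothetical flags
    "env": {"EXAMPLE_TOKEN": "..."},     # optional environment for the child process
}
# Per the prerequisites hunk above, a "stdio" mode builds StdioMCPConfig(**config),
# and the session then talks to the server over stdin/stdout instead of HTTP.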