PyPI - holmesgpt - Versions diffs - 0.13.2__py3-none-any.whl → 0.16.2a0__py3-none-any.whl - Mend

holmesgpt 0.13.2__py3-none-any.whl → 0.16.2a0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (134) hide show

holmes/__init__.py +1 -1
holmes/clients/robusta_client.py +17 -4
holmes/common/env_vars.py +40 -1
holmes/config.py +114 -144
holmes/core/conversations.py +53 -14
holmes/core/feedback.py +191 -0
holmes/core/investigation.py +18 -22
holmes/core/llm.py +489 -88
holmes/core/models.py +103 -1
holmes/core/openai_formatting.py +13 -0
holmes/core/prompt.py +1 -1
holmes/core/safeguards.py +4 -4
holmes/core/supabase_dal.py +293 -100
holmes/core/tool_calling_llm.py +423 -323
holmes/core/tools.py +311 -33
holmes/core/tools_utils/token_counting.py +14 -0
holmes/core/tools_utils/tool_context_window_limiter.py +57 -0
holmes/core/tools_utils/tool_executor.py +13 -8
holmes/core/toolset_manager.py +155 -4
holmes/core/tracing.py +6 -1
holmes/core/transformers/__init__.py +23 -0
holmes/core/transformers/base.py +62 -0
holmes/core/transformers/llm_summarize.py +174 -0
holmes/core/transformers/registry.py +122 -0
holmes/core/transformers/transformer.py +31 -0
holmes/core/truncation/compaction.py +59 -0
holmes/core/truncation/dal_truncation_utils.py +23 -0
holmes/core/truncation/input_context_window_limiter.py +218 -0
holmes/interactive.py +177 -24
holmes/main.py +7 -4
holmes/plugins/prompts/_fetch_logs.jinja2 +26 -1
holmes/plugins/prompts/_general_instructions.jinja2 +1 -2
holmes/plugins/prompts/_runbook_instructions.jinja2 +23 -12
holmes/plugins/prompts/conversation_history_compaction.jinja2 +88 -0
holmes/plugins/prompts/generic_ask.jinja2 +2 -4
holmes/plugins/prompts/generic_ask_conversation.jinja2 +2 -1
holmes/plugins/prompts/generic_ask_for_issue_conversation.jinja2 +2 -1
holmes/plugins/prompts/generic_investigation.jinja2 +2 -1
holmes/plugins/prompts/investigation_procedure.jinja2 +48 -0
holmes/plugins/prompts/kubernetes_workload_ask.jinja2 +2 -1
holmes/plugins/prompts/kubernetes_workload_chat.jinja2 +2 -1
holmes/plugins/runbooks/__init__.py +117 -18
holmes/plugins/runbooks/catalog.json +2 -0
holmes/plugins/toolsets/__init__.py +21 -8
holmes/plugins/toolsets/aks-node-health.yaml +46 -0
holmes/plugins/toolsets/aks.yaml +64 -0
holmes/plugins/toolsets/atlas_mongodb/mongodb_atlas.py +26 -36
holmes/plugins/toolsets/azure_sql/azure_sql_toolset.py +0 -1
holmes/plugins/toolsets/azure_sql/tools/analyze_connection_failures.py +10 -7
holmes/plugins/toolsets/azure_sql/tools/analyze_database_connections.py +9 -6
holmes/plugins/toolsets/azure_sql/tools/analyze_database_health_status.py +8 -6
holmes/plugins/toolsets/azure_sql/tools/analyze_database_performance.py +8 -6
holmes/plugins/toolsets/azure_sql/tools/analyze_database_storage.py +9 -6
holmes/plugins/toolsets/azure_sql/tools/get_active_alerts.py +9 -7
holmes/plugins/toolsets/azure_sql/tools/get_slow_queries.py +9 -6
holmes/plugins/toolsets/azure_sql/tools/get_top_cpu_queries.py +9 -6
holmes/plugins/toolsets/azure_sql/tools/get_top_data_io_queries.py +9 -6
holmes/plugins/toolsets/azure_sql/tools/get_top_log_io_queries.py +9 -6
holmes/plugins/toolsets/bash/bash_toolset.py +10 -13
holmes/plugins/toolsets/bash/common/bash.py +7 -7
holmes/plugins/toolsets/cilium.yaml +284 -0
holmes/plugins/toolsets/coralogix/toolset_coralogix_logs.py +5 -3
holmes/plugins/toolsets/datadog/datadog_api.py +490 -24
holmes/plugins/toolsets/datadog/datadog_logs_instructions.jinja2 +21 -10
holmes/plugins/toolsets/datadog/toolset_datadog_general.py +349 -216
holmes/plugins/toolsets/datadog/toolset_datadog_logs.py +190 -19
holmes/plugins/toolsets/datadog/toolset_datadog_metrics.py +101 -44
holmes/plugins/toolsets/datadog/toolset_datadog_rds.py +13 -16
holmes/plugins/toolsets/datadog/toolset_datadog_traces.py +25 -31
holmes/plugins/toolsets/git.py +51 -46
holmes/plugins/toolsets/grafana/common.py +15 -3
holmes/plugins/toolsets/grafana/grafana_api.py +46 -24
holmes/plugins/toolsets/grafana/grafana_tempo_api.py +454 -0
holmes/plugins/toolsets/grafana/loki/instructions.jinja2 +9 -0
holmes/plugins/toolsets/grafana/loki/toolset_grafana_loki.py +117 -0
holmes/plugins/toolsets/grafana/toolset_grafana.py +211 -91
holmes/plugins/toolsets/grafana/toolset_grafana_dashboard.jinja2 +27 -0
holmes/plugins/toolsets/grafana/toolset_grafana_tempo.jinja2 +246 -11
holmes/plugins/toolsets/grafana/toolset_grafana_tempo.py +653 -293
holmes/plugins/toolsets/grafana/trace_parser.py +1 -1
holmes/plugins/toolsets/internet/internet.py +6 -7
holmes/plugins/toolsets/internet/notion.py +5 -6
holmes/plugins/toolsets/investigator/core_investigation.py +42 -34
holmes/plugins/toolsets/kafka.py +25 -36
holmes/plugins/toolsets/kubernetes.yaml +58 -84
holmes/plugins/toolsets/kubernetes_logs.py +6 -6
holmes/plugins/toolsets/kubernetes_logs.yaml +32 -0
holmes/plugins/toolsets/logging_utils/logging_api.py +80 -4
holmes/plugins/toolsets/mcp/toolset_mcp.py +181 -55
holmes/plugins/toolsets/newrelic/__init__.py +0 -0
holmes/plugins/toolsets/newrelic/new_relic_api.py +125 -0
holmes/plugins/toolsets/newrelic/newrelic.jinja2 +41 -0
holmes/plugins/toolsets/newrelic/newrelic.py +163 -0
holmes/plugins/toolsets/opensearch/opensearch.py +10 -17
holmes/plugins/toolsets/opensearch/opensearch_logs.py +7 -7
holmes/plugins/toolsets/opensearch/opensearch_ppl_query_docs.jinja2 +1616 -0
holmes/plugins/toolsets/opensearch/opensearch_query_assist.py +78 -0
holmes/plugins/toolsets/opensearch/opensearch_query_assist_instructions.jinja2 +223 -0
holmes/plugins/toolsets/opensearch/opensearch_traces.py +13 -16
holmes/plugins/toolsets/openshift.yaml +283 -0
holmes/plugins/toolsets/prometheus/prometheus.py +915 -390
holmes/plugins/toolsets/prometheus/prometheus_instructions.jinja2 +43 -2
holmes/plugins/toolsets/prometheus/utils.py +28 -0
holmes/plugins/toolsets/rabbitmq/toolset_rabbitmq.py +9 -10
holmes/plugins/toolsets/robusta/robusta.py +236 -65
holmes/plugins/toolsets/robusta/robusta_instructions.jinja2 +26 -9
holmes/plugins/toolsets/runbook/runbook_fetcher.py +137 -26
holmes/plugins/toolsets/service_discovery.py +1 -1
holmes/plugins/toolsets/servicenow_tables/instructions.jinja2 +83 -0
holmes/plugins/toolsets/servicenow_tables/servicenow_tables.py +426 -0
holmes/plugins/toolsets/utils.py +88 -0
holmes/utils/config_utils.py +91 -0
holmes/utils/default_toolset_installation_guide.jinja2 +1 -22
holmes/utils/env.py +7 -0
holmes/utils/global_instructions.py +75 -10
holmes/utils/holmes_status.py +2 -1
holmes/utils/holmes_sync_toolsets.py +0 -2
holmes/utils/krr_utils.py +188 -0
holmes/utils/sentry_helper.py +41 -0
holmes/utils/stream.py +61 -7
holmes/version.py +34 -14
holmesgpt-0.16.2a0.dist-info/LICENSE +178 -0
{holmesgpt-0.13.2.dist-info → holmesgpt-0.16.2a0.dist-info}/METADATA +29 -27
{holmesgpt-0.13.2.dist-info → holmesgpt-0.16.2a0.dist-info}/RECORD +126 -102
holmes/core/performance_timing.py +0 -72
holmes/plugins/toolsets/grafana/tempo_api.py +0 -124
holmes/plugins/toolsets/grafana/toolset_grafana_loki.py +0 -110
holmes/plugins/toolsets/newrelic.py +0 -231
holmes/plugins/toolsets/servicenow/install.md +0 -37
holmes/plugins/toolsets/servicenow/instructions.jinja2 +0 -3
holmes/plugins/toolsets/servicenow/servicenow.py +0 -219
holmesgpt-0.13.2.dist-info/LICENSE.txt +0 -21
{holmesgpt-0.13.2.dist-info → holmesgpt-0.16.2a0.dist-info}/WHEEL +0 -0
{holmesgpt-0.13.2.dist-info → holmesgpt-0.16.2a0.dist-info}/entry_points.txt +0 -0

holmes/plugins/toolsets/openshift.yaml ADDED Viewed

@@ -0,0 +1,283 @@
+toolsets:
+  openshift/core:
+    description: "Read access to OpenShift cluster resources including projects, routes, and deployment configs"
+    docs_url: "https://holmesgpt.dev/data-sources/builtin-toolsets/openshift/"
+    tags:
+      - core
+    prerequisites:
+      - command: "oc version --client"
+    # Note: Several tools in this toolset (oc_describe, oc_get_by_kind_in_namespace,
+    # oc_get_by_kind_in_cluster, openshift_jq_query) use transformers with llm_summarize
+    # to automatically summarize large oc outputs when a fast model is configured.
+    # This reduces context window usage while preserving key information for debugging.
+    tools:
+      - name: "oc_describe"
+        description: >
+          Run oc describe <kind> <name> -n <namespace>,
+          call this when users ask for description,
+          for example when a user asks
+            - 'describe pod xyz-123'
+            - 'show service xyz-123 in namespace my-ns'
+            - 'describe route my-route'
+            - 'show deployment config xyz'
+        command: "oc describe {{ kind }} {{ name }}{% if namespace %} -n {{ namespace }}{% endif %}"
+        transformers:
+          - name: llm_summarize
+            config:
+              input_threshold: 1000
+              prompt: |
+                Summarize this oc describe output focusing on:
+                - What needs attention or immediate action
+                - Resource status and health indicators
+                - Any errors, warnings, or non-standard states
+                - Key configuration details that could affect functionality
+                - OpenShift-specific features like routes, image streams, or security context constraints
+                - When possible, mention exact field names so the user can grep for specific details
+                - Be concise: aim for ≤ 50% of the original length; avoid repeating defaults/healthy/unchanged details
+                - Prefer aggregates and counts; list only outliers and actionable items
+                - Keep grep-friendly: include exact field names/values that matter
+      - name: "oc_get_by_name"
+        description: "Run `oc get <kind> <name> --show-labels`"
+        command: "oc get --show-labels -o wide {{ kind }} {{ name }}{% if namespace %} -n {{ namespace }}{% endif %}"
+      - name: "oc_get_by_kind_in_namespace"
+        description: "Run `oc get <kind> -n <namespace> --show-labels` to get all resources of a given type in namespace"
+        command: "oc get --show-labels -o wide {{ kind }} -n {{ namespace }}"
+        transformers:
+          - name: llm_summarize
+            config:
+              input_threshold: 1000
+              prompt: |
+                Summarize this oc output focusing on:
+                - What needs attention or immediate action
+                - Group similar resources into aggregate descriptions
+                - Make sure to mention outliers, errors, and non-standard states
+                - List healthy resources as aggregate descriptions
+                - When listing unhealthy resources, also try to use aggregate descriptions when possible
+                - When possible, mention exact keywords so the user can rerun the command with | grep <keyword> and drill down
+                - Be concise and avoid expansion: target ≤ 50% of input size; prefer counts + outliers over full listings
+      - name: "oc_get_by_kind_in_cluster"
+        description: "Run `oc get -A <kind> --show-labels` to get all resources of a given type in the cluster"
+        command: "oc get -A --show-labels -o wide {{ kind }}"
+        transformers:
+          - name: llm_summarize
+            config:
+              input_threshold: 1000
+              prompt: |
+                Summarize this oc output focusing on:
+                - What needs attention or immediate action
+                - Group similar resources into a single line and description
+                - Make sure to mention outliers, errors, and non-standard states
+                - List healthy resources as aggregate descriptions
+                - When listing unhealthy resources, also try to use aggregate descriptions when possible
+                - When possible, mention exact keywords so the user can rerun the command with | grep <keyword> and drill down on the parts they care about
+                - Strive for ≤ 50% of the original size; keep results compact and grep-friendly (one line per aggregate)
+      - name: "oc_find_resource"
+        description: "Run `oc get {{ kind }} -A --show-labels | grep {{ keyword }}` to find a resource where you know a substring of the name, IP, namespace, or labels"
+        command: "oc get -A --show-labels -o wide {{ kind }} | grep {{ keyword }}"
+      - name: "oc_get_yaml"
+        description: "Run `oc get -o yaml` on a single OpenShift resource"
+        command: "oc get -o yaml {{ kind }} {{ name }}{% if namespace %} -n {{ namespace }}{% endif %}"
+      - name: "oc_events"
+        description: "Retrieve the events for a specific OpenShift resource. `resource_type` can be any kubernetes resource type: 'pod', 'service', 'deployment', 'deploymentconfig', 'route', etc."
+        command: "oc get events --field-selector involvedObject.kind={{ resource_type }},involvedObject.name={{ resource_name }}{% if namespace %} -n {{ namespace }}{% endif %}"
+      - name: "oc_projects"
+        description: "List all projects (namespaces) in the OpenShift cluster"
+        command: "oc get projects"
+      - name: "oc_project_current"
+        description: "Show the current project (namespace) context"
+        command: "oc project"
+      - name: "oc_routes"
+        description: "List all routes in a specific namespace or cluster-wide"
+        command: "oc get routes{% if namespace %} -n {{ namespace }}{% else %} -A{% endif %} -o wide"
+      - name: "oc_route_describe"
+        description: "Describe a specific route to see its configuration and status"
+        command: "oc describe route {{ route_name }}{% if namespace %} -n {{ namespace }}{% endif %}"
+      - name: "oc_imagestreams"
+        description: "List image streams in a namespace or cluster-wide"
+        command: "oc get imagestreams{% if namespace %} -n {{ namespace }}{% else %} -A{% endif %} -o wide"
+      - name: "oc_deploymentconfigs"
+        description: "List deployment configs in a namespace or cluster-wide"
+        command: "oc get deploymentconfigs{% if namespace %} -n {{ namespace }}{% else %} -A{% endif %} -o wide"
+      - name: "oc_buildconfigs"
+        description: "List build configs in a namespace or cluster-wide"
+        command: "oc get buildconfigs{% if namespace %} -n {{ namespace }}{% else %} -A{% endif %} -o wide"
+      - name: "oc_builds"
+        description: "List builds in a namespace or cluster-wide"
+        command: "oc get builds{% if namespace %} -n {{ namespace }}{% else %} -A{% endif %} -o wide"
+      - name: "oc_adm_openshift_audit_logs"
+        description: "Get OpenShift audit logs from a specified node"
+        command: "oc adm node-logs {{ node_name }} --path=openshift-apiserver/audit.log"
+      - name: "oc_adm_openshift_audit_logs_with_filter"
+        description: "Get OpenShift audit logs from a specified node with an applied filter"
+        command: "oc adm node-logs {{ node_name }} --path=openshift-apiserver/audit.log | grep {{ grep_filter }}"
+      - name: "oc_build_logs"
+        description: "Get logs from a specific build"
+        command: "oc logs build/{{ build_name }}{% if namespace %} -n {{ namespace }}{% endif %}"
+      # The jq query is always cluster-wide (--all-namespaces); the command takes no namespace parameter.
+      - name: "openshift_jq_query"
+        user_description: "Query OpenShift Resources: oc get {{kind}} --all-namespaces -o json | jq -r {{jq_expr}}"
+        description: >
+          Use oc to get json for all resources of a specific kind pipe the results to jq to filter them. Do not worry about escaping the jq_expr it will be done by the system on an unescaped expression that you give. e.g. give an expression like .items[] | .spec.containers[].image | select(test("^registry.redhat.io/") | not)
+        command: oc get {{ kind }} --all-namespaces -o json | jq -r {{ jq_expr }}
+        transformers:
+          - name: llm_summarize
+            config:
+              input_threshold: 1000
+              prompt: |
+                Summarize this jq query output focusing on:
+                - Key patterns and commonalities in the data
+                - Notable outliers, anomalies, or items that need attention
+                - Group similar results into aggregate descriptions when possible
+                - Highlight any empty results, null values, or missing data
+                - When applicable, mention specific resource names, namespaces, or values that stand out
+                - Organize findings in a structured way that helps with troubleshooting
+                - Be concise: aim for ≤ 50% of the original text; prioritize aggregates and actionable outliers
+                - Include grep-ready keys/values; avoid repeating entire objects or unchanged defaults
+  openshift/logs:
+    description: "Read pod logs using oc command"
+    docs_url: "https://holmesgpt.dev/data-sources/builtin-toolsets/openshift/"
+    tags:
+      - core
+    prerequisites:
+      - command: "oc version --client"
+    # Note: oc_logs and oc_logs_all_containers use transformers with llm_summarize
+    # to automatically summarize large log outputs when a fast model is configured.
+    # This helps focus on errors, patterns, and key information while reducing context usage.
+    # The --previous, single-container, and grep variants return their output unsummarized.
+    tools:
+      - name: "oc_previous_logs"
+        description: "Run `oc logs --previous` on a single pod. Used to fetch logs for a pod that crashed and see logs from before the crash. Never give a deployment name or a resource that is not a pod."
+        command: "oc logs {{pod_name}} -n {{ namespace }} --previous"
+      - name: "oc_previous_logs_all_containers"
+        description: "Run `oc logs --previous --all-containers` on a single pod. Used to fetch logs from all containers of a pod that crashed and see logs from before the crash."
+        command: "oc logs {{pod_name}} -n {{ namespace }} --previous --all-containers"
+      - name: "oc_container_previous_logs"
+        description: "Run `oc logs --previous` on a single container of a pod. Used to fetch logs for a pod that crashed and see logs from before the crash."
+        command: "oc logs {{pod_name}} -c {{container_name}} -n {{ namespace }} --previous"
+      - name: "oc_logs"
+        description: "Run `oc logs` on a single pod. Never give a deployment name or a resource that is not a pod."
+        command: "oc logs {{pod_name}} -n {{ namespace }}"
+        transformers:
+          - name: llm_summarize
+            config:
+              input_threshold: 1000
+              prompt: |
+                Summarize these pod logs focusing on:
+                - Errors, exceptions, and warning messages
+                - Recent activity patterns and trends
+                - Any authentication, connection, or startup issues
+                - Performance indicators (response times, throughput)
+                - Group similar log entries together
+                - When possible, mention exact error codes or keywords for easier searching
+                - Be concise: aim for ≤ 50% of the original text; prioritize aggregates and actionable outliers
+                - Include grep-ready keys/values; avoid repeating entire logs or unchanged defaults
+      - name: "oc_logs_all_containers"
+        description: "Run `oc logs` on all containers within a single pod."
+        command: "oc logs {{pod_name}} -n {{ namespace }} --all-containers"
+        transformers:
+          - name: llm_summarize
+            config:
+              input_threshold: 1000
+              prompt: |
+                Summarize these multi-container pod logs focusing on:
+                - Errors, exceptions, and warning messages by container
+                - Inter-container communication patterns
+                - Any authentication, connection, or startup issues
+                - Performance indicators and resource usage patterns
+                - Group similar log entries together by container
+                - When possible, mention exact error codes or keywords for easier searching
+                - Strive for ≤ 50% of the original size; keep results compact and grep-friendly (one line per aggregate)
+                - Prioritize aggregates and actionable outliers over comprehensive details
+      - name: "oc_container_logs"
+        description: "Run `oc logs` on a single container within a pod. This is to get the logs of a specific container in a multi-container pod."
+        command: "oc logs {{pod_name}} -c {{container_name}} -n {{ namespace }}"
+      - name: "oc_logs_grep"
+        description: "Search for a specific term in the logs of a single pod. Only provide a pod name, not a deployment or other resource."
+        command: "oc logs {{ pod_name }} -n {{ namespace }} | grep {{ search_term }}"
+      - name: "oc_logs_all_containers_grep"
+        description: "Search for a specific term in the logs of a single pod across all of its containers. Only provide a pod name, not a deployment or other resource."
+        command: "oc logs {{pod_name}} -n {{ namespace }} --all-containers | grep {{ search_term }}"
+  # Toolset exposing point-in-time CPU/memory usage via `oc adm top`.
+  openshift/live-metrics:
+    description: "Provides real-time metrics for pods and nodes using oc"
+    docs_url: "https://holmesgpt.dev/data-sources/builtin-toolsets/openshift/"
+    # These instructions tell the model that both tools return a current snapshot only,
+    # so they must not be used as a data source for graphs.
+    llm_instructions: |
+      The oc_top_pods or oc_top_nodes do not return time series data or metrics that can be used for graphs
+      Do NOT use oc_top_pods or oc_top_nodes for graph generation - it only shows current snapshot data
+      oc_top_pods or oc_top_nodes are for current status checks, not historical graphs
+    tags:
+      - core
+    prerequisites:
+      # The prerequisite runs a real `oc adm top nodes` query rather than `oc version --client`.
+      # NOTE(review): presumably this keeps the toolset disabled when cluster metrics are unavailable - confirm.
+      - command: "oc adm top nodes"
+    tools:
+      # Neither command template takes parameters; oc_top_pods covers all namespaces (-A).
+      - name: "oc_top_pods"
+        description: "Retrieves real-time CPU and memory usage for each pod in the cluster."
+        command: >
+          oc adm top pods -A
+      - name: "oc_top_nodes"
+        description: "Retrieves real-time CPU and memory usage for each node in the cluster."
+        command: >
+          oc adm top nodes
+  # Read-only views of OpenShift security objects: SCCs, RBAC bindings, service accounts,
+  # and access-review queries.
+  openshift/security:
+    description: "OpenShift security-related resources and configurations"
+    docs_url: "https://holmesgpt.dev/data-sources/builtin-toolsets/openshift/"
+    tags:
+      - core
+    prerequisites:
+      - command: "oc version --client"
+    tools:
+      # scc_name is optional here: without it every SCC is listed.
+      - name: "oc_scc"
+        description: "List Security Context Constraints (SCCs) in the cluster"
+        command: "oc get scc{% if scc_name %} {{ scc_name }}{% endif %} -o wide"
+      - name: "oc_scc_describe"
+        description: "Describe a specific Security Context Constraint"
+        command: "oc describe scc {{ scc_name }}"
+      - name: "oc_policy_who_can"
+        description: "Check who can perform a specific action on a resource"
+        command: "oc policy who-can {{ verb }} {{ resource }}{% if namespace %} -n {{ namespace }}{% endif %}"
+      # The tool name is kept for compatibility, but the command uses `oc auth can-i`
+      # (inherited from kubectl) instead of the legacy `oc policy can-i` spelling.
+      - name: "oc_policy_can_i"
+        description: "Check if the current user can perform a specific action"
+        command: "oc auth can-i {{ verb }} {{ resource }}{% if namespace %} -n {{ namespace }}{% endif %}"
+      - name: "oc_serviceaccounts"
+        description: "List service accounts in a namespace or cluster-wide"
+        command: "oc get serviceaccounts{% if namespace %} -n {{ namespace }}{% else %} -A{% endif %} -o wide"
+      - name: "oc_rolebindings"
+        description: "List role bindings in a namespace or cluster-wide"
+        command: "oc get rolebindings{% if namespace %} -n {{ namespace }}{% else %} -A{% endif %} -o wide"
+      - name: "oc_clusterrolebindings"
+        description: "List cluster role bindings"
+        command: "oc get clusterrolebindings -o wide"

holmesgpt 0.13.2__py3-none-any.whl → 0.16.2a0__py3-none-any.whl

holmesgpt 0.13.2__py3-none-any.whl → 0.16.2a0__py3-none-any.whl