PyPI - holmesgpt - Versions diffs - 0.14.1__py3-none-any.whl → 0.14.2__py3-none-any.whl - Mend

holmesgpt 0.14.1__py3-none-any.whl → 0.14.2__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of holmesgpt might be problematic. Click here for more details.

Files changed (10) hide show

holmes/__init__.py CHANGED Viewed

@@ -1,5 +1,5 @@
 # This is patched by github actions during release
-__version__ = "0.14.1"
+__version__ = "0.14.2"
 # Re-export version functions from version module for backward compatibility
 from .version import (

holmes/common/env_vars.py CHANGED Viewed

@@ -73,11 +73,11 @@ LOG_LLM_USAGE_RESPONSE = load_bool("LOG_LLM_USAGE_RESPONSE", False)
 # For CLI only, enable user approval for potentially sensitive commands that would otherwise be rejected
 ENABLE_CLI_TOOL_APPROVAL = load_bool("ENABLE_CLI_TOOL_APPROVAL", True)
-MAX_GRAPH_POINTS = float(os.environ.get("MAX_GRAPH_POINTS", 200))
+MAX_GRAPH_POINTS = float(os.environ.get("MAX_GRAPH_POINTS", 100))
 # Limit each tool response to N% of the total context window.
 # Number between 0 and 100
 # Setting to either 0 or any number above 100 disables the logic that limits tool response size
 TOOL_MAX_ALLOCATED_CONTEXT_WINDOW_PCT = float(
-    os.environ.get("TOOL_MAX_ALLOCATED_CONTEXT_WINDOW_PCT", 10)
+    os.environ.get("TOOL_MAX_ALLOCATED_CONTEXT_WINDOW_PCT", 15)
 )

holmes/plugins/toolsets/grafana/toolset_grafana_tempo.py CHANGED Viewed

@@ -242,9 +242,9 @@ Examples:
             import logging
             logger = logging.getLogger(__name__)
-            logger.info(f"Tempo query: {stats_query}")
+            logger.debug(f"Tempo query: {stats_query}")
-            logger.info(f"start: {start}, end: {end}")
+            logger.debug(f"start: {start}, end: {end}")
             all_traces_response = api.search_traces_by_query(
                 q=stats_query,
@@ -253,7 +253,7 @@ Examples:
                 limit=1000,
             )
-            logger.info(f"Response: {all_traces_response}")
+            logger.debug(f"Response: {all_traces_response}")
             traces = all_traces_response.get("traces", [])
             if not traces:

holmes/plugins/toolsets/prometheus/prometheus.py CHANGED Viewed

@@ -43,14 +43,12 @@ PROMETHEUS_METADATA_API_LIMIT = 100  # Default limit for Prometheus metadata API
 DEFAULT_QUERY_TIMEOUT_SECONDS = 20
 MAX_QUERY_TIMEOUT_SECONDS = 180
 # Default character limit for query responses to prevent token limit issues
-DEFAULT_QUERY_RESPONSE_SIZE_LIMIT = 20000
+DEFAULT_QUERY_RESPONSE_SIZE_LIMIT = 30000
 # Default timeout for metadata API calls (discovery endpoints)
 DEFAULT_METADATA_TIMEOUT_SECONDS = 20
 MAX_METADATA_TIMEOUT_SECONDS = 60
 # Default time window for metadata APIs (in hours)
 DEFAULT_METADATA_TIME_WINDOW_HRS = 1
-# Sample size for data summaries when results are too large
-DATA_SUMMARY_SAMPLE_SIZE = 10
 class PrometheusConfig(BaseModel):

holmes/plugins/toolsets/prometheus/prometheus_instructions.jinja2 CHANGED Viewed

@@ -6,11 +6,20 @@
 * Combine multiple patterns with regex OR (|) to reduce API calls:
   - `{__name__=~"node_cpu.*|node_memory.*|node_disk.*"}` - get all node resource metrics in one call
   - `{__name__=~"container.*|pod.*|kube.*"}` - get all Kubernetes-related metrics
-  - `{namespace=~"default|kube-system|monitoring"}` - metrics from multiple namespaces
+  - `{namespace=~"example1|example2|example3"}` - metrics from multiple namespaces
 * Use `get_metric_metadata` after discovering names to get types/descriptions if needed
 * Use `get_label_values` to discover pods, namespaces, jobs: e.g., get_label_values(label="pod")
 * Only use `get_series` when you need full label sets (slower than other methods)
+## Retrying queries that return too much data
+* When a Prometheus query returns too much data (e.g., truncation error), you MUST retry with a more specific query or fewer data points or topk/bottomk
+* NEVER EVER EVER answer a question based on Prometheus data that was truncated as you might be missing important information and give the totally wrong answer
+* Prefer telling the user you can't answer the question because of too much data rather than answering based on incomplete data
+* You are also able to show graphs to the user (using the promql embed functionality mentioned below) so you can show users graphs and THEY can interpret the data themselves, even if you can't answer.
+* Do NOT hesitate to try alternative queries and try to reduce the amount of data returned until you get a successful query
+* Be extremely, extremely cautious when answering based on get_label_values because the existence of a label value says NOTHING about the metric value itself (is it high, low, or perhaps the label exists in Prometheus but it's an older series not present right now)
+* DO NOT give answers about metrics based on what 'is typically the case' or 'common knowledge' - if you can't see the actual metric value, you MUST NEVER EVER answer about it - just tell the user your limitations due to the size of the data
 ## Alert Investigation & Query Execution
 * When investigating a Prometheus alert, ALWAYS call list_prometheus_rules to get the alert definition
 * Use Prometheus to query metrics from the alert promql
@@ -37,24 +46,19 @@
 * ALWAYS use `topk()` or `bottomk()` to limit the number of series returned
 * Standard pattern for high-cardinality queries:
   - Use `topk(5, <your_query>)` to get the top 5 series
-  - Example: `topk(5, rate(container_cpu_usage_seconds_total{namespace="default"}[5m]))`
+  - Example: `topk(5, rate(container_cpu_usage_seconds_total{namespace="example"}[5m]))`
   - This prevents context overflow and focuses on the most relevant data
 * To also capture the aggregate of remaining series as "other":
   ```
-  topk(5, rate(container_cpu_usage_seconds_total{namespace="default"}[5m]))
-  or
-  label_replace(
-    (sum(rate(container_cpu_usage_seconds_total{namespace="default"}[5m])) - sum(topk(5, rate(container_cpu_usage_seconds_total{namespace="default"}[5m])))),
-    "pod", "other", "", ""
-  )
+  topk(5, rate(container_cpu_usage_seconds_total{namespace="example"}[5m])) or label_replace((sum(rate(container_cpu_usage_seconds_total{namespace="example"}[5m])) - sum(topk(5, rate(container_cpu_usage_seconds_total{namespace="example"}[5m])))), "pod", "other", "", "")
   ```
 * Common high-cardinality scenarios requiring topk():
   - Pod-level metrics in namespaces with many pods
   - Container-level CPU/memory metrics
   - HTTP metrics with many endpoints or status codes
   - Any query returning more than 10 time series
-* For initial exploration, use instant queries with `count()` to check cardinality:
-  - Example: `count(count by (pod) (container_cpu_usage_seconds_total{namespace="default"}))`
+* For initial exploration, you may use instant queries with `count()` to check cardinality:
+  - Example: `count(count by (pod) (container_cpu_usage_seconds_total{namespace="example"}))`
   - If count > 10, use topk() in your range query
 * When doing queries, always extend the time range, to 15 min before and after the alert start time
 * ALWAYS embed the execution results into your answer

{holmesgpt-0.14.1.dist-info → holmesgpt-0.14.2.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.1
 Name: holmesgpt
-Version: 0.14.1
+Version: 0.14.2
 Summary:
 Author: Natan Yellin
 Author-email: natan@robusta.dev

{holmesgpt-0.14.1.dist-info → holmesgpt-0.14.2.dist-info}/RECORD RENAMED Viewed

@@ -1,7 +1,7 @@
 holmes/.git_archival.json,sha256=PbwdO7rNhEJ4ALiO12DPPb81xNAIsVxCA0m8OrVoqsk,182
-holmes/__init__.py,sha256=jTatz8d7goRhTZfG4-8-aLMSIe0Pi2sDQJ5wtjRWGcg,257
+holmes/__init__.py,sha256=aObdUvtSLEMRLcbzR1BLUnoN1nK0-PV8tAXzjOfEEh8,257
 holmes/clients/robusta_client.py,sha256=rWst1PANJaIsprp3jZ7RV5UpttM_YLBGQ8B5noZqvgg,1532
-holmes/common/env_vars.py,sha256=y61QXRmu80iAtUU7cp30wjCrs_rwHNRS-kZaSyuzJcI,3312
+holmes/common/env_vars.py,sha256=3CKyDmPtEAfYFxWC5wEDq5ppn94BhzDbJA3k9Vtd_WU,3312
 holmes/common/openshift.py,sha256=akbQ0GpnmuzXOqTcotpTDQSDKIROypS9mgPOprUgkCw,407
 holmes/config.py,sha256=yu0kQox7tfeKc4kJLESH-eGa6w1-nNC9kxAOtHf_qhQ,21781
 holmes/core/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
@@ -172,7 +172,7 @@ holmes/plugins/toolsets/grafana/loki_api.py,sha256=f7oTzfhJ1LojsPoAfsKt32ADWffLE
 holmes/plugins/toolsets/grafana/toolset_grafana.py,sha256=_A3DUOyd2624I75BknsZhHpK1mzcf7JfACL7_ET6sPM,4922
 holmes/plugins/toolsets/grafana/toolset_grafana_loki.py,sha256=MK0mK5h8MZuULwAoQlng3UZS1xtxHzePwhEoJiroJSw,3912
 holmes/plugins/toolsets/grafana/toolset_grafana_tempo.jinja2,sha256=0HBYUXkGYWZbHwIvfQEF5oL9LFMYzjgcmL1U6RjgPSE,10417
-holmes/plugins/toolsets/grafana/toolset_grafana_tempo.py,sha256=5lmWIVc8c4iSGwpvhhhxGPe5-LtpGMzprSdR8GmiuxQ,38416
+holmes/plugins/toolsets/grafana/toolset_grafana_tempo.py,sha256=4q9FCHZ2kuI4Kng_JOWipkHIUyfkH2zT5zSywnFie18,38419
 holmes/plugins/toolsets/grafana/trace_parser.py,sha256=8PjqPGDGo9uB2Z8WWWknMKdhcqlqZEVncQCCkl2F06A,7024
 holmes/plugins/toolsets/helm.yaml,sha256=-IPDChKMHcxGbzA0z9GKczRshL-mD24cHpBizfNM1jM,1604
 holmes/plugins/toolsets/internet/internet.py,sha256=cQi8R2rcttIZ49egSzi2y2UVt4tncqE8medxiXp8II8,7779
@@ -196,8 +196,8 @@ holmes/plugins/toolsets/opensearch/opensearch_logs.py,sha256=_j-JAhLWtxhBPafCvey
 holmes/plugins/toolsets/opensearch/opensearch_traces.py,sha256=FjDbkU-oI-spMdra0raSmiHZb6Cfbo_AsS_OKEt9coI,8876
 holmes/plugins/toolsets/opensearch/opensearch_traces_instructions.jinja2,sha256=Xn8AW4XCMYV1VkBbF8nNB9fUpKQ1Vbm88iFczj-LQXo,1035
 holmes/plugins/toolsets/opensearch/opensearch_utils.py,sha256=mh9Wp22tOdJYmA9IaFS7tD3aEENljyeuPOsF-lEe5C0,5097
-holmes/plugins/toolsets/prometheus/prometheus.py,sha256=_13bVlcxVu0ezcZdyyauFIKPtp-ADLwSIOSXTy3dTag,65922
-holmes/plugins/toolsets/prometheus/prometheus_instructions.jinja2,sha256=ssokrP2TNMttRc4oH89BY3cHkTHNHrOUAi4rYcxuMak,5075
+holmes/plugins/toolsets/prometheus/prometheus.py,sha256=H5sdiwk2nAWrnD23wR-8nkTuRLBOhrCZXc51EOgDqIQ,65832
+holmes/plugins/toolsets/prometheus/prometheus_instructions.jinja2,sha256=taf5C-N9rdp1A7S__hETefcm2OaYHJLjs1ZbuqIsGtE,6383
 holmes/plugins/toolsets/prometheus/utils.py,sha256=ZenD354dP0sRmm0R-QBuAq1jyn40GjYf4wx15bXIYRc,775
 holmes/plugins/toolsets/rabbitmq/api.py,sha256=-BtqF7hQWtl_OamnQ521vYHhR8E2n2wcPNYxfI9r4kQ,14307
 holmes/plugins/toolsets/rabbitmq/rabbitmq_instructions.jinja2,sha256=qetmtJUMkx9LIihr2fSJ2EV9h2J-b-ZdUAvMtopXZYY,3105
@@ -237,8 +237,8 @@ holmes/utils/sentry_helper.py,sha256=_IbxqlqbsNb_ncvpZ-B5XxcauQphJStcwaVxRj18RpU
 holmes/utils/stream.py,sha256=L4vlu1xX5Ihtn-D0Mfml_HuQRfLhHFSkWNojcAJLi9g,3252
 holmes/utils/tags.py,sha256=SU4EZMBtLlIb7OlHsSpguFaypczRzOcuHYxDSanV3sQ,3364
 holmes/version.py,sha256=uDRPOvVaHreROj_9HPe81RVpTzHcG8ojpGTsnJIlQOM,5220
-holmesgpt-0.14.1.dist-info/LICENSE.txt,sha256=RdZMj8VXRQdVslr6PMYMbAEu5pOjOdjDqt3yAmWb9Ds,1072
-holmesgpt-0.14.1.dist-info/METADATA,sha256=vm-GB1-srkFxyYzIbo73gxxamIN5nfkQaaHJ7lNYYuE,16184
-holmesgpt-0.14.1.dist-info/WHEEL,sha256=kLuE8m1WYU0Ig0_YEGrXyTtiJvKPpLpDEiChiNyei5Y,88
-holmesgpt-0.14.1.dist-info/entry_points.txt,sha256=JdzEyZhpaYr7Boo4uy4UZgzY1VsAEbzMgGmHZtx9KFY,42
-holmesgpt-0.14.1.dist-info/RECORD,,
+holmesgpt-0.14.2.dist-info/LICENSE.txt,sha256=RdZMj8VXRQdVslr6PMYMbAEu5pOjOdjDqt3yAmWb9Ds,1072
+holmesgpt-0.14.2.dist-info/METADATA,sha256=_-DXRD2oFoAqxL5uMxMeds-RItenYjrE2aRKnmV0DHQ,16184
+holmesgpt-0.14.2.dist-info/WHEEL,sha256=kLuE8m1WYU0Ig0_YEGrXyTtiJvKPpLpDEiChiNyei5Y,88
+holmesgpt-0.14.2.dist-info/entry_points.txt,sha256=JdzEyZhpaYr7Boo4uy4UZgzY1VsAEbzMgGmHZtx9KFY,42
+holmesgpt-0.14.2.dist-info/RECORD,,

{holmesgpt-0.14.1.dist-info → holmesgpt-0.14.2.dist-info}/LICENSE.txt RENAMED Viewed

File without changes

{holmesgpt-0.14.1.dist-info → holmesgpt-0.14.2.dist-info}/WHEEL RENAMED Viewed

File without changes

{holmesgpt-0.14.1.dist-info → holmesgpt-0.14.2.dist-info}/entry_points.txt RENAMED Viewed

File without changes

holmesgpt 0.14.1__py3-none-any.whl → 0.14.2__py3-none-any.whl

Potentially problematic release.

holmesgpt 0.14.1__py3-none-any.whl → 0.14.2__py3-none-any.whl