holmesgpt 0.13.2__py3-none-any.whl → 0.18.4__py3-none-any.whl
This diff compares publicly available package versions released to one of the supported registries. It is provided for informational purposes only and reflects the changes between the versions as they appear in their respective public registries.
- holmes/__init__.py +3 -5
- holmes/clients/robusta_client.py +20 -6
- holmes/common/env_vars.py +58 -3
- holmes/common/openshift.py +1 -1
- holmes/config.py +123 -148
- holmes/core/conversations.py +71 -15
- holmes/core/feedback.py +191 -0
- holmes/core/investigation.py +31 -39
- holmes/core/investigation_structured_output.py +3 -3
- holmes/core/issue.py +1 -1
- holmes/core/llm.py +508 -88
- holmes/core/models.py +108 -4
- holmes/core/openai_formatting.py +14 -1
- holmes/core/prompt.py +48 -3
- holmes/core/runbooks.py +1 -0
- holmes/core/safeguards.py +8 -6
- holmes/core/supabase_dal.py +295 -100
- holmes/core/tool_calling_llm.py +489 -428
- holmes/core/tools.py +325 -56
- holmes/core/tools_utils/token_counting.py +21 -0
- holmes/core/tools_utils/tool_context_window_limiter.py +40 -0
- holmes/core/tools_utils/tool_executor.py +0 -13
- holmes/core/tools_utils/toolset_utils.py +1 -0
- holmes/core/toolset_manager.py +191 -5
- holmes/core/tracing.py +19 -3
- holmes/core/transformers/__init__.py +23 -0
- holmes/core/transformers/base.py +63 -0
- holmes/core/transformers/llm_summarize.py +175 -0
- holmes/core/transformers/registry.py +123 -0
- holmes/core/transformers/transformer.py +32 -0
- holmes/core/truncation/compaction.py +94 -0
- holmes/core/truncation/dal_truncation_utils.py +23 -0
- holmes/core/truncation/input_context_window_limiter.py +219 -0
- holmes/interactive.py +228 -31
- holmes/main.py +23 -40
- holmes/plugins/interfaces.py +2 -1
- holmes/plugins/prompts/__init__.py +2 -1
- holmes/plugins/prompts/_fetch_logs.jinja2 +31 -6
- holmes/plugins/prompts/_general_instructions.jinja2 +1 -2
- holmes/plugins/prompts/_runbook_instructions.jinja2 +24 -12
- holmes/plugins/prompts/base_user_prompt.jinja2 +7 -0
- holmes/plugins/prompts/conversation_history_compaction.jinja2 +89 -0
- holmes/plugins/prompts/generic_ask.jinja2 +0 -4
- holmes/plugins/prompts/generic_ask_conversation.jinja2 +0 -1
- holmes/plugins/prompts/generic_ask_for_issue_conversation.jinja2 +0 -1
- holmes/plugins/prompts/generic_investigation.jinja2 +0 -1
- holmes/plugins/prompts/investigation_procedure.jinja2 +50 -1
- holmes/plugins/prompts/kubernetes_workload_ask.jinja2 +0 -1
- holmes/plugins/prompts/kubernetes_workload_chat.jinja2 +0 -1
- holmes/plugins/runbooks/__init__.py +145 -17
- holmes/plugins/runbooks/catalog.json +2 -0
- holmes/plugins/sources/github/__init__.py +4 -2
- holmes/plugins/sources/prometheus/models.py +1 -0
- holmes/plugins/toolsets/__init__.py +44 -27
- holmes/plugins/toolsets/aks-node-health.yaml +46 -0
- holmes/plugins/toolsets/aks.yaml +64 -0
- holmes/plugins/toolsets/atlas_mongodb/mongodb_atlas.py +38 -47
- holmes/plugins/toolsets/azure_sql/apis/alert_monitoring_api.py +3 -2
- holmes/plugins/toolsets/azure_sql/apis/azure_sql_api.py +2 -1
- holmes/plugins/toolsets/azure_sql/apis/connection_failure_api.py +3 -2
- holmes/plugins/toolsets/azure_sql/apis/connection_monitoring_api.py +3 -1
- holmes/plugins/toolsets/azure_sql/apis/storage_analysis_api.py +3 -1
- holmes/plugins/toolsets/azure_sql/azure_sql_toolset.py +12 -13
- holmes/plugins/toolsets/azure_sql/tools/analyze_connection_failures.py +15 -12
- holmes/plugins/toolsets/azure_sql/tools/analyze_database_connections.py +15 -12
- holmes/plugins/toolsets/azure_sql/tools/analyze_database_health_status.py +11 -11
- holmes/plugins/toolsets/azure_sql/tools/analyze_database_performance.py +11 -9
- holmes/plugins/toolsets/azure_sql/tools/analyze_database_storage.py +15 -12
- holmes/plugins/toolsets/azure_sql/tools/get_active_alerts.py +15 -15
- holmes/plugins/toolsets/azure_sql/tools/get_slow_queries.py +11 -8
- holmes/plugins/toolsets/azure_sql/tools/get_top_cpu_queries.py +11 -8
- holmes/plugins/toolsets/azure_sql/tools/get_top_data_io_queries.py +11 -8
- holmes/plugins/toolsets/azure_sql/tools/get_top_log_io_queries.py +11 -8
- holmes/plugins/toolsets/azure_sql/utils.py +0 -32
- holmes/plugins/toolsets/bash/argocd/__init__.py +3 -3
- holmes/plugins/toolsets/bash/aws/__init__.py +4 -4
- holmes/plugins/toolsets/bash/azure/__init__.py +4 -4
- holmes/plugins/toolsets/bash/bash_toolset.py +11 -15
- holmes/plugins/toolsets/bash/common/bash.py +23 -13
- holmes/plugins/toolsets/bash/common/bash_command.py +1 -1
- holmes/plugins/toolsets/bash/common/stringify.py +1 -1
- holmes/plugins/toolsets/bash/kubectl/__init__.py +2 -1
- holmes/plugins/toolsets/bash/kubectl/constants.py +0 -1
- holmes/plugins/toolsets/bash/kubectl/kubectl_get.py +3 -4
- holmes/plugins/toolsets/bash/parse_command.py +12 -13
- holmes/plugins/toolsets/cilium.yaml +284 -0
- holmes/plugins/toolsets/connectivity_check.py +124 -0
- holmes/plugins/toolsets/coralogix/api.py +132 -119
- holmes/plugins/toolsets/coralogix/coralogix.jinja2 +14 -0
- holmes/plugins/toolsets/coralogix/toolset_coralogix.py +219 -0
- holmes/plugins/toolsets/coralogix/utils.py +15 -79
- holmes/plugins/toolsets/datadog/datadog_api.py +525 -26
- holmes/plugins/toolsets/datadog/datadog_logs_instructions.jinja2 +55 -11
- holmes/plugins/toolsets/datadog/datadog_metrics_instructions.jinja2 +3 -3
- holmes/plugins/toolsets/datadog/datadog_models.py +59 -0
- holmes/plugins/toolsets/datadog/datadog_url_utils.py +213 -0
- holmes/plugins/toolsets/datadog/instructions_datadog_traces.jinja2 +165 -28
- holmes/plugins/toolsets/datadog/toolset_datadog_general.py +417 -241
- holmes/plugins/toolsets/datadog/toolset_datadog_logs.py +234 -214
- holmes/plugins/toolsets/datadog/toolset_datadog_metrics.py +167 -79
- holmes/plugins/toolsets/datadog/toolset_datadog_traces.py +374 -363
- holmes/plugins/toolsets/elasticsearch/__init__.py +6 -0
- holmes/plugins/toolsets/elasticsearch/elasticsearch.py +834 -0
- holmes/plugins/toolsets/elasticsearch/opensearch_ppl_query_docs.jinja2 +1616 -0
- holmes/plugins/toolsets/elasticsearch/opensearch_query_assist.py +78 -0
- holmes/plugins/toolsets/elasticsearch/opensearch_query_assist_instructions.jinja2 +223 -0
- holmes/plugins/toolsets/git.py +54 -50
- holmes/plugins/toolsets/grafana/base_grafana_toolset.py +16 -4
- holmes/plugins/toolsets/grafana/common.py +13 -29
- holmes/plugins/toolsets/grafana/grafana_tempo_api.py +455 -0
- holmes/plugins/toolsets/grafana/loki/instructions.jinja2 +25 -0
- holmes/plugins/toolsets/grafana/loki/toolset_grafana_loki.py +191 -0
- holmes/plugins/toolsets/grafana/loki_api.py +4 -0
- holmes/plugins/toolsets/grafana/toolset_grafana.py +293 -89
- holmes/plugins/toolsets/grafana/toolset_grafana_dashboard.jinja2 +49 -0
- holmes/plugins/toolsets/grafana/toolset_grafana_tempo.jinja2 +246 -11
- holmes/plugins/toolsets/grafana/toolset_grafana_tempo.py +820 -292
- holmes/plugins/toolsets/grafana/trace_parser.py +4 -3
- holmes/plugins/toolsets/internet/internet.py +15 -16
- holmes/plugins/toolsets/internet/notion.py +9 -11
- holmes/plugins/toolsets/investigator/core_investigation.py +44 -36
- holmes/plugins/toolsets/investigator/model.py +3 -1
- holmes/plugins/toolsets/json_filter_mixin.py +134 -0
- holmes/plugins/toolsets/kafka.py +36 -42
- holmes/plugins/toolsets/kubernetes.yaml +317 -113
- holmes/plugins/toolsets/kubernetes_logs.py +9 -9
- holmes/plugins/toolsets/kubernetes_logs.yaml +32 -0
- holmes/plugins/toolsets/logging_utils/logging_api.py +94 -8
- holmes/plugins/toolsets/mcp/toolset_mcp.py +218 -64
- holmes/plugins/toolsets/newrelic/new_relic_api.py +165 -0
- holmes/plugins/toolsets/newrelic/newrelic.jinja2 +65 -0
- holmes/plugins/toolsets/newrelic/newrelic.py +320 -0
- holmes/plugins/toolsets/openshift.yaml +283 -0
- holmes/plugins/toolsets/prometheus/prometheus.py +1202 -421
- holmes/plugins/toolsets/prometheus/prometheus_instructions.jinja2 +54 -5
- holmes/plugins/toolsets/prometheus/utils.py +28 -0
- holmes/plugins/toolsets/rabbitmq/api.py +23 -4
- holmes/plugins/toolsets/rabbitmq/toolset_rabbitmq.py +13 -14
- holmes/plugins/toolsets/robusta/robusta.py +239 -68
- holmes/plugins/toolsets/robusta/robusta_instructions.jinja2 +26 -9
- holmes/plugins/toolsets/runbook/runbook_fetcher.py +157 -27
- holmes/plugins/toolsets/service_discovery.py +1 -1
- holmes/plugins/toolsets/servicenow_tables/instructions.jinja2 +83 -0
- holmes/plugins/toolsets/servicenow_tables/servicenow_tables.py +426 -0
- holmes/plugins/toolsets/utils.py +88 -0
- holmes/utils/config_utils.py +91 -0
- holmes/utils/connection_utils.py +31 -0
- holmes/utils/console/result.py +10 -0
- holmes/utils/default_toolset_installation_guide.jinja2 +1 -22
- holmes/utils/env.py +7 -0
- holmes/utils/file_utils.py +2 -1
- holmes/utils/global_instructions.py +60 -11
- holmes/utils/holmes_status.py +6 -4
- holmes/utils/holmes_sync_toolsets.py +0 -2
- holmes/utils/krr_utils.py +188 -0
- holmes/utils/log.py +15 -0
- holmes/utils/markdown_utils.py +2 -3
- holmes/utils/memory_limit.py +58 -0
- holmes/utils/sentry_helper.py +64 -0
- holmes/utils/stream.py +69 -8
- holmes/utils/tags.py +4 -3
- holmes/version.py +37 -15
- holmesgpt-0.18.4.dist-info/LICENSE +178 -0
- {holmesgpt-0.13.2.dist-info → holmesgpt-0.18.4.dist-info}/METADATA +35 -31
- holmesgpt-0.18.4.dist-info/RECORD +258 -0
- holmes/core/performance_timing.py +0 -72
- holmes/plugins/toolsets/aws.yaml +0 -80
- holmes/plugins/toolsets/coralogix/toolset_coralogix_logs.py +0 -112
- holmes/plugins/toolsets/datadog/datadog_traces_formatter.py +0 -310
- holmes/plugins/toolsets/datadog/toolset_datadog_rds.py +0 -739
- holmes/plugins/toolsets/grafana/grafana_api.py +0 -42
- holmes/plugins/toolsets/grafana/tempo_api.py +0 -124
- holmes/plugins/toolsets/grafana/toolset_grafana_loki.py +0 -110
- holmes/plugins/toolsets/newrelic.py +0 -231
- holmes/plugins/toolsets/opensearch/opensearch.py +0 -257
- holmes/plugins/toolsets/opensearch/opensearch_logs.py +0 -161
- holmes/plugins/toolsets/opensearch/opensearch_traces.py +0 -218
- holmes/plugins/toolsets/opensearch/opensearch_traces_instructions.jinja2 +0 -12
- holmes/plugins/toolsets/opensearch/opensearch_utils.py +0 -166
- holmes/plugins/toolsets/servicenow/install.md +0 -37
- holmes/plugins/toolsets/servicenow/instructions.jinja2 +0 -3
- holmes/plugins/toolsets/servicenow/servicenow.py +0 -219
- holmes/utils/keygen_utils.py +0 -6
- holmesgpt-0.13.2.dist-info/LICENSE.txt +0 -21
- holmesgpt-0.13.2.dist-info/RECORD +0 -234
- /holmes/plugins/toolsets/{opensearch → newrelic}/__init__.py +0 -0
- {holmesgpt-0.13.2.dist-info → holmesgpt-0.18.4.dist-info}/WHEEL +0 -0
- {holmesgpt-0.13.2.dist-info → holmesgpt-0.18.4.dist-info}/entry_points.txt +0 -0
holmes/core/supabase_dal.py  CHANGED

```diff
@@ -1,17 +1,21 @@
 import base64
 import binascii
+import gzip
 import json
 import logging
 import os
 import threading
 from datetime import datetime, timedelta
+from enum import Enum
 from typing import Dict, List, Optional, Tuple
 from uuid import uuid4
-import gzip
 
+import sentry_sdk
 import yaml  # type: ignore
 from cachetools import TTLCache  # type: ignore
+from postgrest._sync import request_builder as supabase_request_builder
 from postgrest._sync.request_builder import SyncQueryRequestBuilder
+from postgrest.base_request_builder import QueryArgs
 from postgrest.exceptions import APIError as PGAPIError
 from postgrest.types import ReturnMethod
 from pydantic import BaseModel
@@ -30,13 +34,19 @@ from holmes.core.resource_instruction import (
     ResourceInstructionDocument,
     ResourceInstructions,
 )
+from holmes.core.truncation.dal_truncation_utils import (
+    truncate_evidences_entities_if_necessary,
+)
+from holmes.plugins.runbooks import RobustaRunbookInstruction
 from holmes.utils.definitions import RobustaConfig
 from holmes.utils.env import get_env_replacement
 from holmes.utils.global_instructions import Instructions
+from holmes.utils.krr_utils import calculate_krr_savings
 
 SUPABASE_TIMEOUT_SECONDS = int(os.getenv("SUPABASE_TIMEOUT_SECONDS", 3600))
 
 ISSUES_TABLE = "Issues"
+GROUPED_ISSUES_TABLE = "GroupedIssues"
 EVIDENCE_TABLE = "Evidence"
 RUNBOOKS_TABLE = "HolmesRunbooks"
 SESSION_TOKENS_TABLE = "AuthTokens"
@@ -45,6 +55,31 @@ HOLMES_TOOLSET = "HolmesToolsStatus"
 SCANS_META_TABLE = "ScansMeta"
 SCANS_RESULTS_TABLE = "ScansResults"
 
+ENRICHMENT_BLACKLIST = ["text_file", "graph", "ai_analysis", "holmes"]
+ENRICHMENT_BLACKLIST_SET = set(ENRICHMENT_BLACKLIST)
+
+
+logging.info("Patching supabase_request_builder.pre_select")
+original_pre_select = supabase_request_builder.pre_select
+
+
+def pre_select_patched(*args, **kwargs):
+    query_args: QueryArgs = original_pre_select(*args, **kwargs)
+    if not query_args.json:
+        query_args = QueryArgs(
+            query_args.method, query_args.params, query_args.headers, None
+        )
+
+    return query_args
+
+
+supabase_request_builder.pre_select = pre_select_patched
+
+
+class FindingType(str, Enum):
+    ISSUE = "issue"
+    CONFIGURATION_CHANGE = "configuration_change"
+
 
 class RobustaToken(BaseModel):
     store_url: str
```
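The module-level patch above wraps postgrest's `pre_select` so that any select whose `QueryArgs` carries a falsy JSON body is rebuilt with `json=None`; the positional field order `method, params, headers, json` is taken from the tuple construction in the diff itself. Below is a minimal sketch of the same wrap-and-replace pattern; the `_patched` idempotency guard is an addition for illustration, not part of the diff:

```python
# Sketch of the monkey-patch pattern used above, with a guard so a second
# import of this module does not wrap pre_select twice. The QueryArgs field
# order (method, params, headers, json) matches the diff's own construction.
from postgrest._sync import request_builder as supabase_request_builder
from postgrest.base_request_builder import QueryArgs

if not getattr(supabase_request_builder.pre_select, "_patched", False):
    _original_pre_select = supabase_request_builder.pre_select

    def pre_select_patched(*args, **kwargs):
        query_args: QueryArgs = _original_pre_select(*args, **kwargs)
        if not query_args.json:
            # Rebuild the args with an explicit None body instead of e.g. {}.
            query_args = QueryArgs(
                query_args.method, query_args.params, query_args.headers, None
            )
        return query_args

    pre_select_patched._patched = True  # type: ignore[attr-defined]
    supabase_request_builder.pre_select = pre_select_patched
```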
```diff
@@ -54,12 +89,23 @@ class RobustaToken(BaseModel):
     password: str
 
 
+class SupabaseDnsException(Exception):
+    def __init__(self, error: Exception, url: str):
+        message = (
+            f"\n{error.__class__.__name__}: {error}\n"
+            f"Error connecting to <{url}>\n"
+            "This is often due to DNS issues or firewall policies - to troubleshoot run in your cluster:\n"
+            f"curl -I {url}\n"
+        )
+        super().__init__(message)
+
+
 class SupabaseDal:
     def __init__(self, cluster: str):
         self.enabled = self.__init_config()
         self.cluster = cluster
         if not self.enabled:
-            logging.
+            logging.debug(
                 "Not connecting to Robusta platform - robusta token not provided - using ROBUSTA_AI will not be possible"
             )
             return
```
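`SupabaseDnsException` turns a low-level name-resolution failure into an actionable message for cluster operators. A quick sketch of how it renders, assuming the class defined in the hunk above is in scope; the wrapped error and URL are made-up examples:

```python
# Hypothetical error and URL, used only to show the formatted message.
err = OSError("Temporary failure in name resolution")
exc = SupabaseDnsException(err, "https://db.example-robusta.dev")
print(exc)
# OSError: Temporary failure in name resolution
# Error connecting to <https://db.example-robusta.dev>
# This is often due to DNS issues or firewall policies - to troubleshoot run in your cluster:
# curl -I https://db.example-robusta.dev
```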
```diff
@@ -67,6 +113,7 @@ class SupabaseDal:
             f"Initializing Robusta platform connection for account {self.account_id}"
         )
         options = ClientOptions(postgrest_client_timeout=SUPABASE_TIMEOUT_SECONDS)
+        sentry_sdk.set_tag("db_url", self.url)
         self.client = create_client(self.url, self.api_key, options)  # type: ignore
         self.user_id = self.sign_in()
         ttl = int(os.environ.get("SAAS_SESSION_TOKEN_TTL_SEC", "82800"))  # 23 hours
@@ -117,7 +164,7 @@ class SupabaseDal:
         )
 
         if not os.path.exists(config_file_path):
-            logging.
+            logging.debug(f"No robusta config in {config_file_path}")
             return None
 
         logging.info(f"loading config {config_file_path}")
@@ -179,118 +226,183 @@ class SupabaseDal:
         return all([self.account_id, self.url, self.api_key, self.email, self.password])
 
     def sign_in(self) -> str:
-        logging.info("Supabase
-
-
-
-
-
-
-
-
-
-
-
-
+        logging.info("Supabase dal login")
+        try:
+            res = self.client.auth.sign_in_with_password(
+                {"email": self.email, "password": self.password}
+            )
+            if not res.session:
+                raise ValueError("Authentication failed: no session returned")
+            if not res.user:
+                raise ValueError("Authentication failed: no user returned")
+            self.client.auth.set_session(
+                res.session.access_token, res.session.refresh_token
+            )
+            self.client.postgrest.auth(res.session.access_token)
+            return res.user.id
+        except Exception as e:
+            error_msg = str(e).lower()
+            if any(
+                dns_indicator in error_msg
+                for dns_indicator in [
+                    "temporary failure in name resolution",
+                    "name resolution",
+                    "dns",
+                    "name or service not known",
+                    "nodename nor servname provided",
+                ]
+            ):
+                raise SupabaseDnsException(e, self.url) from e
+            raise
 
     def get_resource_recommendation(
-        self,
+        self,
+        limit: int = 10,
+        sort_by: str = "cpu_total",
+        namespace: Optional[str] = None,
+        name_pattern: Optional[str] = None,
+        kind: Optional[str] = None,
+        container: Optional[str] = None,
     ) -> Optional[List[Dict]]:
+        """
+        Fetch top N resource recommendations with optional filters and sorting.
+
+        Args:
+            limit: Maximum number of recommendations to return (default: 10)
+            sort_by: Field to sort by potential savings. Options:
+                - "cpu_total": Total CPU savings (requests + limits)
+                - "memory_total": Total memory savings (requests + limits)
+                - "cpu_requests": CPU requests savings
+                - "memory_requests": Memory requests savings
+                - "cpu_limits": CPU limits savings
+                - "memory_limits": Memory limits savings
+                - "priority": Use the priority field from the scan
+            namespace: Filter by Kubernetes namespace (exact match)
+            name_pattern: Filter by workload name (supports SQL LIKE pattern, e.g., '%app%')
+            kind: Filter by Kubernetes resource kind (e.g., Deployment, StatefulSet, DaemonSet, Job)
+            container: Filter by container name (exact match)
+
+        Returns:
+            List of recommendations sorted by the specified metric
+        """
         if not self.enabled:
             return []
 
-
-
-
-
-
-
-
-
-
-
-
+        scans_meta_response = (
+            self.client.table(SCANS_META_TABLE)
+            .select("*")
+            .eq("account_id", self.account_id)
+            .eq("cluster_id", self.cluster)
+            .eq("latest", True)
+            .execute()
+        )
+        if not len(scans_meta_response.data):
+            logging.warning("No scan metadata found for latest krr scan")
+            return None
 
-
-            self.client.table(SCANS_RESULTS_TABLE)
-            .select("*")
-            .eq("account_id", self.account_id)
-            .eq("cluster_id", self.cluster)
-            .eq("scan_id", scans_meta_response.data[0]["scan_id"])
-            .eq("name", name)
-            .eq("namespace", namespace)
-            .eq("kind", kind)
-            .execute()
-        )
-        if not len(scans_results_response.data):
-            return None
+        scan_id = scans_meta_response.data[0]["scan_id"]
 
-
-
-
+        query = (
+            self.client.table(SCANS_RESULTS_TABLE)
+            .select("*")
+            .eq("account_id", self.account_id)
+            .eq("cluster_id", self.cluster)
+            .eq("scan_id", scan_id)
+        )
+
+        if namespace:
+            query = query.eq("namespace", namespace)
+        if name_pattern:
+            query = query.like("name", name_pattern)
+        if kind:
+            query = query.eq("kind", kind)
+        if container:
+            query = query.eq("container", container)
+
+        # For priority sorting, we can use the database's order
+        if sort_by == "priority":
+            query = query.order("priority", desc=True).limit(limit)
+
+        scans_results_response = query.execute()
+
+        if not len(scans_results_response.data):
             return None
 
-
-
+        results = scans_results_response.data
+
+        if len(results) <= 1:
+            return results
+
+        # If sorting by priority, we already ordered and limited in the query
+        if sort_by == "priority":
+            return results
+
+        # Sort by calculated savings (descending)
+        results_with_savings = [
+            (result, calculate_krr_savings(result, sort_by)) for result in results
+        ]
+        results_with_savings.sort(key=lambda x: x[1], reverse=True)
+
+        return [result for result, _ in results_with_savings[:limit]]
+
+    def get_issues_metadata(
+        self,
+        start_datetime: str,
+        end_datetime: str,
+        limit: int = 100,
+        workload: Optional[str] = None,
+        ns: Optional[str] = None,
+        cluster: Optional[str] = None,
+        finding_type: FindingType = FindingType.CONFIGURATION_CHANGE,
     ) -> Optional[List[Dict]]:
         if not self.enabled:
             return []
-
+        if not cluster:
+            cluster = self.cluster
         try:
-
+            query = (
                 self.client.table(ISSUES_TABLE)
-                .select(
+                .select(
+                    "id",
+                    "title",
+                    "subject_name",
+                    "subject_namespace",
+                    "subject_type",
+                    "description",
+                    "starts_at",
+                    "ends_at",
+                )
                 .eq("account_id", self.account_id)
-                .eq("cluster",
-                .eq("finding_type", "configuration_change")
+                .eq("cluster", cluster)
                 .gte("creation_date", start_datetime)
                 .lte("creation_date", end_datetime)
-                .
+                .limit(limit)
             )
-            if not len(changes_response.data):
-                return None
 
-
-
-
+            query = query.eq("finding_type", finding_type.value)
+            if workload:
+                query.eq("subject_name", workload)
+            if ns:
+                query.eq("subject_namespace", ns)
 
-
-
-            change_data_response = (
-                self.client.table(EVIDENCE_TABLE)
-                .select("*")
-                .eq("account_id", self.account_id)
-                .in_("issue_id", changes_ids)
-                .execute()
-            )
-            if not len(change_data_response.data):
+            res = query.execute()
+            if not res.data:
                 return None
 
         except Exception:
-            logging.exception("Supabase error while retrieving change
+            logging.exception("Supabase error while retrieving change data")
             return None
 
-        changes_data = []
-        change_data_map = {
-            change["issue_id"]: change for change in change_data_response.data
-        }
-
-        for change in changes_response.data:
-            change_content = change_data_map.get(change["id"])
-            if change_content:
-                changes_data.append(
-                    {
-                        "change": change_content["data"],
-                        "evidence_id": change_content["id"],
-                        **change,
-                    }
-                )
-
         logging.debug(
-            "Change history for %s-%s: %s",
+            "Change history metadata for %s-%s workload %s in ns %s: %s",
+            start_datetime,
+            end_datetime,
+            workload,
+            ns,
+            res.data,
         )
 
-        return
+        return res.data
 
     def unzip_evidence_file(self, data):
         try:
```
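Except for `priority`, which is pushed down to the database as an `order(...).limit(...)`, `get_resource_recommendation` now sorts client-side using `calculate_krr_savings` from the new `holmes/utils/krr_utils.py` (not shown in this diff). A sketch of that decorate-sort-limit pattern, with a stub standing in for the real savings function:

```python
from typing import Dict, List


def calculate_krr_savings(result: Dict, sort_by: str) -> float:
    """Stub for holmes.utils.krr_utils.calculate_krr_savings (real logic not shown)."""
    return float(result.get(sort_by, 0))


def top_by_savings(results: List[Dict], sort_by: str, limit: int) -> List[Dict]:
    # Pair each row with its computed savings, sort descending, keep the top N.
    decorated = [(row, calculate_krr_savings(row, sort_by)) for row in results]
    decorated.sort(key=lambda pair: pair[1], reverse=True)
    return [row for row, _ in decorated[:limit]]


rows = [{"cpu_total": 2.0}, {"cpu_total": 5.5}, {"cpu_total": 0.3}]
assert top_by_savings(rows, "cpu_total", 2) == [{"cpu_total": 5.5}, {"cpu_total": 2.0}]
```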
```diff
@@ -322,22 +434,30 @@ class SupabaseDal:
             return data
 
     def extract_relevant_issues(self, evidence):
-        enrichment_blacklist = {"text_file", "graph", "ai_analysis", "holmes"}
         data = [
             enrich
             for enrich in evidence.data
-            if enrich.get("enrichment_type") not in
+            if enrich.get("enrichment_type") not in ENRICHMENT_BLACKLIST_SET
         ]
 
         unzipped_files = [
             self.unzip_evidence_file(enrich)
             for enrich in evidence.data
             if enrich.get("enrichment_type") == "text_file"
+            or enrich.get("enrichment_type") == "alert_raw_data"
         ]
 
         data.extend(unzipped_files)
         return data
 
+    def get_issue_from_db(self, issue_id: str, table: str) -> Optional[Dict]:
+        issue_response = (
+            self.client.table(table).select("*").filter("id", "eq", issue_id).execute()
+        )
+        if len(issue_response.data):
+            return issue_response.data[0]
+        return None
+
     def get_issue_data(self, issue_id: Optional[str]) -> Optional[Dict]:
         # TODO this could be done in a single atomic SELECT, but there is no
         # foreign key relation between Issues and Evidence.
```
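`extract_relevant_issues` now checks membership against the module-level `ENRICHMENT_BLACKLIST_SET` built once at import time, rather than recreating a set literal on every call, and additionally unzips `alert_raw_data` enrichments. A tiny sketch of the membership filter; the evidence rows are hypothetical:

```python
# Hypothetical evidence rows illustrating the blacklist filter above.
ENRICHMENT_BLACKLIST = ["text_file", "graph", "ai_analysis", "holmes"]
ENRICHMENT_BLACKLIST_SET = set(ENRICHMENT_BLACKLIST)

evidence_rows = [
    {"enrichment_type": "graph"},           # blacklisted, dropped
    {"enrichment_type": "k8s_events"},      # kept
    {"enrichment_type": "alert_raw_data"},  # kept here, unzipped separately
]
kept = [
    row
    for row in evidence_rows
    if row.get("enrichment_type") not in ENRICHMENT_BLACKLIST_SET
]
assert [row["enrichment_type"] for row in kept] == ["k8s_events", "alert_raw_data"]
```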
```diff
@@ -347,14 +467,11 @@ class SupabaseDal:
             return None
         issue_data = None
         try:
-
-
-                .
-
-                .
-            )
-            if len(issue_response.data):
-                issue_data = issue_response.data[0]
+            issue_data = self.get_issue_from_db(issue_id, ISSUES_TABLE)
+            if issue_data and issue_data["source"] == "prometheus":
+                logging.debug("Getting alert %s from GroupedIssuesTable", issue_id)
+                # This issue will have the complete alert duration information
+                issue_data = self.get_issue_from_db(issue_id, GROUPED_ISSUES_TABLE)
 
         except Exception:  # e.g. invalid id format
             logging.exception("Supabase error while retrieving issue data")
@@ -364,12 +481,14 @@ class SupabaseDal:
         evidence = (
             self.client.table(EVIDENCE_TABLE)
             .select("*")
-            .
+            .eq("issue_id", issue_id)
+            .not_.in_("enrichment_type", ENRICHMENT_BLACKLIST)
             .execute()
         )
-
+        relevant_evidence = self.extract_relevant_issues(evidence)
+        truncate_evidences_entities_if_necessary(relevant_evidence)
 
-        issue_data["evidence"] =
+        issue_data["evidence"] = relevant_evidence
 
         # build issue investigation dates
         started_at = issue_data.get("starts_at")
@@ -393,6 +512,79 @@ class SupabaseDal:
 
         return issue_data
 
+    def get_runbook_catalog(self) -> Optional[List[RobustaRunbookInstruction]]:
+        if not self.enabled:
+            return None
+
+        try:
+            res = (
+                self.client.table(RUNBOOKS_TABLE)
+                .select("*")
+                .eq("account_id", self.account_id)
+                .eq("subject_type", "RunbookCatalog")
+                .execute()
+            )
+            if not res.data:
+                return None
+
+            instructions = []
+            for row in res.data:
+                id = row.get("runbook_id")
+                symptom = row.get("symptoms")
+                title = row.get("subject_name")
+                if not symptom:
+                    logging.warning("Skipping runbook with empty symptom: %s", id)
+                    continue
+                instructions.append(
+                    RobustaRunbookInstruction(id=id, symptom=symptom, title=title)
+                )
+            return instructions
+        except Exception:
+            logging.exception("Failed to fetch RunbookCatalog", exc_info=True)
+            return None
+
+    def get_runbook_content(
+        self, runbook_id: str
+    ) -> Optional[RobustaRunbookInstruction]:
+        if not self.enabled:
+            return None
+
+        res = (
+            self.client.table(RUNBOOKS_TABLE)
+            .select("*")
+            .eq("account_id", self.account_id)
+            .eq("subject_type", "RunbookCatalog")
+            .eq("runbook_id", runbook_id)
+            .execute()
+        )
+        if not res.data or len(res.data) != 1:
+            return None
+
+        row = res.data[0]
+        id = row.get("runbook_id")
+        symptom = row.get("symptoms")
+        title = row.get("subject_name")
+        raw_instruction = row.get("runbook").get("instructions")
+        # TODO: remove in the future when we migrate the table data
+        if isinstance(raw_instruction, list) and len(raw_instruction) == 1:
+            instruction = raw_instruction[0]
+        elif isinstance(raw_instruction, list) and len(raw_instruction) > 1:
+            # not currently used, but will be used in the future
+            instruction = "\n - ".join(raw_instruction)
+        elif isinstance(raw_instruction, str):
+            # not supported by the current UI, but will be supported in the future
+            instruction = raw_instruction
+        else:
+            # in case the format is unexpected, convert to string
+            logging.error(
+                f"Unexpected runbook instruction format for runbook_id={runbook_id}: {raw_instruction}"
+            )
+            instruction = str(raw_instruction)
+
+        return RobustaRunbookInstruction(
+            id=id, symptom=symptom, instruction=instruction, title=title
+        )
+
     def get_resource_instructions(
         self, type: str, name: Optional[str]
     ) -> Optional[ResourceInstructions]:
```
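`get_runbook_content` has to normalize the stored `instructions` value, which may arrive as a one-element list, a multi-element list, or a plain string. The same branching, extracted into a standalone function for illustration (behavior mirrors the diff, including the `str()` fallback for unexpected formats):

```python
import logging
from typing import Any


def normalize_instruction(raw: Any, runbook_id: str) -> str:
    # Mirrors the branching in get_runbook_content above.
    if isinstance(raw, list) and len(raw) == 1:
        return raw[0]
    if isinstance(raw, list) and len(raw) > 1:
        return "\n - ".join(raw)
    if isinstance(raw, str):
        return raw
    logging.error(
        "Unexpected runbook instruction format for runbook_id=%s: %s", runbook_id, raw
    )
    return str(raw)


assert normalize_instruction(["restart the pod"], "rb-1") == "restart the pod"
assert normalize_instruction(["check logs", "restart"], "rb-2") == "check logs\n - restart"
```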
```diff
@@ -512,10 +704,13 @@ class SupabaseDal:
                 self.client.table(EVIDENCE_TABLE)
                 .select("data, enrichment_type")
                 .in_("issue_id", unique_issues)
+                .not_.in_("enrichment_type", ENRICHMENT_BLACKLIST)
                 .execute()
             )
 
-
+            relevant_issues = self.extract_relevant_issues(res)
+            truncate_evidences_entities_if_necessary(relevant_issues)
+            return relevant_issues
 
         except Exception:
             logging.exception("failed to fetch workload issues data", exc_info=True)
```