pg_reports 0.4.0 → 0.5.0

Files changed (36)
  1. checksums.yaml +4 -4
  2. data/CHANGELOG.md +104 -0
  3. data/README.md +129 -4
  4. data/app/controllers/pg_reports/dashboard_controller.rb +188 -25
  5. data/app/views/layouts/pg_reports/application.html.erb +282 -0
  6. data/app/views/pg_reports/dashboard/_show_scripts.html.erb +184 -23
  7. data/app/views/pg_reports/dashboard/_show_styles.html.erb +373 -0
  8. data/app/views/pg_reports/dashboard/index.html.erb +419 -0
  9. data/config/locales/en.yml +45 -0
  10. data/config/locales/ru.yml +45 -0
  11. data/config/routes.rb +8 -0
  12. data/lib/pg_reports/configuration.rb +13 -0
  13. data/lib/pg_reports/dashboard/reports_registry.rb +24 -1
  14. data/lib/pg_reports/definitions/connections/connection_churn.yml +49 -0
  15. data/lib/pg_reports/definitions/connections/pool_saturation.yml +42 -0
  16. data/lib/pg_reports/definitions/connections/pool_usage.yml +43 -0
  17. data/lib/pg_reports/definitions/connections/pool_wait_times.yml +44 -0
  18. data/lib/pg_reports/definitions/queries/missing_index_queries.yml +3 -3
  19. data/lib/pg_reports/explain_analyzer.rb +338 -0
  20. data/lib/pg_reports/modules/schema_analysis.rb +4 -6
  21. data/lib/pg_reports/modules/system.rb +19 -2
  22. data/lib/pg_reports/query_monitor.rb +280 -0
  23. data/lib/pg_reports/sql/connections/connection_churn.sql +37 -0
  24. data/lib/pg_reports/sql/connections/pool_saturation.sql +90 -0
  25. data/lib/pg_reports/sql/connections/pool_usage.sql +31 -0
  26. data/lib/pg_reports/sql/connections/pool_wait_times.sql +19 -0
  27. data/lib/pg_reports/sql/queries/all_queries.sql +17 -15
  28. data/lib/pg_reports/sql/queries/expensive_queries.sql +9 -4
  29. data/lib/pg_reports/sql/queries/heavy_queries.sql +14 -12
  30. data/lib/pg_reports/sql/queries/low_cache_hit_queries.sql +16 -14
  31. data/lib/pg_reports/sql/queries/missing_index_queries.sql +18 -16
  32. data/lib/pg_reports/sql/queries/slow_queries.sql +14 -12
  33. data/lib/pg_reports/sql/system/databases_list.sql +8 -0
  34. data/lib/pg_reports/version.rb +1 -1
  35. data/lib/pg_reports.rb +2 -0
  36. metadata +56 -3
data/lib/pg_reports/definitions/connections/connection_churn.yml
@@ -0,0 +1,49 @@
+# Connection Churn Analysis
+# Analyzes connection creation/destruction patterns and short-lived connections
+
+report:
+  name: connection_churn
+  module: connections
+  description: "Connection churn and short-lived connection analysis"
+
+  sql:
+    category: connections
+    file: connection_churn
+
+  title: "Connection Churn Analysis"
+
+  columns:
+    - database
+    - application
+    - total_connections
+    - avg_connection_age_seconds
+    - min_connection_age_seconds
+    - max_connection_age_seconds
+    - short_lived_connections
+    - churn_rate_pct
+
+  thresholds:
+    churn_rate_pct:
+      warning: 50
+      critical: 75
+    short_lived_connections:
+      warning: 10
+      critical: 25
+
+  problem_fields:
+    - churn_rate_pct
+    - short_lived_connections
+
+  problem_explanations:
+    churn_rate_pct: high_connection_churn
+    short_lived_connections: too_many_short_connections
+
+  documentation:
+    what: "Analyzes connection lifecycle patterns to identify excessive connection churn (frequent connect/disconnect cycles)."
+    why: "High connection churn wastes resources on connection setup/teardown and indicates potential connection pooling issues. Short-lived connections suggest the application isn't reusing connections efficiently."
+    nuances:
+      - "Connections under 10 seconds old are considered short-lived"
+      - "High churn rate (>50%) suggests missing or misconfigured connection pooling"
+      - "Many short-lived connections increase CPU overhead and authentication load"
+      - "Consider using PgBouncer or similar pooler to reduce churn"
+      - "Web applications should maintain a connection pool, not create connections per request"
data/lib/pg_reports/definitions/connections/pool_saturation.yml
@@ -0,0 +1,42 @@
+# Connection Pool Saturation Warnings
+# Identifies connection pool saturation and potential exhaustion
+
+report:
+  name: pool_saturation
+  module: connections
+  description: "Connection pool saturation analysis and warnings"
+
+  sql:
+    category: connections
+    file: pool_saturation
+
+  title: "Pool Saturation Warnings"
+
+  columns:
+    - metric
+    - current_value
+    - max_value
+    - utilization_pct
+    - status
+    - recommendation
+
+  thresholds:
+    utilization_pct:
+      warning: 70
+      critical: 85
+
+  problem_fields:
+    - utilization_pct
+
+  problem_explanations:
+    utilization_pct: pool_saturation
+
+  documentation:
+    what: "Overall connection pool health metrics with saturation warnings and recommendations."
+    why: "Pool saturation leads to connection exhaustion, causing 'too many connections' errors and application failures. Early detection prevents outages."
+    nuances:
+      - "Utilization consistently above 70% suggests need for pool tuning or scaling"
+      - "High idle in transaction connections waste resources and should be minimized"
+      - "Reserved connections (superuser_reserved_connections) reduce available pool"
+      - "Consider implementing connection pooling if not already in use"
+      - "Monitor trends over time - sudden spikes may indicate connection leaks"
data/lib/pg_reports/definitions/connections/pool_usage.yml
@@ -0,0 +1,43 @@
+# Connection Pool Usage Statistics
+# Shows current pool utilization, limits, and capacity warnings
+
+report:
+  name: pool_usage
+  module: connections
+  description: "Connection pool usage and capacity analysis"
+
+  sql:
+    category: connections
+    file: pool_usage
+
+  title: "Connection Pool Usage"
+
+  columns:
+    - database
+    - total_connections
+    - active_connections
+    - idle_connections
+    - idle_in_transaction
+    - max_connections
+    - utilization_pct
+    - available_connections
+
+  thresholds:
+    utilization_pct:
+      warning: 70
+      critical: 85
+
+  problem_fields:
+    - utilization_pct
+
+  problem_explanations:
+    utilization_pct: high_pool_usage
+
+  documentation:
+    what: "Current connection pool utilization across all databases, showing active, idle, and available connections."
+    why: "High pool utilization can lead to connection exhaustion, causing application errors and degraded performance. Monitoring pool usage helps prevent connection starvation."
+    nuances:
+      - "Utilization above 70% indicates you're approaching pool limits"
+      - "Idle in transaction connections hold locks and can block other queries"
+      - "max_connections is a database-wide setting, not per-database"
+      - "Consider using connection pooling (PgBouncer/pgpool) for better resource management"
data/lib/pg_reports/definitions/connections/pool_wait_times.yml
@@ -0,0 +1,44 @@
+# Connection Pool Wait Time Analysis
+# Analyzes queries waiting for resources (locks, IO, etc.)
+
+report:
+  name: pool_wait_times
+  module: connections
+  description: "Analysis of queries waiting for resources"
+
+  sql:
+    category: connections
+    file: pool_wait_times
+
+  title: "Pool Wait Time Analysis"
+
+  columns:
+    - pid
+    - database
+    - username
+    - wait_event_type
+    - wait_event
+    - state
+    - wait_duration_seconds
+    - query_start
+    - query
+
+  thresholds:
+    wait_duration_seconds:
+      warning: 10
+      critical: 60
+
+  problem_fields:
+    - wait_duration_seconds
+
+  problem_explanations:
+    wait_duration_seconds: long_wait_time
+
+  documentation:
+    what: "Queries currently waiting for resources like locks, I/O, or network operations."
+    why: "Long wait times indicate resource contention or bottlenecks. Understanding what queries are waiting for helps identify performance issues."
+    nuances:
+      - "ClientRead wait events indicate slow clients not consuming data fast enough"
+      - "Lock waits suggest contention between concurrent queries"
+      - "IO waits may indicate disk performance issues or need for more cache"
+      - "Wait times above 60 seconds are critical and should be investigated immediately"
data/lib/pg_reports/definitions/queries/missing_index_queries.yml
@@ -16,9 +16,9 @@ report:
     - query
     - source
     - calls
-    - seq_scan_count
-    - rows_examined
-    - table_name
+    - total_time_ms
+    - rows_per_call
+    - disk_read_ratio
 
   parameters:
     limit:
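The new columns line up with pg_stat_statements fields. The reworked missing_index_queries.sql (+18 -16 in the file list) is not shown in this diff, so the following derivation is only a plausible guess; total_exec_time is the PostgreSQL 13+ column name:

    # Hedged guess at how the new columns could be computed; not the gem's SQL.
    require "pg"

    conn = PG.connect(dbname: "postgres")
    conn.exec(<<~SQL).each { |row| p row }
      SELECT query,
             calls,
             total_exec_time AS total_time_ms,
             rows / NULLIF(calls, 0) AS rows_per_call,
             shared_blks_read::float
               / NULLIF(shared_blks_hit + shared_blks_read, 0) AS disk_read_ratio
      FROM pg_stat_statements
      ORDER BY total_exec_time DESC
      LIMIT 20
    SQL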
data/lib/pg_reports/explain_analyzer.rb
@@ -0,0 +1,338 @@
+# frozen_string_literal: true
+
+module PgReports
+  # Analyzes EXPLAIN ANALYZE output and extracts insights
+  class ExplainAnalyzer
+    # Node types and their characteristics
+    NODE_TYPES = {
+      "Seq Scan" => {color: "warning", description: "Full table scan - potentially slow for large tables"},
+      "Index Scan" => {color: "good", description: "Using an index efficiently"},
+      "Index Only Scan" => {color: "good", description: "Most efficient - reading only from index"},
+      "Bitmap Index Scan" => {color: "ok", description: "First step of bitmap scan"},
+      "Bitmap Heap Scan" => {color: "ok", description: "Using multiple indexes combined"},
+      "Nested Loop" => {color: "neutral", description: "Joining tables in a loop"},
+      "Hash Join" => {color: "good", description: "Efficient join using hash table"},
+      "Merge Join" => {color: "good", description: "Efficient join on sorted data"},
+      "Sort" => {color: "warning", description: "Sorting data in memory or disk"},
+      "HashAggregate" => {color: "ok", description: "Grouping using hash table"},
+      "GroupAggregate" => {color: "ok", description: "Grouping on sorted data"},
+      "Aggregate" => {color: "ok", description: "Computing aggregate functions"},
+      "Limit" => {color: "good", description: "Limiting result set"},
+      "Subquery Scan" => {color: "neutral", description: "Scanning a subquery result"},
+      "CTE Scan" => {color: "neutral", description: "Scanning a Common Table Expression"},
+      "Materialize" => {color: "warning", description: "Caching intermediate results"},
+      "Gather" => {color: "ok", description: "Parallel query coordination"},
+      "Gather Merge" => {color: "ok", description: "Parallel query with merge"}
+    }.freeze
+
+    attr_reader :raw_output, :lines, :problems, :summary
+
+    def initialize(explain_output)
+      @raw_output = explain_output
+      @lines = explain_output.split("\n")
+      @problems = []
+      @summary = {}
+      analyze
+    end
+
+    def to_h
+      {
+        raw_output: @raw_output,
+        annotated_lines: annotate_lines,
+        problems: @problems,
+        summary: @summary,
+        stats: extract_stats
+      }
+    end
+
+    private
+
+    def analyze
+      detect_sequential_scans
+      detect_high_cost_operations
+      detect_sort_operations
+      detect_low_row_accuracy
+      detect_timing_issues
+      build_summary
+    end
+
+    # Annotate each line with metadata for rendering
+    def annotate_lines
+      @lines.map.with_index do |line, idx|
+        node_type = extract_node_type(line)
+        metrics = extract_metrics(line)
+
+        {
+          line_number: idx + 1,
+          text: line,
+          node_type: node_type,
+          node_info: NODE_TYPES[node_type],
+          metrics: metrics,
+          indent_level: line[/^ */].length / 2,
+          is_planning: line.include?("Planning"),
+          is_execution: line.include?("Execution"),
+          is_timing: line.match?(/Planning Time|Execution Time/)
+        }
+      end
+    end
+
+    def extract_node_type(line)
+      NODE_TYPES.keys.find { |type| line.include?(type) }
+    end
+
+    def extract_metrics(line)
+      metrics = {}
+
+      # Extract cost
+      if (match = line.match(/cost=([\d.]+)\.\.([\d.]+)/))
+        metrics[:startup_cost] = match[1].to_f
+        metrics[:total_cost] = match[2].to_f
+      end
+
+      # Extract rows
+      if (match = line.match(/rows=(\d+)/))
+        metrics[:rows_estimated] = match[1].to_i
+      end
+
+      # Extract actual rows
+      if (match = line.match(/rows=(\d+).*actual.*rows=(\d+)/))
+        metrics[:rows_estimated] = match[1].to_i
+        metrics[:rows_actual] = match[2].to_i
+      elsif (match = line.match(/actual.*rows=(\d+)/))
+        metrics[:rows_actual] = match[1].to_i
+      end
+
+      # Extract actual time
+      if (match = line.match(/actual time=([\d.]+)\.\.([\d.]+)/))
+        metrics[:actual_time_start] = match[1].to_f
+        metrics[:actual_time_end] = match[2].to_f
+      end
+
+      # Extract loops
+      if (match = line.match(/loops=(\d+)/))
+        metrics[:loops] = match[1].to_i
+      end
+
+      # Extract buffers
+      if (match = line.match(/Buffers: shared hit=(\d+)/))
+        metrics[:buffers_hit] = match[1].to_i
+      end
+      if (match = line.match(/read=(\d+)/))
+        metrics[:buffers_read] = match[1].to_i
+      end
+
+      metrics
+    end
+
+    def extract_stats
+      stats = {}
+
+      @lines.each do |line|
+        if (match = line.match(/Planning Time: ([\d.]+) ms/))
+          stats[:planning_time] = match[1].to_f
+        elsif (match = line.match(/Execution Time: ([\d.]+) ms/))
+          stats[:execution_time] = match[1].to_f
+        end
+      end
+
+      # Extract top-level cost and rows from first line with cost
+      first_cost_line = @lines.find { |l| l.include?("cost=") }
+      if first_cost_line
+        if (match = first_cost_line.match(/cost=[\d.]+\.\.([\d.]+)/))
+          stats[:total_cost] = match[1].to_f
+        end
+        if (match = first_cost_line.match(/rows=(\d+)/))
+          stats[:rows_estimated] = match[1].to_i
+        end
+      end
+
+      stats
+    end
+
+    def detect_sequential_scans
+      seq_scans = []
+
+      @lines.each_with_index do |line, idx|
+        next unless line.include?("Seq Scan")
+
+        table_name = extract_table_name(line)
+        metrics = extract_metrics(line)
+
+        # Consider it a problem if:
+        # 1. High cost (> 1000)
+        # 2. Many rows (> 1000)
+        # 3. Significant actual time (> 100ms per loop)
+        is_problem = false
+        reasons = []
+
+        if metrics[:total_cost] && metrics[:total_cost] > 1000
+          is_problem = true
+          reasons << "high cost (#{metrics[:total_cost].round(2)})"
+        end
+
+        if metrics[:rows_estimated] && metrics[:rows_estimated] > 1000
+          is_problem = true
+          reasons << "many rows (#{metrics[:rows_estimated]})"
+        end
+
+        if metrics[:actual_time_end] && metrics[:actual_time_end] > 100
+          is_problem = true
+          reasons << "slow execution (#{metrics[:actual_time_end].round(2)}ms)"
+        end
+
+        if is_problem
+          @problems << {
+            type: :sequential_scan,
+            severity: :warning,
+            line_number: idx + 1,
+            table: table_name,
+            message: "Sequential scan on #{table_name || "table"}",
+            details: reasons.join(", "),
+            recommendation: "Consider adding an index on frequently filtered columns"
+          }
+        end
+
+        seq_scans << {table: table_name, line: idx + 1, is_problem: is_problem}
+      end
+
+      seq_scans
+    end
+
+    def detect_high_cost_operations
+      @lines.each_with_index do |line, idx|
+        metrics = extract_metrics(line)
+        next unless metrics[:total_cost]
+
+        # Flag operations with very high cost (> 10000)
+        if metrics[:total_cost] > 10000
+          node_type = extract_node_type(line)
+          @problems << {
+            type: :high_cost,
+            severity: :warning,
+            line_number: idx + 1,
+            node_type: node_type,
+            cost: metrics[:total_cost],
+            message: "Very high cost operation (#{metrics[:total_cost].round(2)})",
+            recommendation: "This operation is expensive - review if it can be optimized"
+          }
+        end
+      end
+    end
+
+    def detect_sort_operations
+      @lines.each_with_index do |line, idx|
+        next unless line.include?("Sort")
+
+        # Check if sort spilled to disk
+        if line.match?(/external.*sort/i) || line.include?("Disk:")
+          @problems << {
+            type: :sort_spill,
+            severity: :critical,
+            line_number: idx + 1,
+            message: "Sort operation spilled to disk",
+            recommendation: "Increase work_mem or optimize query to reduce sort size"
+          }
+        elsif line.include?("Sort")
+          # Just a regular sort, note it but not necessarily a problem
+          metrics = extract_metrics(line)
+          if metrics[:actual_time_end] && metrics[:actual_time_end] > 1000
+            @problems << {
+              type: :slow_sort,
+              severity: :warning,
+              line_number: idx + 1,
+              message: "Slow sort operation (#{metrics[:actual_time_end].round(2)}ms)",
+              recommendation: "Consider reducing the dataset before sorting or using an index"
+            }
+          end
+        end
+      end
+    end
+
+    def detect_low_row_accuracy
+      @lines.each_with_index do |line, idx|
+        metrics = extract_metrics(line)
+        next unless metrics[:rows_estimated] && metrics[:rows_actual]
+
+        estimated = metrics[:rows_estimated].to_f
+        actual = metrics[:rows_actual].to_f
+
+        # Skip if very small numbers
+        next if estimated < 10 && actual < 10
+
+        # Calculate ratio (avoid division by zero)
+        max_val = [estimated, actual].max
+        min_val = [estimated, actual].min
+        next if max_val == 0
+
+        ratio = max_val / min_val
+
+        # If estimation is off by more than 10x, it's a problem
+        if ratio > 10
+          @problems << {
+            type: :estimation_error,
+            severity: :warning,
+            line_number: idx + 1,
+            message: "Row estimation is significantly off (estimated: #{estimated.to_i}, actual: #{actual.to_i})",
+            recommendation: "Run ANALYZE on the involved tables to update statistics"
+          }
+        end
+      end
+    end
+
+    def detect_timing_issues
+      stats = extract_stats
+
+      if stats[:execution_time] && stats[:execution_time] > 1000
+        @problems << {
+          type: :slow_query,
+          severity: :critical,
+          message: "Query execution is very slow (#{stats[:execution_time].round(2)}ms)",
+          recommendation: "Review the execution plan for optimization opportunities"
+        }
+      end
+
+      if stats[:planning_time] && stats[:planning_time] > 100
+        @problems << {
+          type: :slow_planning,
+          severity: :info,
+          message: "Query planning is slow (#{stats[:planning_time].round(2)}ms)",
+          recommendation: "Consider simplifying the query or using prepared statements"
+        }
+      end
+    end
+
+    def build_summary
+      @summary = {
+        total_problems: @problems.length,
+        critical_problems: @problems.count { |p| p[:severity] == :critical },
+        warnings: @problems.count { |p| p[:severity] == :warning },
+        info: @problems.count { |p| p[:severity] == :info }
+      }
+
+      # Add overall assessment
+      if @summary[:critical_problems] > 0
+        @summary[:status] = "critical"
+        @summary[:status_text] = "Critical issues detected"
+        @summary[:status_icon] = "🔴"
+      elsif @summary[:warnings] > 0
+        @summary[:status] = "warning"
+        @summary[:status_text] = "Potential issues detected"
+        @summary[:status_icon] = "🟡"
+      else
+        @summary[:status] = "good"
+        @summary[:status_text] = "No issues detected"
+        @summary[:status_icon] = "🟢"
+      end
+
+      # Group problems by type for summary
+      problem_types = @problems.group_by { |p| p[:type] }
+      @summary[:problem_breakdown] = problem_types.transform_values(&:count)
+    end
+
+    def extract_table_name(line)
+      if (match = line.match(/on (\w+)/))
+        match[1]
+      end
+    end
+  end
+end
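ExplainAnalyzer takes the raw text of an EXPLAIN ANALYZE run and returns the annotated structure via #to_h, as defined above. A usage sketch from inside a Rails app; the users table and query are placeholders:

    # The plan text can come from any source; here it is fetched via ActiveRecord.
    plan = ActiveRecord::Base.connection
      .execute("EXPLAIN (ANALYZE, BUFFERS) SELECT * FROM users WHERE email = 'x@example.com'")
      .map { |row| row["QUERY PLAN"] }
      .join("\n")

    result = PgReports::ExplainAnalyzer.new(plan).to_h
    puts "#{result[:summary][:status_icon]} #{result[:summary][:status_text]}"
    result[:problems].each do |problem|
      puts "#{problem[:severity]}: #{problem[:message]} - #{problem[:recommendation]}"
    end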
data/lib/pg_reports/modules/schema_analysis.rb
@@ -89,12 +89,10 @@ module PgReports
       ].uniq
 
       possible_names.each do |model_name|
-        begin
-          model = model_name.constantize
-          return model if model.is_a?(Class) && model < ActiveRecord::Base
-        rescue NameError
-          # Model doesn't exist, try next one
-        end
+        model = model_name.constantize
+        return model if model.is_a?(Class) && model < ActiveRecord::Base
+      rescue NameError
+        # Model doesn't exist, try next one
       end
 
       nil
data/lib/pg_reports/modules/system.rb
@@ -50,8 +50,7 @@ module PgReports
     # @return [Hash] Metrics data
     def live_metrics(long_query_threshold: 60)
       data = executor.execute_from_file(:system, :live_metrics,
-        long_query_threshold: long_query_threshold
-      )
+        long_query_threshold: long_query_threshold)
 
       row = data.first || {}
 
data/lib/pg_reports/modules/system.rb
@@ -116,6 +115,24 @@ module PgReports
       end
     end
 
+    # Get list of all databases
+    # @return [Array<Hash>] List of databases with sizes
+    def databases_list
+      executor.execute_from_file(:system, :databases_list)
+    rescue
+      # Fallback to empty array if query fails
+      []
+    end
+
+    # Get current database name
+    # @return [String] Current database name
+    def current_database
+      result = executor.execute("SELECT current_database() AS database")
+      result.first&.fetch("database", "unknown") || "unknown"
+    rescue
+      "unknown"
+    end
+
     private
 
     def executor
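databases_list is backed by the new databases_list.sql, which appears in the file list (+8 lines) but not in this diff. Given the doc comment ("List of databases with sizes"), a plausible equivalent query:

    # Hedged sketch; not necessarily the gem's actual databases_list.sql.
    require "pg"

    conn = PG.connect(dbname: "postgres")
    conn.exec(<<~SQL).each { |row| p row }
      SELECT datname AS database,
             pg_size_pretty(pg_database_size(datname)) AS size
      FROM pg_database
      WHERE NOT datistemplate
      ORDER BY pg_database_size(datname) DESC
    SQL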