aidp 0.3.0 → 0.7.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (51)
  1. checksums.yaml +4 -4
  2. data/README.md +191 -5
  3. data/lib/aidp/analysis/kb_inspector.rb +456 -0
  4. data/lib/aidp/analysis/seams.rb +188 -0
  5. data/lib/aidp/analysis/tree_sitter_grammar_loader.rb +493 -0
  6. data/lib/aidp/analysis/tree_sitter_scan.rb +703 -0
  7. data/lib/aidp/analyze/agent_personas.rb +1 -1
  8. data/lib/aidp/analyze/agent_tool_executor.rb +5 -11
  9. data/lib/aidp/analyze/data_retention_manager.rb +0 -5
  10. data/lib/aidp/analyze/database.rb +99 -82
  11. data/lib/aidp/analyze/error_handler.rb +12 -79
  12. data/lib/aidp/analyze/export_manager.rb +0 -7
  13. data/lib/aidp/analyze/focus_guidance.rb +2 -2
  14. data/lib/aidp/analyze/incremental_analyzer.rb +1 -11
  15. data/lib/aidp/analyze/large_analysis_progress.rb +0 -5
  16. data/lib/aidp/analyze/memory_manager.rb +34 -60
  17. data/lib/aidp/analyze/metrics_storage.rb +336 -0
  18. data/lib/aidp/analyze/parallel_processor.rb +0 -6
  19. data/lib/aidp/analyze/performance_optimizer.rb +0 -3
  20. data/lib/aidp/analyze/prioritizer.rb +2 -2
  21. data/lib/aidp/analyze/repository_chunker.rb +14 -21
  22. data/lib/aidp/analyze/ruby_maat_integration.rb +6 -102
  23. data/lib/aidp/analyze/runner.rb +107 -191
  24. data/lib/aidp/analyze/steps.rb +35 -30
  25. data/lib/aidp/analyze/storage.rb +233 -178
  26. data/lib/aidp/analyze/tool_configuration.rb +21 -36
  27. data/lib/aidp/cli/jobs_command.rb +489 -0
  28. data/lib/aidp/cli/terminal_io.rb +52 -0
  29. data/lib/aidp/cli.rb +160 -45
  30. data/lib/aidp/core_ext/class_attribute.rb +36 -0
  31. data/lib/aidp/database/pg_adapter.rb +148 -0
  32. data/lib/aidp/database_config.rb +69 -0
  33. data/lib/aidp/database_connection.rb +72 -0
  34. data/lib/aidp/execute/runner.rb +65 -92
  35. data/lib/aidp/execute/steps.rb +81 -82
  36. data/lib/aidp/job_manager.rb +41 -0
  37. data/lib/aidp/jobs/base_job.rb +45 -0
  38. data/lib/aidp/jobs/provider_execution_job.rb +83 -0
  39. data/lib/aidp/provider_manager.rb +25 -0
  40. data/lib/aidp/providers/agent_supervisor.rb +348 -0
  41. data/lib/aidp/providers/anthropic.rb +160 -3
  42. data/lib/aidp/providers/base.rb +153 -6
  43. data/lib/aidp/providers/cursor.rb +245 -43
  44. data/lib/aidp/providers/gemini.rb +164 -3
  45. data/lib/aidp/providers/supervised_base.rb +317 -0
  46. data/lib/aidp/providers/supervised_cursor.rb +22 -0
  47. data/lib/aidp/version.rb +1 -1
  48. data/lib/aidp.rb +31 -34
  49. data/templates/ANALYZE/01_REPOSITORY_ANALYSIS.md +4 -4
  50. data/templates/ANALYZE/06a_tree_sitter_scan.md +217 -0
  51. metadata +91 -36
@@ -0,0 +1,336 @@
1
+ # frozen_string_literal: true
2
+
3
+ require "pg"
4
+ require "json"
5
+
6
+ module Aidp
7
+ module Analyze
8
+ class MetricsStorage
9
+ # Database schema version
10
+ SCHEMA_VERSION = 1
11
+
12
+ def initialize(project_dir = Dir.pwd, db_config = nil)
13
+ @project_dir = project_dir
14
+ @db_config = db_config || default_db_config
15
+ @db = nil
16
+
17
+ ensure_database_exists
18
+ end
19
+
20
+ # Store step execution metrics
21
+ def store_step_metrics(step_name, provider_name, duration, success, metadata = {})
22
+ ensure_connection
23
+
24
+ timestamp = Time.now
25
+
26
+ result = @db.exec_params(
27
+ "INSERT INTO step_executions (step_name, provider_name, duration, success, metadata, created_at) VALUES ($1, $2, $3, $4, $5, $6) RETURNING id",
28
+ [step_name, provider_name, duration, success, metadata.to_json, timestamp]
29
+ )
30
+
31
+ {
32
+ id: result[0]["id"],
33
+ step_name: step_name,
34
+ provider_name: provider_name,
35
+ duration: duration,
36
+ success: success,
37
+ stored_at: timestamp
38
+ }
39
+ end
40
+
41
+ # Store provider activity metrics
42
+ def store_provider_activity(provider_name, step_name, activity_summary)
43
+ ensure_connection
44
+
45
+ timestamp = Time.now
46
+
47
+ result = @db.exec_params(
48
+ "INSERT INTO provider_activities (provider_name, step_name, start_time, end_time, duration, final_state, stuck_detected, created_at) VALUES ($1, $2, $3, $4, $5, $6, $7, $8) RETURNING id",
49
+ [
50
+ provider_name,
51
+ step_name,
52
+ activity_summary[:start_time],
53
+ activity_summary[:end_time],
54
+ activity_summary[:duration],
55
+ activity_summary[:final_state].to_s,
56
+ activity_summary[:stuck_detected],
57
+ timestamp
58
+ ]
59
+ )
60
+
61
+ {
62
+ id: result[0]["id"],
63
+ provider_name: provider_name,
64
+ step_name: step_name,
65
+ stored_at: timestamp
66
+ }
67
+ end
68
+
69
+ # Get step execution statistics
70
+ def get_step_statistics(step_name = nil, provider_name = nil, limit = 100)
71
+ ensure_connection
72
+
73
+ query = "SELECT * FROM step_executions WHERE 1=1"
74
+ params = []
75
+ param_index = 1
76
+
77
+ if step_name
78
+ query += " AND step_name = $#{param_index}"
79
+ params << step_name
80
+ param_index += 1
81
+ end
82
+
83
+ if provider_name
84
+ query += " AND provider_name = $#{param_index}"
85
+ params << provider_name
86
+ param_index += 1
87
+ end
88
+
89
+ query += " ORDER BY created_at DESC LIMIT $#{param_index}"
90
+ params << limit
91
+
92
+ results = @db.exec_params(query, params)
93
+ results.map { |row| parse_step_execution(row) }
94
+ end
95
+
96
+ # Get provider activity statistics
97
+ def get_provider_activity_statistics(provider_name = nil, step_name = nil, limit = 100)
98
+ ensure_connection
99
+
100
+ query = "SELECT * FROM provider_activities WHERE 1=1"
101
+ params = []
102
+ param_index = 1
103
+
104
+ if provider_name
105
+ query += " AND provider_name = $#{param_index}"
106
+ params << provider_name
107
+ param_index += 1
108
+ end
109
+
110
+ if step_name
111
+ query += " AND step_name = $#{param_index}"
112
+ params << step_name
113
+ param_index += 1
114
+ end
115
+
116
+ query += " ORDER BY created_at DESC LIMIT $#{param_index}"
117
+ params << limit
118
+
119
+ results = @db.exec_params(query, params)
120
+ results.map { |row| parse_provider_activity(row) }
121
+ end
122
+
123
+ # Calculate timeout recommendations based on p95 of execution times
124
+ def calculate_timeout_recommendations
125
+ ensure_connection
126
+
127
+ recommendations = {}
128
+
129
+ # Get all step names
130
+ step_names = @db.exec("SELECT DISTINCT step_name FROM step_executions WHERE success = true")
131
+
132
+ step_names.each do |row|
133
+ step_name = row["step_name"]
134
+
135
+ # Get successful executions for this step
136
+ durations = @db.exec_params(
137
+ "SELECT duration FROM step_executions WHERE step_name = $1 AND success = true ORDER BY duration",
138
+ [step_name]
139
+ ).map { |r| r["duration"].to_f }
140
+
141
+ next if durations.empty?
142
+
143
+ # Calculate p95
144
+ p95_index = (durations.length * 0.95).ceil - 1
145
+ p95_duration = durations[p95_index]
146
+
147
+ # Round up to nearest second and add 10% buffer
148
+ recommended_timeout = (p95_duration * 1.1).ceil
149
+
150
+ recommendations[step_name] = {
151
+ p95_duration: p95_duration,
152
+ recommended_timeout: recommended_timeout,
153
+ sample_count: durations.length,
154
+ min_duration: durations.first,
155
+ max_duration: durations.last,
156
+ avg_duration: durations.sum.to_f / durations.length
157
+ }
158
+ end
159
+
160
+ recommendations
161
+ end
162
+
163
+ # Get overall metrics summary
164
+ def get_metrics_summary
165
+ ensure_connection
166
+
167
+ summary = {}
168
+
169
+ # Total executions
170
+ total_executions = @db.exec("SELECT COUNT(*) FROM step_executions").first["count"].to_i
171
+ summary[:total_executions] = total_executions
172
+
173
+ # Successful executions
174
+ successful_executions = @db.exec("SELECT COUNT(*) FROM step_executions WHERE success = true").first["count"].to_i
175
+ summary[:successful_executions] = successful_executions
176
+
177
+ # Success rate
178
+ summary[:success_rate] = (total_executions > 0) ? (successful_executions.to_f / total_executions * 100).round(2) : 0
179
+
180
+ # Average duration
181
+ avg_duration = @db.exec("SELECT AVG(duration) FROM step_executions WHERE success = true").first["avg"]
182
+ summary[:average_duration] = avg_duration ? avg_duration.to_f.round(2) : 0
183
+
184
+ # Stuck detections
185
+ stuck_count = @db.exec("SELECT COUNT(*) FROM provider_activities WHERE stuck_detected = true").first["count"].to_i
186
+ summary[:stuck_detections] = stuck_count
187
+
188
+ # Date range
189
+ date_range = @db.exec("SELECT MIN(created_at), MAX(created_at) FROM step_executions").first
190
+ if date_range && date_range["min"]
191
+ summary[:date_range] = {
192
+ start: Time.parse(date_range["min"]),
193
+ end: Time.parse(date_range["max"])
194
+ }
195
+ end
196
+
197
+ summary
198
+ end
199
+
200
+ # Clean up old metrics data
201
+ def cleanup_old_metrics(retention_days = 30)
202
+ ensure_connection
203
+
204
+ cutoff_time = Time.now - (retention_days * 24 * 60 * 60)
205
+
206
+ # Delete old step executions
207
+ deleted_executions = @db.exec_params(
208
+ "DELETE FROM step_executions WHERE created_at < $1 RETURNING id",
209
+ [cutoff_time]
210
+ ).ntuples
211
+
212
+ # Delete old provider activities
213
+ deleted_activities = @db.exec_params(
214
+ "DELETE FROM provider_activities WHERE created_at < $1 RETURNING id",
215
+ [cutoff_time]
216
+ ).ntuples
217
+
218
+ {
219
+ deleted_executions: deleted_executions,
220
+ deleted_activities: deleted_activities,
221
+ cutoff_time: cutoff_time
222
+ }
223
+ end
224
+
225
+ # Export metrics data
226
+ def export_metrics(format = :json)
227
+ ensure_connection
228
+
229
+ case format
230
+ when :json
231
+ {
232
+ step_executions: get_step_statistics(nil, nil, 1000),
233
+ provider_activities: get_provider_activity_statistics(nil, nil, 1000),
234
+ summary: get_metrics_summary,
235
+ recommendations: calculate_timeout_recommendations,
236
+ exported_at: Time.now.iso8601
237
+ }
238
+ when :csv
239
+ # TODO: Implement CSV export
240
+ raise NotImplementedError, "CSV export not yet implemented"
241
+ else
242
+ raise ArgumentError, "Unsupported export format: #{format}"
243
+ end
244
+ end
245
+
246
+ private
247
+
248
+ def default_db_config
249
+ {
250
+ host: ENV["AIDP_DB_HOST"] || "localhost",
251
+ port: ENV["AIDP_DB_PORT"] || 5432,
252
+ dbname: ENV["AIDP_DB_NAME"] || "aidp",
253
+ user: ENV["AIDP_DB_USER"] || ENV["USER"],
254
+ password: ENV["AIDP_DB_PASSWORD"]
255
+ }
256
+ end
257
+
258
+ def ensure_connection
259
+ return if @db
260
+
261
+ @db = PG.connect(@db_config)
262
+ @db.type_map_for_results = PG::BasicTypeMapForResults.new(@db)
263
+ end
264
+
265
+ def ensure_database_exists
266
+ ensure_connection
267
+
268
+ # Create step_executions table if it doesn't exist
269
+ @db.exec(<<~SQL)
270
+ CREATE TABLE IF NOT EXISTS step_executions (
271
+ id SERIAL PRIMARY KEY,
272
+ step_name TEXT NOT NULL,
273
+ provider_name TEXT NOT NULL,
274
+ duration REAL NOT NULL,
275
+ success BOOLEAN NOT NULL,
276
+ metadata JSONB,
277
+ created_at TIMESTAMP WITH TIME ZONE NOT NULL
278
+ )
279
+ SQL
280
+
281
+ # Create provider_activities table if it doesn't exist
282
+ @db.exec(<<~SQL)
283
+ CREATE TABLE IF NOT EXISTS provider_activities (
284
+ id SERIAL PRIMARY KEY,
285
+ provider_name TEXT NOT NULL,
286
+ step_name TEXT NOT NULL,
287
+ start_time TIMESTAMP WITH TIME ZONE,
288
+ end_time TIMESTAMP WITH TIME ZONE,
289
+ duration REAL,
290
+ final_state TEXT,
291
+ stuck_detected BOOLEAN DEFAULT FALSE,
292
+ created_at TIMESTAMP WITH TIME ZONE NOT NULL
293
+ )
294
+ SQL
295
+
296
+ # Create indexes separately
297
+ @db.exec("CREATE INDEX IF NOT EXISTS idx_step_executions_step_name ON step_executions(step_name)")
298
+ @db.exec("CREATE INDEX IF NOT EXISTS idx_step_executions_provider_name ON step_executions(provider_name)")
299
+ @db.exec("CREATE INDEX IF NOT EXISTS idx_step_executions_created_at ON step_executions(created_at)")
300
+ @db.exec("CREATE INDEX IF NOT EXISTS idx_provider_activities_provider_name ON provider_activities(provider_name)")
301
+ @db.exec("CREATE INDEX IF NOT EXISTS idx_provider_activities_step_name ON provider_activities(step_name)")
302
+ @db.exec("CREATE INDEX IF NOT EXISTS idx_provider_activities_created_at ON provider_activities(created_at)")
303
+
304
+ # Create metrics_schema_version table if it doesn't exist
305
+ @db.exec("CREATE TABLE IF NOT EXISTS metrics_schema_version (version INTEGER NOT NULL)")
306
+ @db.exec_params("INSERT INTO metrics_schema_version (version) VALUES ($1) ON CONFLICT DO NOTHING", [SCHEMA_VERSION])
307
+ end
308
+
309
+ def parse_step_execution(row)
310
+ {
311
+ id: row["id"].to_i,
312
+ step_name: row["step_name"],
313
+ provider_name: row["provider_name"],
314
+ duration: row["duration"].to_f,
315
+ success: row["success"],
316
+ metadata: row["metadata"] ? JSON.parse(row["metadata"]) : {},
317
+ created_at: Time.parse(row["created_at"])
318
+ }
319
+ end
320
+
321
+ def parse_provider_activity(row)
322
+ {
323
+ id: row["id"].to_i,
324
+ provider_name: row["provider_name"],
325
+ step_name: row["step_name"],
326
+ start_time: row["start_time"] ? Time.parse(row["start_time"]) : nil,
327
+ end_time: row["end_time"] ? Time.parse(row["end_time"]) : nil,
328
+ duration: row["duration"].to_f,
329
+ final_state: row["final_state"]&.to_sym,
330
+ stuck_detected: row["stuck_detected"],
331
+ created_at: Time.parse(row["created_at"])
332
+ }
333
+ end
334
+ end
335
+ end
336
+ end
@@ -236,12 +236,6 @@ module Aidp
236
236
  index: future_info[:index]
237
237
  }
238
238
  @progress.increment
239
- rescue => e
240
- @errors << {
241
- chunk_id: future_info[:chunk][:id],
242
- error: e.message,
243
- index: future_info[:index]
244
- }
245
239
  end
246
240
 
247
241
  completed_futures
@@ -663,9 +663,6 @@ module Aidp
663
663
  futures = items.map do |item|
664
664
  Concurrent::Future.execute do
665
665
  processor ? processor.call(item) : item
666
- rescue => e
667
- @statistics[:errors] += 1
668
- {error: e.message, item: item}
669
666
  end
670
667
  end
671
668
 
@@ -12,9 +12,9 @@ module Aidp
12
12
  @feature_analyzer = Aidp::Analyze::FeatureAnalyzer.new(project_dir)
13
13
  end
14
14
 
15
- # Generate prioritized analysis recommendations based on Code Maat data
15
+ # Generate prioritized analysis recommendations based on ruby-maat data
16
16
  def generate_prioritized_recommendations
17
- # Get Code Maat analysis data
17
+ # Get ruby-maat analysis data
18
18
  code_maat_data = @code_maat.run_comprehensive_analysis
19
19
 
20
20
  # Get feature analysis data
@@ -264,29 +264,22 @@ module Aidp
264
264
  status: "running"
265
265
  }
266
266
 
267
- begin
268
- # Perform analysis based on chunk type
269
- case chunk[:strategy]
270
- when "time_based"
271
- results[:data] = analyze_time_chunk(chunk, analysis_type, options)
272
- when "commit_count"
273
- results[:data] = analyze_commit_chunk(chunk, analysis_type, options)
274
- when "size_based"
275
- results[:data] = analyze_size_chunk(chunk, analysis_type, options)
276
- when "feature_based"
277
- results[:data] = analyze_feature_chunk(chunk, analysis_type, options)
278
- end
279
-
280
- results[:status] = "completed"
281
- results[:end_time] = Time.now
282
- results[:duration] = results[:end_time] - results[:start_time]
283
- rescue => e
284
- results[:status] = "failed"
285
- results[:error] = e.message
286
- results[:end_time] = Time.now
287
- results[:duration] = results[:end_time] - results[:start_time]
267
+ # Perform analysis based on chunk type
268
+ case chunk[:strategy]
269
+ when "time_based"
270
+ results[:data] = analyze_time_chunk(chunk, analysis_type, options)
271
+ when "commit_count"
272
+ results[:data] = analyze_commit_chunk(chunk, analysis_type, options)
273
+ when "size_based"
274
+ results[:data] = analyze_size_chunk(chunk, analysis_type, options)
275
+ when "feature_based"
276
+ results[:data] = analyze_feature_chunk(chunk, analysis_type, options)
288
277
  end
289
278
 
279
+ results[:status] = "completed"
280
+ results[:end_time] = Time.now
281
+ results[:duration] = results[:end_time] - results[:start_time]
282
+
290
283
  results
291
284
  end
292
285
 
@@ -171,112 +171,16 @@ module Aidp
171
171
  # Write the output to the specified file
172
172
  File.write(output_file, stdout)
173
173
  else
174
- # Fallback to mock implementation if RubyMaat fails
175
- puts "Warning: RubyMaat analysis failed, using mock data. Error: #{stderr}"
176
- mock_ruby_maat_analysis(analysis_type, input_file, output_file)
174
+ # Raise proper error instead of falling back to fake data
175
+ error_msg = "RubyMaat analysis failed for #{analysis_type}: #{stderr.strip}"
176
+ error_msg += "\n\nTo install ruby-maat, run: gem install ruby-maat"
177
+ error_msg += "\nOr add it to your Gemfile: gem 'ruby-maat'"
178
+ raise error_msg
177
179
  end
178
180
 
179
181
  output_file
180
182
  end
181
183
 
182
- def mock_ruby_maat_analysis(analysis_type, input_file, output_file)
183
- # Parse the Git log to generate mock analysis data
184
- git_log_content = File.read(input_file)
185
-
186
- case analysis_type
187
- when "churn"
188
- generate_mock_churn_data(git_log_content, output_file)
189
- when "coupling"
190
- generate_mock_coupling_data(git_log_content, output_file)
191
- when "authorship"
192
- generate_mock_authorship_data(git_log_content, output_file)
193
- when "summary"
194
- generate_mock_summary_data(git_log_content, output_file)
195
- else
196
- raise "Unknown analysis type: #{analysis_type}"
197
- end
198
-
199
- output_file
200
- end
201
-
202
- def generate_mock_churn_data(git_log_content, output_file)
203
- # Extract file names from Git log and generate mock churn data
204
- files = extract_files_from_git_log(git_log_content)
205
-
206
- csv_content = "entity,n-revs,n-lines-added,n-lines-deleted\n"
207
- files.each_with_index do |file, index|
208
- changes = rand(1..20)
209
- additions = rand(0..changes * 10)
210
- deletions = rand(0..changes * 5)
211
- csv_content += "#{file},#{changes},#{additions},#{deletions}\n"
212
- end
213
-
214
- File.write(output_file, csv_content)
215
- end
216
-
217
- def generate_mock_coupling_data(git_log_content, output_file)
218
- # Generate mock coupling data between files
219
- files = extract_files_from_git_log(git_log_content)
220
-
221
- csv_content = "entity,coupled,degree,average-revs\n"
222
- files.each_slice(2) do |file1, file2|
223
- next unless file2
224
-
225
- shared_changes = rand(1..10)
226
- rand(0.1..1.0).round(2)
227
- avg_revs = rand(1..5)
228
- csv_content += "#{file1},#{file2},#{shared_changes},#{avg_revs}\n"
229
- end
230
-
231
- File.write(output_file, csv_content)
232
- end
233
-
234
- def generate_mock_authorship_data(git_log_content, output_file)
235
- # Generate mock authorship data
236
- files = extract_files_from_git_log(git_log_content)
237
- authors = %w[Alice Bob Charlie Diana Eve]
238
-
239
- csv_content = "entity,n-authors,revs\n"
240
- files.each do |file|
241
- author_count = rand(1..3)
242
- file_authors = authors.sample(author_count)
243
- revs = rand(1..15)
244
- csv_content += "#{file},\"#{file_authors.join(";")}\",#{revs}\n"
245
- end
246
-
247
- File.write(output_file, csv_content)
248
- end
249
-
250
- def generate_mock_summary_data(git_log_content, output_file)
251
- # Generate mock summary data
252
- summary_content = <<~SUMMARY
253
- Number of commits: 42
254
- Number of entities: 15
255
- Number of authors: 5
256
- First commit: 2023-01-01
257
- Last commit: 2024-01-01
258
- Total lines added: 1250
259
- Total lines deleted: 450
260
- SUMMARY
261
-
262
- File.write(output_file, summary_content)
263
- end
264
-
265
- def extract_files_from_git_log(git_log_content)
266
- # Extract file names from Git log content
267
- files = []
268
- git_log_content.lines.each do |line|
269
- # Look for lines that contain file paths (not commit info)
270
- next unless line.match?(/\d+\s+\d+\s+[^\s]+$/)
271
-
272
- parts = line.strip.split(/\s+/)
273
- files << parts[2] if parts.length >= 3 && parts[2] != "-"
274
- end
275
-
276
- # Return unique files, limited to a reasonable number
277
- files.uniq.first(20)
278
- end
279
-
280
184
  # Check if repository is large enough to require chunking
281
185
  def large_repository?(git_log_file)
282
186
  return false unless File.exist?(git_log_file)
@@ -477,7 +381,7 @@ module Aidp
477
381
  report_file = File.join(@project_dir, "code_maat_analysis_report.md")
478
382
 
479
383
  report = <<~REPORT
480
- # Code Maat Analysis Report
384
+ # Ruby-maat Analysis Report
481
385
 
482
386
  Generated on: #{Time.now.strftime("%Y-%m-%d %H:%M:%S")}
483
387
  Project: #{File.basename(@project_dir)}