RubyGems - evilution - Versions diffs - 0.33.0 → 0.34.0 - Mend

evilution 0.33.0 → 0.34.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (33) hide show

checksums.yaml +4 -4
data/.beads/interactions.jsonl +16 -0
data/.rubocop_todo.yml +1 -1
data/CHANGELOG.md +14 -0
data/README.md +11 -9
data/docs/isolation.md +31 -2
data/lib/evilution/cli/parser/options_builder.rb +17 -0
data/lib/evilution/config/validators/example_targeting_strategy.rb +22 -0
data/lib/evilution/config.rb +16 -2
data/lib/evilution/coverage/digest.rb +16 -0
data/lib/evilution/coverage/map.rb +64 -0
data/lib/evilution/coverage/map_builder.rb +82 -0
data/lib/evilution/coverage/map_store.rb +87 -0
data/lib/evilution/coverage/recorder.rb +85 -0
data/lib/evilution/coverage.rb +8 -0
data/lib/evilution/coverage_example_filter.rb +41 -0
data/lib/evilution/isolation/fork.rb +38 -76
data/lib/evilution/parallel/work_queue/dispatcher/deadline_tracker.rb +63 -0
data/lib/evilution/parallel/work_queue/dispatcher.rb +7 -34
data/lib/evilution/parallel/work_queue/worker.rb +41 -51
data/lib/evilution/process_supervisor.rb +259 -0
data/lib/evilution/runner/baseline_runner.rb +52 -0
data/lib/evilution/runner/isolation_resolver.rb +106 -12
data/lib/evilution/runner.rb +3 -2
data/lib/evilution/spec_resolver.rb +66 -0
data/lib/evilution/spec_selector.rb +14 -4
data/lib/evilution/version.rb +1 -1
data/lib/evilution.rb +1 -0
data/scripts/canary_manifest.yml +47 -0
data/scripts/compare_targeting +277 -0
data/scripts/compare_targeting.example.yml +24 -0
metadata +15 -3
data/lib/evilution/parallel/work_queue/worker_registry.rb +0 -47

data/scripts/canary_manifest.yml ADDED Viewed

@@ -0,0 +1,47 @@
+# Canary manifest for the EV-7ydn validation run of scripts/compare_targeting.
+#
+#   scripts/compare_targeting scripts/canary_manifest.yml --out .artifacts/targeting_validation.md
+#
+# Each repo is run through evilution three times (full_file / lexical / coverage)
+# over the SAME mutation set; the gate is total lost_kills == 0 (coverage must
+# never lose a kill full-file caught) before the default flips to coverage.
+#
+# `dir:` assumes the EV-rxob canary checkout layout (/tmp/ev-canaries/<repo>,
+# already `bundle install`ed). Adjust to your checkout. Per-repo `args` mirror
+# the EV-rxob R2 findings: repos whose specs are NOT lib-mirrored need an
+# explicit --spec (EV-z7f5 / GH #1325), or auto spec-resolution yields 0.0 and
+# the comparison is meaningless.
+#
+# Start with the R2 infra=none tier that ran clean; extend with the DB-tier
+# repos once their services are up.
+repos:
+  # --- R2 PASS, lib-mirrored specs (auto-resolution works) ---
+  - name: thoughtbot/factory_bot
+    dir: /tmp/ev-canaries/factory_bot
+    args: ["lib", "--jobs", "4"]
+  - name: jnunemaker/httparty
+    dir: /tmp/ev-canaries/httparty
+    args: ["lib", "--jobs", "4"]
+  - name: rubocop/rubocop
+    dir: /tmp/ev-canaries/rubocop
+    args: ["lib", "--jobs", "4"]
+  - name: rack/rack
+    dir: /tmp/ev-canaries/rack
+    args: ["lib", "--jobs", "4"]
+  # --- Non-lib-mirrored specs: explicit --spec required (EV-z7f5 / GH #1325) ---
+  - name: bblimke/webmock
+    dir: /tmp/ev-canaries/webmock
+    args: ["lib", "--spec", "spec/unit", "--jobs", "4"]
+  - name: doorkeeper-gem/doorkeeper
+    dir: /tmp/ev-canaries/doorkeeper
+    args: ["lib", "--spec", "spec", "--jobs", "4"]
+  - name: ruby-concurrency/concurrent-ruby
+    dir: /tmp/ev-canaries/concurrent-ruby
+    args: ["lib", "--spec", "spec", "--jobs", "4"]

data/scripts/compare_targeting ADDED Viewed

@@ -0,0 +1,277 @@
+#!/usr/bin/env ruby
+# frozen_string_literal: true
+# Targeting-mode comparison harness.
+#
+# For each repo in a manifest, runs evilution over the SAME mutation set under
+# three example-targeting modes -- full_file (baseline), lexical (current), and
+# coverage (new) -- joins the per-mutation results, and emits a per-repo table:
+#   score_full / score_lexical / score_coverage,
+#   lost_kills  (mutations full_file KILLED but coverage did NOT -> the gate),
+#   wall_ratio_lexical / wall_ratio_coverage (vs the full_file baseline).
+#
+# The accuracy gate is lost_kills == 0: coverage targeting must never lose a kill
+# the full-file run would catch. Speed is reported, not gated.
+#
+# Usage:
+#   scripts/compare_targeting MANIFEST.yml [--out report.md]
+#
+# MANIFEST.yml:
+#   repos:
+#     - name: acme/foo
+#       dir:  /checkouts/foo        # already bundled
+#       args: ["lib/foo.rb", "--jobs", "4"]
+#
+# The actual canary execution (checkout + bundle over the EV-rxob manifest) is
+# the validation run, EV-7ydn; this harness is the reusable comparison engine.
+require "json"
+require "yaml"
+require "open3"
+require "optparse"
+require "digest"
+# Reusable engine behind scripts/compare_targeting: runs evilution once per
+# example-targeting mode for every manifest repo, joins the per-mutation
+# results, and renders a markdown table ending in the lost_kills gate line.
+module CompareTargeting
+  MODES = %w[full_file lexical coverage].freeze
+  KEY_FIELDS = %w[file line operator].freeze
+  # Keys every manifest entry must carry; Harness#compare_repo fetches all three.
+  REQUIRED_REPO_KEYS = %i[name dir args].freeze
+  # Raised for everything the CLI reports as "Error: ..." with exit status 2:
+  # an unusable manifest, a failed evilution run, or unparseable evilution output.
+  class ConfigError < StandardError; end
+  module_function
+  # Stable per-mutation identity across modes: only TARGETING differs between
+  # runs, so the same mutation has the same file/line/operator (+ diff to
+  # separate distinct mutations sharing a line+operator).
+  #
+  # @param detail [Hash] one per-mutation entry of the JSON report (string keys)
+  # @return [String] "file:line:operator", followed by "#" and the first 8 hex
+  #   characters of the diff's SHA-256 when the entry has a non-empty "diff"
+  def key_for(detail)
+    base = label_for(detail)
+    diff = detail["diff"].to_s
+    diff.empty? ? base : "#{base}##{Digest::SHA256.hexdigest(diff)[0, 8]}"
+  end
+  # The label shown in lost-kill output: file:line:operator (no diff hash).
+  #
+  # @param detail [Hash] one per-mutation entry of the JSON report (string keys)
+  # @return [String]
+  def label_for(detail)
+    KEY_FIELDS.map { |field| detail[field] }.join(":")
+  end
+  # One mode's run, indexed by mutation key.
+  class ModeResult
+    CATEGORIES = %w[killed survived neutral equivalent unresolved unparseable timed_out errors].freeze
+    # Builds a ModeResult from the parsed JSON report.
+    #
+    # Each entry's verdict is read from its own "status" field, not from the
+    # name of the category array it was listed under. When two entries map to
+    # the same key, the first one seen (in CATEGORIES order) wins.
+    #
+    # @param data [Hash] parsed report; missing categories are treated as empty
+    # @return [ModeResult]
+    # @raise [ConfigError] when the report is not a JSON object
+    def self.from_json(data)
+      raise ConfigError, "evilution JSON report must be an object, got #{data.class}" unless data.is_a?(Hash)
+      by_key = {}
+      CATEGORIES.each do |category|
+        Array(data[category]).each do |detail|
+          key = CompareTargeting.key_for(detail)
+          by_key[key] ||= {
+            status: detail["status"],
+            duration: (detail["duration"] || 0.0).to_f,
+            label: CompareTargeting.label_for(detail)
+          }
+        end
+      end
+      new(by_key)
+    end
+    # @param by_key [Hash{String => Hash}] mutation key => { status:, duration:, label: }
+    def initialize(by_key)
+      @by_key = by_key
+    end
+    # @return [Array<String>] every mutation key seen in this run
+    def keys
+      @by_key.keys
+    end
+    # @return [String, nil] the mutation's status, or nil when this run has no such key
+    def status(key)
+      @by_key.dig(key, :status)
+    end
+    # @return [String, nil] the mutation's file:line:operator label, or nil when unknown
+    def label(key)
+      @by_key.dig(key, :label)
+    end
+    # @return [Integer] number of mutations whose status is "killed"
+    def killed_count
+      @by_key.count { |_, value| value[:status] == "killed" }
+    end
+    # Measurable = the run actually observed a verdict: killed or survived.
+    # unresolved/equivalent/errors/unparseable are excluded from the score.
+    def measurable_count
+      @by_key.count { |_, value| %w[killed survived].include?(value[:status]) }
+    end
+    # Sum of the per-mutation "duration" fields. This is accumulated mutation
+    # time as reported in the JSON, not the elapsed wall-clock time of the run.
+    #
+    # @return [Float, Integer] 0 when the run has no mutations
+    def total_duration
+      @by_key.values.sum { |value| value[:duration] }
+    end
+  end
+  # Joins the three modes for one repo and derives the comparison metrics.
+  class Comparison
+    # @param full_file [ModeResult] baseline run
+    # @param lexical [ModeResult]
+    # @param coverage [ModeResult]
+    def initialize(full_file:, lexical:, coverage:)
+      @modes = { "full_file" => full_file, "lexical" => lexical, "coverage" => coverage }
+    end
+    # killed / (killed + survived) for one mode.
+    #
+    # @param mode [String] one of MODES
+    # @return [Float] 0.0 when the mode has no measurable mutations
+    # @raise [KeyError] for an unknown mode
+    def score(mode)
+      result = @modes.fetch(mode)
+      return 0.0 if result.measurable_count.zero?
+      result.killed_count.to_f / result.measurable_count
+    end
+    # Ratio of the mode's summed mutation durations to the full_file baseline's
+    # (see ModeResult#total_duration: summed durations, not elapsed time).
+    #
+    # @param mode [String] one of MODES
+    # @return [Float] 0.0 when the baseline duration is zero
+    # @raise [KeyError] for an unknown mode
+    def wall_ratio(mode)
+      baseline = @modes.fetch("full_file").total_duration
+      return 0.0 if baseline.zero?
+      @modes.fetch(mode).total_duration / baseline
+    end
+    # Mutation labels that full_file KILLED but `mode` failed to kill -- the
+    # lost kills that must be zero before coverage can become the default.
+    # A mutation that is absent from `mode`'s results also counts as lost.
+    #
+    # @param mode [String] one of MODES
+    # @return [Array<String>] file:line:operator labels
+    def lost_kills(mode = "coverage")
+      full = @modes.fetch("full_file")
+      other = @modes.fetch(mode)
+      full.keys.select { |key| full.status(key) == "killed" && other.status(key) != "killed" }
+               .map { |key| full.label(key) }
+    end
+    # @param repo [String] repo name shown in the first column
+    # @return [Hash{Symbol => Object}] one table row keyed by TableReporter::COLUMNS
+    def to_row(repo)
+      {
+        repo: repo,
+        score_full: score("full_file"),
+        score_lexical: score("lexical"),
+        score_coverage: score("coverage"),
+        lost_kills: lost_kills("coverage").size,
+        wall_ratio_lexical: wall_ratio("lexical"),
+        wall_ratio_coverage: wall_ratio("coverage")
+      }
+    end
+  end
+  # Renders the per-repo rows as a markdown table with a PASS/FAIL gate line.
+  class TableReporter
+    COLUMNS = %w[repo score_full score_lexical score_coverage lost_kills
+                 wall_ratio_lexical wall_ratio_coverage].freeze
+    # @param rows [Array<Hash>] rows as produced by Comparison#to_row
+    def initialize(rows)
+      @rows = rows
+    end
+    # @return [String] header, separator, one line per row, a blank line and the
+    #   gate line, joined with "\n" (no trailing newline)
+    def to_markdown
+      (table_lines + ["", gate_line]).join("\n")
+    end
+    private
+    def table_lines
+      [header_row, separator_row, *@rows.map { |row| data_row(row) }]
+    end
+    def header_row
+      "| #{COLUMNS.join(" | ")} |"
+    end
+    def separator_row
+      "| #{COLUMNS.map { "---" }.join(" | ")} |"
+    end
+    def data_row(row)
+      "| #{COLUMNS.map { |col| format_cell(row[col.to_sym]) }.join(" | ")} |"
+    end
+    # PASS only when no repo lost a kill; an empty row list therefore also passes.
+    def gate_line
+      total_lost = @rows.sum { |row| row[:lost_kills] }
+      gate = total_lost.zero? ? "PASS" : "FAIL"
+      "GATE (total lost_kills == 0): #{gate} (#{total_lost} lost kills across #{@rows.size} repos)"
+    end
+    # Floats are shown with three decimals; everything else via to_s.
+    def format_cell(value)
+      value.is_a?(Float) ? format("%.3f", value) : value.to_s
+    end
+  end
+  # Runs evilution for one (repo, mode) and parses the JSON into a ModeResult.
+  # command_runner is injected so the pure pipeline is testable without a real
+  # mutation run.
+  class ModeRunner
+    # Run the inner `bundle exec evilution` in the TARGET repo's bundler context.
+    # If this harness is itself launched under `bundle exec`, Bundler exports
+    # BUNDLE_GEMFILE/RUBYOPT into the child, which would make the inner bundle
+    # resolve against evilution's Gemfile instead of the target repo's. Strip
+    # that inherited bundler env first.
+    #
+    # Spawn failures (missing repo dir, `bundle` not on PATH, ...) are reported
+    # as ConfigError so the CLI prints a one-line error instead of a backtrace.
+    # NOTE(review): any non-zero exit is treated as a failed run; this assumes
+    # evilution exits 0 when mutations merely survive -- confirm.
+    DEFAULT_RUNNER = lambda do |cmd, dir|
+      stdout, stderr, status =
+        if defined?(Bundler)
+          Bundler.with_unbundled_env { Open3.capture3(*cmd, chdir: dir) }
+        else
+          Open3.capture3(*cmd, chdir: dir)
+        end
+      raise ConfigError, "evilution failed in #{dir}: #{stderr}" unless status.success?
+      stdout
+    rescue SystemCallError => e
+      raise ConfigError, "could not run #{cmd.first} in #{dir}: #{e.message}"
+    end
+    # @param command_runner [#call] called as (cmd, dir); returns the JSON text
+    def initialize(command_runner: DEFAULT_RUNNER)
+      @command_runner = command_runner
+    end
+    # @param repo_dir [String] checkout to run in
+    # @param evilution_args [Array] extra CLI arguments; each is stringified, so
+    #   unquoted YAML scalars such as 4 are accepted
+    # @param mode [String] one of MODES
+    # @return [ModeResult]
+    # @raise [ConfigError] when the runner's output is not valid JSON or not a
+    #   JSON object (plus whatever the injected runner raises)
+    def run(repo_dir:, evilution_args:, mode:)
+      cmd = ["bundle", "exec", "evilution", *Array(evilution_args).map(&:to_s),
+             "--example-targeting", mode, "--format", "json"]
+      json = @command_runner.call(cmd, repo_dir)
+      ModeResult.from_json(JSON.parse(json))
+    rescue JSON::ParserError => e
+      # Parser messages can embed the whole payload; keep the error readable.
+      raise ConfigError, "evilution did not emit valid JSON in #{repo_dir} (#{mode}): #{e.message[0, 200]}"
+    end
+  end
+  # Drives the manifest: every repo through every mode, then the table.
+  class Harness
+    # @param mode_runner [#run] object responding to run(repo_dir:, evilution_args:, mode:)
+    def initialize(mode_runner: ModeRunner.new)
+      @mode_runner = mode_runner
+    end
+    # @param repos [Array<Hash>] manifest entries with :name, :dir and :args
+    # @return [String] the markdown report
+    def call(repos)
+      rows = repos.map { |repo| compare_repo(repo) }
+      TableReporter.new(rows).to_markdown
+    end
+    # Runs one repo through every mode in MODES order and returns its table row.
+    #
+    # @param repo [Hash] manifest entry with :name, :dir and :args
+    # @return [Hash] see Comparison#to_row
+    # @raise [KeyError] when the entry lacks one of the three keys
+    def compare_repo(repo)
+      results = MODES.to_h do |mode|
+        [mode, @mode_runner.run(repo_dir: repo.fetch(:dir), evilution_args: repo.fetch(:args), mode: mode)]
+      end
+      Comparison.new(**results.transform_keys(&:to_sym)).to_row(repo.fetch(:name))
+    end
+  end
+  # Loads and validates the manifest so that a malformed entry is reported
+  # before any mutation run starts.
+  #
+  # @param path [String] path to the YAML manifest
+  # @return [Array<Hash>] the repos list with symbolized keys
+  # @raise [ConfigError] when the file is missing or unreadable, is not valid or
+  #   safe-loadable YAML, has no repos: list, or an entry lacks name/dir/args
+  def load_manifest(path)
+    data = YAML.safe_load_file(path, symbolize_names: true)
+    raise ConfigError, "manifest must list repos:" unless data.is_a?(Hash) && data[:repos].is_a?(Array)
+    data[:repos].each_with_index { |repo, index| validate_repo(repo, index) }
+    data[:repos]
+  rescue Errno::ENOENT
+    raise ConfigError, "manifest not found: #{path}"
+  rescue SystemCallError => e
+    raise ConfigError, "manifest could not be read: #{e.message}"
+  rescue Psych::SyntaxError => e
+    raise ConfigError, "manifest is not valid YAML: #{e.message}"
+  rescue Psych::Exception => e
+    # e.g. Psych::DisallowedClass / Psych::BadAlias raised by safe loading.
+    raise ConfigError, "manifest uses unsupported YAML: #{e.message}"
+  end
+  # Checks that one manifest entry is a mapping carrying REQUIRED_REPO_KEYS.
+  #
+  # @param repo [Object] the entry as loaded from YAML
+  # @param index [Integer] zero-based position, used in the error message
+  # @return [nil]
+  # @raise [ConfigError] when the entry is not a mapping or lacks a required key
+  def validate_repo(repo, index)
+    raise ConfigError, "repos[#{index}] must be a mapping with name, dir and args" unless repo.is_a?(Hash)
+    missing = REQUIRED_REPO_KEYS.reject { |key| repo.key?(key) }
+    raise ConfigError, "repos[#{index}] is missing: #{missing.join(", ")}" unless missing.empty?
+  end
+end
+# CLI entry point. Exit status: 0 once the report has been written (whether the
+# gate line says PASS or FAIL), 2 for usage errors, manifest/run errors, or an
+# unwritable --out path.
+if __FILE__ == $PROGRAM_NAME
+  require "fileutils"
+  out_path = nil
+  parser = OptionParser.new do |opts|
+    opts.banner = "Usage: scripts/compare_targeting MANIFEST.yml [--out report.md]"
+    opts.on("--out PATH", "Write the markdown report to PATH (default: stdout)") { |path| out_path = path }
+  end
+  begin
+    parser.parse!
+  rescue OptionParser::ParseError => e
+    # Unknown flag or --out without a value: usage error, not a backtrace.
+    warn "Error: #{e.message}"
+    warn parser.banner
+    exit 2
+  end
+  manifest_path = ARGV.first
+  unless manifest_path
+    warn parser.banner
+    exit 2
+  end
+  begin
+    repos = CompareTargeting.load_manifest(manifest_path)
+    # Create the report directory BEFORE the mutation runs, so a missing
+    # directory fails fast instead of discarding a finished comparison.
+    FileUtils.mkdir_p(File.dirname(out_path)) if out_path
+    report = CompareTargeting::Harness.new.call(repos)
+    if out_path
+      begin
+        # Trailing newline keeps the file identical to what `puts` prints.
+        File.write(out_path, "#{report}\n")
+      rescue SystemCallError => e
+        # Do not lose the finished report: fall back to stdout.
+        warn "Error: could not write #{out_path}: #{e.message}"
+        puts(report)
+        exit 2
+      end
+    else
+      puts(report)
+    end
+    exit 0
+  rescue CompareTargeting::ConfigError => e
+    warn "Error: #{e.message}"
+    exit 2
+  rescue SystemCallError => e
+    # Raised by FileUtils.mkdir_p when the --out directory cannot be created.
+    warn "Error: #{e.message}"
+    exit 2
+  end
+end

data/scripts/compare_targeting.example.yml ADDED Viewed

@@ -0,0 +1,24 @@
+# Example manifest for scripts/compare_targeting (EV-51d4).
+#
+# Each repo is run through evilution three times -- once per example-targeting
+# mode (full_file, lexical, coverage) -- over the SAME mutation set, and the
+# harness emits a per-repo table with the lost_kills gate and wall-time ratios.
+#
+# Repos must already be checked out and `bundle install`ed; the harness only
+# runs evilution inside them. The real EV-rxob canary list is wired up in the
+# validation run (EV-7ydn).
+#
+#   scripts/compare_targeting scripts/compare_targeting.example.yml --out report.md
+repos:
+  - name: thoughtbot/factory_bot
+    dir: /tmp/ev-canaries/factory_bot
+    args: ["lib", "--jobs", "4"]
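+  # webmock's specs are not lib-mirrored, so it needs an explicit --spec
+  # (EV-z7f5 / GH #1325); without it auto spec-resolution yields 0.0.
+  - name: bblimke/webmock
+    dir: /tmp/ev-canaries/webmock
+    args: ["lib", "--spec", "spec/unit", "--jobs", "4"]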
+  - name: rack/rack
+    dir: /tmp/ev-canaries/rack
+    args: ["lib", "--jobs", "4"]

metadata CHANGED Viewed

@@ -1,14 +1,14 @@
 --- !ruby/object:Gem::Specification
 name: evilution
 version: !ruby/object:Gem::Version
-  version: 0.33.0
+  version: 0.34.0
 platform: ruby
 authors:
 - Denis Kiselev
 autorequire:
 bindir: exe
 cert_chain: []
-date: 2026-06-07 00:00:00.000000000 Z
+date: 2026-06-16 00:00:00.000000000 Z
 dependencies:
 - !ruby/object:Gem::Dependency
   name: diff-lcs
@@ -180,6 +180,7 @@ files:
 - lib/evilution/config/validators/base.rb
 - lib/evilution/config/validators/example_targeting_cache.rb
 - lib/evilution/config/validators/example_targeting_fallback.rb
+- lib/evilution/config/validators/example_targeting_strategy.rb
 - lib/evilution/config/validators/fail_fast.rb
 - lib/evilution/config/validators/hooks.rb
 - lib/evilution/config/validators/ignore_patterns.rb
@@ -190,6 +191,13 @@ files:
 - lib/evilution/config/validators/profile.rb
 - lib/evilution/config/validators/spec_mappings.rb
 - lib/evilution/config/validators/spec_pattern.rb
+- lib/evilution/coverage.rb
+- lib/evilution/coverage/digest.rb
+- lib/evilution/coverage/map.rb
+- lib/evilution/coverage/map_builder.rb
+- lib/evilution/coverage/map_store.rb
+- lib/evilution/coverage/recorder.rb
+- lib/evilution/coverage_example_filter.rb
 - lib/evilution/disable_comment.rb
 - lib/evilution/equivalent.rb
 - lib/evilution/equivalent/detector.rb
@@ -368,16 +376,17 @@ files:
 - lib/evilution/parallel/work_queue/channel/frame.rb
 - lib/evilution/parallel/work_queue/collection_state.rb
 - lib/evilution/parallel/work_queue/dispatcher.rb
+- lib/evilution/parallel/work_queue/dispatcher/deadline_tracker.rb
 - lib/evilution/parallel/work_queue/validators.rb
 - lib/evilution/parallel/work_queue/validators/optional_positive_int.rb
 - lib/evilution/parallel/work_queue/validators/optional_positive_number.rb
 - lib/evilution/parallel/work_queue/validators/positive_int.rb
 - lib/evilution/parallel/work_queue/worker.rb
 - lib/evilution/parallel/work_queue/worker/loop.rb
-- lib/evilution/parallel/work_queue/worker_registry.rb
 - lib/evilution/parallel/work_queue/worker_stat.rb
 - lib/evilution/parallel_db_warning.rb
 - lib/evilution/process_cleanup.rb
+- lib/evilution/process_supervisor.rb
 - lib/evilution/rails_detector.rb
 - lib/evilution/related_spec_heuristic.rb
 - lib/evilution/reporter.rb
@@ -497,8 +506,11 @@ files:
 - script/run_self_validation
 - scripts/benchmark_density
 - scripts/benchmark_density.yml
+- scripts/canary_manifest.yml
 - scripts/compare_mutations
 - scripts/compare_mutations.yml
+- scripts/compare_targeting
+- scripts/compare_targeting.example.yml
 - scripts/mutant_json_adapter
 - sig/evilution.rbs
 homepage: https://github.com/marinazzio/evilution

data/lib/evilution/parallel/work_queue/worker_registry.rb DELETED Viewed

@@ -1,47 +0,0 @@
-# frozen_string_literal: true
-require_relative "../work_queue"
-# Process-global registry of live worker process-group ids (pgids).
-#
-# EV-jwao / GH #1332: EV-cnx8 made each Worker its own process-group leader so a
-# stuck worker's whole subtree can be group-killed. Side effect: a terminal
-# Ctrl-C delivers SIGINT only to the parent's foreground group, so workers (now
-# in their own groups) no longer receive it -- and the parent's fatal-signal
-# death skips work_queue#map's `ensure cleanup_workers`, leaking any worker that
-# was actively running a (possibly blocking) mutation at interrupt time.
-#
-# Runner#install_signal_handler reads this registry from inside the trap and
-# forwards INT/TERM to each worker group before re-raising to DEFAULT.
-#
-# Signal-safety: under MRI a trap handler runs on the main thread between VM
-# instructions, so it must not acquire a Mutex (the main thread may hold it ->
-# deadlock). register/unregister therefore swap @pgids for a freshly built
-# frozen array via a single atomic reference assignment (copy-on-write). The
-# trap reads the current reference once and iterates that complete, immutable
-# snapshot -- no torn reads, no lock.
-module Evilution::Parallel::WorkQueue::WorkerRegistry
-  @pgids = [].freeze
-  class << self
-    # Frozen snapshot. Safe to read from a signal handler.
-    attr_reader :pgids
-    def register(pgid)
-      @pgids = (@pgids + [pgid]).freeze
-    end
-    def unregister(pgid)
-      @pgids = @pgids.reject { |existing| existing == pgid }.freeze
-    end
-    def signal_all(sig)
-      @pgids.each do |pgid|
-        Process.kill(sig, -pgid)
-      rescue Errno::ESRCH
-        # Group already gone (worker + subtree reaped) -- nothing to signal.
-        nil
-      end
-    end
-  end
-end