evilution 0.33.0 → 0.34.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -0,0 +1,47 @@
1
+ # Canary manifest for the EV-7ydn validation run of scripts/compare_targeting.
2
+ #
3
+ # scripts/compare_targeting scripts/canary_manifest.yml --out .artifacts/targeting_validation.md
4
+ #
5
+ # Each repo is run through evilution three times (full_file / lexical / coverage)
6
+ # over the SAME mutation set; the gate is total lost_kills == 0 (coverage must
7
+ # never lose a kill full-file caught) before the default flips to coverage.
8
+ #
9
+ # `dir:` assumes the EV-rxob canary checkout layout (/tmp/ev-canaries/<repo>,
10
+ # already `bundle install`ed). Adjust to your checkout. Per-repo `args` mirror
11
+ # the EV-rxob R2 findings: repos whose specs are NOT lib-mirrored need an
12
+ # explicit --spec (EV-z7f5 / GH #1325), or auto spec-resolution yields 0.0 and
13
+ # the comparison is meaningless.
14
+ #
15
+ # Start with the R2 infra=none tier that ran clean; extend with the DB-tier
16
+ # repos once their services are up.
17
+
18
+ repos:
19
+ # --- R2 PASS, lib-mirrored specs (auto-resolution works) ---
20
+ - name: thoughtbot/factory_bot
21
+ dir: /tmp/ev-canaries/factory_bot
22
+ args: ["lib", "--jobs", "4"]
23
+
24
+ - name: jnunemaker/httparty
25
+ dir: /tmp/ev-canaries/httparty
26
+ args: ["lib", "--jobs", "4"]
27
+
28
+ - name: rubocop/rubocop
29
+ dir: /tmp/ev-canaries/rubocop
30
+ args: ["lib", "--jobs", "4"]
31
+
32
+ - name: rack/rack
33
+ dir: /tmp/ev-canaries/rack
34
+ args: ["lib", "--jobs", "4"]
35
+
36
+ # --- Non-lib-mirrored specs: explicit --spec required (EV-z7f5 / GH #1325) ---
37
+ - name: bblimke/webmock
38
+ dir: /tmp/ev-canaries/webmock
39
+ args: ["lib", "--spec", "spec/unit", "--jobs", "4"]
40
+
41
+ - name: doorkeeper-gem/doorkeeper
42
+ dir: /tmp/ev-canaries/doorkeeper
43
+ args: ["lib", "--spec", "spec", "--jobs", "4"]
44
+
45
+ - name: ruby-concurrency/concurrent-ruby
46
+ dir: /tmp/ev-canaries/concurrent-ruby
47
+ args: ["lib", "--spec", "spec", "--jobs", "4"]
@@ -0,0 +1,277 @@
1
+ #!/usr/bin/env ruby
2
+ # frozen_string_literal: true
3
+
4
+ # Targeting-mode comparison harness.
5
+ #
6
+ # For each repo in a manifest, runs evilution over the SAME mutation set under
7
+ # three example-targeting modes -- full_file (baseline), lexical (current), and
8
+ # coverage (new) -- joins the per-mutation results, and emits a per-repo table:
9
+ # score_full / score_lexical / score_coverage,
10
+ # lost_kills (mutations full_file KILLED but coverage did NOT -> the gate),
11
+ # wall_ratio_lexical / wall_ratio_coverage (vs the full_file baseline).
12
+ #
13
+ # The accuracy gate is lost_kills == 0: coverage targeting must never lose a kill
14
+ # the full-file run would catch. Speed is reported, not gated.
15
+ #
16
+ # Usage:
17
+ # scripts/compare_targeting MANIFEST.yml [--out report.md]
18
+ #
19
+ # MANIFEST.yml:
20
+ # repos:
21
+ # - name: acme/foo
22
+ # dir: /checkouts/foo # already bundled
23
+ # args: ["lib/foo.rb", "--jobs", "4"]
24
+ #
25
+ # The actual canary execution (checkout + bundle over the EV-rxob manifest) is
26
+ # the validation run, EV-7ydn; this harness is the reusable comparison engine.
27
+
28
+ require "json"
29
+ require "yaml"
30
+ require "open3"
31
+ require "optparse"
32
+ require "digest"
33
+
34
+ module CompareTargeting
35
+ MODES = %w[full_file lexical coverage].freeze
36
+ KEY_FIELDS = %w[file line operator].freeze
37
+
38
+ class ConfigError < StandardError; end
39
+
40
+ module_function
41
+
42
+ # Stable per-mutation identity across modes: only TARGETING differs between
43
+ # runs, so the same mutation has the same file/line/operator (+ diff to
44
+ # separate distinct mutations sharing a line+operator).
45
+ def key_for(detail)
46
+ base = KEY_FIELDS.map { |field| detail[field] }.join(":")
47
+ digest = detail["diff"].to_s
48
+ digest.empty? ? base : "#{base}##{Digest::SHA256.hexdigest(digest)[0, 8]}"
49
+ end
50
+
51
+ # The label shown in lost-kill output: file:line:operator (no diff hash).
52
+ def label_for(detail)
53
+ KEY_FIELDS.map { |field| detail[field] }.join(":")
54
+ end
55
+
56
+ # One mode's run, indexed by mutation key.
57
+ class ModeResult
58
+ CATEGORIES = %w[killed survived neutral equivalent unresolved unparseable timed_out errors].freeze
59
+
60
+ def self.from_json(data)
61
+ by_key = {}
62
+ CATEGORIES.each do |category|
63
+ Array(data[category]).each do |detail|
64
+ key = CompareTargeting.key_for(detail)
65
+ by_key[key] ||= {
66
+ status: detail["status"],
67
+ duration: (detail["duration"] || 0.0).to_f,
68
+ label: CompareTargeting.label_for(detail)
69
+ }
70
+ end
71
+ end
72
+ new(by_key)
73
+ end
74
+
75
+ def initialize(by_key)
76
+ @by_key = by_key
77
+ end
78
+
79
+ def keys
80
+ @by_key.keys
81
+ end
82
+
83
+ def status(key)
84
+ @by_key.dig(key, :status)
85
+ end
86
+
87
+ def label(key)
88
+ @by_key.dig(key, :label)
89
+ end
90
+
91
+ def killed_count
92
+ @by_key.count { |_, value| value[:status] == "killed" }
93
+ end
94
+
95
+ # Measurable = the run actually observed a verdict: killed or survived.
96
+ # unresolved/equivalent/errors/unparseable are excluded from the score.
97
+ def measurable_count
98
+ @by_key.count { |_, value| %w[killed survived].include?(value[:status]) }
99
+ end
100
+
101
+ def total_duration
102
+ @by_key.values.sum { |value| value[:duration] }
103
+ end
104
+ end
105
+
106
+ # Joins the three modes for one repo and derives the comparison metrics.
107
+ class Comparison
108
+ def initialize(full_file:, lexical:, coverage:)
109
+ @modes = { "full_file" => full_file, "lexical" => lexical, "coverage" => coverage }
110
+ end
111
+
112
+ def score(mode)
113
+ result = @modes.fetch(mode)
114
+ return 0.0 if result.measurable_count.zero?
115
+
116
+ result.killed_count.to_f / result.measurable_count
117
+ end
118
+
119
+ def wall_ratio(mode)
120
+ baseline = @modes.fetch("full_file").total_duration
121
+ return 0.0 if baseline.zero?
122
+
123
+ @modes.fetch(mode).total_duration / baseline
124
+ end
125
+
126
+ # Mutation labels that full_file KILLED but `mode` failed to kill -- the
127
+ # lost kills that must be zero before coverage can become the default.
128
+ def lost_kills(mode = "coverage")
129
+ full = @modes.fetch("full_file")
130
+ other = @modes.fetch(mode)
131
+ full.keys.select { |key| full.status(key) == "killed" && other.status(key) != "killed" }
132
+ .map { |key| full.label(key) }
133
+ end
134
+
135
+ def to_row(repo)
136
+ {
137
+ repo: repo,
138
+ score_full: score("full_file"),
139
+ score_lexical: score("lexical"),
140
+ score_coverage: score("coverage"),
141
+ lost_kills: lost_kills("coverage").size,
142
+ wall_ratio_lexical: wall_ratio("lexical"),
143
+ wall_ratio_coverage: wall_ratio("coverage")
144
+ }
145
+ end
146
+ end
147
+
148
+ # Renders the per-repo rows as a markdown table with a PASS/FAIL gate line.
149
+ class TableReporter
150
+ COLUMNS = %w[repo score_full score_lexical score_coverage lost_kills
151
+ wall_ratio_lexical wall_ratio_coverage].freeze
152
+
153
+ def initialize(rows)
154
+ @rows = rows
155
+ end
156
+
157
+ def to_markdown
158
+ (table_lines + ["", gate_line]).join("\n")
159
+ end
160
+
161
+ private
162
+
163
+ def table_lines
164
+ [header_row, separator_row, *@rows.map { |row| data_row(row) }]
165
+ end
166
+
167
+ def header_row
168
+ "| #{COLUMNS.join(" | ")} |"
169
+ end
170
+
171
+ def separator_row
172
+ "| #{COLUMNS.map { "---" }.join(" | ")} |"
173
+ end
174
+
175
+ def data_row(row)
176
+ "| #{COLUMNS.map { |col| format_cell(row[col.to_sym]) }.join(" | ")} |"
177
+ end
178
+
179
+ def gate_line
180
+ total_lost = @rows.sum { |row| row[:lost_kills] }
181
+ gate = total_lost.zero? ? "PASS" : "FAIL"
182
+ "GATE (total lost_kills == 0): #{gate} (#{total_lost} lost kills across #{@rows.size} repos)"
183
+ end
184
+
185
+ def format_cell(value)
186
+ value.is_a?(Float) ? format("%.3f", value) : value.to_s
187
+ end
188
+ end
189
+
190
+ # Runs evilution for one (repo, mode) and parses the JSON into a ModeResult.
191
+ # command_runner is injected so the pure pipeline is testable without a real
192
+ # mutation run.
193
+ class ModeRunner
194
+ # Run the inner `bundle exec evilution` in the TARGET repo's bundler context.
195
+ # If this harness is itself launched under `bundle exec`, Bundler exports
196
+ # BUNDLE_GEMFILE/RUBYOPT into the child, which would make the inner bundle
197
+ # resolve against evilution's Gemfile instead of the target repo's. Strip
198
+ # that inherited bundler env first.
199
+ DEFAULT_RUNNER = lambda do |cmd, dir|
200
+ stdout, stderr, status =
201
+ if defined?(Bundler)
202
+ Bundler.with_unbundled_env { Open3.capture3(*cmd, chdir: dir) }
203
+ else
204
+ Open3.capture3(*cmd, chdir: dir)
205
+ end
206
+ raise ConfigError, "evilution failed in #{dir}: #{stderr}" unless status.success?
207
+
208
+ stdout
209
+ end
210
+
211
+ def initialize(command_runner: DEFAULT_RUNNER)
212
+ @command_runner = command_runner
213
+ end
214
+
215
+ def run(repo_dir:, evilution_args:, mode:)
216
+ cmd = ["bundle", "exec", "evilution", *evilution_args,
217
+ "--example-targeting", mode, "--format", "json"]
218
+ json = @command_runner.call(cmd, repo_dir)
219
+ ModeResult.from_json(JSON.parse(json))
220
+ end
221
+ end
222
+
223
+ # Drives the manifest: every repo through every mode, then the table.
224
+ class Harness
225
+ def initialize(mode_runner: ModeRunner.new)
226
+ @mode_runner = mode_runner
227
+ end
228
+
229
+ def call(repos)
230
+ rows = repos.map { |repo| compare_repo(repo) }
231
+ TableReporter.new(rows).to_markdown
232
+ end
233
+
234
+ def compare_repo(repo)
235
+ results = MODES.to_h do |mode|
236
+ [mode, @mode_runner.run(repo_dir: repo.fetch(:dir), evilution_args: repo.fetch(:args), mode: mode)]
237
+ end
238
+ Comparison.new(**results.transform_keys(&:to_sym)).to_row(repo.fetch(:name))
239
+ end
240
+ end
241
+
242
+ def load_manifest(path)
243
+ data = YAML.safe_load_file(path, symbolize_names: true)
244
+ raise ConfigError, "manifest must list repos:" unless data.is_a?(Hash) && data[:repos].is_a?(Array)
245
+
246
+ data[:repos]
247
+ rescue Errno::ENOENT
248
+ raise ConfigError, "manifest not found: #{path}"
249
+ rescue Psych::SyntaxError => e
250
+ raise ConfigError, "manifest is not valid YAML: #{e.message}"
251
+ end
252
+ end
253
+
254
+ if __FILE__ == $PROGRAM_NAME
255
+ out_path = nil
256
+ parser = OptionParser.new do |opts|
257
+ opts.banner = "Usage: scripts/compare_targeting MANIFEST.yml [--out report.md]"
258
+ opts.on("--out PATH", "Write the markdown report to PATH (default: stdout)") { |p| out_path = p }
259
+ end
260
+ parser.parse!
261
+
262
+ manifest_path = ARGV.first
263
+ unless manifest_path
264
+ warn parser.banner
265
+ exit 2
266
+ end
267
+
268
+ begin
269
+ repos = CompareTargeting.load_manifest(manifest_path)
270
+ report = CompareTargeting::Harness.new.call(repos)
271
+ out_path ? File.write(out_path, report) : puts(report)
272
+ exit 0
273
+ rescue CompareTargeting::ConfigError => e
274
+ warn "Error: #{e.message}"
275
+ exit 2
276
+ end
277
+ end
@@ -0,0 +1,24 @@
1
+ # Example manifest for scripts/compare_targeting (EV-51d4).
2
+ #
3
+ # Each repo is run through evilution three times -- once per example-targeting
4
+ # mode (full_file, lexical, coverage) -- over the SAME mutation set, and the
5
+ # harness emits a per-repo table with the lost_kills gate and wall-time ratios.
6
+ #
7
+ # Repos must already be checked out and `bundle install`ed; the harness only
8
+ # runs evilution inside them. The real EV-rxob canary list is wired up in the
9
+ # validation run (EV-7ydn).
10
+ #
11
+ # scripts/compare_targeting scripts/compare_targeting.example.yml --out report.md
12
+
13
+ repos:
14
+ - name: thoughtbot/factory_bot
15
+ dir: /tmp/ev-canaries/factory_bot
16
+ args: ["lib", "--jobs", "4"]
17
+
18
+ - name: bblimke/webmock
19
+ dir: /tmp/ev-canaries/webmock
20
+ args: ["lib", "--jobs", "4"]
21
+
22
+ - name: rack/rack
23
+ dir: /tmp/ev-canaries/rack
24
+ args: ["lib", "--jobs", "4"]
metadata CHANGED
@@ -1,14 +1,14 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: evilution
3
3
  version: !ruby/object:Gem::Version
4
- version: 0.33.0
4
+ version: 0.34.0
5
5
  platform: ruby
6
6
  authors:
7
7
  - Denis Kiselev
8
8
  autorequire:
9
9
  bindir: exe
10
10
  cert_chain: []
11
- date: 2026-06-07 00:00:00.000000000 Z
11
+ date: 2026-06-16 00:00:00.000000000 Z
12
12
  dependencies:
13
13
  - !ruby/object:Gem::Dependency
14
14
  name: diff-lcs
@@ -180,6 +180,7 @@ files:
180
180
  - lib/evilution/config/validators/base.rb
181
181
  - lib/evilution/config/validators/example_targeting_cache.rb
182
182
  - lib/evilution/config/validators/example_targeting_fallback.rb
183
+ - lib/evilution/config/validators/example_targeting_strategy.rb
183
184
  - lib/evilution/config/validators/fail_fast.rb
184
185
  - lib/evilution/config/validators/hooks.rb
185
186
  - lib/evilution/config/validators/ignore_patterns.rb
@@ -190,6 +191,13 @@ files:
190
191
  - lib/evilution/config/validators/profile.rb
191
192
  - lib/evilution/config/validators/spec_mappings.rb
192
193
  - lib/evilution/config/validators/spec_pattern.rb
194
+ - lib/evilution/coverage.rb
195
+ - lib/evilution/coverage/digest.rb
196
+ - lib/evilution/coverage/map.rb
197
+ - lib/evilution/coverage/map_builder.rb
198
+ - lib/evilution/coverage/map_store.rb
199
+ - lib/evilution/coverage/recorder.rb
200
+ - lib/evilution/coverage_example_filter.rb
193
201
  - lib/evilution/disable_comment.rb
194
202
  - lib/evilution/equivalent.rb
195
203
  - lib/evilution/equivalent/detector.rb
@@ -368,16 +376,17 @@ files:
368
376
  - lib/evilution/parallel/work_queue/channel/frame.rb
369
377
  - lib/evilution/parallel/work_queue/collection_state.rb
370
378
  - lib/evilution/parallel/work_queue/dispatcher.rb
379
+ - lib/evilution/parallel/work_queue/dispatcher/deadline_tracker.rb
371
380
  - lib/evilution/parallel/work_queue/validators.rb
372
381
  - lib/evilution/parallel/work_queue/validators/optional_positive_int.rb
373
382
  - lib/evilution/parallel/work_queue/validators/optional_positive_number.rb
374
383
  - lib/evilution/parallel/work_queue/validators/positive_int.rb
375
384
  - lib/evilution/parallel/work_queue/worker.rb
376
385
  - lib/evilution/parallel/work_queue/worker/loop.rb
377
- - lib/evilution/parallel/work_queue/worker_registry.rb
378
386
  - lib/evilution/parallel/work_queue/worker_stat.rb
379
387
  - lib/evilution/parallel_db_warning.rb
380
388
  - lib/evilution/process_cleanup.rb
389
+ - lib/evilution/process_supervisor.rb
381
390
  - lib/evilution/rails_detector.rb
382
391
  - lib/evilution/related_spec_heuristic.rb
383
392
  - lib/evilution/reporter.rb
@@ -497,8 +506,11 @@ files:
497
506
  - script/run_self_validation
498
507
  - scripts/benchmark_density
499
508
  - scripts/benchmark_density.yml
509
+ - scripts/canary_manifest.yml
500
510
  - scripts/compare_mutations
501
511
  - scripts/compare_mutations.yml
512
+ - scripts/compare_targeting
513
+ - scripts/compare_targeting.example.yml
502
514
  - scripts/mutant_json_adapter
503
515
  - sig/evilution.rbs
504
516
  homepage: https://github.com/marinazzio/evilution
@@ -1,47 +0,0 @@
1
- # frozen_string_literal: true
2
-
3
- require_relative "../work_queue"
4
-
5
- # Process-global registry of live worker process-group ids (pgids).
6
- #
7
- # EV-jwao / GH #1332: EV-cnx8 made each Worker its own process-group leader so a
8
- # stuck worker's whole subtree can be group-killed. Side effect: a terminal
9
- # Ctrl-C delivers SIGINT only to the parent's foreground group, so workers (now
10
- # in their own groups) no longer receive it -- and the parent's fatal-signal
11
- # death skips work_queue#map's `ensure cleanup_workers`, leaking any worker that
12
- # was actively running a (possibly blocking) mutation at interrupt time.
13
- #
14
- # Runner#install_signal_handler reads this registry from inside the trap and
15
- # forwards INT/TERM to each worker group before re-raising to DEFAULT.
16
- #
17
- # Signal-safety: under MRI a trap handler runs on the main thread between VM
18
- # instructions, so it must not acquire a Mutex (the main thread may hold it ->
19
- # deadlock). register/unregister therefore swap @pgids for a freshly built
20
- # frozen array via a single atomic reference assignment (copy-on-write). The
21
- # trap reads the current reference once and iterates that complete, immutable
22
- # snapshot -- no torn reads, no lock.
23
- module Evilution::Parallel::WorkQueue::WorkerRegistry
24
- @pgids = [].freeze
25
-
26
- class << self
27
- # Frozen snapshot. Safe to read from a signal handler.
28
- attr_reader :pgids
29
-
30
- def register(pgid)
31
- @pgids = (@pgids + [pgid]).freeze
32
- end
33
-
34
- def unregister(pgid)
35
- @pgids = @pgids.reject { |existing| existing == pgid }.freeze
36
- end
37
-
38
- def signal_all(sig)
39
- @pgids.each do |pgid|
40
- Process.kill(sig, -pgid)
41
- rescue Errno::ESRCH
42
- # Group already gone (worker + subtree reaped) -- nothing to signal.
43
- nil
44
- end
45
- end
46
- end
47
- end