RubyGems - ast-merge - Versions diffs - 1.0.0 - Mend

ast-merge 1.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (62) hide show

checksums.yaml +7 -0
checksums.yaml.gz.sig +0 -0
data/CHANGELOG.md +46 -0
data/CITATION.cff +20 -0
data/CODE_OF_CONDUCT.md +134 -0
data/CONTRIBUTING.md +227 -0
data/FUNDING.md +74 -0
data/LICENSE.txt +21 -0
data/README.md +852 -0
data/REEK +0 -0
data/RUBOCOP.md +71 -0
data/SECURITY.md +21 -0
data/lib/ast/merge/ast_node.rb +87 -0
data/lib/ast/merge/comment/block.rb +195 -0
data/lib/ast/merge/comment/empty.rb +78 -0
data/lib/ast/merge/comment/line.rb +138 -0
data/lib/ast/merge/comment/parser.rb +278 -0
data/lib/ast/merge/comment/style.rb +282 -0
data/lib/ast/merge/comment.rb +36 -0
data/lib/ast/merge/conflict_resolver_base.rb +399 -0
data/lib/ast/merge/debug_logger.rb +271 -0
data/lib/ast/merge/fenced_code_block_detector.rb +211 -0
data/lib/ast/merge/file_analyzable.rb +307 -0
data/lib/ast/merge/freezable.rb +82 -0
data/lib/ast/merge/freeze_node_base.rb +434 -0
data/lib/ast/merge/match_refiner_base.rb +312 -0
data/lib/ast/merge/match_score_base.rb +135 -0
data/lib/ast/merge/merge_result_base.rb +169 -0
data/lib/ast/merge/merger_config.rb +258 -0
data/lib/ast/merge/node_typing.rb +373 -0
data/lib/ast/merge/region.rb +124 -0
data/lib/ast/merge/region_detector_base.rb +114 -0
data/lib/ast/merge/region_mergeable.rb +364 -0
data/lib/ast/merge/rspec/shared_examples/conflict_resolver_base.rb +416 -0
data/lib/ast/merge/rspec/shared_examples/debug_logger.rb +174 -0
data/lib/ast/merge/rspec/shared_examples/file_analyzable.rb +193 -0
data/lib/ast/merge/rspec/shared_examples/freeze_node_base.rb +219 -0
data/lib/ast/merge/rspec/shared_examples/merge_result_base.rb +106 -0
data/lib/ast/merge/rspec/shared_examples/merger_config.rb +202 -0
data/lib/ast/merge/rspec/shared_examples/reproducible_merge.rb +115 -0
data/lib/ast/merge/rspec/shared_examples.rb +26 -0
data/lib/ast/merge/rspec.rb +4 -0
data/lib/ast/merge/section_typing.rb +303 -0
data/lib/ast/merge/smart_merger_base.rb +417 -0
data/lib/ast/merge/text/conflict_resolver.rb +161 -0
data/lib/ast/merge/text/file_analysis.rb +168 -0
data/lib/ast/merge/text/line_node.rb +142 -0
data/lib/ast/merge/text/merge_result.rb +42 -0
data/lib/ast/merge/text/section.rb +93 -0
data/lib/ast/merge/text/section_splitter.rb +397 -0
data/lib/ast/merge/text/smart_merger.rb +141 -0
data/lib/ast/merge/text/word_node.rb +86 -0
data/lib/ast/merge/text.rb +35 -0
data/lib/ast/merge/toml_frontmatter_detector.rb +88 -0
data/lib/ast/merge/version.rb +12 -0
data/lib/ast/merge/yaml_frontmatter_detector.rb +108 -0
data/lib/ast/merge.rb +165 -0
data/lib/ast-merge.rb +4 -0
data/sig/ast/merge.rbs +195 -0
data.tar.gz.sig +0 -0
metadata +326 -0
metadata.gz.sig +0 -0

data/lib/ast/merge/match_refiner_base.rb ADDED Viewed

@@ -0,0 +1,312 @@
+# frozen_string_literal: true
module Ast
  module Merge
    # Base class for match refiners that pair unmatched nodes after signature matching.
    #
    # Match refiners run after initial signature-based matching to find additional
    # pairings between nodes that didn't match by signature. This is useful when
    # you want more nuanced matching than exact signatures provide - for example,
    # matching tables with similar (but not identical) headers, or finding the
    # closest match among several candidates using multi-factor scoring.
    #
    # By default, most node types use content-based signatures (including tables,
    # which match on row count + header content). Refiners let you override this
    # to implement fuzzy matching, positional matching, or any custom logic.
    #
    # Refiners use a callable interface (`#call`) so simple lambdas/procs can
    # also be used where a full class isn't needed.
    #
    # @example Markdown: Table matching with multi-factor scoring
    #   # Tables may have similar but not identical headers
    #   # See Commonmarker::Merge::TableMatchRefiner
    #   class TableMatchRefiner < Ast::Merge::MatchRefinerBase
    #     def initialize(algorithm: nil, **options)
    #       super(**options)
    #       @algorithm = algorithm || TableMatchAlgorithm.new
    #     end
    #
    #     def call(template_nodes, dest_nodes, context = {})
    #       template_tables = filter_by_type(template_nodes, :table)
    #       dest_tables = filter_by_type(dest_nodes, :table)
    #
    #       greedy_match(template_tables, dest_tables) do |t_node, d_node|
    #         @algorithm.call(t_node, d_node)
    #       end
    #     end
    #   end
    #
    # @example Ruby: Method matching with fuzzy name/signature scoring
    #   # Methods may have similar names (process_user vs process_users)
    #   # or same name with different parameters
    #   # See Prism::Merge::MethodMatchRefiner
    #   class MethodMatchRefiner < Ast::Merge::MatchRefinerBase
    #     def call(template_nodes, dest_nodes, context = {})
    #       template_methods = template_nodes.select { |n| n.is_a?(Prism::DefNode) }
    #       dest_methods = dest_nodes.select { |n| n.is_a?(Prism::DefNode) }
    #
    #       greedy_match(template_methods, dest_methods) do |t_node, d_node|
    #         compute_method_similarity(t_node, d_node)
    #       end
    #     end
    #
    #     private
    #
    #     def compute_method_similarity(t_method, d_method)
    #       name_score = string_similarity(t_method.name.to_s, d_method.name.to_s)
    #       param_score = param_similarity(t_method, d_method)
    #       name_score * 0.7 + param_score * 0.3
    #     end
    #   end
    #
    # @example YAML: Mapping key matching with fuzzy scoring
    #   # YAML keys may be renamed or have typos
    #   # See Psych::Merge::MappingMatchRefiner
    #   class MappingMatchRefiner < Ast::Merge::MatchRefinerBase
    #     def call(template_nodes, dest_nodes, context = {})
    #       template_mappings = template_nodes.select { |n| n.respond_to?(:key) }
    #       dest_mappings = dest_nodes.select { |n| n.respond_to?(:key) }
    #
    #       greedy_match(template_mappings, dest_mappings) do |t_node, d_node|
    #         key_similarity(t_node.key, d_node.key)
    #       end
    #     end
    #   end
    #
    # @example JSON: Object property matching for arrays of objects
    #   # JSON arrays may contain objects that should match by content
    #   # See Json::Merge::ObjectMatchRefiner
    #   class ObjectMatchRefiner < Ast::Merge::MatchRefinerBase
    #     def call(template_nodes, dest_nodes, context = {})
    #       template_objects = template_nodes.select { |n| n.type == :object }
    #       dest_objects = dest_nodes.select { |n| n.type == :object }
    #
    #       greedy_match(template_objects, dest_objects) do |t_node, d_node|
    #         compute_object_similarity(t_node, d_node)
    #       end
    #     end
    #   end
    #
    # @example Using find_best_match with manual tracking (alternative approach)
    #   class TableMatchRefiner < Ast::Merge::MatchRefinerBase
    #     def call(template_nodes, dest_nodes, context = {})
    #       matches = []
    #       used_dest_nodes = Set.new
    #       template_tables = filter_by_type(template_nodes, :table)
    #       dest_tables = filter_by_type(dest_nodes, :table)
    #
    #       template_tables.each do |t_node|
    #         best = find_best_match(t_node, dest_tables, used_dest_nodes: used_dest_nodes) do |t, d|
    #           compute_table_score(t, d)
    #         end
    #         if best
    #           matches << best
    #           used_dest_nodes << best.dest_node
    #         end
    #       end
    #
    #       matches
    #     end
    #   end
    #
    # @example Using a simple lambda refiner
    #   simple_refiner = ->(template, dest, ctx) do
    #     # Return array of MatchResult objects
    #     []
    #   end
    #
    # @example Using refiners with a merger
    #   merger = SmartMerger.new(
    #     template,
    #     destination,
    #     match_refiners: [
    #       TableMatchRefiner.new(threshold: 0.6),
    #       CustomRefiner.new
    #     ]
    #   )
    #
    # @api public
    class MatchRefinerBase
      # Result of a match refinement operation.
      #
      # @!attribute [r] template_node
      #   @return [Object] The node from the template
      # @!attribute [r] dest_node
      #   @return [Object] The node from the destination
      # @!attribute [r] score
      #   @return [Float] Match score between 0.0 and 1.0
      # @!attribute [r] metadata
      #   @return [Hash] Optional metadata about the match
      MatchResult = Struct.new(:template_node, :dest_node, :score, :metadata, keyword_init: true) do
        # Check if this is a high-confidence match.
        #
        # @param threshold [Float] Minimum score for high confidence (default: 0.8)
        # @return [Boolean]
        def high_confidence?(threshold: 0.8)
          score >= threshold
        end

        # Compare match results by score for sorting.
        #
        # Follows the usual `<=>` contract: an operand that does not expose a
        # `score` is not comparable, so nil is returned instead of raising.
        #
        # @param other [MatchResult]
        # @return [Integer, nil] -1, 0, or 1; nil when +other+ has no score
        def <=>(other)
          return unless other.respond_to?(:score)

          score <=> other.score
        end
      end

      # Default minimum score threshold for accepting a match
      DEFAULT_THRESHOLD = 0.5

      # @return [Float] Minimum score to accept a match
      attr_reader :threshold

      # @return [Array<Symbol>] Node types this refiner handles (empty = all types)
      attr_reader :node_types

      # Initialize a new match refiner.
      #
      # @param threshold [Float] Minimum score to accept a match (0.0-1.0);
      #   values outside that range are clamped into it
      # @param node_types [Array<Symbol>] Node types to process (empty = all)
      def initialize(threshold: DEFAULT_THRESHOLD, node_types: [])
        @threshold = [[threshold.to_f, 0.0].max, 1.0].min
        @node_types = Array(node_types)
      end

      # Refine matches between unmatched template and destination nodes.
      #
      # This is the main entry point. Override in subclasses to implement
      # custom matching logic.
      #
      # @param template_nodes [Array] Unmatched nodes from template
      # @param dest_nodes [Array] Unmatched nodes from destination
      # @param context [Hash] Additional context (e.g., file analyses)
      # @return [Array<MatchResult>] Array of match results
      # @raise [NotImplementedError] If not overridden in subclass
      def call(template_nodes, dest_nodes, context = {})
        raise NotImplementedError, "#{self.class}#call must be implemented"
      end

      # Check if this refiner handles a given node type.
      #
      # @param node_type [Symbol] The node type to check
      # @return [Boolean] True if this refiner handles the type
      def handles_type?(node_type)
        node_types.empty? || node_types.include?(node_type)
      end

      protected

      # Filter nodes by type.
      #
      # @param nodes [Array] Nodes to filter
      # @param type [Symbol] Node type to select
      # @return [Array] Filtered nodes
      def filter_by_type(nodes, type)
        nodes.select { |n| node_type(n) == type }
      end

      # Get the type of a node.
      #
      # Prefers the node's own `#type`; otherwise falls back to the last
      # segment of its class name. Override in subclasses for parser-specific
      # type extraction.
      #
      # @param node [Object] The node
      # @return [Symbol, nil] The node type, or nil when it cannot be derived
      #   (for example an instance of an anonymous class, whose name is nil)
      def node_type(node)
        return node.type if node.respond_to?(:type)
        return unless node.respond_to?(:class)

        # Class#name is nil for anonymous classes; safe navigation keeps the
        # documented "Symbol or nil" contract instead of raising.
        node.class.name&.split("::")&.last&.to_sym
      end

      # Create a match result.
      #
      # @param template_node [Object] Template node
      # @param dest_node [Object] Destination node
      # @param score [Float] Match score
      # @param metadata [Hash] Optional metadata
      # @return [MatchResult]
      def match_result(template_node, dest_node, score, metadata = {})
        MatchResult.new(
          template_node: template_node,
          dest_node: dest_node,
          score: score,
          metadata: metadata,
        )
      end

      # Find the best matching destination node for a template node.
      #
      # A candidate is eligible when its score is at or above the threshold,
      # the same acceptance rule that #greedy_match applies. Among eligible
      # candidates the highest score wins; on a tie the earliest candidate in
      # +dest_nodes+ is kept.
      #
      # Membership in +used_dest_nodes+ is decided by the collection passed in.
      # Callers whose nodes define value equality may want to pass
      # `Set.new.compare_by_identity` so that distinct nodes with identical
      # content are tracked separately.
      #
      # @param template_node [Object] The template node to match
      # @param dest_nodes [Array] Candidate destination nodes
      # @param used_dest_nodes [Set] Already-matched destination nodes to skip
      # @yield [template_node, dest_node] Block that returns a score (0.0-1.0),
      #   or nil/false to reject the pair
      # @return [MatchResult, nil] Best match or nil if none reaches the threshold
      def find_best_match(template_node, dest_nodes, used_dest_nodes: Set.new)
        best_node = nil
        best_score = nil

        dest_nodes.each do |dest_node|
          next if used_dest_nodes.include?(dest_node)

          score = yield(template_node, dest_node)
          next unless score && score >= threshold
          # Only a strictly better score displaces the current best.
          next if best_score && score <= best_score

          best_node = dest_node
          best_score = score
        end

        return unless best_node

        match_result(template_node, best_node, best_score)
      end

      # Perform greedy matching between template and destination nodes.
      #
      # Every template/destination pair is scored once. Pairs scoring at or
      # above the threshold are then assigned from the highest score down, with
      # each node matched at most once. Pairs with equal scores are taken in the
      # order they were scored (template order, then destination order), so the
      # result is reproducible.
      #
      # Nodes are tracked by object identity rather than by `eql?`/`hash`, so
      # two distinct nodes with identical content can each receive a match.
      #
      # @param template_nodes [Array] Template nodes to match
      # @param dest_nodes [Array] Destination nodes to match against
      # @yield [template_node, dest_node] Block that returns a score (0.0-1.0),
      #   or nil/false to reject the pair
      # @return [Array<MatchResult>] Matches, highest score first
      def greedy_match(template_nodes, dest_nodes)
        # Collect all potential matches with scores
        candidates = []
        template_nodes.each do |t_node|
          dest_nodes.each do |d_node|
            score = yield(t_node, d_node)
            next unless score && score >= threshold

            candidates << {template: t_node, dest: d_node, score: score}
          end
        end

        # Sort by score descending. sort_by is not stable, so the insertion
        # index is used as an explicit tie-breaker.
        ranked = candidates
          .each_with_index
          .sort_by { |candidate, index| [-candidate[:score], index] }
          .map(&:first)

        # Greedily assign matches
        used_template_nodes = Set.new.compare_by_identity
        used_dest_nodes = Set.new.compare_by_identity

        ranked.each_with_object([]) do |candidate, matches|
          next if used_template_nodes.include?(candidate[:template])
          next if used_dest_nodes.include?(candidate[:dest])

          matches << match_result(candidate[:template], candidate[:dest], candidate[:score])
          used_template_nodes << candidate[:template]
          used_dest_nodes << candidate[:dest]
        end
      end
    end
  end
end

data/lib/ast/merge/match_score_base.rb ADDED Viewed

@@ -0,0 +1,135 @@
+# frozen_string_literal: true
module Ast
  module Merge
    # Base class for computing match scores between two nodes.
    #
    # Match scores help determine which nodes from a template should be linked
    # to which nodes in a destination document. This is particularly useful for
    # complex nodes like tables where simple signature matching is insufficient.
    #
    # The scoring algorithm is provided as a callable object (lambda, Proc, or
    # any object responding to :call) which receives the two nodes and returns
    # a score between 0.0 (no match) and 1.0 (perfect match).
    #
    # Includes Comparable for sorting and comparison operations.
    #
    # @example Basic usage with a lambda
    #   algorithm = ->(node_a, node_b) { node_a.type == node_b.type ? 1.0 : 0.0 }
    #   scorer = MatchScoreBase.new(template_node, dest_node, algorithm: algorithm)
    #   puts scorer.score # => 1.0 if types match
    #
    # @example With a custom algorithm class
    #   class TableMatcher
    #     def call(table_a, table_b)
    #       # Complex matching logic
    #       compute_similarity(table_a, table_b)
    #     end
    #   end
    #
    #   scorer = MatchScoreBase.new(table1, table2, algorithm: TableMatcher.new)
    #
    # @example Comparing and sorting scorers
    #   scorers = [scorer1, scorer2, scorer3]
    #   best = scorers.max
    #   sorted = scorers.sort
    #
    # @api public
    class MatchScoreBase
      include Comparable

      # Minimum score threshold for considering two nodes as a potential match
      # @return [Float]
      DEFAULT_THRESHOLD = 0.5

      # @return [Object] The first node to compare (typically from template)
      attr_reader :node_a

      # @return [Object] The second node to compare (typically from destination)
      attr_reader :node_b

      # @return [#call] The algorithm used to compute the match score
      attr_reader :algorithm

      # @return [Float] The minimum score to consider a match
      attr_reader :threshold

      # Initialize a match scorer.
      #
      # @param node_a [Object] First node to compare
      # @param node_b [Object] Second node to compare
      # @param algorithm [#call] Callable that computes the score (receives node_a, node_b)
      # @param threshold [Float] Minimum score to consider a match (default: 0.5)
      # @raise [ArgumentError] If algorithm doesn't respond to :call
      def initialize(node_a, node_b, algorithm:, threshold: DEFAULT_THRESHOLD)
        raise ArgumentError, "algorithm must respond to :call" unless algorithm.respond_to?(:call)

        @node_a = node_a
        @node_b = node_b
        @algorithm = algorithm
        @threshold = threshold
        @score = nil
      end

      # Compute and return the match score.
      #
      # The score is cached after first computation, so the algorithm is
      # invoked at most once per scorer.
      #
      # @return [Float] Score between 0.0 and 1.0
      def score
        @score ||= compute_score
      end

      # Check if the score meets the threshold for a match.
      #
      # @return [Boolean] True if score >= threshold
      def match?
        score >= threshold
      end

      # Compare two scorers by their scores.
      #
      # Required by Comparable. Enables <, <=, ==, >=, >, and between? operators.
      # Returns nil for anything that is not a MatchScoreBase, so that
      # `scorer == other_object` is simply false and the ordering operators
      # raise Comparable's standard ArgumentError, rather than a NoMethodError
      # escaping from this method.
      #
      # @param other [MatchScoreBase] Another scorer to compare
      # @return [Integer, nil] -1, 0, or 1; nil when +other+ is not a scorer
      def <=>(other)
        return unless other.is_a?(MatchScoreBase)

        score <=> other.score
      end

      # Generate a hash code for this scorer.
      #
      # Required for Hash key compatibility. Two scorers with the same
      # node_a, node_b, and score should have the same hash.
      #
      # @return [Integer] Hash code
      def hash
        [node_a, node_b, score].hash
      end

      # Check equality for Hash key compatibility.
      #
      # Two scorers are eql? if they have the same node_a, node_b, and score.
      # This is stricter than == from Comparable (which only compares scores).
      #
      # @param other [MatchScoreBase] Another scorer to compare
      # @return [Boolean] True if equivalent
      def eql?(other)
        return false unless other.is_a?(MatchScoreBase)

        node_a == other.node_a && node_b == other.node_b && score == other.score
      end

      private

      # Compute the score using the algorithm.
      #
      # The raw result is converted with #to_f and clamped to 0.0..1.0. NaN
      # (for example from a 0.0 / 0.0 similarity ratio) cannot be ordered, so it
      # is reported as 0.0 - no match - to keep the documented range.
      #
      # @return [Float] Score between 0.0 and 1.0
      def compute_score
        value = algorithm.call(node_a, node_b).to_f
        return 0.0 if value.nan?

        # Clamp to valid range
        [[value, 0.0].max, 1.0].min
      end
    end
  end
end

data/lib/ast/merge/merge_result_base.rb ADDED Viewed

@@ -0,0 +1,169 @@
+# frozen_string_literal: true
module Ast
  module Merge
    # Shared foundation for the result objects produced by AST merge libraries.
    #
    # Holds the merged lines, a log of the decisions taken while merging, and
    # the supporting analyses/conflicts/statistics. It also defines the decision
    # constants that file-type-specific subclasses record.
    #
    # @example Basic usage in a subclass
    #   class MyMergeResult < Ast::Merge::MergeResultBase
    #     def add_node(node, decision:, source:)
    #       # File-type-specific node handling
    #     end
    #   end
    class MergeResultBase
      # --- Decision constants for tracking merge choices ---

      # Template content was kept as-is (no conflict, or template preferred).
      DECISION_KEPT_TEMPLATE = :kept_template

      # Destination content was kept as-is (no conflict, or destination preferred).
      DECISION_KEPT_DEST = :kept_destination

      # Content was combined from both template and destination.
      DECISION_MERGED = :merged

      # Template-only content was added to the result.
      DECISION_ADDED = :added

      # Content came from a destination freeze block, which is always preserved
      # regardless of what the template contains.
      DECISION_FREEZE_BLOCK = :freeze_block

      # Template and destination had nodes with the same signature but
      # different content, and one version replaced the other by preference.
      DECISION_REPLACED = :replaced

      # Destination-only content was appended to the result.
      DECISION_APPENDED = :appended

      # @return [Array<String>] Lines in the result (canonical storage for line-by-line merging)
      attr_reader :lines

      # @return [Array<Hash>] Decisions made during merge
      attr_reader :decisions

      # @return [Object, nil] Analysis of the template file
      attr_reader :template_analysis

      # @return [Object, nil] Analysis of the destination file
      attr_reader :dest_analysis

      # @return [Array<Hash>] Conflicts detected during merge
      attr_reader :conflicts

      # @return [Array] Frozen blocks preserved during merge
      attr_reader :frozen_blocks

      # @return [Hash] Statistics about the merge
      attr_reader :stats

      # Build an empty merge result.
      #
      # The constructor accepts every parameter any *-merge gem might need;
      # subclasses call super with the ones they use. The line and decision
      # lists always start empty, while the other collections are stored
      # exactly as given.
      #
      # @param template_analysis [Object, nil] Analysis of the template file
      # @param dest_analysis [Object, nil] Analysis of the destination file
      # @param conflicts [Array<Hash>] Conflicts detected during merge
      # @param frozen_blocks [Array] Frozen blocks preserved during merge
      # @param stats [Hash] Statistics about the merge
      def initialize(template_analysis: nil, dest_analysis: nil, conflicts: [], frozen_blocks: [], stats: {})
        @lines = []
        @decisions = []
        @template_analysis = template_analysis
        @dest_analysis = dest_analysis
        @conflicts = conflicts
        @frozen_blocks = frozen_blocks
        @stats = stats
      end

      # Merged content in its native form - the line array itself.
      # Subclasses may override for different content models (e.g., string).
      #
      # @return [Array<String>] The merged content as array of lines
      def content
        @lines
      end

      # Replace the content from a string, splitting it on newlines.
      # Trailing empty segments are kept, so a final newline survives a
      # round trip through #to_s. Used when region substitution replaces the
      # merged content.
      #
      # @param value [String] The new content (converted with #to_s)
      def content=(value)
        text = value.to_s
        @lines = text.split("\n", -1)
      end

      # Render the content as a single string.
      # This is the canonical conversion; subclasses may override to customize
      # the output (e.g., adding a trailing newline).
      #
      # @return [String] Content as string joined with newlines
      def to_s
        @lines.join("\n")
      end

      # Whether any content has been built (at least one line present).
      #
      # @return [Boolean]
      def content?
        @lines.length.positive?
      end

      # Whether the result holds no lines at all.
      #
      # @return [Boolean]
      def empty?
        @lines.length.zero?
      end

      # Number of lines currently in the result.
      #
      # @return [Integer]
      def line_count
        @lines.size
      end

      # Count how many times each decision was recorded.
      # Decisions that never occurred read as 0.
      #
      # @return [Hash<Symbol, Integer>]
      def decision_summary
        @decisions.each_with_object(Hash.new(0)) do |entry, counts|
          counts[entry[:decision]] += 1
        end
      end

      # Short developer-facing representation with line and decision counts.
      #
      # @return [String]
      def inspect
        "#<#{self.class.name} lines=#{line_count} decisions=#{@decisions.length}>"
      end

      protected

      # Record a decision in the decision log, stamped with the current time.
      #
      # @param decision [Symbol] The decision made
      # @param source [Symbol] The source (:template, :destination, :merged)
      # @param line [Integer, nil] The line number
      def track_decision(decision, source, line: nil)
        entry = {decision: decision, source: source, line: line, timestamp: Time.now}
        @decisions << entry
      end
    end
  end
end