RubyGems - parsanol - Versions diffs - 1.0.1-aarch64-linux - Mend

parsanol 1.0.1-aarch64-linux

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (101) hide show

checksums.yaml +7 -0
data/HISTORY.txt +12 -0
data/LICENSE +23 -0
data/README.adoc +487 -0
data/Rakefile +135 -0
data/lib/parsanol/3.2/parsanol_native.so +0 -0
data/lib/parsanol/3.3/parsanol_native.so +0 -0
data/lib/parsanol/3.4/parsanol_native.so +0 -0
data/lib/parsanol/4.0/parsanol_native.so +0 -0
data/lib/parsanol/ast_visitor.rb +122 -0
data/lib/parsanol/atoms/alternative.rb +122 -0
data/lib/parsanol/atoms/base.rb +202 -0
data/lib/parsanol/atoms/can_flatten.rb +194 -0
data/lib/parsanol/atoms/capture.rb +38 -0
data/lib/parsanol/atoms/context.rb +334 -0
data/lib/parsanol/atoms/context_optimized.rb +38 -0
data/lib/parsanol/atoms/custom.rb +110 -0
data/lib/parsanol/atoms/cut.rb +66 -0
data/lib/parsanol/atoms/dsl.rb +96 -0
data/lib/parsanol/atoms/dynamic.rb +39 -0
data/lib/parsanol/atoms/entity.rb +75 -0
data/lib/parsanol/atoms/ignored.rb +37 -0
data/lib/parsanol/atoms/infix.rb +162 -0
data/lib/parsanol/atoms/lookahead.rb +82 -0
data/lib/parsanol/atoms/named.rb +74 -0
data/lib/parsanol/atoms/re.rb +83 -0
data/lib/parsanol/atoms/repetition.rb +259 -0
data/lib/parsanol/atoms/scope.rb +35 -0
data/lib/parsanol/atoms/sequence.rb +194 -0
data/lib/parsanol/atoms/str.rb +103 -0
data/lib/parsanol/atoms/visitor.rb +91 -0
data/lib/parsanol/atoms.rb +46 -0
data/lib/parsanol/buffer.rb +133 -0
data/lib/parsanol/builder_callbacks.rb +353 -0
data/lib/parsanol/cause.rb +122 -0
data/lib/parsanol/context.rb +39 -0
data/lib/parsanol/convenience.rb +36 -0
data/lib/parsanol/edit_tracker.rb +111 -0
data/lib/parsanol/error_reporter/contextual.rb +99 -0
data/lib/parsanol/error_reporter/deepest.rb +120 -0
data/lib/parsanol/error_reporter/tree.rb +63 -0
data/lib/parsanol/error_reporter.rb +100 -0
data/lib/parsanol/expression/treetop.rb +154 -0
data/lib/parsanol/expression.rb +106 -0
data/lib/parsanol/fast_mode.rb +149 -0
data/lib/parsanol/first_set.rb +79 -0
data/lib/parsanol/grammar_builder.rb +177 -0
data/lib/parsanol/incremental_parser.rb +177 -0
data/lib/parsanol/interval_tree.rb +217 -0
data/lib/parsanol/lazy_result.rb +179 -0
data/lib/parsanol/lexer.rb +144 -0
data/lib/parsanol/mermaid.rb +139 -0
data/lib/parsanol/native/parser.rb +612 -0
data/lib/parsanol/native/serializer.rb +248 -0
data/lib/parsanol/native/transformer.rb +435 -0
data/lib/parsanol/native/types.rb +42 -0
data/lib/parsanol/native.rb +217 -0
data/lib/parsanol/optimizer.rb +85 -0
data/lib/parsanol/optimizers/choice_optimizer.rb +78 -0
data/lib/parsanol/optimizers/cut_inserter.rb +179 -0
data/lib/parsanol/optimizers/lookahead_optimizer.rb +50 -0
data/lib/parsanol/optimizers/quantifier_optimizer.rb +60 -0
data/lib/parsanol/optimizers/sequence_optimizer.rb +97 -0
data/lib/parsanol/options/ruby_transform.rb +107 -0
data/lib/parsanol/options/serialized.rb +94 -0
data/lib/parsanol/options/zero_copy.rb +128 -0
data/lib/parsanol/options.rb +20 -0
data/lib/parsanol/parallel.rb +133 -0
data/lib/parsanol/parser.rb +182 -0
data/lib/parsanol/parslet.rb +151 -0
data/lib/parsanol/pattern/binding.rb +91 -0
data/lib/parsanol/pattern.rb +159 -0
data/lib/parsanol/pool.rb +219 -0
data/lib/parsanol/pools/array_pool.rb +75 -0
data/lib/parsanol/pools/buffer_pool.rb +175 -0
data/lib/parsanol/pools/position_pool.rb +92 -0
data/lib/parsanol/pools/slice_pool.rb +64 -0
data/lib/parsanol/position.rb +94 -0
data/lib/parsanol/resettable.rb +29 -0
data/lib/parsanol/result.rb +46 -0
data/lib/parsanol/result_builder.rb +208 -0
data/lib/parsanol/result_stream.rb +261 -0
data/lib/parsanol/rig/rspec.rb +71 -0
data/lib/parsanol/rope.rb +81 -0
data/lib/parsanol/scope.rb +104 -0
data/lib/parsanol/slice.rb +146 -0
data/lib/parsanol/source/line_cache.rb +109 -0
data/lib/parsanol/source.rb +180 -0
data/lib/parsanol/source_location.rb +167 -0
data/lib/parsanol/streaming_parser.rb +124 -0
data/lib/parsanol/string_view.rb +195 -0
data/lib/parsanol/transform.rb +226 -0
data/lib/parsanol/version.rb +5 -0
data/lib/parsanol/wasm/README.md +80 -0
data/lib/parsanol/wasm/package.json +51 -0
data/lib/parsanol/wasm/parsanol.js +252 -0
data/lib/parsanol/wasm/parslet.d.ts +129 -0
data/lib/parsanol/wasm_parser.rb +240 -0
data/lib/parsanol.rb +280 -0
data/parsanol-ruby.gemspec +67 -0
metadata +280 -0

data/lib/parsanol/position.rb ADDED Viewed

@@ -0,0 +1,94 @@
+# frozen_string_literal: true
+# Encapsulates the concept of a position inside a string.
+#
+module Parsanol
+  class Position
+    include Parsanol::Resettable
+    # Changed to accessor to support pooling
+    attr_accessor :bytepos
+    attr_accessor :string, :charpos
+    include Comparable
+    def initialize(string, bytepos, charpos = nil)
+      @string = string
+      @bytepos = bytepos
+      @charpos = charpos
+    end
+    # Reset the position for reuse in object pooling.
+    # This allows the position to be reinitialized with new values for efficient reuse.
+    #
+    # @param string [String] Source string for position tracking
+    # @param bytepos [Integer] New byte position
+    # @param charpos [Integer, nil] Optional character position
+    # @return [self] Returns self for method chaining
+    #
+    def reset!(string, bytepos, charpos = nil)
+      @string = string
+      @bytepos = bytepos
+      @charpos = charpos
+      self
+    end
+    def charpos
+      # If charpos was provided during initialization, use it
+      return @charpos if @charpos
+      # Cache the calculated charpos to avoid repeated calculations
+      @charpos ||= calculate_charpos
+    end
+    private
+    def calculate_charpos
+      # Calculate it based on platform
+      if defined?(RUBY_ENGINE) && RUBY_ENGINE == 'opal'
+        # In Opal, convert byte position to character position.
+        # We need to calculate how many characters occupy the first @bytepos bytes.
+        `
+        var str = #{@string};
+        var bytePos = #{@bytepos};
+        var chars = Array.from(str);
+        var byteCount = 0;
+        var charCount = 0;
+        for (var i = 0; i < chars.length; i++) {
+          if (byteCount >= bytePos) break;
+          var char = chars[i];
+          var codePoint = char.codePointAt(0);
+          // Calculate UTF-8 byte length for this character
+          if (codePoint < 0x80) {
+            byteCount += 1;
+          } else if (codePoint < 0x800) {
+            byteCount += 2;
+          } else if (codePoint < 0x10000) {
+            byteCount += 3;
+          } else {
+            byteCount += 4;
+          }
+          if (byteCount <= bytePos) {
+            charCount++;
+          }
+        }
+        return charCount;
+      `
+      else
+        # Ruby: Use standard byteslice which handles Unicode correctly
+        @string.byteslice(0, @bytepos).size
+      end
+    end
+    public
+    def <=>(other)
+      bytepos <=> other.bytepos
+    end
+  end
+end

data/lib/parsanol/resettable.rb ADDED Viewed

@@ -0,0 +1,29 @@
+# frozen_string_literal: true
+module Parsanol
+  # Module for objects that can be reset for object pool reuse.
+  #
+  # Including this module signals that an object supports the reset!
+  # method for pooling purposes. This provides an explicit contract
+  # instead of duck-typing with respond_to?.
+  #
+  # @example
+  #   class MyPooledObject
+  #     include Parsanol::Resettable
+  #
+  #     def reset!
+  #       @state = nil
+  #       self
+  #     end
+  #   end
+  #
+  module Resettable
+    # Reset object state for reuse in object pool.
+    #
+    # @return [self] for method chaining
+    # @raise [NotImplementedError] if not implemented by including class
+    def reset!
+      raise NotImplementedError, "#{self.class} must implement #reset!"
+    end
+  end
+end

data/lib/parsanol/result.rb ADDED Viewed

@@ -0,0 +1,46 @@
+# frozen_string_literal: true
+# Phase 58: Result wrapper to replace [success, value] arrays
+#
+# This class wraps parse results to eliminate array allocations.
+# Instead of [true, value] or [false, cause], we use Result objects.
+#
+# Benefits:
+# - Eliminates array allocations (40% reduction)
+# - Cleaner API with success? method
+# - Can be optimized further (object pooling, etc.)
+#
+module Parsanol
+  class Result
+    attr_reader :value
+    def initialize(success, value)
+      @success = success
+      @value = value
+    end
+    def success?
+      @success
+    end
+    def error?
+      !@success
+    end
+    # Compatibility: Allow destructuring like arrays
+    # This enables gradual migration: result.success?, result.value
+    # or: success, value = result (array-like)
+    def to_ary
+      [@success, @value]
+    end
+    # Factory methods for common cases
+    def self.success(value)
+      new(true, value)
+    end
+    def self.error(cause)
+      new(false, cause)
+    end
+  end
+end

data/lib/parsanol/result_builder.rb ADDED Viewed

@@ -0,0 +1,208 @@
+# frozen_string_literal: true
+module Parsanol
+  # Base class for efficient result construction.
+  #
+  # ResultBuilder provides specialized construction patterns that avoid
+  # intermediate array allocations by building results directly.
+  #
+  # == Usage
+  #
+  #   builder = ResultBuilder.for(:repetition, context, estimated_size: 10)
+  #   builder.add_element(value1)
+  #   builder.add_element(value2)
+  #   result = builder.build  # Returns LazyResult
+  #
+  # == Builders
+  #
+  # - RepetitionBuilder: For repetition results
+  # - SequenceBuilder: For sequence results
+  # - HashBuilder: For named capture results
+  #
+  class ResultBuilder
+    # Factory method to create appropriate builder.
+    #
+    # @param type [Symbol] Builder type (:repetition, :sequence, :hash)
+    # @param context [Context] Parse context
+    # @param options [Hash] Builder options
+    # @return [ResultBuilder] Appropriate builder instance
+    #
+    def self.for(type, context, **options)
+      case type
+      when :repetition
+        RepetitionBuilder.new(context, **options)
+      when :sequence
+        SequenceBuilder.new(context, **options)
+      when :hash
+        HashBuilder.new(context, **options)
+      else
+        raise ArgumentError, "Unknown builder type: #{type}"
+      end
+    end
+    # Initialize builder.
+    #
+    # @param context [Context] Parse context for buffer access
+    #
+    def initialize(context)
+      @context = context
+    end
+    # Add element to result (subclasses implement).
+    #
+    # @param value [Object] Value to add
+    # @return [self] For method chaining
+    #
+    def add_element(value)
+      raise NotImplementedError
+    end
+    # Build final result (subclasses implement).
+    #
+    # @return [Object] Constructed result
+    #
+    def build
+      raise NotImplementedError
+    end
+    # Release resources (subclasses implement).
+    #
+    # @return [void]
+    #
+    def release
+      # Default: no-op
+    end
+  end
+  # Builder for repetition results.
+  #
+  # Constructs [:repetition, ...] arrays efficiently.
+  #
+  class RepetitionBuilder < ResultBuilder
+    # Initialize repetition builder.
+    #
+    # @param context [Context] Parse context
+    # @param tag [Symbol] Tag to use (default: :repetition)
+    # @param estimated_size [Integer] Estimated element count
+    #
+    def initialize(context, tag: :repetition, estimated_size: 10)
+      super(context)
+      @tag = tag
+      @buffer = context.acquire_buffer(size: estimated_size + 1)
+      @buffer.push(@tag)
+    end
+    # Add element to repetition.
+    #
+    # @param value [Object] Element to add
+    # @return [self]
+    #
+    def add_element(value)
+      @buffer.push(value)
+      self
+    end
+    # Build LazyResult.
+    #
+    # @return [LazyResult] Lazy repetition result
+    #
+    def build
+      Parsanol::LazyResult.new(@buffer, @context)
+    end
+    # Release buffer on failure.
+    #
+    # @return [void]
+    #
+    def release
+      @context.release_buffer(@buffer) if @buffer
+      @buffer = nil
+    end
+  end
+  # Builder for sequence results.
+  #
+  # Constructs [:sequence, ...] arrays efficiently.
+  #
+  class SequenceBuilder < ResultBuilder
+    # Initialize sequence builder.
+    #
+    # @param context [Context] Parse context
+    # @param size [Integer] Expected sequence length
+    #
+    def initialize(context, size: 5)
+      super(context)
+      @buffer = context.acquire_buffer(size: size + 1)
+      @buffer.push(:sequence)
+    end
+    # Add element to sequence.
+    #
+    # @param value [Object] Element to add
+    # @return [self]
+    #
+    def add_element(value)
+      @buffer.push(value) if value # Skip nil values
+      self
+    end
+    # Build LazyResult.
+    #
+    # @return [LazyResult] Lazy sequence result
+    #
+    def build
+      Parsanol::LazyResult.new(@buffer, @context)
+    end
+    # Release buffer on failure.
+    #
+    # @return [void]
+    #
+    def release
+      @context.release_buffer(@buffer) if @buffer
+      @buffer = nil
+    end
+  end
+  # Builder for hash results (named captures).
+  #
+  # Constructs hashes directly without intermediate arrays.
+  #
+  class HashBuilder < ResultBuilder
+    # Initialize hash builder.
+    #
+    # @param context [Context] Parse context
+    #
+    def initialize(context)
+      super
+      @hash = {}
+    end
+    # Add key-value pair.
+    #
+    # @param key [Symbol] Hash key
+    # @param value [Object] Hash value
+    # @return [self]
+    #
+    def add_pair(key, value)
+      @hash[key] = value
+      self
+    end
+    # Build hash result.
+    #
+    # @return [Hash] Constructed hash
+    #
+    def build
+      @hash
+    end
+    # Release resources (hash cleanup).
+    #
+    # @return [void]
+    #
+    def release
+      @hash = nil
+    end
+  end
+end

data/lib/parsanol/result_stream.rb ADDED Viewed

@@ -0,0 +1,261 @@
+# frozen_string_literal: true
+module Parsanol
+  # Streaming result iterator for memory-efficient parsing.
+  #
+  # Provides an Enumerable interface over parse results, allowing
+  # incremental processing without materializing the entire tree.
+  # Uses depth-first traversal to minimize memory usage.
+  #
+  # == Motivation
+  #
+  # Traditional parsing materializes the entire parse tree in memory:
+  #
+  #   results = parser.parse(large_input)  # Full tree in memory
+  #   results.each { |node| process(node) }
+  #
+  # For large inputs, this can consume significant memory. ResultStream
+  # provides lazy iteration without full tree materialization:
+  #
+  #   stream = ResultStream.new(parser.parse(input))
+  #   stream.each { |node| process(node) }  # Processes incrementally
+  #
+  # == Usage
+  #
+  # Basic iteration:
+  #
+  #   stream = ResultStream.new(parse_tree)
+  #   stream.each { |node| puts node }
+  #
+  # Filtering (leverages Enumerable):
+  #
+  #   stream.select { |node| node.is_a?(Hash) }.each { |hash| process(hash) }
+  #
+  # Mapping:
+  #
+  #   transformed = stream.map { |node| transform(node) }
+  #
+  # == Performance Characteristics
+  #
+  # - Memory: O(tree depth) instead of O(tree size)
+  # - Speed: Minimal overhead (~1-2% vs direct iteration)
+  # - Lazy evaluation: Nodes processed on-demand
+  #
+  # == Integration with Parser
+  #
+  # Can be used directly with parse results:
+  #
+  #   parser = MyParser.new
+  #   result = parser.parse(input)
+  #   stream = ResultStream.new(result)
+  #
+  # Or through the optional stream method on Base:
+  #
+  #   stream = parser.stream(input)  # If available
+  #
+  class ResultStream
+    include Enumerable
+    # Creates a new result stream.
+    #
+    # @param tree [Object] Parse tree (Hash, Array, or scalar)
+    def initialize(tree)
+      @tree = tree
+    end
+    # Iterates over all nodes in the parse tree.
+    # Uses depth-first traversal to minimize memory usage.
+    #
+    # Traversal order:
+    # 1. Current node (pre-order)
+    # 2. Child nodes (recursive)
+    #
+    # This ensures that:
+    # - Only the current path is kept in memory (stack)
+    # - Parent nodes are yielded before children
+    # - Natural processing order for most use cases
+    #
+    # @yield [node] Each node in the tree
+    # @yieldparam node [Object] Current node (Hash, Array, or scalar)
+    # @return [Enumerator] if no block given
+    #
+    # @example Basic iteration
+    #   stream.each { |node| puts node.class }
+    #
+    # @example Lazy enumeration
+    #   enum = stream.each  # Returns Enumerator
+    #   enum.next           # Get next node
+    #
+    def each(&block)
+      return enum_for(:each) unless block_given?
+      traverse(@tree, &block)
+      self
+    end
+    # Filters nodes by type.
+    #
+    # @param klass [Class] Class to filter by
+    # @return [Enumerator] Filtered nodes
+    #
+    # @example Get all hash nodes
+    #   stream.nodes_of_type(Hash)
+    #
+    def nodes_of_type(klass)
+      grep(klass)
+    end
+    # Returns all hash nodes in the tree.
+    #
+    # @return [Enumerator] Hash nodes
+    #
+    # @example
+    #   stream.hashes.each { |h| puts h.keys }
+    #
+    def hashes
+      nodes_of_type(Hash)
+    end
+    # Returns all array nodes in the tree.
+    #
+    # @return [Enumerator] Array nodes
+    #
+    # @example
+    #   stream.arrays.each { |a| puts a.size }
+    #
+    def arrays
+      nodes_of_type(Array)
+    end
+    # Returns all scalar nodes (non-Hash, non-Array).
+    #
+    # @return [Enumerator] Scalar nodes
+    #
+    # @example
+    #   stream.scalars.each { |s| puts s }
+    #
+    def scalars
+      select { |node| !node.is_a?(Hash) && !node.is_a?(Array) }
+    end
+    # Returns nodes matching a predicate at a specific depth.
+    #
+    # @param depth [Integer] Tree depth (0 = root)
+    # @yield [node] Predicate to test each node
+    # @return [Enumerator] Matching nodes
+    #
+    # @example Get all nodes at depth 2
+    #   stream.at_depth(2) { true }
+    #
+    def at_depth(target_depth, &predicate)
+      predicate ||= proc { true }
+      depth_traverse(@tree, 0, target_depth, &predicate)
+    end
+    # Counts total nodes in the tree.
+    #
+    # @return [Integer] Total node count
+    #
+    # @example
+    #   stream.count  # => 42
+    #
+    def count
+      counter = 0
+      each { counter += 1 }
+      counter
+    end
+    # Returns maximum depth of the tree.
+    #
+    # @return [Integer] Maximum depth
+    #
+    # @example
+    #   stream.max_depth  # => 5
+    #
+    def max_depth
+      find_max_depth(@tree, 0)
+    end
+    private
+    # Depth-first tree traversal with pre-order visiting.
+    #
+    # @param node [Object] Current node
+    # @yield [node] Each visited node
+    #
+    def traverse(node, &block)
+      # Yield current node first (pre-order)
+      yield node
+      # Recursively traverse children
+      case node
+      when Array
+        node.each { |item| traverse(item, &block) }
+      when Hash
+        node.each_value { |value| traverse(value, &block) }
+      end
+      # Scalars have no children, stop here
+    end
+    # Depth-aware traversal for filtering by level.
+    #
+    # @param node [Object] Current node
+    # @param current_depth [Integer] Current depth in tree
+    # @param target_depth [Integer] Depth to match
+    # @yield [node] Matching nodes at target depth
+    # @return [Enumerator]
+    #
+    def depth_traverse(node, current_depth, target_depth, &block)
+      return enum_for(:depth_traverse, node, current_depth, target_depth) unless block_given?
+      # Check if we're at target depth
+      return [node].to_enum if current_depth == target_depth && yield(node)
+      # Recurse to children if not at target depth yet
+      results = []
+      if current_depth < target_depth
+        case node
+        when Array
+          node.each do |item|
+            depth_traverse(item, current_depth + 1, target_depth, &block).each do |result|
+              results << result
+            end
+          end
+        when Hash
+          node.each_value do |value|
+            depth_traverse(value, current_depth + 1, target_depth, &block).each do |result|
+              results << result
+            end
+          end
+        end
+      end
+      results.to_enum
+    end
+    # Find maximum depth of tree recursively.
+    #
+    # @param node [Object] Current node
+    # @param current_depth [Integer] Current depth
+    # @return [Integer] Maximum depth from this node
+    #
+    def find_max_depth(node, current_depth)
+      max = current_depth
+      case node
+      when Array
+        node.each do |item|
+          depth = find_max_depth(item, current_depth + 1)
+          max = depth if depth > max
+        end
+      when Hash
+        node.each_value do |value|
+          depth = find_max_depth(value, current_depth + 1)
+          max = depth if depth > max
+        end
+      end
+      max
+    end
+  end
+end

data/lib/parsanol/rig/rspec.rb ADDED Viewed

@@ -0,0 +1,71 @@
+# frozen_string_literal: true
+# RSpec matcher for parsing expectations. Provides a fluent DSL for
+# specifying parsing behavior in tests.
+#
+# @example Basic usage
+#   expect(parser).to parse("input")
+#
+# @example With expected output
+#   expect(parser).to parse("123").as(123)
+#
+# @example With block validation
+#   expect(parser).to parse("input").as { |result| result.size > 0 }
+#
+# Inspired by RSpec matcher patterns and Parslet's testing utilities.
+#
+RSpec::Matchers.define(:parse) do |input_text, options|
+  expected_output = nil
+  validator_block = nil
+  actual_result = nil
+  error_trace = nil
+  match do |parser_instance|
+    actual_result = parser_instance.parse(input_text)
+    if validator_block
+      validator_block.call(actual_result)
+    else
+      expected_output.nil? || expected_output == actual_result
+    end
+  rescue Parsanol::ParseFailed => e
+    error_trace = e.parse_failure_cause.ascii_tree if options && options[:trace]
+    false
+  end
+  failure_message do |parser_instance|
+    if validator_block
+      "expected output of parsing #{input_text.inspect} with " \
+        "#{parser_instance.inspect} to meet block conditions, but it didn't"
+    else
+      msg = if expected_output
+              "expected output of parsing #{input_text.inspect} with " \
+                "#{parser_instance.inspect} to equal #{expected_output.inspect}, " \
+                "but was #{actual_result.inspect}"
+            else
+              "expected #{parser_instance.inspect} to be able to parse " \
+                "#{input_text.inspect}"
+            end
+      msg += "\n#{error_trace}" if error_trace
+      msg
+    end
+  end
+  failure_message_when_negated do |parser_instance|
+    if validator_block
+      "expected output of parsing #{input_text.inspect} with " \
+        "#{parser_instance.inspect} not to meet block conditions, but it did"
+    elsif expected_output
+      "expected output of parsing #{input_text.inspect} with " \
+        "#{parser_instance.inspect} not to equal #{expected_output.inspect}"
+    else
+      "expected #{parser_instance.inspect} to not parse " \
+        "#{input_text.inspect}, but it did"
+    end
+  end
+  # Chain method for specifying expected output or validation block
+  chain :as do |expected = nil, &block|
+    expected_output = expected
+    validator_block = block
+  end
+end