RubyGems - kumi-parser - Versions diffs - 0.0.33 → 0.1.0 - Mend

kumi-parser 0.0.33 → 0.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (32)

checksums.yaml +4 -4
data/.rubocop.yml +41 -0
data/CHANGELOG.md +64 -0
data/CLAUDE.md +59 -120
data/README.md +28 -6
data/examples/parse_and_inspect.rb +34 -0
data/kumi-parser.gemspec +3 -4
data/lib/kumi/parser/grammar.rb +120 -0
data/lib/kumi/parser/lexer.rb +232 -0
data/lib/kumi/parser/parse_error.rb +52 -0
data/lib/kumi/parser/parser.rb +692 -0
data/lib/kumi/parser/source.rb +76 -0
data/lib/kumi/parser/text_parser.rb +37 -27
data/lib/kumi/parser/token.rb +10 -71
data/lib/kumi/parser/version.rb +1 -1
data/lib/kumi-parser.rb +9 -10
metadata +16 -37
data/examples/debug_text_parser.rb +0 -41
data/examples/debug_transform_rule.rb +0 -26
data/examples/text_parser_comprehensive_test.rb +0 -333
data/examples/text_parser_test_with_comments.rb +0 -146
data/lib/kumi/parser/base.rb +0 -51
data/lib/kumi/parser/direct_parser.rb +0 -698
data/lib/kumi/parser/error_extractor.rb +0 -89
data/lib/kumi/parser/errors.rb +0 -40
data/lib/kumi/parser/helpers.rb +0 -154
data/lib/kumi/parser/smart_tokenizer.rb +0 -373
data/lib/kumi/parser/syntax_validator.rb +0 -21
data/lib/kumi/parser/text_parser/api.rb +0 -60
data/lib/kumi/parser/token_constants.rb +0 -468
data/lib/kumi/text_parser.rb +0 -40
data/lib/kumi/text_schema.rb +0 -31

data/lib/kumi/parser/text_parser/api.rb DELETED

@@ -1,60 +0,0 @@
-# frozen_string_literal: true
-require 'ostruct'
-module Kumi
-  module Parser
-    module TextParser
-      # Public API for TextParser
-      class Api
-        class << self
-          def parse(text, source_file: '<input>')
-            parser = Parser.new
-            parser.parse(text, source_file: source_file)
-          end
-          def validate(text, source_file: '<input>')
-            parse(text, source_file: source_file)
-            []
-          rescue StandardError => e
-            [create_diagnostic(e, source_file)]
-          end
-          def valid?(text, source_file: '<input>')
-            validate(text, source_file: source_file).empty?
-          end
-          def diagnostics_for_monaco(text, source_file: '<input>')
-            validate(text, source_file: source_file)
-          end
-          def diagnostics_for_codemirror(text, source_file: '<input>')
-            validate(text, source_file: source_file)
-          end
-          def diagnostics_as_json(text, source_file: '<input>')
-            validate(text, source_file: source_file).map(&:to_h)
-          end
-          def analyze(text, source_file: '<input>')
-            ast = parse(text, source_file: source_file)
-            { success: true, ast: ast, diagnostics: [] }
-          rescue StandardError => e
-            { success: false, ast: nil, diagnostics: [create_diagnostic(e, source_file)] }
-          end
-          private
-          def create_diagnostic(error, source_file)
-            OpenStruct.new(
-              line: 1,
-              column: 1,
-              message: error.message,
-              source_file: source_file
-            )
-          end
-        end
-      end
-    end
-  end
-end

data/lib/kumi/parser/token_constants.rb DELETED

@@ -1,468 +0,0 @@
-# frozen_string_literal: true
-module Kumi
-  module Parser
-    # Token types
-    module TokenType
-      # Literals
-      INTEGER = :integer
-      FLOAT = :float
-      STRING = :string
-      BOOLEAN = :boolean
-      # Identifiers and symbols
-      IDENTIFIER = :identifier
-      SYMBOL = :symbol           # :name
-      CONSTANT = :constant       # Float::INFINITY
-      # Keywords
-      SCHEMA = :schema
-      INPUT = :input
-      VALUE = :value
-      TRAIT = :trait
-      IMPORT = :import
-      CODEGEN = :codegen
-      FROM = :from
-      DO = :do
-      END_KW = :end
-      ON = :on
-      BASE = :base
-      # Type keywords
-      INTEGER_TYPE = :integer_type   # integer
-      FLOAT_TYPE = :float_type       # float
-      DECIMAL_TYPE = :decimal_type   # decimal
-      STRING_TYPE = :string_type     # string
-      BOOLEAN_TYPE = :boolean_type   # boolean
-      ANY_TYPE = :any_type           # any
-      ARRAY_TYPE = :array_type       # array
-      ELEMENT_TYPE = :element_type   # element
-      INDEX_TYPE = :index_type       # index
-      # Function keywords
-      FN = :fn
-      # Operators (by precedence)
-      EXPONENT = :exponent # **
-      MULTIPLY = :multiply # *
-      DIVIDE = :divide          # /
-      MODULO = :modulo          # %
-      ADD = :add                # +
-      SUBTRACT = :subtract      # -
-      GTE = :gte                # >=
-      LTE = :lte                # <=
-      GT = :gt                  # >
-      LT = :lt                  # <
-      EQ = :eq                  # ==
-      NE = :ne                  # !=
-      AND = :and                # &
-      OR = :or                  # |
-      # Punctuation
-      DOT = :dot                # .
-      DOT_DOT = :dot_dot        # ..
-      DOT_DOT_DOT = :dot_dot_dot # ...
-      COMMA = :comma            # ,
-      COLON = :colon            # :
-      LPAREN = :lparen          # (
-      RPAREN = :rparen          # )
-      LBRACKET = :lbracket      # [
-      RBRACKET = :rbracket      # ]
-      # Special
-      NEWLINE = :newline
-      EOF = :eof
-      COMMENT = :comment # # comment
-    end
-    # Rich metadata for each token type
-    TOKEN_METADATA = {
-      # Keywords with parsing hints
-      schema: {
-        category: :keyword,
-        expects_block: true,
-        block_terminator: :end
-      },
-      input: {
-        category: :keyword,
-        expects_block: true,
-        block_terminator: :end,
-        context: :input_declarations
-      },
-      value: {
-        category: :keyword,
-        expects_expression: true,
-        declaration_type: :value
-      },
-      let: {
-        category: :keyword,
-        expects_expression: true
-      },
-      trait: {
-        category: :keyword,
-        expects_expression: true,
-        declaration_type: :trait
-      },
-      import: {
-        category: :keyword,
-        import_declaration: true
-      },
-      codegen: {
-        category: :keyword,
-        schema_directive: true
-      },
-      from: {
-        category: :keyword,
-        import_source: true
-      },
-      do: {
-        category: :keyword,
-        block_opener: true
-      },
-      end: {
-        category: :keyword,
-        block_closer: true,
-        terminates_expression: true
-      },
-      on: {
-        category: :keyword,
-        cascade_keyword: true,
-        expects_condition: true
-      },
-      base: {
-        category: :keyword,
-        cascade_keyword: true,
-        is_base_case: true
-      },
-      # Type keywords
-      integer_type: {
-        category: :type_keyword,
-        starts_declaration: true,
-        type_name: :integer
-      },
-      float_type: {
-        category: :type_keyword,
-        starts_declaration: true,
-        type_name: :float
-      },
-      decimal_type: {
-        category: :type_keyword,
-        starts_declaration: true,
-        type_name: :decimal
-      },
-      string_type: {
-        category: :type_keyword,
-        starts_declaration: true,
-        type_name: :string
-      },
-      boolean_type: {
-        category: :type_keyword,
-        starts_declaration: true,
-        type_name: :boolean
-      },
-      any_type: {
-        category: :type_keyword,
-        starts_declaration: true,
-        type_name: :any
-      },
-      array_type: {
-        category: :type_keyword,
-        starts_declaration: true,
-        type_name: :array
-      },
-      hash_type: {
-        category: :type_keyword,
-        starts_declaration: true,
-        type_name: :hash
-      },
-      element_type: {
-        category: :type_keyword,
-        starts_declaration: true,
-        type_name: :element
-      },
-      index_type: {
-        category: :type_keyword,
-        starts_declaration: true,
-        type_name: :index
-      },
-      # Function keyword
-      fn: {
-        category: :keyword,
-        function_keyword: true,
-        starts_expression: true
-      },
-      function_sugar: {
-        function_keyword: true,
-        starts_expression: true
-      },
-      # Operators with precedence and associativity
-      exponent: {
-        category: :operator,
-        precedence: 7,
-        associativity: :right,
-        arity: :binary
-      },
-      multiply: {
-        category: :operator,
-        precedence: 6,
-        associativity: :left,
-        arity: :binary
-      },
-      divide: {
-        category: :operator,
-        precedence: 6,
-        associativity: :left,
-        arity: :binary
-      },
-      modulo: {
-        category: :operator,
-        precedence: 6,
-        associativity: :left,
-        arity: :binary
-      },
-      add: {
-        category: :operator,
-        precedence: 5,
-        associativity: :left,
-        arity: :binary
-      },
-      subtract: {
-        category: :operator,
-        precedence: 5,
-        associativity: :left,
-        arity: :binary
-      },
-      gte: {
-        category: :operator,
-        precedence: 4,
-        associativity: :left,
-        arity: :binary,
-        returns_boolean: true
-      },
-      lte: {
-        category: :operator,
-        precedence: 4,
-        associativity: :left,
-        arity: :binary,
-        returns_boolean: true
-      },
-      gt: {
-        category: :operator,
-        precedence: 4,
-        associativity: :left,
-        arity: :binary,
-        returns_boolean: true
-      },
-      lt: {
-        category: :operator,
-        precedence: 4,
-        associativity: :left,
-        arity: :binary,
-        returns_boolean: true
-      },
-      eq: {
-        category: :operator,
-        precedence: 4,
-        associativity: :left,
-        arity: :binary,
-        returns_boolean: true
-      },
-      ne: {
-        category: :operator,
-        precedence: 4,
-        associativity: :left,
-        arity: :binary,
-        returns_boolean: true
-      },
-      and: {
-        category: :operator,
-        precedence: 3,
-        associativity: :left,
-        arity: :binary,
-        requires_boolean: true
-      },
-      or: {
-        category: :operator,
-        precedence: 2,
-        associativity: :left,
-        arity: :binary,
-        requires_boolean: true
-      },
-      # Literals with type information
-      integer: {
-        category: :literal,
-        starts_expression: true,
-        ast_class: 'Kumi::Syntax::Literal'
-      },
-      float: {
-        category: :literal,
-        starts_expression: true,
-        ast_class: 'Kumi::Syntax::Literal'
-      },
-      string: {
-        category: :literal,
-        starts_expression: true,
-        ast_class: 'Kumi::Syntax::Literal'
-      },
-      boolean: {
-        category: :literal,
-        starts_expression: true,
-        ast_class: 'Kumi::Syntax::Literal'
-      },
-      # Identifiers and references
-      identifier: {
-        category: :identifier,
-        starts_expression: true,
-        can_be_reference: true
-      },
-      symbol: {
-        category: :identifier,
-        starts_expression: true,
-        is_declaration_name: true
-      },
-      constant: {
-        category: :literal,
-        starts_expression: true,
-        ast_class: 'Kumi::Syntax::Literal'
-      },
-      # Punctuation with parser hints
-      dot: {
-        category: :punctuation,
-        indicates_member_access: true
-      },
-      dot_dot: {
-        category: :range
-      },
-      dot_dot_dot: {
-        category: :range
-      },
-      comma: {
-        category: :punctuation,
-        separates_items: true
-      },
-      colon: {
-        category: :punctuation,
-        indicates_symbol: true
-      },
-      lparen: {
-        category: :punctuation,
-        opens_group: true,
-        group_closer: :rparen,
-        starts_expression: true
-      },
-      rparen: {
-        category: :punctuation,
-        closes_group: true,
-        terminates_expression: true
-      },
-      lbracket: {
-        category: :punctuation,
-        opens_group: true,
-        group_closer: :rbracket,
-        starts_expression: true,
-        indicates_array: true
-      },
-      rbracket: {
-        category: :punctuation,
-        closes_group: true,
-        terminates_expression: true
-      },
-      left_brace: {
-        category: :punctuation,
-        opens_scope: :hash
-      },
-      right_brace: {
-        category: :punctuation,
-        closes_scope: :hash
-      },
-      # Special tokens
-      newline: {
-        category: :whitespace,
-        separates_statements: true
-      },
-      eof: {
-        category: :special,
-        terminates_input: true
-      },
-      comment: {
-        category: :whitespace,
-        ignored_by_parser: true
-      }
-    }.freeze
-    # Character to token mappings
-    CHAR_TO_TOKEN = {
-      '(' => :lparen,
-      ')' => :rparen,
-      '[' => :lbracket,
-      ']' => :rbracket,
-      '{' => :left_brace,
-      '}' => :right_brace,
-      ',' => :comma,
-      '.' => :dot,
-      ':' => :colon,
-      '+' => :add,
-      '-' => :subtract,
-      '*' => :multiply,
-      '/' => :divide,
-      '%' => :modulo,
-      '&' => :and,
-      '|' => :or,
-      '=>' => :arrow
-    }.freeze
-    FUNCTION_SUGAR = {
-      'select' => '__select__',
-      'shift' => 'shift',
-      'roll' => 'roll',
-      'cross' => 'cross',
-      'outer' => 'outer',
-      'index' => 'index',
-      'to_decimal' => 'to_decimal',
-      'to_integer' => 'to_integer',
-      'to_float' => 'to_float',
-      'to_string' => 'to_string'
-    }.freeze
-    # Keywords mapping
-    KEYWORDS = {
-      'schema' => :schema,
-      'input' => :input,
-      'value' => :value,
-      'let' => :let,
-      'trait' => :trait,
-      'import' => :import,
-      'codegen' => :codegen,
-      'from' => :from,
-      'do' => :do,
-      'end' => :end,
-      'on' => :on,
-      'base' => :base,
-      'fn' => :fn,
-      'true' => :boolean,
-      'false' => :boolean,
-      'integer' => :integer_type,
-      'float' => :float_type,
-      'decimal' => :decimal_type,
-      'string' => :string_type,
-      'boolean' => :boolean_type,
-      'any' => :any_type,
-      'array' => :array_type,
-      'hash' => :hash_type,
-      'element' => :element_type
-    }.freeze
-    # Opener to closer mappings for error recovery
-    OPENER_FOR_CLOSER = {
-      rparen: :lparen,
-      rbracket: :lbracket
-    }.freeze
-  end
-end

data/lib/kumi/text_parser.rb DELETED

@@ -1,40 +0,0 @@
-# frozen_string_literal: true
-require_relative 'parser/text_parser'
-module Kumi
-  # Top-level text parser module with same interface as Ruby DSL
-  module TextParser
-    extend self
-    # Parse text schema and return AST (same interface as RubyParser::Dsl.build_syntax_tree)
-    def parse(text, source_file: '<input>')
-      Parser::TextParser.parse(text, source_file: source_file)
-    end
-    # Validate text schema
-    def valid?(text, source_file: '<input>')
-      Parser::TextParser.valid?(text, source_file: source_file)
-    end
-    # Get validation diagnostics
-    def validate(text, source_file: '<input>')
-      Parser::TextParser.validate(text, source_file: source_file)
-    end
-    # Get Monaco Editor format diagnostics
-    def diagnostics_for_monaco(text, source_file: '<input>')
-      Parser::TextParser.diagnostics_for_monaco(text, source_file: source_file)
-    end
-    # Get CodeMirror format diagnostics
-    def diagnostics_for_codemirror(text, source_file: '<input>')
-      Parser::TextParser.diagnostics_for_codemirror(text, source_file: source_file)
-    end
-    # Get JSON format diagnostics
-    def diagnostics_as_json(text, source_file: '<input>')
-      Parser::TextParser.diagnostics_as_json(text, source_file: source_file)
-    end
-  end
-end

data/lib/kumi/text_schema.rb DELETED

@@ -1,31 +0,0 @@
-# frozen_string_literal: true
-require 'kumi'
-require_relative 'text_parser'
-module Kumi
-  # Text-based schema that extends Kumi::Schema with text parsing capabilities
-  class TextSchema
-    extend Kumi::Schema
-    # Create a schema from text using the same pipeline as Ruby DSL
-    def self.from_text(text, source_file: '<input>')
-      # Parse text to AST (same as RubyParser::Dsl.build_syntax_tree)
-      @__kumi_syntax_tree__ = Kumi::TextParser.parse(text, source_file: source_file).freeze
-      @__analyzer_result__ = Analyzer.analyze!(@__kumi_syntax_tree__).freeze
-      @__compiled_schema__ = Compiler.compile(@__kumi_syntax_tree__, analyzer: @__analyzer_result__).freeze
-      Inspector.new(@__kumi_syntax_tree__, @__analyzer_result__, @__compiled_schema__)
-    end
-    # Validate text schema
-    def self.valid?(text, source_file: '<input>')
-      Kumi::TextParser.valid?(text, source_file: source_file)
-    end
-    # Get validation diagnostics
-    def self.validate(text, source_file: '<input>')
-      Kumi::TextParser.validate(text, source_file: source_file)
-    end
-  end
-end