RubyGems - vinter - Versions diffs - 0.2.0 → 0.4.0 - Mend

vinter 0.2.0 → 0.4.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (10)

data/lib/vinter/lexer.rb CHANGED

@@ -2,17 +2,18 @@ module Vinter
   class Lexer
     TOKEN_TYPES = {
       # Vim9 specific keywords
-      keyword: /\b(if|else|elseif|endif|while|endwhile|for|endfor|def|enddef|function|endfunction|return|const|var|final|import|export|class|extends|static|enum|type|vim9script|abort)\b/,
+      keyword: /\b(if|else|elseif|endif|while|endwhile|for|endfor|def|enddef|function|endfunction|endfunc|return|const|var|final|import|export|class|extends|static|enum|type|vim9script|abort|autocmd|echom|echoerr|echohl|echomsg|let|unlet|execute|exec|continue|break|try|catch|finally|endtry|throw|runtime|silent|delete|command|call|set|setlocal|syntax|highlight|sleep|source|nnoremap|nmap|inoremap|imap|vnoremap|vmap|xnoremap|xmap|cnoremap|cmap|noremap|map)\b/,
       # Identifiers can include # and special characters
       identifier: /\b[a-zA-Z_][a-zA-Z0-9_#]*\b/,
       # Single-character operators
-      operator: /[\+\-\*\/=<>!&\|\.]/,
+      operator: /[\+\-\*\/=%<>!&\|\.]/,
       # Multi-character operators handled separately
-      number: /\b\d+(\.\d+)?\b/,
+      number: /\b(0[xX][0-9A-Fa-f]+|0[oO][0-7]+|0[bB][01]+|\d+(\.\d+)?([eE][+-]?\d+)?[smh]?)\b/,
       # Handle both single and double quoted strings
-      string: /"([^"\\]|\\.)*"|'([^'\\]|\\.)*'/,
+      # string: /"(\\"|[^"])*"|'(\\'|[^'])*'/,
+      register_access: /@[a-zA-Z0-9":.%#=*+~_\/\-]/,
       # Vim9 comments use #
-      comment: /#.*/,
+      comment: /(#|").*/,
       whitespace: /\s+/,
       brace_open: /\{/,
       brace_close: /\}/,
@@ -23,8 +24,12 @@ module Vinter
       colon: /:/,
       semicolon: /;/,
       comma: /,/,
+      backslash: /\\/,
+      question_mark: /\?/,
+      command_separator: /\|/,
     }
+    CONTINUATION_OPERATORS = %w(. .. + - * / = == ==# ==? != > < >= <= && || ? : -> =>)
     def initialize(input)
       @input = input
       @tokens = []
@@ -33,36 +38,428 @@ module Vinter
       @column = 1
     end
+    def should_parse_as_regex
+      # Look at recent tokens to determine if we're in a regex context
+      recent_tokens = @tokens.last(3)
+      # Check for contexts where regex is expected
+      return true if recent_tokens.any? { |t|
+        t && t[:type] == :keyword && ['syntax'].include?(t[:value])
+      }
+      return true if recent_tokens.any? { |t|
+        t && t[:type] == :identifier && ['match', 'region', 'keyword'].include?(t[:value])
+      }
+      # Check for comparison operators that often use regex
+      return true if recent_tokens.any? { |t|
+        t && t[:type] == :operator && ['=~', '!~', '=~#', '!~#', '=~?', '!~?'].include?(t[:value])
+      }
+      false
+    end
+    def find_unescaped_newline(chunk)
+      i = 0
+      while i < chunk.length
+        if chunk[i] == "\n" && (i == 0 || chunk[i - 1] != '\\')
+          return i
+        end
+        i += 1
+      end
+      nil # Return nil if no unescaped newline is found
+    end
     def tokenize
       until @position >= @input.length
         chunk = @input[@position..-1]
+        # First check if the line starts with a quote (comment in Vim)
+        # Check if we're at the beginning of a line (optionally after whitespace)
+        line_start = @position == 0 || @input[@position - 1] == "\n"
+        if !line_start
+          # Check if we're after whitespace at the start of a line
+          temp_pos = @position - 1
+          while temp_pos >= 0 && @input[temp_pos] =~ /[ \t]/
+            temp_pos -= 1
+          end
+          line_start = temp_pos < 0 || @input[temp_pos] == "\n"
+        end
-        # Handle multi-character operators explicitly
-        if match = chunk.match(/\A(==|!=|=>|->|\.\.)/)
-          @tokens << {
-            type: :operator,
-            value: match[0],
-            line: @line_num,
-            column: @column
+        # If we're at the start of a line and it begins with a quote
+        if line_start && chunk.start_with?('"')
+          # Find the end of the line
+          line_end = find_unescaped_newline(chunk) || chunk.length
+          comment_text = chunk[0...line_end]
+          @tokens << {
+            type: :comment,
+            value: comment_text,
+            line: @line_num,
+            column: @column
+          }
+          @position += comment_text.length
+          @column += comment_text.length
+          next
+        end
+        # Handle string literals manually
+        if chunk.start_with?("'") || chunk.start_with?('"')
+          quote = chunk[0]
+          i = 1
+          escaped = false
+          string_value = quote
+          # Keep going until we find an unescaped closing quote
+          while i < chunk.length
+            char = chunk[i]
+            string_value += char
+            if char == '\\' && !escaped
+              escaped = true
+            elsif (char == "\n" or char == quote) && !escaped
+              # Found closing quote
+              break
+            elsif escaped
+              escaped = false
+            end
+            i += 1
+          end
+          # Add the string token if we found a closing quote
+          if i < chunk.length || (i == chunk.length && chunk[-1] == quote)
+            @tokens << {
+              type: :string,
+              value: string_value,
+              line: @line_num,
+              column: @column
+            }
+            @column += string_value.length
+            @position += string_value.length
+            @line_num += 1 if string_value.include?("\n")
+            next
+          end
+        end
+        # Add special handling for command options in the tokenize method
+        if chunk.start_with?('<q-args>', '<f-args>', '<args>')
+          arg_token = chunk.match(/\A(<q-args>|<f-args>|<args>)/)[0]
+          @tokens << {
+            type: :command_arg_placeholder,
+            value: arg_token,
+            line: @line_num,
+            column: @column
+          }
+          @column += arg_token.length
+          @position += arg_token.length
+          next
+        end
+        # Special handling for a:000 variable arguments array
+        if chunk =~ /\Aa:0+/
+          varargs_token = chunk.match(/\Aa:0+/)[0]
+          @tokens << {
+            type: :arg_variable,
+            value: varargs_token,
+            line: @line_num,
+            column: @column
+          }
+          @column += varargs_token.length
+          @position += varargs_token.length
+          next
+        end
+        # Also add special handling for 'silent!' keyword
+        # Add this after the keyword check in tokenize method
+        if chunk.start_with?('silent!')
+          @tokens << {
+            type: :silent_bang,
+            value: 'silent!',
+            line: @line_num,
+            column: @column
+          }
+          @column += 7
+          @position += 7
+          next
+        end
+        # Check for keywords first, before other token types
+        if match = chunk.match(/\A\b(if|else|elseif|endif|while|endwhile|for|endfor|def|enddef|function|endfunction|endfunc|return|const|var|final|import|export|class|extends|static|enum|type|vim9script|abort|autocmd|echoerr|echohl|echomsg|let|unlet|execute|setlocal|syntax|highlight|sleep|source)\b/)
+          @tokens << {
+            type: :keyword,
+            value: match[0],
+            line: @line_num,
+            column: @column
+          }
+          @column += match[0].length
+          @position += match[0].length
+          next
+        end
+        # Handle Vim scoped option variables with &l: or &g: prefix
+        if match = chunk.match(/\A&[lg]:[a-zA-Z_][a-zA-Z0-9_]*/)
+          @tokens << {
+            type: :scoped_option_variable,
+            value: match[0],
+            line: @line_num,
+            column: @column
           }
           @column += match[0].length
           @position += match[0].length
           next
         end
+        # Handle Vim option variables with & prefix
+        if match = chunk.match(/\A&[a-zA-Z_][a-zA-Z0-9_]*/)
+          @tokens << {
+            type: :option_variable,
+            value: match[0],
+            line: @line_num,
+            column: @column
+          }
+          @column += match[0].length
+          @position += match[0].length
+          next
+        end
+        # Handle Vim special variables with v: prefix
+        if match = chunk.match(/\Av:[a-zA-Z_][a-zA-Z0-9_]*/)
+          @tokens << {
+            type: :special_variable,
+            value: match[0],
+            line: @line_num,
+            column: @column
+          }
+          @column += match[0].length
+          @position += match[0].length
+          next
+        end
+        # Handle script-local identifiers with s: prefix
+        if match = chunk.match(/\As:[a-zA-Z_][a-zA-Z0-9_]*/)
+          @tokens << {
+            type: :script_local,
+            value: match[0],
+            line: @line_num,
+            column: @column
+          }
+          @column += match[0].length
+          @position += match[0].length
+          next
+        end
+        # Handle buffer-local identifiers with b: prefix
+        if match = chunk.match(/\Ab:[a-zA-Z_][a-zA-Z0-9_]*/)
+          @tokens << {
+            type: :buffer_local,
+            value: match[0],
+            line: @line_num,
+            column: @column
+          }
+          @column += match[0].length
+          @position += match[0].length
+          next
+        end
+        # Handle window-local identifiers with w: prefix
+        if match = chunk.match(/\Aw:[a-zA-Z_][a-zA-Z0-9_]*/)
+          @tokens << {
+            type: :window_local,
+            value: match[0],
+            line: @line_num,
+            column: @column
+          }
+          @column += match[0].length
+          @position += match[0].length
+          next
+        end
+        # Handle tab-local identifiers with t: prefix
+        if match = chunk.match(/\At:[a-zA-Z_][a-zA-Z0-9_]*/)
+          @tokens << {
+            type: :tab_local,
+            value: match[0],
+            line: @line_num,
+            column: @column
+          }
+          @column += match[0].length
+          @position += match[0].length
+          next
+        end
+        # Handle global variables with g: prefix
+        if match = chunk.match(/\Ag:[a-zA-Z_][a-zA-Z0-9_]*/)
+          @tokens << {
+            type: :global_variable,
+            value: match[0],
+            line: @line_num,
+            column: @column
+          }
+          @column += match[0].length
+          @position += match[0].length
+          next
+        end
+        # Handle argument variables with a: prefix
+        if match = chunk.match(/\Aa:[a-zA-Z_][a-zA-Z0-9_]*/) || match = chunk.match(/\Aa:[A-Z0-9]/)
+          @tokens << {
+            type: :arg_variable,
+            value: match[0],
+            line: @line_num,
+            column: @column
+          }
+          @column += match[0].length
+          @position += match[0].length
+          next
+        end
+        # Handle argument variables with a: prefix
+        if match = chunk.match(/\Al:[a-zA-Z_][a-zA-Z0-9_]*/)
+          @tokens << {
+            type: :local_variable,
+            value: match[0],
+            line: @line_num,
+            column: @column
+          }
+          @column += match[0].length
+          @position += match[0].length
+          next
+        end
+        # Add support for standalone namespace prefixes (like g:)
+        if match = chunk.match(/\A([sgbwtal]):/)
+          @tokens << {
+            type: :namespace_prefix,
+            value: match[0],
+            line: @line_num,
+            column: @column
+          }
+          @column += match[0].length
+          @position += match[0].length
+          next
+        end
+        # Handle compound assignment operators
+        if match = chunk.match(/\A(\+=|-=|\*=|\/=|\.\.=|\.=)/)
+          @tokens << {
+            type: :compound_operator,
+            value: match[0],
+            line: @line_num,
+            column: @column
+          }
+          @column += match[0].length
+          @position += match[0].length
+          next
+        end
         # Handle ellipsis for variable args
         if chunk.start_with?('...')
-          @tokens << {
-            type: :ellipsis,
-            value: '...',
-            line: @line_num,
-            column: @column
+          @tokens << {
+            type: :ellipsis,
+            value: '...',
+            line: @line_num,
+            column: @column
           }
           @column += 3
           @position += 3
           next
         end
+        # Handle multi-character operators explicitly
+        if match = chunk.match(/\A(=~#|=~\?|=~|!~#|!~\?|!~|==#|==\?|==|!=#|!=\?|!=|=>\?|=>|>=#|>=\?|>=|<=#|<=\?|<=|->#|->\?|->|\.\.|\|\||&&)/)
+          @tokens << {
+            type: :operator,
+            value: match[0],
+            line: @line_num,
+            column: @column
+          }
+          @column += match[0].length
+          @position += match[0].length
+          next
+        end
+        # Handle regex patterns /pattern/ - only in specific contexts
+        if chunk.start_with?('/') && should_parse_as_regex
+          i = 1
+          regex_value = '/'
+          # Keep going until we find the closing slash
+          while i < chunk.length
+            char = chunk[i]
+            regex_value += char
+            if char == '/' && (i == 1 || chunk[i-1] != '\\')
+              # Found closing slash
+              i += 1
+              break
+            end
+            i += 1
+          end
+          # Add the regex token if we found a closing slash
+          if regex_value.end_with?('/')
+            @tokens << {
+              type: :regex,
+              value: regex_value,
+              line: @line_num,
+              column: @column
+            }
+            @column += regex_value.length
+            @position += regex_value.length
+            next
+          end
+        end
+        # Handle hex colors like #33FF33
+        if match = chunk.match(/\A#[0-9A-Fa-f]{6}/)
+          @tokens << {
+            type: :hex_color,
+            value: match[0],
+            line: @line_num,
+            column: @column
+          }
+          @column += match[0].length
+          @position += match[0].length
+          next
+        end
+        # Handle register access (@a, @", etc.)
+        if chunk =~ /\A@[a-zA-Z0-9":.%#=*+~_\/\-]/
+          register_token = chunk.match(/\A@[a-zA-Z0-9":.%#=*+~_\/\-]/)[0]
+          @tokens << {
+            type: :register_access,
+            value: register_token,
+            line: @line_num,
+            column: @column
+          }
+          @column += register_token.length
+          @position += register_token.length
+          next
+        end
+        # In the tokenize method, add special handling for common mapping components
+        if chunk.start_with?('<CR>', '<Esc>', '<Tab>', '<Space>', '<C-') ||
+           (chunk =~ /\A<[A-Za-z0-9\-_]+>/)
+          # Extract the special key notation
+          match = chunk.match(/\A(<[^>]+>)/)
+          if match
+            special_key = match[1]
+            @tokens << {
+              type: :special_key,
+              value: special_key,
+              line: @line_num,
+              column: @column
+            }
+            @position += special_key.length
+            @column += special_key.length
+            next
+          end
+        end
         # Skip whitespace but track position
         if match = chunk.match(/\A(\s+)/)
           whitespace = match[0]
@@ -77,20 +474,55 @@ module Vinter
           @position += whitespace.length
           next
         end
+        # Handle backslash for line continuation
+        if chunk.start_with?('\\')
+          @tokens << {
+            type: :line_continuation,
+            value: '\\',
+            line: @line_num,
+            column: @column
+          }
+          @column += 1
+          @position += 1
+          # If followed by a newline, advance to next line
+          if @position < @input.length && @input[@position] == "\n"
+            @line_num += 1
+            @column = 1
+            @position += 1
+          end
+          next
+        end
+        # Check for special case where 'function' is followed by '('
+        # which likely means it's used as a built-in function
+        if chunk =~ /\Afunction\s*\(/
+          @tokens << {
+            type: :identifier,  # Treat as identifier, not keyword
+            value: 'function',
+            line: @line_num,
+            column: @column
+          }
+          @column += 'function'.length
+          @position += 'function'.length
+          next
+        end
         match_found = false
         TOKEN_TYPES.each do |type, pattern|
           if match = chunk.match(/\A(#{pattern})/)
             value = match[0]
-            token = {
-              type: type,
-              value: value,
-              line: @line_num,
-              column: @column
+            token = {
+              type: type,
+              value: value,
+              line: @line_num,
+              column: @column
             }
             @tokens << token unless type == :whitespace
             # Update position
             if value.include?("\n")
               lines = value.split("\n")
@@ -103,33 +535,33 @@ module Vinter
             else
               @column += value.length
             end
             @position += value.length
             match_found = true
             break
           end
         end
         unless match_found
           # Try to handle unknown characters
-          @tokens << {
-            type: :unknown,
-            value: chunk[0],
-            line: @line_num,
-            column: @column
+          @tokens << {
+            type: :unknown,
+            value: chunk[0],
+            line: @line_num,
+            column: @column
           }
           if chunk[0] == "\n"
             @line_num += 1
             @column = 1
           else
             @column += 1
           end
           @position += 1
         end
       end
       @tokens
     end
   end

data/lib/vinter/linter.rb CHANGED

@@ -1,7 +1,12 @@
+require "yaml"
 module Vinter
   class Linter
-    def initialize
+    def initialize(config_path: nil)
       @rules = []
+      @ignored_rules = []
+      @config_path = config_path || find_config_path
+      load_config
       register_default_rules
     end
@@ -94,7 +99,7 @@ module Vinter
       lexer = Lexer.new(content)
       tokens = lexer.tokenize
-      parser = Parser.new(tokens)
+      parser = Parser.new(tokens, content)
       result = parser.parse
       issues = []
@@ -121,8 +126,9 @@ module Vinter
         }
       end
-      # Apply rules
+      # Apply rules, ignoring those specified in config
       @rules.each do |rule|
+        next if @ignored_rules.include?(rule.id)
         rule_issues = rule.apply(result[:ast])
         issues.concat(rule_issues.map { |i| {
           type: :rule,
@@ -135,6 +141,25 @@ module Vinter
       issues
     end
+    private
+    def find_config_path
+      # check for project level config
+      project_config = Dir.glob(".vinter{.yaml,.yml,}").first
+      project_config if project_config
+      # check for user-level config
+      user_config = File.expand_path("~/.vinter")
+      user_config if File.exist?(user_config)
+    end
+    def load_config
+      return unless @config_path && File.exist?(@config_path)
+      config = YAML.load_file(@config_path)
+      @ignored_rules = config["ignore_rules"] || []
+    end
   end
   class Rule