layo 1.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (74)
  1. data/LICENSE +26 -0
  2. data/README.mkd +103 -0
  3. data/Rakefile +21 -0
  4. data/UnicodeData.txt +23697 -0
  5. data/bin/layo +22 -0
  6. data/layo.gemspec +23 -0
  7. data/lib/layo.rb +11 -0
  8. data/lib/layo/ast.rb +5 -0
  9. data/lib/layo/ast/block.rb +13 -0
  10. data/lib/layo/ast/expression.rb +14 -0
  11. data/lib/layo/ast/node.rb +6 -0
  12. data/lib/layo/ast/program.rb +9 -0
  13. data/lib/layo/ast/statement.rb +10 -0
  14. data/lib/layo/interpreter.rb +360 -0
  15. data/lib/layo/lexer.rb +162 -0
  16. data/lib/layo/parser.rb +371 -0
  17. data/lib/layo/peekable.rb +31 -0
  18. data/lib/layo/runtime_error.rb +9 -0
  19. data/lib/layo/syntax_error.rb +14 -0
  20. data/lib/layo/tokenizer.rb +119 -0
  21. data/lib/layo/unexpected_token_error.rb +13 -0
  22. data/lib/layo/unicode.rb +23614 -0
  23. data/lib/layo/unknown_token_error.rb +7 -0
  24. data/spec/interpreter_spec.rb +52 -0
  25. data/spec/lexer_spec.rb +176 -0
  26. data/spec/parser_spec.rb +373 -0
  27. data/spec/source/basic/comments.lol +16 -0
  28. data/spec/source/basic/comments.out +2 -0
  29. data/spec/source/basic/line-continuation.lol +8 -0
  30. data/spec/source/basic/line-continuation.out +2 -0
  31. data/spec/source/basic/line-endings.lol +5 -0
  32. data/spec/source/basic/line-endings.out +3 -0
  33. data/spec/source/basic/minimal.lol +2 -0
  34. data/spec/source/casting/boolean.lol +8 -0
  35. data/spec/source/casting/boolean.out +5 -0
  36. data/spec/source/casting/float.lol +10 -0
  37. data/spec/source/casting/float.out +5 -0
  38. data/spec/source/casting/int.lol +9 -0
  39. data/spec/source/casting/int.out +4 -0
  40. data/spec/source/casting/nil.lol +9 -0
  41. data/spec/source/casting/nil.out +4 -0
  42. data/spec/source/casting/string.lol +5 -0
  43. data/spec/source/casting/string.out +2 -0
  44. data/spec/source/expressions/boolean.lol +30 -0
  45. data/spec/source/expressions/boolean.out +17 -0
  46. data/spec/source/expressions/cast.lol +28 -0
  47. data/spec/source/expressions/cast.out +20 -0
  48. data/spec/source/expressions/function.lol +24 -0
  49. data/spec/source/expressions/function.out +4 -0
  50. data/spec/source/expressions/math.lol +9 -0
  51. data/spec/source/expressions/math.out +7 -0
  52. data/spec/source/expressions/string.lol +20 -0
  53. data/spec/source/expressions/string.out +7 -0
  54. data/spec/source/statements/assignment.lol +8 -0
  55. data/spec/source/statements/assignment.out +3 -0
  56. data/spec/source/statements/cast.lol +11 -0
  57. data/spec/source/statements/cast.out +3 -0
  58. data/spec/source/statements/declaration.lol +9 -0
  59. data/spec/source/statements/declaration.out +2 -0
  60. data/spec/source/statements/expression.lol +10 -0
  61. data/spec/source/statements/expression.out +2 -0
  62. data/spec/source/statements/if_then_else.lol +42 -0
  63. data/spec/source/statements/if_then_else.out +3 -0
  64. data/spec/source/statements/input.in +1 -0
  65. data/spec/source/statements/input.lol +4 -0
  66. data/spec/source/statements/input.out +1 -0
  67. data/spec/source/statements/loop.lol +50 -0
  68. data/spec/source/statements/loop.out +20 -0
  69. data/spec/source/statements/print.lol +7 -0
  70. data/spec/source/statements/print.out +2 -0
  71. data/spec/source/statements/switch.lol +95 -0
  72. data/spec/source/statements/switch.out +12 -0
  73. data/spec/tokenizer_spec.rb +105 -0
  74. metadata +135 -0
data/lib/layo/lexer.rb ADDED
@@ -0,0 +1,162 @@
1
+ # encoding: UTF-8
2
+ module Layo
3
+ class Lexer
4
+ include Peekable
5
+ # Input stream. Must be an instance of IO class (File, StringIO)
6
+ attr_accessor :input
7
+ # Current line number (1-based) and position (0-based) of cursor
8
+ attr_reader :pos, :line_no
9
+
10
+ def initialize(io = nil)
11
+ self.input = io unless io.nil?
12
+ end
13
+
14
+ # Sets input stream and resets variables
15
+ def input=(io)
16
+ @input = io
17
+ reset
18
+ end
19
+
20
+ # Resets this lexer instance
21
+ def reset
22
+ @line_no, @last_lexeme = 0, ["\n"]
23
+ super
24
+ end
25
+
26
+ def space?(char)
27
+ char == ' ' || char == "\t"
28
+ end
29
+
30
+ # Tells whether there is a lexeme delimiter at position pos in current line
31
+ def lexeme_delimiter?(pos)
32
+ @line[pos] == '!' || @line[pos] == ',' ||
33
+ @line[pos] == "\n" || space?(@line[pos]) ||
34
+ @line[pos] == '…' || @line[pos, 3] == '...'
35
+ end
36
+
37
+ # Reads and returns next lexeme
38
+ def next_item
39
+ return @last_lexeme if @last_lexeme[0].nil?
40
+ while true
41
+ @line = next_line if @line_no.zero? || @pos > @line.length - 1
42
+ if @line.nil?
43
+ lexeme = [nil, @line_no, 1]
44
+ break
45
+ end
46
+
47
+ # Skip whitespaces
48
+ while space?(@line[@pos])
49
+ @pos += 1
50
+ end
51
+
52
+ # Skip triple dot characters (join lines)
53
+ if @line[@pos, 4] == "...\n" || @line[@pos, 2] == "…\n"
54
+ line_no, pos = @line_no, @pos + 1
55
+ @line, @pos = next_line, 0
56
+ if @line.nil? || @line.strip.empty?
57
+ raise SyntaxError.new(line_no, pos, 'Line continuation may not be followed by an empty line')
58
+ end
59
+ next
60
+ end
61
+
62
+ # Skip one line comments
63
+ if @line[@pos, 3] == 'BTW'
64
+ @pos = @line.length - 1
65
+ end
66
+ # and multiline ones
67
+ if @last_lexeme[0] == "\n" && @line[@pos, 4] == 'OBTW'
68
+ tldr_found, line_no, pos = false, @line_no, @pos + 1
69
+ while true
70
+ @line = next_line
71
+ break if @line.nil?
72
+ m = @line.chomp.match(/(^|\s+)TLDR\s*(,|$)/)
73
+ unless m.nil?
74
+ tldr_found = true
75
+ @pos = m.end(0)
76
+ break
77
+ end
78
+ end
79
+ unless tldr_found
80
+ raise SyntaxError.new(line_no, pos, 'Unterminated multiline comment')
81
+ end
82
+ next
83
+ end
84
+
85
+ if @line[@pos] == "\n" || @line[@pos] == '!'
86
+ # Handle newline and bang separately
87
+ lexeme = [@line[@pos], @line_no, @pos + 1]
88
+ @pos += 1
89
+ elsif @line[@pos] == ','
90
+ # Comma is a virtual newline
91
+ lexeme = ["\n", @line_no, @pos + 1]
92
+ @pos += 1
93
+ elsif @line[@pos] == '"'
94
+ # Strings begin with "
95
+ # Need to handle empty strings separately
96
+ if @line[@pos + 1] == '"'
97
+ string = '""'
98
+ else
99
+ m = @line.match(/([^:](?:::)*)"/, @pos + 1)
100
+ string = @line[@pos..m.end(0) - 1] unless m.nil?
101
+ end
102
+ # String must be followed by an allowed lexeme delimiter
103
+ if string.nil? || !lexeme_delimiter?(@pos + string.length)
104
+ raise SyntaxError.new(@line_no, @pos + 1, 'Unterminated string constant')
105
+ end
106
+ lexeme = [%Q["#{escape_string(string[1..-2])}"], @line_no, @pos + 1]
107
+ @pos = @pos + string.length
108
+ else
109
+ # Grab as much characters as we can until meeting lexeme delimiter
110
+ # Treat what we grabbed as a lexeme
111
+ seq, pos = '', @pos + 1
112
+ until lexeme_delimiter?(@pos)
113
+ seq += @line[@pos]
114
+ @pos += 1
115
+ end
116
+ lexeme = [seq, @line_no, pos]
117
+ end
118
+
119
+ break
120
+ end
121
+ @last_lexeme = lexeme
122
+ end
123
+
124
+ # Reads and returns next line from input stream. Converts newline
125
+ # character to \n
126
+ # returns nil upon reaching EOF
127
+ def next_line
128
+ return nil if @input.eof?
129
+ line, ch, @pos, @line_no = '', '', 0, @line_no + 1
130
+ until ch == "\r" || ch == "\n" || ch.nil?
131
+ ch = @input.getc
132
+ line += ch unless ch.nil?
133
+ end
134
+ if ch == "\r"
135
+ ch = @input.getc
136
+ @input.ungetc(ch) unless ch == "\n" || ch.nil?
137
+ end
138
+ line.chomp << "\n"
139
+ end
140
+
141
+ # Performs substitution of escape characters in string
142
+ def escape_string(str)
143
+ replacement = {
144
+ ':)' => "\n", ':>' => "\t", ':o' => "\a", ':"' => '"', '::' => ':'
145
+ }
146
+ str
147
+ .gsub(/:[\)>o":]/, replacement)
148
+ .gsub(/:\(([0-9a-fA-F]+)\)/) do |match|
149
+ $1.to_i(16).chr(Encoding::UTF_8)
150
+ end
151
+ .gsub(/:\[(.+?)\]/) do |match|
152
+ code = Unicode::DATA[$1]
153
+ if code
154
+ code.chr(Encoding::UTF_8)
155
+ else
156
+ $stderr.puts("Unknown Unicode normative name: #{$1}")
157
+ match
158
+ end
159
+ end
160
+ end
161
+ end
162
+ end
@@ -0,0 +1,371 @@
1
+ module Layo
2
+ class Parser
3
+ attr_accessor :tokenizer
4
+ attr_reader :functions
5
+
6
+ def initialize(tokenizer)
7
+ @tokenizer, @functions = tokenizer, {}
8
+ end
9
+
10
+ # Function declarations should be parsed first in order to properly
11
+ # parse argument list and allow calling functions before their definition.
12
+ # So this method should be called as the first pass before parsing begins
13
+ def parse_function_declarations
14
+ @functions = {}
15
+ @tokenizer.reset_peek
16
+ until (token = @tokenizer.peek)[:type] == :eof
17
+ if token[:type] == :how_duz_i
18
+ # Function name must follow
19
+ token = @tokenizer.peek
20
+ unless token[:type] == :identifier
21
+ raise UnexpectedTokenError, token
22
+ end
23
+ name = token[:data]
24
+ args = []
25
+ token = @tokenizer.peek
26
+ if token[:type] == :yr
27
+ # Function arguments must follow
28
+ begin
29
+ token = @tokenizer.peek
30
+ unless token[:type] == :identifier
31
+ raise UnexpectedTokenError, token
32
+ end
33
+ args << token[:data]
34
+ end while @tokenizer.peek[:type] == :an_yr
35
+ end
36
+ @tokenizer.unpeek
37
+ @functions[name] = args
38
+ # Newline must follow
39
+ token = @tokenizer.peek
40
+ unless token[:type] == :newline
41
+ raise UnexpectedTokenError, token
42
+ end
43
+ end
44
+ end
45
+ @tokenizer.reset_peek
46
+ end
47
+
48
+ def parse_program
49
+ parse_function_declarations
50
+ skip_newlines
51
+ expect_token(:hai)
52
+ version = expect_token(:float)[:data]
53
+ expect_token(:newline)
54
+ block = parse_block
55
+ expect_token(:kthxbye)
56
+ skip_newlines
57
+ expect_token(:eof)
58
+ Ast::Program.new(version, block)
59
+ end
60
+
61
+ alias_method :parse, :parse_program
62
+
63
+ def expect_token(*types)
64
+ token = @tokenizer.next
65
+ raise UnexpectedTokenError, token unless types.include?(token[:type])
66
+ token
67
+ end
68
+
69
+ def skip_newlines
70
+ while @tokenizer.peek[:type] == :newline
71
+ @tokenizer.next
72
+ end
73
+ @tokenizer.unpeek
74
+ end
75
+
76
+ def parse_block
77
+ statements = []
78
+ begin
79
+ skip_newlines
80
+ unless (name = next_statement).nil?
81
+ statements << parse_statement(name)
82
+ end
83
+ end until name.nil?
84
+ Ast::Block.new(statements)
85
+ end
86
+
87
+ def next_statement
88
+ return 'assignment' if @tokenizer.try(:identifier, :r)
89
+ return 'break' if @tokenizer.try(:gtfo)
90
+ return 'cast' if @tokenizer.try(:identifier, :is_now_a)
91
+ return 'condition' if @tokenizer.try(:o_rly?)
92
+ return 'declaration' if @tokenizer.try(:i_has_a)
93
+ return 'function' if @tokenizer.try(:how_duz_i)
94
+ return 'input' if @tokenizer.try(:gimmeh)
95
+ return 'loop' if @tokenizer.try(:im_in_yr)
96
+ return 'print' if @tokenizer.try(:visible)
97
+ return 'return' if @tokenizer.try(:found_yr)
98
+ return 'switch' if @tokenizer.try(:wtf?)
99
+ return 'expression' if !next_expression.nil?
100
+ nil
101
+ end
102
+
103
+ def parse_statement(name)
104
+ token = @tokenizer.peek
105
+ @tokenizer.unpeek
106
+ statement = send("parse_#{name}_statement".to_sym)
107
+ expect_token(:newline)
108
+ statement.line = token[:line]
109
+ statement
110
+ end
111
+
112
+ def parse_assignment_statement
113
+ attrs = { identifier: expect_token(:identifier)[:data] }
114
+ expect_token(:r)
115
+ attrs[:expression] = parse_expression
116
+ Ast::Statement.new('assignment', attrs)
117
+ end
118
+
119
+ def parse_break_statement
120
+ expect_token(:gtfo)
121
+ Ast::Statement.new('break')
122
+ end
123
+
124
+ def parse_cast_statement
125
+ attrs = { identifier: expect_token(:identifier)[:data] }
126
+ expect_token(:is_now_a)
127
+ attrs[:to] = expect_token(:noob, :troof, :numbr, :numbar, :yarn)[:type]
128
+ Ast::Statement.new('cast', attrs)
129
+ end
130
+
131
+ def parse_condition_statement
132
+ expect_token(:o_rly?)
133
+ expect_token(:newline)
134
+ expect_token(:ya_rly)
135
+ expect_token(:newline)
136
+ attrs = { then: parse_block, elseif: [] }
137
+ while @tokenizer.peek[:type] == :mebbe
138
+ expect_token(:mebbe)
139
+ condition = parse_expression
140
+ expect_token(:newline)
141
+ attrs[:elseif] << { condition: condition, block: parse_block }
142
+ end
143
+ @tokenizer.unpeek
144
+ if @tokenizer.peek[:type] == :no_wai
145
+ expect_token(:no_wai)
146
+ expect_token(:newline)
147
+ attrs[:else] = parse_block
148
+ end
149
+ @tokenizer.unpeek
150
+ expect_token(:oic)
151
+ Ast::Statement.new('condition', attrs)
152
+ end
153
+
154
+ def parse_declaration_statement
155
+ expect_token(:i_has_a)
156
+ attrs = { identifier: expect_token(:identifier)[:data] }
157
+ if @tokenizer.peek[:type] == :itz
158
+ @tokenizer.next
159
+ attrs[:initialization] = parse_expression
160
+ end
161
+ @tokenizer.unpeek
162
+ Ast::Statement.new('declaration', attrs)
163
+ end
164
+
165
+ def parse_expression_statement
166
+ attrs = { expression: parse_expression }
167
+ Ast::Statement.new('expression', attrs)
168
+ end
169
+
170
+ def parse_function_statement
171
+ expect_token(:how_duz_i)
172
+ name = expect_token(:identifier)[:data]
173
+ if @functions.has_key?(name)
174
+ # Function definition was parsed in the first pass
175
+ until @tokenizer.next[:type] == :newline; end
176
+ args = @functions[name]
177
+ else
178
+ # Parse argument list as usual
179
+ args = []
180
+ if @tokenizer.peek[:type] == :yr
181
+ begin
182
+ @tokenizer.next
183
+ args << expect_token(:identifier)[:data]
184
+ end while @tokenizer.peek[:type] == :an_yr
185
+ end
186
+ @tokenizer.unpeek
187
+ expect_token(:newline)
188
+ @functions[name] = args
189
+ end
190
+ block = parse_block
191
+ expect_token(:if_u_say_so)
192
+ Ast::Statement.new('function', { name: name, args: args, block: block })
193
+ end
194
+
195
+ def parse_input_statement
196
+ expect_token(:gimmeh)
197
+ attrs = { identifier: expect_token(:identifier)[:data] }
198
+ Ast::Statement.new('input', attrs)
199
+ end
200
+
201
+ def parse_loop_statement
202
+ loop_start = expect_token(:im_in_yr)
203
+ label_begin = expect_token(:identifier)[:data]
204
+ attrs = {}
205
+ if [:uppin, :nerfin, :identifier].include?(@tokenizer.peek[:type])
206
+ attrs[:op] = expect_token(:uppin, :nerfin, :identifier)
207
+ expect_token(:yr)
208
+ attrs[:op] = attrs[:op][:type] == :identifier ? attrs[:op][:data] :
209
+ attrs[:op][:type]
210
+ attrs[:counter] = expect_token(:identifier)[:data]
211
+ end
212
+ @tokenizer.unpeek
213
+ if [:til, :wile].include?(@tokenizer.peek[:type])
214
+ attrs[:guard] = { type: expect_token(:til, :wile)[:type] }
215
+ attrs[:guard][:expression] = parse_expression
216
+ end
217
+ @tokenizer.unpeek
218
+ attrs[:block] = parse_block
219
+ expect_token(:im_outta_yr)
220
+ label_end = expect_token(:identifier)[:data]
221
+ unless label_begin == label_end
222
+ raise SyntaxError.new(
223
+ loop_start[:line], loop_start[:pos],
224
+ "Loop labels don't match: '#{label_begin}' and '#{label_end}'"
225
+ )
226
+ end
227
+ attrs[:label] = label_begin
228
+ Ast::Statement.new('loop', attrs)
229
+ end
230
+
231
+ def parse_print_statement
232
+ expect_token(:visible)
233
+ attrs = { expressions: [parse_expression] }
234
+ until (name = next_expression).nil?
235
+ attrs[:expressions] << parse_expression(name)
236
+ end
237
+ attrs[:suppress] = false
238
+ if @tokenizer.peek[:type] == :exclamation
239
+ @tokenizer.next
240
+ attrs[:suppress] = true
241
+ end
242
+ @tokenizer.unpeek
243
+ Ast::Statement.new('print', attrs)
244
+ end
245
+
246
+ def parse_return_statement
247
+ expect_token(:found_yr)
248
+ attrs = { expression: parse_expression }
249
+ Ast::Statement.new('return', attrs)
250
+ end
251
+
252
+ def parse_switch_statement
253
+ expect_token(:wtf?)
254
+ expect_token(:newline)
255
+ parse_case = lambda do
256
+ expect_token(:omg)
257
+ expression = parse_expression('constant')
258
+ expect_token(:newline)
259
+ { expression: expression, block: parse_block }
260
+ end
261
+ attrs = { cases: [parse_case.call] }
262
+ while @tokenizer.peek[:type] == :omg
263
+ attrs[:cases] << parse_case.call
264
+ end
265
+ @tokenizer.unpeek
266
+ if @tokenizer.peek[:type] == :omgwtf
267
+ expect_token(:omgwtf)
268
+ expect_token(:newline)
269
+ attrs[:default] = parse_block
270
+ end
271
+ @tokenizer.unpeek
272
+ expect_token(:oic)
273
+ Ast::Statement.new('switch', attrs)
274
+ end
275
+
276
+ # Returns internal name of the next expression
277
+ def next_expression
278
+ return 'binary' if @tokenizer.try([
279
+ :sum_of, :diff_of, :produkt_of, :quoshunt_of, :mod_of, :biggr_of,
280
+ :smallr_of, :both_of, :either_of, :won_of, :both_saem, :diffrint
281
+ ])
282
+ return 'cast' if @tokenizer.try(:maek)
283
+ return 'constant' if @tokenizer.try([:boolean, :integer, :float, :string])
284
+ return 'identifier' if @tokenizer.try(:identifier)
285
+ return 'nary' if @tokenizer.try([:all_of, :any_of, :smoosh])
286
+ return 'unary' if @tokenizer.try(:not)
287
+ nil
288
+ end
289
+
290
+ def parse_expression(name = nil)
291
+ token = @tokenizer.peek
292
+ @tokenizer.unpeek
293
+ name = next_expression unless name
294
+ unless name
295
+ raise SyntaxError.new(token[:line], token[:pos], 'Expected expression')
296
+ end
297
+ send("parse_#{name}_expression".to_sym)
298
+ end
299
+
300
+ def parse_binary_expression
301
+ attrs = {
302
+ operator: expect_token(
303
+ :sum_of, :diff_of, :produkt_of, :quoshunt_of, :mod_of, :biggr_of,
304
+ :smallr_of, :both_of, :either_of, :won_of, :both_saem, :diffrint
305
+ )[:type]
306
+ }
307
+ attrs[:left] = parse_expression
308
+ @tokenizer.next if @tokenizer.peek[:type] == :an
309
+ @tokenizer.unpeek
310
+ attrs[:right] = parse_expression
311
+ Ast::Expression.new('binary', attrs)
312
+ end
313
+
314
+ def parse_cast_expression
315
+ expect_token(:maek)
316
+ attrs = { being_casted: parse_expression }
317
+ expect_token(:a)
318
+ attrs[:to] = expect_token(:noob, :troof, :numbr, :numbar, :yarn)[:type]
319
+ Ast::Expression.new('cast', attrs)
320
+ end
321
+
322
+ def parse_constant_expression
323
+ token = expect_token(:boolean, :integer, :float, :string)
324
+ Ast::Expression.new('constant', { vtype: token[:type], value: token[:data] })
325
+ end
326
+
327
+ # Identifier expression represents two types of expressions:
328
+ # variable expression: returns value of variable
329
+ # function call expression: returns value of function call
330
+ def parse_identifier_expression
331
+ name = expect_token(:identifier)[:data]
332
+ begin
333
+ function = self.functions.fetch(name)
334
+ # Function call
335
+ attrs = { name: name, parameters: [] }
336
+ function.size.times do |c|
337
+ attrs[:parameters] << parse_expression
338
+ end
339
+ return Ast::Expression.new('function', attrs)
340
+ rescue KeyError
341
+ # Variable name
342
+ return Ast::Expression.new('variable', name: name)
343
+ end
344
+ end
345
+
346
+ def parse_nary_expression
347
+ attrs = { operator: expect_token(:all_of, :any_of, :smoosh)[:type] }
348
+ attrs[:expressions] = [parse_expression]
349
+ while true
350
+ @tokenizer.next if @tokenizer.peek[:type] == :an
351
+ @tokenizer.unpeek
352
+ name = next_expression
353
+ if name.nil? then break else attrs[:expressions] << parse_expression(name) end
354
+ end
355
+ # We need either MKAY or Newline here, but
356
+ # should consume only MKAY if present
357
+ token = @tokenizer.peek
358
+ unless [:mkay, :newline].include?(token[:type])
359
+ raise UnexpectedTokenError, token
360
+ end
361
+ @tokenizer.next if token[:type] == :mkay
362
+ @tokenizer.unpeek
363
+ Ast::Expression.new('nary', attrs)
364
+ end
365
+
366
+ def parse_unary_expression
367
+ expect_token(:not)
368
+ Ast::Expression.new('unary', { expression: parse_expression } )
369
+ end
370
+ end
371
+ end