RubyGems - antelope - Versions diffs - 0.3.2 → 0.4.0 - Mend

antelope 0.3.2 → 0.4.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (102) hide show

checksums.yaml +4 -4
data/.gitignore +25 -25
data/.rspec +3 -3
data/.travis.yml +10 -10
data/.yardopts +7 -7
data/CONTRIBUTING.md +50 -38
data/GENERATORS.md +180 -124
data/Gemfile +7 -7
data/LICENSE.txt +22 -22
data/README.md +240 -104
data/Rakefile +2 -2
data/TODO.md +58 -58
data/antelope.gemspec +29 -28
data/bin/antelope +7 -7
data/examples/deterministic.ace +35 -35
data/examples/example.ace +52 -51
data/examples/example.ace.err +192 -192
data/examples/example.ace.inf +432 -432
data/examples/example.ate +70 -70
data/examples/example.ate.err +192 -192
data/examples/example.ate.inf +432 -432
data/examples/liquidscript.ace +233 -233
data/examples/simple.ace +22 -22
data/lib/antelope/ace/compiler.rb +334 -334
data/lib/antelope/ace/errors.rb +30 -30
data/lib/antelope/ace/scanner/argument.rb +57 -57
data/lib/antelope/ace/scanner/first.rb +89 -89
data/lib/antelope/ace/scanner/second.rb +178 -178
data/lib/antelope/ace/scanner/third.rb +27 -27
data/lib/antelope/ace/scanner.rb +144 -144
data/lib/antelope/ace.rb +47 -47
data/lib/antelope/cli.rb +60 -60
data/lib/antelope/errors.rb +25 -25
data/lib/antelope/generation/constructor/first.rb +86 -86
data/lib/antelope/generation/constructor/follow.rb +105 -105
data/lib/antelope/generation/constructor/nullable.rb +64 -64
data/lib/antelope/generation/constructor.rb +127 -127
data/lib/antelope/generation/errors.rb +17 -17
data/lib/antelope/generation/null.rb +13 -13
data/lib/antelope/generation/recognizer/rule.rb +216 -216
data/lib/antelope/generation/recognizer/state.rb +129 -129
data/lib/antelope/generation/recognizer.rb +177 -177
data/lib/antelope/generation/tableizer.rb +176 -176
data/lib/antelope/generation.rb +15 -15
data/lib/antelope/generator/base/coerce.rb +115 -0
data/lib/antelope/generator/base/extra.rb +50 -0
data/lib/antelope/generator/base.rb +134 -264
data/lib/antelope/generator/c.rb +11 -11
data/lib/antelope/generator/c_header.rb +105 -105
data/lib/antelope/generator/c_source.rb +39 -39
data/lib/antelope/generator/error.rb +34 -34
data/lib/antelope/generator/group.rb +60 -57
data/lib/antelope/generator/html.rb +51 -51
data/lib/antelope/generator/info.rb +47 -47
data/lib/antelope/generator/null.rb +18 -18
data/lib/antelope/generator/output.rb +17 -17
data/lib/antelope/generator/ruby.rb +112 -79
data/lib/antelope/generator/templates/c_header.ant +36 -36
data/lib/antelope/generator/templates/c_source.ant +202 -202
data/lib/antelope/generator/templates/error.erb +40 -0
data/lib/antelope/generator/templates/html/antelope.css +53 -1
data/lib/antelope/generator/templates/html/antelope.html +82 -1
data/lib/antelope/generator/templates/html/antelope.js +9 -1
data/lib/antelope/generator/templates/html/css.ant +53 -53
data/lib/antelope/generator/templates/html/html.ant +82 -82
data/lib/antelope/generator/templates/html/js.ant +9 -9
data/lib/antelope/generator/templates/info.erb +61 -0
data/lib/antelope/generator/templates/{ruby.ant → ruby.erb} +171 -178
data/lib/antelope/generator.rb +62 -66
data/lib/antelope/grammar/generation.rb +76 -76
data/lib/antelope/grammar/loading.rb +84 -84
data/lib/antelope/grammar/precedence.rb +59 -59
data/lib/antelope/grammar/precedences.rb +64 -64
data/lib/antelope/grammar/production.rb +56 -56
data/lib/antelope/grammar/productions.rb +154 -154
data/lib/antelope/grammar/symbols.rb +64 -64
data/lib/antelope/grammar/token/epsilon.rb +23 -23
data/lib/antelope/grammar/token/error.rb +24 -24
data/lib/antelope/grammar/token/nonterminal.rb +15 -15
data/lib/antelope/grammar/token/terminal.rb +15 -15
data/lib/antelope/grammar/token.rb +231 -231
data/lib/antelope/grammar.rb +68 -68
data/lib/antelope/version.rb +6 -6
data/lib/antelope.rb +18 -19
data/optimizations.txt +42 -42
data/spec/antelope/ace/compiler_spec.rb +60 -60
data/spec/antelope/ace/scanner_spec.rb +27 -27
data/spec/antelope/generation/constructor_spec.rb +131 -131
data/spec/fixtures/simple.ace +22 -22
data/spec/spec_helper.rb +39 -39
data/spec/support/benchmark_helper.rb +5 -5
data/spec/support/grammar_helper.rb +14 -14
data/subl/Ace (Ruby).JSON-tmLanguage +94 -94
data/subl/Ace (Ruby).tmLanguage +153 -153
metadata +22 -11
data/lib/antelope/generator/templates/error.ant +0 -34
data/lib/antelope/generator/templates/info.ant +0 -53
data/lib/antelope/template/compiler.rb +0 -78
data/lib/antelope/template/errors.rb +0 -9
data/lib/antelope/template/scanner.rb +0 -109
data/lib/antelope/template.rb +0 -64
data/spec/antelope/template_spec.rb +0 -50

data/lib/antelope/grammar/productions.rb CHANGED Viewed

@@ -1,154 +1,154 @@
-# encoding: utf-8
-module Antelope
-  class Grammar
-    # Manages the productions of the grammar.
-    module Productions
-      # Returns a hash of all of the productions.  The result is
-      # cached.
-      #
-      # @return [Hash<(Symbol, Array<Production>)>]
-      def productions
-        @_productions || generate_productions
-      end
-      # Returns all productions for all nonterminals, sorted by id.
-      #
-      # @return [Array<Production>]
-      def all_productions
-        productions.values.flatten.sort_by(&:id)
-      end
-      # Finds a token based on its corresponding symbol.  First
-      # checks the productions, to see if it's a nonterminal; then,
-      # tries to find it in the terminals; otherwise, if the symbol
-      # is `error`, it returns a {Token::Error}; if the symbol is
-      # `nothing` or `ε`, it returns a {Token::Epsilon}; if it's
-      # none of those, it raises an {UndefinedTokenError}.
-      #
-      # @raise [UndefinedTokenError] if the token doesn't exist.
-      # @param value [String, Symbol, #intern] the token's symbol to
-      #   check.
-      # @return [Token]
-      def find_token(value)
-        value = value.intern
-        if productions.key?(value)
-          typed_nonterminals.find { |term| term.name == value } ||
-            Token::Nonterminal.new(value)
-        elsif terminal = terminals.
-            find { |term| term.name == value }
-          terminal
-        elsif value == :$error || value == :error
-          Token::Error.new
-        elsif [:nothing, :ε, :"%empty"].include?(value)
-          Token::Epsilon.new
-        else
-          raise UndefinedTokenError, "Could not find a token " \
-            "named #{value.inspect}"
-        end
-      end
-      private
-      # Actually generates the productions.  Uses the rules from the
-      # compiler to construct the productions.  Makes two loops over
-      # the compiler's rules; the first to tell the grammar that the
-      # nonterminal does exist, and the second to actually construct
-      # the productions.  The first loop is for {#find_token},
-      # because otherwise it wouldn't be able to return a
-      # nonterminal properly.
-      #
-      # @return [Hash<(Symbol, Array<Production>)>]
-      def generate_productions
-        @_productions = {}
-        index = 0
-        rules = @compiler.rules.each do |rule|
-          productions[rule[:label]] = []
-        end
-        while index < rules.size
-          rule = rules[index]
-          productions[rule[:label]] <<
-            generate_production_for(rule, index)
-          index += 1
-        end
-        productions[:$start] = [default_production]
-        productions
-      end
-      # Generates a production for a given compiler rule.  Converts
-      # the tokens in the set to their {Token} counterparts,
-      # and then sets the precedence for the production.  If the
-      # precedence declaration from the compiler rule is empty,
-      # then it'll use the last terminal from the set to check for
-      # precedence; otherwise, it'll use the precedence declaration.
-      # This is to make sure that every production has a precedence
-      # declaration.
-      #
-      # @param rule [Hash] the compiler's rule.
-      # @param id [Numeric] the id for the production.
-      # @return [Production]
-      def generate_production_for(rule, id)
-        left  = Token::Nonterminal.new(rule[:label])
-        items = rule[:set].map { |_| find_token(_[0]) }
-        prec  = if rule[:prec].empty?
-          items.select(&:terminal?).first
-        else
-          rule[:prec].intern
-        end
-        prec  = precedence_for(prec)
-        left.type = type_for(rule[:label])
-        left.id = rule[:label_id]
-        rule[:set].each_with_index do |tok, i|
-          items[i] = items[i].dup
-          items[i].id = tok[1]
-        end
-        items.delete_if(&:epsilon?)
-        Production.new(left, items, rule[:block], prec, id + 1)
-      end
-      # Returns the defined type for the given token name.
-      # Uses the `%type` directive to infer the corresponding types.
-      #
-      # @param token [Symbol] the token to check for
-      #   types.
-      def type_for(token)
-        token = find_token(token) unless token.is_a?(Token)
-        case token
-        when Token::Nonterminal
-          token.type
-        when Token::Terminal
-          token.type
-        when Token::Epsilon
-          ""
-        when Token::Error
-          ""
-        end
-      end
-      # Creates the default production for the grammar.  The left
-      # hand side of the production is the `:$start` symbol, with
-      # the right hand side being the first rule's left-hand side
-      # and the terminal `$`.  This production is automagically
-      # given the last precedence, and an id of 0.
-      #
-      # @return [Production]
-      def default_production
-        Production.new(Token::Nonterminal.new(:$start), [
-            Token::Nonterminal.new(@compiler.rules.first[:label]),
-            Token::Terminal.new(:$end)
-          ], "", precedence.last, 0)
-      end
-    end
-  end
-end
+# encoding: utf-8
+module Antelope
+  class Grammar
+    # Manages the productions of the grammar.
+    module Productions
+      # Returns a hash of all of the productions.  The result is
+      # cached.
+      #
+      # @return [Hash<(Symbol, Array<Production>)>]
+      def productions
+        @_productions || generate_productions
+      end
+      # Returns all productions for all nonterminals, sorted by id.
+      #
+      # @return [Array<Production>]
+      def all_productions
+        productions.values.flatten.sort_by(&:id)
+      end
+      # Finds a token based on its corresponding symbol.  First
+      # checks the productions, to see if it's a nonterminal; then,
+      # tries to find it in the terminals; otherwise, if the symbol
+      # is `error` or `$error`, it returns a {Token::Error}; if it is
+      # `nothing`, `ε`, or `%empty`, it returns a {Token::Epsilon}; if
+      # it's none of those, it raises an {UndefinedTokenError}.
+      #
+      # @raise [UndefinedTokenError] if the token doesn't exist.
+      # @param value [String, Symbol, #intern] the token's symbol to
+      #   check.
+      # @return [Token]
+      def find_token(value)
+        value = value.intern
+        if productions.key?(value)
+          typed_nonterminals.find { |term| term.name == value } ||
+            Token::Nonterminal.new(value)
+        elsif terminal = terminals.
+            find { |term| term.name == value }
+          terminal
+        elsif value == :$error || value == :error
+          Token::Error.new
+        elsif [:nothing, :ε, :"%empty"].include?(value)
+          Token::Epsilon.new
+        else
+          raise UndefinedTokenError, "Could not find a token " \
+            "named #{value.inspect}"
+        end
+      end
+      private
+      # Actually generates the productions.  Uses the rules from the
+      # compiler to construct the productions.  Makes two loops over
+      # the compiler's rules; the first to tell the grammar that the
+      # nonterminal does exist, and the second to actually construct
+      # the productions.  The first loop is for {#find_token},
+      # because otherwise it wouldn't be able to return a
+      # nonterminal properly.
+      #
+      # @return [Hash<(Symbol, Array<Production>)>]
+      def generate_productions
+        @_productions = {}
+        index = 0
+        rules = @compiler.rules.each do |rule|
+          productions[rule[:label]] = []
+        end
+        while index < rules.size
+          rule = rules[index]
+          productions[rule[:label]] <<
+            generate_production_for(rule, index)
+          index += 1
+        end
+        productions[:$start] = [default_production]
+        productions
+      end
+      # Generates a production for a given compiler rule.  Converts
+      # the tokens in the set to their {Token} counterparts,
+      # and then sets the precedence for the production.  If the
+      # precedence declaration from the compiler rule is empty,
+      # then it'll use the first terminal from the set to check for
+      # precedence; otherwise, it'll use the precedence declaration.
+      # This is to make sure that every production has a precedence
+      # declaration.
+      #
+      # @param rule [Hash] the compiler's rule.
+      # @param id [Numeric] the id for the production.
+      # @return [Production]
+      def generate_production_for(rule, id)
+        left  = Token::Nonterminal.new(rule[:label])
+        items = rule[:set].map { |_| find_token(_[0]) }
+        prec  = if rule[:prec].empty?
+          items.select(&:terminal?).first
+        else
+          rule[:prec].intern
+        end
+        prec  = precedence_for(prec)
+        left.type = type_for(rule[:label])
+        left.id = rule[:label_id]
+        rule[:set].each_with_index do |tok, i|
+          items[i] = items[i].dup
+          items[i].id = tok[1]
+        end
+        items.delete_if(&:epsilon?)
+        Production.new(left, items, rule[:block], prec, id + 1)
+      end
+      # Returns the defined type for the given token name.
+      # Uses the `%type` directive to infer the corresponding types.
+      #
+      # @param token [Symbol, Token] the token, or the name of the
+      #   token, to check for types.
+      def type_for(token)
+        token = find_token(token) unless token.is_a?(Token)
+        case token
+        when Token::Nonterminal
+          token.type
+        when Token::Terminal
+          token.type
+        when Token::Epsilon
+          ""
+        when Token::Error
+          ""
+        end
+      end
+      # Creates the default production for the grammar.  The left
+      # hand side of the production is the `:$start` symbol, with
+      # the right hand side being the first rule's left-hand side
+      # and the terminal `$end`.  This production is automagically
+      # given the last precedence, and an id of 0.
+      #
+      # @return [Production]
+      def default_production
+        Production.new(Token::Nonterminal.new(:$start), [
+            Token::Nonterminal.new(@compiler.rules.first[:label]),
+            Token::Terminal.new(:$end)
+          ], "", precedence.last, 0)
+      end
+    end
+  end
+end

data/lib/antelope/grammar/symbols.rb CHANGED Viewed

@@ -1,64 +1,64 @@
-# encoding: utf-8
-module Antelope
-  class Grammar
-    # Manages a list of the symbols in the grammar.
-    module Symbols
-      # A list of all terminals in the grammar.  Checks the compiler
-      # options for terminals, and then returns an array of
-      # terminals.  Caches the result.
-      #
-      # @return [Array<Token::Terminal>]
-      def terminals
-        @_terminals ||= begin
-          @compiler.options.fetch(:terminals) { [] }.map do |v|
-            Token::Terminal.new(*v)
-          end
-        end
-      end
-      # A list of all nonterminals in the grammar.
-      #
-      # @return [Array<Symbol>]
-      # @see #productions
-      def nonterminals
-        @_nonterminals ||= productions.keys
-      end
-      # A list of all nonterminals, with types.
-      #
-      # @return [Array<Token::Nonterminal>>]
-      def typed_nonterminals
-        @_typed_nonterminals ||= begin
-          typed = []
-          compiler.options[:nonterminals].each do |data|
-            data[1].each do |nonterm|
-              typed << Token::Nonterminal.new(nonterm, data[0])
-            end
-          end
-          typed
-        end
-      end
-      # A list of all symbols in the grammar; includes both
-      # terminals and nonterminals.
-      #
-      # @return [Array<Token::Terminal, Symbol>]
-      # @see #terminals
-      # @see #nonterminals
-      def symbols
-        @_symbols ||= terminals + nonterminals
-      end
-      # Checks to see if the grammar uses the `error` terminal
-      # anywhere.
-      #
-      # @return [Boolean]
-      def contains_error_token?
-        all_productions.any? { |_| _.items.any?(&:error?) }
-      end
-    end
-  end
-end
+# encoding: utf-8
+module Antelope
+  class Grammar
+    # Manages a list of the symbols in the grammar.
+    module Symbols
+      # A list of all terminals in the grammar.  Checks the compiler
+      # options for terminals, and then returns an array of
+      # terminals.  Caches the result.
+      #
+      # @return [Array<Token::Terminal>]
+      def terminals
+        @_terminals ||= begin
+          @compiler.options.fetch(:terminals) { [] }.map do |v|
+            Token::Terminal.new(*v)
+          end
+        end
+      end
+      # A list of all nonterminals in the grammar.
+      #
+      # @return [Array<Symbol>]
+      # @see #productions
+      def nonterminals
+        @_nonterminals ||= productions.keys
+      end
+      # A list of all nonterminals, with types.
+      #
+      # @return [Array<Token::Nonterminal>]
+      def typed_nonterminals
+        @_typed_nonterminals ||= begin
+          typed = []
+          compiler.options[:nonterminals].each do |data|
+            data[1].each do |nonterm|
+              typed << Token::Nonterminal.new(nonterm, data[0])
+            end
+          end
+          typed
+        end
+      end
+      # A list of all symbols in the grammar; includes both
+      # terminals and nonterminals.
+      #
+      # @return [Array<Token::Terminal, Symbol>]
+      # @see #terminals
+      # @see #nonterminals
+      def symbols
+        @_symbols ||= terminals + nonterminals
+      end
+      # Checks to see if the grammar uses the `error` terminal
+      # anywhere.
+      #
+      # @return [Boolean]
+      def contains_error_token?
+        all_productions.any? { |_| _.items.any?(&:error?) }
+      end
+    end
+  end
+end

data/lib/antelope/grammar/token/epsilon.rb CHANGED Viewed

@@ -1,23 +1,23 @@
-# encoding: utf-8
-module Antelope
-  class Grammar
-    class Token
-      # Defines an epsilon token.  An epsilon token represents
-      # nothing.  This is used to say that a nonterminal can
-      # reduce to nothing.
-      class Epsilon < Token
-        # Initialize.  Technically takes no arguments.  Sets
-        # the name of the token to be `:$empty`.
-        def initialize(*)
-          super :"$empty"
-        end
-        # (see Token#epsilon?)
-        def epsilon?
-          true
-        end
-      end
-    end
-  end
-end
+# encoding: utf-8
+module Antelope
+  class Grammar
+    class Token
+      # Defines an epsilon token.  An epsilon token represents
+      # nothing.  This is used to say that a nonterminal can
+      # reduce to nothing.
+      class Epsilon < Token
+        # Initialize.  Technically takes no arguments.  Sets
+        # the name of the token to be `:$empty`.
+        def initialize(*)
+          super :"$empty"
+        end
+        # (see Token#epsilon?)
+        def epsilon?
+          true
+        end
+      end
+    end
+  end
+end

data/lib/antelope/grammar/token/error.rb CHANGED Viewed

@@ -1,24 +1,24 @@
-# encoding: utf-8
-module Antelope
-  class Grammar
-    class Token
-      # Defines an error token.  This may be used internally by the
-      # parser when it enters panic mode; any tokens following this
-      # are the synchronisation tokens.  This is considered a terminal
-      # for the purposes of rule definitions.
-      class Error < Terminal
-        # Initialize the error token.  Technically takes no arguments.
-        # Sets the name to be `:$error`.
-        def initialize(*)
-          super :$error
-        end
-        # (see Token#error?)
-        def error?
-          true
-        end
-      end
-    end
-  end
-end
+# encoding: utf-8
+module Antelope
+  class Grammar
+    class Token
+      # Defines an error token.  This may be used internally by the
+      # parser when it enters panic mode; any tokens following this
+      # are the synchronisation tokens.  This is considered a terminal
+      # for the purposes of rule definitions.
+      class Error < Terminal
+        # Initialize the error token.  Technically takes no arguments.
+        # Sets the name to be `:$error`.
+        def initialize(*)
+          super :$error
+        end
+        # (see Token#error?)
+        def error?
+          true
+        end
+      end
+    end
+  end
+end

data/lib/antelope/grammar/token/nonterminal.rb CHANGED Viewed

@@ -1,15 +1,15 @@
-# encoding: utf-8
-module Antelope
-  class Grammar
-    class Token
-      # Defines a nonterminal token.
-      class Nonterminal < Token
-        # (see Token#nonterminal?)
-        def nonterminal?
-          true
-        end
-      end
-    end
-  end
-end
+# encoding: utf-8
+module Antelope
+  class Grammar
+    class Token
+      # Defines a nonterminal token.
+      class Nonterminal < Token
+        # (see Token#nonterminal?)
+        def nonterminal?
+          true
+        end
+      end
+    end
+  end
+end

data/lib/antelope/grammar/token/terminal.rb CHANGED Viewed

@@ -1,15 +1,15 @@
-# encoding: utf-8
-module Antelope
-  class Grammar
-    class Token
-      # Defines a terminal token.
-      class Terminal < Token
-        # (see Token#terminal?)
-        def terminal?
-          true
-        end
-      end
-    end
-  end
-end
+# encoding: utf-8
+module Antelope
+  class Grammar
+    class Token
+      # Defines a terminal token.
+      class Terminal < Token
+        # (see Token#terminal?)
+        def terminal?
+          true
+        end
+      end
+    end
+  end
+end