RubyGems - antlr3 - Versions diffs - 1.2.3 - Mend

antlr3 1.2.3

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (85) hide show

data/ANTLR-LICENSE.txt +26 -0
data/History.txt +66 -0
data/README.txt +139 -0
data/bin/antlr4ruby +33 -0
data/java/RubyTarget.java +524 -0
data/java/antlr-full-3.2.1.jar +0 -0
data/lib/antlr3.rb +176 -0
data/lib/antlr3/constants.rb +88 -0
data/lib/antlr3/debug.rb +701 -0
data/lib/antlr3/debug/event-hub.rb +210 -0
data/lib/antlr3/debug/record-event-listener.rb +25 -0
data/lib/antlr3/debug/rule-tracer.rb +55 -0
data/lib/antlr3/debug/socket.rb +360 -0
data/lib/antlr3/debug/trace-event-listener.rb +92 -0
data/lib/antlr3/dfa.rb +247 -0
data/lib/antlr3/dot.rb +174 -0
data/lib/antlr3/error.rb +657 -0
data/lib/antlr3/main.rb +561 -0
data/lib/antlr3/modes/ast-builder.rb +41 -0
data/lib/antlr3/modes/filter.rb +56 -0
data/lib/antlr3/profile.rb +322 -0
data/lib/antlr3/recognizers.rb +1280 -0
data/lib/antlr3/streams.rb +985 -0
data/lib/antlr3/streams/interactive.rb +91 -0
data/lib/antlr3/streams/rewrite.rb +412 -0
data/lib/antlr3/test/call-stack.rb +57 -0
data/lib/antlr3/test/config.rb +23 -0
data/lib/antlr3/test/core-extensions.rb +269 -0
data/lib/antlr3/test/diff.rb +165 -0
data/lib/antlr3/test/functional.rb +207 -0
data/lib/antlr3/test/grammar.rb +371 -0
data/lib/antlr3/token.rb +592 -0
data/lib/antlr3/tree.rb +1415 -0
data/lib/antlr3/tree/debug.rb +163 -0
data/lib/antlr3/tree/visitor.rb +84 -0
data/lib/antlr3/tree/wizard.rb +481 -0
data/lib/antlr3/util.rb +149 -0
data/lib/antlr3/version.rb +27 -0
data/samples/ANTLRv3Grammar.g +621 -0
data/samples/Cpp.g +749 -0
data/templates/AST.stg +335 -0
data/templates/ASTDbg.stg +40 -0
data/templates/ASTParser.stg +153 -0
data/templates/ASTTreeParser.stg +272 -0
data/templates/Dbg.stg +192 -0
data/templates/Ruby.stg +1514 -0
data/test/functional/ast-output/auto-ast.rb +797 -0
data/test/functional/ast-output/construction.rb +555 -0
data/test/functional/ast-output/hetero-nodes.rb +753 -0
data/test/functional/ast-output/rewrites.rb +1327 -0
data/test/functional/ast-output/tree-rewrite.rb +1662 -0
data/test/functional/debugging/debug-mode.rb +689 -0
data/test/functional/debugging/profile-mode.rb +165 -0
data/test/functional/debugging/rule-tracing.rb +74 -0
data/test/functional/delegation/import.rb +379 -0
data/test/functional/lexer/basic.rb +559 -0
data/test/functional/lexer/filter-mode.rb +245 -0
data/test/functional/lexer/nuances.rb +47 -0
data/test/functional/lexer/properties.rb +104 -0
data/test/functional/lexer/syn-pred.rb +32 -0
data/test/functional/lexer/xml.rb +206 -0
data/test/functional/main/main-scripts.rb +245 -0
data/test/functional/parser/actions.rb +224 -0
data/test/functional/parser/backtracking.rb +244 -0
data/test/functional/parser/basic.rb +282 -0
data/test/functional/parser/calc.rb +98 -0
data/test/functional/parser/ll-star.rb +143 -0
data/test/functional/parser/nuances.rb +165 -0
data/test/functional/parser/predicates.rb +103 -0
data/test/functional/parser/properties.rb +242 -0
data/test/functional/parser/rule-methods.rb +132 -0
data/test/functional/parser/scopes.rb +274 -0
data/test/functional/token-rewrite/basic.rb +318 -0
data/test/functional/token-rewrite/via-parser.rb +100 -0
data/test/functional/tree-parser/basic.rb +750 -0
data/test/unit/sample-input/file-stream-1 +2 -0
data/test/unit/sample-input/teststreams.input2 +2 -0
data/test/unit/test-dfa.rb +52 -0
data/test/unit/test-exceptions.rb +44 -0
data/test/unit/test-recognizers.rb +55 -0
data/test/unit/test-scheme.rb +62 -0
data/test/unit/test-streams.rb +459 -0
data/test/unit/test-tree-wizard.rb +535 -0
data/test/unit/test-trees.rb +854 -0
metadata +205 -0

data/test/functional/parser/backtracking.rb ADDED

@@ -0,0 +1,244 @@
+#!/usr/bin/ruby
+# encoding: utf-8
+require 'antlr3/test/functional'
+class TestBacktracking < ANTLR3::Test::Functional
+  inline_grammar(<<-'END')
+    grammar Backtrack;
+    options {
+			language = Ruby;
+			backtrack=true;
+			memoize=true;
+			k=2;
+    }
+    scope Symbols {
+    	types;
+    }
+    @members {
+      def is_type_name?(name)
+        @Symbols_stack.reverse_each do |scope|
+          scope.types.include?(name) and return true
+        end
+        return false
+      end
+      def report_error(e)
+        # do nothing
+      end
+    }
+    translation_unit
+    scope Symbols; // entire file is a scope
+    @init {
+      $Symbols::types = Set.new
+    }
+    	: external_declaration+
+    	;
+    /** Either a function definition or any other kind of C decl/def.
+     *  The LL(*) analysis algorithm fails to deal with this due to
+     *  recursion in the declarator rules.  I'm putting in a
+     *  manual predicate here so that we don't backtrack over
+     *  the entire function.  Further, you get a better error
+     *  as errors within the function itself don't make it fail
+     *  to predict that it's a function.  Weird errors previously.
+     *  Remember: the goal is to avoid backtrack like the plague
+     *  because it makes debugging, actions, and errors harder.
+     *
+     *  Note that k=1 results in a much smaller predictor for the
+     *  fixed look; k=2 made a few extra thousand lines. ;)
+     *  I'll have to optimize that in the future.
+     */
+    external_declaration
+    options {k=1;}
+    	: ( declaration_specifiers? declarator declaration* '{' )=> function_definition
+    	| declaration
+    	;
+    function_definition
+    scope Symbols; // put parameters and locals into same scope for now
+    @init {
+      $Symbols::types = set()
+    }
+    	:	declaration_specifiers? declarator
+    	;
+    declaration
+    scope {
+      is_type_def;
+    }
+    @init {
+      $declaration::is_type_def = false
+    }
+    	: 'typedef' declaration_specifiers? {$declaration::is_type_def = true}
+    	  init_declarator_list ';' // special case, looking for typedef
+    	| declaration_specifiers init_declarator_list? ';'
+    	;
+    declaration_specifiers
+    	:   (   storage_class_specifier
+    		|   type_specifier
+            |   type_qualifier
+            )+
+    	;
+    init_declarator_list
+    	: init_declarator (',' init_declarator)*
+    	;
+    init_declarator
+    	: declarator //('=' initializer)?
+    	;
+    storage_class_specifier
+    	: 'extern'
+    	| 'static'
+    	| 'auto'
+    	| 'register'
+    	;
+    type_specifier
+    	: 'void'
+    	| 'char'
+    	| 'short'
+    	| 'int'
+    	| 'long'
+    	| 'float'
+    	| 'double'
+    	| 'signed'
+    	| 'unsigned'
+    	| type_id
+    	;
+    type_id
+        :   { is_type_name?(@input.look(1).text)}? IDENTIFIER
+        ;
+    type_qualifier
+    	: 'const'
+    	| 'volatile'
+    	;
+    declarator
+    	: pointer? direct_declarator
+    	| pointer
+    	;
+    direct_declarator
+    	:   (	IDENTIFIER
+    			{
+    			if $declaration.length > 0 && $declaration::is_type_def
+						$Symbols::types.add($IDENTIFIER.text)
+					end
+    			}
+    		|	'(' declarator ')'
+    		)
+            declarator_suffix*
+    	;
+    declarator_suffix
+    	:   /*'[' constant_expression ']'
+        |*/   '[' ']'
+        |   '(' ')'
+    	;
+    pointer
+    	: '*' type_qualifier+ pointer?
+    	| '*' pointer
+    	| '*'
+    	;
+    IDENTIFIER
+    	:	LETTER (LETTER|'0'..'9')*
+    	;
+    fragment
+    LETTER
+    	:	'$'
+    	|	'A'..'Z'
+    	|	'a'..'z'
+    	|	'_'
+    	;
+    CHARACTER_LITERAL
+        :   '\'' ( EscapeSequence | ~('\''|'\\') ) '\''
+        ;
+    STRING_LITERAL
+        :  '"' ( EscapeSequence | ~('\\'|'"') )* '"'
+        ;
+    HEX_LITERAL : '0' ('x'|'X') HexDigit+ IntegerTypeSuffix? ;
+    DECIMAL_LITERAL : ('0' | '1'..'9' '0'..'9'*) IntegerTypeSuffix? ;
+    OCTAL_LITERAL : '0' ('0'..'7')+ IntegerTypeSuffix? ;
+    fragment
+    HexDigit : ('0'..'9'|'a'..'f'|'A'..'F') ;
+    fragment
+    IntegerTypeSuffix
+    	:	('u'|'U')? ('l'|'L')
+    	|	('u'|'U')  ('l'|'L')?
+    	;
+    FLOATING_POINT_LITERAL
+        :   ('0'..'9')+ '.' ('0'..'9')* Exponent? FloatTypeSuffix?
+        |   '.' ('0'..'9')+ Exponent? FloatTypeSuffix?
+        |   ('0'..'9')+ Exponent FloatTypeSuffix?
+        |   ('0'..'9')+ Exponent? FloatTypeSuffix
+    	;
+    fragment
+    Exponent : ('e'|'E') ('+'|'-')? ('0'..'9')+ ;
+    fragment
+    FloatTypeSuffix : ('f'|'F'|'d'|'D') ;
+    fragment
+    EscapeSequence
+        :   '\\' ('b'|'t'|'n'|'f'|'r'|'\"'|'\''|'\\')
+        |   OctalEscape
+        ;
+    fragment
+    OctalEscape
+        :   '\\' ('0'..'3') ('0'..'7') ('0'..'7')
+        |   '\\' ('0'..'7') ('0'..'7')
+        |   '\\' ('0'..'7')
+        ;
+    fragment
+    UnicodeEscape
+        :   '\\' 'u' HexDigit HexDigit HexDigit HexDigit
+        ;
+    WS  :  (' '|'\r'|'\t'|'\u000C'|'\n') {$channel=HIDDEN;}
+        ;
+    COMMENT
+        :   '/*' ( options {greedy=false;} : . )* '*/' {$channel=HIDDEN;}
+        ;
+    LINE_COMMENT
+        : '//' ~('\n'|'\r')* '\r'? '\n' {$channel=HIDDEN;}
+        ;
+    LINE_COMMAND
+        : '#' ~('\n'|'\r')* '\r'? '\n' {$channel=HIDDEN;}
+        ;
+  END
+  example "grammar with backtracking and memoization" do
+    lexer = Backtrack::Lexer.new( 'int a;' )
+    parser = Backtrack::Parser.new lexer
+    events = parser.translation_unit
+  end
+end

data/test/functional/parser/basic.rb ADDED

@@ -0,0 +1,282 @@
+#!/usr/bin/ruby
+# encoding: utf-8
+require 'antlr3/test/functional'
+class TestParser001 < ANTLR3::Test::Functional
+  inline_grammar(<<-'END')
+    grammar Identifiers;
+    options { language = Ruby; }
+    @parser::init {
+      @identifiers = []
+      @reported_errors = []
+    }
+    @parser::members {
+      attr_reader :reported_errors, :identifiers
+      def found_identifier(name)
+          @identifiers << name
+      end
+      def emit_error_message(msg)
+        @reported_errors << msg
+      end
+    }
+    document:
+            t=IDENTIFIER {found_identifier($t.text)}
+            ;
+    IDENTIFIER: ('a'..'z'|'A'..'Z'|'_') ('a'..'z'|'A'..'Z'|'0'..'9'|'_')*;
+  END
+  example "parsing 'blah_de_blah'" do
+    # to build a parser, this is the standard chain of calls to prepare the input
+    input = ANTLR3::StringStream.new( 'blah_de_blah', :file => 'blah.txt' )
+    lexer  = Identifiers::Lexer.new( input )
+    tokens = ANTLR3::CommonTokenStream.new( lexer )
+    parser = Identifiers::Parser.new( tokens )
+    parser.document
+    parser.reported_errors.should be_empty
+    parser.identifiers.should == %w(blah_de_blah)
+  end
+  example "error from empty input" do
+    # if you don't need to use a customized stream, lexers and parsers will
+    # automatically wrap input in the standard stream classes
+    lexer = Identifiers::Lexer.new( '' )
+    parser = Identifiers::Parser.new( lexer )
+    parser.document
+    parser.reported_errors.should have(1).thing
+  end
+  example 'automatic input wrapping' do
+    # if the parser is able to figure out what lexer class
+    # to use (typically when it comes from a combined grammar),
+    # and you don't need to do any special token processing
+    # before making a parser, this is an extra shortcut for
+    # parser construction
+    parser = Identifiers::Parser.new( 'blah_de_blah', :file => 'blah.txt' )
+    parser.document
+    parser.reported_errors.should be_empty
+    parser.identifiers.should == %w(blah_de_blah)
+  end
+end
+class TestParser002 < ANTLR3::Test::Functional
+  inline_grammar(<<-'END')
+    grammar SimpleLanguage;
+    options {
+      language = Ruby;
+    }
+    @parser::init {
+      @events = []
+      @reported_errors = []
+    }
+    @parser::members {
+      attr_reader :reported_errors, :events
+      def emit_error_message(msg)
+        @reported_errors << msg
+      end
+    }
+    document:
+            ( declaration
+            | call
+            )*
+            EOF
+        ;
+    declaration:
+            'var' t=IDENTIFIER ';'
+            {@events << ['decl', $t.text]}
+        ;
+    call:
+            t=IDENTIFIER '(' ')' ';'
+            {@events << ['call', $t.text]}
+        ;
+    IDENTIFIER: ('a'..'z'|'A'..'Z'|'_') ('a'..'z'|'A'..'Z'|'0'..'9'|'_')*;
+    WS:  (' '|'\r'|'\t'|'\n') {$channel=HIDDEN;};
+  END
+  example "parsing decls and calls" do
+    lexer  = SimpleLanguage::Lexer.new( "var foobar; gnarz(); var blupp; flupp ( ) ;" )
+    parser = SimpleLanguage::Parser.new( lexer )
+    parser.document
+    parser.reported_errors.should be_empty
+    parser.events.should == [
+      %w(decl foobar),
+      %w(call gnarz),
+      %w(decl blupp),
+      %w(call flupp)
+    ]
+  end
+  example "bad declaration" do
+    lexer  = SimpleLanguage::Lexer.new( 'var; foo()' )
+    parser = SimpleLanguage::Parser.new( lexer )
+    parser.document
+    parser.reported_errors.should have(1).thing
+    parser.events.should be_empty
+  end
+  example "error recovery via token insertion" do
+    lexer  = SimpleLanguage::Lexer.new( 'gnarz(; flupp();' )
+    parser = SimpleLanguage::Parser.new( lexer )
+    parser.document
+    parser.reported_errors.should have(1).thing
+    parser.events.should == [
+      %w(call gnarz),
+      %w(call flupp)
+    ]
+  end
+end
+class TestParser003 < ANTLR3::Test::Functional
+  inline_grammar(<<-'END')
+    grammar MoreComplicated;
+    options { language = Ruby; }
+    @init {
+      @reported_errors = []
+    }
+    @members {
+      attr_reader :reported_errors
+      def emit_error_message(msg)
+        @reported_errors << msg
+      end
+    }
+    program
+        :   declaration+
+        ;
+    declaration
+        :   variable
+        |   functionHeader ';'
+        |   functionHeader block
+        ;
+    variable
+        :   type declarator ';'
+        ;
+    declarator
+        :   ID
+        ;
+    functionHeader
+        :   type ID '(' ( formalParameter ( ',' formalParameter )* )? ')'
+        ;
+    formalParameter
+        :   type declarator
+        ;
+    type
+        :   'int'
+        |   'char'
+        |   'void'
+        |   ID
+        ;
+    block
+        :   '{'
+                variable*
+                stat*
+            '}'
+        ;
+    stat: forStat
+        | expr ';'
+        | block
+        | assignStat ';'
+        | ';'
+        ;
+    forStat
+        :   'for' '(' assignStat ';' expr ';' assignStat ')' block
+        ;
+    assignStat
+        :   ID '=' expr
+        ;
+    expr:   condExpr
+        ;
+    condExpr
+        :   aexpr ( ('==' | '<') aexpr )?
+        ;
+    aexpr
+        :   atom ( '+' atom )*
+        ;
+    atom
+        : ID
+        | INT
+        | '(' expr ')'
+        ;
+    ID  :   ('a'..'z'|'A'..'Z'|'_') ('a'..'z'|'A'..'Z'|'0'..'9'|'_')*
+        ;
+    INT :	('0'..'9')+
+        ;
+    WS  :   (   ' '
+            |   '\t'
+            |   '\r'
+            |   '\n'
+            )+
+            {$channel=HIDDEN}
+        ;
+  END
+  example "parsing 'int foo;'" do
+    lexer = MoreComplicated::Lexer.new "int foo;"
+    parser = MoreComplicated::Parser.new lexer
+    parser.program
+    parser.reported_errors.should be_empty
+  end
+  example "catching badly formed input" do
+    lexer = MoreComplicated::Lexer.new "int foo() { 1+2 }"
+    parser = MoreComplicated::Parser.new lexer
+    parser.program
+    parser.reported_errors.should have(1).thing
+  end
+  example "two instances of badly formed input" do
+    lexer = MoreComplicated::Lexer.new "int foo() { 1+; 1+2 }"
+    parser = MoreComplicated::Parser.new lexer
+    parser.program
+    parser.reported_errors.should have(2).things
+  end
+end