RubyGems - parslet - Versions diffs - 1.0.0 → 1.0.1 - Mend

parslet 1.0.0 → 1.0.1

This diff shows the changes between two publicly available versions of a package, each released to one of the supported registries. It is provided for informational purposes only and reflects the package contents as they appear in their respective public registries.

Files changed (25)

data/HISTORY.txt +14 -0
data/README +1 -3
data/Rakefile +2 -2
data/example/documentation.rb +18 -0
data/example/email_parser.rb +52 -0
data/example/empty.rb +13 -0
data/example/ip_address.rb +125 -0
data/example/minilisp.rb +101 -0
data/example/parens.rb +42 -0
data/example/readme.rb +36 -0
data/example/seasons.rb +45 -0
data/example/simple.lit +3 -0
data/example/simple_xml.rb +57 -0
data/example/string_parser.rb +75 -0
data/example/test.lit +4 -0
data/lib/parslet.rb +1 -1
data/lib/parslet/atoms/alternative.rb +2 -3
data/lib/parslet/atoms/base.rb +56 -19
data/lib/parslet/atoms/lookahead.rb +12 -9
data/lib/parslet/atoms/re.rb +3 -3
data/lib/parslet/atoms/repetition.rb +15 -16
data/lib/parslet/atoms/sequence.rb +7 -5
data/lib/parslet/pattern.rb +2 -1
data/lib/parslet/rig/rspec.rb +24 -0
metadata +16 -3

data/HISTORY.txt CHANGED

@@ -1,3 +1,17 @@
+= 1.1.0 / ???
+  + Uses throw/catch internally for an order of magnitude increase in execution
+    speed.
+= 1.0.1 / 17Jan2011
+  A happy new year!
+  ! FIX: Parslet::Transform was wrongly fixed earlier - it now wont mangle
+    hashes anymore. (Blake Sweeney)
+  + parslet/rig/rspec.rb contains useful rspec matchers. (R. Konstantin Haase)
 = 1.0.0 / 29Dez2010
   - #each_match was removed. There was some duplication of code that even

data/README CHANGED

@@ -47,8 +47,6 @@ This library should work with both ruby 1.8 and ruby 1.9.
 STATUS
-0.12.0
-On the road to 1.0; improving documentation, trying to ease access to the API.
+one dot oh.
 (c) 2010 Kaspar Schiess

data/Rakefile CHANGED

@@ -18,7 +18,7 @@ spec = Gem::Specification.new do |s|
   # Change these as appropriate
   s.name              = "parslet"
-  s.version           = "1.0.0"
+  s.version           = "1.0.1"
   s.summary           = "Parser construction library with great error reporting in Ruby."
   s.author            = "Kaspar Schiess"
   s.email             = "kaspar.schiess@absurd.li"
@@ -29,7 +29,7 @@ spec = Gem::Specification.new do |s|
   s.rdoc_options      = %w(--main README)
   # Add any extra files to include in the gem
-  s.files             = %w(Gemfile HISTORY.txt LICENSE Rakefile README) + Dir.glob("{spec,lib/**/*}")
+  s.files             = %w(Gemfile HISTORY.txt LICENSE Rakefile README) + Dir.glob("{lib,example}/**/*")
   s.require_paths     = ["lib"]
   # If you want to depend on other gems, add them here, along with any

data/example/documentation.rb ADDED

@@ -0,0 +1,18 @@
+# A small example that shows a really small parser and what happens on parser
+# errors.
+$:.unshift '../lib'
+require 'pp'
+require 'parslet'
+class MyParser < Parslet::Parser
+  rule(:a) { str('a').repeat }
+  def parse(str)
+    a.parse(str)
+  end
+end
+pp MyParser.new.parse('aaaa')
+pp MyParser.new.parse('bbbb')

data/example/email_parser.rb ADDED

@@ -0,0 +1,52 @@
+#!/usr/bin/env ruby
+# Example contributed by Hal Brodigan (postmodern). Thanks!
+require 'parslet'
+class EmailParser < Parslet::Parser
+  rule(:space) { match('\s').repeat(1) }
+  rule(:space?) { space.maybe }
+  rule(:dash?) { match['_-'].maybe }
+  rule(:at) {
+    str('@') |
+    (dash? >> (str('at') | str('AT')) >> dash?)
+  }
+  rule(:dot) {
+    str('.') |
+    (dash? >> (str('dot') | str('DOT')) >> dash?)
+  }
+  rule(:word) { match('[a-z0-9]').repeat(1).as(:word) >> space? }
+  rule(:separator) { space? >> dot.as(:dot) >> space? | space }
+  rule(:words) { word >> (separator >> word).repeat }
+  rule(:email) {
+    (words >> space? >> at.as(:at) >> space? >> words).as(:email)
+  }
+  root(:email)
+end
+class EmailSanitizer < Parslet::Transform
+  rule(:dot => simple(:dot), :word => simple(:word)) { ".#{word}" }
+  rule(:at => simple(:at)) { '@' }
+  rule(:word => simple(:word)) { word }
+  rule(:email => sequence(:email)) { email.join }
+end
+parser = EmailParser.new
+sanitizer = EmailSanitizer.new
+unless ARGV[0]
+  STDERR.puts "usage: #{$0} \"EMAIL_ADDR\""
+  exit -1
+end
+begin
+  puts sanitizer.apply(parser.parse(ARGV[0]))
+rescue Parslet::ParseFailed => error
+  puts error
+  puts parser.root.error_tree
+end

data/example/empty.rb ADDED

@@ -0,0 +1,13 @@
+# Basically just demonstrates that you can leave rules empty and get a nice
+# NotImplementedError. A way to quickly spec out your parser rules?
+$:.unshift '../lib'
+require 'parslet'
+class Parser < Parslet::Parser
+  rule(:empty) { }
+end
+Parser.new.empty.parslet

data/example/ip_address.rb ADDED

@@ -0,0 +1,125 @@
+# This example is heavily inspired by citrus' ip.citrus. Have a look at both
+# of these to get some choice!
+# The grammars in this file conform to the ABNF given in Appendix A of RFC 3986
+# Uniform Resource Identifier (URI): Generic Syntax.
+#
+# See http://tools.ietf.org/html/rfc3986#appendix-A for more information.
+$:.unshift '../lib'
+require 'pp'
+require 'parslet'
+module IPv4
+  include Parslet
+  # A host identified by an IPv4 literal address is represented in
+  # dotted-decimal notation (a sequence of four decimal numbers in the range 0
+  # to 255, separated by "."), as described in [RFC1123] by reference to
+  # [RFC0952].  Note that other forms of dotted notation may be interpreted on
+  # some platforms, as described in Section 7.4, but only the dotted-decimal
+  # form of four octets is allowed by this grammar.
+  rule(:ipv4) {
+    (dec_octet >> str('.') >> dec_octet >> str('.') >>
+      dec_octet >> str('.') >> dec_octet).as(:ipv4)
+  }
+  rule(:dec_octet) {
+    str('25') >> match("[0-5]") |
+    str('2') >> match("[0-4]") >> digit |
+    str('1') >> digit >> digit |
+    match('[1-9]') >> digit |
+    digit
+  }
+  rule(:digit) {
+    match('[0-9]')
+  }
+end
+# Must be used in concert with IPv4
+module IPv6
+  include Parslet
+  rule(:colon) { str(':') }
+  rule(:dcolon) { colon >> colon }
+  # h16 :
+  def h16r(times)
+    (h16 >> colon).repeat(times, times)
+  end
+  # : h16
+  def h16l(times)
+    (colon >> h16).repeat(0,times)
+  end
+  # A 128-bit IPv6 address is divided into eight 16-bit pieces. Each piece is
+  # represented numerically in case-insensitive hexadecimal, using one to four
+  # hexadecimal digits (leading zeroes are permitted). The eight encoded
+  # pieces are given most-significant first, separated by colon characters.
+  # Optionally, the least-significant two pieces may instead be represented in
+  # IPv4 address textual format. A sequence of one or more consecutive
+  # zero-valued 16-bit pieces within the address may be elided, omitting all
+  # their digits and leaving exactly two consecutive colons in their place to
+  # mark the elision.
+  rule(:ipv6) {
+    (
+      (
+        h16r(6) |
+        dcolon >> h16r(5) |
+        h16.maybe >> dcolon >> h16r(4) |
+        (h16 >> h16l(1)).maybe >> dcolon >> h16r(3) |
+        (h16 >> h16l(2)).maybe >> dcolon >> h16r(2) |
+        (h16 >> h16l(3)).maybe >> dcolon >> h16r(1) |
+        (h16 >> h16l(4)).maybe >> dcolon
+      ) >> ls32 |
+      (h16 >> h16l(5)).maybe >> dcolon >> h16 |
+      (h16 >> h16l(6)).maybe >> dcolon
+    ).as(:ipv6)
+  }
+  rule(:h16) {
+    hexdigit.repeat(1,4)
+  }
+  rule(:ls32) {
+    (h16 >> colon >> h16) |
+    ipv4
+  }
+  rule(:hexdigit) {
+    digit | match("[a-fA-F]")
+  }
+end
+class Parser
+  include IPv4
+  include IPv6
+  def parse(str)
+    (ipv4 | ipv6).parse(str)
+  end
+end
+%W(
+  0.0.0.0
+  255.255.255.255
+  255.255.255
+  1:2:3:4:5:6:7:8
+  12AD:34FC:A453:1922::
+  12AD::34FC
+  12AD::
+  ::
+  1:2
+).each do |address|
+  parser = Parser.new
+  printf "%30s -> ", address
+  begin
+    result = parser.parse(address)
+    puts result.inspect
+  rescue Parslet::ParseFailed => m
+    puts "Failed: #{m}"
+  end
+end

data/example/minilisp.rb ADDED

@@ -0,0 +1,101 @@
+# Reproduces [1] using parslet.
+# [1] http://thingsaaronmade.com/blog/a-quick-intro-to-writing-a-parser-using-treetop.html
+$:.unshift '../lib'
+require 'pp'
+require 'parslet'
+module MiniLisp
+  class Parser < Parslet::Parser
+    root :expression
+    rule(:expression) {
+      space? >> str('(') >> space? >> body >> str(')')
+    }
+    rule(:body) {
+      (expression | identifier | float | integer | string).repeat.as(:exp)
+    }
+    rule(:space) {
+      match('\s').repeat(1)
+    }
+    rule(:space?) {
+      space.maybe
+    }
+    rule(:identifier) {
+      (match('[a-zA-Z=*]') >> match('[a-zA-Z=*_]').repeat).as(:identifier) >> space?
+    }
+    rule(:float) {
+      (
+        integer >> (
+          str('.') >> match('[0-9]').repeat(1) |
+          str('e') >> match('[0-9]').repeat(1)
+        ).as(:e)
+      ).as(:float) >> space?
+    }
+    rule(:integer) {
+      ((str('+') | str('-')).maybe >> match("[0-9]").repeat(1)).as(:integer) >> space?
+    }
+    rule(:string) {
+      str('"') >> (
+        str('\\') >> any |
+        str('"').absnt? >> any
+      ).repeat.as(:string) >> str('"') >> space?
+    }
+  end
+  class Transform
+    include Parslet
+    attr_reader :t
+    def initialize
+      @t = Parslet::Transform.new
+      # To understand these, take a look at what comes out of the parser.
+      t.rule(:identifier => simple(:ident)) { ident.to_sym }
+      t.rule(:string => simple(:str))       { str }
+      t.rule(:integer => simple(:int))      { Integer(int) }
+      t.rule(:float=>{:integer=> simple(:a), :e=> simple(:b)}) { Float(a + b) }
+      t.rule(:exp => subtree(:exp))         { exp }
+    end
+    def do(tree)
+      t.apply(tree)
+    end
+  end
+end
+parser = MiniLisp::Parser.new
+transform = MiniLisp::Transform.new
+# Parse stage
+begin
+  result = parser.parse %Q{
+    (define test (lambda ()
+      (begin
+        (display "something")
+        (display 1)
+        (display 3.08))))
+    (test)
+  }
+rescue Parslet::ParseFailed => failure
+  puts failure
+  puts parser.root.error_tree if parser.root.cause
+  exit
+end
+# Transform the result
+pp transform.do(result)
+# Thereby reducing it to the earlier problem:
+# http://github.com/kschiess/toylisp

data/example/parens.rb ADDED

@@ -0,0 +1,42 @@
+# A small example that demonstrates the power of tree pattern matching. Also
+# uses '.as(:name)' to construct a tree that can reliably be matched
+# afterwards.
+$:.unshift '../lib'
+require 'pp'
+require 'parslet'
+module LISP # as in 'lots of insipid and stupid parenthesis'
+  class Parser < Parslet::Parser
+    rule(:balanced) {
+      str('(').as(:l) >> balanced.maybe.as(:m) >> str(')').as(:r)
+    }
+    root(:balanced)
+  end
+  class Transform < Parslet::Transform
+    rule(:l => '(', :m => simple(:x), :r => ')') {
+      # innermost :m will contain nil
+      x.nil? ? 1 : x+1
+    }
+  end
+end
+parser = LISP::Parser.new
+transform = LISP::Transform.new
+%w!
+  ()
+  (())
+  ((((()))))
+  ((())
+!.each do |pexp|
+  begin
+    result = parser.parse(pexp)
+    puts "#{"%20s"%pexp}: #{result.inspect} (#{transform.apply(result)} parens)"
+  rescue Parslet::ParseFailed => m
+    puts "#{"%20s"%pexp}: #{m}"
+  end
+  puts
+end

data/example/readme.rb ADDED

@@ -0,0 +1,36 @@
+# The example from the readme. With this, I am making sure that the readme
+# 'works'. Is this too messy?
+$:.unshift '../lib'
+require 'pp'
+require 'parslet'
+include Parslet
+require 'parslet'
+include Parslet
+# Constructs a parser using a Parser Expression Grammar like DSL:
+parser =  str('"') >>
+          (
+            str('\\') >> any |
+            str('"').absnt? >> any
+          ).repeat.as(:string) >>
+          str('"')
+# Parse the string and capture parts of the interpretation (:string above)
+tree = parser.parse(%Q{
+  "This is a \\"String\\" in which you can escape stuff"
+}.strip)
+tree # => {:string=>"This is a \\\"String\\\" in which you can escape stuff"}
+# Here's how you can grab results from that tree:
+# 1)
+transform = Parslet::Transform.new do
+  rule(:string => simple(:x)) {
+    puts "String contents: #{x}" }
+end
+transform.apply(tree)

data/example/seasons.rb ADDED

@@ -0,0 +1,45 @@
+$:.unshift '../lib/'
+require 'parslet'
+require 'pp'
+tree = {:bud => {:stem => []}}
+class Spring < Parslet::Transform
+  rule(:stem => sequence(:branches)) {
+    {:stem => (branches + [{:branch => :leaf}])}
+  }
+end
+class Summer < Parslet::Transform
+  rule(:stem => subtree(:branches)) {
+    new_branches = branches.map { |b| {:branch => [:leaf, :flower]} }
+    {:stem => new_branches}
+  }
+end
+class Fall < Parslet::Transform
+  rule(:branch => sequence(:x)) {
+    x.each { |e| puts "Fruit!" if e==:flower }
+    x.each { |e| puts "Falling Leaves!" if e==:leaf }
+    {:branch => []}
+  }
+end
+class Winter < Parslet::Transform
+  rule(:stem => subtree(:x)) {
+    {:stem => []}
+  }
+end
+def do_seasons(tree)
+  [Spring, Summer, Fall, Winter].each do |season|
+    p "And when #{season} comes"
+    tree = season.new.apply(tree)
+    pp tree
+    puts
+  end
+  tree
+end
+# What marvel of life!
+tree = do_seasons(tree)
+tree = do_seasons(tree)

data/example/simple.lit ADDED

@@ -0,0 +1,3 @@
+123
+12345
+" Some String with \"escapes\""

data/example/simple_xml.rb ADDED

@@ -0,0 +1,57 @@
+# A simple xml parser. It is simple in the respect as that it doesn't address
+# any of the complexities of XML. This is ruby 1.9.
+$:.unshift '../lib'
+require 'pp'
+require 'parslet'
+module XML
+  include Parslet
+  root :document
+  rule(:document) {
+    tag(close: false).as(:o) >> document.as(:i) >> tag(close: true).as(:c) |
+    text
+  }
+  # Perhaps we could have some syntax sugar to make this more easy?
+  #
+  def tag(opts={})
+    close = opts[:close] || false
+    parslet = str('<')
+    parslet = parslet >> str('/') if close
+    parslet = parslet >> (str('>').absnt? >> match("[a-zA-Z]")).repeat(1).as(:name)
+    parslet = parslet >> str('>')
+    parslet
+  end
+  rule(:text) {
+    match('[^<>]').repeat(0)
+  }
+end
+def check(xml)
+  include XML
+  r=parse(xml)
+  # We'll validate the tree by reducing valid pairs of tags into simply the
+  # string "verified". If the transformation ends on a string, then the
+  # document was 'valid'.
+  #
+  t = Parslet::Transform.new do
+    rule(
+      o: {name: simple(:tag)},
+      c: {name: simple(:tag)},
+      i: simple(:t)
+    ) { 'verified' }
+  end
+  t.apply(r)
+end
+pp check("<a><b>some text in the tags</b></a>")
+pp check("<b><b>some text in the tags</b></a>")

data/example/string_parser.rb ADDED

@@ -0,0 +1,75 @@
+# A more complex parser that illustrates how a compiler might be constructed.
+# The parser recognizes strings and integer literals and constructs almost a
+# useful AST from the file contents.
+require 'pp'
+$:.unshift '../lib/'
+require 'parslet'
+include Parslet
+class LiteralsParser < Parslet::Parser
+  rule :space do
+    (match '[ ]').repeat(1)
+  end
+  rule :literals do
+    (literal >> eol).repeat
+  end
+  rule :literal do
+    (integer | string).as(:literal) >> space.maybe
+  end
+  rule :string do
+    str('"') >>
+    (
+      (str('\\') >> any) |
+      (str('"').absnt? >> any)
+    ).repeat.as(:string) >>
+    str('"')
+  end
+  rule :integer do
+    match('[0-9]').repeat(1).as(:integer)
+  end
+  rule :eol do
+    line_end.repeat(1)
+  end
+  rule :line_end do
+    crlf >> space.maybe
+  end
+  rule :crlf do
+    match('[\r\n]').repeat(1)
+  end
+  root :literals
+end
+parsetree = LiteralsParser.new.parse(
+  File.read('simple.lit'))
+class Lit < Struct.new(:text)
+  def to_s
+    text.inspect
+  end
+end
+class StringLit < Lit
+end
+class IntLit < Lit
+  def to_s
+    text
+  end
+end
+transform = Parslet::Transform.new do
+  rule(:literal => {:integer => simple(:x)}) { IntLit.new(x) }
+  rule(:literal => {:string => simple(:s)}) { StringLit.new(s) }
+end
+ast = transform.apply(parsetree)
+pp ast

data/example/test.lit ADDED

@@ -0,0 +1,4 @@
+"THis is a string"
+"This is another string"
+"This string is escaped \"embedded quoted stuff \" "
+12 // an integer literal and a comment

data/lib/parslet.rb CHANGED

@@ -66,7 +66,7 @@ module Parslet
   #     puts parslet.error_tree
   #   end
   #
-  class ParseFailed < Exception
+  class ParseFailed < StandardError
   end
   module ClassMethods

data/lib/parslet/atoms/alternative.rb CHANGED

@@ -30,10 +30,9 @@ class Parslet::Atoms::Alternative < Parslet::Atoms::Base
   def try(io) # :nodoc:
     alternatives.each { |a|
-      begin
+      catch(:error) {
         return a.apply(io)
-      rescue Parslet::ParseFailed => ex
-      end
+      }
     }
     # If we reach this point, all alternatives have failed.
     error(io, "Expected one of #{alternatives.inspect}.")

data/lib/parslet/atoms/base.rb CHANGED

@@ -13,7 +13,18 @@ class Parslet::Atoms::Base
       io = StringIO.new(io)
     end
-    result = apply(io)
+    result = nil
+    error_message_or_success = catch(:error) {
+      result = apply(io)
+      :success
+    }
+    # If we didn't succeed the parse, raise an exception for the user.
+    # Stack trace will be off, but the error tree should explain the reason
+    # it failed.
+    if error_message_or_success != :success
+      raise Parslet::ParseFailed, error_message_or_success
+    end
     # If we haven't consumed the input, then the pattern doesn't match. Try
     # to provide a good error message (even asking down below)
@@ -22,30 +33,49 @@ class Parslet::Atoms::Base
       # error to fail with. Otherwise just report that we cannot consume the
       # input.
       if cause
-        raise Parslet::ParseFailed, "Unconsumed input, maybe because of this: #{cause}"
+        # Don't garnish the real cause; but the exception is different anyway.
+        raise Parslet::ParseFailed,
+          "Unconsumed input, maybe because of this: #{cause}"
       else
-        error(io, "Don't know what to do with #{io.string[io.pos,100]}")
+        parse_failed(
+          format_cause(io, "Don't know what to do with #{io.string[io.pos,100]}"))
       end
     end
     return flatten(result)
   end
+  #---
+  # Calls the #try method of this parslet. In case of a parse error, apply
+  # leaves the io in the state it was before the attempt.
+  #+++
   def apply(io) # :nodoc:
     # p [:start, self, io.string[io.pos, 10]]
     old_pos = io.pos
     # p [:try, self, io.string[io.pos, 20]]
-    begin
+    message = catch(:error) {
       r = try(io)
       # p [:return_from, self, r, flatten(r)]
+      # This has just succeeded, so last_cause must be empty
       @last_cause = nil
       return r
-    rescue Parslet::ParseFailed => ex
-      # p [:failing, self, io.string[io.pos, 20]]
-      io.pos = old_pos; raise ex
-    end
+    }
+    # We only reach this point if the parse has failed. message is not nil.
+    # p [:failing, self, io.string[io.pos, 20]]
+    io.pos = old_pos
+    throw :error, message
+  end
+  # Override this in your Atoms::Base subclasses to implement parsing
+  # behaviour.
+  #
+  def try(io)
+    raise NotImplementedError, "Atoms::Base doesn't have behaviour, please implement #try(io)."
   end
   # Construct a new atom that repeats the current atom min times at least and
@@ -126,6 +156,9 @@ class Parslet::Atoms::Base
     Parslet::Atoms::Named.new(self, name)
   end
+  # Takes a mixed value coming out of a parslet and converts it to a return
+  # value for the user by dropping things and merging hashes.
+  #
   def flatten(value) # :nodoc:
     # Passes through everything that isn't an array of things
     return value unless value.instance_of? Array
@@ -225,31 +258,35 @@ class Parslet::Atoms::Base
   # with #cause.
   #
   def error_tree
-    Parslet::ErrorTree.new(self) if cause?
+    Parslet::ErrorTree.new(self)
   end
   def cause? # :nodoc:
     not @last_cause.nil?
   end
 private
+  # TODO comments!!!
   # Report/raise a parse error with the given message, printing the current
   # position as well. Appends 'at line X char Y.' to the message you give.
   # If +pos+ is given, it is used as the real position the error happened,
   # correcting the io's current position.
   #
   def error(io, str, pos=nil)
+    @last_cause = format_cause(io, str, pos)
+    throw :error, @last_cause
+  end
+  def parse_failed(str)
+    @last_cause = str
+    raise Parslet::ParseFailed,
+      @last_cause
+  end
+  def format_cause(io, str, pos=nil)
     pre = io.string[0..(pos||io.pos)]
     lines = Array(pre.lines)
-    if lines.empty?
-      formatted_cause = str
-    else
-      pos   = lines.last.length
-      formatted_cause = "#{str} at line #{lines.count} char #{pos}."
-    end
-    @last_cause = formatted_cause
-    raise Parslet::ParseFailed, formatted_cause, nil
+    return str if lines.empty?
+    pos   = lines.last.length
+    return "#{str} at line #{lines.count} char #{pos}."
   end
   def warn_about_duplicate_keys(h1, h2)
     d = h1.keys & h2.keys

data/lib/parslet/atoms/lookahead.rb CHANGED

@@ -16,27 +16,30 @@ class Parslet::Atoms::Lookahead < Parslet::Atoms::Base
   def try(io) # :nodoc:
     pos = io.pos
-    begin
+    failed = true
+    catch(:error) {
       bound_parslet.apply(io)
-    rescue Parslet::ParseFailed
-      return fail(io)
-    ensure
-      io.pos = pos
-    end
-    return success(io)
+      failed = false
+    }
+    return failed ? fail(io) : success(io)
+  ensure
+    io.pos = pos
   end
+  # TODO Both of these will produce results that could be reduced easily.
+  # Maybe do some shortcut reducing here?
   def fail(io) # :nodoc:
     if positive
       error(io, "lookahead: #{bound_parslet.inspect} didn't match, but should have")
     else
-      # TODO: Squash this down to nothing? Return value handling here...
       return nil
     end
   end
   def success(io) # :nodoc:
     if positive
-      return nil  # see above, TODO
+      return nil
     else
       error(
         io,

data/lib/parslet/atoms/re.rb CHANGED

@@ -8,16 +8,16 @@
 #   match('\s')     # like regexps: matches space characters
 #
 class Parslet::Atoms::Re < Parslet::Atoms::Base
-  attr_reader :match
+  attr_reader :match, :re
   def initialize(match) # :nodoc:
     @match = match
+    @re    = Regexp.new(match, Regexp::MULTILINE)
   end
   def try(io) # :nodoc:
-    r = Regexp.new(match, Regexp::MULTILINE)
     s = io.read(1)
     error(io, "Premature end of input") unless s
-    error(io, "Failed to match #{match.inspect[1..-2]}") unless s.match(r)
+    error(io, "Failed to match #{match.inspect[1..-2]}") unless s.match(re)
     return s
   end

data/lib/parslet/atoms/repetition.rb CHANGED

@@ -17,22 +17,21 @@ class Parslet::Atoms::Repetition < Parslet::Atoms::Base
   def try(io) # :nodoc:
     occ = 0
     result = [@tag]   # initialize the result array with the tag (for flattening)
-    loop do
-      begin
-        result << parslet.apply(io)
-        occ += 1
-        # If we're not greedy (max is defined), check if that has been
-        # reached.
-        return result if max && occ>=max
-      rescue Parslet::ParseFailed => ex
-        # Greedy matcher has produced a failure. Check if occ (which will
-        # contain the number of sucesses) is in {min, max}.
-        # p [:repetition, occ, min, max]
-        error(io, "Expected at least #{min} of #{parslet.inspect}") if occ < min
-        return result
-      end
-    end
+    catch(:error) {
+      result << parslet.apply(io)
+      occ += 1
+      # If we're not greedy (max is defined), check if that has been
+      # reached.
+      return result if max && occ>=max
+      redo
+    }
+    # Greedy matcher has produced a failure. Check if occ (which will
+    # contain the number of sucesses) is in {min, max}.
+    # p [:repetition, occ, min, max]
+    error(io, "Expected at least #{min} of #{parslet.inspect}") if occ < min
+    return result
   end
   precedence REPETITION

data/lib/parslet/atoms/sequence.rb CHANGED

@@ -16,12 +16,14 @@ class Parslet::Atoms::Sequence < Parslet::Atoms::Base
   end
   def try(io) # :nodoc:
-    [:sequence]+parslets.map { |p|
-      # Save each parslet as potentially offending (raising an error).
-      @offending_parslet = p
-      p.apply(io)
+    catch(:error) {
+      return [:sequence]+parslets.map { |p|
+        # Save each parslet as potentially offending (raising an error).
+        @offending_parslet = p
+        p.apply(io)
+      }
     }
-  rescue Parslet::ParseFailed
     error(io, "Failed to match sequence (#{self.inspect})")
   end

data/lib/parslet/pattern.rb CHANGED

@@ -99,7 +99,8 @@ class Parslet::Pattern
   end
   def element_match_hash(tree, exp, bindings)
-    # p [:emh, tree, exp, bindings]
+    # Early failure when not all of the hash keys are matched.
+    return false unless exp.keys == tree.keys
     # We iterate over expected pattern, since we demand that the keys that
     # are there should be in tree as well.

data/lib/parslet/rig/rspec.rb ADDED

@@ -0,0 +1,24 @@
+RSpec::Matchers.define(:parse) do |input|
+  chain(:as) { |as| @as = as }
+  match do |parser|
+    begin
+      @result = parser.parse(input)
+      @as == @result or @as.nil?
+    rescue Parslet::ParseFailed
+      false
+    end
+  end
+  failure_message_for_should do |is|
+    "expected " << (@result ?
+      "output of parsing #{input.inspect} with #{is.inspect} to equal #{@as.inspect}, but was #{@result.inspect}" :
+      "expected #{is.inspect} to be able to parse #{input.inspect}")
+  end
+  failure_message_for_should_not do |is|
+    "expected " << (@as ?
+      "output of parsing #{input.inspect} with #{is.inspect} not to equal #{@as.inspect}" :
+      "expected #{is.inspect} to be able to parse #{input.inspect}")
+  end
+end

metadata CHANGED

@@ -5,8 +5,8 @@ version: !ruby/object:Gem::Version
   segments:
   - 1
   - 0
-  - 0
-  version: 1.0.0
+  - 1
+  version: 1.0.1
 platform: ruby
 authors:
 - Kaspar Schiess
@@ -14,7 +14,7 @@ autorequire:
 bindir: bin
 cert_chain: []
-date: 2010-12-29 00:00:00 +01:00
+date: 2011-01-17 00:00:00 +01:00
 default_executable:
 dependencies:
 - !ruby/object:Gem::Dependency
@@ -90,8 +90,21 @@ files:
 - lib/parslet/pattern/binding.rb
 - lib/parslet/pattern/context.rb
 - lib/parslet/pattern.rb
+- lib/parslet/rig/rspec.rb
 - lib/parslet/transform.rb
 - lib/parslet.rb
+- example/documentation.rb
+- example/email_parser.rb
+- example/empty.rb
+- example/ip_address.rb
+- example/minilisp.rb
+- example/parens.rb
+- example/readme.rb
+- example/seasons.rb
+- example/simple.lit
+- example/simple_xml.rb
+- example/string_parser.rb
+- example/test.lit
 has_rdoc: true
 homepage: http://kschiess.github.com/parslet
 licenses: []