RubyGems - ghazel-parslet - Versions diffs - 1.4.0.1 - Mend

ghazel-parslet 1.4.0.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (87) hide show

data/HISTORY.txt +195 -0
data/LICENSE +23 -0
data/README +70 -0
data/Rakefile +49 -0
data/example/boolean_algebra.rb +70 -0
data/example/calc.rb +153 -0
data/example/comments.rb +35 -0
data/example/deepest_errors.rb +131 -0
data/example/documentation.rb +18 -0
data/example/email_parser.rb +52 -0
data/example/empty.rb +13 -0
data/example/erb.rb +47 -0
data/example/ignore.rb +33 -0
data/example/ip_address.rb +125 -0
data/example/json.rb +128 -0
data/example/local.rb +34 -0
data/example/mathn.rb +44 -0
data/example/minilisp.rb +94 -0
data/example/modularity.rb +47 -0
data/example/nested_errors.rb +132 -0
data/example/output/boolean_algebra.out +4 -0
data/example/output/calc.out +1 -0
data/example/output/comments.out +8 -0
data/example/output/deepest_errors.out +54 -0
data/example/output/documentation.err +4 -0
data/example/output/documentation.out +1 -0
data/example/output/email_parser.out +2 -0
data/example/output/empty.err +1 -0
data/example/output/erb.out +7 -0
data/example/output/ignore.out +1 -0
data/example/output/ignore_whitespace.out +1 -0
data/example/output/ip_address.out +9 -0
data/example/output/json.out +5 -0
data/example/output/local.out +3 -0
data/example/output/mathn.out +4 -0
data/example/output/minilisp.out +5 -0
data/example/output/modularity.out +0 -0
data/example/output/nested_errors.out +54 -0
data/example/output/parens.out +8 -0
data/example/output/readme.out +1 -0
data/example/output/seasons.out +28 -0
data/example/output/sentence.out +1 -0
data/example/output/simple_xml.out +2 -0
data/example/output/string_parser.out +3 -0
data/example/parens.rb +42 -0
data/example/readme.rb +30 -0
data/example/seasons.rb +46 -0
data/example/sentence.rb +36 -0
data/example/simple.lit +3 -0
data/example/simple_xml.rb +54 -0
data/example/string_parser.rb +77 -0
data/example/test.lit +4 -0
data/lib/parslet.rb +254 -0
data/lib/parslet/atoms.rb +32 -0
data/lib/parslet/atoms/alternative.rb +50 -0
data/lib/parslet/atoms/base.rb +124 -0
data/lib/parslet/atoms/can_flatten.rb +137 -0
data/lib/parslet/atoms/context.rb +94 -0
data/lib/parslet/atoms/dsl.rb +98 -0
data/lib/parslet/atoms/entity.rb +41 -0
data/lib/parslet/atoms/lookahead.rb +49 -0
data/lib/parslet/atoms/named.rb +32 -0
data/lib/parslet/atoms/re.rb +38 -0
data/lib/parslet/atoms/repetition.rb +63 -0
data/lib/parslet/atoms/rule.rb +12 -0
data/lib/parslet/atoms/rule/position.rb +143 -0
data/lib/parslet/atoms/sequence.rb +38 -0
data/lib/parslet/atoms/str.rb +37 -0
data/lib/parslet/atoms/visitor.rb +89 -0
data/lib/parslet/cause.rb +94 -0
data/lib/parslet/convenience.rb +35 -0
data/lib/parslet/error_reporter.rb +7 -0
data/lib/parslet/error_reporter/deepest.rb +95 -0
data/lib/parslet/error_reporter/tree.rb +57 -0
data/lib/parslet/export.rb +162 -0
data/lib/parslet/expression.rb +51 -0
data/lib/parslet/expression/treetop.rb +92 -0
data/lib/parslet/parser.rb +67 -0
data/lib/parslet/pattern.rb +114 -0
data/lib/parslet/pattern/binding.rb +49 -0
data/lib/parslet/rig/rspec.rb +51 -0
data/lib/parslet/slice.rb +101 -0
data/lib/parslet/source.rb +62 -0
data/lib/parslet/source/line_cache.rb +95 -0
data/lib/parslet/transform.rb +236 -0
data/lib/parslet/transform/context.rb +32 -0
metadata +264 -0

data/HISTORY.txt ADDED

@@ -0,0 +1,195 @@
+= 2.0 / ?? (future release changes, like a reminder to self)
+  - prsnt? and absnt? are now finally banned into oblivion. Wasting vowels for
+    the win.
+= 1.4.0 / 25May2012
+  + Revised documentation. A few new API features have finally made it into
+    the documentation. Examples in the documentation are now curated and
+    run against the current code so that they really really work.
+    Also, the website generation tools have been replaced with 2012-style
+    tools. Much less pain to update now.
+  + Parslet::Source now doesn't hold a StringIO, it directly holds the
+    buffer to be parsed. The api of Source has changed a tiny bit. This change
+    has been made for speed optimisation reasons.
+  + :reporter argument to parse, allowing you to customize error reporting
+    within wide boundaries. See issue #64 for a discussion.
+    Included are two error reporters, one (default) with the existing error
+    tree functionality, one reporting deepest errors as defined by the above
+    ticket.
+  + Optimistic parse: Parsing is two phase, with the first phase assuming
+    there will be no errors. This yields ~ 20% speed improvement in the
+    case where the parse succeeds.
+    Also, internal error handling is now using tuples. This and other
+    optimizations have yielded ~ 30% overall improvement.
+  ! #error_tree and #cause removed from all of parslet. The
+    Parslet::ParseFailed exception now contains a #cause field that can
+    be asked for an #ascii_tree as before.
+    Cleaner internal error handling, not stateful in atoms anymore. Some
+    parsers will see correct error reporting for the first time. (issue #65)
+  + Made it possible to pass a custom Parslet::Source implementor to #parse.
+    (see #63)
+  + #parse now has a second argument that is an options hash. See
+    Parslet::Atoms::Base#parse for documentation.
+  - VM engine on the way out. No benefit except for the intellectual
+    challenge.
+= 1.3.0 / 5Mar2012
+  ! Parslet::Transform::Context is now much more well-behaved. It has
+    #respond_to? and #method_missing; it now looks like a plain old Ruby
+    object with instance variables and attribute readers.
+  - Grammar transforms turned out to be a dead end and have been removed.
+  ! A few problems in error message generation have been fixed. This will
+    improve diagnostics further.
+  + A VM driven parser engine: Removes the limitation that parsing needs a
+    lot of stack space, something dearly missing from Ruby 1.9.3 fibers.
+    This engine is experimental and might be removed in the future.
+  ! Interaction with mathn fixed - Line number generation will terminate.
+  . Internal reorganisation, removing cruft and bit rot.
+= 1.2.3 / 22Sep2011
+  + Transform#apply can now be called with a hash as second argument. This
+    provides bindings and a way to inject context.
+  ! Fixes a bug that modified parslet atoms in place, defeating oop chaining.
+    (#50)
+= 1.2.1 / 6Jun2011
+  ! FIX: Unconsumed input at the end of a parse raises
+    Parslet::UnconsumedInput. (see issue 18)
+  ! FIX: Unicode parsing should now work as expected. (see issue 38)
+  ! FIX: Slice#slice returned wrong bits at times (see issue 36).
+= 1.2.0 / 4Feb2011
+  + Parslet::Parser is now also a grammar atom, it can be composed freely with
+    other atoms. (str('f') >> MiniLispParser.new >> str('b'))
+  + No strings, only slices are returned as part of the parser result.
+    Parslet::Slice is almost a string class, but one that remembers the
+    source offset. This has also bought us a slight speedup.
+  + require 'parslet/convenience' now brings #parse_with_debug to all parslets.
+    This is a consequence of the above change.
+  + Deprecates prsnt? and absnt? in favor of the more readable absent? and
+    present?. Uses 3 bytes more RAM. The old variants will exist until we
+    release 2.0.
+  INTERNALLY
+  + Visitors now should have methods that all begin with 'visit_*'. #str
+    becomes #visit_str.
+  + Parslet::Atoms::Entity now takes only a block argument instead of context
+    and block.
+= 1.1.1 / 4Feb2011
+  ! FIX: Line counting was broken by performance optimisations.
+  + Squeezed out another few drops of performance.
+= 1.1.0 / 2Feb2011
+  + Uses return (fail/success), cached line counts, memoizing of parse results
+    and other tricks internally for at least an order of magnitude increase
+    in execution speed.
+  + str('foo').maybe will now return an empty string again. Use .as(...) to
+    name things and get back [] from #repeat and nil from #maybe.
+  + If you require 'parslet/atoms/visitor', you'll get an accept method on
+    all known Parslet::Atoms.
+  + If you require 'parslet/export', you can call #to_citrus and #to_treetop
+    to produce string versions of your grammar in those dialects.
+  + Requiring 'parslet/convenience' will give you a parse_with_debug on
+    your Parslet::Parser class. This prints some diagnostics on parse failure.
+    (Thanks to Florian Hanke)
+= 1.0.1 / 17Jan2011
+  A happy new year!
+  ! FIX: Parslet::Transform was wrongly fixed earlier - it now won't mangle
+    hashes anymore. (Blake Sweeney)
+  + parslet/rig/rspec.rb contains useful rspec matchers. (R. Konstantin Haase)
+= 1.0.0 / 29Dec2010
+  - #each_match was removed. There was some duplication of code that even
+    confused me - and we should not have 2 methods of achieving the same
+    goal.
+  + Full documentation. Fixed sdoc.
+= 0.11.0 / 25Nov2010
+  ! Bugfixes to tree handling. Let's hope that was the last such significant
+    change to the core.
+= 0.10.1 / 22Nov2010
+  + Allow match['a-z'], shortcut for match('[a-z]')
+  ! Fixed output inconsistencies (behaviour in connection to 'maybe')
+= 0.10.0 / 22Nov2010
+  + Parslet::Transform now takes a block on initialisation, wherein you can
+    define all the rules directly.
+  + Parslet::Transform now only passes a hash to the block during transform
+    when its arity is 1. Otherwise all hash contents are bound as local
+    variables.
+  + Both inline and other documentation have been improved.
+  + You can now use 'subtree(:x)' to bind any subtree to x during tree pattern
+    matching.
+  + Transform classes can now include rules into class definition. This makes
+    Parser and Transformer behave the same.
+= 0.9.0 / 28Oct2010
+  * More of everything: Examples, documentation, etc...
+  * Breaking change: Ruby's binary or ('|') is now used for alternatives,
+    instead of the division sign ('/') - this reduces the amount of
+    parenthesis needed for a grammar overall.
+  * parslet.maybe now yields the result or nil in case of parse failure. This
+    is probably better than the array it did before; the jury is still out on
+    that.
+  * parslet.repeat(min, max) is now valid syntax
+= 0.1.0 / not released.
+  * Initial version. Classes for parsing, matching in the resulting trees
+    and transforming the trees into something more useful.
+  * Parses and outputs intermediary trees
+  * Matching of single elements and sequences

data/LICENSE ADDED

@@ -0,0 +1,23 @@
+ Copyright (c) 2010 Kaspar Schiess
+ Permission is hereby granted, free of charge, to any person
+ obtaining a copy of this software and associated documentation
+ files (the "Software"), to deal in the Software without
+ restriction, including without limitation the rights to use,
+ copy, modify, merge, publish, distribute, sublicense, and/or sell
+ copies of the Software, and to permit persons to whom the
+ Software is furnished to do so, subject to the following
+ conditions:
+ The above copyright notice and this permission notice shall be
+ included in all copies or substantial portions of the Software.
+ THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
+ EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES
+ OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
+ NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT
+ HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,
+ WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
+ OTHER DEALINGS IN THE SOFTWARE.

data/README ADDED

@@ -0,0 +1,70 @@
+INTRODUCTION
+Parslet makes developing complex parsers easy. It does so by
+* providing the best error reporting possible
+* not generating reams of code for you to debug
+Parslet takes the long way around to make your job easier. It allows for
+incremental language construction. Often, you start out small, implementing
+the atoms of your language first; _parslet_ takes pride in making this
+possible.
+Eager to try this out? Please see the associated web site:
+http://kschiess.github.com/parslet
+SYNOPSIS
+  require 'parslet'
+  include Parslet
+  # parslet parses strings
+  str('foo').
+    parse('foo') # => "foo"@0
+  # it matches character sets
+  match['abc'].parse('a') # => "a"@0
+  match['abc'].parse('b') # => "b"@0
+  match['abc'].parse('c') # => "c"@0
+  # and it annotates its output
+  str('foo').as(:important_bit).
+    parse('foo') # => {:important_bit=>"foo"@0}
+  # you can construct parsers with just a few lines
+  quote = str('"')
+  simple_string = quote >> (quote.absent? >> any).repeat >> quote
+  simple_string.
+    parse('"Simple Simple Simple"') # => "\"Simple Simple Simple\""@0
+  # or by making a fuss about it
+  class Smalltalk < Parslet::Parser
+    root :smalltalk
+    rule(:smalltalk) { statements }
+    rule(:statements) {
+      # insert smalltalk parser here (outside of the scope of this readme)
+    }
+  end
+  # and then
+  Smalltalk.new.parse('smalltalk')
+COMPATIBILITY
+This library should work with most rubies. I've tested it with MRI 1.8
+(except 1.8.6), 1.9, rbx-head, jruby. Please report as a bug if you encounter
+issues.
+Note that due to Ruby 1.8 internals, Unicode parsing is not supported on that
+version.
+On Mac OS X Lion, ruby-1.8.7-p352 has been known to segfault. Use
+ruby-1.8.7-p334 for better results.
+STATUS
+At version 1.4.0 - See HISTORY.txt for changes.
+(c) 2010, 2011, 2012 Kaspar Schiess

data/Rakefile ADDED

@@ -0,0 +1,49 @@
+require 'rdoc/task'
+require 'sdoc'
+require 'rspec/core/rake_task'
+require "rubygems/package_task"
+desc "Run all tests: Exhaustive."
+RSpec::Core::RakeTask.new # no task name given; presumably registers RSpec's default :spec task that :default and :gem depend on below (confirm)
+namespace :spec do
+  desc "Only run unit tests: Fast. "
+  RSpec::Core::RakeTask.new(:unit) do |task| # registered inside the :spec namespace
+    task.pattern = "spec/parslet/**/*_spec.rb" # restrict the run to spec files under spec/parslet
+  end
+end
+task :default => :spec # a bare `rake` runs the :spec task
+# Generate RDoc documentation for the README and every Ruby file under lib/ into the rdoc/ directory.
+RDoc::Task.new do |rdoc|
+  rdoc.title    = "parslet - construction of parsers made easy"
+  rdoc.options << '--line-numbers'
+  rdoc.options << '--fmt' << 'shtml' # explicitly set shtml generator
+  rdoc.template = 'direct' # lighter template used on railsapi.com
+  rdoc.main = "README"
+  rdoc.rdoc_files.include("README", "lib/**/*.rb")
+  rdoc.rdoc_dir = "rdoc"
+end
+desc 'Clear out RDoc'
+task :clean => [:clobber_rdoc, :clobber_package] # despite the description, this also depends on :clobber_package
+# Building the gem requires the :spec task to run first.
+task :gem => :spec
+spec = eval(File.read('parslet.gemspec')) # NOTE(review): evaluates the gemspec text as Ruby; path is relative to the working directory, only safe for a trusted file
+desc "Generate the gem package."
+Gem::PackageTask.new(spec) do |pkg|
+  pkg.gem_spec = spec # NOTE(review): spec was already passed to the constructor; this looks redundant (confirm)
+end
+desc "Prints LOC stats"
+task :stat do
+  %w(lib spec example).each do |dir|
+    loc = %x(find #{dir} -name "*.rb" | xargs wc -l | grep 'total').split.first.to_i # shells out; reads the first field of wc's 'total' line, 0 if there is none
+    printf("%20s %d\n", dir, loc) # right-aligned directory name followed by its line count
+  end
+end

data/example/boolean_algebra.rb ADDED

@@ -0,0 +1,70 @@
+$:.unshift File.dirname(__FILE__) + "/../lib"
+require "parslet"
+require "pp"
+# Parses strings like "var1 and (var2 or var3)" respecting operator precedence
+# and parentheses. After that the parse tree is transformed into an array of
+# arrays like this:
+#
+# [["1", "2"], ["1", "3"]]
+#
+# The array represents a DNF (disjunctive normal form). Elements of the outer
+# array are connected with the "or" operator, while elements of the inner arrays are
+# joined with "and".
+# This class only builds the parse tree; the Transformer class produces the DNF array.
+class Parser < Parslet::Parser
+  rule(:space)  { match[" "].repeat(1) } # one or more literal space characters (the class contains only " ")
+  rule(:space?) { space.maybe } # optional run of spaces
+  rule(:lparen) { str("(") >> space? } # every token rule also consumes the spaces that follow it
+  rule(:rparen) { str(")") >> space? }
+  rule(:and_operator) { str("and") >> space? }
+  rule(:or_operator)  { str("or")  >> space? }
+  rule(:var) { str("var") >> match["0-9"].repeat(1).as(:var) >> space? } # only the digits after "var" are captured, under the key :var
+  # The primary rule deals with parentheses: a parenthesised or_operation, or else a single var.
+  rule(:primary) { lparen >> or_operation >> rparen | var } # Ruby's >> binds tighter than |, so the whole sequence is the first alternative
+  # Note that the following rules are both right-recursive: each refers to itself on the right-hand side of its operator.
+  rule(:and_operation) {
+    (primary.as(:left) >> and_operator >>
+      and_operation.as(:right)).as(:and) | # produces {:and => {:left => ..., :right => ...}}
+    primary } # fallback: a lone primary with no "and"
+  rule(:or_operation)  {
+    (and_operation.as(:left) >> or_operator >>
+      or_operation.as(:right)).as(:or) | # produces {:or => {:left => ..., :right => ...}}
+    and_operation } # fallback: no "or" present
+  # We start at the lowest precedence rule ("or" binds weaker than "and").
+  root(:or_operation)
+end
+class Transformer < Parslet::Transform # turns the Parser's tree into a DNF: an array (or-ed) of arrays (and-ed) of variable names
+  rule(:var => simple(:var)) { [[String(var)]] } # a single variable is a DNF with one conjunction holding one name
+  rule(:or => { :left => subtree(:left), :right => subtree(:right) }) do
+    (left + right) # "or" of two DNFs: concatenate their lists of conjunctions
+  end
+  rule(:and => { :left => subtree(:left), :right => subtree(:right) }) do
+     res = []
+     left.each do |l| # "and" of two DNFs: pair every left conjunction with every right one
+       right.each do |r|
+         res << (l + r) # merge the two conjunctions into one
+       end
+     end
+     res
+  end
+end
+pp tree = Parser.new.parse("var1 and (var2 or var3)") # keeps the parse tree in `tree` and pretty-prints it; sample output follows
+# {:and=>
+#   {:left=>{:var=>"1"@3},
+#    :right=>{:or=>{:left=>{:var=>"2"@13}, :right=>{:var=>"3"@21}}}}}
+pp Transformer.new.apply(tree) # pretty-prints the DNF array; sample output follows
+# [["1", "2"], ["1", "3"]]

data/example/calc.rb ADDED

@@ -0,0 +1,153 @@
+# A simple integer calculator to answer the question about how to do
+# left and right associativity in parslet (PEG) once and for all.
+$:.unshift File.dirname(__FILE__) + "/../lib"
+require 'rspec'
+require 'parslet'
+require 'parslet/rig/rspec'
+# This is the parsing stage. It expresses left associativity by compiling a flat
+# list of operands and operators that share the same associativity (no nested tree is built here).
+class CalcParser < Parslet::Parser
+  root :addition # parsing starts at addition, whose operands are multiplications
+  rule(:addition) {
+    multiplication.as(:l) >> (add_op >> multiplication.as(:r)).repeat(1) | # left operand, then one or more (operator, right operand) pairs
+    multiplication # fallback: no additive operator present
+  }
+  rule(:multiplication) {
+    integer.as(:l) >> (mult_op >> integer.as(:r)).repeat(1) | # same shape as addition, one level down
+    integer } # fallback: a lone integer
+  rule(:integer) { digit.repeat(1).as(:i) >> space? } # one or more digits captured as :i; trailing whitespace is consumed
+  rule(:mult_op) { match['*/'].as(:o) >> space? } # '*' or '/' captured as :o
+  rule(:add_op) { match['+-'].as(:o) >> space? } # '+' or '-' captured as :o
+  rule(:digit) { match['0-9'] }
+  rule(:space?) { match['\s'].repeat } # any run of whitespace characters, possibly empty
+end
+# Classes for the abstract syntax tree. Int is the leaf node: a Struct wrapping one integer value in its `int` member.
+Int    = Struct.new(:int) {
+  def eval; self end # a literal is already fully evaluated
+  def op(operation, other) # applies operation ('+', '-', '*' or '/') to this value and other.int, returning a new Int
+    left = int
+    right = other.int
+    Int.new(
+      case operation
+        when '+'
+          left + right
+        when '-'
+          left - right
+        when '*'
+          left * right
+        when '/'
+          left / right # integer division when both operands are Integers
+      end) # NOTE(review): there is no else branch, so an unrecognised operation yields Int.new(nil)
+  end
+  def to_i # unwraps the stored value
+    int
+  end
+}
+Seq    = Struct.new(:sequence) { # AST node holding a list: a starting element followed by callable operations
+  def eval # folds the list from left to right and returns the final accumulator
+    sequence.reduce { |accum, operation| # no initial value given, so the first element seeds the accumulator
+      operation.call(accum) } # each later element is called with the result so far
+  end
+}
+LeftOp = Struct.new(:operation, :right) { # AST node: an operator plus its right operand, waiting for a left operand
+  def call(left) # evaluates both operands and returns left.op(operation, right)
+    left = left.eval # rebinds the parameter to its evaluated form
+    right = self.right.eval # explicit self: the local `right` being assigned shadows the struct accessor
+    left.op(operation, right)
+  end
+}
+# Transforms the intermediary syntax tree produced by CalcParser into a real AST made of Int, LeftOp and Seq nodes.
+class CalcTransform < Parslet::Transform
+  rule(i: simple(:i)) { Int.new(Integer(i)) } # {i: digits} becomes an Int; Integer() raises on non-numeric input
+  rule(o: simple(:o), r: simple(:i)) { LeftOp.new(o, i) } # {o: operator, r: operand} becomes a LeftOp; the operand is bound to the name i
+  rule(l: simple(:i)) { i } # {l: operand} is unwrapped to the operand itself
+  rule(sequence(:seq)) { Seq.new(seq) } # a matched sequence of nodes becomes a Seq
+end
+# Runs the whole pipeline on str in the right order (parse, transform, evaluate) and returns the result via #to_i.
+def calculate(str)
+  intermediary_tree = CalcParser.new.parse(str) # raw parse tree of hashes and arrays
+  abstract_tree = CalcTransform.new.apply(intermediary_tree) # AST built from Int, LeftOp and Seq
+  result = abstract_tree.eval # both Int#eval and Seq#eval are expected to yield an Int here
+  result.to_i
+end
+# A test suite for the above parser; each nested describe exercises one grammar rule in isolation.
+describe CalcParser do
+  let(:p) { described_class.new } # described_class is CalcParser here
+  describe '#integer' do
+    let(:i) { p.integer } # the :integer rule on its own
+    it "parses integers" do
+      i.should parse('1') # `parse` is presumably the matcher from parslet/rig/rspec, required at the top of the file
+      i.should parse('123')
+    end
+    it "consumes trailing white space" do
+      i.should parse('123   ')
+    end
+    it "doesn't parse floats" do
+      i.should_not parse('1.3')
+    end
+  end
+  describe '#multiplication' do
+    let(:m) { p.multiplication }
+    it "parses simple multiplication" do
+      m.should parse('1*2')
+    end
+    it "parses division" do
+      m.should parse('1/2') # division is handled by the same rule as multiplication
+    end
+  end
+  describe '#addition' do
+    let(:a) { p.addition }
+    it "parses simple addition" do
+      a.should parse('1+2')
+      a.should parse('1+2+3-4') # a chain mixing '+' and '-'
+    end
+  end
+end
+describe CalcTransform do
+  def t(obj) # helper: applies a fresh CalcTransform to obj
+    described_class.new.apply(obj)
+  end
+  it "transforms integers" do
+    t(i: '1').should == Int.new(1) # Struct equality compares the wrapped values
+  end
+  it "unwraps left operand" do
+    t(l: :obj).should == :obj # any simple value under :l comes back unchanged
+  end
+end
+describe 'whole computation specs' do
+  def self.result_of(str, int) # defines one example, named after the expression, asserting calculate(str) == int
+    it(str) { calculate(str).should == int }
+  end
+  result_of '1+1', 2
+  result_of '1-1-1', -1 # left associativity: (1-1)-1, not 1-(1-1)
+  result_of '1+1+3*5/2', 9 # precedence plus integer division: 3*5/2 is 7
+  result_of '123*2', 246
+end
+# Enable the commented-out line below if you want to change the code; it presumably runs the specs above.
+# RSpec::Core::Runner.run([], $stderr, $stdout)
+str = ARGV.join # all command-line arguments concatenated without a separator
+str = '123*2' if str.match(/^\s*$/) # fall back to a demo expression when nothing (or only whitespace) was given
+print "#{str} (command line): -> "
+puts calculate(str)