RubyGems - benhamill-gherkin - Versions diffs - 2.3.5 - Mend

benhamill-gherkin 2.3.5

Files changed (170) hide show

data/.gitattributes +2 -0
data/.gitignore +11 -0
data/.mailmap +2 -0
data/.rspec +1 -0
data/.rvmrc +1 -0
data/Gemfile +7 -0
data/History.txt +363 -0
data/LICENSE +20 -0
data/README.rdoc +149 -0
data/Rakefile +19 -0
data/VERSION +1 -0
data/build_native_gems.sh +8 -0
data/cucumber.yml +3 -0
data/features/escaped_pipes.feature +8 -0
data/features/feature_parser.feature +237 -0
data/features/json_formatter.feature +377 -0
data/features/json_parser.feature +318 -0
data/features/native_lexer.feature +19 -0
data/features/parser_with_native_lexer.feature +205 -0
data/features/pretty_formatter.feature +15 -0
data/features/step_definitions/eyeball_steps.rb +3 -0
data/features/step_definitions/gherkin_steps.rb +29 -0
data/features/step_definitions/json_formatter_steps.rb +28 -0
data/features/step_definitions/json_parser_steps.rb +20 -0
data/features/step_definitions/pretty_formatter_steps.rb +84 -0
data/features/steps_parser.feature +46 -0
data/features/support/env.rb +38 -0
data/gherkin.gemspec +61 -0
data/ikvm/.gitignore +3 -0
data/java/.gitignore +5 -0
data/java/src/main/java/gherkin/lexer/i18n/.gitignore +1 -0
data/java/src/main/resources/gherkin/.gitignore +1 -0
data/js/lib/gherkin/lexer/i18n/ar.js +1094 -0
data/js/lib/gherkin/lexer/i18n/bg.js +1308 -0
data/js/lib/gherkin/lexer/i18n/ca.js +1236 -0
data/js/lib/gherkin/lexer/i18n/cs.js +1090 -0
data/js/lib/gherkin/lexer/i18n/cy_gb.js +958 -0
data/js/lib/gherkin/lexer/i18n/da.js +974 -0
data/js/lib/gherkin/lexer/i18n/de.js +1082 -0
data/js/lib/gherkin/lexer/i18n/en.js +965 -0
data/js/lib/gherkin/lexer/i18n/en_au.js +902 -0
data/js/lib/gherkin/lexer/i18n/en_lol.js +859 -0
data/js/lib/gherkin/lexer/i18n/en_pirate.js +1136 -0
data/js/lib/gherkin/lexer/i18n/en_scouse.js +1289 -0
data/js/lib/gherkin/lexer/i18n/en_tx.js +942 -0
data/js/lib/gherkin/lexer/i18n/eo.js +916 -0
data/js/lib/gherkin/lexer/i18n/es.js +1049 -0
data/js/lib/gherkin/lexer/i18n/et.js +915 -0
data/js/lib/gherkin/lexer/i18n/fi.js +894 -0
data/js/lib/gherkin/lexer/i18n/fr.js +1116 -0
data/js/lib/gherkin/lexer/i18n/he.js +1044 -0
data/js/lib/gherkin/lexer/i18n/hr.js +994 -0
data/js/lib/gherkin/lexer/i18n/hu.js +1043 -0
data/js/lib/gherkin/lexer/i18n/id.js +884 -0
data/js/lib/gherkin/lexer/i18n/it.js +1007 -0
data/js/lib/gherkin/lexer/i18n/ja.js +1344 -0
data/js/lib/gherkin/lexer/i18n/ko.js +1028 -0
data/js/lib/gherkin/lexer/i18n/lt.js +972 -0
data/js/lib/gherkin/lexer/i18n/lu.js +1057 -0
data/js/lib/gherkin/lexer/i18n/lv.js +1092 -0
data/js/lib/gherkin/lexer/i18n/nl.js +1036 -0
data/js/lib/gherkin/lexer/i18n/no.js +986 -0
data/js/lib/gherkin/lexer/i18n/pl.js +1140 -0
data/js/lib/gherkin/lexer/i18n/pt.js +1000 -0
data/js/lib/gherkin/lexer/i18n/ro.js +1089 -0
data/js/lib/gherkin/lexer/i18n/ru.js +1560 -0
data/js/lib/gherkin/lexer/i18n/sk.js +972 -0
data/js/lib/gherkin/lexer/i18n/sr_cyrl.js +1728 -0
data/js/lib/gherkin/lexer/i18n/sr_latn.js +1220 -0
data/js/lib/gherkin/lexer/i18n/sv.js +997 -0
data/js/lib/gherkin/lexer/i18n/tr.js +1014 -0
data/js/lib/gherkin/lexer/i18n/uk.js +1572 -0
data/js/lib/gherkin/lexer/i18n/uz.js +1302 -0
data/js/lib/gherkin/lexer/i18n/vi.js +1124 -0
data/js/lib/gherkin/lexer/i18n/zh_cn.js +902 -0
data/js/lib/gherkin/lexer/i18n/zh_tw.js +940 -0
data/lib/.gitignore +4 -0
data/lib/gherkin.rb +2 -0
data/lib/gherkin/c_lexer.rb +17 -0
data/lib/gherkin/formatter/ansi_escapes.rb +95 -0
data/lib/gherkin/formatter/argument.rb +16 -0
data/lib/gherkin/formatter/escaping.rb +15 -0
data/lib/gherkin/formatter/filter_formatter.rb +136 -0
data/lib/gherkin/formatter/hashable.rb +19 -0
data/lib/gherkin/formatter/json_formatter.rb +102 -0
data/lib/gherkin/formatter/line_filter.rb +26 -0
data/lib/gherkin/formatter/model.rb +236 -0
data/lib/gherkin/formatter/pretty_formatter.rb +243 -0
data/lib/gherkin/formatter/regexp_filter.rb +21 -0
data/lib/gherkin/formatter/step_printer.rb +17 -0
data/lib/gherkin/formatter/tag_count_formatter.rb +47 -0
data/lib/gherkin/formatter/tag_filter.rb +19 -0
data/lib/gherkin/i18n.rb +175 -0
data/lib/gherkin/i18n.yml +588 -0
data/lib/gherkin/json_parser.rb +137 -0
data/lib/gherkin/lexer/i18n_lexer.rb +47 -0
data/lib/gherkin/listener/event.rb +45 -0
data/lib/gherkin/listener/formatter_listener.rb +113 -0
data/lib/gherkin/native.rb +7 -0
data/lib/gherkin/native/ikvm.rb +55 -0
data/lib/gherkin/native/java.rb +55 -0
data/lib/gherkin/native/null.rb +9 -0
data/lib/gherkin/parser/meta.txt +5 -0
data/lib/gherkin/parser/parser.rb +164 -0
data/lib/gherkin/parser/root.txt +11 -0
data/lib/gherkin/parser/steps.txt +4 -0
data/lib/gherkin/rb_lexer.rb +8 -0
data/lib/gherkin/rb_lexer/.gitignore +1 -0
data/lib/gherkin/rb_lexer/README.rdoc +8 -0
data/lib/gherkin/rubify.rb +24 -0
data/lib/gherkin/tag_expression.rb +62 -0
data/lib/gherkin/version.rb +3 -0
data/ragel/i18n/.gitignore +1 -0
data/ragel/lexer.c.rl.erb +439 -0
data/ragel/lexer.java.rl.erb +208 -0
data/ragel/lexer.rb.rl.erb +167 -0
data/ragel/lexer_common.rl.erb +50 -0
data/spec/gherkin/c_lexer_spec.rb +21 -0
data/spec/gherkin/fixtures/1.feature +8 -0
data/spec/gherkin/fixtures/comments_in_table.feature +9 -0
data/spec/gherkin/fixtures/complex.feature +45 -0
data/spec/gherkin/fixtures/complex.json +143 -0
data/spec/gherkin/fixtures/complex_for_filtering.feature +60 -0
data/spec/gherkin/fixtures/complex_with_tags.feature +61 -0
data/spec/gherkin/fixtures/dos_line_endings.feature +45 -0
data/spec/gherkin/fixtures/hantu_pisang.feature +35 -0
data/spec/gherkin/fixtures/i18n_fr.feature +14 -0
data/spec/gherkin/fixtures/i18n_no.feature +7 -0
data/spec/gherkin/fixtures/i18n_zh-CN.feature +9 -0
data/spec/gherkin/fixtures/scenario_outline_with_tags.feature +13 -0
data/spec/gherkin/fixtures/scenario_without_steps.feature +5 -0
data/spec/gherkin/fixtures/simple_with_comments.feature +7 -0
data/spec/gherkin/fixtures/simple_with_tags.feature +11 -0
data/spec/gherkin/fixtures/with_bom.feature +3 -0
data/spec/gherkin/formatter/ansi_escapes_spec.rb +19 -0
data/spec/gherkin/formatter/filter_formatter_spec.rb +165 -0
data/spec/gherkin/formatter/model_spec.rb +28 -0
data/spec/gherkin/formatter/pretty_formatter_spec.rb +158 -0
data/spec/gherkin/formatter/spaces.feature +9 -0
data/spec/gherkin/formatter/step_printer_spec.rb +55 -0
data/spec/gherkin/formatter/tabs.feature +9 -0
data/spec/gherkin/formatter/tag_count_formatter_spec.rb +30 -0
data/spec/gherkin/i18n_spec.rb +152 -0
data/spec/gherkin/java_lexer_spec.rb +20 -0
data/spec/gherkin/java_libs.rb +20 -0
data/spec/gherkin/json_parser_spec.rb +113 -0
data/spec/gherkin/lexer/i18n_lexer_spec.rb +43 -0
data/spec/gherkin/output_stream_string_io.rb +20 -0
data/spec/gherkin/parser/parser_spec.rb +16 -0
data/spec/gherkin/rb_lexer_spec.rb +19 -0
data/spec/gherkin/sexp_recorder.rb +56 -0
data/spec/gherkin/shared/lexer_group.rb +593 -0
data/spec/gherkin/shared/py_string_group.rb +153 -0
data/spec/gherkin/shared/row_group.rb +125 -0
data/spec/gherkin/shared/tags_group.rb +54 -0
data/spec/gherkin/tag_expression_spec.rb +137 -0
data/spec/spec_helper.rb +69 -0
data/tasks/bench.rake +184 -0
data/tasks/bench/feature_builder.rb +49 -0
data/tasks/bench/generated/.gitignore +1 -0
data/tasks/bench/null_listener.rb +4 -0
data/tasks/compile.rake +102 -0
data/tasks/cucumber.rake +20 -0
data/tasks/gems.rake +35 -0
data/tasks/ikvm.rake +79 -0
data/tasks/ragel_task.rb +70 -0
data/tasks/rdoc.rake +9 -0
data/tasks/release.rake +30 -0
data/tasks/rspec.rake +8 -0
metadata +609 -0

data/lib/gherkin/native/null.rb ADDED Viewed

@@ -0,0 +1,9 @@
+class Class
+  def implements(java_class_name)
+    # no-op
+  end
+  def native_impl(lib)
+    # no-op
+  end
+end

data/lib/gherkin/parser/meta.txt ADDED Viewed

@@ -0,0 +1,5 @@
+ |         | feature | background | scenario | scenario_outline | examples | step  | row   | py_string | eof | comment | tag |
+ | meta    | E       | E          | E        | E                | E        | E     | E     | E         | eof | comment | tag |
+ | comment | pop()   | pop()      | pop()    | pop()            | pop()    | pop() | pop() | pop()     | eof | pop()   | tag |
+ | tag     | pop()   | E          | pop()    | pop()            | pop()    | E     | E     | E         | E   | E       | tag |
+ | eof     | E       | E          | E        | E                | E        | E     | E     | E         | E   | E       | E   |

data/lib/gherkin/parser/parser.rb ADDED Viewed

@@ -0,0 +1,164 @@
+require 'gherkin/i18n'
+require 'gherkin/lexer/i18n_lexer'
+require 'gherkin/native'
+require 'gherkin/listener/formatter_listener'
+module Gherkin
+  module Parser
+    class ParseError < StandardError
+      def initialize(state, new_state, expected_states, uri, line)
+        super("Parse error at #{uri}:#{line}. Found #{new_state} when expecting one of: #{expected_states.join(', ')}. (Current state: #{state}).")
+      end
+    end
+    class Parser
+      native_impl('gherkin')
+      # Initialize the parser. +machine_name+ refers to a state machine table.
+      def initialize(formatter, raise_on_error=true, machine_name='root', force_ruby=false)
+        @formatter = formatter
+        @listener = Listener::FormatterListener.new(@formatter)
+        @raise_on_error = raise_on_error
+        @machine_name = machine_name
+        @machines = []
+        push_machine(@machine_name)
+        @lexer = Gherkin::Lexer::I18nLexer.new(self, force_ruby)
+      end
+      def parse(gherkin, feature_uri, line_offset)
+        @formatter.uri(feature_uri)
+        @line_offset = line_offset
+        @lexer.scan(gherkin)
+      end
+      def i18n_language
+        @lexer.i18n_language
+      end
+      def errors
+        @lexer.errors
+      end
+      # Doesn't yet fall back to super
+      def method_missing(method, *args)
+        # TODO: Catch exception and call super
+        event(method.to_s, args[-1])
+        @listener.__send__(method, *args)
+        if method == :eof
+          pop_machine
+          push_machine(@machine_name)
+        end
+      end
+      def event(ev, line)
+        l = line ? @line_offset+line : nil
+        machine.event(ev, l) do |state, legal_events|
+          if @raise_on_error
+            raise ParseError.new(state, ev, legal_events, @feature_uri, l)
+          else
+            # Only used for testing
+            @listener.syntax_error(state, ev, legal_events, @feature_uri, l)
+          end
+        end
+      end
+      def push_machine(name)
+        @machines.push(Machine.new(self, name))
+      end
+      def pop_machine
+        @machines.pop
+      end
+      def machine
+        @machines[-1]
+      end
+      def expected
+        machine.expected
+      end
+      def force_state(state)
+        machine.instance_variable_set('@state', state)
+      end
+      class Machine
+        def initialize(parser, name)
+          @parser = parser
+          @name = name
+          @transition_map = transition_map(name)
+          @state = name
+        end
+        def event(ev, line)
+          states = @transition_map[@state]
+          raise "Unknown state: #{@state.inspect} for machine #{@name}" if states.nil?
+          new_state = states[ev]
+          case new_state
+          when "E"
+            yield @state, expected
+          when /push\((.+)\)/
+            @parser.push_machine($1)
+            @parser.event(ev, line)
+          when "pop()"
+            @parser.pop_machine()
+            @parser.event(ev, line)
+          else
+            raise "Unknown transition: #{ev.inspect} among #{states.inspect} for machine #{@name}" if new_state.nil?
+            @state = new_state
+          end
+        end
+        def expected
+          allowed = @transition_map[@state].find_all { |_, action| action != "E" }
+          allowed.collect { |state| state[0] }.sort - ['eof']
+        end
+        private
+        @@transition_maps = {}
+        def transition_map(name)
+          @@transition_maps[name] ||= build_transition_map(name)
+        end
+        def build_transition_map(name)
+          table = transition_table(name)
+          events = table.shift[1..-1]
+          table.inject({}) do |machine, actions|
+            state = actions.shift
+            machine[state] = Hash[*events.zip(actions).flatten]
+            machine
+          end
+        end
+        def transition_table(name)
+          state_machine_reader = StateMachineReader.new
+          lexer = Gherkin::I18n.new('en').lexer(state_machine_reader)
+          machine = File.dirname(__FILE__) + "/#{name}.txt"
+          lexer.scan(File.read(machine))
+          state_machine_reader.rows
+        end
+        class StateMachineReader
+          attr_reader :rows
+          def initialize
+            @rows = []
+          end
+          def uri(uri)
+          end
+          def row(row, line_number)
+            @rows << row
+          end
+          def eof
+          end
+        end
+      end
+    end
+  end
+end

data/lib/gherkin/parser/root.txt ADDED Viewed

@@ -0,0 +1,11 @@
+ |                  | feature | background | scenario | scenario_outline | examples | step         | row            | py_string    | eof | comment    | tag        |
+ | root             | feature | E          | E        | E                | E        | E            | E              | E            | eof | push(meta) | push(meta) |
+ | feature          | E       | background | scenario | scenario_outline | E        | E            | E              | E            | eof | push(meta) | push(meta) |
+ | step             | E       | E          | scenario | scenario_outline | E        | step         | step           | step         | eof | push(meta) | push(meta) |
+ | outline_step     | E       | E          | scenario | scenario_outline | examples | outline_step | outline_step   | outline_step | eof | push(meta) | push(meta) |
+ | background       | E       | E          | scenario | scenario_outline | E        | step         | E              | E            | eof | push(meta) | push(meta) |
+ | scenario         | E       | E          | scenario | scenario_outline | E        | step         | E              | E            | eof | push(meta) | push(meta) |
+ | scenario_outline | E       | E          | E        | E                | E        | outline_step | E              | E            | eof | push(meta) | push(meta) |
+ | examples         | E       | E          | E        | E                | E        | E            | examples_table | E            | eof | push(meta) | push(meta) |
+ | examples_table   | E       | E          | scenario | scenario_outline | examples | E            | examples_table | E            | eof | push(meta) | push(meta) |
+ | eof              | E       | E          | E        | E                | E        | E            | E              | E            | E   | E          | E          |

data/lib/gherkin/parser/steps.txt ADDED Viewed

@@ -0,0 +1,4 @@
+ |       | feature | background | scenario | scenario_outline | examples | step | row  | py_string | eof | comment | tag |
+ | steps | E       | E          | E        | E                | E        | step | E    | E         | eof | E       | E   |
+ | step  | E       | E          | E        | E                | E        | step | step | steps     | eof | E       | E   |
+ | eof   | E       | E          | E        | E                | E        | E    | E    | E         | E   | E       | E   |

data/lib/gherkin/rb_lexer.rb ADDED Viewed

@@ -0,0 +1,8 @@
+module Gherkin
+  module RbLexer
+    def self.[](i18n_underscored_iso_code)
+      require "gherkin/rb_lexer/#{i18n_underscored_iso_code}"
+      const_get(i18n_underscored_iso_code.capitalize)
+    end
+  end
+end

data/lib/gherkin/rb_lexer/.gitignore ADDED Viewed

	@@ -0,0 +1 @@
1	+ *.rb

data/lib/gherkin/rb_lexer/README.rdoc ADDED Viewed

@@ -0,0 +1,8 @@
+= Lexers
+Gherkin supports lexing of many natural languages, which are defined in gherkin/i18n.yml.
+The lexers are generated with the following command:
+    rake ragel:i18n
+You have to run this command if you modify gherkin/i18n.yml

data/lib/gherkin/rubify.rb ADDED Viewed

@@ -0,0 +1,24 @@
+module Gherkin
+  module Rubify
+    if defined?(JRUBY_VERSION)
+      # Translate Java objects to Ruby.
+      # This is especially important to convert java.util.List coming
+      # from Java and back to a Ruby Array.
+      def rubify(o)
+        case(o)
+        when Java.java.util.Collection, Array
+          o.map{|e| rubify(e)}
+        when Java.gherkin.formatter.model.PyString
+          require 'gherkin/formatter/model'
+          Formatter::Model::PyString.new(o.value, o.line)
+        else
+          o
+        end
+      end
+    else
+      def rubify(o)
+        o
+      end
+    end
+  end
+end

data/lib/gherkin/tag_expression.rb ADDED Viewed

@@ -0,0 +1,62 @@
+require 'gherkin/native'
+module Gherkin
+  class TagExpression
+    native_impl('gherkin')
+    attr_reader :limits
+    def initialize(tag_expressions)
+      @ands = []
+      @limits = {}
+      tag_expressions.each do |expr|
+        add(expr.strip.split(/\s*,\s*/))
+      end
+    end
+    def empty?
+      @ands.empty?
+    end
+    def eval(tags)
+      return true if @ands.flatten.empty?
+      vars = Hash[*tags.map{|tag| [tag, true]}.flatten]
+      !!Kernel.eval(ruby_expression)
+    end
+  private
+    def add(tags_with_negation_and_limits)
+      negatives, positives = tags_with_negation_and_limits.partition{|tag| tag =~ /^~/}
+      @ands << (store_and_extract_limits(negatives, true) + store_and_extract_limits(positives, false))
+    end
+    def store_and_extract_limits(tags_with_negation_and_limits, negated)
+      tags_with_negation = []
+      tags_with_negation_and_limits.each do |tag_with_negation_and_limit|
+        tag_with_negation, limit = tag_with_negation_and_limit.split(':')
+        tags_with_negation << tag_with_negation
+        if limit
+          tag_without_negation = negated ? tag_with_negation[1..-1] : tag_with_negation
+          if @limits[tag_without_negation] && @limits[tag_without_negation] != limit.to_i
+            raise "Inconsistent tag limits for #{tag_without_negation}: #{@limits[tag_without_negation]} and #{limit.to_i}"
+          end
+          @limits[tag_without_negation] = limit.to_i
+        end
+      end
+      tags_with_negation
+    end
+    def ruby_expression
+      "(" + @ands.map do |ors|
+        ors.map do |tag|
+          if tag =~ /^~(.*)/
+            "!vars['#{$1}']"
+          else
+            "vars['#{tag}']"
+          end
+        end.join("||")
+      end.join(")&&(") + ")"
+    end
+  end
+end

data/lib/gherkin/version.rb ADDED Viewed

@@ -0,0 +1,3 @@
+module Gherkin
+  VERSION = IO.read(File.dirname(__FILE__) + '/../../VERSION').strip
+end

data/ragel/i18n/.gitignore ADDED Viewed

	@@ -0,0 +1 @@
1	+ *.rl

data/ragel/lexer.c.rl.erb ADDED Viewed

@@ -0,0 +1,439 @@
+#include <assert.h>
+#include <ruby.h>
+#if defined(_WIN32)
+#include <stddef.h>
+#endif
+#ifdef HAVE_RUBY_RE_H
+#include <ruby/re.h>
+#else
+#include <re.h>
+#endif
+#ifdef HAVE_RUBY_ENCODING_H
+#include <ruby/encoding.h>
+#define ENCODED_STR_NEW(ptr, len) \
+    rb_enc_str_new(ptr, len, rb_utf8_encoding())
+#else
+#define ENCODED_STR_NEW(ptr, len) \
+    rb_str_new(ptr, len)
+#endif
+#ifndef RSTRING_PTR
+#define RSTRING_PTR(s) (RSTRING(s)->ptr)
+#endif
+#ifndef RSTRING_LEN
+#define RSTRING_LEN(s) (RSTRING(s)->len)
+#endif
+/* Unwraps the C struct of type TYPE held by the Ruby object FROM into the
+ * pointer NAME (Data_Get_Struct) and raises ArgumentError if the result is
+ * NULL. NAME is stringified into the error message.
+ * Expands to two statements, so do not use it as the unbraced body of an
+ * if/else. */
+#define DATA_GET(FROM, TYPE, NAME) \
+  Data_Get_Struct(FROM, TYPE, NAME); \
+  if (NAME == NULL) { \
+    rb_raise(rb_eArgError, "NULL found for " # NAME " when it shouldn't be."); \
+  }
+/* Per-lexer scanning state. The size_t members are offsets from the start of
+ * the buffer being scanned (they are stored with MARK as P - data). */
+typedef struct lexer_state {
+  int content_len;            /* reset by lexer_init; not read in this file's visible code */
+  int line_number;            /* current line, starts at 1, bumped by inc_line_number */
+  int current_line;           /* line_number captured when content, a py_string or a row starts */
+  int start_col;              /* column used when un-indenting multi-line content */
+  size_t mark;                /* start of a keyword in progress; 0 means "not set" */
+  size_t keyword_start;       /* set by end_keyword from mark */
+  size_t keyword_end;         /* set by end_keyword */
+  size_t next_keyword_start;  /* only reset by lexer_init in the visible code */
+  size_t content_start;       /* start of the content currently being collected */
+  size_t content_end;         /* set by the next_keyword_start action; 0 means "not set" */
+  size_t query_start;         /* not referenced by the visible code */
+  size_t last_newline;        /* offset just past the most recent newline */
+  size_t final_newline;       /* offset of the newline seen by inc_line_number */
+} lexer_state;
+/* Ruby modules/classes looked up or defined by the Init function. */
+static VALUE mGherkin;
+static VALUE mGherkinLexer;
+static VALUE mCLexer;
+static VALUE cI18nLexer;
+static VALUE rb_eGherkinLexingError;
+/* The macros below expect `data` (start of the scanned buffer) and `lexer`
+ * (the lexer_state) to be in scope at the point of use. */
+/* Number of bytes between the offset stored in lexer->AT and pointer P. */
+#define LEN(AT, P) (P - data - lexer->AT)
+/* Stores pointer P in lexer->M as an offset from data. */
+#define MARK(M, P) (lexer->M = (P) - data)
+/* Converts the offset expression lexer->P back into a pointer. */
+#define PTR_TO(P) (data + lexer->P)
+/* Reports a keyword with multi-line content to the listener under the event
+ * name EVENT, then, if content_end was set, moves the scan pointer `p` back
+ * to content_end - 1 and clears content_end. Also needs `listener` and `p`
+ * in scope. */
+#define STORE_KW_END_CON(EVENT) \
+  store_multiline_kw_con(listener, # EVENT, \
+    PTR_TO(keyword_start), LEN(keyword_start, PTR_TO(keyword_end - 1)), \
+    PTR_TO(content_start), LEN(content_start, PTR_TO(content_end)), \
+    lexer->current_line, lexer->start_col); \
+    if (lexer->content_end != 0) { \
+      p = PTR_TO(content_end - 1); \
+    } \
+    lexer->content_end = 0
+/* Sends the text from content_start up to `p` to the listener method named
+ * ATTR, together with the current line number. */
+#define STORE_ATTR(ATTR) \
+    store_attr(listener, # ATTR, \
+      PTR_TO(content_start), LEN(content_start, p), \
+      lexer->line_number)
+%%{
+  machine lexer;
+  action begin_content {
+		MARK(content_start, p);
+    lexer->current_line = lexer->line_number;
+    lexer->start_col = lexer->content_start - lexer->last_newline - (lexer->keyword_end - lexer->keyword_start) + 2;
+  }
+  action begin_pystring_content {
+    MARK(content_start, p);
+  }
+  action start_pystring {
+    lexer->current_line = lexer->line_number;
+    lexer->start_col = p - data - lexer->last_newline;
+  }
+  action store_pystring_content {
+    int len = LEN(content_start, PTR_TO(final_newline));
+    if (len < 0) len = 0;
+    store_pystring_content(listener, lexer->start_col, PTR_TO(content_start), len, lexer->current_line);
+  }
+  action store_feature_content {
+    STORE_KW_END_CON(feature);
+  }
+  action store_background_content {
+    STORE_KW_END_CON(background);
+  }
+  action store_scenario_content {
+    STORE_KW_END_CON(scenario);
+  }
+  action store_scenario_outline_content {
+    STORE_KW_END_CON(scenario_outline);
+  }
+  action store_examples_content {
+    STORE_KW_END_CON(examples);
+  }
+  action store_step_content {
+    store_kw_con(listener, "step",
+      PTR_TO(keyword_start), LEN(keyword_start, PTR_TO(keyword_end)),
+      PTR_TO(content_start), LEN(content_start, p),
+      lexer->current_line);
+  }
+  action store_comment_content {
+    STORE_ATTR(comment);
+    lexer->mark = 0;
+  }
+  action store_tag_content {
+    STORE_ATTR(tag);
+    lexer->mark = 0;
+  }
+  action inc_line_number {
+    lexer->line_number += 1;
+    MARK(final_newline, p);
+  }
+  action last_newline {
+    MARK(last_newline, p + 1);
+  }
+  action start_keyword {
+    if (lexer->mark == 0) {
+      MARK(mark, p);
+    }
+  }
+  action end_keyword {
+    MARK(keyword_end, p);
+    MARK(keyword_start, PTR_TO(mark));
+    MARK(content_start, p + 1);
+    lexer->mark = 0;
+  }
+  action next_keyword_start {
+    MARK(content_end, p);
+  }
+  action start_row {
+    p = p - 1;
+    lexer->current_line = lexer->line_number;
+    current_row = rb_ary_new();
+  }
+  action begin_cell_content {
+		MARK(content_start, p);
+  }
+  action store_cell_content {
+    VALUE re_pipe, re_newline, re_backslash;
+    VALUE con = ENCODED_STR_NEW(PTR_TO(content_start), LEN(content_start, p));
+    rb_funcall(con, rb_intern("strip!"), 0);
+    re_pipe      = rb_reg_regcomp(rb_str_new2("\\\\\\|"));
+    re_newline   = rb_reg_regcomp(rb_str_new2("\\\\n"));
+    re_backslash = rb_reg_regcomp(rb_str_new2("\\\\\\\\"));
+    rb_funcall(con, rb_intern("gsub!"), 2, re_pipe,      rb_str_new2("|"));
+    rb_funcall(con, rb_intern("gsub!"), 2, re_newline,   rb_str_new2("\n"));
+    rb_funcall(con, rb_intern("gsub!"), 2, re_backslash, rb_str_new2("\\"));
+    rb_ary_push(current_row, con);
+  }
+  action store_row {
+    rb_funcall(listener, rb_intern("row"), 2, current_row, INT2FIX(lexer->current_line));
+  }
+  action end_feature {
+    int line;
+    if (cs < lexer_first_final) {
+      size_t count = 0;
+      VALUE newstr_val;
+      char *newstr;
+      int newstr_count = 0;
+      size_t len;
+      const char *buff;
+      if (lexer->last_newline != 0) {
+        len = LEN(last_newline, eof);
+        buff = PTR_TO(last_newline);
+      } else {
+        len = strlen(data);
+        buff = data;
+      }
+      // Allocate as a ruby string so that it gets cleaned up by GC
+      newstr_val = rb_str_new(buff, len);
+      newstr = RSTRING_PTR(newstr_val);
+      for (count = 0; count < len; count++) {
+        if(buff[count] == 10) {
+          newstr[newstr_count] = '\0'; // terminate new string at first newline found
+          break;
+        } else {
+          if (buff[count] == '%') {
+            newstr[newstr_count++] = buff[count];
+            newstr[newstr_count] = buff[count];
+          } else {
+            newstr[newstr_count] = buff[count];
+          }
+        }
+        newstr_count++;
+      }
+      line = lexer->line_number;
+      lexer_init(lexer); // Re-initialize so we can scan again with the same lexer
+      raise_lexer_error(newstr, line);
+    } else {
+      rb_funcall(listener, rb_intern("eof"), 0);
+    }
+  }
+  include lexer_common "lexer_common.<%= @i18n.underscored_iso_code %>.rl";
+}%%
+/** Data **/
+%% write data;
+/*
+ * Removes up to start_col leading tab/space characters from the start of
+ * each line of con, modifying con in place (String#gsub!).
+ * Always returns Qnil.
+ */
+static VALUE
+unindent(VALUE con, int start_col)
+{
+  // Gherkin will crash gracefully if the string representation of start_col pushes the pattern past 32 characters
+  char pattern[32];
+  VALUE indent_re;
+  snprintf(pattern, sizeof(pattern), "^[\t ]{0,%d}", start_col);
+  indent_re = rb_reg_regcomp(rb_str_new2(pattern));
+  rb_funcall(con, rb_intern("gsub!"), 2, indent_re, rb_str_new2(""));
+  return Qnil;
+}
+/*
+ * Calls listener.<event_name>(keyword, content, line) where keyword and
+ * content are new Ruby strings built from the given spans; the content is
+ * stripped of surrounding whitespace first.
+ */
+static void
+store_kw_con(VALUE listener, const char * event_name,
+             const char * keyword_at, size_t keyword_length,
+             const char * at,         size_t length,
+             int current_line)
+{
+  VALUE kw = ENCODED_STR_NEW(keyword_at, keyword_length);
+  VALUE con = ENCODED_STR_NEW(at, length);
+  rb_funcall(con, rb_intern("strip!"), 0);
+  rb_funcall(listener, rb_intern(event_name), 3,
+             kw, con, INT2FIX(current_line));
+}
+/*
+ * Calls listener.<event_name>(keyword, name, description, line).
+ * The content span is un-indented by start_col and split on newlines: the
+ * first line (stripped) is the name, the remaining lines joined with "\n"
+ * (right-stripped) are the description. Empty content yields an empty name.
+ */
+static void
+store_multiline_kw_con(VALUE listener, const char * event_name,
+                      const char * keyword_at, size_t keyword_length,
+                      const char * at,         size_t length,
+                      int current_line, int start_col)
+{
+  VALUE split;
+  VALUE con = Qnil, kw = Qnil, name = Qnil, desc = Qnil;
+  kw = ENCODED_STR_NEW(keyword_at, keyword_length);
+  con = ENCODED_STR_NEW(at, length);
+  unindent(con, start_col);
+  split = rb_str_split(con, "\n");
+  name = rb_funcall(split, rb_intern("shift"), 0);
+  /* rb_ary_join always returns a String, so desc needs no empty-check.
+   * (The former check compared a Fixnum VALUE with raw 0, which can never
+   * be equal, so it was dead code.) */
+  desc = rb_ary_join(split, rb_str_new2( "\n" ));
+  if( name == Qnil )
+  {
+    /* shift returned nil: there was no first line at all */
+    name = rb_str_new2("");
+  }
+  rb_funcall(name, rb_intern("strip!"), 0);
+  rb_funcall(desc, rb_intern("rstrip!"), 0);
+  rb_funcall(listener, rb_intern(event_name), 4, kw, name, desc, INT2FIX(current_line));
+}
+/*
+ * Calls listener.<attr_type>(text, line) with a new Ruby string built from
+ * the span at..at+length.
+ */
+static void
+store_attr(VALUE listener, const char * attr_type,
+           const char * at, size_t length,
+           int line)
+{
+  VALUE text = ENCODED_STR_NEW(at, length);
+  VALUE line_no = INT2FIX(line);
+  rb_funcall(listener, rb_intern(attr_type), 2, text, line_no);
+}
+/*
+ * Calls listener.py_string(content, line). The content span is un-indented
+ * by start_col, a carriage return at the very end is removed, and escaped
+ * triple quotes (\"\"\") are turned back into plain triple quotes.
+ */
+static void
+store_pystring_content(VALUE listener,
+          int start_col,
+          const char *at, size_t length,
+          int current_line)
+{
+  VALUE trailing_cr_re;
+  VALUE escaped_quotes_re;
+  VALUE con = ENCODED_STR_NEW(at, length);
+
+  unindent(con, start_col);
+
+  trailing_cr_re = rb_reg_regcomp(rb_str_new2("\r\\Z"));
+  escaped_quotes_re = rb_reg_regcomp(rb_str_new2("\\\\\"\\\\\"\\\\\""));
+  rb_funcall(con, rb_intern("sub!"), 2, trailing_cr_re, rb_str_new2(""));
+  rb_funcall(con, rb_intern("gsub!"), 2, escaped_quotes_re, rb_str_new2("\"\"\""));
+
+  rb_funcall(listener, rb_intern("py_string"), 2, con, INT2FIX(current_line));
+}
+/*
+ * Raises Gherkin::Lexer::LexingError for the given line number, quoting the
+ * NUL-terminated text `at` in the message. Does not return.
+ */
+static void
+raise_lexer_error(const char * at, int line)
+{
+  rb_raise(rb_eGherkinLexingError,
+           "Lexing error on line %d: '%s'. See http://wiki.github.com/aslakhellesoy/gherkin/lexingerror for more information.",
+           line, at);
+}
+/*
+ * Resets every field of the lexer state so a new scan can start:
+ * all offsets and counters go to 0 and the line number goes back to 1.
+ * The struct comes from ALLOC (uninitialized memory), so current_line and
+ * query_start are reset here as well rather than left indeterminate.
+ */
+static void lexer_init(lexer_state *lexer) {
+  lexer->content_start = 0;
+  lexer->content_end = 0;
+  lexer->content_len = 0;
+  lexer->mark = 0;
+  lexer->keyword_start = 0;
+  lexer->keyword_end = 0;
+  lexer->next_keyword_start = 0;
+  lexer->query_start = 0;
+  lexer->line_number = 1;
+  lexer->current_line = 0;
+  lexer->last_newline = 0;
+  lexer->final_newline = 0;
+  lexer->start_col = 0;
+}
+/*
+ * Allocator for the lexer class: creates an initialized lexer_state and
+ * wraps it in a Ruby object of class klass (no mark function, free
+ * function given as -1).
+ */
+static VALUE CLexer_alloc(VALUE klass)
+{
+  lexer_state *state = ALLOC(lexer_state);
+  lexer_init(state);
+  return Data_Wrap_Struct(klass, NULL, -1, state);
+}
+/*
+ * initialize(listener): stores the listener in @listener and resets the
+ * wrapped lexer state. Returns self.
+ */
+static VALUE CLexer_init(VALUE self, VALUE listener)
+{
+  /* The name `lxr` is part of the DATA_GET error message; keep it. */
+  lexer_state *lxr = NULL;
+
+  rb_iv_set(self, "@listener", listener);
+  DATA_GET(self, lexer_state, lxr);
+  lexer_init(lxr);
+
+  return self;
+}
+/*
+ * scan(input): runs the generated state machine over a copy of input and
+ * reports what it finds to @listener through the machine's actions.
+ * Returns Qtrue, or raises LexingError when the machine ends in its error
+ * state. The lexer state is re-initialized after every run.
+ */
+static VALUE CLexer_scan(VALUE self, VALUE input)
+{
+  VALUE input_copy;
+  char *data;
+  size_t len;
+  VALUE listener = rb_iv_get(self, "@listener");
+  lexer_state *lexer;
+  lexer = NULL;
+  DATA_GET(self, lexer_state, lexer);
+  /* Work on a copy so the end-of-feature sentinel is not added to the caller's string. */
+  input_copy = rb_str_dup(input);
+  rb_str_append(input_copy, rb_str_new2("\n%_FEATURE_END_%"));
+  data = RSTRING_PTR(input_copy);
+  len = RSTRING_LEN(input_copy);
+  /* NOTE(review): the sentinel was just appended, so len looks like it can
+   * never be 0 here and this branch appears unreachable - confirm. */
+  if (len == 0) {
+    rb_raise(rb_eGherkinLexingError, "No content to lex.");
+  } else {
+    /* p, pe, eof, cs and current_row are the names the generated code and
+     * the actions refer to. */
+    const char *p, *pe, *eof;
+    int cs = 0;
+    VALUE current_row = Qnil;
+    p = data;
+    pe = data + len;
+    eof = pe;
+    assert(*pe == '\0' && "pointer does not end on NULL");
+    %% write init;
+    %% write exec;
+    assert(p <= pe && "data overflow after parsing execute");
+    assert(lexer->content_start <= len && "content starts after data end");
+    assert(lexer->mark < len && "mark is after data end");
+    // Reset lexer by re-initializing the whole thing
+    lexer_init(lexer);
+    if (cs == lexer_error) {
+      rb_raise(rb_eGherkinLexingError, "Invalid format, lexing fails.");
+    } else {
+      return Qtrue;
+    }
+  }
+}
+/*
+ * Extension entry point (the function name is completed by the ERB template
+ * with the language code). Defines Gherkin::CLexer::<Language> with an
+ * allocator, initialize(listener) and scan(input).
+ */
+void Init_gherkin_lexer_<%= @i18n.underscored_iso_code %>()
+{
+  mGherkin = rb_define_module("Gherkin");
+  mGherkinLexer = rb_define_module_under(mGherkin, "Lexer");
+  /* Looked up, not defined: Gherkin::Lexer::LexingError presumably has to be
+   * loaded on the Ruby side before this extension - verify against the loader. */
+  rb_eGherkinLexingError = rb_const_get(mGherkinLexer, rb_intern("LexingError"));
+  mCLexer = rb_define_module_under(mGherkin, "CLexer");
+  cI18nLexer = rb_define_class_under(mCLexer, "<%= @i18n.underscored_iso_code.capitalize %>", rb_cObject);
+  rb_define_alloc_func(cI18nLexer, CLexer_alloc);
+  rb_define_method(cI18nLexer, "initialize", CLexer_init, 1);
+  rb_define_method(cI18nLexer, "scan", CLexer_scan, 1);
+}