RubyGems - keyword_search - Versions diffs - 1.1.1 → 1.2.0 - Mend

keyword_search 1.1.1 → 1.2.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (8)

data/History.txt +4 -0
data/Rakefile +16 -0
data/lib/keyword_search.rb +6 -5
data/lib/keyword_search/grammar.rb +1 -1
data/lib/keyword_search/parser.rb +18 -19
data/lib/keyword_search/tokenizer.rb +0 -105
data/test/test_keyword_search.rb +12 -1
metadata +2 -2

data/History.txt CHANGED

@@ -1,3 +1,7 @@
+= 1.2.0 / 2007-05-09
+* Raises KeywordSearch::ParseError instead of returning an empty Hash if an error occurs during parsing
 = 1.1.0 / 2007-03-21
 * Updated to use Dhaka 2.1.0

data/Rakefile CHANGED

@@ -23,4 +23,20 @@ task :rebuild_parser do
   end
 end
+task :rebuild_lexer do
+  require 'dhaka'
+  lexer = Dhaka::Lexer.new(KeywordSearch::LexerSpec)
+  File.open('lib/keyword_search/lexer.rb', 'w') do |file|
+    file << lexer.compile_to_ruby_source_as('KeywordSearch::Lexer')
+  end
+end
+task :rebuild_lexer do
+  require 'dhaka'
+  lexer = Dhaka::Lexer.new(KeywordSearch::LexerSpec)
+  File.open('lib/keyword_search/lexer.rb', 'w') do |file|
+    file << lexer.compile_to_ruby_source_as('KeywordSearch::Lexer')
+  end
+end
 # vim: syntax=Ruby

data/lib/keyword_search.rb CHANGED

@@ -1,20 +1,21 @@
 require 'dhaka'
 dirname = File.join(File.dirname(__FILE__), 'keyword_search')
-%w|grammar tokenizer parser evaluator definition|.each do |dependency|
+%w|grammar parser lexer_spec lexer evaluator definition|.each do |dependency|
   require File.join(dirname, dependency)
 end
 module KeywordSearch
-  VERSION = '1.1.1'
+  class ParseError < ::SyntaxError; end
+  VERSION = '1.2.0'
   class << self
     def search(input_string, definition=nil, &block)
       @evaluator ||= Evaluator.new
       definition ||= Definition.new(&block)
-      tokens = Tokenizer.tokenize(input_string)
-      parse_result = Parser.parse(tokens)
+      parse_result = Parser.parse(Lexer.lex(input_string))
       unless parse_result.has_error?
         results = @evaluator.evaluate(parse_result.parse_tree)
         results.each do |key, terms|
@@ -22,7 +23,7 @@ module KeywordSearch
         end
         results
       else
-        {}
+        raise ParseError, "Unexpected token #{parse_result.unexpected_token.inspect}"
       end
     end
   end

data/lib/keyword_search/grammar.rb CHANGED

@@ -12,7 +12,7 @@ module KeywordSearch
     end
     for_symbol 'Pair' do
-      keyword_and_term ['k', 's']
+      keyword_and_term ['s', ':', 's']
       default_keyword_term ['s']
     end

data/lib/keyword_search/parser.rb CHANGED

@@ -4,38 +4,37 @@ class KeywordSearch::Parser < Dhaka::CompiledParser
   start_with 0
-  at_state(3) {
-    for_symbols("k", "_End_", "s") { reduce_with "one_pair" }
-  }
   at_state(1) {
-    for_symbols("s") { shift_to 2 }
+    for_symbols("_End_") { reduce_with "start" }
+    for_symbols("s") { shift_to 3 }
+    for_symbols("Pair") { shift_to 2 }
   }
-  at_state(6) {
-    for_symbols("k", "_End_", "s") { reduce_with "multiple_pairs" }
+  at_state(5) {
+    for_symbols("_End_", "s") { reduce_with "keyword_and_term" }
   }
-  at_state(5) {
-    for_symbols("s") { shift_to 4 }
-    for_symbols("_End_") { reduce_with "start" }
-    for_symbols("k") { shift_to 1 }
-    for_symbols("Pair") { shift_to 6 }
+  at_state(4) {
+    for_symbols("s") { shift_to 5 }
   }
   at_state(2) {
-    for_symbols("k", "_End_", "s") { reduce_with "keyword_and_term" }
+    for_symbols("_End_", "s") { reduce_with "multiple_pairs" }
   }
   at_state(0) {
-    for_symbols("s") { shift_to 4 }
-    for_symbols("k") { shift_to 1 }
-    for_symbols("Pair") { shift_to 3 }
-    for_symbols("Pairs") { shift_to 5 }
+    for_symbols("Pair") { shift_to 6 }
+    for_symbols("s") { shift_to 3 }
+    for_symbols("Pairs") { shift_to 1 }
   }
-  at_state(4) {
-    for_symbols("k", "_End_", "s") { reduce_with "default_keyword_term" }
+  at_state(6) {
+    for_symbols("_End_", "s") { reduce_with "one_pair" }
+  }
+  at_state(3) {
+    for_symbols(":") { shift_to 4 }
+    for_symbols("_End_", "s") { reduce_with "default_keyword_term" }
   }
 end

data/lib/keyword_search/tokenizer.rb CHANGED

@@ -1,105 +0,0 @@
-module KeywordSearch
-  class Tokenizer < Dhaka::Tokenizer
-    def accumulator
-      @accumulator ||= ''
-    end
-    def accumulate(string)
-      accumulator << string
-    end
-    def clear_accumulator
-      @accumulator = ''
-    end
-    # TODO: Add further character support; this is just for initial release
-    letters = ('a'..'z').to_a + ('A'..'Z').to_a
-    numbers = ('0'..'9').to_a
-    extras = %w|_ - ' / \ [ ] { } 1 @ # $ % ^ & * ( ) . , ? < > |
-    printables = letters + numbers + extras
-    whitespace = [' ']
-    quotes = %w|' "|
-    keyword_separator = [':']
-    all_characters = keyword_separator + printables + whitespace + quotes
-    for_state :idle_state do
-      for_characters(printables) do
-        clear_accumulator
-        switch_to :unquoted_literal_state
-      end
-      for_characters(quotes) do
-        advance unless accumulator.empty?
-        clear_accumulator
-        case curr_char
-        when %<">
-          advance
-          switch_to :double_quoted_literal_state
-        when %<'>
-          advance
-          switch_to :single_quoted_literal_state
-        end
-      end
-      for_characters whitespace do
-        advance
-      end
-    end
-    for_state :unquoted_literal_state do
-      for_characters(printables) do
-        accumulate curr_char
-        advance
-        create_token('s', accumulator) unless curr_char
-      end
-      for_characters(keyword_separator) do
-        create_token 'k', accumulator
-        clear_accumulator
-        advance
-        switch_to :idle_state
-      end
-      for_characters(whitespace) do
-        create_token 's', accumulator
-        clear_accumulator
-        switch_to :idle_state
-      end
-    end
-    for_state :double_quoted_literal_state do
-      for_characters(all_characters - %w<">) do
-        accumulate curr_char
-        advance
-      end
-      for_characters %w<"> do
-        create_token 's', accumulator
-        clear_accumulator
-        advance
-        switch_to :idle_state
-      end
-    end
-    for_state :single_quoted_literal_state do
-      for_characters(all_characters - %w<'>) do
-        accumulate curr_char
-        advance
-      end
-      for_characters %w<'> do
-        create_token 's', accumulator
-        clear_accumulator
-        advance
-        switch_to :idle_state
-      end
-    end
-  end
-end

data/test/test_keyword_search.rb CHANGED

@@ -1,5 +1,5 @@
 require 'test/unit'
-require 'lib/keyword_search'
+require File.dirname(__FILE__) + '/../lib/keyword_search'
 class TestKeywordSearch < Test::Unit::TestCase
@@ -129,6 +129,17 @@ class TestKeywordSearch < Test::Unit::TestCase
     assert_equal %<okay...>, result
   end
+  def test_parse_error_results_in_exception
+    assert_raises(KeywordSearch::ParseError) do
+      KeywordSearch.search(%<we_do_not_allow:! or ::>) do |with|
+        with.default_keyword :text
+        with.keyword :text do |values|
+          result = values.first
+        end
+      end
+    end
+  end
 end

metadata CHANGED

@@ -3,8 +3,8 @@ rubygems_version: 0.9.0
 specification_version: 1
 name: keyword_search
 version: !ruby/object:Gem::Version
-  version: 1.1.1
-date: 2007-03-21 00:00:00 -06:00
+  version: 1.2.0
+date: 2007-05-09 00:00:00 -06:00
 summary: Generic support for extracting GMail-style search keywords/values from strings
 require_paths:
 - lib