RubyGems - picky - Versions diffs - 2.7.0 → 3.0.0.pre1 - Mend

picky 2.7.0 → 3.0.0.pre1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (213) hide show

data/lib/picky/adapters/rack/base.rb +20 -16
data/lib/picky/adapters/rack/live_parameters.rb +28 -24
data/lib/picky/adapters/rack/search.rb +67 -0
data/lib/picky/adapters/rack.rb +27 -23
data/lib/picky/application.rb +246 -236
data/lib/picky/backend/base.rb +115 -119
data/lib/picky/backend/file/basic.rb +102 -98
data/lib/picky/backend/file/json.rb +27 -23
data/lib/picky/backend/file/marshal.rb +32 -28
data/lib/picky/backend/file/text.rb +45 -41
data/lib/picky/backend/files.rb +19 -15
data/lib/picky/backend/redis/basic.rb +76 -72
data/lib/picky/backend/redis/list_hash.rb +40 -36
data/lib/picky/backend/redis/string_hash.rb +30 -26
data/lib/picky/backend/redis.rb +32 -28
data/lib/picky/bundle.rb +82 -57
data/lib/{bundling.rb → picky/bundling.rb} +0 -0
data/lib/picky/calculations/location.rb +51 -47
data/lib/picky/categories.rb +60 -56
data/lib/picky/categories_indexed.rb +73 -82
data/lib/picky/categories_indexing.rb +12 -8
data/lib/picky/category.rb +109 -120
data/lib/picky/category_indexed.rb +39 -41
data/lib/picky/category_indexing.rb +123 -125
data/lib/picky/character_substituters/west_european.rb +32 -26
data/lib/{constants.rb → picky/constants.rb} +0 -0
data/lib/picky/cores.rb +96 -92
data/lib/{deployment.rb → picky/deployment.rb} +0 -0
data/lib/picky/frontend_adapters/rack.rb +133 -118
data/lib/picky/generators/aliases.rb +5 -3
data/lib/picky/generators/base.rb +11 -7
data/lib/picky/generators/partial/default.rb +7 -3
data/lib/picky/generators/partial/none.rb +24 -20
data/lib/picky/generators/partial/strategy.rb +20 -16
data/lib/picky/generators/partial/substring.rb +94 -90
data/lib/picky/generators/partial_generator.rb +11 -7
data/lib/picky/generators/similarity/default.rb +9 -5
data/lib/picky/generators/similarity/double_metaphone.rb +20 -16
data/lib/picky/generators/similarity/metaphone.rb +20 -16
data/lib/picky/generators/similarity/none.rb +23 -19
data/lib/picky/generators/similarity/phonetic.rb +49 -45
data/lib/picky/generators/similarity/soundex.rb +20 -16
data/lib/picky/generators/similarity/strategy.rb +10 -6
data/lib/picky/generators/similarity_generator.rb +11 -7
data/lib/picky/generators/strategy.rb +14 -10
data/lib/picky/generators/weights/default.rb +9 -5
data/lib/picky/generators/weights/logarithmic.rb +30 -26
data/lib/picky/generators/weights/strategy.rb +10 -6
data/lib/picky/generators/weights_generator.rb +11 -7
data/lib/picky/helpers/measuring.rb +20 -16
data/lib/picky/indexed/bundle/base.rb +39 -37
data/lib/picky/indexed/bundle/memory.rb +68 -64
data/lib/picky/indexed/bundle/redis.rb +73 -69
data/lib/picky/indexed/wrappers/bundle/calculation.rb +26 -22
data/lib/picky/indexed/wrappers/bundle/location.rb +30 -26
data/lib/picky/indexed/wrappers/bundle/wrapper.rb +36 -32
data/lib/picky/indexed/wrappers/category/location.rb +17 -13
data/lib/picky/indexed/wrappers/exact_first.rb +46 -42
data/lib/picky/indexers/base.rb +26 -22
data/lib/picky/indexers/parallel.rb +62 -58
data/lib/picky/indexers/serial.rb +41 -37
data/lib/picky/indexes/index.rb +400 -0
data/lib/picky/indexes/index_indexed.rb +24 -0
data/lib/picky/indexes/index_indexing.rb +138 -0
data/lib/picky/indexes/memory.rb +20 -0
data/lib/picky/indexes/redis.rb +20 -0
data/lib/picky/indexes.rb +68 -61
data/lib/picky/indexes_indexed.rb +16 -12
data/lib/picky/indexes_indexing.rb +41 -37
data/lib/picky/indexing/bundle/base.rb +216 -205
data/lib/picky/indexing/bundle/memory.rb +16 -11
data/lib/picky/indexing/bundle/redis.rb +14 -12
data/lib/picky/indexing/wrappers/category/location.rb +17 -13
data/lib/picky/interfaces/live_parameters.rb +159 -154
data/lib/picky/loader.rb +267 -304
data/lib/picky/loggers/search.rb +20 -13
data/lib/picky/no_source_specified_exception.rb +7 -3
data/lib/picky/performant.rb +6 -2
data/lib/picky/query/allocation.rb +71 -67
data/lib/picky/query/allocations.rb +99 -94
data/lib/picky/query/combination.rb +70 -66
data/lib/picky/query/combinations/base.rb +56 -52
data/lib/picky/query/combinations/memory.rb +36 -32
data/lib/picky/query/combinations/redis.rb +66 -62
data/lib/picky/query/indexes.rb +175 -160
data/lib/picky/query/qualifier_category_mapper.rb +43 -0
data/lib/picky/query/token.rb +165 -172
data/lib/picky/query/tokens.rb +86 -82
data/lib/picky/query/weights.rb +44 -48
data/lib/picky/query.rb +5 -1
data/lib/picky/rack/harakiri.rb +51 -47
data/lib/picky/results.rb +81 -77
data/lib/picky/search.rb +169 -158
data/lib/picky/sinatra.rb +34 -0
data/lib/picky/sources/base.rb +73 -70
data/lib/picky/sources/couch.rb +61 -57
data/lib/picky/sources/csv.rb +68 -64
data/lib/picky/sources/db.rb +139 -135
data/lib/picky/sources/delicious.rb +52 -48
data/lib/picky/sources/mongo.rb +68 -63
data/lib/picky/sources/wrappers/base.rb +20 -16
data/lib/picky/sources/wrappers/location.rb +37 -33
data/lib/picky/statistics.rb +46 -43
data/lib/picky/tasks.rb +3 -0
data/lib/picky/tokenizers/base.rb +192 -187
data/lib/picky/tokenizers/index.rb +25 -21
data/lib/picky/tokenizers/location.rb +33 -29
data/lib/picky/tokenizers/query.rb +49 -43
data/lib/picky.rb +21 -13
data/lib/tasks/application.rake +1 -1
data/lib/tasks/index.rake +3 -3
data/lib/tasks/routes.rake +1 -1
data/lib/tasks/server.rake +1 -1
data/spec/lib/adapters/rack/base_spec.rb +1 -1
data/spec/lib/adapters/rack/live_parameters_spec.rb +1 -1
data/spec/lib/adapters/rack/query_spec.rb +1 -1
data/spec/lib/application_spec.rb +39 -32
data/spec/lib/backend/file/basic_spec.rb +2 -2
data/spec/lib/backend/file/json_spec.rb +2 -2
data/spec/lib/backend/file/marshal_spec.rb +2 -2
data/spec/lib/backend/file/text_spec.rb +1 -1
data/spec/lib/backend/files_spec.rb +14 -24
data/spec/lib/backend/redis/basic_spec.rb +2 -2
data/spec/lib/backend/redis/list_hash_spec.rb +3 -3
data/spec/lib/backend/redis/string_hash_spec.rb +3 -3
data/spec/lib/backend/redis_spec.rb +20 -13
data/spec/lib/calculations/location_spec.rb +1 -1
data/spec/lib/categories_indexed_spec.rb +16 -34
data/spec/lib/category_indexed_spec.rb +9 -27
data/spec/lib/category_indexing_spec.rb +2 -3
data/spec/lib/category_spec.rb +10 -10
data/spec/lib/character_substituters/west_european_spec.rb +6 -5
data/spec/lib/cores_spec.rb +17 -17
data/spec/lib/extensions/symbol_spec.rb +15 -1
data/spec/lib/frontend_adapters/rack_spec.rb +20 -20
data/spec/lib/generators/aliases_spec.rb +3 -3
data/spec/lib/generators/cacher_strategy_spec.rb +1 -1
data/spec/lib/generators/partial/default_spec.rb +3 -3
data/spec/lib/generators/partial/none_spec.rb +2 -2
data/spec/lib/generators/partial/substring_spec.rb +1 -1
data/spec/lib/generators/partial_generator_spec.rb +3 -3
data/spec/lib/generators/similarity/double_metaphone_spec.rb +1 -1
data/spec/lib/generators/similarity/metaphone_spec.rb +1 -1
data/spec/lib/generators/similarity/none_spec.rb +1 -1
data/spec/lib/generators/similarity/phonetic_spec.rb +1 -1
data/spec/lib/generators/similarity/soundex_spec.rb +1 -1
data/spec/lib/generators/similarity_generator_spec.rb +2 -2
data/spec/lib/generators/weights/logarithmic_spec.rb +1 -1
data/spec/lib/generators/weights_generator_spec.rb +1 -1
data/spec/lib/helpers/measuring_spec.rb +2 -2
data/spec/lib/indexed/bundle/memory_spec.rb +6 -6
data/spec/lib/indexed/bundle/redis_spec.rb +4 -4
data/spec/lib/indexed/wrappers/bundle/calculation_spec.rb +2 -3
data/spec/lib/indexed/wrappers/bundle/wrapper_spec.rb +2 -2
data/spec/lib/indexed/wrappers/exact_first_spec.rb +5 -5
data/spec/lib/indexers/base_spec.rb +1 -1
data/spec/lib/indexers/parallel_spec.rb +1 -1
data/spec/lib/indexers/serial_spec.rb +1 -1
data/spec/lib/{index/base_indexed_spec.rb → indexes/index_indexed_spec.rb} +3 -3
data/spec/lib/{index/base_indexing_spec.rb → indexes/index_indexing_spec.rb} +19 -2
data/spec/lib/{index/base_spec.rb → indexes/index_spec.rb} +6 -25
data/spec/lib/{index → indexes}/redis_spec.rb +1 -1
data/spec/lib/indexes_class_spec.rb +2 -2
data/spec/lib/indexes_indexed_spec.rb +1 -1
data/spec/lib/indexes_indexing_spec.rb +1 -1
data/spec/lib/indexes_spec.rb +1 -1
data/spec/lib/indexing/bundle/base_spec.rb +7 -5
data/spec/lib/indexing/bundle/memory_partial_generation_speed_spec.rb +4 -4
data/spec/lib/indexing/bundle/memory_spec.rb +15 -15
data/spec/lib/indexing/bundle/redis_spec.rb +9 -9
data/spec/lib/interfaces/live_parameters_spec.rb +5 -5
data/spec/lib/loader_spec.rb +17 -19
data/spec/lib/loggers/search_spec.rb +2 -2
data/spec/lib/query/allocation_spec.rb +1 -1
data/spec/lib/query/allocations_spec.rb +1 -1
data/spec/lib/query/combination_spec.rb +4 -4
data/spec/lib/query/combinations/base_spec.rb +1 -1
data/spec/lib/query/combinations/memory_spec.rb +1 -1
data/spec/lib/query/combinations/redis_spec.rb +1 -1
data/spec/lib/query/indexes_spec.rb +7 -2
data/spec/lib/query/qualifier_category_mapper_spec.rb +34 -0
data/spec/lib/query/token_spec.rb +32 -53
data/spec/lib/query/tokens_spec.rb +30 -35
data/spec/lib/query/weights_spec.rb +16 -16
data/spec/lib/rack/harakiri_spec.rb +5 -5
data/spec/lib/results_spec.rb +1 -1
data/spec/lib/search_spec.rb +24 -22
data/spec/lib/sinatra_spec.rb +36 -0
data/spec/lib/sources/base_spec.rb +1 -1
data/spec/lib/sources/couch_spec.rb +9 -9
data/spec/lib/sources/csv_spec.rb +7 -7
data/spec/lib/sources/db_spec.rb +2 -2
data/spec/lib/sources/delicious_spec.rb +5 -5
data/spec/lib/sources/mongo_spec.rb +7 -7
data/spec/lib/sources/wrappers/base_spec.rb +2 -2
data/spec/lib/sources/wrappers/location_spec.rb +1 -1
data/spec/lib/statistics_spec.rb +1 -1
data/spec/lib/tokenizers/base_spec.rb +2 -2
data/spec/lib/tokenizers/index_spec.rb +1 -1
data/spec/lib/tokenizers/query_spec.rb +1 -1
metadata +30 -30
data/lib/picky/adapters/rack/query.rb +0 -65
data/lib/picky/index/base.rb +0 -409
data/lib/picky/index/base_indexed.rb +0 -29
data/lib/picky/index/base_indexing.rb +0 -127
data/lib/picky/index/memory.rb +0 -16
data/lib/picky/index/redis.rb +0 -16
data/lib/picky/query/qualifiers.rb +0 -76
data/lib/picky/query/solr.rb +0 -60
data/lib/picky/signals.rb +0 -8
data/lib/picky-tasks.rb +0 -6
data/lib/tasks/spec.rake +0 -11
data/spec/lib/query/qualifiers_spec.rb +0 -31

data/lib/picky/query/token.rb CHANGED Viewed

@@ -1,202 +1,195 @@
-module Query
+module Picky
-  # This is a query token. Together with other tokens it makes up a query.
-  #
-  # It remembers the original form, and and a normalized form.
-  #
-  # It also knows whether it needs to look for similarity (bla~), or whether it is a partial (bla*).
-  #
-  class Token # :nodoc:all
+  module Query
-    attr_reader :text, :original
-    attr_writer :similar
-    delegate :blank?, :to => :text
-    # Normal initializer.
-    #
-    # Note: Use this if you do not want a qualified and normalized token.
-    #
-    # TODO text, qualifiers
+    # This is a query token. Together with other tokens it makes up a query.
     #
-    def initialize text
-      @text = text
-    end
-    # Returns a qualified and normalized token.
+    # It remembers the original form, and a normalized form.
     #
-    # Note: Use this in the search engine if you need a qualified
-    #       and normalized token. I.e. one prepared for a search.
+    # It also knows whether it needs to look for similarity (bla~), or whether it is a partial (bla*).
     #
-    def self.processed text, downcase = true
-      new(text).process downcase
-    end
-    def process downcases = true
-      qualify
-      extract_original
-      downcase if downcases
-      partialize
-      similarize
-      remove_illegals
-      symbolize
-      self
-    end
+    class Token # :nodoc:all
-    # This returns an array of predefined category names if the user has given any.
-    #
-    def user_defined_category_names
-      @qualifiers
-    end
-    # Extracts a qualifier for this token and pre-assigns an allocation.
-    #
-    # Note: Removes the qualifier if it is not allowed.
-    #
-    # TODO Extract this sind it is Search-based.
-    #
-    def qualify
-      @qualifiers, @text = split @text
-      @qualifiers && @qualifiers.collect! { |qualifier| Query::Qualifiers.instance.normalize qualifier }.compact!
-      @qualifiers
-    end
-    def extract_original
-      @original = @text.dup
-    end
+      attr_reader :text, :original, :qualifiers, :user_defined_categories
+      attr_writer :similar
-    # Downcases the text.
-    #
-    def downcase
-      @text.downcase!
-    end
+      delegate :blank?, :to => :text
-    # Partial is a conditional setter.
-    #
-    # It is only settable if it hasn't been set yet.
-    #
-    def partial= partial
-      @partial = partial if @partial.nil?
-    end
-    def partial?
-      !@similar && @partial
-    end
+      # Normal initializer.
+      #
+      # Note: Use this if you do not want a normalized token.
+      #
+      def initialize text
+        @text = text
+      end
-    # If the text ends with *, partialize it. If with ", don't.
-    #
-    # The latter wins. So "hello*" will not be partially searched.
-    #
-    @@no_partial = /\"\Z/
-    @@partial    = /\*\Z/
-    def partialize
-      self.partial = false and return unless @text !~ @@no_partial
-      self.partial = true unless @text !~ @@partial
-    end
+      # Returns a qualified and normalized token.
+      #
+      # Note: Use this in the search engine if you need a qualified
+      #       and normalized token. I.e. one prepared for a search.
+      #
+      def self.processed text, downcase = true
+        new(text).process downcase
+      end
+      def process downcased = true
+        qualify
+        extract_original
+        downcase if downcased
+        partialize
+        similarize
+        remove_illegals
+        symbolize
+        self
+      end
-    # If the text ends with ~ similarize it. If with ", don't.
-    #
-    # The latter wins.
-    #
-    @@no_similar = /\"\Z/
-    @@similar    = /\~\Z/
-    def similarize
-      self.similar = false and return if @text =~ @@no_similar
-      self.similar = true if @text =~ @@similar
-    end
+      # Translates this token's qualifiers into actual categories.
+      #
+      # Note: If this is not done, there is no mapping.
+      #
+      def categorize mapper
+        @user_defined_categories = @qualifiers && @qualifiers.map do |qualifier|
+          mapper.map qualifier
+        end.compact
+      end
-    def similar?
-      @similar
-    end
+      # Dups the original text.
+      #
+      def extract_original
+        @original = @text.dup
+      end
-    # Normalizes this token's text.
-    #
-    @@illegals = /["*~]/
-    def remove_illegals
-      @text.gsub! @@illegals, '' unless @text.blank?
-    end
+      # Downcases the text.
+      #
+      def downcase
+        @text.downcase!
+      end
-    #
-    #
-    def symbolize
-      @text = @text.to_sym
-    end
+      # Partial is a conditional setter.
+      #
+      # It is only settable if it hasn't been set yet.
+      #
+      def partial= partial
+        @partial = partial if @partial.nil?
+      end
+      def partial?
+        !@similar && @partial
+      end
-    # Returns an array of possible combinations.
-    #
-    def possible_combinations_in index
-      index.possible_combinations self
-    end
+      # If the text ends with *, partialize it. If with ", don't.
+      #
+      # The latter wins. So "hello*" will not be partially searched.
+      #
+      @@no_partial = /\"\Z/
+      @@partial    = /\*\Z/
+      def partialize
+        self.partial = false and return unless @text !~ @@no_partial
+        self.partial = true unless @text !~ @@partial
+      end
-    # Returns a token with the next similar text.
-    #
-    # TODO Rewrite this. It is hard to understand. Also spec performance.
-    #
-    def next_similar_token category
-      token = self.dup
-      token if token.next_similar category.bundle_for(token)
-    end
-    # Sets and returns the next similar word.
-    #
-    # Note: Also overrides the original.
-    #
-    def next_similar bundle
-      @text = @original = (similarity(bundle).shift || return) if similar?
-    end
-    # Lazy similar reader.
-    #
-    def similarity bundle = nil
-      @similarity || @similarity = generate_similarity_for(bundle)
-    end
-    # Returns an enumerator that traverses over the similar.
-    #
-    # Note: The dup isn't too nice – since it is needed on account of the shift, above.
-    #       (We avoid a StopIteration exception. Which of both is less evil?)
-    #
-    def generate_similarity_for bundle
-      bundle.similar(@text).dup || []
-    end
+      # If the text ends with ~ similarize it. If with ", don't.
+      #
+      # The latter wins.
+      #
+      @@no_similar = /\"\Z/
+      @@similar    = /\~\Z/
+      def similarize
+        self.similar = false and return if @text =~ @@no_similar
+        self.similar = true if @text =~ @@similar
+      end
-    #
-    #
-    def to_result
-      [@original, @text]
-    end
+      def similar?
+        @similar
+      end
-    # Internal identifier.
-    #
-    def identifier
-      "#{similar?? :similarity : :inverted}:#{@text}"
-    end
+      # Normalizes this token's text.
+      #
+      @@illegals = /["*~]/
+      def remove_illegals
+        @text.gsub! @@illegals, '' unless @text.blank?
+      end
-    # If the originals & the text are the same, they are the same.
-    #
-    def == other
-      self.original == other.original && self.text == other.text
-    end
+      #
+      #
+      def symbolize
+        @text = @text.to_sym
+      end
-    # Displays the qualifier text and the text, joined.
-    #
-    # e.g. name:meier
-    #
-    @@split_qualifier_text = ':'
-    @@split_qualifiers     = ','
-    def to_s
-      [@qualifiers && @qualifiers.join(@@split_qualifiers), @text].compact.join @@split_qualifier_text
-    end
+      # Returns an array of possible combinations.
+      #
+      def possible_combinations_in index
+        index.possible_combinations self
+      end
-    private
+      # Returns a token with the next similar text.
+      #
+      # THINK Rewrite this. It is hard to understand. Also spec performance.
+      #
+      def next_similar_token category
+        token = self.dup
+        token if token.next_similar category.bundle_for(token)
+      end
+      # Sets and returns the next similar word.
+      #
+      # Note: Also overrides the original.
+      #
+      def next_similar bundle
+        @text = @original = (similarity(bundle).shift || return) if similar?
+      end
+      # Lazy similar reader.
+      #
+      def similarity bundle = nil
+        @similarity || @similarity = generate_similarity_for(bundle)
+      end
+      # Returns an enumerator that traverses over the similar.
+      #
+      # Note: The dup isn't too nice – since it is needed on account of the shift, above.
+      #       (We avoid a StopIteration exception. Which of both is less evil?)
+      #
+      def generate_similarity_for bundle
+        bundle.similar(@text).dup || []
+      end
       # Splits text into a qualifier and text.
       #
-      # Returns [qualifier, text].
-      #
-      def split unqualified_text
-        qualifiers, text = (unqualified_text || '').split(@@split_qualifier_text, 2)
-        if text.blank?
-          [nil, (qualifiers || '')]
+      @@split_qualifier_text = ':'
+      @@split_qualifiers     = ','
+      def qualify
+        @qualifiers, @text = (@text || '').split(@@split_qualifier_text, 2)
+        @qualifiers, @text = if @text.blank?
+          [nil, (@qualifiers || '')]
         else
-          [qualifiers.split(@@split_qualifiers), text]
+          [@qualifiers.split(@@split_qualifiers), @text]
         end
       end
+      #
+      #
+      def to_result
+        [@original, @text]
+      end
+      # Internal identifier.
+      #
+      def identifier
+        "#{similar?? :similarity : :inverted}:#{@text}"
+      end
+      # If the originals & the text are the same, they are the same.
+      #
+      def == other
+        self.original == other.original && self.text == other.text
+      end
+      # Displays the text and the qualifiers.
+      #
+      # e.g. Picky::Query::Token(meier, ["name"])
+      #
+      def to_s
+        "#{self.class}(#{[@text, (@qualifiers.inspect unless @qualifiers.blank?)].compact.join(', ')})"
+      end
+    end
   end
 end

data/lib/picky/query/tokens.rb CHANGED Viewed

@@ -1,101 +1,105 @@
-# encoding: utf-8
-#
-module Query
+module Picky
-  # This class primarily handles switching through similar token constellations.
+  # encoding: utf-8
   #
-  class Tokens # :nodoc:all
+  module Query
-    # Basically delegates to its internal tokens array.
+    # This class primarily handles switching through similar token constellations.
     #
-    self.delegate *[Enumerable.instance_methods, :slice!, :[], :uniq!, :last, :reject!, :length, :size, :empty?, :each, :exit, { :to => :@tokens }].flatten
+    class Tokens # :nodoc:all
-    # Create a new Tokens object with the array of tokens passed in.
-    #
-    def initialize tokens = []
-      @tokens = tokens
-    end
+      # Basically delegates to its internal tokens array.
+      #
+      self.delegate *[Enumerable.instance_methods, :slice!, :[], :uniq!, :last, :reject!, :length, :size, :empty?, :each, :exit, { :to => :@tokens }].flatten
-    # Creates a new Tokens object from a number of Strings.
-    #
-    # Options:
-    #  * downcase: Whether to downcase the passed strings (default is true)
-    #
-    def self.processed words, downcase = true
-      new words.collect! { |word| Token.processed word, downcase }
-    end
+      # Create a new Tokens object with the array of tokens passed in.
+      #
+      def initialize tokens = []
+        @tokens = tokens
+      end
-    # Tokenizes each token.
-    #
-    # Note: Passed tokenizer needs to offer #normalize(text).
-    #
-    def tokenize_with tokenizer
-      @tokens.each { |token| token.tokenize_with(tokenizer) }
-    end
+      # Creates a new Tokens object from a number of Strings.
+      #
+      # Options:
+      #  * downcase: Whether to downcase the passed strings (default is true)
+      #
+      def self.processed words, downcase = true
+        new words.collect! { |word| Token.processed word, downcase }
+      end
-    # Generates an array in the form of
-    # [
-    #  [combination],                           # of token 1
-    #  [combination, combination, combination], # of token 2
-    #  [combination, combination]               # of token 3
-    # ]
-    #
-    def possible_combinations_in index
-      @tokens.inject([]) do |combinations, token|
-        possible_combinations = token.possible_combinations_in index
-        # TODO Could move the ignore_unassigned_tokens here!
-        #
-        # Note: Optimization for ignoring tokens that allocate to nothing and
-        # can be ignored.
-        # For example in a special search, where "florian" is not
-        # mapped to any category.
-        #
-        possible_combinations ? combinations << possible_combinations : combinations
+      # Tokenizes each token.
+      #
+      # Note: Passed tokenizer needs to offer #normalize(text).
+      #
+      def tokenize_with tokenizer
+        @tokens.each { |token| token.tokenize_with(tokenizer) }
       end
-    end
-    # Makes the last of the tokens partial.
-    #
-    def partialize_last
-      @tokens.last.partial = true unless empty?
-    end
+      # Generates an array in the form of
+      # [
+      #  [combination],                           # of token 1
+      #  [combination, combination, combination], # of token 2
+      #  [combination, combination]               # of token 3
+      # ]
+      #
+      def possible_combinations_in index
+        @tokens.inject([]) do |combinations, token|
+          possible_combinations = token.possible_combinations_in index
+          # TODO Could move the ignore_unassigned_tokens here!
+          #
+          # Note: Optimization for ignoring tokens that allocate to nothing and
+          # can be ignored.
+          # For example in a special search, where "florian" is not
+          # mapped to any category.
+          #
+          possible_combinations ? combinations << possible_combinations : combinations
+        end
+      end
-    # Caps the tokens to the maximum.
-    #
-    def cap maximum
-      @tokens.slice!(maximum..-1) if cap?(maximum)
-    end
-    def cap? maximum
-      @tokens.size > maximum
-    end
+      # Makes the last of the tokens partial.
+      #
+      def partialize_last
+        @tokens.last.partial = true unless empty?
+      end
-    # Rejects blank tokens.
-    #
-    def reject
-      @tokens.reject! &:blank?
-    end
+      # Caps the tokens to the maximum.
+      #
+      def cap maximum
+        @tokens.slice!(maximum..-1) if cap?(maximum)
+      end
+      def cap? maximum
+        @tokens.size > maximum
+      end
-    # Returns a solr query.
-    #
-    def to_solr_query
-      @tokens.map(&:to_solr).join ' '
-    end
+      # Rejects blank tokens.
+      #
+      def reject
+        @tokens.reject! &:blank?
+      end
-    #
-    #
-    def originals
-      @tokens.map(&:original)
-    end
+      #
+      #
+      def categorize mapper
+        @tokens.each { |token| token.categorize mapper }
+      end
-    def == other
-      self.tokens == other.tokens
-    end
+      #
+      #
+      def originals
+        @tokens.map(&:original)
+      end
+      def == other
+        self.tokens == other.tokens
+      end
+      # Just join the token original texts.
+      #
+      def to_s
+        originals.join ' '
+      end
-    # Just join the token original texts.
-    #
-    def to_s
-      originals.join ' '
     end
   end

data/lib/picky/query/weights.rb CHANGED Viewed

@@ -1,62 +1,58 @@
-module Query
+module Picky
-  # Calculates weights for certain combinations.
-  #
-  class Weights # :nodoc:all
+  module Query
-    attr_reader :weights
-    #
+    # Calculates weights for certain combinations.
     #
-    def initialize weights = {}
-      @weights = weights
-    end
+    class Weights # :nodoc:all
-    # Get the weight of an allocation.
-    #
-    def weight_for clustered
-      @weights[clustered] || 0
-    end
+      attr_reader :weights
+      delegate :empty?, :to => :weights
-    # Returns an energy term E for allocation. this turns into a probability
-    # by P(allocation) = 1/Z * exp (-1/T * E(allocation)),
-    # where Z is the normalizing partition function
-    # sum_allocations exp(-1/T *E(allocation)), and T is a temperature constant.
-    # If T is high the distribution will be close to equally distributed.
-    # If T is low, the distribution will be the indicator function
-    # for min (E(allocation))…
-    #
-    # ...
-    #
-    # Just kidding. It's far more complicated than that. Ha ha ha ha ;)
-    #
-    # Note: Cache this if more complicated weighings become necessary.
-    #
-    def score combinations
-      # TODO Or hide: combinations#to_weights_key (but it's an array, so…)
       #
-      # TODO combinations could cluster uniq as combinations are added (since combinations don't change).
       #
-      # TODO Or it could use actual combinations? Could it? Or make combinations comparable to Symbols.
+      def initialize weights = {}
+        @weights = weights
+      end
+      # Get the weight of an allocation.
       #
-      weight_for combinations.map(&:category_name).clustered_uniq_fast
-    end
+      def weight_for clustered
+        @weights[clustered] || 0
+      end
+      # Returns an energy term E for allocation. This turns into a probability
+      # by P(allocation) = 1/Z * exp (-1/T * E(allocation)),
+      # where Z is the normalizing partition function
+      # sum_allocations exp(-1/T *E(allocation)), and T is a temperature constant.
+      # If T is high the distribution will be close to equally distributed.
+      # If T is low, the distribution will be the indicator function
+      # for min (E(allocation))…
+      #
+      # ...
+      #
+      # Just kidding. It's far more complicated than that. Ha ha ha ha ;)
+      #
+      # Note: Cache this if more complicated weighings become necessary.
+      #
+      def score combinations
+        # TODO Or it could use actual combinations? Could it? Or make combinations comparable to Symbols.
+        #
+        weight_for combinations.map(&:category_name).clustered_uniq_fast
+      end
-    # Are there any weights defined?
-    #
-    def empty?
-      @weights.empty?
-    end
+      def == other
+        @weights == other.weights
+      end
-    def == other
-      @weights == other.weights
-    end
+      # Prints out a nice representation of the configured weights.
+      #
+      def to_s
+        "#{self.class}(#{@weights})"
+      end
-    # Prints out a nice representation of the configured weights.
-    #
-    def to_s
-      @weights.to_s
     end
   end
 end

data/lib/picky/query.rb CHANGED Viewed

@@ -1,2 +1,6 @@
-module Query # :nodoc:all
+module Picky
+  module Query # :nodoc:all
+  end
 end