RubyGems - picky - Versions diffs - 2.7.0 → 3.0.0.pre1 - Mend

picky 2.7.0 → 3.0.0.pre1

Files changed (213) hide show

data/lib/picky/adapters/rack/base.rb +20 -16
data/lib/picky/adapters/rack/live_parameters.rb +28 -24
data/lib/picky/adapters/rack/search.rb +67 -0
data/lib/picky/adapters/rack.rb +27 -23
data/lib/picky/application.rb +246 -236
data/lib/picky/backend/base.rb +115 -119
data/lib/picky/backend/file/basic.rb +102 -98
data/lib/picky/backend/file/json.rb +27 -23
data/lib/picky/backend/file/marshal.rb +32 -28
data/lib/picky/backend/file/text.rb +45 -41
data/lib/picky/backend/files.rb +19 -15
data/lib/picky/backend/redis/basic.rb +76 -72
data/lib/picky/backend/redis/list_hash.rb +40 -36
data/lib/picky/backend/redis/string_hash.rb +30 -26
data/lib/picky/backend/redis.rb +32 -28
data/lib/picky/bundle.rb +82 -57
data/lib/{bundling.rb → picky/bundling.rb} +0 -0
data/lib/picky/calculations/location.rb +51 -47
data/lib/picky/categories.rb +60 -56
data/lib/picky/categories_indexed.rb +73 -82
data/lib/picky/categories_indexing.rb +12 -8
data/lib/picky/category.rb +109 -120
data/lib/picky/category_indexed.rb +39 -41
data/lib/picky/category_indexing.rb +123 -125
data/lib/picky/character_substituters/west_european.rb +32 -26
data/lib/{constants.rb → picky/constants.rb} +0 -0
data/lib/picky/cores.rb +96 -92
data/lib/{deployment.rb → picky/deployment.rb} +0 -0
data/lib/picky/frontend_adapters/rack.rb +133 -118
data/lib/picky/generators/aliases.rb +5 -3
data/lib/picky/generators/base.rb +11 -7
data/lib/picky/generators/partial/default.rb +7 -3
data/lib/picky/generators/partial/none.rb +24 -20
data/lib/picky/generators/partial/strategy.rb +20 -16
data/lib/picky/generators/partial/substring.rb +94 -90
data/lib/picky/generators/partial_generator.rb +11 -7
data/lib/picky/generators/similarity/default.rb +9 -5
data/lib/picky/generators/similarity/double_metaphone.rb +20 -16
data/lib/picky/generators/similarity/metaphone.rb +20 -16
data/lib/picky/generators/similarity/none.rb +23 -19
data/lib/picky/generators/similarity/phonetic.rb +49 -45
data/lib/picky/generators/similarity/soundex.rb +20 -16
data/lib/picky/generators/similarity/strategy.rb +10 -6
data/lib/picky/generators/similarity_generator.rb +11 -7
data/lib/picky/generators/strategy.rb +14 -10
data/lib/picky/generators/weights/default.rb +9 -5
data/lib/picky/generators/weights/logarithmic.rb +30 -26
data/lib/picky/generators/weights/strategy.rb +10 -6
data/lib/picky/generators/weights_generator.rb +11 -7
data/lib/picky/helpers/measuring.rb +20 -16
data/lib/picky/indexed/bundle/base.rb +39 -37
data/lib/picky/indexed/bundle/memory.rb +68 -64
data/lib/picky/indexed/bundle/redis.rb +73 -69
data/lib/picky/indexed/wrappers/bundle/calculation.rb +26 -22
data/lib/picky/indexed/wrappers/bundle/location.rb +30 -26
data/lib/picky/indexed/wrappers/bundle/wrapper.rb +36 -32
data/lib/picky/indexed/wrappers/category/location.rb +17 -13
data/lib/picky/indexed/wrappers/exact_first.rb +46 -42
data/lib/picky/indexers/base.rb +26 -22
data/lib/picky/indexers/parallel.rb +62 -58
data/lib/picky/indexers/serial.rb +41 -37
data/lib/picky/indexes/index.rb +400 -0
data/lib/picky/indexes/index_indexed.rb +24 -0
data/lib/picky/indexes/index_indexing.rb +138 -0
data/lib/picky/indexes/memory.rb +20 -0
data/lib/picky/indexes/redis.rb +20 -0
data/lib/picky/indexes.rb +68 -61
data/lib/picky/indexes_indexed.rb +16 -12
data/lib/picky/indexes_indexing.rb +41 -37
data/lib/picky/indexing/bundle/base.rb +216 -205
data/lib/picky/indexing/bundle/memory.rb +16 -11
data/lib/picky/indexing/bundle/redis.rb +14 -12
data/lib/picky/indexing/wrappers/category/location.rb +17 -13
data/lib/picky/interfaces/live_parameters.rb +159 -154
data/lib/picky/loader.rb +267 -304
data/lib/picky/loggers/search.rb +20 -13
data/lib/picky/no_source_specified_exception.rb +7 -3
data/lib/picky/performant.rb +6 -2
data/lib/picky/query/allocation.rb +71 -67
data/lib/picky/query/allocations.rb +99 -94
data/lib/picky/query/combination.rb +70 -66
data/lib/picky/query/combinations/base.rb +56 -52
data/lib/picky/query/combinations/memory.rb +36 -32
data/lib/picky/query/combinations/redis.rb +66 -62
data/lib/picky/query/indexes.rb +175 -160
data/lib/picky/query/qualifier_category_mapper.rb +43 -0
data/lib/picky/query/token.rb +165 -172
data/lib/picky/query/tokens.rb +86 -82
data/lib/picky/query/weights.rb +44 -48
data/lib/picky/query.rb +5 -1
data/lib/picky/rack/harakiri.rb +51 -47
data/lib/picky/results.rb +81 -77
data/lib/picky/search.rb +169 -158
data/lib/picky/sinatra.rb +34 -0
data/lib/picky/sources/base.rb +73 -70
data/lib/picky/sources/couch.rb +61 -57
data/lib/picky/sources/csv.rb +68 -64
data/lib/picky/sources/db.rb +139 -135
data/lib/picky/sources/delicious.rb +52 -48
data/lib/picky/sources/mongo.rb +68 -63
data/lib/picky/sources/wrappers/base.rb +20 -16
data/lib/picky/sources/wrappers/location.rb +37 -33
data/lib/picky/statistics.rb +46 -43
data/lib/picky/tasks.rb +3 -0
data/lib/picky/tokenizers/base.rb +192 -187
data/lib/picky/tokenizers/index.rb +25 -21
data/lib/picky/tokenizers/location.rb +33 -29
data/lib/picky/tokenizers/query.rb +49 -43
data/lib/picky.rb +21 -13
data/lib/tasks/application.rake +1 -1
data/lib/tasks/index.rake +3 -3
data/lib/tasks/routes.rake +1 -1
data/lib/tasks/server.rake +1 -1
data/spec/lib/adapters/rack/base_spec.rb +1 -1
data/spec/lib/adapters/rack/live_parameters_spec.rb +1 -1
data/spec/lib/adapters/rack/query_spec.rb +1 -1
data/spec/lib/application_spec.rb +39 -32
data/spec/lib/backend/file/basic_spec.rb +2 -2
data/spec/lib/backend/file/json_spec.rb +2 -2
data/spec/lib/backend/file/marshal_spec.rb +2 -2
data/spec/lib/backend/file/text_spec.rb +1 -1
data/spec/lib/backend/files_spec.rb +14 -24
data/spec/lib/backend/redis/basic_spec.rb +2 -2
data/spec/lib/backend/redis/list_hash_spec.rb +3 -3
data/spec/lib/backend/redis/string_hash_spec.rb +3 -3
data/spec/lib/backend/redis_spec.rb +20 -13
data/spec/lib/calculations/location_spec.rb +1 -1
data/spec/lib/categories_indexed_spec.rb +16 -34
data/spec/lib/category_indexed_spec.rb +9 -27
data/spec/lib/category_indexing_spec.rb +2 -3
data/spec/lib/category_spec.rb +10 -10
data/spec/lib/character_substituters/west_european_spec.rb +6 -5
data/spec/lib/cores_spec.rb +17 -17
data/spec/lib/extensions/symbol_spec.rb +15 -1
data/spec/lib/frontend_adapters/rack_spec.rb +20 -20
data/spec/lib/generators/aliases_spec.rb +3 -3
data/spec/lib/generators/cacher_strategy_spec.rb +1 -1
data/spec/lib/generators/partial/default_spec.rb +3 -3
data/spec/lib/generators/partial/none_spec.rb +2 -2
data/spec/lib/generators/partial/substring_spec.rb +1 -1
data/spec/lib/generators/partial_generator_spec.rb +3 -3
data/spec/lib/generators/similarity/double_metaphone_spec.rb +1 -1
data/spec/lib/generators/similarity/metaphone_spec.rb +1 -1
data/spec/lib/generators/similarity/none_spec.rb +1 -1
data/spec/lib/generators/similarity/phonetic_spec.rb +1 -1
data/spec/lib/generators/similarity/soundex_spec.rb +1 -1
data/spec/lib/generators/similarity_generator_spec.rb +2 -2
data/spec/lib/generators/weights/logarithmic_spec.rb +1 -1
data/spec/lib/generators/weights_generator_spec.rb +1 -1
data/spec/lib/helpers/measuring_spec.rb +2 -2
data/spec/lib/indexed/bundle/memory_spec.rb +6 -6
data/spec/lib/indexed/bundle/redis_spec.rb +4 -4
data/spec/lib/indexed/wrappers/bundle/calculation_spec.rb +2 -3
data/spec/lib/indexed/wrappers/bundle/wrapper_spec.rb +2 -2
data/spec/lib/indexed/wrappers/exact_first_spec.rb +5 -5
data/spec/lib/indexers/base_spec.rb +1 -1
data/spec/lib/indexers/parallel_spec.rb +1 -1
data/spec/lib/indexers/serial_spec.rb +1 -1
data/spec/lib/{index/base_indexed_spec.rb → indexes/index_indexed_spec.rb} +3 -3
data/spec/lib/{index/base_indexing_spec.rb → indexes/index_indexing_spec.rb} +19 -2
data/spec/lib/{index/base_spec.rb → indexes/index_spec.rb} +6 -25
data/spec/lib/{index → indexes}/redis_spec.rb +1 -1
data/spec/lib/indexes_class_spec.rb +2 -2
data/spec/lib/indexes_indexed_spec.rb +1 -1
data/spec/lib/indexes_indexing_spec.rb +1 -1
data/spec/lib/indexes_spec.rb +1 -1
data/spec/lib/indexing/bundle/base_spec.rb +7 -5
data/spec/lib/indexing/bundle/memory_partial_generation_speed_spec.rb +4 -4
data/spec/lib/indexing/bundle/memory_spec.rb +15 -15
data/spec/lib/indexing/bundle/redis_spec.rb +9 -9
data/spec/lib/interfaces/live_parameters_spec.rb +5 -5
data/spec/lib/loader_spec.rb +17 -19
data/spec/lib/loggers/search_spec.rb +2 -2
data/spec/lib/query/allocation_spec.rb +1 -1
data/spec/lib/query/allocations_spec.rb +1 -1
data/spec/lib/query/combination_spec.rb +4 -4
data/spec/lib/query/combinations/base_spec.rb +1 -1
data/spec/lib/query/combinations/memory_spec.rb +1 -1
data/spec/lib/query/combinations/redis_spec.rb +1 -1
data/spec/lib/query/indexes_spec.rb +7 -2
data/spec/lib/query/qualifier_category_mapper_spec.rb +34 -0
data/spec/lib/query/token_spec.rb +32 -53
data/spec/lib/query/tokens_spec.rb +30 -35
data/spec/lib/query/weights_spec.rb +16 -16
data/spec/lib/rack/harakiri_spec.rb +5 -5
data/spec/lib/results_spec.rb +1 -1
data/spec/lib/search_spec.rb +24 -22
data/spec/lib/sinatra_spec.rb +36 -0
data/spec/lib/sources/base_spec.rb +1 -1
data/spec/lib/sources/couch_spec.rb +9 -9
data/spec/lib/sources/csv_spec.rb +7 -7
data/spec/lib/sources/db_spec.rb +2 -2
data/spec/lib/sources/delicious_spec.rb +5 -5
data/spec/lib/sources/mongo_spec.rb +7 -7
data/spec/lib/sources/wrappers/base_spec.rb +2 -2
data/spec/lib/sources/wrappers/location_spec.rb +1 -1
data/spec/lib/statistics_spec.rb +1 -1
data/spec/lib/tokenizers/base_spec.rb +2 -2
data/spec/lib/tokenizers/index_spec.rb +1 -1
data/spec/lib/tokenizers/query_spec.rb +1 -1
metadata +30 -30
data/lib/picky/adapters/rack/query.rb +0 -65
data/lib/picky/index/base.rb +0 -409
data/lib/picky/index/base_indexed.rb +0 -29
data/lib/picky/index/base_indexing.rb +0 -127
data/lib/picky/index/memory.rb +0 -16
data/lib/picky/index/redis.rb +0 -16
data/lib/picky/query/qualifiers.rb +0 -76
data/lib/picky/query/solr.rb +0 -60
data/lib/picky/signals.rb +0 -8
data/lib/picky-tasks.rb +0 -6
data/lib/tasks/spec.rake +0 -11
data/spec/lib/query/qualifiers_spec.rb +0 -31

data/lib/picky/indexes/index.rb ADDED Viewed

@@ -0,0 +1,400 @@
+module Picky
+  # = Picky Indexes
+  #
+  # A Picky Index defines
+  # * where its data comes from (a data source).
+  # * how this data is indexed.
+  # * a number of categories that may or may not map directly to data categories.
+  #
+  # == Howto
+  #
+  # This is a step-by-step description on how to create an index.
+  #
+  # Start by choosing an <tt>Indexes::Memory</tt> or an <tt>Indexes::Redis</tt>.
+  # In the example, we will be using an in-memory index, <tt>Indexes::Memory</tt>.
+  #
+  #   books = Indexes::Memory.new(:books)
+  #
+  # That in itself won't do much good, that's why we add a data source:
+  #
+  #   books = Indexes::Memory.new(:books) do
+  #     source Sources::CSV.new(:title, :author, file: 'data/books.csv')
+  #   end
+  #
+  # In the example, we use an explicit <tt>Sources::CSV</tt> of Picky.
+  # However, anything that responds to <tt>#each</tt>, and returns an object that
+  # answers to <tt>#id</tt>, works.
+  #
+  # For example, a 3.0 ActiveRecord class:
+  #
+  #   books = Indexes::Memory.new(:books) do
+  #     source Book.order('isbn ASC')
+  #   end
+  #
+  # Now we know where the data comes from, but not, how to categorize it.
+  #
+  # Let's add a few categories:
+  #
+  #   books = Indexes::Memory.new(:books) do
+  #     source   Book.order('isbn ASC')
+  #     category :title
+  #     category :author
+  #     category :isbn
+  #   end
+  #
+  # Categories offer quite a few options, see <tt>Indexes::Index#category</tt> for details.
+  #
+  # After adding more options, it might look like this:
+  #
+  #   books = Indexes::Memory.new(:books) do
+  #     source   Book.order('isbn ASC')
+  #     category :title,
+  #              partial: Partial::Substring.new(from: 1),
+  #              similarity: Similarity::DoubleMetaphone.new(3),
+  #              qualifiers: [:t, :title, :titulo]
+  #     category :author,
+  #              similarity: Similarity::Metaphone.new(2)
+  #     category :isbn,
+  #              partial: Partial::None.new,
+  #              from: :legacy_isbn_name
+  #   end
+  #
+  # For this to work, a <tt>Book</tt> should support methods <tt>#title</tt>, <tt>#author</tt> and <tt>#legacy_isbn_name</tt>.
+  #
+  # If it uses <tt>String</tt> ids, use <tt>#key_format</tt> to define a formatting method:
+  #
+  #   books = Indexes::Memory.new(:books) do
+  #     key_format :to_s
+  #     source     Book.order('isbn ASC')
+  #     category   :title
+  #     category   :author
+  #     category   :isbn
+  #   end
+  #
+  # Finally, use the index for a <tt>Search</tt>:
+  #
+  #   route %r{^/media$} => Search.new(books, dvds, mp3s)
+  #
+  class Indexes
+    # This class defines the indexing and index API that is exposed to the user
+    # as the #index method inside the Application class.
+    #
+    # It provides a single front for both indexing and index options. We suggest to always use the index API.
+    #
+    # Note: An Index holds both an *Indexed*::*Index* and an *Indexing*::*Index*.
+    #
+    class Index
+      attr_reader :name,
+                  :categories
+      delegate :[],
+               :each_category,
+               :to => :categories
+      # Create a new index with a given source.
+      #
+      # === Parameters
+      # * name: A name that will be used for the index directory and in the Picky front end.
+      #
+      # === Options
+      # * source: Where the data comes from, e.g. Sources::CSV.new(...). Optional, can be defined in the block using #source.
+      # * result_identifier: Use if you'd like a different identifier/name in the results than the name of the index.
+      # * after_indexing: As of this writing only used in the db source. Executes the given after_indexing as SQL after the indexing process.
+      # * tokenizer: The tokenizer to use for this index. Optional, can be defined in the block using #indexing.
+      # * key_format: The format the ids of this index are in. Optional, can be defined in the block using #key_format.
+      #
+      # Examples:
+      #   my_index = Indexes::Memory.new(:my_index, source: some_source) do
+      #     category :bla
+      #   end
+      #
+      #   my_index = Indexes::Memory.new(:my_index) do
+      #     source   Sources::CSV.new(file: 'data/index.csv')
+      #     category :bla
+      #   end
+      #
+      #
+      def initialize name, options = {}
+        check_name name
+        @name = name.to_sym
+        check_options options
+        @source = options[:source]
+        @after_indexing        = options[:after_indexing]
+        @tokenizer             = options[:tokenizer]
+        @key_format            = options[:key_format]
+        # Indexed.
+        #
+        @result_identifier    = options[:result_identifier] || name
+        # TODO Move ignore_unassigned_tokens to query, somehow.
+        #
+        @categories = Categories.new ignore_unassigned_tokens: (options[:ignore_unassigned_tokens] || false)
+        # Centralized registry.
+        #
+        Indexes.register self
+        #
+        #
+        instance_eval(&Proc.new) if block_given?
+        # Check if any source has been given in the block or the options.
+        #
+        check_source @source
+      end
+      # Default bundles.
+      #
+      def indexing_bundle_class
+        # Memory bundle unless a subclass overrides this method.
+        Indexing::Bundle::Memory
+      end
+      # Counterpart of #indexing_bundle_class for the Indexed namespace.
+      #
+      def indexed_bundle_class
+        # Memory bundle unless a subclass overrides this method.
+        Indexed::Bundle::Memory
+      end
+      # Defines a searchable category on the index.
+      #
+      # === Parameters
+      # * category_name: This identifier is used in the front end, but also to categorize query text. For example, “title:hobbit” will narrow the hobbit query on categories with the identifier :title.
+      #
+      # === Options
+      # * partial: Partial::None.new or Partial::Substring.new(from: starting_char, to: ending_char). Default is Partial::Substring.new(from: -3, to: -1).
+      # * similarity: Similarity::None.new or Similarity::DoubleMetaphone.new(similar_words_searched). Default is Similarity::None.new.
+      # * qualifiers: An array of qualifiers with which you can define which category you’d like to search, for example “title:hobbit” will search for hobbit in just title categories. Example: qualifiers: [:t, :titre, :title] (use it for example with multiple languages). Default is the name of the category.
+      # * qualifier: Convenience option if you just need a single qualifier, see above. Example: qualifier: :title. Default is the name of the category.
+      # * source: Use a different source than the index uses. If you think you need that, there might be a better solution to your problem. Please post to the mailing list first with your application.rb :)
+      # * from: Take the data from the data category with this name. Example: You have a source Sources::CSV.new(:title, file:'some_file.csv') but you want the category to be called differently. Then you use from: define_category(:similar_title, :from => :title).
+      #
+      def category category_name, options = {}
+        new_category = Category.new category_name.to_sym, self, options
+        categories << new_category
+        new_category = yield new_category if block_given?
+        new_category
+      end
+      alias define_category category
+      # Make this category range searchable with a fixed range. If you need other
+      # ranges, define another category with a different range value.
+      #
+      # Example:
+      # You have data values inside 1..100, and you want to have Picky return
+      # not only the results for 47 if you search for 47, but also results for
+      # 45, 46, or 47.2, 48.9, in a range of 2 around 47, so (45..49).
+      #
+      # Then you use:
+      #  ranged_category :values_inside_1_100, 2
+      #
+      # Optionally, you give it a precision value to reduce the error margin
+      # around 47 (Picky is a bit liberal).
+      #   Indexes::Memory.new :range do
+      #     ranged_category :values_inside_1_100, 2, precision: 5
+      #   end
+      #
+      # This will force Picky to maximally be wrong 5% of the given range value
+      # (5% of 2 = 0.1) instead of the default 20% (20% of 2 = 0.4).
+      #
+      # We suggest not to use much more than 5 as a higher precision is more
+      # performance intensive for less and less precision gain.
+      #
+      # == Protip 1
+      #
+      # Create two ranged categories to make an area search:
+      #   Indexes::Memory.new :area do
+      #     ranged_category :x, 1
+      #     ranged_category :y, 1
+      #   end
+      #
+      # Search for it using for example:
+      #   x:133, y:120
+      #
+      # This will search this square area (* = 133, 120: The "search" point entered):
+      #
+      #    132       134
+      #     |         |
+      #   --|---------|-- 121
+      #     |         |
+      #     |    *    |
+      #     |         |
+      #   --|---------|-- 119
+      #     |         |
+      #
+      # Note: The area does not need to be square, but can be rectangular.
+      #
+      # == Protip 2
+      #
+      # Create three ranged categories to make a volume search.
+      #
+      # Or go crazy and use 4 ranged categories for a space/time search! ;)
+      #
+      # === Parameters
+      # * category_name: The category_name as used in #define_category.
+      # * range: The range (in the units of your data values) around the query point where we search for results.
+      #
+      #  -----|<- range  ->*------------|-----
+      #
+      # === Options
+      # * precision: Default is 1 (20% error margin, very fast), up to 5 (5% error margin, slower) makes sense.
+      # * ... all options of #define_category.
+      #
+      def ranged_category category_name, range, options = {}
+        precision = options[:precision] || 1
+        options = { partial: Partial::None.new }.merge options
+        define_category category_name, options do |category|
+          Indexing::Wrappers::Category::Location.install_on category, range, precision
+          Indexed::Wrappers::Category::Location.install_on category, range, precision
+        end
+      end
+      alias define_ranged_category ranged_category
+      # HIGHLY EXPERIMENTAL Not correctly working yet. Try it if you feel "beta".
+      #
+      # Also a range search see #ranged_category, but on the earth's surface.
+      #
+      # Parameters:
+      # * lat_name: The latitude's name as used in #define_category.
+      # * lng_name: The longitude's name as used in #define_category.
+      # * radius: The distance (in km) around the query point which we search for results.
+      #
+      # Note: Picky uses a square, not a circle. That should be ok for most usages.
+      #
+      #  -----------------------------
+      #  |                           |
+      #  |                           |
+      #  |                           |
+      #  |                           |
+      #  |                           |
+      #  |             *<-  radius ->|
+      #  |                           |
+      #  |                           |
+      #  |                           |
+      #  |                           |
+      #  |                           |
+      #  -----------------------------
+      #
+      # Options
+      # * precision: Default 1 (20% error margin, very fast), up to 5 (5% error margin, slower) makes sense.
+      # * lat_from: The data category to take the data for the latitude from.
+      # * lng_from: The data category to take the data for the longitude from.
+      #
+      # TODO Will have to write a wrapper that combines two categories that are
+      #      indexed simultaneously, since lat/lng are correlated.
+      #
+      def geo_categories lat_name, lng_name, radius, options = {} # :nodoc:
+        # Extract lat/lng specific options.
+        #
+        lat_from = options.delete :lat_from
+        lng_from = options.delete :lng_from
+        # One can be a normal ranged_category.
+        #
+        ranged_category lat_name, radius*0.00898312, options.merge(from: lat_from)
+        # The other needs to adapt the radius depending on the one.
+        #
+        # Depending on the latitude, the radius of the longitude
+        # needs to enlarge, the closer we get to the pole.
+        #
+        # In our simplified case, the radius is given as if all the
+        # locations were on the 45 degree line.
+        #
+        # This calculates km -> longitude (degrees).
+        #
+        # A degree on the 45 degree line is equal to ~222.6398 km.
+        # So a km on the 45 degree line is equal to 0.01796624 degrees.
+        #
+        ranged_category lng_name, radius*0.01796624, options.merge(from: lng_from)
+      end
+      alias define_geo_categories geo_categories
+      #
+      # Since this is an API, we fail hard quickly.
+      #
+      # Raises an ArgumentError with usage examples unless the given name
+      # responds to #to_sym.
+      #
+      def check_name name # :nodoc:
+        raise ArgumentError.new(<<-NAME
+  The index identifier (you gave "#{name}") for Indexes::Memory/Indexes::Redis should be a Symbol/String,
+  Examples:
+    Indexes::Memory.new(:my_cool_index) # Recommended
+    Indexes::Redis.new("a-redis-index")
+  NAME
+  ) unless name.respond_to?(:to_sym)
+      end
+      # Raises an ArgumentError unless the given options respond to #[].
+      #
+      # The message explains that a source is no longer passed as the second
+      # parameter. It interpolates the #name reader, so @name has to be set
+      # before this check is called.
+      #
+      def check_options options # :nodoc:
+        raise ArgumentError.new(<<-OPTIONS
+  Sources are not passed in as second parameter for #{self.class.name} anymore, but either
+  * as :source option:
+    #{self.class.name}.new(#{name.inspect}, source: #{options})
+  or
+  * given to the #source method inside the config block:
+    #{self.class.name}.new(#{name.inspect}) do
+      source #{options}
+    end
+  Sorry about that breaking change (in 2.2.0), didn't want to go to 3.0.0 yet!
+  All the best
+    -- Picky
+  OPTIONS
+  ) unless options.respond_to?(:[])
+      end
+      # Raises an ArgumentError unless the given source responds to #each,
+      # #harvest or #call.
+      #
+      # The message lists the constants found in Sources, minus the ones
+      # excluded in the array below.
+      #
+      def check_source source # :nodoc:
+        raise ArgumentError.new(<<-SOURCE
+  The index "#{name}" should use a data source that responds to either the method #each, or the method #harvest, which yields(id, text), OR it can be a lambda/block, returning such a source.
+  Or it could use one of the built-in sources:
+    Sources::#{(Sources.constants - [:Base, :Wrappers, :NoCSVFileGiven, :NoCouchDBGiven]).join(',
+    Sources::')}
+  SOURCE
+  ) unless source.respond_to?(:each) || source.respond_to?(:harvest) || source.respond_to?(:call)
+      end
+      # Returns a multi-line String describing this index: its name and class,
+      # its source and the names of its categories.
+      #
+      # A "result identifier" line is appended only if the result identifier
+      # differs from the index name.
+      #
+      # Note: #indented_to_s is not a core String method; presumably it is a
+      # String extension defined elsewhere in Picky - TODO confirm.
+      #
+      def to_stats # :nodoc:
+        stats = <<-INDEX
+  #{name} (#{self.class}):
+  #{"source:            #{source}".indented_to_s}
+  #{"categories:        #{categories.map(&:name).join(', ')}".indented_to_s}
+  INDEX
+        stats << "  result identifier: \"#{result_identifier}\"".indented_to_s unless result_identifier.to_s == name.to_s
+        stats
+      end
+      # Identifier used for technical output.
+      #
+      def identifier
+        "#{PICKY_ENVIRONMENT}:#{name}"
+      end
+      #
+      #
+      def to_s
+        "#{self.class}(#{name}, result_id: #{result_identifier}, source: #{source}, categories: #{categories})"
+      end
+    end
+  end
+end

data/lib/picky/indexes/index_indexed.rb ADDED Viewed

@@ -0,0 +1,24 @@
+module Picky
+  class Indexes
+    # Reopens Index to add the readers and delegators declared in this file.
+    #
+    # Cache loading, analysis, reindexing and the calculation of possible
+    # combinations are all forwarded to the index's categories.
+    #
+    class Index
+      # Note: @combinator is not assigned anywhere in this file; presumably
+      # it is set elsewhere - TODO confirm.
+      #
+      attr_reader :result_identifier,
+                  :combinator
+      delegate :load_from_cache,
+               :analyze,
+               :reindex,
+               :possible_combinations,
+               :to => :categories
+      # #reload is another name for the delegated #load_from_cache.
+      #
+      alias reload load_from_cache
+    end
+  end
+end

data/lib/picky/indexes/index_indexing.rb ADDED Viewed

@@ -0,0 +1,138 @@
+module Picky
+  class Indexes
+    #
+    #
+    class Index
+      attr_reader :after_indexing,
+                  :bundle_class
+      # Delegators for indexing.
+      #
+      delegate :cache,
+               :check,
+               :clear,
+               :backup,
+               :restore,
+               :to => :categories
+      # Calling index on an index will call index
+      # on every category.
+      #
+      # Decides whether to use a parallel indexer or whether to
+      # delegate to each category to index themselves.
+      #
+      def index
+        if source.respond_to?(:each)
+          check_source_empty
+          index_in_parallel
+        else
+          with_data_snapshot do
+            categories.each &:index
+          end
+        end
+      end
+      # Check if the given enumerable source is empty.
+      #
+      # Note: Checking as early as possible to tell the
+      #       user as early as possible.
+      #
+      def check_source_empty
+        warn %Q{\n\033[1mWarning\033[m, source for index "#{name}" is empty: #{source} (responds true to empty?).\n} if source.respond_to?(:empty?) && source.empty?
+      end
+      # Note: Duplicated in category_indexing.rb.
+      #
+      # Take a data snapshot if the source offers it.
+      #
+      def with_data_snapshot
+        if source.respond_to? :with_snapshot
+          source.with_snapshot(self) do
+            yield
+          end
+        else
+          yield
+        end
+      end
+      # Indexes the categories in parallel.
+      #
+      # Only use where the category does have a #each source defined.
+      #
+      def index_in_parallel
+        indexer = Indexers::Parallel.new self
+        indexer.index categories
+        categories.each &:cache
+      end
+      # Define an index tokenizer on the index.
+      #
+      # The options are passed on unchanged to Tokenizers::Index.new.
+      #
+      def indexing options = {}
+        # Replaces any tokenizer set before, including one given via the
+        # :tokenizer option.
+        @tokenizer = Tokenizers::Index.new options
+      end
+      alias define_indexing indexing
+      # Returns the installed tokenizer or the default.
+      #
+      def tokenizer
+        # Falls back to the tokenizer returned by Indexes.tokenizer when
+        # none has been set on this index.
+        @tokenizer || Indexes.tokenizer
+      end
+      # Define a source on the index.
+      #
+      # Parameter is a source, either one of the standard sources or
+      # anything responding to #each and returning objects that
+      # respond to id and the category names (or the category from option).
+      #
+      def source some_source = nil, &block
+        some_source ||= block
+        some_source ? define_source(some_source) : (@source && extract_source || raise_no_source)
+      end
+      # Extract the actual source if it is wrapped in a time
+      # capsule, i.e. a block/lambda.
+      #
+      # TODO Extract into module.
+      #
+      def extract_source
+        @source = @source.respond_to?(:call) ? @source.call : @source
+      end
+      # Stores the given source (or lambda/block returning one) on the index
+      # and returns it.
+      #
+      def define_source source
+        @source = source
+      end
+      # Raises a NoSourceSpecifiedException whose message names the index and
+      # shows an example of defining a source in the configuration block.
+      #
+      def raise_no_source
+        raise NoSourceSpecifiedException.new(<<-NO_SOURCE
+  No source given for index #{name}. An index needs a source.
+  Example:
+  Indexes::Memory.new(:with_source) do
+    source   Sources::CSV.new(:title, file: 'data/books.csv')
+    category :title
+    category :author
+  end
+        NO_SOURCE
+  )
+      end
+      # Define a key_format on the index.
+      #
+      # Parameter is a method name to use on the key (e.g. :to_i, :to_s, :strip).
+      #
+      def key_format format = nil
+        format ? define_key_format(format) : @key_format
+      end
+      # Stores the given key format on the index and returns it.
+      #
+      def define_key_format key_format
+        @key_format = key_format
+      end
+    end
+  end
+end

data/lib/picky/indexes/memory.rb ADDED Viewed

@@ -0,0 +1,20 @@
+module Picky
+  class Indexes
+    # An index that is persisted in files, loaded at startup and kept in memory at runtime.
+    #
+    # Selects the Memory bundle classes for both the Indexing and the Indexed
+    # namespace.
+    #
+    class Memory < Index
+      def indexing_bundle_class
+        Indexing::Bundle::Memory
+      end
+      def indexed_bundle_class
+        Indexed::Bundle::Memory
+      end
+    end
+  end
+end

data/lib/picky/indexes/redis.rb ADDED Viewed

@@ -0,0 +1,20 @@
+module Picky
+  class Indexes
+    # An index that is persisted in Redis.
+    #
+    # Selects the Redis bundle classes for both the Indexing and the Indexed
+    # namespace.
+    #
+    class Redis < Index
+      def indexing_bundle_class
+        Indexing::Bundle::Redis
+      end
+      def indexed_bundle_class
+        Indexed::Bundle::Redis
+      end
+    end
+  end
+end