isomorfeus-ferret 0.12.0

Files changed (222)
  1. checksums.yaml +7 -0
  2. data/LICENSE +612 -0
  3. data/README.md +44 -0
  4. data/ext/isomorfeus_ferret_ext/benchmark.c +223 -0
  5. data/ext/isomorfeus_ferret_ext/benchmark.h +45 -0
  6. data/ext/isomorfeus_ferret_ext/benchmarks_all.h +25 -0
  7. data/ext/isomorfeus_ferret_ext/bm_bitvector.c +123 -0
  8. data/ext/isomorfeus_ferret_ext/bm_hash.c +118 -0
  9. data/ext/isomorfeus_ferret_ext/bm_micro_string.c +40 -0
  10. data/ext/isomorfeus_ferret_ext/bm_store.c +93 -0
  11. data/ext/isomorfeus_ferret_ext/email.rl +21 -0
  12. data/ext/isomorfeus_ferret_ext/extconf.rb +5 -0
  13. data/ext/isomorfeus_ferret_ext/fio_tmpfile.h +53 -0
  14. data/ext/isomorfeus_ferret_ext/frb_analysis.c +2577 -0
  15. data/ext/isomorfeus_ferret_ext/frb_index.c +3457 -0
  16. data/ext/isomorfeus_ferret_ext/frb_lang.c +9 -0
  17. data/ext/isomorfeus_ferret_ext/frb_lang.h +17 -0
  18. data/ext/isomorfeus_ferret_ext/frb_qparser.c +629 -0
  19. data/ext/isomorfeus_ferret_ext/frb_search.c +4460 -0
  20. data/ext/isomorfeus_ferret_ext/frb_store.c +515 -0
  21. data/ext/isomorfeus_ferret_ext/frb_threading.h +30 -0
  22. data/ext/isomorfeus_ferret_ext/frb_utils.c +1127 -0
  23. data/ext/isomorfeus_ferret_ext/frt_analysis.c +1644 -0
  24. data/ext/isomorfeus_ferret_ext/frt_analysis.h +247 -0
  25. data/ext/isomorfeus_ferret_ext/frt_array.c +124 -0
  26. data/ext/isomorfeus_ferret_ext/frt_array.h +54 -0
  27. data/ext/isomorfeus_ferret_ext/frt_bitvector.c +95 -0
  28. data/ext/isomorfeus_ferret_ext/frt_bitvector.h +586 -0
  29. data/ext/isomorfeus_ferret_ext/frt_compound_io.c +374 -0
  30. data/ext/isomorfeus_ferret_ext/frt_config.h +44 -0
  31. data/ext/isomorfeus_ferret_ext/frt_document.c +134 -0
  32. data/ext/isomorfeus_ferret_ext/frt_document.h +52 -0
  33. data/ext/isomorfeus_ferret_ext/frt_except.c +95 -0
  34. data/ext/isomorfeus_ferret_ext/frt_except.h +188 -0
  35. data/ext/isomorfeus_ferret_ext/frt_field_index.c +233 -0
  36. data/ext/isomorfeus_ferret_ext/frt_field_index.h +42 -0
  37. data/ext/isomorfeus_ferret_ext/frt_filter.c +157 -0
  38. data/ext/isomorfeus_ferret_ext/frt_fs_store.c +502 -0
  39. data/ext/isomorfeus_ferret_ext/frt_global.c +427 -0
  40. data/ext/isomorfeus_ferret_ext/frt_global.h +290 -0
  41. data/ext/isomorfeus_ferret_ext/frt_hash.c +518 -0
  42. data/ext/isomorfeus_ferret_ext/frt_hash.h +466 -0
  43. data/ext/isomorfeus_ferret_ext/frt_hashset.c +191 -0
  44. data/ext/isomorfeus_ferret_ext/frt_hashset.h +206 -0
  45. data/ext/isomorfeus_ferret_ext/frt_helper.c +62 -0
  46. data/ext/isomorfeus_ferret_ext/frt_helper.h +13 -0
  47. data/ext/isomorfeus_ferret_ext/frt_ind.c +353 -0
  48. data/ext/isomorfeus_ferret_ext/frt_ind.h +54 -0
  49. data/ext/isomorfeus_ferret_ext/frt_index.c +6377 -0
  50. data/ext/isomorfeus_ferret_ext/frt_index.h +880 -0
  51. data/ext/isomorfeus_ferret_ext/frt_lang.c +104 -0
  52. data/ext/isomorfeus_ferret_ext/frt_lang.h +44 -0
  53. data/ext/isomorfeus_ferret_ext/frt_mempool.c +87 -0
  54. data/ext/isomorfeus_ferret_ext/frt_mempool.h +33 -0
  55. data/ext/isomorfeus_ferret_ext/frt_multimapper.c +349 -0
  56. data/ext/isomorfeus_ferret_ext/frt_multimapper.h +52 -0
  57. data/ext/isomorfeus_ferret_ext/frt_posh.c +1006 -0
  58. data/ext/isomorfeus_ferret_ext/frt_posh.h +973 -0
  59. data/ext/isomorfeus_ferret_ext/frt_priorityqueue.c +147 -0
  60. data/ext/isomorfeus_ferret_ext/frt_priorityqueue.h +147 -0
  61. data/ext/isomorfeus_ferret_ext/frt_q_boolean.c +1612 -0
  62. data/ext/isomorfeus_ferret_ext/frt_q_const_score.c +157 -0
  63. data/ext/isomorfeus_ferret_ext/frt_q_filtered_query.c +209 -0
  64. data/ext/isomorfeus_ferret_ext/frt_q_fuzzy.c +281 -0
  65. data/ext/isomorfeus_ferret_ext/frt_q_match_all.c +147 -0
  66. data/ext/isomorfeus_ferret_ext/frt_q_multi_term.c +672 -0
  67. data/ext/isomorfeus_ferret_ext/frt_q_parser.c +3084 -0
  68. data/ext/isomorfeus_ferret_ext/frt_q_phrase.c +1182 -0
  69. data/ext/isomorfeus_ferret_ext/frt_q_prefix.c +98 -0
  70. data/ext/isomorfeus_ferret_ext/frt_q_range.c +665 -0
  71. data/ext/isomorfeus_ferret_ext/frt_q_span.c +2386 -0
  72. data/ext/isomorfeus_ferret_ext/frt_q_term.c +311 -0
  73. data/ext/isomorfeus_ferret_ext/frt_q_wildcard.c +166 -0
  74. data/ext/isomorfeus_ferret_ext/frt_ram_store.c +460 -0
  75. data/ext/isomorfeus_ferret_ext/frt_scanner.c +899 -0
  76. data/ext/isomorfeus_ferret_ext/frt_scanner.h +28 -0
  77. data/ext/isomorfeus_ferret_ext/frt_scanner_mb.c +6705 -0
  78. data/ext/isomorfeus_ferret_ext/frt_scanner_utf8.c +4419 -0
  79. data/ext/isomorfeus_ferret_ext/frt_search.c +1824 -0
  80. data/ext/isomorfeus_ferret_ext/frt_search.h +924 -0
  81. data/ext/isomorfeus_ferret_ext/frt_similarity.c +150 -0
  82. data/ext/isomorfeus_ferret_ext/frt_similarity.h +79 -0
  83. data/ext/isomorfeus_ferret_ext/frt_sort.c +796 -0
  84. data/ext/isomorfeus_ferret_ext/frt_stopwords.c +395 -0
  85. data/ext/isomorfeus_ferret_ext/frt_store.c +680 -0
  86. data/ext/isomorfeus_ferret_ext/frt_store.h +789 -0
  87. data/ext/isomorfeus_ferret_ext/frt_term_vectors.c +72 -0
  88. data/ext/isomorfeus_ferret_ext/frt_threading.h +23 -0
  89. data/ext/isomorfeus_ferret_ext/frt_win32.h +54 -0
  90. data/ext/isomorfeus_ferret_ext/isomorfeus_ferret.c +409 -0
  91. data/ext/isomorfeus_ferret_ext/isomorfeus_ferret.h +95 -0
  92. data/ext/isomorfeus_ferret_ext/libstemmer.c +93 -0
  93. data/ext/isomorfeus_ferret_ext/libstemmer.h +73 -0
  94. data/ext/isomorfeus_ferret_ext/q_parser.y +1366 -0
  95. data/ext/isomorfeus_ferret_ext/scanner.h +28 -0
  96. data/ext/isomorfeus_ferret_ext/scanner.in +43 -0
  97. data/ext/isomorfeus_ferret_ext/scanner.rl +84 -0
  98. data/ext/isomorfeus_ferret_ext/scanner_mb.rl +200 -0
  99. data/ext/isomorfeus_ferret_ext/scanner_utf8.rl +85 -0
  100. data/ext/isomorfeus_ferret_ext/stem_ISO_8859_1_danish.c +324 -0
  101. data/ext/isomorfeus_ferret_ext/stem_ISO_8859_1_danish.h +7 -0
  102. data/ext/isomorfeus_ferret_ext/stem_ISO_8859_1_dutch.c +610 -0
  103. data/ext/isomorfeus_ferret_ext/stem_ISO_8859_1_dutch.h +6 -0
  104. data/ext/isomorfeus_ferret_ext/stem_ISO_8859_1_english.c +1104 -0
  105. data/ext/isomorfeus_ferret_ext/stem_ISO_8859_1_english.h +6 -0
  106. data/ext/isomorfeus_ferret_ext/stem_ISO_8859_1_finnish.c +749 -0
  107. data/ext/isomorfeus_ferret_ext/stem_ISO_8859_1_finnish.h +7 -0
  108. data/ext/isomorfeus_ferret_ext/stem_ISO_8859_1_french.c +1233 -0
  109. data/ext/isomorfeus_ferret_ext/stem_ISO_8859_1_french.h +6 -0
  110. data/ext/isomorfeus_ferret_ext/stem_ISO_8859_1_german.c +490 -0
  111. data/ext/isomorfeus_ferret_ext/stem_ISO_8859_1_german.h +6 -0
  112. data/ext/isomorfeus_ferret_ext/stem_ISO_8859_1_hungarian.c +1217 -0
  113. data/ext/isomorfeus_ferret_ext/stem_ISO_8859_1_hungarian.h +7 -0
  114. data/ext/isomorfeus_ferret_ext/stem_ISO_8859_1_italian.c +1052 -0
  115. data/ext/isomorfeus_ferret_ext/stem_ISO_8859_1_italian.h +6 -0
  116. data/ext/isomorfeus_ferret_ext/stem_ISO_8859_1_norwegian.c +283 -0
  117. data/ext/isomorfeus_ferret_ext/stem_ISO_8859_1_norwegian.h +6 -0
  118. data/ext/isomorfeus_ferret_ext/stem_ISO_8859_1_porter.c +735 -0
  119. data/ext/isomorfeus_ferret_ext/stem_ISO_8859_1_porter.h +6 -0
  120. data/ext/isomorfeus_ferret_ext/stem_ISO_8859_1_portuguese.c +1003 -0
  121. data/ext/isomorfeus_ferret_ext/stem_ISO_8859_1_portuguese.h +7 -0
  122. data/ext/isomorfeus_ferret_ext/stem_ISO_8859_1_spanish.c +1079 -0
  123. data/ext/isomorfeus_ferret_ext/stem_ISO_8859_1_spanish.h +6 -0
  124. data/ext/isomorfeus_ferret_ext/stem_ISO_8859_1_swedish.c +293 -0
  125. data/ext/isomorfeus_ferret_ext/stem_ISO_8859_1_swedish.h +6 -0
  126. data/ext/isomorfeus_ferret_ext/stem_ISO_8859_2_romanian.c +984 -0
  127. data/ext/isomorfeus_ferret_ext/stem_ISO_8859_2_romanian.h +6 -0
  128. data/ext/isomorfeus_ferret_ext/stem_KOI8_R_russian.c +686 -0
  129. data/ext/isomorfeus_ferret_ext/stem_KOI8_R_russian.h +6 -0
  130. data/ext/isomorfeus_ferret_ext/stem_UTF_8_danish.c +325 -0
  131. data/ext/isomorfeus_ferret_ext/stem_UTF_8_danish.h +6 -0
  132. data/ext/isomorfeus_ferret_ext/stem_UTF_8_dutch.c +620 -0
  133. data/ext/isomorfeus_ferret_ext/stem_UTF_8_dutch.h +6 -0
  134. data/ext/isomorfeus_ferret_ext/stem_UTF_8_english.c +1111 -0
  135. data/ext/isomorfeus_ferret_ext/stem_UTF_8_english.h +6 -0
  136. data/ext/isomorfeus_ferret_ext/stem_UTF_8_finnish.c +754 -0
  137. data/ext/isomorfeus_ferret_ext/stem_UTF_8_finnish.h +6 -0
  138. data/ext/isomorfeus_ferret_ext/stem_UTF_8_french.c +1242 -0
  139. data/ext/isomorfeus_ferret_ext/stem_UTF_8_french.h +6 -0
  140. data/ext/isomorfeus_ferret_ext/stem_UTF_8_german.c +495 -0
  141. data/ext/isomorfeus_ferret_ext/stem_UTF_8_german.h +6 -0
  142. data/ext/isomorfeus_ferret_ext/stem_UTF_8_hungarian.c +1220 -0
  143. data/ext/isomorfeus_ferret_ext/stem_UTF_8_hungarian.h +6 -0
  144. data/ext/isomorfeus_ferret_ext/stem_UTF_8_italian.c +1059 -0
  145. data/ext/isomorfeus_ferret_ext/stem_UTF_8_italian.h +6 -0
  146. data/ext/isomorfeus_ferret_ext/stem_UTF_8_norwegian.c +285 -0
  147. data/ext/isomorfeus_ferret_ext/stem_UTF_8_norwegian.h +6 -0
  148. data/ext/isomorfeus_ferret_ext/stem_UTF_8_porter.c +741 -0
  149. data/ext/isomorfeus_ferret_ext/stem_UTF_8_porter.h +6 -0
  150. data/ext/isomorfeus_ferret_ext/stem_UTF_8_portuguese.c +1009 -0
  151. data/ext/isomorfeus_ferret_ext/stem_UTF_8_portuguese.h +6 -0
  152. data/ext/isomorfeus_ferret_ext/stem_UTF_8_romanian.c +990 -0
  153. data/ext/isomorfeus_ferret_ext/stem_UTF_8_romanian.h +6 -0
  154. data/ext/isomorfeus_ferret_ext/stem_UTF_8_russian.c +680 -0
  155. data/ext/isomorfeus_ferret_ext/stem_UTF_8_russian.h +6 -0
  156. data/ext/isomorfeus_ferret_ext/stem_UTF_8_spanish.c +1083 -0
  157. data/ext/isomorfeus_ferret_ext/stem_UTF_8_spanish.h +6 -0
  158. data/ext/isomorfeus_ferret_ext/stem_UTF_8_swedish.c +294 -0
  159. data/ext/isomorfeus_ferret_ext/stem_UTF_8_swedish.h +6 -0
  160. data/ext/isomorfeus_ferret_ext/stem_UTF_8_turkish.c +2191 -0
  161. data/ext/isomorfeus_ferret_ext/stem_UTF_8_turkish.h +6 -0
  162. data/ext/isomorfeus_ferret_ext/stem_api.c +66 -0
  163. data/ext/isomorfeus_ferret_ext/stem_api.h +26 -0
  164. data/ext/isomorfeus_ferret_ext/stem_header.h +57 -0
  165. data/ext/isomorfeus_ferret_ext/stem_modules.h +190 -0
  166. data/ext/isomorfeus_ferret_ext/stem_modules.txt +50 -0
  167. data/ext/isomorfeus_ferret_ext/stem_utilities.c +478 -0
  168. data/ext/isomorfeus_ferret_ext/test.c +850 -0
  169. data/ext/isomorfeus_ferret_ext/test.h +416 -0
  170. data/ext/isomorfeus_ferret_ext/test_1710.c +63 -0
  171. data/ext/isomorfeus_ferret_ext/test_analysis.c +1221 -0
  172. data/ext/isomorfeus_ferret_ext/test_array.c +272 -0
  173. data/ext/isomorfeus_ferret_ext/test_bitvector.c +600 -0
  174. data/ext/isomorfeus_ferret_ext/test_compound_io.c +170 -0
  175. data/ext/isomorfeus_ferret_ext/test_document.c +156 -0
  176. data/ext/isomorfeus_ferret_ext/test_except.c +244 -0
  177. data/ext/isomorfeus_ferret_ext/test_fields.c +522 -0
  178. data/ext/isomorfeus_ferret_ext/test_file_deleter.c +185 -0
  179. data/ext/isomorfeus_ferret_ext/test_filter.c +331 -0
  180. data/ext/isomorfeus_ferret_ext/test_fs_store.c +25 -0
  181. data/ext/isomorfeus_ferret_ext/test_global.c +299 -0
  182. data/ext/isomorfeus_ferret_ext/test_hash.c +485 -0
  183. data/ext/isomorfeus_ferret_ext/test_hashset.c +288 -0
  184. data/ext/isomorfeus_ferret_ext/test_helper.c +47 -0
  185. data/ext/isomorfeus_ferret_ext/test_highlighter.c +548 -0
  186. data/ext/isomorfeus_ferret_ext/test_index.c +2323 -0
  187. data/ext/isomorfeus_ferret_ext/test_lang.c +74 -0
  188. data/ext/isomorfeus_ferret_ext/test_mempool.c +102 -0
  189. data/ext/isomorfeus_ferret_ext/test_multimapper.c +64 -0
  190. data/ext/isomorfeus_ferret_ext/test_priorityqueue.c +213 -0
  191. data/ext/isomorfeus_ferret_ext/test_q_const_score.c +84 -0
  192. data/ext/isomorfeus_ferret_ext/test_q_filtered.c +61 -0
  193. data/ext/isomorfeus_ferret_ext/test_q_fuzzy.c +241 -0
  194. data/ext/isomorfeus_ferret_ext/test_q_parser.c +464 -0
  195. data/ext/isomorfeus_ferret_ext/test_q_span.c +575 -0
  196. data/ext/isomorfeus_ferret_ext/test_ram_store.c +77 -0
  197. data/ext/isomorfeus_ferret_ext/test_search.c +1874 -0
  198. data/ext/isomorfeus_ferret_ext/test_segments.c +167 -0
  199. data/ext/isomorfeus_ferret_ext/test_similarity.c +25 -0
  200. data/ext/isomorfeus_ferret_ext/test_sort.c +333 -0
  201. data/ext/isomorfeus_ferret_ext/test_store.c +591 -0
  202. data/ext/isomorfeus_ferret_ext/test_store.h +3 -0
  203. data/ext/isomorfeus_ferret_ext/test_term.c +351 -0
  204. data/ext/isomorfeus_ferret_ext/test_term_vectors.c +373 -0
  205. data/ext/isomorfeus_ferret_ext/test_test.c +83 -0
  206. data/ext/isomorfeus_ferret_ext/test_threading.c +188 -0
  207. data/ext/isomorfeus_ferret_ext/testhelper.c +561 -0
  208. data/ext/isomorfeus_ferret_ext/testhelper.h +25 -0
  209. data/ext/isomorfeus_ferret_ext/tests_all.h +87 -0
  210. data/ext/isomorfeus_ferret_ext/uchar-ucs4.rl +1854 -0
  211. data/ext/isomorfeus_ferret_ext/uchar-utf8.rl +1999 -0
  212. data/ext/isomorfeus_ferret_ext/url.rl +27 -0
  213. data/ext/isomorfeus_ferret_ext/word_list.h +15156 -0
  214. data/lib/isomorfeus/ferret/document.rb +132 -0
  215. data/lib/isomorfeus/ferret/field_symbol.rb +85 -0
  216. data/lib/isomorfeus/ferret/index/field_infos.rb +48 -0
  217. data/lib/isomorfeus/ferret/index/index.rb +970 -0
  218. data/lib/isomorfeus/ferret/monitor.rb +323 -0
  219. data/lib/isomorfeus/ferret/stdlib_patches.rb +151 -0
  220. data/lib/isomorfeus/ferret/version.rb +5 -0
  221. data/lib/isomorfeus-ferret.rb +8 -0
  222. metadata +307 -0
@@ -0,0 +1,970 @@
+ module Isomorfeus
+   module Ferret
+     module Index
+       # This is a simplified interface to the index. See the TUTORIAL for more
+       # information on how to use this class.
+       class Index
+         include Isomorfeus::Ferret::MonitorMixin
+         include Isomorfeus::Ferret::Store
+         include Isomorfeus::Ferret::Search
+
+         attr_reader :options
+
+         # If you create an Index without any options, it'll simply create an index
+         # in memory. But this class is highly configurable and every option that
+         # you can supply to IndexWriter and QueryParser, you can also set here.
+         # Please look at the options for the constructors to these classes.
+         #
+         # === Options
+         #
+         # See;
+         #
+         # * QueryParser
+         # * IndexWriter
+         #
+         # default_input_field:: Default: "id". This specifies the default field
+         #                       that will be used when you add a simple string
+         #                       to the index using #add_document or <<.
+         # id_field::            Default: "id". This field is used as the field to
+         #                       search when doing searches on a term. For
+         #                       example, if you do a lookup by term "cat", ie
+         #                       index["cat"], this will be the field that is
+         #                       searched.
+         # key::                 Default: nil. Expert: This should only be used
+         #                       if you really know what you are doing. Basically
+         #                       you can set a field or an array of fields to be
+         #                       the key for the index. So if you add a document
+         #                       with the same key as an existing document, the
+         #                       existing document will be replaced by the new
+         #                       object. Using a multiple field key will slow
+         #                       down indexing so it should not be done if
+         #                       performance is a concern. A single field key (or
+         #                       id) should be fine however. Also, you must make
+         #                       sure that your key/keys are either untokenized
+         #                       or that they are not broken up by the analyzer.
+         # auto_flush::          Default: false. Set this option to true if you
+         #                       want the index automatically flushed every time
+         #                       you do a write (includes delete) to the index.
+         #                       This is useful if you have multiple processes
+         #                       accessing the index and you don't want lock
+         #                       errors. Setting :auto_flush to true has a huge
+         #                       performance impact so don't use it if you are
+         #                       concerned about performance. In that case you
+         #                       should think about setting up a DRb indexing
+         #                       service.
+         # lock_retry_time::     Default: 2 seconds. This parameter specifies how
+         #                       long to wait before retrying to obtain the
+         #                       commit lock when detecting if the IndexReader is
+         #                       at the latest version.
+         # close_dir::           Default: false. If you explicitly pass a
+         #                       Directory object to this class and you want
+         #                       Index to close it when it is closed itself then
+         #                       set this to true.
+         # use_typed_range_query:: Default: true. Use TypedRangeQuery instead of
+         #                       the standard RangeQuery when parsing
+         #                       range queries. This is useful if you have number
+         #                       fields which you want to perform range queries
+         #                       on. You won't need to pad or normalize the data
+         #                       in the field in any way to get correct results.
+         #                       However, performance will be a lot slower for
+         #                       large indexes, hence the default.
+         #
+         # == Examples
+         #
+         #   index = Index::Index.new(:analyzer => WhiteSpaceAnalyzer.new())
+         #
+         #   index = Index::Index.new(:path => '/path/to/index',
+         #                            :create_if_missing => false,
+         #                            :auto_flush => true)
+         #
+         #   index = Index::Index.new(:dir => directory,
+         #                            :default_slop => 2,
+         #                            :handle_parse_errors => false)
+         #
+         # You can also pass a block if you like. The index will be yielded and
+         # closed at the end of the block. For example;
+         #
+         #   Ferret::I.new() do |index|
+         #     # do stuff with index. Most of your actions will be cached.
+         #   end
+         def initialize(options = {}, &block)
+           super()
+
+           if options[:key]
+             @key = options[:key]
+             if @key.is_a?(Array)
+               @key = @key.flatten.map {|k| k.to_s.intern}
+             end
+           else
+             @key = nil
+           end
+
+           if (fi = options[:field_infos]).is_a?(String)
+             options[:field_infos] = Isomorfeus::Ferret::Index::FieldInfos.load(fi)
+           end
+
+           @close_dir = options[:close_dir]
+           if options[:dir].is_a?(String)
+             options[:path] = options[:dir]
+           end
+           if options[:path]
+             @close_dir = true
+             begin
+               @dir = FSDirectory.new(options[:path], options[:create])
+             rescue IOError
+               @dir = FSDirectory.new(options[:path],
+                                      options[:create_if_missing] != false)
+             end
+           elsif options[:dir]
+             @dir = options[:dir]
+           else
+             options[:create] = true # this should always be true for a new RAMDir
+             @close_dir = true
+             @dir = RAMDirectory.new
+           end
+
+           @dir.extend(MonitorMixin) unless @dir.kind_of? MonitorMixin
+           options[:dir] = @dir
+           options[:lock_retry_time] ||= 2
+           @options = options
+           if (!@dir.exists?("segments")) || options[:create]
+             IndexWriter.new(options).close
+           end
+           options[:analyzer] ||= Ferret::Analysis::StandardAnalyzer.new
+           if options[:use_typed_range_query].nil?
+             options[:use_typed_range_query] = true
+           end
+
+           @searcher = nil
+           @writer = nil
+           @reader = nil
+
+           @options.delete(:create) # only create the first time if at all
+           @auto_flush = @options[:auto_flush] || false
+           if (@options[:id_field].nil? and @key.is_a?(Symbol))
+             @id_field = @key
+           else
+             @id_field = @options[:id_field] || :id
+           end
+           @default_field = (@options[:default_field] ||= :*)
+           @default_input_field = options[:default_input_field] || @id_field
+
+           if @default_input_field.respond_to?(:intern)
+             @default_input_field = @default_input_field.intern
+           end
+           @open = true
+           @qp = nil
+           if block
+             yield self
+             self.close
+           end
+         end
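For illustration, a constructor sketch based only on the options documented above; the path and field values are made up, and the gem is assumed to be loaded via its top-level require:

    require 'isomorfeus-ferret'

    # on-disk index, keyed by :id, flushed after every write
    index = Isomorfeus::Ferret::Index::Index.new(
      :path       => '/path/to/index',
      :key        => :id,
      :auto_flush => true
    )

    # or purely in memory, closed automatically at the end of the block
    Isomorfeus::Ferret::I.new do |mem_index|
      mem_index << {:id => '1', :content => 'hello world'}
    end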
+
+         # Returns an array of strings with the matches highlighted. The +query+ can
+         # either be a query String or a Ferret::Search::Query object. The doc_id is
+         # the id of the document you want to highlight (usually returned by the
+         # search methods). There are also a number of options you can pass;
+         #
+         # === Options
+         #
+         # field::          Default: @options[:default_field]. The default_field
+         #                  is the field that is usually highlighted but you can
+         #                  specify which field you want to highlight here. If
+         #                  you want to highlight multiple fields then you will
+         #                  need to call this method multiple times.
+         # excerpt_length:: Default: 150. Length of excerpt to show. Highlighted
+         #                  terms will be in the centre of the excerpt. Set to
+         #                  :all to highlight the entire field.
+         # num_excerpts::   Default: 2. Number of excerpts to return.
+         # pre_tag::        Default: "<b>". Tag to place to the left of the
+         #                  match. You'll probably want to change this to a
+         #                  "<span>" tag with a class. Try "\033[36m" for use in
+         #                  a terminal.
+         # post_tag::       Default: "</b>". This tag should close the
+         #                  +:pre_tag+. Try tag "\033[m" in the terminal.
+         # ellipsis::       Default: "...". This is the string that is appended
+         #                  at the beginning and end of excerpts (unless the
+         #                  excerpt hits the start or end of the field).
+         #                  Alternatively you may want to use the HTML entity
+         #                  &#8230; or the UTF-8 string "\342\200\246".
+         def highlight(query, doc_id, options = {})
+           @dir.synchronize do
+             ensure_searcher_open()
+             @searcher.highlight(do_process_query(query),
+                                 doc_id,
+                                 options[:field] || @options[:default_field],
+                                 options)
+           end
+         end
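A hedged usage sketch of highlight: the query, document number and :content field are hypothetical, and the field is assumed to have been indexed so that excerpts can be built from it:

    excerpts = index.highlight('content:ferret', 0,
                               :field          => :content,
                               :excerpt_length => 60,
                               :num_excerpts   => 1,
                               :pre_tag        => '<span class="hit">',
                               :post_tag       => '</span>')
    # => array of excerpt strings with the matches wrapped in the given tags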
+
+         # Closes this index by closing its associated reader and writer objects.
+         def close
+           @dir.synchronize do
+             if not @open
+               raise(StandardError, "tried to close an already closed directory")
+             end
+             @searcher.close() if @searcher
+             @reader.close() if @reader
+             @writer.close() if @writer
+             @dir.close() if @close_dir
+
+             @open = false
+           end
+         end
+
+         # Get the reader for this index.
+         # NOTE:: This will close the writer from this index.
+         def reader
+           ensure_reader_open()
+           return @reader
+         end
+
+         # Get the searcher for this index.
+         # NOTE:: This will close the writer from this index.
+         def searcher
+           ensure_searcher_open()
+           return @searcher
+         end
+
+         # Get the writer for this index.
+         # NOTE:: This will close the reader from this index.
+         def writer
+           ensure_writer_open()
+           return @writer
+         end
+
+         # Adds a document to this index, using the provided analyzer instead of
+         # the local analyzer if provided. If the document contains more than
+         # IndexWriter::MAX_FIELD_LENGTH terms for a given field, the remainder are
+         # discarded.
+         #
+         # There are three ways to add a document to the index.
+         # To add a document you can simply add a string or an array of strings.
+         # This will store all the strings in the "" (ie empty string) field
+         # (unless you specify the default_field when you create the index).
+         #
+         #   index << "This is a new document to be indexed"
+         #   index << ["And here", "is another", "new document", "to be indexed"]
+         #
+         # But these are pretty simple documents. If this is all you want to index
+         # you could probably just use SimpleSearch. So let's give our documents
+         # some fields;
+         #
+         #   index << {:title => "Programming Ruby", :content => "blah blah blah"}
+         #   index << {:title => "Programming Ruby", :content => "yada yada yada"}
+         #
+         # Or if you are indexing data stored in a database, you'll probably want
+         # to store the id;
+         #
+         #   index << {:id => row.id, :title => row.title, :date => row.date}
+         #
+         # See FieldInfos for more information on how to set field properties.
+         def add_document(doc, analyzer = nil)
+           @dir.synchronize do
+             ensure_writer_open()
+             if doc.is_a?(String) or doc.is_a?(Array)
+               doc = {@default_input_field => doc}
+             end
+
+             # delete existing documents with the same key
+             if @key
+               if @key.is_a?(Array)
+                 query = @key.inject(BooleanQuery.new()) do |bq, field|
+                   bq.add_query(TermQuery.new(field, doc[field].to_s), :must)
+                   bq
+                 end
+                 query_delete(query)
+               else
+                 id = doc[@key].to_s
+                 if id
+                   @writer.delete(@key, id)
+                 end
+               end
+             end
+             ensure_writer_open()
+
+             if analyzer
+               old_analyzer = @writer.analyzer
+               @writer.analyzer = analyzer
+               @writer.add_document(doc)
+               @writer.analyzer = old_analyzer
+             else
+               @writer.add_document(doc)
+             end
+
+             flush() if @auto_flush
+           end
+         end
+         alias :<< :add_document
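The three input forms described above, side by side (the field values are invented); the last call shows the optional per-call analyzer, whose class name is assumed from the constructor example earlier in this file:

    index << "a plain string stored in the default input field"
    index << ["an", "array", "of", "strings"]
    index << {:id => '42', :title => 'Programming Ruby', :content => 'blah'}
    index.add_document({:id => '43', :content => 'one-off analyzer'},
                       Isomorfeus::Ferret::Analysis::WhiteSpaceAnalyzer.new)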
+
+         # Run a query through the Searcher on the index. A TopDocs object is
+         # returned with the relevant results. The +query+ is a built in Query
+         # object or a query string that can be parsed by the Ferret::QueryParser.
+         # Here are the options;
+         #
+         # === Options
+         #
+         # offset::      Default: 0. The offset of the start of the section of the
+         #               result-set to return. This is used for paging through
+         #               results. Let's say you have a page size of 10. If you
+         #               don't find the result you want among the first 10 results
+         #               then set +:offset+ to 10 and look at the next 10 results,
+         #               then 20 and so on.
+         # limit::       Default: 10. This is the number of results you want
+         #               returned, also called the page size. Set +:limit+ to
+         #               +:all+ to return all results.
+         # sort::        A Sort object or sort string describing how the field
+         #               should be sorted. A sort string is made up of field names
+         #               which cannot contain spaces and the word "DESC" if you
+         #               want the field reversed, all separated by commas. For
+         #               example; "rating DESC, author, title". Note that Ferret
+         #               will try to determine a field's type by looking at the
+         #               first term in the index and seeing if it can be parsed as
+         #               an integer or a float. Keep this in mind as you may need
+         #               to specify a field's type to sort it correctly. For more
+         #               on this, see the documentation for SortField
+         # filter::      a Filter object to filter the search results with
+         # filter_proc:: a filter Proc is a Proc which takes the doc_id, the score
+         #               and the Searcher object as its parameters and returns a
+         #               Boolean value specifying whether the result should be
+         #               included in the result set.
+         def search(query, options = {})
+           @dir.synchronize do
+             return do_search(query, options)
+           end
+         end
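A paging sketch using the options above; it assumes Ferret's usual TopDocs interface (a total_hits count plus a hits array whose entries carry doc and score), which is not shown in this file:

    top_docs = index.search('title:ruby',
                            :offset => 20,                    # third page of ten
                            :limit  => 10,
                            :sort   => 'rating DESC, title')
    puts "#{top_docs.total_hits} documents matched"
    top_docs.hits.each {|hit| puts "doc #{hit.doc} scored #{hit.score}" }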
+
+         # Run a query through the Searcher on the index. A TopDocs object is
+         # returned with the relevant results. The +query+ is a Query object or a
+         # query string that can be validly parsed by the Ferret::QueryParser. The
+         # Searcher#search_each method yields the internal document id (used to
+         # reference documents in the Searcher object like this;
+         # +searcher[doc_id]+) and the search score for that document. It is
+         # possible for the score to be greater than 1.0 for some queries once
+         # boosts are taken into account. This method will also normalize scores to
+         # the range 0.0..1.0 when the max-score is greater than 1.0. Here are the
+         # options;
+         #
+         # === Options
+         #
+         # offset::      Default: 0. The offset of the start of the section of the
+         #               result-set to return. This is used for paging through
+         #               results. Let's say you have a page size of 10. If you
+         #               don't find the result you want among the first 10 results
+         #               then set +:offset+ to 10 and look at the next 10 results,
+         #               then 20 and so on.
+         # limit::       Default: 10. This is the number of results you want
+         #               returned, also called the page size. Set +:limit+ to
+         #               +:all+ to return all results.
+         # sort::        A Sort object or sort string describing how the field
+         #               should be sorted. A sort string is made up of field names
+         #               which cannot contain spaces and the word "DESC" if you
+         #               want the field reversed, all separated by commas. For
+         #               example; "rating DESC, author, title". Note that Ferret
+         #               will try to determine a field's type by looking at the
+         #               first term in the index and seeing if it can be parsed as
+         #               an integer or a float. Keep this in mind as you may need
+         #               to specify a field's type to sort it correctly. For more
+         #               on this, see the documentation for SortField
+         # filter::      a Filter object to filter the search results with
+         # filter_proc:: a filter Proc is a Proc which takes the doc_id, the score
+         #               and the Searcher object as its parameters and returns a
+         #               Boolean value specifying whether the result should be
+         #               included in the result set.
+         #
+         # returns:: The total number of hits.
+         #
+         # === Example
+         # eg.
+         #   index.search_each(query, options = {}) do |doc, score|
+         #     puts "hit document number #{doc} with a score of #{score}"
+         #   end
+         #
+         def search_each(query, options = {}) # :yield: doc, score
+           @dir.synchronize do
+             ensure_searcher_open()
+             query = do_process_query(query)
+
+             @searcher.search_each(query, options) do |doc, score|
+               yield doc, score
+             end
+           end
+         end
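As an example of the :filter_proc option described above, hits can be post-filtered on a stored field; the :status field and query are hypothetical:

    only_published = lambda do |doc_id, score, searcher|
      searcher[doc_id][:status] == 'published'
    end

    index.search_each('content:ferret', :filter_proc => only_published) do |doc, score|
      puts "hit #{doc} with score #{score}"
    end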
+
+         # Run a query through the Searcher on the index, ignoring scoring and
+         # starting at +:start_doc+ and stopping when +:limit+ matches have been
+         # found. It returns an array of the matching document numbers.
+         #
+         # There is a big performance advantage when using this search method on a
+         # very large index when there are potentially thousands of matching
+         # documents and you only want say 50 of them. The other search methods need
+         # to look at every single match to decide which one has the highest score.
+         # This search method just needs to find +:limit+ number of matches before
+         # it returns.
+         #
+         # === Options
+         #
+         # start_doc:: Default: 0. The start document to start the search from.
+         #             NOTE very carefully that this is not the same as the
+         #             +:offset+ parameter used in the other search methods
+         #             which refers to the offset in the result-set. This is the
+         #             document to start the scan from. So if you are scanning
+         #             through the index in increments of 50 documents at a time
+         #             you need to use the last matched doc in the previous
+         #             search to start your next search. See the example below.
+         # limit::     Default: 50. This is the number of results you want
+         #             returned, also called the page size. Set +:limit+ to
+         #             +:all+ to return all results.
+         # TODO: add option to return loaded documents instead
+         #
+         # === Example
+         #
+         #   start_doc = 0
+         #   begin
+         #     results = @searcher.scan(query, :start_doc => start_doc)
+         #     yield results # or do something with them
+         #     start_doc = results.last
+         #     # start_doc will be nil now if results is empty, ie no more matches
+         #   end while start_doc
+         def scan(query, options = {})
+           @dir.synchronize do
+             ensure_searcher_open()
+             query = do_process_query(query)
+
+             @searcher.scan(query, options)
+           end
+         end
+
+         # Retrieves a document/documents from the index. The method for retrieval
+         # depends on the type of the argument passed.
+         #
+         # If +arg+ is an Integer then return the document based on the internal
+         # document number.
+         #
+         # If +arg+ is a Range, then return the documents within the range based on
+         # internal document number.
+         #
+         # If +arg+ is a String then search for the first document with +arg+ in
+         # the +id+ field. The +id+ field is either :id or whatever you set
+         # +:id_field+ parameter to when you create the Index object.
+         def doc(*arg)
+           @dir.synchronize do
+             id = arg[0]
+             if id.kind_of?(String) or id.kind_of?(Symbol)
+               ensure_reader_open()
+               term_doc_enum = @reader.term_docs_for(@id_field, id.to_s)
+               return term_doc_enum.next? ? @reader[term_doc_enum.doc] : nil
+             else
+               ensure_reader_open(false)
+               return @reader[*arg]
+             end
+           end
+         end
+         alias :[] :doc
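The three lookup styles described above, in short (the document ids are invented):

    index[0]          # by internal document number
    index[0...5]      # a Range of internal document numbers
    index['42']       # first document whose :id_field contains the term "42"
    index['42'][:title] if index['42']   # read a stored field from the result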
+
+         # Retrieves the term_vector for a document. The document can be referenced
+         # by either a string id to match the id field or an integer corresponding
+         # to Ferret's document number.
+         #
+         # See Ferret::Index::IndexReader#term_vector
+         def term_vector(id, field)
+           @dir.synchronize do
+             ensure_reader_open()
+             if id.kind_of?(String) or id.kind_of?(Symbol)
+               term_doc_enum = @reader.term_docs_for(@id_field, id.to_s)
+               if term_doc_enum.next?
+                 id = term_doc_enum.doc
+               else
+                 return nil
+               end
+             end
+             return @reader.term_vector(id, field)
+           end
+         end
+
+         # iterate through all documents in the index. This method preloads the
+         # documents so you don't need to call #load on the document to load all the
+         # fields.
+         def each
+           @dir.synchronize do
+             ensure_reader_open
+             (0...@reader.max_doc).each do |i|
+               yield @reader[i].load unless @reader.deleted?(i)
+             end
+           end
+         end
+
+         # Deletes a document/documents from the index. The method for determining
+         # the document to delete depends on the type of the argument passed.
+         #
+         # If +arg+ is an Integer then delete the document based on the internal
+         # document number. Will raise an error if the document does not exist.
+         #
+         # If +arg+ is a String then search for the documents with +arg+ in the
+         # +id+ field. The +id+ field is either :id or whatever you set +:id_field+
+         # parameter to when you create the Index object. Will fail quietly if no
+         # document exists.
+         #
+         # If +arg+ is a Hash or an Array then a batch delete will be performed.
+         # If +arg+ is an Array then it will be considered an array of +id+'s. If
+         # it is a Hash, then its keys will be used instead as the Array of
+         # document +id+'s. If the +id+ is an Integer then it is considered a
+         # Ferret document number and the corresponding document will be deleted.
+         # If the +id+ is a String or a Symbol then the +id+ will be considered a
+         # term and the documents that contain that term in the +:id_field+ will be
+         # deleted.
+         def delete(arg)
+           @dir.synchronize do
+             if arg.is_a?(String) or arg.is_a?(Symbol)
+               ensure_writer_open()
+               @writer.delete(@id_field, arg.to_s)
+             elsif arg.is_a?(Integer)
+               ensure_reader_open()
+               _cnt = @reader.delete(arg)
+             elsif arg.is_a?(Hash) or arg.is_a?(Array)
+               batch_delete(arg)
+             else
+               raise ArgumentError, "Cannot delete for arg of type #{arg.class}"
+             end
+             flush() if @auto_flush
+           end
+           return self
+         end
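The accepted argument types for delete, following the description above (ids are invented):

    index.delete(7)                # internal document number
    index.delete('42')             # term in the :id_field
    index.delete(['42', '43', 7])  # batch: id terms and document numbers mixed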
+
+         # Delete all documents returned by the query.
+         #
+         # query:: The query to find documents you wish to delete. Can either be a
+         #         string (in which case it is parsed by the standard query parser)
+         #         or an actual query object.
+         def query_delete(query)
+           @dir.synchronize do
+             ensure_writer_open()
+             ensure_searcher_open()
+             query = do_process_query(query)
+             @searcher.search_each(query, :limit => :all) do |doc, score|
+               @reader.delete(doc)
+             end
+             flush() if @auto_flush
+           end
+         end
+
+         # Returns true if document +n+ has been deleted
+         def deleted?(n)
+           @dir.synchronize do
+             ensure_reader_open()
+             return @reader.deleted?(n)
+           end
+         end
+
+         # Update the document referenced by the document number +id+ if +id+ is an
+         # integer or all of the documents which have the term +id+ if +id+ is a
+         # term. For batch updates of a set of documents, see batch_update, which
+         # performs better.
+         #
+         # id::      The number of the document to update. Can also be a string
+         #           representing the value in the +id+ field. Also consider using
+         #           the :key attribute.
+         # new_doc:: The document to replace the old document with
+         def update(id, new_doc)
+           @dir.synchronize do
+             ensure_writer_open()
+             delete(id)
+             if id.is_a?(String) or id.is_a?(Symbol)
+               @writer.commit
+             else
+               ensure_writer_open()
+             end
+             @writer << new_doc
+             flush() if @auto_flush
+           end
+         end
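A small sketch of update; '26' is assumed to be a value stored in the :id_field. Note that update replaces the whole document (delete then add), whereas query_update further below merges new field values into the existing document:

    index.update('26', :id => '26', :title => 'Babylon', :artist => 'David Gray')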
+
+         # Batch updates the documents in an index. You can pass either a Hash or
+         # an Array.
+         #
+         # === Array (recommended)
+         #
+         # If you pass an Array then each value needs to be a Document or a Hash
+         # and each of those documents must have an +:id_field+ which will be used
+         # to delete the old document that this document is replacing.
+         #
+         # === Hash
+         #
+         # If you pass a Hash then the keys of the Hash will be considered the
+         # +id+'s and the values will be the new documents to replace the old ones
+         # with. If the +id+ is an Integer then it is considered a Ferret document
+         # number and the corresponding document will be deleted. If the +id+ is a
+         # String or a Symbol then the +id+ will be considered a term and the
+         # documents that contain that term in the +:id_field+ will be deleted.
+         #
+         # Note: No error will be raised if the document does not currently
+         # exist. A new document will simply be created.
+         #
+         # == Examples
+         #
+         #   # will replace the documents with the +id+'s id:133 and id:253
+         #   @index.batch_update({
+         #     '133' => {:id => '133', :content => 'yada yada yada'},
+         #     '253' => {:id => '253', :content => 'bla bla bal'}
+         #   })
+         #
+         #   # will replace the documents with the Ferret Document numbers 2 and 92
+         #   @index.batch_update({
+         #     2 => {:id => '133', :content => 'yada yada yada'},
+         #     92 => {:id => '253', :content => 'bla bla bal'}
+         #   })
+         #
+         #   # will replace the documents with the +id+'s id:133 and id:253
+         #   # this is recommended as it guarantees no duplicate keys
+         #   @index.batch_update([
+         #     {:id => '133', :content => 'yada yada yada'},
+         #     {:id => '253', :content => 'bla bla bal'}
+         #   ])
+         #
+         # docs:: A Hash of id/document pairs. The set of documents to be updated
+         def batch_update(docs)
+           @dir.synchronize do
+             ids = nil
+             case docs
+             when Array
+               ids = docs.collect{|doc| doc[@id_field].to_s}
+               if ids.include?(nil)
+                 raise ArgumentError, "all documents must have an #{@id_field} field when doing a batch update"
+               end
+             when Hash
+               ids = docs.keys
+               docs = docs.values
+             else
+               raise ArgumentError, "must pass Hash or Array, not #{docs.class}"
+             end
+             batch_delete(ids)
+             ensure_writer_open()
+             docs.each {|new_doc| @writer << new_doc }
+             flush()
+           end
+         end
+
+
+         # Update all the documents returned by the query.
+         #
+         # query::   The query to find documents you wish to update. Can either be
+         #           a string (in which case it is parsed by the standard query
+         #           parser) or an actual query object.
+         # new_val:: The values we are updating. This can be a string in which case
+         #           the default field is updated, or it can be a hash, in which
+         #           case, all fields in the hash are merged into the old hash.
+         #           That is, the old fields are replaced by values in the new hash
+         #           if they exist.
+         #
+         # === Example
+         #
+         #   index << {:id => "26", :title => "Babylon", :artist => "David Grey"}
+         #   index << {:id => "29", :title => "My Oh My", :artist => "David Grey"}
+         #
+         #   # correct the artist's name
+         #   index.query_update('artist:"David Grey"', {:artist => "David Gray"})
+         #
+         #   index["26"]
+         #   #=> {:id => "26", :title => "Babylon", :artist => "David Gray"}
+         #   index["29"]
+         #   #=> {:id => "29", :title => "My Oh My", :artist => "David Gray"}
+         #
+         def query_update(query, new_val)
+           @dir.synchronize do
+             ensure_writer_open()
+             ensure_searcher_open()
+             docs_to_add = []
+             query = do_process_query(query)
+             @searcher.search_each(query, :limit => :all) do |id, score|
+               document = @searcher[id].load
+               if new_val.is_a?(Hash)
+                 document.merge!(new_val)
+               elsif new_val.is_a?(String) or new_val.is_a?(Symbol)
+                 document[@default_input_field] = new_val.to_s
+               end
+               docs_to_add << document
+               @reader.delete(id)
+             end
+             ensure_writer_open()
+             docs_to_add.each {|doc| @writer << doc }
+             flush() if @auto_flush
+           end
+         end
+
+         # Returns true if any documents have been deleted since the index was last
+         # flushed.
+         def has_deletions?()
+           @dir.synchronize do
+             ensure_reader_open()
+             return @reader.has_deletions?
+           end
+         end
+
+         # Flushes all writes to the index. This will not optimize the index but it
+         # will make sure that all writes are written to it.
+         #
+         # NOTE: this is not necessary if you are only using this class. All writes
+         # will automatically flush when you perform an operation that reads the
+         # index.
+         def flush()
+           @dir.synchronize do
+             if @reader
+               if @searcher
+                 @searcher.close
+                 @searcher = nil
+               end
+               @reader.commit
+             elsif @writer
+               @writer.close
+               @writer = nil
+             end
+           end
+         end
+         alias :commit :flush
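With :auto_flush left at its default of false, other processes only see writes after an explicit flush; within this class a read operation reopens the reader automatically, as the NOTE above says. A minimal sketch:

    index << {:id => '1', :content => 'first draft'}
    index << {:id => '2', :content => 'second draft'}
    index.flush   # aliased as commit; both documents are now visible to other readers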
+
+         # optimizes the index. This should only be called when the index will no
+         # longer be updated very often, but will be read a lot.
+         def optimize()
+           @dir.synchronize do
+             ensure_writer_open()
+             @writer.optimize()
+             @writer.close()
+             @writer = nil
+           end
+         end
+
+         # returns the number of documents in the index
+         def size()
+           @dir.synchronize do
+             ensure_reader_open()
+             return @reader.num_docs()
+           end
+         end
+
+         # Merges all segments from an index or an array of indexes into this
+         # index. You can pass a single Index::Index, IndexReader,
+         # Store::Directory or an array of any single one of these.
+         #
+         # This may be used to parallelize batch indexing. A large document
+         # collection can be broken into sub-collections. Each sub-collection can
+         # be indexed in parallel, on a different thread, process or machine and
+         # perhaps all in memory. The complete index can then be created by
+         # merging sub-collection indexes with this method.
+         #
+         # After this completes, the index is optimized.
+         def add_indexes(indexes)
+           @dir.synchronize do
+             ensure_writer_open()
+             indexes = [indexes].flatten # make sure we have an array
+             return if indexes.size == 0 # nothing to do
+             if indexes[0].is_a?(Index)
+               indexes.delete(self) # don't merge with self
+               indexes = indexes.map {|index| index.reader }
+             elsif indexes[0].is_a?(Ferret::Store::Directory)
+               indexes.delete(@dir) # don't merge with self
+               indexes = indexes.map {|dir| IndexReader.new(dir) }
+             elsif indexes[0].is_a?(IndexReader)
+               indexes.delete(@reader) # don't merge with self
+             else
+               raise ArgumentError, "Unknown index type when trying to merge indexes"
+             end
+             ensure_writer_open
+             @writer.add_readers(indexes)
+           end
+         end
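A sketch of the merge workflow described above: two sub-indexes built independently (here in memory, with made-up documents) and merged into one:

    part_a = Isomorfeus::Ferret::I.new
    part_b = Isomorfeus::Ferret::I.new
    part_a << {:id => '1', :content => 'first half of the collection'}
    part_b << {:id => '2', :content => 'second half of the collection'}

    combined = Isomorfeus::Ferret::I.new
    combined.add_indexes([part_a, part_b])
    combined.size   #=> 2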
+
+         # This is a simple utility method for saving an in memory or RAM index to
+         # the file system. The same thing can be achieved by using the
+         # Index::Index#add_indexes method and you will have more options when
+         # creating the new index, however this is a simple way to turn a RAM index
+         # into a file system index.
+         #
+         # directory:: This can either be a Store::Directory object or a String
+         #             representing the path to the directory where you would
+         #             like to store the index.
+         #
+         # create::    True if you'd like to create the directory if it doesn't
+         #             exist or copy over an existing directory. False if you'd
+         #             like to merge with the existing directory. This defaults to
+         #             true.
+         def persist(directory, create = true)
+           synchronize do
+             close_all()
+             old_dir = @dir
+             if directory.is_a?(String)
+               @dir = FSDirectory.new(directory, create)
+             elsif directory.is_a?(Ferret::Store::Directory)
+               @dir = directory
+             end
+             @dir.extend(MonitorMixin) unless @dir.kind_of? MonitorMixin
+             @options[:dir] = @dir
+             @options[:create_if_missing] = true
+             add_indexes([old_dir])
+           end
+         end
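Persisting an in-memory index to disk, as described above (the path is hypothetical):

    ram_index = Isomorfeus::Ferret::I.new          # backed by a RAMDirectory
    ram_index << {:id => '1', :content => 'kept in memory so far'}
    ram_index.persist('/path/to/index')            # now backed by an FSDirectory on disk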
+
+         def to_s
+           buf = ""
+           (0...(size)).each do |i|
+             buf << self[i].to_s + "\n" if not deleted?(i)
+           end
+           buf
+         end
+
+         # Returns an Explanation that describes how +doc+ scored against
+         # +query+.
+         #
+         # This is intended to be used in developing Similarity implementations,
+         # and, for good performance, should not be displayed with every hit.
+         # Computing an explanation is as expensive as executing the query over the
+         # entire index.
+         def explain(query, doc)
+           @dir.synchronize do
+             ensure_searcher_open()
+             query = do_process_query(query)
+
+             return @searcher.explain(query, doc)
+           end
+         end
+
+         # Turn a query string into a Query object with the Index's QueryParser
+         def process_query(query)
+           @dir.synchronize do
+             ensure_searcher_open()
+             return do_process_query(query)
+           end
+         end
+
+         # Returns the field_infos object so that you can add new fields to the
+         # index.
+         def field_infos
+           @dir.synchronize do
+             ensure_writer_open()
+             return @writer.field_infos
+           end
+         end
+
+
+         protected
+         def ensure_writer_open()
+           raise "tried to use a closed index" if not @open
+           return if @writer
+           if @reader
+             @searcher.close if @searcher
+             @reader.close
+             @reader = nil
+             @searcher = nil
+           end
+           @writer = IndexWriter.new(@options)
+         end
+
+         # returns the new reader if one is opened
+         def ensure_reader_open(get_latest = true)
+           raise "tried to use a closed index" if not @open
+           if @reader
+             if get_latest
+               latest = false
+               begin
+                 latest = @reader.latest?
+               rescue Lock::LockError
+                 sleep(@options[:lock_retry_time]) # sleep for 2 seconds and try again
+                 latest = @reader.latest?
+               end
+               if not latest
+                 @searcher.close if @searcher
+                 @reader.close
+                 return @reader = IndexReader.new(@dir)
+               end
+             end
+           else
+             if @writer
+               @writer.close
+               @writer = nil
+             end
+             return @reader = IndexReader.new(@dir)
+           end
+           return false
+         end
+
+         def ensure_searcher_open()
+           raise "tried to use a closed index" if not @open
+           if ensure_reader_open() or not @searcher
+             @searcher = Searcher.new(@reader)
+           end
+         end
+
+         private
+         def do_process_query(query)
+           if query.is_a?(String)
+             if @qp.nil?
+               @qp = Ferret::QueryParser.new(@options)
+             end
+             # we need to set this every time, in case a new field has been added
+             @qp.fields = @reader.fields unless options[:all_fields] || options[:fields]
+             @qp.tokenized_fields = @reader.tokenized_fields unless options[:tokenized_fields]
+             query = @qp.parse(query)
+           end
+           return query
+         end
+
+         def do_search(query, options)
+           ensure_searcher_open()
+           query = do_process_query(query)
+
+           return @searcher.search(query, options)
+         end
+
+         def close_all()
+           @dir.synchronize do
+             @searcher.close if @searcher
+             @reader.close if @reader
+             @writer.close if @writer
+             @reader = nil
+             @searcher = nil
+             @writer = nil
+           end
+         end
+
+         # If +docs+ is a Hash or an Array then a batch delete will be performed.
+         # If +docs+ is an Array then it will be considered an array of +id+'s. If
+         # it is a Hash, then its keys will be used instead as the Array of
+         # document +id+'s. If the +id+ is an Integer then it is considered a
+         # Ferret document number and the corresponding document will be deleted.
+         # If the +id+ is a String or a Symbol then the +id+ will be considered a
+         # term and the documents that contain that term in the +:id_field+ will
+         # be deleted.
+         #
+         # docs:: An Array of docs to be deleted, or a Hash (in which case the keys
+         #        are used)
+         def batch_delete(docs)
+           docs = docs.keys if docs.is_a?(Hash)
+           raise ArgumentError, "must pass Array or Hash" unless docs.is_a? Array
+           ids = []
+           terms = []
+           docs.each do |doc|
+             case doc
+             when String then terms << doc
+             when Symbol then terms << doc.to_s
+             when Integer then ids << doc
+             else
+               raise ArgumentError, "Cannot delete for arg of type #{doc.class}"
+             end
+           end
+           if ids.size > 0
+             ensure_reader_open
+             ids.each {|id| @reader.delete(id)}
+           end
+           if terms.size > 0
+             ensure_writer_open()
+             @writer.delete(@id_field, terms)
+           end
+           return self
+         end
+
+       end
+     end
+
+     I = Index::Index
+   end
+ end
+