RubyGems - np-ferret - Versions diffs - 0.11.6 - Mend

np-ferret 0.11.6

Files changed (275) hide show

data/CHANGELOG +24 -0
data/MIT-LICENSE +20 -0
data/README +102 -0
data/Rakefile +338 -0
data/TODO +17 -0
data/TUTORIAL +231 -0
data/bin/ferret-browser +79 -0
data/ext/Makefile +218 -0
data/ext/analysis.c +1584 -0
data/ext/analysis.h +219 -0
data/ext/analysis.o +0 -0
data/ext/api.c +69 -0
data/ext/api.h +27 -0
data/ext/api.o +0 -0
data/ext/array.c +123 -0
data/ext/array.h +53 -0
data/ext/array.o +0 -0
data/ext/bitvector.c +540 -0
data/ext/bitvector.h +272 -0
data/ext/bitvector.o +0 -0
data/ext/compound_io.c +383 -0
data/ext/compound_io.o +0 -0
data/ext/config.h +42 -0
data/ext/document.c +156 -0
data/ext/document.h +53 -0
data/ext/document.o +0 -0
data/ext/except.c +120 -0
data/ext/except.h +168 -0
data/ext/except.o +0 -0
data/ext/extconf.rb +14 -0
data/ext/ferret.c +402 -0
data/ext/ferret.h +91 -0
data/ext/ferret.o +0 -0
data/ext/ferret_ext.bundle +0 -0
data/ext/filter.c +156 -0
data/ext/filter.o +0 -0
data/ext/fs_store.c +484 -0
data/ext/fs_store.o +0 -0
data/ext/global.c +418 -0
data/ext/global.h +117 -0
data/ext/global.o +0 -0
data/ext/hash.c +598 -0
data/ext/hash.h +475 -0
data/ext/hash.o +0 -0
data/ext/hashset.c +170 -0
data/ext/hashset.h +187 -0
data/ext/hashset.o +0 -0
data/ext/header.h +58 -0
data/ext/helper.c +62 -0
data/ext/helper.h +13 -0
data/ext/helper.o +0 -0
data/ext/inc/lang.h +48 -0
data/ext/inc/threading.h +31 -0
data/ext/index.c +6510 -0
data/ext/index.h +964 -0
data/ext/index.o +0 -0
data/ext/lang.h +66 -0
data/ext/libstemmer.c +92 -0
data/ext/libstemmer.h +79 -0
data/ext/libstemmer.o +0 -0
data/ext/mempool.c +87 -0
data/ext/mempool.h +35 -0
data/ext/mempool.o +0 -0
data/ext/modules.h +162 -0
data/ext/multimapper.c +310 -0
data/ext/multimapper.h +51 -0
data/ext/multimapper.o +0 -0
data/ext/posh.c +1006 -0
data/ext/posh.h +1007 -0
data/ext/posh.o +0 -0
data/ext/priorityqueue.c +151 -0
data/ext/priorityqueue.h +143 -0
data/ext/priorityqueue.o +0 -0
data/ext/q_boolean.c +1608 -0
data/ext/q_boolean.o +0 -0
data/ext/q_const_score.c +165 -0
data/ext/q_const_score.o +0 -0
data/ext/q_filtered_query.c +209 -0
data/ext/q_filtered_query.o +0 -0
data/ext/q_fuzzy.c +335 -0
data/ext/q_fuzzy.o +0 -0
data/ext/q_match_all.c +148 -0
data/ext/q_match_all.o +0 -0
data/ext/q_multi_term.c +677 -0
data/ext/q_multi_term.o +0 -0
data/ext/q_parser.c +2825 -0
data/ext/q_parser.o +0 -0
data/ext/q_phrase.c +1126 -0
data/ext/q_phrase.o +0 -0
data/ext/q_prefix.c +100 -0
data/ext/q_prefix.o +0 -0
data/ext/q_range.c +356 -0
data/ext/q_range.o +0 -0
data/ext/q_span.c +2402 -0
data/ext/q_span.o +0 -0
data/ext/q_term.c +337 -0
data/ext/q_term.o +0 -0
data/ext/q_wildcard.c +171 -0
data/ext/q_wildcard.o +0 -0
data/ext/r_analysis.c +2636 -0
data/ext/r_analysis.o +0 -0
data/ext/r_index.c +3509 -0
data/ext/r_index.o +0 -0
data/ext/r_qparser.c +585 -0
data/ext/r_qparser.o +0 -0
data/ext/r_search.c +4240 -0
data/ext/r_search.o +0 -0
data/ext/r_store.c +513 -0
data/ext/r_store.o +0 -0
data/ext/r_utils.c +963 -0
data/ext/r_utils.o +0 -0
data/ext/ram_store.c +471 -0
data/ext/ram_store.o +0 -0
data/ext/search.c +1743 -0
data/ext/search.h +885 -0
data/ext/search.o +0 -0
data/ext/similarity.c +150 -0
data/ext/similarity.h +82 -0
data/ext/similarity.o +0 -0
data/ext/sort.c +985 -0
data/ext/sort.o +0 -0
data/ext/stem_ISO_8859_1_danish.c +338 -0
data/ext/stem_ISO_8859_1_danish.h +16 -0
data/ext/stem_ISO_8859_1_danish.o +0 -0
data/ext/stem_ISO_8859_1_dutch.c +635 -0
data/ext/stem_ISO_8859_1_dutch.h +16 -0
data/ext/stem_ISO_8859_1_dutch.o +0 -0
data/ext/stem_ISO_8859_1_english.c +1156 -0
data/ext/stem_ISO_8859_1_english.h +16 -0
data/ext/stem_ISO_8859_1_english.o +0 -0
data/ext/stem_ISO_8859_1_finnish.c +792 -0
data/ext/stem_ISO_8859_1_finnish.h +16 -0
data/ext/stem_ISO_8859_1_finnish.o +0 -0
data/ext/stem_ISO_8859_1_french.c +1276 -0
data/ext/stem_ISO_8859_1_french.h +16 -0
data/ext/stem_ISO_8859_1_french.o +0 -0
data/ext/stem_ISO_8859_1_german.c +512 -0
data/ext/stem_ISO_8859_1_german.h +16 -0
data/ext/stem_ISO_8859_1_german.o +0 -0
data/ext/stem_ISO_8859_1_italian.c +1091 -0
data/ext/stem_ISO_8859_1_italian.h +16 -0
data/ext/stem_ISO_8859_1_italian.o +0 -0
data/ext/stem_ISO_8859_1_norwegian.c +296 -0
data/ext/stem_ISO_8859_1_norwegian.h +16 -0
data/ext/stem_ISO_8859_1_norwegian.o +0 -0
data/ext/stem_ISO_8859_1_porter.c +776 -0
data/ext/stem_ISO_8859_1_porter.h +16 -0
data/ext/stem_ISO_8859_1_porter.o +0 -0
data/ext/stem_ISO_8859_1_portuguese.c +1035 -0
data/ext/stem_ISO_8859_1_portuguese.h +16 -0
data/ext/stem_ISO_8859_1_portuguese.o +0 -0
data/ext/stem_ISO_8859_1_spanish.c +1119 -0
data/ext/stem_ISO_8859_1_spanish.h +16 -0
data/ext/stem_ISO_8859_1_spanish.o +0 -0
data/ext/stem_ISO_8859_1_swedish.c +307 -0
data/ext/stem_ISO_8859_1_swedish.h +16 -0
data/ext/stem_ISO_8859_1_swedish.o +0 -0
data/ext/stem_KOI8_R_russian.c +701 -0
data/ext/stem_KOI8_R_russian.h +16 -0
data/ext/stem_KOI8_R_russian.o +0 -0
data/ext/stem_UTF_8_danish.c +344 -0
data/ext/stem_UTF_8_danish.h +16 -0
data/ext/stem_UTF_8_danish.o +0 -0
data/ext/stem_UTF_8_dutch.c +653 -0
data/ext/stem_UTF_8_dutch.h +16 -0
data/ext/stem_UTF_8_dutch.o +0 -0
data/ext/stem_UTF_8_english.c +1176 -0
data/ext/stem_UTF_8_english.h +16 -0
data/ext/stem_UTF_8_english.o +0 -0
data/ext/stem_UTF_8_finnish.c +808 -0
data/ext/stem_UTF_8_finnish.h +16 -0
data/ext/stem_UTF_8_finnish.o +0 -0
data/ext/stem_UTF_8_french.c +1296 -0
data/ext/stem_UTF_8_french.h +16 -0
data/ext/stem_UTF_8_french.o +0 -0
data/ext/stem_UTF_8_german.c +526 -0
data/ext/stem_UTF_8_german.h +16 -0
data/ext/stem_UTF_8_german.o +0 -0
data/ext/stem_UTF_8_italian.c +1113 -0
data/ext/stem_UTF_8_italian.h +16 -0
data/ext/stem_UTF_8_italian.o +0 -0
data/ext/stem_UTF_8_norwegian.c +302 -0
data/ext/stem_UTF_8_norwegian.h +16 -0
data/ext/stem_UTF_8_norwegian.o +0 -0
data/ext/stem_UTF_8_porter.c +794 -0
data/ext/stem_UTF_8_porter.h +16 -0
data/ext/stem_UTF_8_porter.o +0 -0
data/ext/stem_UTF_8_portuguese.c +1055 -0
data/ext/stem_UTF_8_portuguese.h +16 -0
data/ext/stem_UTF_8_portuguese.o +0 -0
data/ext/stem_UTF_8_russian.c +709 -0
data/ext/stem_UTF_8_russian.h +16 -0
data/ext/stem_UTF_8_russian.o +0 -0
data/ext/stem_UTF_8_spanish.c +1137 -0
data/ext/stem_UTF_8_spanish.h +16 -0
data/ext/stem_UTF_8_spanish.o +0 -0
data/ext/stem_UTF_8_swedish.c +313 -0
data/ext/stem_UTF_8_swedish.h +16 -0
data/ext/stem_UTF_8_swedish.o +0 -0
data/ext/stopwords.c +401 -0
data/ext/stopwords.o +0 -0
data/ext/store.c +692 -0
data/ext/store.h +777 -0
data/ext/store.o +0 -0
data/ext/term_vectors.c +352 -0
data/ext/term_vectors.o +0 -0
data/ext/threading.h +31 -0
data/ext/utilities.c +446 -0
data/ext/utilities.o +0 -0
data/ext/win32.h +54 -0
data/ferret.gemspec +39 -0
data/lib/ferret.rb +29 -0
data/lib/ferret/browser.rb +246 -0
data/lib/ferret/browser/s/global.js +192 -0
data/lib/ferret/browser/s/style.css +148 -0
data/lib/ferret/browser/views/document/list.rhtml +49 -0
data/lib/ferret/browser/views/document/show.rhtml +27 -0
data/lib/ferret/browser/views/error/index.rhtml +7 -0
data/lib/ferret/browser/views/help/index.rhtml +8 -0
data/lib/ferret/browser/views/home/index.rhtml +29 -0
data/lib/ferret/browser/views/layout.rhtml +22 -0
data/lib/ferret/browser/views/term-vector/index.rhtml +4 -0
data/lib/ferret/browser/views/term/index.rhtml +199 -0
data/lib/ferret/browser/views/term/termdocs.rhtml +1 -0
data/lib/ferret/browser/webrick.rb +14 -0
data/lib/ferret/document.rb +130 -0
data/lib/ferret/field_infos.rb +44 -0
data/lib/ferret/index.rb +786 -0
data/lib/ferret/number_tools.rb +157 -0
data/lib/ferret_ext.bundle +0 -0
data/lib/ferret_version.rb +3 -0
data/pkg/ferret-0.11.6.gem +0 -0
data/pkg/ferret-0.11.6.tgz +0 -0
data/pkg/ferret-0.11.6.zip +0 -0
data/setup.rb +1555 -0
data/test/test_all.rb +5 -0
data/test/test_helper.rb +24 -0
data/test/threading/number_to_spoken.rb +132 -0
data/test/threading/thread_safety_index_test.rb +79 -0
data/test/threading/thread_safety_read_write_test.rb +76 -0
data/test/threading/thread_safety_test.rb +133 -0
data/test/unit/analysis/tc_analyzer.rb +548 -0
data/test/unit/analysis/tc_token_stream.rb +646 -0
data/test/unit/index/tc_index.rb +762 -0
data/test/unit/index/tc_index_reader.rb +699 -0
data/test/unit/index/tc_index_writer.rb +437 -0
data/test/unit/index/th_doc.rb +315 -0
data/test/unit/largefile/tc_largefile.rb +46 -0
data/test/unit/query_parser/tc_query_parser.rb +238 -0
data/test/unit/search/tc_filter.rb +135 -0
data/test/unit/search/tc_fuzzy_query.rb +147 -0
data/test/unit/search/tc_index_searcher.rb +61 -0
data/test/unit/search/tc_multi_searcher.rb +128 -0
data/test/unit/search/tc_multiple_search_requests.rb +58 -0
data/test/unit/search/tc_search_and_sort.rb +179 -0
data/test/unit/search/tc_sort.rb +49 -0
data/test/unit/search/tc_sort_field.rb +27 -0
data/test/unit/search/tc_spans.rb +190 -0
data/test/unit/search/tm_searcher.rb +384 -0
data/test/unit/store/tc_fs_store.rb +77 -0
data/test/unit/store/tc_ram_store.rb +35 -0
data/test/unit/store/tm_store.rb +34 -0
data/test/unit/store/tm_store_lock.rb +68 -0
data/test/unit/tc_document.rb +81 -0
data/test/unit/ts_analysis.rb +2 -0
data/test/unit/ts_index.rb +2 -0
data/test/unit/ts_largefile.rb +4 -0
data/test/unit/ts_query_parser.rb +2 -0
data/test/unit/ts_search.rb +2 -0
data/test/unit/ts_store.rb +2 -0
data/test/unit/ts_utils.rb +2 -0
data/test/unit/utils/tc_bit_vector.rb +295 -0
data/test/unit/utils/tc_number_tools.rb +117 -0
data/test/unit/utils/tc_priority_queue.rb +106 -0
metadata +392 -0

data/TODO ADDED Viewed

@@ -0,0 +1,17 @@
+= TODO
+* user defined sorting
+* add field compression
+* Fix highlighting to work for compressed fields
+* Fix highlighting to work for external fields
+* Add Ferret::Index::Index
+* Fix:
+> Working Query:  field1:value1 AND NOT field2:value2
+> Failing Query:    field1:value1 AND ( NOT field2:value2 )
+= Done
+* Add string Sort descriptor
+* fix memory bug
+* add MultiReader interface
+* add lexicographical sort (byte sort)
+* Add highlighting

data/TUTORIAL ADDED Viewed

@@ -0,0 +1,231 @@
+= Quick Introduction to Ferret
+The simplest way to use Ferret is through the Ferret::Index::Index class.
+This is now aliased by Ferret::I for quick and easy access. Start by including
+the Ferret module.
+  require 'ferret'
+  include Ferret
+=== Creating an index
+Creating an in-memory index is very simple;
+  index = Index::Index.new()
+To create a persistent index;
+  index = Index::Index.new(:path => '/path/to/index')
+Both of these methods create new Indexes with the StandardAnalyzer. An
+analyzer is what you use to divide the input data up into tokens which you can
+search for later. If you'd like to use a different analyzer you can specify it
+here, eg;
+  index = Index::Index.new(:path => '/path/to/index',
+                           :analyzer => Analysis::WhiteSpaceAnalyzer.new)
+For more options when creating an Index refer to Ferret::Index::Index.
+=== Adding Documents
+To add a document you can simply add a string or an array of strings. This will
+store all the strings in the "" (ie empty string) field (unless you specify the
+default field when you create the index).
+  index << "This is a new document to be indexed"
+  index << ["And here", "is another", "new document", "to be indexed"]
+But these are pretty simple documents. If this is all you want to index you
+could probably just use SimpleSearch. So let's give our documents some fields;
+  index << {:title => "Programming Ruby", :content => "blah blah blah"}
+  index << {:title => "Programming Ruby", :content => "yada yada yada"}
+Note the way that all field-names are Symbols. Although Strings will work,
+this is a best-practice in Ferret. Or if you are indexing data stored in a
+database, you'll probably want to store the id;
+  index << {:id => row.id, :title => row.title, :date => row.date}
+So far we have been storing and tokenizing all of the input data along with
+term vectors. If we want to change this we need to change the way we setup the
+index. You must create a FieldInfos object describing the index:
+  field_infos = FieldInfos.new(:store => :no,
+                               :index => :untokenized_omit_norms,
+                               :term_vector => :no)
+The values that you set FieldInfos to have will be used by default by all
+fields. If you want to change the properties for specific fields, you need to
+add a FieldInfo to field_infos.
+  field_infos.add_field(:title, :store => :yes, :index => :yes, :boost => 10.0)
+  field_infos.add_field(:content, :store => :yes,
+                                  :index => :yes,
+                                  :term_vector => :with_positions_offsets)
+If you need to add a field to an already open index you do so like this:
+  index.field_infos.add_field(:new_field, :store => :yes)
+=== Searching
+Now that we have data in our index, how do we actually use this index to
+search the data? The Index offers two search methods, Index#search and
+Index#search_each. The first method returns a Ferret::Index::TopDocs object.
+The second we'll show here. Let's say we wanted to find all documents with the
+phrase "quick brown fox" in the content field. We'd write;
+  index.search_each('content:"quick brown fox"') do |id, score|
+    puts "Document #{id} found with a score of #{score}"
+  end
+But "fast" has a pretty similar meaning to "quick" and we don't mind if the
+fox is a little red. Also, the phrase could be in the title so we'll search
+there as well. So we could expand our search like this;
+  index.search_each('title|content:"quick|fast brown|red fox"') do |id, score|
+    puts "Document #{id} found with a score of #{score}"
+  end
+What if we want to find all documents entered on or after 5th of September,
+2005 with the words "ruby" or "rails" in any field. We could type something like;
+  index.search_each('date:( >= 20050905) *:(ruby OR rails)') do |id, score|
+    puts "Document #{index[id][:title]} found with a score of #{score}"
+  end
+Ferret has quite a complex query language. To find out more about Ferret's
+query language, see Ferret::QueryParser. You can also construct even more
+complex queries like Ferret::Search::Spans by hand. See Ferret::Search::Query
+for more information.
+=== Highlighting
+Ferret now has a super-fast highlighting method. See
+Ferret::Index::Index#highlight. Here is an example of how you would use it
+when printing to the console:
+  index.search_each('date:( >= 20050905) content:(ruby OR rails)') do |id, score|
+    puts "Document #{index[id][:title]} found with a score of #{score}"
+    highlights = index.highlight("content:(ruby OR rails)", 0,
+                                 :field => :content,
+                                 :pre_tag => "\033[36m",
+                                 :post_tag => "\033[m")
+    puts highlights
+  end
+And if you want to highlight a whole document, set :excerpt_length to :all:
+  puts index.highlight(query, doc_id,
+                       :field => :content,
+                       :pre_tag => "\033[36m",
+                       :post_tag => "\033[m",
+                       :excerpt_length => :all)
+=== Accessing Documents
+You may have noticed that when we run a search we only get the document id
+back. By itself this isn't much use to us. Getting the data from the index is
+very straightforward. For example if we want the :title field from the 3rd
+document, type;
+  index[2][:title]
+Documents are lazy loading so if you try this:
+  puts index[2]
+You will always get an empty Hash. To load all fields, call the load method:
+  puts index[2].load
+NOTE: documents are indexed from 0. You can also use array-like index
+parameters to access index. For example
+  index[1..4]
+  index[10, 10]
+  index[-5]
+The default field is :id (although you can change this with index's
+:default_create_field parameter);
+  index << "This is a document"
+  index[0][:id]
+Let's go back to the database example above. If we store all of our documents
+with an id then we can access that field using the id. As long as we called
+our id field :id we can do this
+  index["89721347"]["title"]
+Pretty simple huh? You should note though that if there are more than one
+document with the same *id* or *key* then only the first one will be returned
+so it is probably better that you ensure the key is unique somehow. By setting
+Index's :key attribute to :id, Ferret will do this automatically for you. It
+can even handle multiple field primary keys. For example, you could set
+:key to [:id, :model] and Ferret would keep the documents unique for that pair
+of fields.
+=== Modifying and Deleting Documents
+What if we want to change the data in the index? Ferret doesn't actually let
+you change the data once it is in the index. But you can delete documents so
+the standard way to modify data is to delete it and re-add it again with the
+modifications made. It is important to note that when doing this the documents
+will get a new document number so you should be careful not to use a document
+number after the document has been deleted. Here is an example of modifying a
+document;
+  index << {:title => "Programing Rbuy", :content => "blah blah blah"}
+  doc_id = nil
+  index.search_each('title:"Programing Rbuy"') {|id, score| doc_id = id}
+  return unless doc_id
+  doc = index[doc_id]
+  index.delete(doc_id)
+  # modify doc. It is just a Hash after all
+  doc[:title] = "Programming Ruby"
+  index << doc
+If you set the :key parameter as described in the last section there is no
+need to delete the document. It will be automatically deleted when you add
+another document with the same key.
+Also, we can use the id field, as above, to delete documents. This time though
+every document that matches the id will be deleted. Again, it is probably a
+good idea if you somehow ensure that your *ids* are kept unique.
+  id = "23453422"
+  index.delete(id)
+=== Onwards
+This is just a small sampling of what Ferret allows you to do.  Ferret, like
+Lucene, is designed to be extended, and allows you to construct your own query
+types, analyzers, and so on. Going onwards you should check out the following
+documentation:
+* Ferret::Analysis: for more information on how the data is processed when it
+  is tokenized. There are a number of things you can do with your data such as
+  adding stop lists or perhaps a porter stemmer. There are also a number of
+  analyzers already available and it is almost trivial to create a new one
+  with a simple regular expression.
+* Ferret::Search: for more information on querying the index. There are a
+  number of already available queries and it's unlikely you'll need to create
+  your own. You may however want to take advantage of the sorting or filtering
+  abilities of Ferret to present your data the best way you see fit.
+* Ferret::QueryParser: if you want to find out more about what you can do with
+  Ferret's Query Parser, this is the place to look. The query parser is one
+  area that could use a bit of work so please send your suggestions.
+* Ferret::Index: for more advanced access to the index you'll probably want to
+  use the Ferret::Index::IndexWriter and Ferret::Index::IndexReader. This is
+  the place to look for more information on them.
+* Ferret::Store: This is the module used to access the actual index storage
+  and won't be of much interest to most people.

data/bin/ferret-browser ADDED Viewed

@@ -0,0 +1,79 @@
+#!/usr/bin/env ruby
+$: << File.expand_path(File.join(File.basename(__FILE__), '../lib'))
+require 'ferret'
+require 'ferret/browser'
+require 'optparse'
+require 'ostruct'
+SERVER_OPTIONS = ['webrick']
+conf = OpenStruct.new(:host => '0.0.0.0', :port => 3301)
+opts = OptionParser.new do |opts|
+  opts.banner = "Usage: #{File.basename($0)} /path/to/index"
+  opts.separator ""
+  opts.separator "Specific Options:"
+  opts.on("-h", "--host HOSTNAME",
+          "Host for web server to bind to (default is all IPs)") { |conf.host| }
+  opts.on("-p", "--port NUM",
+          "Port for web server (defaults to #{conf.port})") { |conf.port| }
+  opts.on("-s", "--server NAME",
+          "Server to force (#{SERVER_OPTIONS.join(', ')}).") { |s| conf.server = s.to_sym }
+  opts.separator ""
+  opts.separator "Common options:"
+  opts.on_tail("-?", "--help", "Show this message") do
+    puts opts
+    exit
+  end
+  opts.on_tail("-v", "--version", "Show version") do
+    puts Ferret::VERSION
+    exit
+  end
+end
+opts.parse! ARGV
+if ARGV.length != 1
+  puts opts
+  exit
+end
+@path = ARGV[0]
+# Load the Ferret index
+begin
+  @reader = Ferret::Index::IndexReader.new(@path)
+rescue Ferret::FileNotFoundError => e
+  puts "\033[31mCannot start Ferret. No index exists at \"\033[m" +
+    "\033[33m#{@path}\033[m\033[31m\".\033[m"
+  exit
+rescue Exception => e
+  puts "\033[31mCannot start Ferret.\n\033[m\033[33m#{e.to_s}\031[m"
+  exit
+end
+unless conf.server
+  conf.server = :webrick
+end
+case conf.server.to_s
+when 'webrick'
+  require 'webrick/httpserver'
+  require 'ferret/browser/webrick'
+  # Mount the root
+  s = WEBrick::HTTPServer.new(:BindAddress => conf.host, :Port => conf.port)
+  s.mount "/s", WEBrick::HTTPServlet::FileHandler, Ferret::Browser::Controller::STATIC_DIR, true
+  s.mount "/", WEBrick::FerretBrowserHandler, @reader, @path
+  # Server up
+  trap(:INT) do
+    s.shutdown
+  end
+  s.start
+else
+  raise "server #{conf.server} not known. Must be one of [#{SERVER_OPTIONS.join(', ')}]"
+end

data/ext/Makefile ADDED Viewed

@@ -0,0 +1,218 @@
+SHELL = /bin/sh
+# V=0 quiet, V=1 verbose.  other values don't work.
+V = 0
+# Q expands to "@" when V=0 (recipe lines are not echoed) and to nothing when V=1.
+Q1 = $(V:1=)
+Q = $(Q1:0=@)
+n=$(NULLCMD)
+# ECHO expands to "@echo" when V=0 and to "@$(NULLCMD)" (a silent no-op) when V=1.
+ECHO1 = $(V:1=@$n)
+ECHO = $(ECHO1:0=@echo)
+#### Start of system configuration section. ####
+# NOTE: the absolute paths below point into one specific rbenv installation
+# (/Users/ehanson/.rbenv/versions/1.9.3-p392); they are not portable.
+srcdir = .
+topdir = /Users/ehanson/.rbenv/versions/1.9.3-p392/include/ruby-1.9.1
+hdrdir = /Users/ehanson/.rbenv/versions/1.9.3-p392/include/ruby-1.9.1
+arch_hdrdir = /Users/ehanson/.rbenv/versions/1.9.3-p392/include/ruby-1.9.1/$(arch)
+VPATH = $(srcdir):$(arch_hdrdir)/ruby:$(hdrdir)/ruby
+prefix = $(DESTDIR)/Users/ehanson/.rbenv/versions/1.9.3-p392
+rubylibprefix = $(libdir)/$(RUBY_BASE_NAME)
+exec_prefix = $(prefix)
+vendorhdrdir = $(rubyhdrdir)/vendor_ruby
+sitehdrdir = $(rubyhdrdir)/site_ruby
+rubyhdrdir = $(includedir)/$(RUBY_BASE_NAME)-$(ruby_version)
+vendordir = $(rubylibprefix)/vendor_ruby
+sitedir = $(rubylibprefix)/site_ruby
+ridir = $(datarootdir)/$(RI_BASE_NAME)
+mandir = $(datarootdir)/man
+localedir = $(datarootdir)/locale
+libdir = $(exec_prefix)/lib
+psdir = $(docdir)
+pdfdir = $(docdir)
+dvidir = $(docdir)
+htmldir = $(docdir)
+infodir = $(datarootdir)/info
+docdir = $(datarootdir)/doc/$(PACKAGE)
+oldincludedir = $(DESTDIR)/usr/include
+includedir = $(prefix)/include
+localstatedir = $(prefix)/var
+sharedstatedir = $(prefix)/com
+sysconfdir = $(prefix)/etc
+datadir = $(datarootdir)
+datarootdir = $(prefix)/share
+libexecdir = $(exec_prefix)/libexec
+sbindir = $(exec_prefix)/sbin
+bindir = $(exec_prefix)/bin
+rubylibdir = $(rubylibprefix)/$(ruby_version)
+archdir = $(rubylibdir)/$(arch)
+sitelibdir = $(sitedir)/$(ruby_version)
+sitearchdir = $(sitelibdir)/$(sitearch)
+vendorlibdir = $(vendordir)/$(ruby_version)
+vendorarchdir = $(vendorlibdir)/$(sitearch)
+NULLCMD = :
+CC = gcc
+CXX = g++
+LIBRUBY = $(LIBRUBY_A)
+LIBRUBY_A = lib$(RUBY_SO_NAME)-static.a
+LIBRUBYARG_SHARED =
+LIBRUBYARG_STATIC = -l$(RUBY_SO_NAME)-static
+# $(empty) expands to nothing; appending it keeps the space after "-o" in the
+# two output-flag variables below.
+empty =
+OUTFLAG = -o $(empty)
+COUTFLAG = -o $(empty)
+RUBY_EXTCONF_H =
+cflags   =  $(optflags) $(debugflags) $(warnflags)
+optflags = -O3
+debugflags = -ggdb
+warnflags = -Wall -Wextra -Wno-unused-parameter -Wno-parentheses -Wno-long-long -Wno-missing-field-initializers -Wpointer-arith -Wwrite-strings -Wdeclaration-after-statement -Wshorten-64-to-32 -Wimplicit-function-declaration
+# CFLAGS does not reference $(cflags), so the warning/debug flags defined
+# above are not applied by the compile rules in this file.
+CFLAGS   = -fno-common  -O3 -Wno-error=shorten-64-to-32  -pipe -D_FILE_OFFSET_BITS=64 $(ARCH_FLAG)
+INCFLAGS = -I. -I$(arch_hdrdir) -I$(hdrdir)/ruby/backward -I$(hdrdir) -I$(srcdir)
+DEFS     =
+CPPFLAGS =  -I'/Users/ehanson/.rbenv/versions/1.9.3-p392/include'  -D_XOPEN_SOURCE -D_DARWIN_C_SOURCE $(DEFS) $(cppflags)
+CXXFLAGS = $(CFLAGS) $(cxxflags)
+ldflags  = -L. -L'/Users/ehanson/.rbenv/versions/1.9.3-p392/lib'  -L/usr/local/lib
+dldflags = -Wl,-undefined,dynamic_lookup -Wl,-multiply_defined,suppress -Wl,-flat_namespace
+ARCH_FLAG =
+DLDFLAGS = $(ldflags) $(dldflags) $(ARCH_FLAG)
+LDSHARED = $(CC) -dynamic -bundle
+LDSHAREDXX = $(CXX) -dynamic -bundle
+AR = ar
+EXEEXT =
+RUBY_BASE_NAME = ruby
+RUBY_INSTALL_NAME = ruby
+RUBY_SO_NAME = ruby
+arch = x86_64-darwin12.2.1
+sitearch = $(arch)
+ruby_version = 1.9.1
+ruby = /Users/ehanson/.rbenv/versions/1.9.3-p392/bin/ruby
+RUBY = $(ruby)
+RM = rm -f
+RM_RF = $(RUBY) -run -e rm -- -rf
+RMDIRS = rmdir -p
+MAKEDIRS = mkdir -p
+INSTALL = /usr/bin/install -c
+INSTALL_PROG = $(INSTALL) -m 0755
+INSTALL_DATA = $(INSTALL) -m 644
+COPY = cp
+# "exit > file" creates (or truncates) the file via the shell redirection;
+# it is used as a stand-in for touch when writing stamp files.
+TOUCH = exit >
+#### End of system configuration section. ####
+# Variables describing this particular extension (ferret_ext).
+preload =
+libpath = . $(libdir)
+LIBPATH =  -L. -L$(libdir)
+DEFFILE =
+CLEANFILES = mkmf.log
+DISTCLEANFILES =
+DISTCLEANDIRS =
+extout =
+extout_prefix =
+target_prefix =
+LOCAL_LIBS =
+LIBS =   -lpthread -ldl -lobjc
+SRCS = analysis.c api.c array.c bitvector.c compound_io.c document.c except.c ferret.c filter.c fs_store.c global.c hash.c hashset.c helper.c index.c libstemmer.c mempool.c multimapper.c posh.c priorityqueue.c q_boolean.c q_const_score.c q_filtered_query.c q_fuzzy.c q_match_all.c q_multi_term.c q_parser.c q_phrase.c q_prefix.c q_range.c q_span.c q_term.c q_wildcard.c r_analysis.c r_index.c r_qparser.c r_search.c r_store.c r_utils.c ram_store.c search.c similarity.c sort.c stem_ISO_8859_1_danish.c stem_ISO_8859_1_dutch.c stem_ISO_8859_1_english.c stem_ISO_8859_1_finnish.c stem_ISO_8859_1_french.c stem_ISO_8859_1_german.c stem_ISO_8859_1_italian.c stem_ISO_8859_1_norwegian.c stem_ISO_8859_1_porter.c stem_ISO_8859_1_portuguese.c stem_ISO_8859_1_spanish.c stem_ISO_8859_1_swedish.c stem_KOI8_R_russian.c stem_UTF_8_danish.c stem_UTF_8_dutch.c stem_UTF_8_english.c stem_UTF_8_finnish.c stem_UTF_8_french.c stem_UTF_8_german.c stem_UTF_8_italian.c stem_UTF_8_norwegian.c stem_UTF_8_porter.c stem_UTF_8_portuguese.c stem_UTF_8_russian.c stem_UTF_8_spanish.c stem_UTF_8_swedish.c stopwords.c store.c term_vectors.c utilities.c
+# One object file per source file, in the same order. Deriving the list from
+# SRCS keeps the two from drifting apart when a source file is added or removed.
+OBJS = $(SRCS:.c=.o)
+TARGET = ferret_ext
+DLLIB = $(TARGET).bundle
+EXTSTATIC =
+STATIC_LIB =
+BINDIR        = $(bindir)
+RUBYCOMMONDIR = $(sitedir)$(target_prefix)
+RUBYLIBDIR = /Users/ehanson/.rbenv/versions/1.9.3-p392/gemsets/ferret/gems/sdsykes-ferret-0.11.6.19/lib$(target_prefix)
+RUBYARCHDIR = /Users/ehanson/.rbenv/versions/1.9.3-p392/gemsets/ferret/gems/sdsykes-ferret-0.11.6.19/lib$(target_prefix)
+HDRDIR        = $(rubyhdrdir)/ruby$(target_prefix)
+ARCHHDRDIR    = $(rubyhdrdir)/$(arch)/ruby$(target_prefix)
+TARGET_SO     = $(DLLIB)
+CLEANLIBS     = $(TARGET).bundle
+CLEANOBJS     = *.o  *.bak
+# Default goal: build the loadable bundle.
+all:    $(DLLIB)
+static: $(STATIC_LIB)
+.PHONY: all install static install-so install-rb
+.PHONY: clean clean-so clean-rb
+# The remaining cleanup targets are commands too, not files; declaring them
+# phony keeps a stray file named e.g. "distclean" from masking the target.
+.PHONY: clean-static clean-rb-default
+.PHONY: distclean distclean-so distclean-rb distclean-rb-default realclean
+# Double-colon hooks: each may be given additional independent recipes elsewhere.
+clean-static::
+clean-rb-default::
+clean-rb::
+clean-so::
+# Remove the bundle, object files, mkmf.log and the .*.time stamp files.
+# The leading "-" lets make continue if the removal fails.
+clean: clean-so clean-static clean-rb-default clean-rb
+		-$(Q)$(RM) $(CLEANLIBS) $(CLEANOBJS) $(CLEANFILES) .*.time
+distclean-rb-default::
+distclean-rb::
+distclean-so::
+# Everything "clean" removes, plus the generated Makefile, configure leftovers,
+# core files and editor backups.
+distclean: clean distclean-so distclean-rb-default distclean-rb
+		@-$(RM) Makefile $(RUBY_EXTCONF_H) conftest.* mkmf.log
+		@-$(RM) core ruby$(EXEEXT) *~ $(DISTCLEANFILES)
+		@-$(RMDIRS) $(DISTCLEANDIRS) 2> /dev/null || true
+realclean: distclean
+# Installation: install-so copies the built bundle into $(RUBYARCHDIR);
+# install-rb only runs the pre-install hooks below.
+install: install-so install-rb
+install-so: $(RUBYARCHDIR)/$(DLLIB)
+# Create the destination directory ("-" ignores a failure of that step),
+# then copy the bundle there with mode 0755.
+$(RUBYARCHDIR)/$(DLLIB): $(DLLIB)
+	-$(Q)$(MAKEDIRS) $(@D)
+	$(INSTALL_PROG) $(DLLIB) $(@D)
+# Additional recipe for the double-colon clean-static target.
+clean-static::
+	-$(Q)$(RM) $(STATIC_LIB)
+install-rb: pre-install-rb install-rb-default
+install-rb-default: pre-install-rb-default
+pre-install-rb: Makefile
+pre-install-rb-default: Makefile
+pre-install-rb-default:
+	$(ECHO) installing default ferret_ext libraries
+# Stamp file: creates $(RUBYARCHDIR) and then writes an empty file as the marker.
+./.RUBYARCHDIR.time:
+	$(Q) $(MAKEDIRS) $(RUBYARCHDIR)
+	$(Q) $(TOUCH) $@
+# site-install* are aliases for the corresponding install* targets.
+site-install: site-install-so site-install-rb
+site-install-so: install-so
+site-install-rb: install-rb
+# Suffix rules that compile one source file ($<) into one object file ($@).
+# The C++-style suffixes (.cc .mm .cxx .cpp .C) use $(CXX) with $(CXXFLAGS);
+# .c and .m use $(CC) with $(CFLAGS). $(ECHO) prints the "compiling" line in
+# quiet mode and $(Q) hides the actual command.
+.SUFFIXES: .c .m .cc .mm .cxx .cpp .C .o
+.cc.o:
+	$(ECHO) compiling $(<)
+	$(Q) $(CXX) $(INCFLAGS) $(CPPFLAGS) $(CXXFLAGS) $(COUTFLAG)$@ -c $<
+.mm.o:
+	$(ECHO) compiling $(<)
+	$(Q) $(CXX) $(INCFLAGS) $(CPPFLAGS) $(CXXFLAGS) $(COUTFLAG)$@ -c $<
+.cxx.o:
+	$(ECHO) compiling $(<)
+	$(Q) $(CXX) $(INCFLAGS) $(CPPFLAGS) $(CXXFLAGS) $(COUTFLAG)$@ -c $<
+.cpp.o:
+	$(ECHO) compiling $(<)
+	$(Q) $(CXX) $(INCFLAGS) $(CPPFLAGS) $(CXXFLAGS) $(COUTFLAG)$@ -c $<
+.C.o:
+	$(ECHO) compiling $(<)
+	$(Q) $(CXX) $(INCFLAGS) $(CPPFLAGS) $(CXXFLAGS) $(COUTFLAG)$@ -c $<
+.c.o:
+	$(ECHO) compiling $(<)
+	$(Q) $(CC) $(INCFLAGS) $(CPPFLAGS) $(CFLAGS) $(COUTFLAG)$@ -c $<
+.m.o:
+	$(ECHO) compiling $(<)
+	$(Q) $(CC) $(INCFLAGS) $(CPPFLAGS) $(CFLAGS) $(COUTFLAG)$@ -c $<
+# Link all objects into the bundle. Any existing bundle is removed first
+# ("-" ignores a failure of that step). Listing Makefile as a prerequisite
+# relinks the bundle whenever this file changes.
+$(DLLIB): $(OBJS) Makefile
+	$(ECHO) linking shared-object $(DLLIB)
+	-$(Q)$(RM) $(@)
+	$(Q) $(LDSHARED) -o $@ $(OBJS) $(LIBPATH) $(DLDFLAGS) $(LOCAL_LIBS) $(LIBS)
+# Every object also depends on these Ruby headers, so a change to any of them
+# triggers recompilation.
+$(OBJS): $(hdrdir)/ruby.h $(hdrdir)/ruby/defines.h $(arch_hdrdir)/ruby/config.h