sunspot 0.9.7

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (101) hide show
  1. data/History.txt +83 -0
  2. data/LICENSE +18 -0
  3. data/README.rdoc +154 -0
  4. data/Rakefile +9 -0
  5. data/TODO +9 -0
  6. data/VERSION.yml +4 -0
  7. data/bin/sunspot-configure-solr +46 -0
  8. data/bin/sunspot-solr +62 -0
  9. data/lib/light_config.rb +40 -0
  10. data/lib/sunspot.rb +469 -0
  11. data/lib/sunspot/adapters.rb +265 -0
  12. data/lib/sunspot/composite_setup.rb +186 -0
  13. data/lib/sunspot/configuration.rb +38 -0
  14. data/lib/sunspot/data_extractor.rb +47 -0
  15. data/lib/sunspot/dsl.rb +3 -0
  16. data/lib/sunspot/dsl/field_query.rb +72 -0
  17. data/lib/sunspot/dsl/fields.rb +86 -0
  18. data/lib/sunspot/dsl/query.rb +59 -0
  19. data/lib/sunspot/dsl/query_facet.rb +31 -0
  20. data/lib/sunspot/dsl/restriction.rb +25 -0
  21. data/lib/sunspot/dsl/scope.rb +193 -0
  22. data/lib/sunspot/dsl/search.rb +30 -0
  23. data/lib/sunspot/facet.rb +16 -0
  24. data/lib/sunspot/facet_data.rb +120 -0
  25. data/lib/sunspot/facet_row.rb +10 -0
  26. data/lib/sunspot/field.rb +157 -0
  27. data/lib/sunspot/field_factory.rb +126 -0
  28. data/lib/sunspot/indexer.rb +123 -0
  29. data/lib/sunspot/instantiated_facet.rb +42 -0
  30. data/lib/sunspot/instantiated_facet_row.rb +22 -0
  31. data/lib/sunspot/query.rb +191 -0
  32. data/lib/sunspot/query/base_query.rb +90 -0
  33. data/lib/sunspot/query/connective.rb +126 -0
  34. data/lib/sunspot/query/dynamic_query.rb +69 -0
  35. data/lib/sunspot/query/field_facet.rb +151 -0
  36. data/lib/sunspot/query/field_query.rb +63 -0
  37. data/lib/sunspot/query/pagination.rb +39 -0
  38. data/lib/sunspot/query/query_facet.rb +73 -0
  39. data/lib/sunspot/query/query_facet_row.rb +19 -0
  40. data/lib/sunspot/query/query_field_facet.rb +13 -0
  41. data/lib/sunspot/query/restriction.rb +233 -0
  42. data/lib/sunspot/query/scope.rb +165 -0
  43. data/lib/sunspot/query/sort.rb +36 -0
  44. data/lib/sunspot/query/sort_composite.rb +33 -0
  45. data/lib/sunspot/schema.rb +165 -0
  46. data/lib/sunspot/search.rb +219 -0
  47. data/lib/sunspot/search/hit.rb +66 -0
  48. data/lib/sunspot/session.rb +201 -0
  49. data/lib/sunspot/setup.rb +271 -0
  50. data/lib/sunspot/type.rb +200 -0
  51. data/lib/sunspot/util.rb +164 -0
  52. data/solr/etc/jetty.xml +212 -0
  53. data/solr/etc/webdefault.xml +379 -0
  54. data/solr/lib/jetty-6.1.3.jar +0 -0
  55. data/solr/lib/jetty-util-6.1.3.jar +0 -0
  56. data/solr/lib/jsp-2.1/ant-1.6.5.jar +0 -0
  57. data/solr/lib/jsp-2.1/core-3.1.1.jar +0 -0
  58. data/solr/lib/jsp-2.1/jsp-2.1.jar +0 -0
  59. data/solr/lib/jsp-2.1/jsp-api-2.1.jar +0 -0
  60. data/solr/lib/servlet-api-2.5-6.1.3.jar +0 -0
  61. data/solr/solr/conf/elevate.xml +36 -0
  62. data/solr/solr/conf/protwords.txt +21 -0
  63. data/solr/solr/conf/schema.xml +50 -0
  64. data/solr/solr/conf/solrconfig.xml +696 -0
  65. data/solr/solr/conf/stopwords.txt +57 -0
  66. data/solr/solr/conf/synonyms.txt +31 -0
  67. data/solr/start.jar +0 -0
  68. data/solr/webapps/solr.war +0 -0
  69. data/spec/api/adapters_spec.rb +33 -0
  70. data/spec/api/build_search_spec.rb +1039 -0
  71. data/spec/api/indexer_spec.rb +311 -0
  72. data/spec/api/query_spec.rb +153 -0
  73. data/spec/api/search_retrieval_spec.rb +362 -0
  74. data/spec/api/session_spec.rb +157 -0
  75. data/spec/api/spec_helper.rb +1 -0
  76. data/spec/api/sunspot_spec.rb +18 -0
  77. data/spec/integration/dynamic_fields_spec.rb +55 -0
  78. data/spec/integration/faceting_spec.rb +169 -0
  79. data/spec/integration/keyword_search_spec.rb +83 -0
  80. data/spec/integration/scoped_search_spec.rb +289 -0
  81. data/spec/integration/spec_helper.rb +1 -0
  82. data/spec/integration/stored_fields_spec.rb +10 -0
  83. data/spec/integration/test_pagination.rb +32 -0
  84. data/spec/mocks/adapters.rb +32 -0
  85. data/spec/mocks/blog.rb +3 -0
  86. data/spec/mocks/comment.rb +19 -0
  87. data/spec/mocks/connection.rb +84 -0
  88. data/spec/mocks/mock_adapter.rb +30 -0
  89. data/spec/mocks/mock_record.rb +48 -0
  90. data/spec/mocks/photo.rb +8 -0
  91. data/spec/mocks/post.rb +73 -0
  92. data/spec/mocks/user.rb +8 -0
  93. data/spec/spec_helper.rb +47 -0
  94. data/tasks/gemspec.rake +25 -0
  95. data/tasks/rcov.rake +28 -0
  96. data/tasks/rdoc.rake +22 -0
  97. data/tasks/schema.rake +19 -0
  98. data/tasks/spec.rake +24 -0
  99. data/tasks/todo.rake +4 -0
  100. data/templates/schema.xml.haml +24 -0
  101. metadata +246 -0
@@ -0,0 +1,265 @@
1
+ module Sunspot
2
+ #
3
+ # Sunspot works by saving references to the primary key (or natural ID) of
4
+ # each indexed object, and then retrieving the objects from persistent storage
5
+ # when their IDs are referenced in search results. In order for Sunspot to
6
+ # know what an object's primary key is, and how to retrieve objects from
7
+ # persistent storage given a primary key, an adapter must be registered for
8
+ # that object's class or one of its superclasses (for instance, an adapter
9
+ # registered for ActiveRecord::Base would be used for all ActiveRecord
10
+ # models).
11
+ #
12
+ # To provide Sunspot with this ability, adapters must have two roles:
13
+ #
14
+ # Data accessor::
15
+ # A subclass of Sunspot::Adapters::DataAccessor, this object is instantiated
16
+ # with a particular class and must respond to the #load() method, which
17
+ # returns an object from persistent storage given that object's primary key.
18
+ # It can also optionally implement the #load_all() method, which returns
19
+ # a collection of objects given a collection of primary keys, if that can be
20
+ # done more efficiently than calling #load() on each key.
21
+ # Instance adapter::
22
+ # A subclass of Sunspot::Adapters::InstanceAdapter, this object is
23
+ # instantiated with a particular instance. Its only job is to tell Sunspot
24
+ # what the object's primary key is, by implementing the #id() method.
25
+ #
26
+ # Adapters are registered by registering their two components, telling Sunspot
27
+ # that they are available for one or more classes, and all of their
28
+ # subclasses. See Sunspot::Adapters::DataAccessor.register and
29
+ # Sunspot::Adapters::InstanceAdapter.register for the details.
30
+ #
31
+ # See spec/mocks/mock_adapter.rb for an example of how adapter classes should
32
+ # be implemented.
33
+ #
34
+ module Adapters
35
+ # Subclasses of the InstanceAdapter class should implement the #id method,
36
+ # which returns the primary key of the instance stored in the @instance
37
+ # variable. The primary key must be unique within the scope of the
38
+ # instance's class.
39
+ #
40
+ # ==== Example:
41
+ #
42
+ # class FileAdapter < Sunspot::Adapters::InstanceAdapter
43
+ # def id
44
+ # File.expand_path(@instance.path)
45
+ # end
46
+ # end
47
+ #
48
+ # # then in your initializer
49
+ # Sunspot::Adapters::InstanceAdapter.register(MyAdapter, File)
50
+ #
51
+ class InstanceAdapter
52
+ def initialize(instance) #:nodoc:
53
+ @instance = instance
54
+ end
55
+
56
+ #
57
+ # The universally-unique ID for this instance that will be stored in solr
58
+ #
59
+ # ==== Returns
60
+ #
61
+ # String:: ID for use in Solr
62
+ #
63
+ def index_id #:nodoc:
64
+ InstanceAdapter.index_id_for(@instance.class.name, id)
65
+ end
66
+
67
+ class <<self
68
+ # Instantiate an InstanceAdapter for the given object, searching for
69
+ # registered adapters for the object's class.
70
+ #
71
+ # ==== Parameters
72
+ #
73
+ # instance<Object>:: The instance to adapt
74
+ #
75
+ # ==== Returns
76
+ #
77
+ # InstanceAdapter::
78
+ # An instance of an InstanceAdapter implementation that
79
+ # wraps the given instance
80
+ #
81
+ def adapt(instance) #:nodoc:
82
+ self.for(instance.class).new(instance)
83
+ end
84
+
85
+ # Register an instance adapter for a set of classes. When searching for
86
+ # an adapter for a given instance, Sunspot starts with the instance's
87
+ # class, and then searches for registered adapters up the class's
88
+ # ancestor chain.
89
+ #
90
+ # ==== Parameters
91
+ #
92
+ # instance_adapter<Class>:: The instance adapter class to register
93
+ # classes...<Class>::
94
+ # One or more classes that this instance adapter adapts
95
+ #
96
+ def register(instance_adapter, *classes)
97
+ for clazz in classes
98
+ instance_adapters[clazz.name.to_sym] = instance_adapter
99
+ end
100
+ end
101
+
102
+ # Find the best InstanceAdapter implementation that adapts the given
103
+ # class. Starting with the class and then moving up the ancestor chain,
104
+ # looks for registered InstanceAdapter implementations.
105
+ #
106
+ # ==== Parameters
107
+ #
108
+ # clazz<Class>:: The class to find an InstanceAdapter for
109
+ #
110
+ # ==== Returns
111
+ #
112
+ # Class:: Subclass of InstanceAdapter, or nil if none found
113
+ #
114
+ # ==== Raises
115
+ #
116
+ # Sunspot::NoAdapterError:: If no adapter is registered for this class
117
+ #
118
+ def for(clazz) #:nodoc:
119
+ original_class_name = clazz.name
120
+ clazz.ancestors.each do |ancestor_class|
121
+ next if ancestor_class.name.nil? || ancestor_class.name.empty?
122
+ class_name = ancestor_class.name.to_sym
123
+ return instance_adapters[class_name] if instance_adapters[class_name]
124
+ end
125
+
126
+ raise(Sunspot::NoAdapterError,
127
+ "No adapter is configured for #{original_class_name} or its superclasses. See the documentation for Sunspot::Adapters")
128
+ end
129
+
130
+ def index_id_for(class_name, id)
131
+ "#{class_name} #{id}"
132
+ end
133
+
134
+ protected
135
+
136
+ # Lazy-initialize the hash of registered instance adapters
137
+ #
138
+ # ==== Returns
139
+ #
140
+ # Hash:: Hash containing class names keyed to instance adapter classes
141
+ #
142
+ def instance_adapters #:nodoc:
143
+ @instance_adapters ||= {}
144
+ end
145
+ end
146
+ end
147
+
148
+ # Subclasses of the DataAccessor class take care of retreiving instances of
149
+ # the adapted class from (usually persistent) storage. Subclasses must
150
+ # implement the #load method, which takes an id (the value returned by
151
+ # InstanceAdapter#id, as a string), and returns the instance referenced by
152
+ # that ID. Optionally, it can also override the #load_all method, which
153
+ # takes an array of IDs and returns an array of instances in the order
154
+ # given. #load_all need only be implemented if it can be done more
155
+ # efficiently than simply iterating over the IDs and calling #load on each
156
+ # individually.
157
+ #
158
+ # ==== Example
159
+ #
160
+ # class FileAccessor < Sunspot::Adapters::InstanceAdapter
161
+ # def load(id)
162
+ # @clazz.open(id)
163
+ # end
164
+ # end
165
+ #
166
+ # Sunspot::Adapters::DataAccessor.register(FileAccessor, File)
167
+ #
168
+ class DataAccessor
169
+ def initialize(clazz) #:nodoc:
170
+ @clazz = clazz
171
+ end
172
+
173
+ # Subclasses can override this class to provide more efficient bulk
174
+ # loading of instances. Instances must be returned in the same order
175
+ # that the IDs were given.
176
+ #
177
+ # ==== Parameters
178
+ #
179
+ # ids<Array>:: collection of IDs
180
+ #
181
+ # ==== Returns
182
+ #
183
+ # Array:: collection of instances, in order of IDs given
184
+ #
185
+ def load_all(ids)
186
+ ids.map { |id| self.load(id) }
187
+ end
188
+
189
+ class <<self
190
+ # Create a DataAccessor for the given class, searching registered
191
+ # adapters for the best match. See InstanceAdapter#adapt for discussion
192
+ # of inheritence.
193
+ #
194
+ # ==== Parameters
195
+ #
196
+ # clazz<Class>:: Class to create DataAccessor for
197
+ #
198
+ # ==== Returns
199
+ #
200
+ # DataAccessor::
201
+ # DataAccessor implementation which provides access to given class
202
+ #
203
+ def create(clazz) #:nodoc:
204
+ self.for(clazz).new(clazz)
205
+ end
206
+
207
+ # Register data accessor for a set of classes. When searching for
208
+ # an accessor for a given class, Sunspot starts with the class,
209
+ # and then searches for registered adapters up the class's ancestor
210
+ # chain.
211
+ #
212
+ # ==== Parameters
213
+ #
214
+ # data_accessor<Class>:: The data accessor class to register
215
+ # classes...<Class>::
216
+ # One or more classes that this data accessor providess access to
217
+ #
218
+ def register(data_accessor, *classes)
219
+ for clazz in classes
220
+ data_accessors[clazz.name.to_sym] = data_accessor
221
+ end
222
+ end
223
+
224
+ # Find the best DataAccessor implementation that adapts the given class.
225
+ # Starting with the class and then moving up the ancestor chain, looks
226
+ # for registered DataAccessor implementations.
227
+ #
228
+ # ==== Parameters
229
+ #
230
+ # clazz<Class>:: The class to find a DataAccessor for
231
+ #
232
+ # ==== Returns
233
+ #
234
+ # Class:: Implementation of DataAccessor
235
+ #
236
+ # ==== Raises
237
+ #
238
+ # Sunspot::NoAdapterError:: If no data accessor exists for the given class
239
+ #
240
+ def for(clazz) #:nodoc:
241
+ original_class_name = clazz.name
242
+ clazz.ancestors.each do |ancestor_class|
243
+ next if ancestor_class.name.nil? || ancestor_class.name.empty?
244
+ class_name = ancestor_class.name.to_sym
245
+ return data_accessors[class_name] if data_accessors[class_name]
246
+ end
247
+ raise(Sunspot::NoAdapterError,
248
+ "No data accessor is configured for #{original_class_name} or its superclasses. See the documentation for Sunspot::Adapters")
249
+ end
250
+
251
+ protected
252
+
253
+ # Lazy-initialize the hash of registered data accessors
254
+ #
255
+ # ==== Returns
256
+ #
257
+ # Hash:: Hash containing class names keyed to data accessor classes
258
+ #
259
+ def data_accessors #:nodoc:
260
+ @adapters ||= {}
261
+ end
262
+ end
263
+ end
264
+ end
265
+ end
@@ -0,0 +1,186 @@
1
+ module Sunspot
2
+ #
3
+ # The CompositeSetup class encapsulates a collection of setups, and responds
4
+ # to a subset of the methods that Setup responds to (in particular, the
5
+ # methods required to build queries).
6
+ #
7
+ class CompositeSetup #:nodoc:
8
+ class << self
9
+ alias_method :for, :new
10
+ end
11
+
12
+ def initialize(types)
13
+ @types = types
14
+ end
15
+
16
+ #
17
+ # Collection of Setup objects for the enclosed types
18
+ #
19
+ # ==== Returns
20
+ #
21
+ # Array:: Collection of Setup objects
22
+ #
23
+ def setups
24
+ @setups ||= @types.map { |type| Setup.for(type) }
25
+ end
26
+
27
+ #
28
+ # Return the names of the encapsulated types
29
+ #
30
+ # ==== Returns
31
+ #
32
+ # Array:: Collection of class names
33
+ #
34
+ def type_names
35
+ @type_names ||= @types.map { |clazz| clazz.name }
36
+ end
37
+
38
+ #
39
+ # Get a text field object by its public name. A field will be returned if
40
+ # it is configured for any of the enclosed types.
41
+ #
42
+ # ==== Returns
43
+ #
44
+ # Sunspot::FulltextField:: Text field with the given public name
45
+ #
46
+ # ==== Raises
47
+ #
48
+ # UnrecognizedFieldError::
49
+ # If no field with that name is configured for any of the enclosed types.
50
+ #
51
+ def text_field(field_name)
52
+ text_fields_hash[field_name.to_sym] || raise(
53
+ UnrecognizedFieldError,
54
+ "No text field configured for #{@types * ', '} with name '#{field_name}'"
55
+ )
56
+ end
57
+
58
+ #
59
+ # Get a Sunspot::AttributeField instance corresponding to the given field name
60
+ #
61
+ # ==== Parameters
62
+ #
63
+ # field_name<Symbol>:: The public field name for which to find a field
64
+ #
65
+ # ==== Returns
66
+ #
67
+ # Sunspot::AttributeField The field object corresponding to the given name
68
+ #
69
+ # ==== Raises
70
+ #
71
+ # ArgumentError::
72
+ # If the given field name is not configured for the types being queried
73
+ #
74
+ def field(field_name) #:nodoc:
75
+ fields_hash[field_name.to_sym] || raise(
76
+ UnrecognizedFieldError,
77
+ "No field configured for #{@types * ', '} with name '#{field_name}'"
78
+ )
79
+ end
80
+
81
+ #
82
+ # Get a dynamic field factory for the given base name.
83
+ #
84
+ # ==== Returns
85
+ #
86
+ # DynamicFieldFactory:: Factory for dynamic fields with the given base name
87
+ #
88
+ # ==== Raises
89
+ #
90
+ # UnrecognizedFieldError::
91
+ # If the given base name is not configured as a dynamic field for the types being queried
92
+ #
93
+ def dynamic_field_factory(field_name)
94
+ dynamic_field_factories_hash[field_name.to_sym] || raise(
95
+ UnrecognizedFieldError,
96
+ "No dynamic field configured for #{@types * ', '} with name #{field_name.inspect}"
97
+ )
98
+ end
99
+
100
+ #
101
+ # Collection of all text fields configured for any of the enclosed types.
102
+ #
103
+ # === Returns
104
+ #
105
+ # Array:: Text fields configured for the enclosed types
106
+ #
107
+ def text_fields
108
+ @text_fields ||= text_fields_hash.values
109
+ end
110
+
111
+ private
112
+
113
+ #
114
+ # Return a hash of field names to text field objects, containing all fields
115
+ # that are configured for any of the types enclosed.
116
+ #
117
+ # ==== Returns
118
+ #
119
+ # Hash:: Hash of field names to text field objects.
120
+ #
121
+ def text_fields_hash
122
+ @text_fields_hash ||=
123
+ setups.inject({}) do |hash, setup|
124
+ setup.text_fields.each do |text_field|
125
+ hash[text_field.name] ||= text_field
126
+ end
127
+ hash
128
+ end
129
+ end
130
+
131
+ #
132
+ # Return a hash of field names to field objects, containing all fields
133
+ # that are common to all of the classes enclosed. In order for fields
134
+ # to be common, they must be of the same type and have the same
135
+ # value for allow_multiple? and stored?. This method is memoized.
136
+ #
137
+ # ==== Returns
138
+ #
139
+ # Hash:: field names keyed to field objects
140
+ #
141
+ def fields_hash
142
+ @fields_hash ||=
143
+ begin
144
+ fields_hash = @types.inject({}) do |hash, type|
145
+ Setup.for(type).fields.each do |field|
146
+ (hash[field.name.to_sym] ||= {})[type.name] = field
147
+ end
148
+ hash
149
+ end
150
+ fields_hash.each_pair do |field_name, field_configurations_hash|
151
+ if @types.any? { |type| field_configurations_hash[type.name].nil? } # at least one type doesn't have this field configured
152
+ fields_hash.delete(field_name)
153
+ elsif field_configurations_hash.values.map { |configuration| configuration.indexed_name }.uniq.length != 1 # fields with this name have different configs
154
+ fields_hash.delete(field_name)
155
+ else
156
+ fields_hash[field_name] = field_configurations_hash.values.first
157
+ end
158
+ end
159
+ end
160
+ end
161
+
162
+ #
163
+ # Return a hash of dynamic field base names to dynamic field factories for
164
+ # those base names. Criteria for the inclusion are the same as for
165
+ # #fields_hash()
166
+ #
167
+ def dynamic_field_factories_hash
168
+ @dynamic_field_factories_hash ||=
169
+ begin
170
+ dynamic_field_factories_hash = @types.inject({}) do |hash, type|
171
+ Setup.for(type).dynamic_field_factories.each do |field_factory|
172
+ (hash[field_factory.name.to_sym] ||= {})[type.name] = field_factory
173
+ end
174
+ hash
175
+ end
176
+ dynamic_field_factories_hash.each_pair do |field_name, field_configurations_hash|
177
+ if @types.any? { |type| field_configurations_hash[type.name].nil? }
178
+ dynamic_field_factories_hash.delete(field_name)
179
+ else
180
+ dynamic_field_factories_hash[field_name] = field_configurations_hash.values.first
181
+ end
182
+ end
183
+ end
184
+ end
185
+ end
186
+ end