erichummel-sunspot 1.2.1a

Sign up to get free protection for your applications and to get access to all the features.
Files changed (185) hide show
  1. data/Gemfile +10 -0
  2. data/Gemfile.lock +32 -0
  3. data/History.txt +222 -0
  4. data/LICENSE +18 -0
  5. data/Rakefile +11 -0
  6. data/TODO +13 -0
  7. data/VERSION.yml +4 -0
  8. data/bin/sunspot-installer +19 -0
  9. data/bin/sunspot-solr +74 -0
  10. data/installer/config/schema.yml +95 -0
  11. data/lib/light_config.rb +40 -0
  12. data/lib/sunspot/adapters.rb +265 -0
  13. data/lib/sunspot/composite_setup.rb +202 -0
  14. data/lib/sunspot/configuration.rb +46 -0
  15. data/lib/sunspot/data_extractor.rb +50 -0
  16. data/lib/sunspot/dsl/adjustable.rb +47 -0
  17. data/lib/sunspot/dsl/field_query.rb +266 -0
  18. data/lib/sunspot/dsl/fields.rb +103 -0
  19. data/lib/sunspot/dsl/fulltext.rb +243 -0
  20. data/lib/sunspot/dsl/function.rb +14 -0
  21. data/lib/sunspot/dsl/functional.rb +41 -0
  22. data/lib/sunspot/dsl/more_like_this_query.rb +56 -0
  23. data/lib/sunspot/dsl/paginatable.rb +28 -0
  24. data/lib/sunspot/dsl/query_facet.rb +36 -0
  25. data/lib/sunspot/dsl/restriction.rb +25 -0
  26. data/lib/sunspot/dsl/restriction_with_near.rb +121 -0
  27. data/lib/sunspot/dsl/scope.rb +217 -0
  28. data/lib/sunspot/dsl/search.rb +30 -0
  29. data/lib/sunspot/dsl/standard_query.rb +121 -0
  30. data/lib/sunspot/dsl.rb +5 -0
  31. data/lib/sunspot/field.rb +193 -0
  32. data/lib/sunspot/field_factory.rb +129 -0
  33. data/lib/sunspot/indexer.rb +131 -0
  34. data/lib/sunspot/installer/library_installer.rb +45 -0
  35. data/lib/sunspot/installer/schema_builder.rb +219 -0
  36. data/lib/sunspot/installer/solrconfig_updater.rb +76 -0
  37. data/lib/sunspot/installer/task_helper.rb +18 -0
  38. data/lib/sunspot/installer.rb +31 -0
  39. data/lib/sunspot/query/abstract_field_facet.rb +52 -0
  40. data/lib/sunspot/query/boost_query.rb +24 -0
  41. data/lib/sunspot/query/common_query.rb +85 -0
  42. data/lib/sunspot/query/composite_fulltext.rb +36 -0
  43. data/lib/sunspot/query/connective.rb +206 -0
  44. data/lib/sunspot/query/date_field_facet.rb +14 -0
  45. data/lib/sunspot/query/dismax.rb +128 -0
  46. data/lib/sunspot/query/field_facet.rb +41 -0
  47. data/lib/sunspot/query/filter.rb +38 -0
  48. data/lib/sunspot/query/function_query.rb +52 -0
  49. data/lib/sunspot/query/geo.rb +53 -0
  50. data/lib/sunspot/query/highlighting.rb +55 -0
  51. data/lib/sunspot/query/more_like_this.rb +61 -0
  52. data/lib/sunspot/query/more_like_this_query.rb +12 -0
  53. data/lib/sunspot/query/pagination.rb +38 -0
  54. data/lib/sunspot/query/query_facet.rb +16 -0
  55. data/lib/sunspot/query/restriction.rb +262 -0
  56. data/lib/sunspot/query/scope.rb +9 -0
  57. data/lib/sunspot/query/sort.rb +95 -0
  58. data/lib/sunspot/query/sort_composite.rb +33 -0
  59. data/lib/sunspot/query/standard_query.rb +16 -0
  60. data/lib/sunspot/query/text_field_boost.rb +17 -0
  61. data/lib/sunspot/query.rb +11 -0
  62. data/lib/sunspot/schema.rb +151 -0
  63. data/lib/sunspot/search/abstract_search.rb +296 -0
  64. data/lib/sunspot/search/date_facet.rb +35 -0
  65. data/lib/sunspot/search/facet_row.rb +27 -0
  66. data/lib/sunspot/search/field_facet.rb +88 -0
  67. data/lib/sunspot/search/highlight.rb +38 -0
  68. data/lib/sunspot/search/hit.rb +136 -0
  69. data/lib/sunspot/search/more_like_this_search.rb +31 -0
  70. data/lib/sunspot/search/query_facet.rb +67 -0
  71. data/lib/sunspot/search/standard_search.rb +21 -0
  72. data/lib/sunspot/search.rb +9 -0
  73. data/lib/sunspot/server.rb +152 -0
  74. data/lib/sunspot/session.rb +260 -0
  75. data/lib/sunspot/session_proxy/abstract_session_proxy.rb +29 -0
  76. data/lib/sunspot/session_proxy/class_sharding_session_proxy.rb +66 -0
  77. data/lib/sunspot/session_proxy/id_sharding_session_proxy.rb +89 -0
  78. data/lib/sunspot/session_proxy/master_slave_session_proxy.rb +43 -0
  79. data/lib/sunspot/session_proxy/sharding_session_proxy.rb +222 -0
  80. data/lib/sunspot/session_proxy/silent_fail_session_proxy.rb +42 -0
  81. data/lib/sunspot/session_proxy/thread_local_session_proxy.rb +37 -0
  82. data/lib/sunspot/session_proxy.rb +87 -0
  83. data/lib/sunspot/setup.rb +350 -0
  84. data/lib/sunspot/text_field_setup.rb +29 -0
  85. data/lib/sunspot/type.rb +372 -0
  86. data/lib/sunspot/util.rb +243 -0
  87. data/lib/sunspot/version.rb +3 -0
  88. data/lib/sunspot.rb +569 -0
  89. data/solr/etc/jetty.xml +214 -0
  90. data/solr/etc/webdefault.xml +379 -0
  91. data/solr/lib/jetty-6.1.3.jar +0 -0
  92. data/solr/lib/jetty-util-6.1.3.jar +0 -0
  93. data/solr/lib/jsp-2.1/ant-1.6.5.jar +0 -0
  94. data/solr/lib/jsp-2.1/core-3.1.1.jar +0 -0
  95. data/solr/lib/jsp-2.1/jsp-2.1.jar +0 -0
  96. data/solr/lib/jsp-2.1/jsp-api-2.1.jar +0 -0
  97. data/solr/lib/servlet-api-2.5-6.1.3.jar +0 -0
  98. data/solr/solr/conf/admin-extra.html +31 -0
  99. data/solr/solr/conf/elevate.xml +36 -0
  100. data/solr/solr/conf/mapping-ISOLatin1Accent.txt +246 -0
  101. data/solr/solr/conf/protwords.txt +21 -0
  102. data/solr/solr/conf/schema.xml +238 -0
  103. data/solr/solr/conf/scripts.conf +24 -0
  104. data/solr/solr/conf/solrconfig.xml +934 -0
  105. data/solr/solr/conf/spellings.txt +2 -0
  106. data/solr/solr/conf/stopwords.txt +58 -0
  107. data/solr/solr/conf/synonyms.txt +31 -0
  108. data/solr/start.jar +0 -0
  109. data/solr/webapps/solr.war +0 -0
  110. data/spec/api/adapters_spec.rb +33 -0
  111. data/spec/api/binding_spec.rb +50 -0
  112. data/spec/api/indexer/attributes_spec.rb +149 -0
  113. data/spec/api/indexer/batch_spec.rb +46 -0
  114. data/spec/api/indexer/dynamic_fields_spec.rb +42 -0
  115. data/spec/api/indexer/fixed_fields_spec.rb +57 -0
  116. data/spec/api/indexer/fulltext_spec.rb +43 -0
  117. data/spec/api/indexer/removal_spec.rb +53 -0
  118. data/spec/api/indexer/spec_helper.rb +1 -0
  119. data/spec/api/indexer_spec.rb +14 -0
  120. data/spec/api/query/advanced_manipulation_examples.rb +35 -0
  121. data/spec/api/query/connectives_examples.rb +189 -0
  122. data/spec/api/query/dsl_spec.rb +18 -0
  123. data/spec/api/query/dynamic_fields_examples.rb +165 -0
  124. data/spec/api/query/faceting_examples.rb +399 -0
  125. data/spec/api/query/fulltext_examples.rb +315 -0
  126. data/spec/api/query/function_spec.rb +70 -0
  127. data/spec/api/query/geo_examples.rb +69 -0
  128. data/spec/api/query/highlighting_examples.rb +225 -0
  129. data/spec/api/query/more_like_this_spec.rb +140 -0
  130. data/spec/api/query/ordering_pagination_examples.rb +97 -0
  131. data/spec/api/query/scope_examples.rb +275 -0
  132. data/spec/api/query/spec_helper.rb +1 -0
  133. data/spec/api/query/standard_spec.rb +28 -0
  134. data/spec/api/query/text_field_scoping_examples.rb +30 -0
  135. data/spec/api/query/types_spec.rb +20 -0
  136. data/spec/api/search/dynamic_fields_spec.rb +33 -0
  137. data/spec/api/search/faceting_spec.rb +360 -0
  138. data/spec/api/search/highlighting_spec.rb +69 -0
  139. data/spec/api/search/hits_spec.rb +140 -0
  140. data/spec/api/search/results_spec.rb +79 -0
  141. data/spec/api/search/search_spec.rb +23 -0
  142. data/spec/api/search/spec_helper.rb +1 -0
  143. data/spec/api/server_spec.rb +91 -0
  144. data/spec/api/session_proxy/class_sharding_session_proxy_spec.rb +85 -0
  145. data/spec/api/session_proxy/id_sharding_session_proxy_spec.rb +30 -0
  146. data/spec/api/session_proxy/master_slave_session_proxy_spec.rb +41 -0
  147. data/spec/api/session_proxy/sharding_session_proxy_spec.rb +77 -0
  148. data/spec/api/session_proxy/silent_fail_session_proxy_spec.rb +24 -0
  149. data/spec/api/session_proxy/spec_helper.rb +9 -0
  150. data/spec/api/session_proxy/thread_local_session_proxy_spec.rb +50 -0
  151. data/spec/api/session_spec.rb +220 -0
  152. data/spec/api/spec_helper.rb +3 -0
  153. data/spec/api/sunspot_spec.rb +18 -0
  154. data/spec/ext.rb +11 -0
  155. data/spec/helpers/indexer_helper.rb +29 -0
  156. data/spec/helpers/query_helper.rb +38 -0
  157. data/spec/helpers/search_helper.rb +80 -0
  158. data/spec/integration/dynamic_fields_spec.rb +55 -0
  159. data/spec/integration/faceting_spec.rb +238 -0
  160. data/spec/integration/highlighting_spec.rb +22 -0
  161. data/spec/integration/indexing_spec.rb +33 -0
  162. data/spec/integration/keyword_search_spec.rb +317 -0
  163. data/spec/integration/local_search_spec.rb +64 -0
  164. data/spec/integration/more_like_this_spec.rb +43 -0
  165. data/spec/integration/scoped_search_spec.rb +354 -0
  166. data/spec/integration/spec_helper.rb +7 -0
  167. data/spec/integration/stored_fields_spec.rb +10 -0
  168. data/spec/integration/test_pagination.rb +32 -0
  169. data/spec/mocks/adapters.rb +32 -0
  170. data/spec/mocks/blog.rb +3 -0
  171. data/spec/mocks/comment.rb +21 -0
  172. data/spec/mocks/connection.rb +126 -0
  173. data/spec/mocks/mock_adapter.rb +30 -0
  174. data/spec/mocks/mock_class_sharding_session_proxy.rb +24 -0
  175. data/spec/mocks/mock_record.rb +52 -0
  176. data/spec/mocks/mock_sharding_session_proxy.rb +15 -0
  177. data/spec/mocks/photo.rb +11 -0
  178. data/spec/mocks/post.rb +85 -0
  179. data/spec/mocks/super_class.rb +2 -0
  180. data/spec/mocks/user.rb +13 -0
  181. data/spec/spec_helper.rb +42 -0
  182. data/tasks/rdoc.rake +27 -0
  183. data/tasks/schema.rake +19 -0
  184. data/tasks/todo.rake +4 -0
  185. metadata +342 -0
@@ -0,0 +1,934 @@
1
+ <?xml version="1.0" encoding="UTF-8"?>
2
+ <!--
3
+ Licensed to the Apache Software Foundation (ASF) under one or more
4
+ contributor license agreements. See the NOTICE file distributed with
5
+ this work for additional information regarding copyright ownership.
6
+ The ASF licenses this file to You under the Apache License, Version 2.0
7
+ (the "License"); you may not use this file except in compliance with
8
+ the License. You may obtain a copy of the License at
9
+
10
+ http://www.apache.org/licenses/LICENSE-2.0
11
+
12
+ Unless required by applicable law or agreed to in writing, software
13
+ distributed under the License is distributed on an "AS IS" BASIS,
14
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
15
+ See the License for the specific language governing permissions and
16
+ limitations under the License.
17
+ -->
18
+ <!--
19
+ For more details about configurations options that may appear in this
20
+ file, see http://wiki.apache.org/solr/SolrConfigXml.
21
+
22
+ Specifically, the Solr Config can support XInclude, which may make it easier to manage
23
+ the configuration. See https://issues.apache.org/jira/browse/SOLR-1167
24
+ -->
25
+ <config>
26
+ <!-- Set this to 'false' if you want solr to continue working after it has
27
+ encountered a severe configuration error. In a production environment,
28
+ you may want solr to keep working even if one handler is mis-configured.
29
+
30
+ You may also set this to false by setting the system property:
31
+ -Dsolr.abortOnConfigurationError=false
32
+ -->
33
+ <abortOnConfigurationError>${solr.abortOnConfigurationError:true}</abortOnConfigurationError>
34
+ <!-- lib directives can be used to instruct Solr to load any Jars identified
35
+ and use them to resolve any "plugins" specified in your solrconfig.xml or
36
+ schema.xml (ie: Analyzers, Request Handlers, etc...).
37
+
38
+ All directories and paths are resolved relative to the instanceDir.
39
+
40
+ If a "./lib" directory exists in your instanceDir, all files found in it
41
+ are included as if you had used the following syntax...
42
+
43
+ <lib dir="./lib" />
44
+ -->
45
+ <!-- A dir option by itself adds any files found in the directory to the
46
+ classpath, this is useful for including all jars in a directory.
47
+ -->
48
+ <lib dir="../../contrib/extraction/lib"/>
49
+ <!-- When a regex is specified in addition to a directory, only the files in that
50
+ directory which completely match the regex (anchored on both ends)
51
+ will be included.
52
+ -->
53
+ <lib dir="../../dist/" regex="apache-solr-cell-\d.*\.jar"/>
54
+ <lib dir="../../dist/" regex="apache-solr-clustering-\d.*\.jar"/>
55
+ <!-- If a dir option (with or without a regex) is used and nothing is found
56
+ that matches, it will be ignored
57
+ -->
58
+ <lib dir="../../contrib/clustering/lib/downloads/"/>
59
+ <lib dir="../../contrib/clustering/lib/"/>
60
+ <lib dir="/total/crap/dir/ignored"/>
61
+ <!-- an exact path can be used to specify a specific file. This will cause
62
+ a serious error to be logged if it can't be loaded.
63
+ <lib path="../a-jar-that-does-not-exist.jar" />
64
+ -->
65
+ <!-- Used to specify an alternate directory to hold all index data
66
+ other than the default ./data under the Solr home.
67
+ If replication is in use, this should match the replication configuration. -->
68
+ <dataDir>${solr.data.dir:./solr/data}</dataDir>
69
+ <!-- WARNING: this <indexDefaults> section only provides defaults for index writers
70
+ in general. See also the <mainIndex> section after that when changing parameters
71
+ for Solr's main Lucene index. -->
72
+ <indexDefaults>
73
+ <!-- Values here affect all index writers and act as a default unless overridden. -->
74
+ <useCompoundFile>false</useCompoundFile>
75
+ <mergeFactor>10</mergeFactor>
76
+ <!-- If both ramBufferSizeMB and maxBufferedDocs are set, then Lucene will flush
77
+ based on whichever limit is hit first. -->
78
+ <!--<maxBufferedDocs>1000</maxBufferedDocs>-->
79
+ <!-- Sets the amount of RAM that may be used by Lucene indexing
80
+ for buffering added documents and deletions before they are
81
+ flushed to the Directory. -->
82
+ <ramBufferSizeMB>32</ramBufferSizeMB>
83
+ <!-- <maxMergeDocs>2147483647</maxMergeDocs> -->
84
+ <maxFieldLength>10000</maxFieldLength>
85
+ <writeLockTimeout>1000</writeLockTimeout>
86
+ <commitLockTimeout>10000</commitLockTimeout>
87
+ <!--
88
+ Expert: Turn on Lucene's auto commit capability. This causes intermediate
89
+ segment flushes to write a new lucene index descriptor, enabling it to be
90
+ opened by an external IndexReader. This can greatly slow down indexing
91
+ speed. NOTE: Despite the name, this value does not have any relation to
92
+ Solr's autoCommit functionality
93
+ -->
94
+ <!--<luceneAutoCommit>false</luceneAutoCommit>-->
95
+ <!--
96
+ Expert: The Merge Policy in Lucene controls how merging is handled by
97
+ Lucene. The default in 2.3 is the LogByteSizeMergePolicy, previous
98
+ versions used LogDocMergePolicy.
99
+
100
+ LogByteSizeMergePolicy chooses segments to merge based on their size. The
101
+ Lucene 2.2 default, LogDocMergePolicy chose when to merge based on number
102
+ of documents
103
+
104
+ Other implementations of MergePolicy must have a no-argument constructor
105
+ -->
106
+ <!--<mergePolicy class="org.apache.lucene.index.LogByteSizeMergePolicy"/>-->
107
+ <!--
108
+ Expert:
109
+ The Merge Scheduler in Lucene controls how merges are performed. The
110
+ ConcurrentMergeScheduler (Lucene 2.3 default) can perform merges in the
111
+ background using separate threads. The SerialMergeScheduler (Lucene 2.2
112
+ default) does not.
113
+ -->
114
+ <!--<mergeScheduler class="org.apache.lucene.index.ConcurrentMergeScheduler"/>-->
115
+ <!--
116
+ This option specifies which Lucene LockFactory implementation to use.
117
+
118
+ single = SingleInstanceLockFactory - suggested for a read-only index
119
+ or when there is no possibility of another process trying
120
+ to modify the index.
121
+ native = NativeFSLockFactory - uses OS native file locking
122
+ simple = SimpleFSLockFactory - uses a plain file for locking
123
+
124
+ (For backwards compatibility with Solr 1.2, 'simple' is the default
125
+ if not specified.)
126
+ -->
127
+ <lockType>native</lockType>
128
+ <!--
129
+ Expert:
130
+ Controls how often Lucene loads terms into memory -->
131
+ <!--<termIndexInterval>256</termIndexInterval>-->
132
+ </indexDefaults>
133
+ <mainIndex>
134
+ <!-- options specific to the main on-disk lucene index -->
135
+ <useCompoundFile>false</useCompoundFile>
136
+ <ramBufferSizeMB>32</ramBufferSizeMB>
137
+ <mergeFactor>10</mergeFactor>
138
+ <!-- Deprecated -->
139
+ <!--<maxBufferedDocs>1000</maxBufferedDocs>-->
140
+ <!--<maxMergeDocs>2147483647</maxMergeDocs>-->
141
+ <!-- inherit from indexDefaults <maxFieldLength>10000</maxFieldLength> -->
142
+ <!-- If true, unlock any held write or commit locks on startup.
143
+ This defeats the locking mechanism that allows multiple
144
+ processes to safely access a lucene index, and should be
145
+ used with care.
146
+ This is not needed if lock type is 'none' or 'single'
147
+ -->
148
+ <unlockOnStartup>false</unlockOnStartup>
149
+ <!-- If true, IndexReaders will be reopened (often more efficient) instead
150
+ of closed and then opened. -->
151
+ <reopenReaders>true</reopenReaders>
152
+ <!--
153
+ Expert:
154
+ Controls how often Lucene loads terms into memory. Default is 128 and is likely good for most everyone. -->
155
+ <!--<termIndexInterval>256</termIndexInterval>-->
156
+ <!--
157
+ Custom deletion policies can be specified here. The class must
158
+ implement org.apache.lucene.index.IndexDeletionPolicy.
159
+
160
+ http://lucene.apache.org/java/2_3_2/api/org/apache/lucene/index/IndexDeletionPolicy.html
161
+
162
+ The standard Solr IndexDeletionPolicy implementation supports deleting
163
+ index commit points on number of commits, age of commit point and
164
+ optimized status.
165
+
166
+ The latest commit point should always be preserved regardless
167
+ of the criteria.
168
+ -->
169
+ <deletionPolicy class="solr.SolrDeletionPolicy">
170
+ <!-- The number of commit points to be kept -->
171
+ <str name="maxCommitsToKeep">1</str>
172
+ <!-- The number of optimized commit points to be kept -->
173
+ <str name="maxOptimizedCommitsToKeep">0</str>
174
+ <!--
175
+ Delete all commit points once they have reached the given age.
176
+ Supports DateMathParser syntax e.g.
177
+
178
+ <str name="maxCommitAge">30MINUTES</str>
179
+ <str name="maxCommitAge">1DAY</str>
180
+ -->
181
+ </deletionPolicy>
182
+ <!-- To aid in advanced debugging, you may turn on IndexWriter debug logging.
183
+ Setting to true will set the file that the underlying Lucene IndexWriter
184
+ will write its debug infostream to. -->
185
+ <infoStream file="INFOSTREAM.txt">false</infoStream>
186
+ </mainIndex>
187
+ <!-- Enables JMX if and only if an existing MBeanServer is found, use this
188
+ if you want to configure JMX through JVM parameters. Remove this to disable
189
+ exposing Solr configuration and statistics to JMX.
190
+
191
+ If you want to connect to a particular server, specify the agentId
192
+ e.g. <jmx agentId="myAgent" />
193
+
194
+ If you want to start a new MBeanServer, specify the serviceUrl
195
+ e.g <jmx serviceUrl="service:jmx:rmi:///jndi/rmi://localhost:9999/solr"/>
196
+
197
+ For more details see http://wiki.apache.org/solr/SolrJmx
198
+ -->
199
+ <jmx/>
200
+ <!-- the default high-performance update handler -->
201
+ <updateHandler class="solr.DirectUpdateHandler2">
202
+ <!-- A prefix of "solr." for class names is an alias that
203
+ causes solr to search appropriate packages, including
204
+ org.apache.solr.(search|update|request|core|analysis)
205
+ -->
206
+ <!-- Perform a <commit/> automatically under certain conditions:
207
+ maxDocs - number of updates since last commit is greater than this
208
+ maxTime - oldest uncommitted update (in ms) is this long ago
209
+ Instead of enabling autoCommit, consider using "commitWithin"
210
+ when adding documents. http://wiki.apache.org/solr/UpdateXmlMessages
211
+ <autoCommit>
212
+ <maxDocs>10000</maxDocs>
213
+ <maxTime>1000</maxTime>
214
+ </autoCommit>
215
+ -->
216
+ <!-- The RunExecutableListener executes an external command from a
217
+ hook such as postCommit or postOptimize.
218
+ exe - the name of the executable to run
219
+ dir - dir to use as the current working directory. default="."
220
+ wait - the calling thread waits until the executable returns. default="true"
221
+ args - the arguments to pass to the program. default=nothing
222
+ env - environment variables to set. default=nothing
223
+ -->
224
+ <!-- A postCommit event is fired after every commit or optimize command
225
+ <listener event="postCommit" class="solr.RunExecutableListener">
226
+ <str name="exe">solr/bin/snapshooter</str>
227
+ <str name="dir">.</str>
228
+ <bool name="wait">true</bool>
229
+ <arr name="args"> <str>arg1</str> <str>arg2</str> </arr>
230
+ <arr name="env"> <str>MYVAR=val1</str> </arr>
231
+ </listener>
232
+ -->
233
+ <!-- A postOptimize event is fired only after every optimize command
234
+ <listener event="postOptimize" class="solr.RunExecutableListener">
235
+ <str name="exe">snapshooter</str>
236
+ <str name="dir">solr/bin</str>
237
+ <bool name="wait">true</bool>
238
+ </listener>
239
+ -->
240
+ </updateHandler>
241
+ <!-- Use the following format to specify a custom IndexReaderFactory - allows for alternate
242
+ IndexReader implementations.
243
+
244
+ ** Experimental Feature **
245
+ Please note - Using a custom IndexReaderFactory may prevent certain other features
246
+ from working. The API to IndexReaderFactory may change without warning or may even
247
+ be removed from future releases if the problems cannot be resolved.
248
+
249
+ ** Features that may not work with custom IndexReaderFactory **
250
+ The ReplicationHandler assumes a disk-resident index. Using a custom
251
+ IndexReader implementation may cause incompatibility with ReplicationHandler and
252
+ may cause replication to not work correctly. See SOLR-1366 for details.
253
+
254
+ <indexReaderFactory name="IndexReaderFactory" class="package.class">
255
+ Parameters as required by the implementation
256
+ </indexReaderFactory >
257
+ -->
258
+ <!-- To set the termInfosIndexDivisor, do this: -->
259
+ <!--<indexReaderFactory name="IndexReaderFactory" class="org.apache.solr.core.StandardIndexReaderFactory">
260
+ <int name="termInfosIndexDivisor">12</int>
261
+ </indexReaderFactory >-->
262
+ <query>
263
+ <!-- Maximum number of clauses in a boolean query... in the past, this affected
264
+ range or prefix queries that expanded to big boolean queries - built in Solr
265
+ query parsers no longer create queries with this limitation.
266
+ An exception is thrown if exceeded. -->
267
+ <maxBooleanClauses>1024</maxBooleanClauses>
268
+ <!-- There are two implementations of cache available for Solr,
269
+ LRUCache, based on a synchronized LinkedHashMap, and
270
+ FastLRUCache, based on a ConcurrentHashMap. FastLRUCache has faster gets
271
+ and slower puts in single threaded operation and thus is generally faster
272
+ than LRUCache when the hit ratio of the cache is high (> 75%), and may be
273
+ faster under other scenarios on multi-cpu systems. -->
274
+ <!-- Cache used by SolrIndexSearcher for filters (DocSets),
275
+ unordered sets of *all* documents that match a query.
276
+ When a new searcher is opened, its caches may be prepopulated
277
+ or "autowarmed" using data from caches in the old searcher.
278
+ autowarmCount is the number of items to prepopulate. For LRUCache,
279
+ the autowarmed items will be the most recently accessed items.
280
+ Parameters:
281
+ class - the SolrCache implementation LRUCache or FastLRUCache
282
+ size - the maximum number of entries in the cache
283
+ initialSize - the initial capacity (number of entries) of
284
+ the cache. (see java.util.HashMap)
285
+ autowarmCount - the number of entries to prepopulate from
286
+ an old cache.
287
+ -->
288
+ <filterCache class="solr.FastLRUCache" size="512" initialSize="512" autowarmCount="0"/>
289
+ <!-- Cache used to hold field values that are quickly accessible
290
+ by document id. The fieldValueCache is created by default
291
+ even if not configured here.
292
+ <fieldValueCache
293
+ class="solr.FastLRUCache"
294
+ size="512"
295
+ autowarmCount="128"
296
+ showItems="32"
297
+ />
298
+ -->
299
+ <!-- queryResultCache caches results of searches - ordered lists of
300
+ document ids (DocList) based on a query, a sort, and the range
301
+ of documents requested. -->
302
+ <queryResultCache class="solr.LRUCache" size="512" initialSize="512" autowarmCount="0"/>
303
+ <!-- documentCache caches Lucene Document objects (the stored fields for each document).
304
+ Since Lucene internal document ids are transient, this cache will not be autowarmed. -->
305
+ <documentCache class="solr.LRUCache" size="512" initialSize="512" autowarmCount="0"/>
306
+ <!-- If true, stored fields that are not requested will be loaded lazily.
307
+ This can result in a significant speed improvement if the usual case is to
308
+ not load all stored fields, especially if the skipped fields are large
309
+ compressed text fields.
310
+ -->
311
+ <enableLazyFieldLoading>true</enableLazyFieldLoading>
312
+ <!-- Example of a generic cache. These caches may be accessed by name
313
+ through SolrIndexSearcher.getCache(),cacheLookup(), and cacheInsert().
314
+ The purpose is to enable easy caching of user/application level data.
315
+ The regenerator argument should be specified as an implementation
316
+ of solr.search.CacheRegenerator if autowarming is desired. -->
317
+ <!--
318
+ <cache name="myUserCache"
319
+ class="solr.LRUCache"
320
+ size="4096"
321
+ initialSize="1024"
322
+ autowarmCount="1024"
323
+ regenerator="org.mycompany.mypackage.MyRegenerator"
324
+ />
325
+ -->
326
+ <!-- An optimization that attempts to use a filter to satisfy a search.
327
+ If the requested sort does not include score, then the filterCache
328
+ will be checked for a filter matching the query. If found, the filter
329
+ will be used as the source of document ids, and then the sort will be
330
+ applied to that.
331
+ <useFilterForSortedQuery>true</useFilterForSortedQuery>
332
+ -->
333
+ <!-- An optimization for use with the queryResultCache. When a search
334
+ is requested, a superset of the requested number of document ids
335
+ are collected. For example, if a search for a particular query
336
+ requests matching documents 10 through 19, and queryResultWindowSize is 50,
337
+ then documents 0 through 49 will be collected and cached. Any further
338
+ requests in that range can be satisfied via the cache. -->
339
+ <queryResultWindowSize>20</queryResultWindowSize>
340
+ <!-- Maximum number of documents to cache for any entry in the
341
+ queryResultCache. -->
342
+ <queryResultMaxDocsCached>200</queryResultMaxDocsCached>
343
+ <!-- a newSearcher event is fired whenever a new searcher is being prepared
344
+ and there is a current searcher handling requests (aka registered).
345
+ It can be used to prime certain caches to prevent long request times for
346
+ certain requests.
347
+ -->
348
+ <!-- QuerySenderListener takes an array of NamedList and executes a
349
+ local query request for each NamedList in sequence. -->
350
+ <listener event="newSearcher" class="solr.QuerySenderListener">
351
+ <arr name="queries">
352
+ <!--
353
+ <lst> <str name="q">solr</str> <str name="start">0</str> <str name="rows">10</str> </lst>
354
+ <lst> <str name="q">rocks</str> <str name="start">0</str> <str name="rows">10</str> </lst>
355
+ <lst><str name="q">static newSearcher warming query from solrconfig.xml</str></lst>
356
+ -->
357
+ </arr>
358
+ </listener>
359
+ <!-- a firstSearcher event is fired whenever a new searcher is being
360
+ prepared but there is no current registered searcher to handle
361
+ requests or to gain autowarming data from. -->
362
+ <listener event="firstSearcher" class="solr.QuerySenderListener">
363
+ <arr name="queries">
364
+ <lst>
365
+ <str name="q">solr rocks</str>
366
+ <str name="start">0</str>
367
+ <str name="rows">10</str>
368
+ </lst>
369
+ <lst>
370
+ <str name="q">static firstSearcher warming query from solrconfig.xml</str>
371
+ </lst>
372
+ </arr>
373
+ </listener>
374
+ <!-- If a search request comes in and there is no current registered searcher,
375
+ then immediately register the still warming searcher and use it. If
376
+ "false" then all requests will block until the first searcher is done
377
+ warming. -->
378
+ <useColdSearcher>false</useColdSearcher>
379
+ <!-- Maximum number of searchers that may be warming in the background
380
+ concurrently. An error is returned if this limit is exceeded. Recommend
381
+ 1-2 for read-only slaves, higher for masters w/o cache warming. -->
382
+ <maxWarmingSearchers>2</maxWarmingSearchers>
383
+ </query>
384
+ <!--
385
+ Let the dispatch filter handle /select?qt=XXX
386
+ handleSelect=true will use consistent error handling for /select and /update
387
+ handleSelect=false will use solr1.1 style error formatting
388
+ -->
389
+ <requestDispatcher handleSelect="true">
390
+ <!--Make sure your system has some authentication before enabling remote streaming! -->
391
+ <requestParsers enableRemoteStreaming="true" multipartUploadLimitInKB="2048000"/>
392
+ <!-- Set HTTP caching related parameters (for proxy caches and clients).
393
+
394
+ To get the behaviour of Solr 1.2 (ie: no caching related headers)
395
+ use the never304="true" option and do not specify a value for
396
+ <cacheControl>
397
+ -->
398
+ <!-- <httpCaching never304="true"> -->
399
+ <httpCaching lastModifiedFrom="openTime" etagSeed="Solr">
400
+ <!-- lastModifiedFrom="openTime" is the default, the Last-Modified value
401
+ (and validation against If-Modified-Since requests) will all be
402
+ relative to when the current Searcher was opened.
403
+ You can change it to lastModifiedFrom="dirLastMod" if you want the
404
+ value to exactly correspond to when the physical index was last
405
+ modified.
406
+
407
+ etagSeed="..." is an option you can change to force the ETag
408
+ header (and validation against If-None-Match requests) to be
409
+ different even if the index has not changed (ie: when making
410
+ significant changes to your config file)
411
+
412
+ lastModifiedFrom and etagSeed are both ignored if you use the
413
+ never304="true" option.
414
+ -->
415
+ <!-- If you include a <cacheControl> directive, it will be used to
416
+ generate a Cache-Control header, as well as an Expires header
417
+ if the value contains "max-age="
418
+
419
+ By default, no Cache-Control header is generated.
420
+
421
+ You can use the <cacheControl> option even if you have set
422
+ never304="true"
423
+ -->
424
+ <!-- <cacheControl>max-age=30, public</cacheControl> -->
425
+ </httpCaching>
426
+ </requestDispatcher>
427
+ <!-- requestHandler plugins... incoming queries will be dispatched to the
428
+ correct handler based on the path or the qt (query type) param.
429
+ Names starting with a '/' are accessed with a path equal to the
430
+ registered name. Names without a leading '/' are accessed with:
431
+ http://host/app/select?qt=name
432
+ If no qt is defined, the requestHandler that declares default="true"
433
+ will be used.
434
+ -->
435
+ <requestHandler name="standard" class="solr.SearchHandler" default="true">
436
+ <!-- default values for query parameters -->
437
+ <lst name="defaults">
438
+ <str name="echoParams">explicit</str>
439
+ <!--
440
+ <int name="rows">10</int>
441
+ <str name="fl">*</str>
442
+ <str name="version">2.1</str>
443
+ -->
444
+ </lst>
445
+ </requestHandler>
446
+ <!-- Please refer to http://wiki.apache.org/solr/SolrReplication for details on configuring replication -->
447
+ <!-- remove the <lst name="master"> section if this is just a slave -->
448
+ <!-- remove the <lst name="slave"> section if this is just a master -->
449
+ <!--
450
+ <requestHandler name="/replication" class="solr.ReplicationHandler" >
451
+ <lst name="master">
452
+ <str name="replicateAfter">commit</str>
453
+ <str name="replicateAfter">startup</str>
454
+ <str name="confFiles">schema.xml,stopwords.txt</str>
455
+ </lst>
456
+ <lst name="slave">
457
+ <str name="masterUrl">http://localhost:8983/solr/replication</str>
458
+ <str name="pollInterval">00:00:60</str>
459
+ </lst>
460
+ </requestHandler>-->
461
+ <!-- DisMaxRequestHandler allows easy searching across multiple fields
462
+ for simple user-entered phrases. Its implementation is now
463
+ just the standard SearchHandler with a default query type
464
+ of "dismax".
465
+ see http://wiki.apache.org/solr/DisMaxRequestHandler
466
+ -->
467
+ <requestHandler name="dismax" class="solr.SearchHandler">
468
+ <lst name="defaults">
469
+ <str name="defType">dismax</str>
470
+ <str name="echoParams">explicit</str>
471
+ <float name="tie">0.01</float>
472
+ <str name="qf">
473
+ text^0.5 features^1.0 name^1.2 sku^1.5 id^10.0 manu^1.1 cat^1.4
474
+ </str>
475
+ <str name="pf">
476
+ text^0.2 features^1.1 name^1.5 manu^1.4 manu_exact^1.9
477
+ </str>
478
+ <str name="bf">
479
+ popularity^0.5 recip(price,1,1000,1000)^0.3
480
+ </str>
481
+ <str name="fl">
482
+ id,name,price,score
483
+ </str>
484
+ <str name="mm">
485
+ 2&lt;-1 5&lt;-2 6&lt;90%
486
+ </str>
487
+ <int name="ps">100</int>
488
+ <str name="q.alt">*:*</str>
489
+ <!-- example highlighter config, enable per-query with hl=true -->
490
+ <str name="hl.fl">text features name</str>
491
+ <!-- for this field, we want no fragmenting, just highlighting -->
492
+ <str name="f.name.hl.fragsize">0</str>
493
+ <!-- instructs Solr to return the field itself if no query terms are
494
+ found -->
495
+ <str name="f.name.hl.alternateField">name</str>
496
+ <str name="f.text.hl.fragmenter">regex</str>
497
+ <!-- defined below -->
498
+ </lst>
499
+ </requestHandler>
500
+ <!-- Note how you can register the same handler multiple times with
501
+ different names (and different init parameters)
502
+ -->
503
+ <requestHandler name="partitioned" class="solr.SearchHandler">
504
+ <lst name="defaults">
505
+ <str name="defType">dismax</str>
506
+ <str name="echoParams">explicit</str>
507
+ <str name="qf">text^0.5 features^1.0 name^1.2 sku^1.5 id^10.0</str>
508
+ <str name="mm">2&lt;-1 5&lt;-2 6&lt;90%</str>
509
+ <!-- This is an example of using Date Math to specify a constantly
510
+ moving date range in a config...
511
+ -->
512
+ <str name="bq">incubationdate_dt:[* TO NOW/DAY-1MONTH]^2.2</str>
513
+ </lst>
514
+ <!-- In addition to defaults, "appends" params can be specified
515
+ to identify values which should be appended to the list of
516
+ multi-val params from the query (or the existing "defaults").
517
+
518
+ In this example, the param "fq=inStock:true" will be appended to
519
+ any query time fq params the user may specify, as a mechanism for
520
+ partitioning the index, independent of any user selected filtering
521
+ that may also be desired (perhaps as a result of faceted searching).
522
+
523
+ NOTE: there is *absolutely* nothing a client can do to prevent these
524
+ "appends" values from being used, so don't use this mechanism
525
+ unless you are sure you always want it.
526
+ -->
527
+ <lst name="appends">
528
+ <str name="fq">inStock:true</str>
529
+ </lst>
530
+ <!-- "invariants" are a way of letting the Solr maintainer lock down
531
+ the options available to Solr clients. Any params values
532
+ specified here are used regardless of what values may be specified
533
+ in either the query, the "defaults", or the "appends" params.
534
+
535
+ In this example, the facet.field and facet.query params are fixed,
536
+ limiting the facets clients can use. Faceting is not turned on by
537
+ default - but if the client does specify facet=true in the request,
538
+ these are the only facets they will be able to see counts for;
539
+ regardless of what other facet.field or facet.query params they
540
+ may specify.
541
+
542
+ NOTE: there is *absolutely* nothing a client can do to prevent these
543
+ "invariants" values from being used, so don't use this mechanism
544
+ unless you are sure you always want it.
545
+ -->
546
+ <lst name="invariants">
547
+ <str name="facet.field">cat</str>
548
+ <str name="facet.field">manu_exact</str>
549
+ <str name="facet.query">price:[* TO 500]</str>
550
+ <str name="facet.query">price:[500 TO *]</str>
551
+ </lst>
552
+ </requestHandler>
553
+ <!--
554
+ Search components are registered to SolrCore and used by Search Handlers
555
+
556
+ By default, the following components are available:
557
+
558
+ <searchComponent name="query" class="org.apache.solr.handler.component.QueryComponent" />
559
+ <searchComponent name="facet" class="org.apache.solr.handler.component.FacetComponent" />
560
+ <searchComponent name="mlt" class="org.apache.solr.handler.component.MoreLikeThisComponent" />
561
+ <searchComponent name="highlight" class="org.apache.solr.handler.component.HighlightComponent" />
562
+ <searchComponent name="stats" class="org.apache.solr.handler.component.StatsComponent" />
563
+ <searchComponent name="debug" class="org.apache.solr.handler.component.DebugComponent" />
564
+
565
+ Default configuration in a requestHandler would look like:
566
+ <arr name="components">
567
+ <str>query</str>
568
+ <str>facet</str>
569
+ <str>mlt</str>
570
+ <str>highlight</str>
571
+ <str>stats</str>
572
+ <str>debug</str>
573
+ </arr>
574
+
575
+ If you register a searchComponent to one of the standard names, that will be used instead.
576
+ To insert components before or after the 'standard' components, use:
577
+
578
+ <arr name="first-components">
579
+ <str>myFirstComponentName</str>
580
+ </arr>
581
+
582
+ <arr name="last-components">
583
+ <str>myLastComponentName</str>
584
+ </arr>
585
+ -->
586
+ <!-- The spell check component can return a list of alternative spelling
587
+ suggestions. -->
588
+ <searchComponent name="spellcheck" class="solr.SpellCheckComponent">
589
+ <str name="queryAnalyzerFieldType">textSpell</str>
590
+ <lst name="spellchecker">
591
+ <str name="name">default</str>
592
+ <str name="field">name</str>
593
+ <str name="spellcheckIndexDir">./spellchecker</str>
594
+ </lst>
595
+ <!-- a spellchecker that uses a different distance measure
596
+ <lst name="spellchecker">
597
+ <str name="name">jarowinkler</str>
598
+ <str name="field">spell</str>
599
+ <str name="distanceMeasure">org.apache.lucene.search.spell.JaroWinklerDistance</str>
600
+ <str name="spellcheckIndexDir">./spellchecker2</str>
601
+ </lst>
602
+ -->
603
+ <!-- a file based spell checker
604
+ <lst name="spellchecker">
605
+ <str name="classname">solr.FileBasedSpellChecker</str>
606
+ <str name="name">file</str>
607
+ <str name="sourceLocation">spellings.txt</str>
608
+ <str name="characterEncoding">UTF-8</str>
609
+ <str name="spellcheckIndexDir">./spellcheckerFile</str>
610
+ </lst>
611
+ -->
612
+ </searchComponent>
613
+ <!-- A request handler utilizing the spellcheck component.
614
+ #############################################################################
615
+ NOTE: This is purely as an example. The whole purpose of the
616
+ SpellCheckComponent is to hook it into the request handler that handles (i.e.
617
+ the standard or dismax SearchHandler) queries such that a separate request is
618
+ not needed to get suggestions.
619
+
620
+ IN OTHER WORDS, THERE IS A REALLY GOOD CHANCE THE SETUP BELOW IS NOT WHAT YOU
621
+ WANT FOR YOUR PRODUCTION SYSTEM!
622
+ #############################################################################
623
+ -->
624
+ <requestHandler name="/spell" class="solr.SearchHandler" lazy="true">
625
+ <lst name="defaults">
626
+ <!-- omp = Only More Popular -->
627
+ <str name="spellcheck.onlyMorePopular">false</str>
628
+ <!-- exr = Extended Results -->
629
+ <str name="spellcheck.extendedResults">false</str>
630
+ <!-- The number of suggestions to return -->
631
+ <str name="spellcheck.count">1</str>
632
+ </lst>
633
+ <arr name="last-components">
634
+ <str>spellcheck</str>
635
+ </arr>
636
+ </requestHandler>
637
+ <searchComponent name="tvComponent" class="org.apache.solr.handler.component.TermVectorComponent"/>
638
+ <!-- A Req Handler for working with the tvComponent. This is purely as an example.
639
+ You will likely want to add the component to your already specified request handlers. -->
640
+ <requestHandler name="tvrh" class="org.apache.solr.handler.component.SearchHandler">
641
+ <lst name="defaults">
642
+ <bool name="tv">true</bool>
643
+ </lst>
644
+ <arr name="last-components">
645
+ <str>tvComponent</str>
646
+ </arr>
647
+ </requestHandler>
648
+ <!-- Clustering Component
649
+ http://wiki.apache.org/solr/ClusteringComponent
650
+ This relies on third party jars which are not included in the release.
651
+ To use this component (and the "/clustering" handler)
652
+ Those jars will need to be downloaded, and you'll need to set the
653
+ solr.clustering.enabled system property when running solr...
654
+ java -Dsolr.clustering.enabled=true -jar start.jar
655
+ -->
656
+ <searchComponent name="clusteringComponent" enable="${solr.clustering.enabled:false}" class="org.apache.solr.handler.clustering.ClusteringComponent">
657
+ <!-- Declare an engine -->
658
+ <lst name="engine">
659
+ <!-- The name, only one can be named "default" -->
660
+ <str name="name">default</str>
661
+ <!--
662
+ Class name of Carrot2 clustering algorithm. Currently available algorithms are:
663
+
664
+ * org.carrot2.clustering.lingo.LingoClusteringAlgorithm
665
+ * org.carrot2.clustering.stc.STCClusteringAlgorithm
666
+
667
+ See http://project.carrot2.org/algorithms.html for the algorithm's characteristics.
668
+ -->
669
+ <str name="carrot.algorithm">org.carrot2.clustering.lingo.LingoClusteringAlgorithm</str>
670
+ <!--
671
+ Overriding values for Carrot2 default algorithm attributes. For a description
672
+ of all available attributes, see: http://download.carrot2.org/stable/manual/#chapter.components.
673
+ Use attribute key as name attribute of str elements below. These can be further
674
+ overridden for individual requests by specifying attribute key as request
675
+ parameter name and attribute value as parameter value.
676
+ -->
677
+ <str name="LingoClusteringAlgorithm.desiredClusterCountBase">20</str>
678
+ </lst>
679
+ <lst name="engine">
680
+ <str name="name">stc</str>
681
+ <str name="carrot.algorithm">org.carrot2.clustering.stc.STCClusteringAlgorithm</str>
682
+ </lst>
683
+ </searchComponent>
684
+ <requestHandler name="/clustering" enable="${solr.clustering.enabled:false}" class="solr.SearchHandler">
685
+ <lst name="defaults">
686
+ <bool name="clustering">true</bool>
687
+ <str name="clustering.engine">default</str>
688
+ <bool name="clustering.results">true</bool>
689
+ <!-- The title field -->
690
+ <str name="carrot.title">name</str>
691
+ <str name="carrot.url">id</str>
692
+ <!-- The field to cluster on -->
693
+ <str name="carrot.snippet">features</str>
694
+ <!-- produce summaries -->
695
+ <bool name="carrot.produceSummary">true</bool>
696
+ <!-- the maximum number of labels per cluster -->
697
+ <!--<int name="carrot.numDescriptions">5</int>-->
698
+ <!-- produce sub clusters -->
699
+ <bool name="carrot.outputSubClusters">false</bool>
700
+ </lst>
701
+ <arr name="last-components">
702
+ <str>clusteringComponent</str>
703
+ </arr>
704
+ </requestHandler>
705
+ <!-- Solr Cell: http://wiki.apache.org/solr/ExtractingRequestHandler -->
706
+ <requestHandler name="/update/extract" class="org.apache.solr.handler.extraction.ExtractingRequestHandler" startup="lazy">
707
+ <lst name="defaults">
708
+ <!-- All the main content goes into "text"... if you need to return
709
+ the extracted text or do highlighting, use a stored field. -->
710
+ <str name="fmap.content">text</str>
711
+ <str name="lowernames">true</str>
712
+ <str name="uprefix">ignored_</str>
713
+ <!-- capture link hrefs but ignore div attributes -->
714
+ <str name="captureAttr">true</str>
715
+ <str name="fmap.a">links</str>
716
+ <str name="fmap.div">ignored_</str>
717
+ </lst>
718
+ </requestHandler>
719
+ <!-- A component to return terms and document frequency of those terms.
720
+ This component does not yet support distributed search. -->
721
+ <searchComponent name="termsComponent" class="org.apache.solr.handler.component.TermsComponent"/>
722
+ <requestHandler name="/terms" class="org.apache.solr.handler.component.SearchHandler">
723
+ <lst name="defaults">
724
+ <bool name="terms">true</bool>
725
+ </lst>
726
+ <arr name="components">
727
+ <str>termsComponent</str>
728
+ </arr>
729
+ </requestHandler>
730
+ <!-- a search component that enables you to configure the top results for
731
+ a given query regardless of the normal lucene scoring.-->
732
+ <searchComponent name="elevator" class="solr.QueryElevationComponent">
733
+ <!-- pick a fieldType to analyze queries -->
734
+ <str name="queryFieldType">string</str>
735
+ <str name="config-file">elevate.xml</str>
736
+ </searchComponent>
737
+ <!-- a request handler utilizing the elevator component -->
738
+ <requestHandler name="/elevate" class="solr.SearchHandler" startup="lazy">
739
+ <lst name="defaults">
740
+ <str name="echoParams">explicit</str>
741
+ </lst>
742
+ <arr name="last-components">
743
+ <str>elevator</str>
744
+ </arr>
745
+ </requestHandler>
746
+ <!-- Update request handler.
747
+
748
+ Note: Since solr1.1 requestHandlers require a valid content type header if posted in
749
+ the body. For example, curl now requires: -H 'Content-type:text/xml; charset=utf-8'
750
+ The response format differs from solr1.1 formatting and returns a standard error code.
751
+ To enable solr1.1 behavior, remove the /update handler or change its path
752
+ -->
753
+ <requestHandler name="/update" class="solr.XmlUpdateRequestHandler"/>
754
+ <requestHandler name="/update/javabin" class="solr.BinaryUpdateRequestHandler"/>
755
+ <!--
756
+ Analysis request handler. Since Solr 1.3. Use to return how a document is analyzed. Useful
757
+ for debugging and as a token server for other types of applications.
758
+
759
+ This is deprecated in favor of the improved DocumentAnalysisRequestHandler and FieldAnalysisRequestHandler
760
+
761
+ <requestHandler name="/analysis" class="solr.AnalysisRequestHandler" />
762
+ -->
763
+ <!--
764
+ An analysis handler that provides a breakdown of the analysis process of provided documents. This handler expects a
765
+ (single) content stream with the following format:
766
+
767
+ <docs>
768
+ <doc>
769
+ <field name="id">1</field>
770
+ <field name="name">The Name</field>
771
+ <field name="text">The Text Value</field>
772
+ </doc>
773
+ <doc>...</doc>
774
+ <doc>...</doc>
775
+ ...
776
+ </docs>
777
+
778
+ Note: Each document must contain a field which serves as the unique key. This key is used in the returned
779
+ response to associate an analysis breakdown to the analyzed document.
780
+
781
+ Like the FieldAnalysisRequestHandler, this handler also supports query analysis by
782
+ sending either an "analysis.query" or "q" request parameter that holds the query text to be analyzed. It also
783
+ supports the "analysis.showmatch" parameter which when set to true, all field tokens that match the query
784
+ tokens will be marked as a "match".
785
+ -->
786
+ <requestHandler name="/analysis/document" class="solr.DocumentAnalysisRequestHandler"/>
787
+ <!--
788
+ RequestHandler that provides much the same functionality as analysis.jsp. Provides the ability
789
+ to specify multiple field types and field names in the same request and outputs index-time and
790
+ query-time analysis for each of them.
791
+
792
+ Request parameters are:
793
+ analysis.fieldname - The field name whose analyzers are to be used
794
+ analysis.fieldtype - The field type whose analyzers are to be used
795
+ analysis.fieldvalue - The text for index-time analysis
796
+ q (or analysis.query) - The text for query time analysis
797
+ analysis.showmatch (true|false) - When set to true and when query analysis is performed, the produced
798
+ tokens of the field value analysis will be marked as "matched" for every
799
+ token that is produced by the query analysis
800
+ -->
801
+ <requestHandler name="/analysis/field" class="solr.FieldAnalysisRequestHandler"/>
802
+ <!-- CSV update handler, loaded on demand -->
803
+ <requestHandler name="/update/csv" class="solr.CSVRequestHandler" startup="lazy"/>
804
+ <!--
805
+ Admin Handlers - This will register all the standard admin RequestHandlers. Adding
806
+ this single handler is equivalent to registering:
807
+
808
+ <requestHandler name="/admin/luke" class="org.apache.solr.handler.admin.LukeRequestHandler" />
809
+ <requestHandler name="/admin/system" class="org.apache.solr.handler.admin.SystemInfoHandler" />
810
+ <requestHandler name="/admin/plugins" class="org.apache.solr.handler.admin.PluginInfoHandler" />
811
+ <requestHandler name="/admin/threads" class="org.apache.solr.handler.admin.ThreadDumpHandler" />
812
+ <requestHandler name="/admin/properties" class="org.apache.solr.handler.admin.PropertiesRequestHandler" />
813
+ <requestHandler name="/admin/file" class="org.apache.solr.handler.admin.ShowFileRequestHandler" />
814
+
815
+ If you wish to hide files under ${solr.home}/conf, explicitly register the ShowFileRequestHandler using:
816
+ <requestHandler name="/admin/file" class="org.apache.solr.handler.admin.ShowFileRequestHandler" >
817
+ <lst name="invariants">
818
+ <str name="hidden">synonyms.txt</str>
819
+ <str name="hidden">anotherfile.txt</str>
820
+ </lst>
821
+ </requestHandler>
822
+ -->
823
+ <requestHandler name="/admin/" class="org.apache.solr.handler.admin.AdminHandlers"/>
824
+ <!-- ping/healthcheck -->
825
+ <requestHandler name="/admin/ping" class="PingRequestHandler">
826
+ <lst name="defaults">
827
+ <str name="qt">standard</str>
828
+ <str name="q">solrpingquery</str>
829
+ <str name="echoParams">all</str>
830
+ </lst>
831
+ </requestHandler>
832
+ <!-- Echo the request contents back to the client -->
833
+ <requestHandler name="/debug/dump" class="solr.DumpRequestHandler">
834
+ <lst name="defaults">
835
+ <str name="echoParams">explicit</str>
836
+ <!-- for all params (including the default etc) use: 'all' -->
837
+ <str name="echoHandler">true</str>
838
+ </lst>
839
+ </requestHandler>
840
+ <highlighting>
841
+ <!-- Configure the standard fragmenter -->
842
+ <!-- This could most likely be commented out in the "default" case -->
843
+ <fragmenter name="gap" class="org.apache.solr.highlight.GapFragmenter" default="true">
844
+ <lst name="defaults">
845
+ <int name="hl.fragsize">100</int>
846
+ </lst>
847
+ </fragmenter>
848
+ <!-- A regular-expression-based fragmenter (f.i., for sentence extraction) -->
849
+ <fragmenter name="regex" class="org.apache.solr.highlight.RegexFragmenter">
850
+ <lst name="defaults">
851
+ <!-- slightly smaller fragsizes work better because of slop -->
852
+ <int name="hl.fragsize">70</int>
853
+ <!-- allow 50% slop on fragment sizes -->
854
+ <float name="hl.regex.slop">0.5</float>
855
+ <!-- a basic sentence pattern -->
856
+ <str name="hl.regex.pattern">[-\w ,/\n\"']{20,200}</str>
857
+ </lst>
858
+ </fragmenter>
859
+ <!-- Configure the standard formatter -->
860
+ <formatter name="html" class="org.apache.solr.highlight.HtmlFormatter" default="true">
861
+ <lst name="defaults">
862
+ <str name="hl.simple.pre"><![CDATA[<em>]]></str>
863
+ <str name="hl.simple.post"><![CDATA[</em>]]></str>
864
+ </lst>
865
+ </formatter>
866
+ </highlighting>
867
+ <!-- An example dedup update processor that creates the "id" field on the fly
868
+ based on the hash code of some other fields. This example has overwriteDupes
869
+ set to false since we are using the id field as the signatureField and Solr
870
+ will maintain uniqueness based on that anyway.
871
+
872
+ You have to link the chain to an update handler above to use it ie:
873
+ <requestHandler name="/update" class="solr.XmlUpdateRequestHandler">
874
+ <lst name="defaults">
875
+ <str name="update.processor">dedupe</str>
876
+ </lst>
877
+ </requestHandler>
878
+ -->
879
+ <!--
880
+ <updateRequestProcessorChain name="dedupe">
881
+ <processor class="org.apache.solr.update.processor.SignatureUpdateProcessorFactory">
882
+ <bool name="enabled">true</bool>
883
+ <str name="signatureField">id</str>
884
+ <bool name="overwriteDupes">false</bool>
885
+ <str name="fields">name,features,cat</str>
886
+ <str name="signatureClass">org.apache.solr.update.processor.Lookup3Signature</str>
887
+ </processor>
888
+ <processor class="solr.LogUpdateProcessorFactory" />
889
+ <processor class="solr.RunUpdateProcessorFactory" />
890
+ </updateRequestProcessorChain>
891
+ -->
892
+ <!-- queryResponseWriter plugins... query responses will be written using the
893
+ writer specified by the 'wt' request parameter matching the name of a registered
894
+ writer.
895
+ The "default" writer is the default and will be used if 'wt' is not specified
896
+ in the request. XMLResponseWriter will be used if nothing is specified here.
897
+ The json, python, and ruby writers are also available by default.
898
+
899
+ <queryResponseWriter name="xml" class="org.apache.solr.request.XMLResponseWriter" default="true"/>
900
+ <queryResponseWriter name="json" class="org.apache.solr.request.JSONResponseWriter"/>
901
+ <queryResponseWriter name="python" class="org.apache.solr.request.PythonResponseWriter"/>
902
+ <queryResponseWriter name="ruby" class="org.apache.solr.request.RubyResponseWriter"/>
903
+ <queryResponseWriter name="php" class="org.apache.solr.request.PHPResponseWriter"/>
904
+ <queryResponseWriter name="phps" class="org.apache.solr.request.PHPSerializedResponseWriter"/>
905
+
906
+ <queryResponseWriter name="custom" class="com.example.MyResponseWriter"/>
907
+ -->
908
+ <!-- XSLT response writer transforms the XML output by any xslt file found
909
+ in Solr's conf/xslt directory. Changes to xslt files are checked for
910
+ every xsltCacheLifetimeSeconds.
911
+ -->
912
+ <queryResponseWriter name="xslt" class="org.apache.solr.request.XSLTResponseWriter">
913
+ <int name="xsltCacheLifetimeSeconds">5</int>
914
+ </queryResponseWriter>
915
+ <!-- example of registering a query parser
916
+ <queryParser name="lucene" class="org.apache.solr.search.LuceneQParserPlugin"/>
917
+ -->
918
+ <!-- example of registering a custom function parser
919
+ <valueSourceParser name="myfunc" class="com.mycompany.MyValueSourceParser" />
920
+ -->
921
+ <!-- config for the admin interface -->
922
+ <admin>
923
+ <defaultQuery>solr</defaultQuery>
924
+ <!-- configure a healthcheck file for servers behind a loadbalancer
925
+ <healthcheck type="file">server-enabled</healthcheck>
926
+ -->
927
+ </admin>
928
+ <requestHandler class="solr.MoreLikeThisHandler" name="/mlt">
929
+ <lst name="defaults">
930
+ <str name="mlt.mintf">1</str>
931
+ <str name="mlt.mindf">2</str>
932
+ </lst>
933
+ </requestHandler>
934
+ </config>