active-fedora 1.0.5 → 1.1.0

Sign up to get free protection for your applications and to get access to all the features.
Files changed (246)
  1. data/.document +5 -0
  2. data/.gitignore +21 -0
  3. data/.hg/00changelog.i +0 -0
  4. data/.hg/branch +1 -0
  5. data/.hg/branch.cache +2 -0
  6. data/.hg/dirstate +0 -0
  7. data/.hg/hgrc +2 -0
  8. data/.hg/requires +2 -0
  9. data/.hg/store/00changelog.i +0 -0
  10. data/.hg/store/00manifest.i +0 -0
  11. data/.hg/store/data/.hgignore.i +0 -0
  12. data/.hg/store/data/.hgtags.i +0 -0
  13. data/.hg/store/data/_c_o_p_y_i_n_g.txt.i +0 -0
  14. data/.hg/store/data/_c_o_y_i_n_g._l_e_s_s_e_r.txt.i +0 -0
  15. data/.hg/store/data/_history.txt.i +0 -0
  16. data/.hg/store/data/_license.txt.i +0 -0
  17. data/.hg/store/data/_manifest.txt.i +0 -0
  18. data/.hg/store/data/_post_install.txt.i +0 -0
  19. data/.hg/store/data/_r_e_a_d_m_e.rdoc.i +0 -0
  20. data/.hg/store/data/_r_e_a_d_m_e.txt.i +0 -0
  21. data/.hg/store/data/_rakefile.i +0 -0
  22. data/.hg/store/data/_v_e_r_s_i_o_n.i +0 -0
  23. data/.hg/store/data/active-fedora.gemspec.i +0 -0
  24. data/.hg/store/data/active__fedora/_history.txt.i +0 -0
  25. data/.hg/store/data/active__fedora/_manifest.txt.i +0 -0
  26. data/.hg/store/data/active__fedora/_post_install.txt.i +0 -0
  27. data/.hg/store/data/active__fedora/_r_e_a_d_m_e.rdoc.i +0 -0
  28. data/.hg/store/data/active__fedora/_rakefile.i +0 -0
  29. data/.hg/store/data/active__fedora/lib/active__fedora.rb.i +0 -0
  30. data/.hg/store/data/active__fedora/script/console.i +0 -0
  31. data/.hg/store/data/active__fedora/script/destroy.i +0 -0
  32. data/.hg/store/data/active__fedora/script/generate.i +0 -0
  33. data/.hg/store/data/active__fedora/spec/active__fedora__spec.rb.i +0 -0
  34. data/.hg/store/data/active__fedora/spec/spec__helper.rb.i +0 -0
  35. data/.hg/store/data/config/fedora.yml.i +0 -0
  36. data/.hg/store/data/config/solr__mappings.yml.i +0 -0
  37. data/.hg/store/data/config/solr__mappings__af__0.1.yml.i +0 -0
  38. data/.hg/store/data/config/solr__mappings__bl__2.4.yml.i +0 -0
  39. data/.hg/store/data/lib/active-fedora.rb.i +0 -0
  40. data/.hg/store/data/lib/active__fedora.rb.i +0 -0
  41. data/.hg/store/data/lib/active__fedora/base.rb.i +0 -0
  42. data/.hg/store/data/lib/active__fedora/content__model.rb.i +0 -0
  43. data/.hg/store/data/lib/active__fedora/datastream.rb.i +0 -0
  44. data/.hg/store/data/lib/active__fedora/fedora__object.rb.i +0 -0
  45. data/.hg/store/data/lib/active__fedora/metadata__datastream.rb.i +0 -0
  46. data/.hg/store/data/lib/active__fedora/model.rb.i +0 -0
  47. data/.hg/store/data/lib/active__fedora/property.rb.i +0 -0
  48. data/.hg/store/data/lib/active__fedora/qualified__dublin__core__datastream.rb.i +0 -0
  49. data/.hg/store/data/lib/active__fedora/relationship.rb.i +0 -0
  50. data/.hg/store/data/lib/active__fedora/rels__ext__datastream.rb.i +0 -0
  51. data/.hg/store/data/lib/active__fedora/semantic__node.rb.i +0 -0
  52. data/.hg/store/data/lib/active__fedora/solr__mapper.rb.i +0 -0
  53. data/.hg/store/data/lib/active__fedora/solr__service.rb.i +0 -0
  54. data/.hg/store/data/lib/fedora/base.rb.i +0 -0
  55. data/.hg/store/data/lib/fedora/connection.rb.i +0 -0
  56. data/.hg/store/data/lib/fedora/datastream.rb.i +0 -0
  57. data/.hg/store/data/lib/fedora/fedora__object.rb.i +0 -0
  58. data/.hg/store/data/lib/fedora/formats.rb.i +0 -0
  59. data/.hg/store/data/lib/fedora/generic__search.rb.i +0 -0
  60. data/.hg/store/data/lib/fedora/repository.rb.i +0 -0
  61. data/.hg/store/data/lib/ruby-fedora.rb.i +0 -0
  62. data/.hg/store/data/lib/util/class__level__inheritable__attributes.rb.i +0 -0
  63. data/.hg/store/data/script/console.i +0 -0
  64. data/.hg/store/data/script/destroy.i +0 -0
  65. data/.hg/store/data/script/generate.i +0 -0
  66. data/.hg/store/data/solr/config/schema-1.5.xml.i +0 -0
  67. data/.hg/store/data/solr/config/schema.xml.i +0 -0
  68. data/.hg/store/data/solr/config/solrconfig-1.5.xml.i +0 -0
  69. data/.hg/store/data/spec/fixtures/changeme155.xml.i +0 -0
  70. data/.hg/store/data/spec/fixtures/dino.jpg.i +0 -0
  71. data/.hg/store/data/spec/fixtures/minivan.jpg.d +0 -0
  72. data/.hg/store/data/spec/fixtures/minivan.jpg.i +0 -0
  73. data/.hg/store/data/spec/fixtures/test__12.foxml.xml.i +0 -0
  74. data/.hg/store/data/spec/integration/active__fedora/base__spec.rb.i +0 -0
  75. data/.hg/store/data/spec/integration/active__fedora/datastream__spec.rb.i +0 -0
  76. data/.hg/store/data/spec/integration/active__fedora/fedora__object__spec.rb.i +0 -0
  77. data/.hg/store/data/spec/integration/active__fedora/full__featured__model__spec.rb.i +0 -0
  78. data/.hg/store/data/spec/integration/active__fedora/model__spec.rb.i +0 -0
  79. data/.hg/store/data/spec/integration/active__fedora/rels__ext__datastream__spec.rb.i +0 -0
  80. data/.hg/store/data/spec/integration/active__fedora/semantic__node__spec.rb.i +0 -0
  81. data/.hg/store/data/spec/integration/base__file__management__spec.rb.i +0 -0
  82. data/.hg/store/data/spec/integration/base__spec.rb.i +0 -0
  83. data/.hg/store/data/spec/integration/bug__spec.rb.i +0 -0
  84. data/.hg/store/data/spec/integration/datastream__spec.rb.i +0 -0
  85. data/.hg/store/data/spec/integration/datastreams__crud__spec.rb.i +0 -0
  86. data/.hg/store/data/spec/integration/fedora__object__spec.rb.i +0 -0
  87. data/.hg/store/data/spec/integration/full__featured__model__spec.rb.i +0 -0
  88. data/.hg/store/data/spec/integration/model__spec.rb.i +0 -0
  89. data/.hg/store/data/spec/integration/rels__ext__datastream__spec.rb.i +0 -0
  90. data/.hg/store/data/spec/integration/repository__spec.rb.i +0 -0
  91. data/.hg/store/data/spec/integration/rf__fedora__object__spec.rb.i +0 -0
  92. data/.hg/store/data/spec/integration/semantic__node__spec.rb.i +0 -0
  93. data/.hg/store/data/spec/integration/solr__service__spec.rb.i +0 -0
  94. data/.hg/store/data/spec/samples/models/audio__record.rb.i +0 -0
  95. data/.hg/store/data/spec/samples/models/image.rb.i +0 -0
  96. data/.hg/store/data/spec/samples/models/oral__history.rb.i +0 -0
  97. data/.hg/store/data/spec/samples/models/seminar.rb.i +0 -0
  98. data/.hg/store/data/spec/samples/models/seminar__audio__file.rb.i +0 -0
  99. data/.hg/store/data/spec/samples/oh__qdc.xml.i +0 -0
  100. data/.hg/store/data/spec/samples/oral__history.rb.i +0 -0
  101. data/.hg/store/data/spec/samples/oral__history__sample.xml.i +0 -0
  102. data/.hg/store/data/spec/samples/oral__history__sample__model.rb.i +0 -0
  103. data/.hg/store/data/spec/samples/oral__history__xml.xml.i +0 -0
  104. data/.hg/store/data/spec/spec.opts.i +0 -0
  105. data/.hg/store/data/spec/spec__helper.rb.i +0 -0
  106. data/.hg/store/data/spec/unit/active__fedora/base__cma__spec.rb.i +0 -0
  107. data/.hg/store/data/spec/unit/active__fedora/base__extra__spec.rb.i +0 -0
  108. data/.hg/store/data/spec/unit/active__fedora/base__spec.rb.i +0 -0
  109. data/.hg/store/data/spec/unit/active__fedora/content__model__spec.rb.i +0 -0
  110. data/.hg/store/data/spec/unit/active__fedora/datastream__spec.rb.i +0 -0
  111. data/.hg/store/data/spec/unit/active__fedora/inheritance__spec.rb.i +0 -0
  112. data/.hg/store/data/spec/unit/active__fedora/metadata__datastream__spec.rb.i +0 -0
  113. data/.hg/store/data/spec/unit/active__fedora/model__spec.rb.i +0 -0
  114. data/.hg/store/data/spec/unit/active__fedora/property__spec.rb.i +0 -0
  115. data/.hg/store/data/spec/unit/active__fedora/qualified__dublin__core__datastream__spec.rb.i +0 -0
  116. data/.hg/store/data/spec/unit/active__fedora/relationship__spec.rb.i +0 -0
  117. data/.hg/store/data/spec/unit/active__fedora/rels__ext__datastream__spec.rb.i +0 -0
  118. data/.hg/store/data/spec/unit/active__fedora/semantic__node__spec.rb.i +0 -0
  119. data/.hg/store/data/spec/unit/active__fedora/solr__service__spec.rb.i +0 -0
  120. data/.hg/store/data/spec/unit/active__fedora__spec.rb.i +0 -0
  121. data/.hg/store/data/spec/unit/base__cma__spec.rb.i +0 -0
  122. data/.hg/store/data/spec/unit/base__datastream__management__spec.rb.i +0 -0
  123. data/.hg/store/data/spec/unit/base__extra__spec.rb.i +0 -0
  124. data/.hg/store/data/spec/unit/base__file__management__spec.rb.i +0 -0
  125. data/.hg/store/data/spec/unit/base__loader__spec.rb.i +0 -0
  126. data/.hg/store/data/spec/unit/base__spec.rb.i +0 -0
  127. data/.hg/store/data/spec/unit/connection__spec.rb.i +0 -0
  128. data/.hg/store/data/spec/unit/content__model__spec.rb.i +0 -0
  129. data/.hg/store/data/spec/unit/datastream__concurrency__spec.rb.i +0 -0
  130. data/.hg/store/data/spec/unit/datastream__spec.rb.i +0 -0
  131. data/.hg/store/data/spec/unit/fedora__object__spec.rb.i +0 -0
  132. data/.hg/store/data/spec/unit/inheritance__spec.rb.i +0 -0
  133. data/.hg/store/data/spec/unit/metadata__datastream__spec.rb.i +0 -0
  134. data/.hg/store/data/spec/unit/model__spec.rb.i +0 -0
  135. data/.hg/store/data/spec/unit/property__spec.rb.i +0 -0
  136. data/.hg/store/data/spec/unit/qualified__dublin__core__datastream__spec.rb.i +0 -0
  137. data/.hg/store/data/spec/unit/relationship__spec.rb.i +0 -0
  138. data/.hg/store/data/spec/unit/rels__ext__datastream__spec.rb.i +0 -0
  139. data/.hg/store/data/spec/unit/repository__spec.rb.i +0 -0
  140. data/.hg/store/data/spec/unit/rf__datastream__spec.rb.i +0 -0
  141. data/.hg/store/data/spec/unit/semantic__node__spec.rb.i +0 -0
  142. data/.hg/store/data/spec/unit/solr__config__options__spec.rb.i +0 -0
  143. data/.hg/store/data/spec/unit/solr__mapper__spec.rb.i +0 -0
  144. data/.hg/store/data/spec/unit/solr__service__spec.rb.i +0 -0
  145. data/.hg/store/data/tasks/rspec.rake.i +0 -0
  146. data/.hg/store/undo +0 -0
  147. data/.hg/undo.branch +1 -0
  148. data/.hg/undo.dirstate +0 -0
  149. data/.hgignore +7 -0
  150. data/.hgtags +14 -0
  151. data/COPYING.txt +674 -0
  152. data/COYING.LESSER.txt +165 -0
  153. data/History.txt +34 -0
  154. data/LICENSE +20 -0
  155. data/License.txt +58 -0
  156. data/Manifest.txt +1 -1
  157. data/README.rdoc +13 -54
  158. data/README.txt +59 -0
  159. data/Rakefile +35 -0
  160. data/VERSION +1 -0
  161. data/active-fedora.gemspec +359 -0
  162. data/config/fedora.yml +16 -0
  163. data/config/solr_mappings.yml +14 -0
  164. data/config/solr_mappings_af_0.1.yml +16 -0
  165. data/config/solr_mappings_bl_2.4.yml +14 -0
  166. data/lib/active_fedora.rb +66 -6
  167. data/lib/active_fedora/base.rb +59 -23
  168. data/lib/active_fedora/datastream.rb +1 -1
  169. data/lib/active_fedora/metadata_datastream.rb +14 -7
  170. data/lib/active_fedora/model.rb +4 -4
  171. data/lib/active_fedora/rels_ext_datastream.rb +1 -1
  172. data/lib/active_fedora/semantic_node.rb +4 -3
  173. data/lib/active_fedora/solr_mapper.rb +17 -0
  174. data/lib/active_fedora/solr_service.rb +44 -2
  175. data/lib/fedora/base.rb +38 -0
  176. data/lib/fedora/connection.rb +210 -0
  177. data/lib/fedora/datastream.rb +56 -0
  178. data/lib/fedora/fedora_object.rb +161 -0
  179. data/lib/fedora/formats.rb +30 -0
  180. data/lib/fedora/generic_search.rb +71 -0
  181. data/lib/fedora/repository.rb +287 -0
  182. data/lib/ruby-fedora.rb +20 -0
  183. data/lib/util/class_level_inheritable_attributes.rb +23 -0
  184. data/script/console +15 -0
  185. data/script/destroy +14 -0
  186. data/script/generate +14 -0
  187. data/solr/config/schema-1.5.xml +468 -0
  188. data/solr/config/schema.xml +174 -212
  189. data/solr/config/solrconfig-1.5.xml +1069 -0
  190. data/spec/active_fedora_spec.rb +7 -0
  191. data/spec/fixtures/changeme155.xml +255 -0
  192. data/spec/fixtures/dino.jpg +0 -0
  193. data/spec/fixtures/minivan.jpg +0 -0
  194. data/spec/fixtures/test_12.foxml.xml +121 -0
  195. data/spec/integration/base_file_management_spec.rb +20 -0
  196. data/spec/integration/base_spec.rb +196 -0
  197. data/spec/integration/bug_spec.rb +57 -0
  198. data/spec/integration/datastream_spec.rb +60 -0
  199. data/spec/integration/datastreams_crud_spec.rb +208 -0
  200. data/spec/integration/fedora_object_spec.rb +77 -0
  201. data/spec/integration/full_featured_model_spec.rb +207 -0
  202. data/spec/integration/model_spec.rb +54 -0
  203. data/spec/integration/rels_ext_datastream_spec.rb +67 -0
  204. data/spec/integration/repository_spec.rb +297 -0
  205. data/spec/integration/rf_fedora_object_spec.rb +95 -0
  206. data/spec/integration/semantic_node_spec.rb +95 -0
  207. data/spec/integration/solr_service_spec.rb +33 -0
  208. data/spec/samples/models/audio_record.rb +29 -0
  209. data/spec/samples/models/image.rb +5 -0
  210. data/spec/samples/models/oral_history.rb +50 -0
  211. data/spec/samples/models/seminar.rb +29 -0
  212. data/spec/samples/models/seminar_audio_file.rb +34 -0
  213. data/spec/samples/oh_qdc.xml +32 -0
  214. data/spec/samples/oral_history_sample.xml +38 -0
  215. data/spec/samples/oral_history_sample_model.rb +39 -0
  216. data/spec/samples/oral_history_xml.xml +35 -0
  217. data/spec/spec.opts +5 -0
  218. data/spec/spec_helper.rb +41 -0
  219. data/spec/unit/active_fedora_spec.rb +15 -0
  220. data/spec/unit/base_cma_spec.rb +25 -0
  221. data/spec/unit/base_datastream_management_spec.rb +119 -0
  222. data/spec/unit/base_extra_spec.rb +108 -0
  223. data/spec/unit/base_file_management_spec.rb +90 -0
  224. data/spec/unit/base_loader_spec.rb +43 -0
  225. data/spec/unit/base_spec.rb +584 -0
  226. data/spec/unit/connection_spec.rb +25 -0
  227. data/spec/unit/content_model_spec.rb +51 -0
  228. data/spec/unit/datastream_concurrency_spec.rb +59 -0
  229. data/spec/unit/datastream_spec.rb +85 -0
  230. data/spec/unit/fedora_object_spec.rb +66 -0
  231. data/spec/unit/inheritance_spec.rb +46 -0
  232. data/spec/unit/metadata_datastream_spec.rb +290 -0
  233. data/spec/unit/model_spec.rb +186 -0
  234. data/spec/unit/property_spec.rb +50 -0
  235. data/spec/unit/qualified_dublin_core_datastream_spec.rb +177 -0
  236. data/spec/unit/relationship_spec.rb +77 -0
  237. data/spec/unit/rels_ext_datastream_spec.rb +99 -0
  238. data/spec/unit/repository_spec.rb +136 -0
  239. data/spec/unit/rf_datastream_spec.rb +49 -0
  240. data/spec/unit/semantic_node_spec.rb +354 -0
  241. data/spec/unit/solr_config_options_spec.rb +98 -0
  242. data/spec/unit/solr_mapper_spec.rb +31 -0
  243. data/spec/unit/solr_service_spec.rb +83 -0
  244. data/tasks/hoe.rake +0 -0
  245. data/tasks/rspec.rake +29 -0
  246. metadata +373 -55
@@ -1,229 +1,191 @@
1
- <?xml version="1.0" ?>
2
- <!--
3
- Licensed to the Apache Software Foundation (ASF) under one or more
4
- contributor license agreements. See the NOTICE file distributed with
5
- this work for additional information regarding copyright ownership.
6
- The ASF licenses this file to You under the Apache License, Version 2.0
7
- (the "License"); you may not use this file except in compliance with
8
- the License. You may obtain a copy of the License at
9
-
10
- http://www.apache.org/licenses/LICENSE-2.0
11
-
12
- Unless required by applicable law or agreed to in writing, software
13
- distributed under the License is distributed on an "AS IS" BASIS,
14
- WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
15
- See the License for the specific language governing permissions and
16
- limitations under the License.
17
- -->
18
-
19
- <!-- This is the Solr schema file. This file should be named "schema.xml" and
20
- should be in the conf directory under the solr home
21
- (i.e. ./solr/conf/schema.xml by default)
22
- or located where the classloader for the Solr webapp can find it.
23
-
24
- For more information, on how to customize this file, please see
25
- http://wiki.apache.org/solr/SchemaXml
1
+ <?xml version="1.0" encoding="UTF-8" ?>
2
+ <!--
3
+ This is the basic solr schema for use with ActiveFedora 1.1
4
+
5
+ Based on "Blacklight Demo Index" schema version 2.4
6
+
7
+ Changes from Blacklight Schema:
8
+ * _t copyFields are stored
9
+
10
+ For information on how to customize a solr schema file, please see
11
+ http://wiki.apache.org/solr/SchemaXml.
26
12
  -->
27
13
 
28
- <schema name="active_fedora" version="0.1">
29
- <!-- attribute "name" is the name of this schema and is only used for display purposes.
30
- Applications should change this to reflect the nature of the search collection.
31
- version="1.1" is Solr's version number for the schema syntax and semantics. It should
32
- not normally be changed by applications.
33
- 1.0: multiValued attribute did not exist, all fields are multiValued by nature
34
- 1.1: multiValued attribute introduced, false by default -->
35
-
14
+ <schema name="ActiveFedora" version="1.1">
36
15
  <types>
37
- <!-- field type definitions. The "name" attribute is
38
- just a label to be used by field definitions. The "class"
39
- attribute and any other attributes determine the real
40
- behavior of the fieldtype.
41
- Class names starting with "solr" refer to java classes in the
42
- org.apache.solr.analysis package.
43
- -->
44
-
45
- <!-- The StrField type is not analyzed, but indexed/stored verbatim.
46
- - StrField and TextField support an optional compressThreshold which
47
- limits compression (if enabled in the derived fields) to values which
48
- exceed a certain size (in characters).
49
- -->
50
- <fieldtype name="string" class="solr.StrField" sortMissingLast="true" omitNorms="true"/>
51
-
52
- <!-- boolean type: "true" or "false" -->
53
- <fieldtype name="boolean" class="solr.BoolField" sortMissingLast="true" omitNorms="true"/>
54
-
55
- <!-- The optional sortMissingLast and sortMissingFirst attributes are
56
- currently supported on types that are sorted internally as strings.
57
- - If sortMissingLast="true", then a sort on this field will cause documents
58
- without the field to come after documents with the field,
59
- regardless of the requested sort order (asc or desc).
60
- - If sortMissingFirst="true", then a sort on this field will cause documents
61
- without the field to come before documents with the field,
62
- regardless of the requested sort order.
63
- - If sortMissingLast="false" and sortMissingFirst="false" (the default),
64
- then default lucene sorting will be used which places docs without the
65
- field first in an ascending sort and last in a descending sort.
66
- -->
67
-
68
-
69
- <!-- numeric field types that store and index the text
70
- value verbatim (and hence don't support range queries, since the
71
- lexicographic ordering isn't equal to the numeric ordering) -->
72
- <fieldtype name="integer" class="solr.IntField" omitNorms="true"/>
73
- <fieldtype name="long" class="solr.LongField" omitNorms="true"/>
74
- <fieldtype name="float" class="solr.FloatField" omitNorms="true"/>
75
- <fieldtype name="double" class="solr.DoubleField" omitNorms="true"/>
76
-
77
-
78
- <!-- Numeric field types that manipulate the value into
79
- a string value that isn't human-readable in its internal form,
80
- but with a lexicographic ordering the same as the numeric ordering,
81
- so that range queries work correctly. -->
82
- <fieldtype name="sint" class="solr.SortableIntField" sortMissingLast="true" omitNorms="true"/>
83
- <fieldtype name="slong" class="solr.SortableLongField" sortMissingLast="true" omitNorms="true"/>
84
- <fieldtype name="sfloat" class="solr.SortableFloatField" sortMissingLast="true" omitNorms="true"/>
85
- <fieldtype name="sdouble" class="solr.SortableDoubleField" sortMissingLast="true" omitNorms="true"/>
86
-
87
-
88
- <!-- The format for this date field is of the form 1995-12-31T23:59:59Z, and
89
- is a more restricted form of the canonical representation of dateTime
90
- http://www.w3.org/TR/xmlschema-2/#dateTime
91
- The trailing "Z" designates UTC time and is mandatory.
92
- Optional fractional seconds are allowed: 1995-12-31T23:59:59.999Z
93
- All other components are mandatory.
94
-
95
- Expressions can also be used to denote calculations that should be
96
- performed relative to "NOW" to determine the value, ie...
97
-
98
- NOW/HOUR
99
- ... Round to the start of the current hour
100
- NOW-1DAY
101
- ... Exactly 1 day prior to now
102
- NOW/DAY+6MONTHS+3DAYS
103
- ... 6 months and 3 days in the future from the start of
104
- the current day
105
-
106
- Consult the DateField javadocs for more information.
107
- -->
108
- <fieldtype name="date" class="solr.DateField" sortMissingLast="true" omitNorms="true"/>
109
-
110
- <!-- solr.TextField allows the specification of custom text analyzers
111
- specified as a tokenizer and a list of token filters. Different
112
- analyzers may be specified for indexing and querying.
113
-
114
- The optional positionIncrementGap puts space between multiple fields of
115
- this type on the same document, with the purpose of preventing false phrase
116
- matching across fields.
117
-
118
- For more info on customizing your analyzer chain, please see
119
- http://wiki.apache.org/solr/AnalyzersTokenizersTokenFilters
120
- -->
121
-
122
- <!-- One can also specify an existing Analyzer class that has a
123
- default constructor via the class attribute on the analyzer element
124
- <fieldtype name="text_greek" class="solr.TextField">
125
- <analyzer class="org.apache.lucene.analysis.el.GreekAnalyzer"/>
126
- </fieldType>
127
- -->
128
-
129
- <!-- A text field that only splits on whitespace for exact matching of words -->
130
- <fieldtype name="text_ws" class="solr.TextField" positionIncrementGap="100">
131
- <analyzer>
16
+ <fieldType name="string" class="solr.StrField" sortMissingLast="true" omitNorms="true"/>
17
+ <fieldType name="boolean" class="solr.BoolField" sortMissingLast="true" omitNorms="true"/>
18
+ <fieldType name="integer" class="solr.IntField" omitNorms="true"/>
19
+ <fieldType name="long" class="solr.LongField" omitNorms="true"/>
20
+ <fieldType name="float" class="solr.FloatField" omitNorms="true"/>
21
+ <fieldType name="double" class="solr.DoubleField" omitNorms="true"/>
22
+ <fieldType name="sint" class="solr.SortableIntField" sortMissingLast="true" omitNorms="true"/>
23
+ <fieldType name="slong" class="solr.SortableLongField" sortMissingLast="true" omitNorms="true"/>
24
+ <fieldType name="sfloat" class="solr.SortableFloatField" sortMissingLast="true" omitNorms="true"/>
25
+ <fieldType name="sdouble" class="solr.SortableDoubleField" sortMissingLast="true" omitNorms="true"/>
26
+ <fieldType name="date" class="solr.DateField" sortMissingLast="true" omitNorms="true"/>
27
+ <fieldType name="random" class="solr.RandomSortField" indexed="true" />
28
+
29
+ <fieldType name="text" class="solr.TextField" positionIncrementGap="100">
30
+ <analyzer type="index">
132
31
  <tokenizer class="solr.WhitespaceTokenizerFactory"/>
32
+ <filter class="schema.UnicodeNormalizationFilterFactory" version="icu4j" composed="false" remove_diacritics="true" remove_modifiers="true" fold="true" />
33
+ <filter class="solr.StopFilterFactory" ignoreCase="true" words="stopwords.txt" enablePositionIncrements="true" />
34
+ <filter class="solr.WordDelimiterFilterFactory" generateWordParts="1" generateNumberParts="1" catenateWords="1" catenateNumbers="1" catenateAll="0" splitOnCaseChange="1"/>
35
+ <filter class="solr.LowerCaseFilterFactory"/>
36
+ <filter class="solr.EnglishPorterFilterFactory" protected="protwords.txt"/>
37
+ <filter class="solr.RemoveDuplicatesTokenFilterFactory"/>
133
38
  </analyzer>
134
- </fieldtype>
135
-
136
- <fieldtype name="text" class="solr.TextField" positionIncrementGap="100">
137
- <analyzer>
138
- <tokenizer class="solr.StandardTokenizerFactory"/>
139
- <filter class="solr.StandardFilterFactory"/>
39
+ <analyzer type="query">
40
+ <tokenizer class="solr.WhitespaceTokenizerFactory"/>
41
+ <filter class="schema.UnicodeNormalizationFilterFactory" version="icu4j" composed="false" remove_diacritics="true" remove_modifiers="true" fold="true" />
42
+ <filter class="solr.SynonymFilterFactory" synonyms="synonyms.txt" ignoreCase="true" expand="true"/>
43
+ <filter class="solr.StopFilterFactory" ignoreCase="true" words="stopwords.txt" enablePositionIncrements="true" />
44
+ <filter class="solr.WordDelimiterFilterFactory" generateWordParts="1" generateNumberParts="1" catenateWords="0" catenateNumbers="0" catenateAll="0" splitOnCaseChange="1"/>
140
45
  <filter class="solr.LowerCaseFilterFactory"/>
46
+ <filter class="solr.EnglishPorterFilterFactory" protected="protwords.txt"/>
47
+ <filter class="solr.RemoveDuplicatesTokenFilterFactory"/>
141
48
  </analyzer>
142
- </fieldtype>
49
+ </fieldType>
143
50
 
144
- <fieldtype name="text_zh" class="solr.TextField">
145
- <analyzer class="org.apache.lucene.analysis.cn.ChineseAnalyzer"/>
51
+ <!-- Analyzed Text, no Stemming or Synonyms -->
52
+ <fieldtype name="textNoStem" class="solr.TextField" positionIncrementGap="100">
53
+ <analyzer type="index">
54
+ <tokenizer class="solr.WhitespaceTokenizerFactory" />
55
+ <filter class="schema.UnicodeNormalizationFilterFactory" version="icu4j" composed="false" remove_diacritics="true" remove_modifiers="true" fold="true" />
56
+ <filter class="solr.StopFilterFactory" ignoreCase="true" words="stopwords.txt" enablePositionIncrements="true" />
57
+ <filter class="solr.WordDelimiterFilterFactory" generateWordParts="1" generateNumberParts="1" catenateWords="1" catenateNumbers="1" catenateAll="0" splitOnCaseChange="1" />
58
+ <filter class="solr.LowerCaseFilterFactory" />
59
+ <filter class="solr.RemoveDuplicatesTokenFilterFactory" />
60
+ </analyzer>
61
+ <analyzer type="query">
62
+ <tokenizer class="solr.WhitespaceTokenizerFactory" />
63
+ <filter class="schema.UnicodeNormalizationFilterFactory" version="icu4j" composed="false" remove_diacritics="true" remove_modifiers="true" fold="true" />
64
+ <filter class="solr.StopFilterFactory" ignoreCase="true" words="stopwords.txt" enablePositionIncrements="true" />
65
+ <filter class="solr.WordDelimiterFilterFactory" generateWordParts="1" generateNumberParts="1" catenateWords="0" catenateNumbers="0" catenateAll="0" splitOnCaseChange="1" />
66
+ <filter class="solr.LowerCaseFilterFactory" />
67
+ <filter class="solr.RemoveDuplicatesTokenFilterFactory" />
68
+ </analyzer>
146
69
  </fieldtype>
147
-
148
-
149
- <!-- Less flexible matching, but less false matches. Probably not ideal for product names,
150
- but may be good for SKUs. Can insert dashes in the wrong place and still match. -->
151
- <fieldtype name="textTight" class="solr.TextField" positionIncrementGap="100" >
70
+
71
+ <fieldType name="textSpell" class="solr.TextField" positionIncrementGap="100" >
152
72
  <analyzer>
153
- <tokenizer class="solr.WhitespaceTokenizerFactory"/>
154
- <filter class="solr.SynonymFilterFactory" synonyms="synonyms.txt" ignoreCase="true" expand="false"/>
73
+ <tokenizer class="solr.StandardTokenizerFactory"/>
155
74
  <filter class="solr.StopFilterFactory" ignoreCase="true" words="stopwords.txt"/>
156
- <filter class="solr.WordDelimiterFilterFactory" generateWordParts="0" generateNumberParts="0" catenateWords="1" catenateNumbers="1" catenateAll="0"/>
75
+ <filter class="solr.StandardFilterFactory"/>
157
76
  <filter class="solr.LowerCaseFilterFactory"/>
158
- <filter class="solr.EnglishPorterFilterFactory" protected="protwords.txt"/>
159
77
  <filter class="solr.RemoveDuplicatesTokenFilterFactory"/>
160
78
  </analyzer>
161
- </fieldtype>
162
-
163
- </types>
164
-
165
-
166
- <fields>
167
- <!-- Valid attributes for fields:
168
- name: mandatory - the name for the field
169
- type: mandatory - the name of a previously defined type from the <types> section
170
- indexed: true if this field should be indexed (searchable or sortable)
171
- stored: true if this field should be retrievable
172
- compressed: [false] if this field should be stored using gzip compression
173
- (this will only apply if the field type is compressable; among
174
- the standard field types, only TextField and StrField are)
175
- multiValued: true if this field may contain multiple values per document
176
- omitNorms: (expert) set to true to omit the norms associated with
177
- this field (this disables length normalization and index-time
178
- boosting for the field, and saves some memory). Only full-text
179
- fields or fields that need an index-time boost need norms.
180
- -->
181
-
182
- <field name="id" type="string" indexed="true" stored="true"/>
183
-
184
- <!-- catchall field, containing all other searchable text fields (implemented
185
- via copyField further on in this schema -->
186
- <field name="text" type="text" indexed="true" stored="false" multiValued="true"/>
187
- <!-- catchall field, containing all other searchable text fields (implemented
188
- via copyField further on in this schema -->
189
- <field name="date" type="date" indexed="true" stored="false" multiValued="true"/>
190
-
191
- <!-- Dynamic field definitions. If a field name is not found, dynamicFields
192
- will be used if the name matches any of the patterns.
193
- RESTRICTION: the glob-like pattern in the name attribute must have
194
- a "*" only at the start or the end.
195
- EXAMPLE: name="*_i" will match any field ending in _i (like myid_i, z_i)
196
- Longer patterns will be matched first. if equal size patterns
197
- both match, the first appearing in the schema will be used. -->
198
- <dynamicField name="*_date" type="date" indexed="true" stored="true" multiValued="true"/>
199
- <dynamicField name="*_name" type="date" indexed="true" stored="true" multiValued="true"/>
200
- <dynamicField name="*_field" type="text" indexed="true" stored="true" multiValued="true"/>
201
-
202
- <dynamicField name="*_facet" type="string" indexed="true" stored="true" multiValued="true"/>
203
- <dynamicField name="*_zh_text" type="text_zh" indexed="true" stored="true" multiValued="true"/>
204
- <dynamicField name="*_text" type="text" indexed="true" stored="true" multiValued="true"/>
205
- <dynamicField name="*_display" type="text" indexed="false" stored="true" multiValued="true"/>
206
- </fields>
207
-
208
- <!-- field to use to determine and enforce document uniqueness. -->
209
- <uniqueKey>id</uniqueKey>
210
-
211
- <!-- field for the QueryParser to use when an explicit fieldname is absent -->
212
- <defaultSearchField>text</defaultSearchField>
213
-
214
- <!-- SolrQueryParser configuration: defaultOperator="AND|OR" -->
215
- <solrQueryParser defaultOperator="AND"/>
216
-
217
- <!-- copyField commands copy one field to another at the time a document
218
- is added to the index. It's used either to index the same field differently,
219
- or to add multiple fields to the same field for easier/faster searching. -->
220
- <copyField source="*_date" dest="date"/>
221
- <copyField source="*_text" dest="text"/>
222
- <copyField source="*_facet" dest="text"/>
79
+ </fieldType>
223
80
 
224
- <!-- Similarity is the scoring routine for each document vs. a query.
225
- A custom similarity may be specified here, but the default is fine
226
- for most applications. -->
227
- <!-- <similarity class="org.apache.lucene.search.DefaultSimilarity"/> -->
81
+ <fieldType name="alphaOnlySort" class="solr.TextField" sortMissingLast="true" omitNorms="true">
82
+ <analyzer>
83
+ <tokenizer class="solr.KeywordTokenizerFactory"/>
84
+ <filter class="schema.UnicodeNormalizationFilterFactory" version="icu4j" composed="false" remove_diacritics="true" remove_modifiers="true" fold="true" />
85
+ <filter class="solr.LowerCaseFilterFactory" />
86
+ <filter class="solr.TrimFilterFactory" />
87
+ <!--
88
+ <filter class="solr.PatternReplaceFilterFactory" pattern="([^a-z\d])" replacement="" replace="all" />
89
+ -->
90
+ </analyzer>
91
+ </fieldType>
92
+ </types>
93
+
94
+ <fields>
95
+ <!-- NOTE: this is not a full list of fields in the index; dynamic fields are also used -->
96
+ <field name="id" type="string" indexed="true" stored="true" required="true" />
97
+ <field name="timestamp" type="date" indexed="true" stored="true" default="NOW" multiValued="false"/>
98
+ <!-- default, catch all search field -->
99
+ <field name="text" type="text" indexed="true" stored="false" multiValued="true"/>
100
+
101
+ <!-- these display fields are NOT multi-valued -->
102
+ <field name="marc_display" type="string" indexed="false" stored="true" multiValued="false"/>
103
+ <field name="title_display" type="string" indexed="false" stored="true" multiValued="false"/>
104
+ <field name="title_vern_display" type="string" indexed="false" stored="true" multiValued="false"/>
105
+ <field name="subtitle_display" type="string" indexed="false" stored="true" multiValued="false"/>
106
+ <field name="subtitle_vern_display" type="string" indexed="false" stored="true" multiValued="false"/>
107
+ <field name="author_display" type="string" indexed="false" stored="true" multiValued="false"/>
108
+ <field name="author_vern_display" type="string" indexed="false" stored="true" multiValued="false"/>
109
+
110
+ <!-- these fields are also used for display, so they must be stored -->
111
+ <field name="isbn_t" type="text" indexed="true" stored="true" multiValued="true"/>
112
+ <field name="language_facet" type="string" indexed="true" stored="true" multiValued="true" />
113
+ <field name="subject_topic_facet" type="string" indexed="true" stored="true" multiValued="true" />
114
+ <field name="subject_era_facet" type="string" indexed="true" stored="true" multiValued="true" />
115
+ <field name="subject_geo_facet" type="string" indexed="true" stored="true" multiValued="true" />
116
+ <!-- pub_date is used for facet and display so it must be indexed and stored -->
117
+ <field name="pub_date" type="string" indexed="true" stored="true" multiValued="true"/>
118
+ <!-- format is used for facet, display, and choosing which partial to use for the show view, so it must be stored and indexed -->
119
+ <field name="format" type="string" indexed="true" stored="true"/>
120
+
121
+ <dynamicField name="*_i" type="sint" indexed="true" stored="true"/>
122
+ <dynamicField name="*_s" type="string" indexed="true" stored="true" multiValued="true"/>
123
+ <dynamicField name="*_l" type="slong" indexed="true" stored="true"/>
124
+ <dynamicField name="*_t" type="text" indexed="true" stored="true" multiValued="true"/>
125
+ <dynamicField name="*_b" type="boolean" indexed="true" stored="true"/>
126
+ <dynamicField name="*_f" type="sfloat" indexed="true" stored="true"/>
127
+ <dynamicField name="*_d" type="sdouble" indexed="true" stored="true"/>
128
+ <dynamicField name="*_dt" type="date" indexed="true" stored="true"/>
129
+ <dynamicField name="random*" type="random" />
130
+
131
+ <dynamicField name="*_facet" type="string" indexed="true" stored="false" multiValued="true" />
132
+ <dynamicField name="*_display" type="string" indexed="false" stored="true" multiValued="true" />
133
+ <dynamicField name="*_sort" type="alphaOnlySort" indexed="true" stored="false"/>
134
+ <dynamicField name="*_unstem_search" type="textNoStem" indexed="true" stored="false" multiValued="true" />
135
+ <dynamicField name="*spell" type="textSpell" indexed="true" stored="false" multiValued="true"/>
136
+
137
+ </fields>
138
+
139
+ <uniqueKey>id</uniqueKey>
140
+ <defaultSearchField>text</defaultSearchField>
141
+ <solrQueryParser defaultOperator="OR"/>
142
+
143
+ <!-- Copy Fields -->
144
+
145
+ <!-- unstemmed fields -->
146
+ <copyField source="title_t" dest="title_unstem_search"/>
147
+ <copyField source="subtitle_t" dest="subtitle_unstem_search"/>
148
+ <copyField source="title_addl_t" dest="title_addl_unstem_search"/>
149
+ <copyField source="title_added_entry_t" dest="title_added_entry_unstem_search"/>
150
+ <copyField source="title_series_t" dest="title_series_unstem_search"/>
151
+ <copyField source="author_t" dest="author_unstem_search"/>
152
+ <copyField source="author_addl_t" dest="author_addl_unstem_search"/>
153
+ <copyField source="subject_t" dest="subject_unstem_search"/>
154
+ <copyField source="subject_addl_t" dest="subject_addl_unstem_search"/>
155
+ <copyField source="subject_topic_facet" dest="subject_topic_unstem_search"/>
156
+
157
+ <!-- sort fields -->
158
+ <copyField source="pub_date" dest="pub_date_sort"/>
159
+
160
+ <!-- spellcheck fields -->
161
+ <!-- default spell check; should match fields for default request handler -->
162
+ <!-- it won't work with a copy of a copy field -->
163
+ <copyField source="*_t" dest="spell"/>
164
+ <copyField source="*_facet" dest="spell"/>
165
+ <!-- title spell check; should match fields for title request handler -->
166
+ <copyField source="title_t" dest="title_spell"/>
167
+ <copyField source="subtitle_t" dest="title_spell"/>
168
+ <copyField source="addl_titles_t" dest="title_spell"/>
169
+ <copyField source="title_added_entry_t" dest="title_spell"/>
170
+ <copyField source="title_series_t" dest="title_spell"/>
171
+ <!-- author spell check; should match fields for author request handler -->
172
+ <copyField source="author_t" dest="author_spell"/>
173
+ <copyField source="author_addl_t" dest="author_spell"/>
174
+ <!-- subject spell check; should match fields for subject request handler -->
175
+ <copyField source="subject_topic_facet" dest="subject_spell"/>
176
+ <copyField source="subject_t" dest="subject_spell"/>
177
+ <copyField source="subject_addl_t" dest="subject_spell"/>
178
+
179
+ <!-- OpenSearch query field should match request handler search fields -->
180
+ <copyField source="title_t" dest="opensearch_display"/>
181
+ <copyField source="subtitle_t" dest="opensearch_display"/>
182
+ <copyField source="addl_titles_t" dest="opensearch_display"/>
183
+ <copyField source="title_added_entry_t" dest="opensearch_display"/>
184
+ <copyField source="title_series_t" dest="opensearch_display"/>
185
+ <copyField source="author_t" dest="opensearch_display"/>
186
+ <copyField source="author_addl_t" dest="opensearch_display"/>
187
+ <copyField source="subject_topic_facet" dest="opensearch_display"/>
188
+ <copyField source="subject_t" dest="opensearch_display"/>
189
+ <copyField source="subject_addl_t" dest="opensearch_display"/>
228
190
 
229
191
  </schema>
@@ -0,0 +1,1069 @@
1
+ <?xml version="1.0" encoding="UTF-8" ?>
2
+ <!--
3
+ Licensed to the Apache Software Foundation (ASF) under one or more
4
+ contributor license agreements. See the NOTICE file distributed with
5
+ this work for additional information regarding copyright ownership.
6
+ The ASF licenses this file to You under the Apache License, Version 2.0
7
+ (the "License"); you may not use this file except in compliance with
8
+ the License. You may obtain a copy of the License at
9
+
10
+ http://www.apache.org/licenses/LICENSE-2.0
11
+
12
+ Unless required by applicable law or agreed to in writing, software
13
+ distributed under the License is distributed on an "AS IS" BASIS,
14
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
15
+ See the License for the specific language governing permissions and
16
+ limitations under the License.
17
+ -->
18
+ <!--
19
+ For more details about configurations options that may appear in this
20
+ file, see http://wiki.apache.org/solr/SolrConfigXml.
21
+
22
+ Specifically, the Solr Config can support XInclude, which may make it easier to manage
23
+ the configuration. See https://issues.apache.org/jira/browse/SOLR-1167
24
+ -->
25
+ <config>
26
+ <!-- Set this to 'false' if you want solr to continue working after it has
27
+ encountered a severe configuration error. In a production environment,
28
+ you may want solr to keep working even if one handler is mis-configured.
29
+
30
+ You may also set this to false by setting the system property:
31
+ -Dsolr.abortOnConfigurationError=false
32
+ -->
33
+ <abortOnConfigurationError>${solr.abortOnConfigurationError:true}</abortOnConfigurationError>
34
+
35
+ <!-- lib directives can be used to instruct Solr to load any Jars identified
36
+ and use them to resolve any "plugins" specified in your solrconfig.xml or
37
+ schema.xml (ie: Analyzers, Request Handlers, etc...).
38
+
39
+ All directories and paths are resolved relative to the instanceDir.
40
+
41
+ If a "./lib" directory exists in your instanceDir, all files found in it
42
+ are included as if you had used the following syntax...
43
+
44
+ <lib dir="./lib" />
45
+ -->
46
+ <!-- A dir option by itself adds any files found in the directory to the
47
+ classpath, this is useful for including all jars in a directory.
48
+ -->
49
+ <lib dir="../../contrib/extraction/lib" />
50
+ <!-- When a regex is specified in addition to a directory, only the files in that
51
+ directory which completely match the regex (anchored on both ends)
52
+ will be included.
53
+ -->
54
+ <lib dir="../../dist/" regex="apache-solr-cell-\d.*\.jar" />
55
+ <lib dir="../../dist/" regex="apache-solr-clustering-\d.*\.jar" />
56
+ <!-- If a dir option (with or without a regex) is used and nothing is found
57
+ that matches, it will be ignored
58
+ -->
59
+ <lib dir="../../contrib/clustering/lib/downloads/" />
60
+ <lib dir="../../contrib/clustering/lib/" />
61
+ <lib dir="/total/crap/dir/ignored" />
62
+ <!-- an exact path can be used to specify a specific file. This will cause
63
+ a serious error to be logged if it can't be loaded.
64
+ <lib path="../a-jar-that-does-not-exist.jar" />
65
+ -->
66
+
67
+
68
+ <!-- Used to specify an alternate directory to hold all index data
69
+ other than the default ./data under the Solr home.
70
+ If replication is in use, this should match the replication configuration. -->
71
+ <dataDir>${solr.data.dir:}</dataDir>
72
+
73
+
74
+ <!-- WARNING: this <indexDefaults> section only provides defaults for index writers
75
+ in general. See also the <mainIndex> section after that when changing parameters
76
+ for Solr's main Lucene index. -->
77
+ <indexDefaults>
78
+ <!-- Values here affect all index writers and act as a default unless overridden. -->
79
+ <useCompoundFile>false</useCompoundFile>
80
+
81
+ <mergeFactor>10</mergeFactor>
82
+ <!-- If both ramBufferSizeMB and maxBufferedDocs are set, then Lucene will flush
83
+ based on whichever limit is hit first. -->
84
+ <!--<maxBufferedDocs>1000</maxBufferedDocs>-->
85
+
86
+ <!-- Sets the amount of RAM that may be used by Lucene indexing
87
+ for buffering added documents and deletions before they are
88
+ flushed to the Directory. -->
89
+ <ramBufferSizeMB>32</ramBufferSizeMB>
90
+ <!-- <maxMergeDocs>2147483647</maxMergeDocs> -->
91
+ <maxFieldLength>10000</maxFieldLength>
92
+ <writeLockTimeout>1000</writeLockTimeout>
93
+ <commitLockTimeout>10000</commitLockTimeout>
94
+
95
+ <!--
96
+ Expert: Turn on Lucene's auto commit capability. This causes intermediate
97
+ segment flushes to write a new lucene index descriptor, enabling it to be
98
+ opened by an external IndexReader. This can greatly slow down indexing
99
+ speed. NOTE: Despite the name, this value does not have any relation to
100
+ Solr's autoCommit functionality
101
+ -->
102
+ <!--<luceneAutoCommit>false</luceneAutoCommit>-->
103
+
104
+ <!--
105
+ Expert: The Merge Policy in Lucene controls how merging is handled by
106
+ Lucene. The default in 2.3 is the LogByteSizeMergePolicy, previous
107
+ versions used LogDocMergePolicy.
108
+
109
+ LogByteSizeMergePolicy chooses segments to merge based on their size. The
110
+ Lucene 2.2 default, LogDocMergePolicy chose when to merge based on number
111
+ of documents
112
+
113
+ Other implementations of MergePolicy must have a no-argument constructor
114
+ -->
115
+ <!--<mergePolicy class="org.apache.lucene.index.LogByteSizeMergePolicy"/>-->
116
+
117
+ <!--
118
+ Expert:
119
+ The Merge Scheduler in Lucene controls how merges are performed. The
120
+ ConcurrentMergeScheduler (Lucene 2.3 default) can perform merges in the
121
+ background using separate threads. The SerialMergeScheduler (Lucene 2.2
122
+ default) does not.
123
+ -->
124
+ <!--<mergeScheduler class="org.apache.lucene.index.ConcurrentMergeScheduler"/>-->
125
+
126
+
127
+ <!--
128
+ This option specifies which Lucene LockFactory implementation to use.
129
+
130
+ single = SingleInstanceLockFactory - suggested for a read-only index
131
+ or when there is no possibility of another process trying
132
+ to modify the index.
133
+ native = NativeFSLockFactory - uses OS native file locking
134
+ simple = SimpleFSLockFactory - uses a plain file for locking
135
+
136
+ (For backwards compatibility with Solr 1.2, 'simple' is the default
137
+ if not specified.)
138
+ -->
139
+ <lockType>native</lockType>
140
+ <!--
141
+ Expert:
142
+ Controls how often Lucene loads terms into memory -->
143
+ <!--<termIndexInterval>256</termIndexInterval>-->
144
+ </indexDefaults>
145
+
146
+ <mainIndex>
147
+ <!-- options specific to the main on-disk lucene index -->
148
+ <useCompoundFile>false</useCompoundFile>
149
+ <ramBufferSizeMB>32</ramBufferSizeMB>
150
+ <mergeFactor>10</mergeFactor>
151
+ <!-- Deprecated -->
152
+ <!--<maxBufferedDocs>1000</maxBufferedDocs>-->
153
+ <!--<maxMergeDocs>2147483647</maxMergeDocs>-->
154
+
155
+ <!-- inherit from indexDefaults <maxFieldLength>10000</maxFieldLength> -->
156
+
157
+ <!-- If true, unlock any held write or commit locks on startup.
158
+ This defeats the locking mechanism that allows multiple
159
+ processes to safely access a lucene index, and should be
160
+ used with care.
161
+ This is not needed if lock type is 'none' or 'single'
162
+ -->
163
+ <unlockOnStartup>false</unlockOnStartup>
164
+
165
+ <!-- If true, IndexReaders will be reopened (often more efficient) instead
166
+ of closed and then opened. -->
167
+ <reopenReaders>true</reopenReaders>
168
+
169
+ <!--
170
+ Expert:
171
+ Controls how often Lucene loads terms into memory. Default is 128 and is likely good for most everyone. -->
172
+ <!--<termIndexInterval>256</termIndexInterval>-->
173
+
174
+ <!--
175
+ Custom deletion policies can be specified here. The class must
176
+ implement org.apache.lucene.index.IndexDeletionPolicy.
177
+
178
+ http://lucene.apache.org/java/2_9_1/api/all/org/apache/lucene/index/IndexDeletionPolicy.html
179
+
180
+ The standard Solr IndexDeletionPolicy implementation supports deleting
181
+ index commit points on number of commits, age of commit point and
182
+ optimized status.
183
+
184
+ The latest commit point should always be preserved regardless
185
+ of the criteria.
186
+ -->
187
+ <deletionPolicy class="solr.SolrDeletionPolicy">
188
+ <!-- The number of commit points to be kept -->
189
+ <str name="maxCommitsToKeep">1</str>
190
+ <!-- The number of optimized commit points to be kept -->
191
+ <str name="maxOptimizedCommitsToKeep">0</str>
192
+ <!--
193
+ Delete all commit points once they have reached the given age.
194
+ Supports DateMathParser syntax e.g.
195
+
196
+ <str name="maxCommitAge">30MINUTES</str>
197
+ <str name="maxCommitAge">1DAY</str>
198
+ -->
199
+ </deletionPolicy>
200
+
201
+ <!-- To aid in advanced debugging, you may turn on IndexWriter debug logging.
202
+ Setting to true will set the file that the underlying Lucene IndexWriter
203
+ will write its debug infostream to. -->
204
+ <infoStream file="INFOSTREAM.txt">false</infoStream>
205
+
206
+ </mainIndex>
207
+
208
+ <!-- Enables JMX if and only if an existing MBeanServer is found, use this
209
+ if you want to configure JMX through JVM parameters. Remove this to disable
210
+ exposing Solr configuration and statistics to JMX.
211
+
212
+ If you want to connect to a particular server, specify the agentId
213
+ e.g. <jmx agentId="myAgent" />
214
+
215
+ If you want to start a new MBeanServer, specify the serviceUrl
216
+ e.g <jmx serviceUrl="service:jmx:rmi:///jndi/rmi://localhost:9999/solr"/>
217
+
218
+ For more details see http://wiki.apache.org/solr/SolrJmx
219
+ -->
220
+ <jmx />
221
+
222
+ <!-- the default high-performance update handler -->
223
+ <updateHandler class="solr.DirectUpdateHandler2">
224
+ <!-- A prefix of "solr." for class names is an alias that
225
+ causes solr to search appropriate packages, including
226
+ org.apache.solr.(search|update|request|core|analysis)
227
+ -->
228
+
229
+ <!-- Perform a <commit/> automatically under certain conditions:
230
+ maxDocs - number of updates since last commit is greater than this
231
+ maxTime - oldest uncommitted update (in ms) is this long ago
232
+ Instead of enabling autoCommit, consider using "commitWithin"
233
+ when adding documents. http://wiki.apache.org/solr/UpdateXmlMessages
234
+ <autoCommit>
235
+ <maxDocs>10000</maxDocs>
236
+ <maxTime>1000</maxTime>
237
+ </autoCommit>
238
+ -->
239
+
240
+
241
+ <!-- The RunExecutableListener executes an external command from a
242
+ hook such as postCommit or postOptimize.
243
+ exe - the name of the executable to run
244
+ dir - dir to use as the current working directory. default="."
245
+ wait - the calling thread waits until the executable returns. default="true"
246
+ args - the arguments to pass to the program. default=nothing
247
+ env - environment variables to set. default=nothing
248
+ -->
249
+ <!-- A postCommit event is fired after every commit or optimize command
250
+ <listener event="postCommit" class="solr.RunExecutableListener">
251
+ <str name="exe">solr/bin/snapshooter</str>
252
+ <str name="dir">.</str>
253
+ <bool name="wait">true</bool>
254
+ <arr name="args"> <str>arg1</str> <str>arg2</str> </arr>
255
+ <arr name="env"> <str>MYVAR=val1</str> </arr>
256
+ </listener>
257
+ -->
258
+ <!-- A postOptimize event is fired only after every optimize command
259
+ <listener event="postOptimize" class="solr.RunExecutableListener">
260
+ <str name="exe">snapshooter</str>
261
+ <str name="dir">solr/bin</str>
262
+ <bool name="wait">true</bool>
263
+ </listener>
264
+ -->
265
+
266
+ </updateHandler>
267
+
268
+ <!-- Use the following format to specify a custom IndexReaderFactory - allows for alternate
269
+ IndexReader implementations.
270
+
271
+ ** Experimental Feature **
272
+ Please note - Using a custom IndexReaderFactory may prevent certain other features
273
+ from working. The API to IndexReaderFactory may change without warning or may even
274
+ be removed from future releases if the problems cannot be resolved.
275
+
276
+ ** Features that may not work with custom IndexReaderFactory **
277
+ The ReplicationHandler assumes a disk-resident index. Using a custom
278
+ IndexReader implementation may cause incompatibility with ReplicationHandler and
279
+ may cause replication to not work correctly. See SOLR-1366 for details.
280
+
281
+ <indexReaderFactory name="IndexReaderFactory" class="package.class">
282
+ Parameters as required by the implementation
283
+ </indexReaderFactory >
284
+ -->
285
+ <!-- To set the termInfosIndexDivisor, do this: -->
286
+ <!--<indexReaderFactory name="IndexReaderFactory" class="org.apache.solr.core.StandardIndexReaderFactory">
287
+ <int name="termInfosIndexDivisor">12</int>
288
+ </indexReaderFactory >-->
289
+
290
+
291
+ <query>
292
+ <!-- Maximum number of clauses in a boolean query... in the past, this affected
293
+ range or prefix queries that expanded to big boolean queries - built in Solr
294
+ query parsers no longer create queries with this limitation.
295
+ An exception is thrown if exceeded. -->
296
+ <maxBooleanClauses>1024</maxBooleanClauses>
297
+
298
+
299
+ <!-- There are two implementations of cache available for Solr,
300
+ LRUCache, based on a synchronized LinkedHashMap, and
301
+ FastLRUCache, based on a ConcurrentHashMap. FastLRUCache has faster gets
302
+ and slower puts in single threaded operation and thus is generally faster
303
+ than LRUCache when the hit ratio of the cache is high (> 75%), and may be
304
+ faster under other scenarios on multi-cpu systems. -->
305
+ <!-- Cache used by SolrIndexSearcher for filters (DocSets),
306
+ unordered sets of *all* documents that match a query.
307
+ When a new searcher is opened, its caches may be prepopulated
308
+ or "autowarmed" using data from caches in the old searcher.
309
+ autowarmCount is the number of items to prepopulate. For LRUCache,
310
+ the autowarmed items will be the most recently accessed items.
311
+ Parameters:
312
+ class - the SolrCache implementation LRUCache or FastLRUCache
313
+ size - the maximum number of entries in the cache
314
+ initialSize - the initial capacity (number of entries) of
315
+ the cache. (see java.util.HashMap)
316
+ autowarmCount - the number of entries to prepopulate from
317
+ an old cache.
318
+ -->
319
+ <filterCache
320
+ class="solr.FastLRUCache"
321
+ size="512"
322
+ initialSize="512"
323
+ autowarmCount="0"/>
324
+
325
+ <!-- Cache used to hold field values that are quickly accessible
326
+ by document id. The fieldValueCache is created by default
327
+ even if not configured here.
328
+ <fieldValueCache
329
+ class="solr.FastLRUCache"
330
+ size="512"
331
+ autowarmCount="128"
332
+ showItems="32"
333
+ />
334
+ -->
335
+
336
+ <!-- queryResultCache caches results of searches - ordered lists of
337
+ document ids (DocList) based on a query, a sort, and the range
338
+ of documents requested. -->
339
+ <queryResultCache
340
+ class="solr.LRUCache"
341
+ size="512"
342
+ initialSize="512"
343
+ autowarmCount="0"/>
344
+
345
+ <!-- documentCache caches Lucene Document objects (the stored fields for each document).
346
+ Since Lucene internal document ids are transient, this cache will not be autowarmed. -->
347
+ <documentCache
348
+ class="solr.LRUCache"
349
+ size="512"
350
+ initialSize="512"
351
+ autowarmCount="0"/>
352
+
353
+ <!-- If true, stored fields that are not requested will be loaded lazily.
354
+ This can result in a significant speed improvement if the usual case is to
355
+ not load all stored fields, especially if the skipped fields are large
356
+ compressed text fields.
357
+ -->
358
+ <enableLazyFieldLoading>true</enableLazyFieldLoading>
359
+
360
+ <!-- Example of a generic cache. These caches may be accessed by name
361
+ through SolrIndexSearcher.getCache(),cacheLookup(), and cacheInsert().
362
+ The purpose is to enable easy caching of user/application level data.
363
+ The regenerator argument should be specified as an implementation
364
+ of solr.search.CacheRegenerator if autowarming is desired. -->
365
+ <!--
366
+ <cache name="myUserCache"
367
+ class="solr.LRUCache"
368
+ size="4096"
369
+ initialSize="1024"
370
+ autowarmCount="1024"
371
+ regenerator="org.mycompany.mypackage.MyRegenerator"
372
+ />
373
+ -->
374
+
375
+ <!-- An optimization that attempts to use a filter to satisfy a search.
376
+ If the requested sort does not include score, then the filterCache
377
+ will be checked for a filter matching the query. If found, the filter
378
+ will be used as the source of document ids, and then the sort will be
379
+ applied to that.
380
+ <useFilterForSortedQuery>true</useFilterForSortedQuery>
381
+ -->
382
+
383
+ <!-- An optimization for use with the queryResultCache. When a search
384
+ is requested, a superset of the requested number of document ids
385
+ are collected. For example, if a search for a particular query
386
+ requests matching documents 10 through 19, and queryResultWindowSize is 50,
387
+ then documents 0 through 49 will be collected and cached. Any further
388
+ requests in that range can be satisfied via the cache. -->
389
+ <queryResultWindowSize>20</queryResultWindowSize>
390
+
391
+ <!-- Maximum number of documents to cache for any entry in the
392
+ queryResultCache. -->
393
+ <queryResultMaxDocsCached>200</queryResultMaxDocsCached>
394
+
395
+ <!-- a newSearcher event is fired whenever a new searcher is being prepared
396
+ and there is a current searcher handling requests (aka registered).
397
+ It can be used to prime certain caches to prevent long request times for
398
+ certain requests.
399
+ -->
400
+ <!-- QuerySenderListener takes an array of NamedList and executes a
401
+ local query request for each NamedList in sequence. -->
402
+ <listener event="newSearcher" class="solr.QuerySenderListener">
403
+ <arr name="queries">
404
+ <!--
405
+ <lst> <str name="q">solr</str> <str name="start">0</str> <str name="rows">10</str> </lst>
406
+ <lst> <str name="q">rocks</str> <str name="start">0</str> <str name="rows">10</str> </lst>
407
+ <lst><str name="q">static newSearcher warming query from solrconfig.xml</str></lst>
408
+ -->
409
+ </arr>
410
+ </listener>
411
+
412
+ <!-- a firstSearcher event is fired whenever a new searcher is being
413
+ prepared but there is no current registered searcher to handle
414
+ requests or to gain autowarming data from. -->
415
+ <listener event="firstSearcher" class="solr.QuerySenderListener">
416
+ <arr name="queries">
417
+ <lst> <str name="q">solr rocks</str><str name="start">0</str><str name="rows">10</str></lst>
418
+ <lst><str name="q">static firstSearcher warming query from solrconfig.xml</str></lst>
419
+ </arr>
420
+ </listener>
421
+
422
+ <!-- If a search request comes in and there is no current registered searcher,
423
+ then immediately register the still warming searcher and use it. If
424
+ "false" then all requests will block until the first searcher is done
425
+ warming. -->
426
+ <useColdSearcher>false</useColdSearcher>
427
+
428
+ <!-- Maximum number of searchers that may be warming in the background
429
+ concurrently. An error is returned if this limit is exceeded. Recommend
430
+ 1-2 for read-only slaves, higher for masters w/o cache warming. -->
431
+ <maxWarmingSearchers>2</maxWarmingSearchers>
432
+
433
+ </query>
434
+
435
+ <!--
436
+ Let the dispatch filter handle /select?qt=XXX
437
+ handleSelect=true will use consistent error handling for /select and /update
438
+ handleSelect=false will use solr1.1 style error formatting
439
+ -->
440
+ <requestDispatcher handleSelect="true" >
441
+ <!--Make sure your system has some authentication before enabling remote streaming! -->
442
+ <requestParsers enableRemoteStreaming="true" multipartUploadLimitInKB="2048000" />
443
+
444
+ <!-- Set HTTP caching related parameters (for proxy caches and clients).
445
+
446
+ To get the behaviour of Solr 1.2 (ie: no caching related headers)
447
+ use the never304="true" option and do not specify a value for
448
+ <cacheControl>
449
+ -->
450
+ <!-- <httpCaching never304="true"> -->
451
+ <httpCaching lastModifiedFrom="openTime"
452
+ etagSeed="Solr">
453
+ <!-- lastModifiedFrom="openTime" is the default, the Last-Modified value
454
+ (and validation against If-Modified-Since requests) will all be
455
+ relative to when the current Searcher was opened.
456
+ You can change it to lastModifiedFrom="dirLastMod" if you want the
457
+ value to exactly correspond to when the physical index was last
458
+ modified.
459
+
460
+ etagSeed="..." is an option you can change to force the ETag
461
+ header (and validation against If-None-Match requests) to be
462
+ different even if the index has not changed (ie: when making
463
+ significant changes to your config file)
464
+
465
+ lastModifiedFrom and etagSeed are both ignored if you use the
466
+ never304="true" option.
467
+ -->
468
+ <!-- If you include a <cacheControl> directive, it will be used to
469
+ generate a Cache-Control header, as well as an Expires header
470
+ if the value contains "max-age="
471
+
472
+ By default, no Cache-Control header is generated.
473
+
474
+ You can use the <cacheControl> option even if you have set
475
+ never304="true"
476
+ -->
477
+ <!-- <cacheControl>max-age=30, public</cacheControl> -->
478
+ </httpCaching>
479
+ </requestDispatcher>
480
+
481
+
482
+ <!-- requestHandler plugins... incoming queries will be dispatched to the
483
+ correct handler based on the path or the qt (query type) param.
484
+ Names starting with a '/' are accessed with a path equal to the
485
+ registered name. Names without a leading '/' are accessed with:
486
+ http://host/app/select?qt=name
487
+ If no qt is defined, the requestHandler that declares default="true"
488
+ will be used.
489
+ -->
490
+ <requestHandler name="standard" class="solr.SearchHandler" default="true">
491
+ <!-- default values for query parameters -->
492
+ <lst name="defaults">
493
+ <str name="echoParams">explicit</str>
494
+ <!--
495
+ <int name="rows">10</int>
496
+ <str name="fl">*</str>
497
+ <str name="version">2.1</str>
498
+ -->
499
+ </lst>
500
+ </requestHandler>
501
+
502
+ <!-- Please refer to http://wiki.apache.org/solr/SolrReplication for details on configuring replication -->
503
+ <!-- remove the <lst name="master"> section if this is just a slave -->
504
+ <!-- remove the <lst name="slave"> section if this is just a master -->
505
+ <!--
506
+ <requestHandler name="/replication" class="solr.ReplicationHandler" >
507
+ <lst name="master">
508
+ <str name="replicateAfter">commit</str>
509
+ <str name="replicateAfter">startup</str>
510
+ <str name="confFiles">schema.xml,stopwords.txt</str>
511
+ </lst>
512
+ <lst name="slave">
513
+ <str name="masterUrl">http://localhost:8983/solr/replication</str>
514
+ <str name="pollInterval">00:00:60</str>
515
+ </lst>
516
+ </requestHandler>-->
517
+
518
+ <!-- DisMaxRequestHandler allows easy searching across multiple fields
519
+ for simple user-entered phrases. Its implementation is now
520
+ just the standard SearchHandler with a default query type
521
+ of "dismax".
522
+ see http://wiki.apache.org/solr/DisMaxRequestHandler
523
+ -->
524
+ <requestHandler name="dismax" class="solr.SearchHandler" >
525
+ <lst name="defaults">
526
+ <str name="defType">dismax</str>
527
+ <str name="echoParams">explicit</str>
528
+ <float name="tie">0.01</float>
529
+ <str name="qf">
530
+ text^0.5 features^1.0 name^1.2 sku^1.5 id^10.0 manu^1.1 cat^1.4
531
+ </str>
532
+ <str name="pf">
533
+ text^0.2 features^1.1 name^1.5 manu^1.4 manu_exact^1.9
534
+ </str>
535
+ <str name="bf">
536
+ popularity^0.5 recip(price,1,1000,1000)^0.3
537
+ </str>
538
+ <str name="fl">
539
+ id,name,price,score
540
+ </str>
541
+ <str name="mm">
542
+ 2&lt;-1 5&lt;-2 6&lt;90%
543
+ </str>
544
+ <int name="ps">100</int>
545
+ <str name="q.alt">*:*</str>
546
+ <!-- example highlighter config, enable per-query with hl=true -->
547
+ <str name="hl.fl">text features name</str>
548
+ <!-- for this field, we want no fragmenting, just highlighting -->
549
+ <str name="f.name.hl.fragsize">0</str>
550
+ <!-- instructs Solr to return the field itself if no query terms are
551
+ found -->
552
+ <str name="f.name.hl.alternateField">name</str>
553
+ <str name="f.text.hl.fragmenter">regex</str> <!-- defined below -->
554
+ </lst>
555
+ </requestHandler>
556
+
557
+ <!-- Note how you can register the same handler multiple times with
558
+ different names (and different init parameters)
559
+ -->
560
+ <requestHandler name="partitioned" class="solr.SearchHandler" >
561
+ <lst name="defaults">
562
+ <str name="defType">dismax</str>
563
+ <str name="echoParams">explicit</str>
564
+ <str name="qf">text^0.5 features^1.0 name^1.2 sku^1.5 id^10.0</str>
565
+ <str name="mm">2&lt;-1 5&lt;-2 6&lt;90%</str>
566
+ <!-- This is an example of using Date Math to specify a constantly
567
+ moving date range in a config...
568
+ -->
569
+ <str name="bq">incubationdate_dt:[* TO NOW/DAY-1MONTH]^2.2</str>
570
+ </lst>
571
+ <!-- In addition to defaults, "appends" params can be specified
572
+ to identify values which should be appended to the list of
573
+ multi-val params from the query (or the existing "defaults").
574
+
575
+ In this example, the param "fq=inStock:true" will be appended to
576
+ any query time fq params the user may specify, as a mechanism for
577
+ partitioning the index, independent of any user selected filtering
578
+ that may also be desired (perhaps as a result of faceted searching).
579
+
580
+ NOTE: there is *absolutely* nothing a client can do to prevent these
581
+ "appends" values from being used, so don't use this mechanism
582
+ unless you are sure you always want it.
583
+ -->
584
+ <lst name="appends">
585
+ <str name="fq">inStock:true</str>
586
+ </lst>
587
+ <!-- "invariants" are a way of letting the Solr maintainer lock down
588
+ the options available to Solr clients. Any params values
589
+ specified here are used regardless of what values may be specified
590
+ in either the query, the "defaults", or the "appends" params.
591
+
592
+ In this example, the facet.field and facet.query params are fixed,
593
+ limiting the facets clients can use. Faceting is not turned on by
594
+ default - but if the client does specify facet=true in the request,
595
+ these are the only facets they will be able to see counts for;
596
+ regardless of what other facet.field or facet.query params they
597
+ may specify.
598
+
599
+ NOTE: there is *absolutely* nothing a client can do to prevent these
600
+ "invariants" values from being used, so don't use this mechanism
601
+ unless you are sure you always want it.
602
+ -->
603
+ <lst name="invariants">
604
+ <str name="facet.field">cat</str>
605
+ <str name="facet.field">manu_exact</str>
606
+ <str name="facet.query">price:[* TO 500]</str>
607
+ <str name="facet.query">price:[500 TO *]</str>
608
+ </lst>
609
+ </requestHandler>
610
+
611
+
612
+ <!-- Blacklight's "search" request handler: for search results -->
613
+
614
+ <requestHandler name="search" class="solr.SearchHandler" >
615
+ <lst name="defaults">
616
+ <str name="defType">dismax</str>
617
+ <str name="echoParams">explicit</str>
618
+ <!-- list fields to be returned in the "fl" param -->
619
+ <str name="fl">*,score</str>
620
+
621
+ <str name="facet">on</str>
622
+ <str name="facet.mincount">1</str>
623
+ <str name="facet.limit">10</str>
624
+
625
+ <!-- list fields to be displayed as facets here. -->
626
+ <str name="facet.field">format</str>
627
+ <str name="facet.field">language_facet</str>
628
+
629
+ <str name="q.alt">*:*</str>
630
+ </lst>
631
+ </requestHandler>
632
+
633
+ <!-- Blacklight's "document" requestHandler: for a single record-->
634
+
635
+ <requestHandler name="document" class="solr.SearchHandler">
636
+ <lst name="defaults">
637
+ <str name="echoParams">explicit</str>
638
+ <str name="fl">*</str>
639
+ <str name="rows">1</str>
640
+ <str name="q">{!raw f=id v=$id}</str>
641
+ <!-- use id=blah instead of q=id:blah -->
642
+ </lst>
643
+ </requestHandler>
644
+
645
+ <!--
646
+ Search components are registered to SolrCore and used by Search Handlers
647
+
648
+ By default, the following components are available:
649
+
650
+ <searchComponent name="query" class="org.apache.solr.handler.component.QueryComponent" />
651
+ <searchComponent name="facet" class="org.apache.solr.handler.component.FacetComponent" />
652
+ <searchComponent name="mlt" class="org.apache.solr.handler.component.MoreLikeThisComponent" />
653
+ <searchComponent name="highlight" class="org.apache.solr.handler.component.HighlightComponent" />
654
+ <searchComponent name="stats" class="org.apache.solr.handler.component.StatsComponent" />
655
+ <searchComponent name="debug" class="org.apache.solr.handler.component.DebugComponent" />
656
+
657
+ Default configuration in a requestHandler would look like:
658
+ <arr name="components">
659
+ <str>query</str>
660
+ <str>facet</str>
661
+ <str>mlt</str>
662
+ <str>highlight</str>
663
+ <str>stats</str>
664
+ <str>debug</str>
665
+ </arr>
666
+
667
+ If you register a searchComponent to one of the standard names, that will be used instead.
668
+ To insert components before or after the 'standard' components, use:
669
+
670
+ <arr name="first-components">
671
+ <str>myFirstComponentName</str>
672
+ </arr>
673
+
674
+ <arr name="last-components">
675
+ <str>myLastComponentName</str>
676
+ </arr>
677
+ -->
678
+
679
+ <!-- The spell check component can return a list of alternative spelling
680
+ suggestions. -->
681
+ <searchComponent name="spellcheck" class="solr.SpellCheckComponent">
682
+
683
+ <str name="queryAnalyzerFieldType">textSpell</str>
684
+
685
+ <lst name="spellchecker">
686
+ <str name="name">default</str>
687
+ <str name="field">name</str>
688
+ <str name="spellcheckIndexDir">./spellchecker</str>
689
+ </lst>
690
+
691
+ <!-- a spellchecker that uses a different distance measure
692
+ <lst name="spellchecker">
693
+ <str name="name">jarowinkler</str>
694
+ <str name="field">spell</str>
695
+ <str name="distanceMeasure">org.apache.lucene.search.spell.JaroWinklerDistance</str>
696
+ <str name="spellcheckIndexDir">./spellchecker2</str>
697
+ </lst>
698
+ -->
699
+
700
+ <!-- a file based spell checker
701
+ <lst name="spellchecker">
702
+ <str name="classname">solr.FileBasedSpellChecker</str>
703
+ <str name="name">file</str>
704
+ <str name="sourceLocation">spellings.txt</str>
705
+ <str name="characterEncoding">UTF-8</str>
706
+ <str name="spellcheckIndexDir">./spellcheckerFile</str>
707
+ </lst>
708
+ -->
709
+ </searchComponent>
710
+
711
+ <!-- A request handler utilizing the spellcheck component.
712
+ #############################################################################
713
+ NOTE: This is purely as an example. The whole purpose of the
714
+ SpellCheckComponent is to hook it into the request handler that handles (i.e.
715
+ the standard or dismax SearchHandler) queries such that a separate request is
716
+ not needed to get suggestions.
717
+
718
+ See http://wiki.apache.org/solr/SpellCheckComponent for details on the request
719
+ parameters.
720
+
721
+ IN OTHER WORDS, THERE IS A REALLY GOOD CHANCE THE SETUP BELOW IS NOT WHAT YOU
722
+ WANT FOR YOUR PRODUCTION SYSTEM!
723
+ #############################################################################
724
+ -->
725
+ <requestHandler name="/spell" class="solr.SearchHandler" lazy="true">
726
+ <lst name="defaults">
727
+ <str name="spellcheck.onlyMorePopular">false</str>
728
+ <str name="spellcheck.extendedResults">false</str>
729
+ <str name="spellcheck.count">1</str>
730
+ </lst>
731
+ <arr name="last-components">
732
+ <str>spellcheck</str>
733
+ </arr>
734
+ </requestHandler>
735
+
736
+ <searchComponent name="tvComponent" class="org.apache.solr.handler.component.TermVectorComponent"/>
737
+ <!-- A Req Handler for working with the tvComponent. This is purely as an example.
738
+ You will likely want to add the component to your already specified request handlers. -->
739
+ <requestHandler name="tvrh" class="org.apache.solr.handler.component.SearchHandler">
740
+ <lst name="defaults">
741
+ <bool name="tv">true</bool>
742
+ </lst>
743
+ <arr name="last-components">
744
+ <str>tvComponent</str>
745
+ </arr>
746
+ </requestHandler>
747
+
748
+ <!-- Clustering Component
749
+ http://wiki.apache.org/solr/ClusteringComponent
750
+ This relies on third party jars which are not included in the release.
751
+ To use this component (and the "/clustering" handler)
752
+ Those jars will need to be downloaded, and you'll need to set the
753
+ solr.clustering.enabled system property when running solr...
754
+ java -Dsolr.clustering.enabled=true -jar start.jar
755
+ -->
756
+ <searchComponent
757
+ name="clusteringComponent"
758
+ enable="${solr.clustering.enabled:false}"
759
+ class="org.apache.solr.handler.clustering.ClusteringComponent" >
760
+ <!-- Declare an engine -->
761
+ <lst name="engine">
762
+ <!-- The name, only one can be named "default" -->
763
+ <str name="name">default</str>
764
+ <!--
765
+ Class name of Carrot2 clustering algorithm. Currently available algorithms are:
766
+
767
+ * org.carrot2.clustering.lingo.LingoClusteringAlgorithm
768
+ * org.carrot2.clustering.stc.STCClusteringAlgorithm
769
+
770
+ See http://project.carrot2.org/algorithms.html for the algorithm's characteristics.
771
+ -->
772
+ <str name="carrot.algorithm">org.carrot2.clustering.lingo.LingoClusteringAlgorithm</str>
773
+ <!--
774
+ Overriding values for Carrot2 default algorithm attributes. For a description
775
+ of all available attributes, see: http://download.carrot2.org/stable/manual/#chapter.components.
776
+ Use attribute key as name attribute of str elements below. These can be further
777
+ overridden for individual requests by specifying attribute key as request
778
+ parameter name and attribute value as parameter value.
779
+ -->
780
+ <str name="LingoClusteringAlgorithm.desiredClusterCountBase">20</str>
781
+ </lst>
782
+ <lst name="engine">
783
+ <str name="name">stc</str>
784
+ <str name="carrot.algorithm">org.carrot2.clustering.stc.STCClusteringAlgorithm</str>
785
+ </lst>
786
+ </searchComponent>
787
+ <requestHandler name="/clustering"
788
+ enable="${solr.clustering.enabled:false}"
789
+ class="solr.SearchHandler">
790
+ <lst name="defaults">
791
+ <bool name="clustering">true</bool>
792
+ <str name="clustering.engine">default</str>
793
+ <bool name="clustering.results">true</bool>
794
+ <!-- The title field -->
795
+ <str name="carrot.title">name</str>
796
+ <str name="carrot.url">id</str>
797
+ <!-- The field to cluster on -->
798
+ <str name="carrot.snippet">features</str>
799
+ <!-- produce summaries -->
800
+ <bool name="carrot.produceSummary">true</bool>
801
+ <!-- the maximum number of labels per cluster -->
802
+ <!--<int name="carrot.numDescriptions">5</int>-->
803
+ <!-- produce sub clusters -->
804
+ <bool name="carrot.outputSubClusters">false</bool>
805
+ </lst>
806
+ <arr name="last-components">
807
+ <str>clusteringComponent</str>
808
+ </arr>
809
+ </requestHandler>
810
+
811
+ <!-- Solr Cell: http://wiki.apache.org/solr/ExtractingRequestHandler -->
812
+ <requestHandler name="/update/extract" class="org.apache.solr.handler.extraction.ExtractingRequestHandler" startup="lazy">
813
+ <lst name="defaults">
814
+ <!-- All the main content goes into "text"... if you need to return
815
+ the extracted text or do highlighting, use a stored field. -->
816
+ <str name="fmap.content">text</str>
817
+ <str name="lowernames">true</str>
818
+ <str name="uprefix">ignored_</str>
819
+
820
+ <!-- capture link hrefs but ignore div attributes -->
821
+ <str name="captureAttr">true</str>
822
+ <str name="fmap.a">links</str>
823
+ <str name="fmap.div">ignored_</str>
824
+ </lst>
825
+ </requestHandler>
826
+
827
+
828
+ <!-- A component to return terms and document frequency of those terms. -->
829
+ <searchComponent name="termsComponent" class="org.apache.solr.handler.component.TermsComponent"/>
830
+
831
+ <requestHandler name="/terms" class="org.apache.solr.handler.component.SearchHandler">
832
+ <lst name="defaults">
833
+ <bool name="terms">true</bool>
834
+ </lst>
835
+ <arr name="components">
836
+ <str>termsComponent</str>
837
+ </arr>
838
+ </requestHandler>
839
+
840
+
841
+ <!-- a search component that enables you to configure the top results for
842
+ a given query regardless of the normal lucene scoring.-->
843
+ <searchComponent name="elevator" class="solr.QueryElevationComponent" >
844
+ <!-- pick a fieldType to analyze queries -->
845
+ <str name="queryFieldType">string</str>
846
+ <str name="config-file">elevate.xml</str>
847
+ </searchComponent>
848
+
849
+ <!-- a request handler utilizing the elevator component -->
850
+ <requestHandler name="/elevate" class="solr.SearchHandler" startup="lazy">
851
+ <lst name="defaults">
852
+ <str name="echoParams">explicit</str>
853
+ </lst>
854
+ <arr name="last-components">
855
+ <str>elevator</str>
856
+ </arr>
857
+ </requestHandler>
858
+
859
+
860
+ <!-- Update request handler.
861
+
862
+ Note: Since solr1.1 requestHandlers require a valid content type header if posted in
863
+ the body. For example, curl now requires: -H 'Content-type:text/xml; charset=utf-8'
864
+ The response format differs from solr1.1 formatting and returns a standard error code.
865
+ To enable solr1.1 behavior, remove the /update handler or change its path
866
+ -->
867
+ <requestHandler name="/update" class="solr.XmlUpdateRequestHandler" />
868
+
869
+
870
+ <requestHandler name="/update/javabin" class="solr.BinaryUpdateRequestHandler" />
871
+
872
+ <!--
873
+ Analysis request handler. Since Solr 1.3. Use to return how a document is analyzed. Useful
874
+ for debugging and as a token server for other types of applications.
875
+
876
+ This is deprecated in favor of the improved DocumentAnalysisRequestHandler and FieldAnalysisRequestHandler
877
+
878
+ <requestHandler name="/analysis" class="solr.AnalysisRequestHandler" />
879
+ -->
880
+
881
+ <!--
882
+ An analysis handler that provides a breakdown of the analysis process of provided documents. This handler expects a
883
+ (single) content stream with the following format:
884
+
885
+ <docs>
886
+ <doc>
887
+ <field name="id">1</field>
888
+ <field name="name">The Name</field>
889
+ <field name="text">The Text Value</field>
890
+ </doc>
891
+ <doc>...</doc>
892
+ <doc>...</doc>
893
+ ...
894
+ </docs>
895
+
896
+ Note: Each document must contain a field which serves as the unique key. This key is used in the returned
897
+ response to associate an analysis breakdown to the analyzed document.
898
+
899
+ Like the FieldAnalysisRequestHandler, this handler also supports query analysis by
900
+ sending either an "analysis.query" or "q" request parameter that holds the query text to be analyzed. It also
901
+ supports the "analysis.showmatch" parameter which when set to true, all field tokens that match the query
902
+ tokens will be marked as a "match".
903
+ -->
904
+ <requestHandler name="/analysis/document" class="solr.DocumentAnalysisRequestHandler" />
905
+
906
+ <!--
907
+ RequestHandler that provides much the same functionality as analysis.jsp. Provides the ability
908
+ to specify multiple field types and field names in the same request and outputs index-time and
909
+ query-time analysis for each of them.
910
+
911
+ Request parameters are:
912
+ analysis.fieldname - The field name whose analyzers are to be used
913
+ analysis.fieldtype - The field type whose analyzers are to be used
914
+ analysis.fieldvalue - The text for index-time analysis
915
+ q (or analysis.query) - The text for query time analysis
916
+ analysis.showmatch (true|false) - When set to true and when query analysis is performed, the produced
917
+ tokens of the field value analysis will be marked as "matched" for every
918
+ token that is produced by the query analysis
919
+ -->
920
+ <requestHandler name="/analysis/field" class="solr.FieldAnalysisRequestHandler" />
921
+
922
+
923
+ <!-- CSV update handler, loaded on demand -->
924
+ <requestHandler name="/update/csv" class="solr.CSVRequestHandler" startup="lazy" />
925
+
926
+
927
+ <!--
928
+ Admin Handlers - This will register all the standard admin RequestHandlers. Adding
929
+ this single handler is equivalent to registering:
930
+
931
+ <requestHandler name="/admin/luke" class="org.apache.solr.handler.admin.LukeRequestHandler" />
932
+ <requestHandler name="/admin/system" class="org.apache.solr.handler.admin.SystemInfoHandler" />
933
+ <requestHandler name="/admin/plugins" class="org.apache.solr.handler.admin.PluginInfoHandler" />
934
+ <requestHandler name="/admin/threads" class="org.apache.solr.handler.admin.ThreadDumpHandler" />
935
+ <requestHandler name="/admin/properties" class="org.apache.solr.handler.admin.PropertiesRequestHandler" />
936
+ <requestHandler name="/admin/file" class="org.apache.solr.handler.admin.ShowFileRequestHandler" />
937
+
938
+ If you wish to hide files under ${solr.home}/conf, explicitly register the ShowFileRequestHandler using:
939
+ <requestHandler name="/admin/file" class="org.apache.solr.handler.admin.ShowFileRequestHandler" >
940
+ <lst name="invariants">
941
+ <str name="hidden">synonyms.txt</str>
942
+ <str name="hidden">anotherfile.txt</str>
943
+ </lst>
944
+ </requestHandler>
945
+ -->
946
+ <requestHandler name="/admin/" class="org.apache.solr.handler.admin.AdminHandlers" />
947
+
948
+ <!-- ping/healthcheck -->
949
+ <requestHandler name="/admin/ping" class="PingRequestHandler">
950
+ <lst name="defaults">
951
+ <str name="qt">standard</str>
952
+ <str name="q">solrpingquery</str>
953
+ <str name="echoParams">all</str>
954
+ </lst>
955
+ </requestHandler>
956
+
957
+ <!-- Echo the request contents back to the client -->
958
+ <requestHandler name="/debug/dump" class="solr.DumpRequestHandler" >
959
+ <lst name="defaults">
960
+ <str name="echoParams">explicit</str> <!-- for all params (including the default etc) use: 'all' -->
961
+ <str name="echoHandler">true</str>
962
+ </lst>
963
+ </requestHandler>
964
+
965
+ <highlighting>
966
+ <!-- Configure the standard fragmenter -->
967
+ <!-- This could most likely be commented out in the "default" case -->
968
+ <fragmenter name="gap" class="org.apache.solr.highlight.GapFragmenter" default="true">
969
+ <lst name="defaults">
970
+ <int name="hl.fragsize">100</int>
971
+ </lst>
972
+ </fragmenter>
973
+
974
+ <!-- A regular-expression-based fragmenter (f.i., for sentence extraction) -->
975
+ <fragmenter name="regex" class="org.apache.solr.highlight.RegexFragmenter">
976
+ <lst name="defaults">
977
+ <!-- slightly smaller fragsizes work better because of slop -->
978
+ <int name="hl.fragsize">70</int>
979
+ <!-- allow 50% slop on fragment sizes -->
980
+ <float name="hl.regex.slop">0.5</float>
981
+ <!-- a basic sentence pattern -->
982
+ <str name="hl.regex.pattern">[-\w ,/\n\"']{20,200}</str>
983
+ </lst>
984
+ </fragmenter>
985
+
986
+ <!-- Configure the standard formatter -->
987
+ <formatter name="html" class="org.apache.solr.highlight.HtmlFormatter" default="true">
988
+ <lst name="defaults">
989
+ <str name="hl.simple.pre"><![CDATA[<em>]]></str>
990
+ <str name="hl.simple.post"><![CDATA[</em>]]></str>
991
+ </lst>
992
+ </formatter>
993
+ </highlighting>
994
+
995
+ <!-- An example dedup update processor that creates the "id" field on the fly
996
+ based on the hash code of some other fields. This example has overwriteDupes
997
+ set to false since we are using the id field as the signatureField and Solr
998
+ will maintain uniqueness based on that anyway.
999
+
1000
+ You have to link the chain to an update handler above to use it ie:
1001
+ <requestHandler name="/update" class="solr.XmlUpdateRequestHandler">
1002
+ <lst name="defaults">
1003
+ <str name="update.processor">dedupe</str>
1004
+ </lst>
1005
+ </requestHandler>
1006
+ -->
1007
+ <!--
1008
+ <updateRequestProcessorChain name="dedupe">
1009
+ <processor class="org.apache.solr.update.processor.SignatureUpdateProcessorFactory">
1010
+ <bool name="enabled">true</bool>
1011
+ <str name="signatureField">id</str>
1012
+ <bool name="overwriteDupes">false</bool>
1013
+ <str name="fields">name,features,cat</str>
1014
+ <str name="signatureClass">org.apache.solr.update.processor.Lookup3Signature</str>
1015
+ </processor>
1016
+ <processor class="solr.LogUpdateProcessorFactory" />
1017
+ <processor class="solr.RunUpdateProcessorFactory" />
1018
+ </updateRequestProcessorChain>
1019
+ -->
1020
+
1021
+
1022
+ <!-- queryResponseWriter plugins... query responses will be written using
1023
+ the writer specified by the 'wt' request parameter matching the name
1024
+ of a registered writer.
1025
+ The "default" writer is the default and will be used if 'wt' is not
1026
+ specified in the request.
1027
+
1028
+ The following response writers are implicitly configured unless
1029
+ overridden...
1030
+
1031
+ <queryResponseWriter name="xml" class="org.apache.solr.request.XMLResponseWriter" default="true"/>
1032
+ <queryResponseWriter name="json" class="org.apache.solr.request.JSONResponseWriter"/>
1033
+ <queryResponseWriter name="python" class="org.apache.solr.request.PythonResponseWriter"/>
1034
+ <queryResponseWriter name="ruby" class="org.apache.solr.request.RubyResponseWriter"/>
1035
+ <queryResponseWriter name="php" class="org.apache.solr.request.PHPResponseWriter"/>
1036
+ <queryResponseWriter name="phps" class="org.apache.solr.request.PHPSerializedResponseWriter"/>
1037
+
1038
+ Custom response writers can be declared as needed...
1039
+
1040
+ <queryResponseWriter name="custom" class="com.example.MyResponseWriter"/>
1041
+ -->
1042
+
1043
+ <!-- XSLT response writer transforms the XML output by any xslt file found
1044
+ in Solr's conf/xslt directory. Changes to xslt files are checked for
1045
+ every xsltCacheLifetimeSeconds.
1046
+ -->
1047
+ <queryResponseWriter name="xslt" class="org.apache.solr.request.XSLTResponseWriter">
1048
+ <int name="xsltCacheLifetimeSeconds">5</int>
1049
+ </queryResponseWriter>
1050
+
1051
+
1052
+ <!-- example of registering a query parser
1053
+ <queryParser name="lucene" class="org.apache.solr.search.LuceneQParserPlugin"/>
1054
+ -->
1055
+
1056
+ <!-- example of registering a custom function parser
1057
+ <valueSourceParser name="myfunc" class="com.mycompany.MyValueSourceParser" />
1058
+ -->
1059
+
1060
+ <!-- config for the admin interface -->
1061
+ <admin>
1062
+ <defaultQuery>solr</defaultQuery>
1063
+
1064
+ <!-- configure a healthcheck file for servers behind a loadbalancer
1065
+ <healthcheck type="file">server-enabled</healthcheck>
1066
+ -->
1067
+ </admin>
1068
+
1069
+ </config>