active-fedora 10.3.0 → 11.0.0.rc1

Sign up to get free protection for your applications and to get access to all the features.
Files changed (102) hide show
  1. checksums.yaml +4 -4
  2. data/.rubocop.yml +4 -0
  3. data/.rubocop_todo.yml +24 -0
  4. data/README.md +3 -1
  5. data/active-fedora.gemspec +4 -4
  6. data/lib/active_fedora.rb +0 -2
  7. data/lib/active_fedora/aggregation/list_source.rb +2 -0
  8. data/lib/active_fedora/associations/association_scope.rb +1 -1
  9. data/lib/active_fedora/associations/builder/aggregation.rb +1 -1
  10. data/lib/active_fedora/associations/builder/association.rb +1 -1
  11. data/lib/active_fedora/associations/builder/orders.rb +11 -3
  12. data/lib/active_fedora/associations/collection_association.rb +2 -2
  13. data/lib/active_fedora/associations/has_many_association.rb +2 -2
  14. data/lib/active_fedora/associations/has_subresource_association.rb +2 -2
  15. data/lib/active_fedora/associations/orders_association.rb +4 -0
  16. data/lib/active_fedora/associations/rdf.rb +2 -0
  17. data/lib/active_fedora/attribute_methods/dirty.rb +1 -1
  18. data/lib/active_fedora/base.rb +1 -1
  19. data/lib/active_fedora/containers/container.rb +1 -1
  20. data/lib/active_fedora/core.rb +7 -9
  21. data/lib/active_fedora/fedora.rb +2 -6
  22. data/lib/active_fedora/fedora_attributes.rb +1 -1
  23. data/lib/active_fedora/file.rb +1 -1
  24. data/lib/active_fedora/file/streaming.rb +1 -1
  25. data/lib/active_fedora/indexing.rb +1 -18
  26. data/lib/active_fedora/indexing_service.rb +0 -5
  27. data/lib/active_fedora/loadable_from_json.rb +12 -1
  28. data/lib/active_fedora/nested_attributes.rb +2 -2
  29. data/lib/active_fedora/orders/list_node.rb +2 -2
  30. data/lib/active_fedora/orders/ordered_list.rb +7 -3
  31. data/lib/active_fedora/orders/target_proxy.rb +4 -0
  32. data/lib/active_fedora/rake_support.rb +1 -1
  33. data/lib/active_fedora/rdf/persistence.rb +1 -0
  34. data/lib/active_fedora/rdf/rdf_datastream.rb +7 -1
  35. data/lib/active_fedora/solr_hit.rb +0 -9
  36. data/lib/active_fedora/solr_query_builder.rb +1 -1
  37. data/lib/active_fedora/version.rb +1 -1
  38. data/lib/generators/active_fedora/config/solr/templates/solr/config/solrconfig.xml +0 -11
  39. data/lib/generators/active_fedora/config/solr/templates/solr_wrapper_test.yml +1 -1
  40. data/lib/generators/active_fedora/model/model_generator.rb +1 -1
  41. data/lib/generators/active_fedora/model/templates/model.rb.erb +4 -4
  42. data/lib/tasks/active_fedora_dev.rake +1 -1
  43. data/solr/config/_rest_managed.json +3 -0
  44. data/solr/config/admin-extra.html +31 -0
  45. data/solr/config/elevate.xml +36 -0
  46. data/solr/config/mapping-ISOLatin1Accent.txt +246 -0
  47. data/solr/config/protwords.txt +21 -0
  48. data/solr/config/schema.xml +372 -0
  49. data/solr/config/scripts.conf +24 -0
  50. data/solr/config/solrconfig.xml +311 -0
  51. data/solr/config/spellings.txt +2 -0
  52. data/solr/config/stopwords.txt +58 -0
  53. data/solr/config/stopwords_en.txt +58 -0
  54. data/solr/config/synonyms.txt +31 -0
  55. data/solr/config/xslt/example.xsl +132 -0
  56. data/solr/config/xslt/example_atom.xsl +67 -0
  57. data/solr/config/xslt/example_rss.xsl +66 -0
  58. data/solr/config/xslt/luke.xsl +337 -0
  59. data/spec/integration/associations_spec.rb +6 -6
  60. data/spec/integration/basic_contains_association_spec.rb +1 -1
  61. data/spec/integration/clean_connection_spec.rb +1 -1
  62. data/spec/integration/complex_rdf_datastream_spec.rb +4 -5
  63. data/spec/integration/datastream_rdf_nested_attributes_spec.rb +15 -14
  64. data/spec/integration/date_time_properties_spec.rb +0 -15
  65. data/spec/integration/direct_container_spec.rb +4 -4
  66. data/spec/integration/directly_contains_one_association_spec.rb +1 -1
  67. data/spec/integration/eradicate_spec.rb +1 -1
  68. data/spec/integration/generators/solr_generator_spec.rb +10 -7
  69. data/spec/integration/has_and_belongs_to_many_associations_spec.rb +5 -5
  70. data/spec/integration/has_many_associations_spec.rb +4 -4
  71. data/spec/integration/indexing_spec.rb +1 -1
  72. data/spec/integration/indirect_container_spec.rb +3 -3
  73. data/spec/integration/ntriples_datastream_spec.rb +35 -23
  74. data/spec/integration/rdf_nested_attributes_spec.rb +3 -3
  75. data/spec/integration/relation_delegation_spec.rb +2 -2
  76. data/spec/integration/scoped_query_spec.rb +3 -3
  77. data/spec/integration/solr_hit_spec.rb +0 -11
  78. data/spec/integration/versionable_spec.rb +6 -6
  79. data/spec/integration/with_metadata_spec.rb +1 -1
  80. data/spec/samples/hydra-mods_article_datastream.rb +2 -4
  81. data/spec/unit/base_spec.rb +3 -4
  82. data/spec/unit/core/fedora_id_translator_spec.rb +2 -2
  83. data/spec/unit/core/fedora_uri_translator_spec.rb +2 -2
  84. data/spec/unit/core_spec.rb +5 -5
  85. data/spec/unit/fedora_spec.rb +1 -2
  86. data/spec/unit/file_spec.rb +2 -2
  87. data/spec/unit/filter_spec.rb +3 -3
  88. data/spec/unit/forbidden_attributes_protection_spec.rb +2 -2
  89. data/spec/unit/has_and_belongs_to_many_association_spec.rb +2 -2
  90. data/spec/unit/has_many_association_spec.rb +11 -26
  91. data/spec/unit/ntriples_datastream_spec.rb +6 -9
  92. data/spec/unit/ordered_spec.rb +8 -11
  93. data/spec/unit/orders/list_node_spec.rb +2 -2
  94. data/spec/unit/orders/ordered_list_spec.rb +1 -1
  95. data/spec/unit/query_spec.rb +4 -4
  96. data/spec/unit/rdf/indexing_service_spec.rb +5 -5
  97. data/spec/unit/rdf_resource_datastream_spec.rb +4 -0
  98. metadata +44 -17
  99. data/.solr_wrapper +0 -6
  100. data/lib/active_fedora/profile_indexing_service.rb +0 -11
  101. data/lib/active_fedora/solr_instance_loader.rb +0 -47
  102. data/spec/integration/solr_instance_loader_spec.rb +0 -156
@@ -0,0 +1,21 @@
1
+ # The ASF licenses this file to You under the Apache License, Version 2.0
2
+ # (the "License"); you may not use this file except in compliance with
3
+ # the License. You may obtain a copy of the License at
4
+ #
5
+ # http://www.apache.org/licenses/LICENSE-2.0
6
+ #
7
+ # Unless required by applicable law or agreed to in writing, software
8
+ # distributed under the License is distributed on an "AS IS" BASIS,
9
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
10
+ # See the License for the specific language governing permissions and
11
+ # limitations under the License.
12
+
13
+ #-----------------------------------------------------------------------
14
+ # Use a protected word file to protect against the stemmer reducing two
15
+ # unrelated words to the same base word.
16
+
17
+ # Some non-words that normally won't be encountered,
18
+ # just to test that they won't be stemmed.
19
+ dontstems
20
+ zwhacky
21
+
@@ -0,0 +1,372 @@
1
+ <?xml version="1.0" encoding="UTF-8" ?>
2
+ <!--
3
+ Licensed to the Apache Software Foundation (ASF) under one or more
4
+ contributor license agreements. See the NOTICE file distributed with
5
+ this work for additional information regarding copyright ownership.
6
+ The ASF licenses this file to You under the Apache License, Version 2.0
7
+ (the "License"); you may not use this file except in compliance with
8
+ the License. You may obtain a copy of the License at
9
+
10
+ http://www.apache.org/licenses/LICENSE-2.0
11
+
12
+ Unless required by applicable law or agreed to in writing, software
13
+ distributed under the License is distributed on an "AS IS" BASIS,
14
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
15
+ See the License for the specific language governing permissions and
16
+ limitations under the License.
17
+ -->
18
+
19
+ <!--
20
+ This is the Solr schema file. This file should be named "schema.xml" and
21
+ should be in the conf directory under the solr home
22
+ (i.e. ./solr/conf/schema.xml by default)
23
+ or located where the classloader for the Solr webapp can find it.
24
+
25
+ This example schema is the recommended starting point for users.
26
+ It should be kept correct and concise, usable out-of-the-box.
27
+
28
+ For more information, on how to customize this file, please see
29
+ http://wiki.apache.org/solr/SchemaXml
30
+
31
+ PERFORMANCE NOTE: this schema includes many optional features and should not
32
+ be used for benchmarking. To improve performance one could
33
+ - set stored="false" for all fields possible (esp large fields) when you
34
+ only need to search on the field but don't need to return the original
35
+ value.
36
+ - set indexed="false" if you don't need to search on the field, but only
37
+ return the field as a result of searching on other indexed fields.
38
+ - remove all unneeded copyField statements
39
+ - for best index size and searching performance, set "index" to false
40
+ for all general text fields, use copyField to copy them to the
41
+ catchall "text" field, and use that for searching.
42
+ - For maximum indexing performance, use the StreamingUpdateSolrServer
43
+ java client.
44
+ - Remember to run the JVM in server mode, and use a higher logging level
45
+ that avoids logging every request
46
+ -->
47
+
48
+ <schema name="Hydra Demo Index" version="1.5">
49
+ <!-- attribute "name" is the name of this schema and is only used for display purposes.
50
+ Applications should change this to reflect the nature of the search collection.
51
+ version="1.4" is Solr's version number for the schema syntax and semantics. It should
52
+ not normally be changed by applications.
53
+ 1.0: multiValued attribute did not exist, all fields are multiValued by nature
54
+ 1.1: multiValued attribute introduced, false by default
55
+ 1.2: omitTermFreqAndPositions attribute introduced, true by default except for text fields.
56
+ 1.3: removed optional field compress feature
57
+ 1.4: default auto-phrase (QueryParser feature) to off
58
+ -->
59
+
60
+ <types>
61
+ <fieldType name="string" class="solr.StrField" sortMissingLast="true" />
62
+ <fieldType name="boolean" class="solr.BoolField" sortMissingLast="true"/>
63
+ <fieldType name="rand" class="solr.RandomSortField" omitNorms="true"/>
64
+
65
+ <!-- Default numeric field types. -->
66
+ <fieldType name="int" class="solr.TrieIntField" precisionStep="0" positionIncrementGap="0"/>
67
+ <fieldType name="float" class="solr.TrieFloatField" precisionStep="0" positionIncrementGap="0"/>
68
+ <fieldType name="long" class="solr.TrieLongField" precisionStep="0" positionIncrementGap="0"/>
69
+ <fieldType name="double" class="solr.TrieDoubleField" precisionStep="0" positionIncrementGap="0"/>
70
+
71
+ <!-- trie numeric field types for faster range queries -->
72
+ <fieldType name="tint" class="solr.TrieIntField" precisionStep="8" positionIncrementGap="0"/>
73
+ <fieldType name="tfloat" class="solr.TrieFloatField" precisionStep="8" positionIncrementGap="0"/>
74
+ <fieldType name="tlong" class="solr.TrieLongField" precisionStep="8" positionIncrementGap="0"/>
75
+ <fieldType name="tdouble" class="solr.TrieDoubleField" precisionStep="8" positionIncrementGap="0"/>
76
+
77
+ <!-- The format for this date field is of the form 1995-12-31T23:59:59Z
78
+ Optional fractional seconds are allowed: 1995-12-31T23:59:59.999Z
79
+ -->
80
+ <fieldType name="date" class="solr.TrieDateField" precisionStep="0" positionIncrementGap="0"/>
81
+ <!-- A Trie based date field for faster date range queries and date faceting. -->
82
+ <fieldType name="tdate" class="solr.TrieDateField" precisionStep="6" positionIncrementGap="0"/>
83
+
84
+
85
+ <!-- This point type indexes the coordinates as separate fields (subFields)
86
+ If subFieldType is defined, it references a type, and a dynamic field
87
+ definition is created matching *___<typename>. Alternately, if
88
+ subFieldSuffix is defined, that is used to create the subFields.
89
+ Example: if subFieldType="double", then the coordinates would be
90
+ indexed in fields myloc_0___double,myloc_1___double.
91
+ Example: if subFieldSuffix="_d" then the coordinates would be indexed
92
+ in fields myloc_0_d,myloc_1_d
93
+ The subFields are an implementation detail of the fieldType, and end
94
+ users normally should not need to know about them.
95
+ -->
96
+ <fieldType name="point" class="solr.PointType" dimension="2" subFieldSuffix="_d"/>
97
+
98
+ <!-- A specialized field for geospatial search. If indexed, this fieldType must not be multivalued. -->
99
+ <fieldType name="location" class="solr.LatLonType" subFieldSuffix="_coordinate"/>
100
+
101
+ <!-- An alternative geospatial field type new to Solr 4. It supports multiValued and polygon shapes.
102
+ For more information about this and other Spatial fields new to Solr 4, see:
103
+ http://wiki.apache.org/solr/SolrAdaptersForLuceneSpatial4
104
+ -->
105
+ <fieldType name="location_rpt" class="solr.SpatialRecursivePrefixTreeFieldType"
106
+ geo="true" distErrPct="0.025" maxDistErr="0.000009" distanceUnits="degrees" />
107
+
108
+ <fieldType name="text" class="solr.TextField" omitNorms="false">
109
+ <analyzer>
110
+ <tokenizer class="solr.ICUTokenizerFactory"/>
111
+ <filter class="solr.ICUFoldingFilterFactory"/> <!-- NFKC, case folding, diacritics removed -->
112
+ <filter class="solr.TrimFilterFactory"/>
113
+ </analyzer>
114
+ </fieldType>
115
+
116
+ <!-- A text field that only splits on whitespace for exact matching of words -->
117
+ <fieldType name="text_ws" class="solr.TextField" positionIncrementGap="100">
118
+ <analyzer>
119
+ <tokenizer class="solr.WhitespaceTokenizerFactory"/>
120
+ <filter class="solr.TrimFilterFactory"/>
121
+ </analyzer>
122
+ </fieldType>
123
+
124
+ <!-- single token analyzed text, for sorting. Punctuation is significant. -->
125
+ <fieldtype name="alphaSort" class="solr.TextField" sortMissingLast="true" omitNorms="true">
126
+ <analyzer>
127
+ <tokenizer class="solr.KeywordTokenizerFactory" />
128
+ <filter class="solr.ICUFoldingFilterFactory"/>
129
+ <filter class="solr.TrimFilterFactory" />
130
+ </analyzer>
131
+ </fieldtype>
132
+
133
+ <!-- A text field with defaults appropriate for English -->
134
+ <fieldType name="text_en" class="solr.TextField" positionIncrementGap="100">
135
+ <analyzer>
136
+ <tokenizer class="solr.ICUTokenizerFactory"/>
137
+ <filter class="solr.ICUFoldingFilterFactory"/> <!-- NFKC, case folding, diacritics removed -->
138
+ <filter class="solr.EnglishPossessiveFilterFactory"/>
139
+ <!-- EnglishMinimalStemFilterFactory is less aggressive than PorterStemFilterFactory: -->
140
+ <filter class="solr.EnglishMinimalStemFilterFactory"/>
141
+ <!--
142
+ <filter class="solr.PorterStemFilterFactory"/>
143
+ -->
144
+ <filter class="solr.TrimFilterFactory"/>
145
+ </analyzer>
146
+ </fieldType>
147
+
148
+ <!-- queries for paths match documents at that path, or in descendent paths -->
149
+ <fieldType name="descendent_path" class="solr.TextField">
150
+ <analyzer type="index">
151
+ <tokenizer class="solr.PathHierarchyTokenizerFactory" delimiter="/" />
152
+ </analyzer>
153
+ <analyzer type="query">
154
+ <tokenizer class="solr.KeywordTokenizerFactory" />
155
+ </analyzer>
156
+ </fieldType>
157
+
158
+ <!-- queries for paths match documents at that path, or in ancestor paths -->
159
+ <fieldType name="ancestor_path" class="solr.TextField">
160
+ <analyzer type="index">
161
+ <tokenizer class="solr.KeywordTokenizerFactory" />
162
+ </analyzer>
163
+ <analyzer type="query">
164
+ <tokenizer class="solr.PathHierarchyTokenizerFactory" delimiter="/" />
165
+ </analyzer>
166
+ </fieldType>
167
+
168
+ <fieldType class="solr.TextField" name="textSuggest" positionIncrementGap="100">
169
+ <analyzer>
170
+ <tokenizer class="solr.KeywordTokenizerFactory"/>
171
+ <filter class="solr.StandardFilterFactory"/>
172
+ <filter class="solr.LowerCaseFilterFactory"/>
173
+ <filter class="solr.RemoveDuplicatesTokenFilterFactory"/>
174
+ </analyzer>
175
+ </fieldType>
176
+ </types>
177
+
178
+
179
+ <fields>
180
+ <!-- If you remove this field, you must _also_ disable the update log in solrconfig.xml
181
+ or Solr won't start. _version_ and update log are required for SolrCloud
182
+ -->
183
+ <field name="_version_" type="long" indexed="true" stored="true"/>
184
+
185
+ <field name="id" type="string" stored="true" indexed="true" multiValued="false" required="true"/>
186
+ <field name="timestamp" type="date" indexed="true" stored="true" default="NOW" multiValued="false"/>
187
+
188
+ <field name="lat" type="tdouble" stored="true" indexed="true" multiValued="false"/>
189
+ <field name="lng" type="tdouble" stored="true" indexed="true" multiValued="false"/>
190
+
191
+ <!-- NOTE: not all possible Solr field types are represented in the dynamic fields -->
192
+
193
+ <!-- text (_t...) -->
194
+ <dynamicField name="*_ti" type="text" stored="false" indexed="true" multiValued="false"/>
195
+ <dynamicField name="*_tim" type="text" stored="false" indexed="true" multiValued="true"/>
196
+ <dynamicField name="*_ts" type="text" stored="true" indexed="false" multiValued="false"/>
197
+ <dynamicField name="*_tsm" type="text" stored="true" indexed="false" multiValued="true"/>
198
+ <dynamicField name="*_tsi" type="text" stored="true" indexed="true" multiValued="false"/>
199
+ <dynamicField name="*_tsim" type="text" stored="true" indexed="true" multiValued="true"/>
200
+ <dynamicField name="*_tiv" type="text" stored="false" indexed="true" multiValued="false" termVectors="true" termPositions="true" termOffsets="true"/>
201
+ <dynamicField name="*_timv" type="text" stored="false" indexed="true" multiValued="true" termVectors="true" termPositions="true" termOffsets="true"/>
202
+ <dynamicField name="*_tsiv" type="text" stored="true" indexed="true" multiValued="false" termVectors="true" termPositions="true" termOffsets="true"/>
203
+ <dynamicField name="*_tsimv" type="text" stored="true" indexed="true" multiValued="true" termVectors="true" termPositions="true" termOffsets="true"/>
204
+
205
+ <!-- English text (_te...) -->
206
+ <dynamicField name="*_tei" type="text_en" stored="false" indexed="true" multiValued="false"/>
207
+ <dynamicField name="*_teim" type="text_en" stored="false" indexed="true" multiValued="true"/>
208
+ <dynamicField name="*_tes" type="text_en" stored="true" indexed="false" multiValued="false"/>
209
+ <dynamicField name="*_tesm" type="text_en" stored="true" indexed="false" multiValued="true"/>
210
+ <dynamicField name="*_tesi" type="text_en" stored="true" indexed="true" multiValued="false"/>
211
+ <dynamicField name="*_tesim" type="text_en" stored="true" indexed="true" multiValued="true"/>
212
+ <dynamicField name="*_teiv" type="text_en" stored="false" indexed="true" multiValued="false" termVectors="true" termPositions="true" termOffsets="true"/>
213
+ <dynamicField name="*_teimv" type="text_en" stored="false" indexed="true" multiValued="true" termVectors="true" termPositions="true" termOffsets="true"/>
214
+ <dynamicField name="*_tesiv" type="text_en" stored="true" indexed="true" multiValued="false" termVectors="true" termPositions="true" termOffsets="true"/>
215
+ <dynamicField name="*_tesimv" type="text_en" stored="true" indexed="true" multiValued="true" termVectors="true" termPositions="true" termOffsets="true"/>
216
+
217
+ <!-- string (_s...) -->
218
+ <dynamicField name="*_si" type="string" stored="false" indexed="true" multiValued="false"/>
219
+ <dynamicField name="*_sim" type="string" stored="false" indexed="true" multiValued="true"/>
220
+ <dynamicField name="*_ss" type="string" stored="true" indexed="false" multiValued="false"/>
221
+ <dynamicField name="*_ssm" type="string" stored="true" indexed="false" multiValued="true"/>
222
+ <dynamicField name="*_ssi" type="string" stored="true" indexed="true" multiValued="false"/>
223
+ <dynamicField name="*_ssim" type="string" stored="true" indexed="true" multiValued="true"/>
224
+ <dynamicField name="*_ssort" type="alphaSort" stored="false" indexed="true" multiValued="false"/>
225
+
226
+ <!-- integer (_i...) -->
227
+ <dynamicField name="*_ii" type="int" stored="false" indexed="true" multiValued="false"/>
228
+ <dynamicField name="*_iim" type="int" stored="false" indexed="true" multiValued="true"/>
229
+ <dynamicField name="*_is" type="int" stored="true" indexed="false" multiValued="false"/>
230
+ <dynamicField name="*_ism" type="int" stored="true" indexed="false" multiValued="true"/>
231
+ <dynamicField name="*_isi" type="int" stored="true" indexed="true" multiValued="false"/>
232
+ <dynamicField name="*_isim" type="int" stored="true" indexed="true" multiValued="true"/>
233
+
234
+ <!-- trie integer (_it...) (for faster range queries) -->
235
+ <dynamicField name="*_iti" type="tint" stored="false" indexed="true" multiValued="false"/>
236
+ <dynamicField name="*_itim" type="tint" stored="false" indexed="true" multiValued="true"/>
237
+ <dynamicField name="*_its" type="tint" stored="true" indexed="false" multiValued="false"/>
238
+ <dynamicField name="*_itsm" type="tint" stored="true" indexed="false" multiValued="true"/>
239
+ <dynamicField name="*_itsi" type="tint" stored="true" indexed="true" multiValued="false"/>
240
+ <dynamicField name="*_itsim" type="tint" stored="true" indexed="true" multiValued="true"/>
241
+
242
+ <!-- date (_dt...) -->
243
+ <!-- The format for this date field is of the form 1995-12-31T23:59:59Z
244
+ Optional fractional seconds are allowed: 1995-12-31T23:59:59.999Z -->
245
+ <dynamicField name="*_dti" type="date" stored="false" indexed="true" multiValued="false"/>
246
+ <dynamicField name="*_dtim" type="date" stored="false" indexed="true" multiValued="true"/>
247
+ <dynamicField name="*_dts" type="date" stored="true" indexed="false" multiValued="false"/>
248
+ <dynamicField name="*_dtsm" type="date" stored="true" indexed="false" multiValued="true"/>
249
+ <dynamicField name="*_dtsi" type="date" stored="true" indexed="true" multiValued="false"/>
250
+ <dynamicField name="*_dtsim" type="date" stored="true" indexed="true" multiValued="true"/>
251
+
252
+ <!-- trie date (_dtt...) (for faster range queries) -->
253
+ <dynamicField name="*_dtti" type="tdate" stored="false" indexed="true" multiValued="false"/>
254
+ <dynamicField name="*_dttim" type="tdate" stored="false" indexed="true" multiValued="true"/>
255
+ <dynamicField name="*_dtts" type="tdate" stored="true" indexed="false" multiValued="false"/>
256
+ <dynamicField name="*_dttsm" type="tdate" stored="true" indexed="false" multiValued="true"/>
257
+ <dynamicField name="*_dttsi" type="tdate" stored="true" indexed="true" multiValued="false"/>
258
+ <dynamicField name="*_dttsim" type="tdate" stored="true" indexed="true" multiValued="true"/>
259
+
260
+ <!-- long (_l...) -->
261
+ <dynamicField name="*_li" type="long" stored="false" indexed="true" multiValued="false"/>
262
+ <dynamicField name="*_lim" type="long" stored="false" indexed="true" multiValued="true"/>
263
+ <dynamicField name="*_ls" type="long" stored="true" indexed="false" multiValued="false"/>
264
+ <dynamicField name="*_lsm" type="long" stored="true" indexed="false" multiValued="true"/>
265
+ <dynamicField name="*_lsi" type="long" stored="true" indexed="true" multiValued="false"/>
266
+ <dynamicField name="*_lsim" type="long" stored="true" indexed="true" multiValued="true"/>
267
+
268
+ <!-- trie long (_lt...) (for faster range queries) -->
269
+ <dynamicField name="*_lti" type="tlong" stored="false" indexed="true" multiValued="false"/>
270
+ <dynamicField name="*_ltim" type="tlong" stored="false" indexed="true" multiValued="true"/>
271
+ <dynamicField name="*_lts" type="tlong" stored="true" indexed="false" multiValued="false"/>
272
+ <dynamicField name="*_ltsm" type="tlong" stored="true" indexed="false" multiValued="true"/>
273
+ <dynamicField name="*_ltsi" type="tlong" stored="true" indexed="true" multiValued="false"/>
274
+ <dynamicField name="*_ltsim" type="tlong" stored="true" indexed="true" multiValued="true"/>
275
+
276
+ <!-- double (_db...) -->
277
+ <dynamicField name="*_dbi" type="double" stored="false" indexed="true" multiValued="false"/>
278
+ <dynamicField name="*_dbim" type="double" stored="false" indexed="true" multiValued="true"/>
279
+ <dynamicField name="*_dbs" type="double" stored="true" indexed="false" multiValued="false"/>
280
+ <dynamicField name="*_dbsm" type="double" stored="true" indexed="false" multiValued="true"/>
281
+ <dynamicField name="*_dbsi" type="double" stored="true" indexed="true" multiValued="false"/>
282
+ <dynamicField name="*_dbsim" type="double" stored="true" indexed="true" multiValued="true"/>
283
+
284
+ <!-- trie double (_dbt...) (for faster range queries) -->
285
+ <dynamicField name="*_dbti" type="tdouble" stored="false" indexed="true" multiValued="false"/>
286
+ <dynamicField name="*_dbtim" type="tdouble" stored="false" indexed="true" multiValued="true"/>
287
+ <dynamicField name="*_dbts" type="tdouble" stored="true" indexed="false" multiValued="false"/>
288
+ <dynamicField name="*_dbtsm" type="tdouble" stored="true" indexed="false" multiValued="true"/>
289
+ <dynamicField name="*_dbtsi" type="tdouble" stored="true" indexed="true" multiValued="false"/>
290
+ <dynamicField name="*_dbtsim" type="tdouble" stored="true" indexed="true" multiValued="true"/>
291
+
292
+ <!-- float (_f...) -->
293
+ <dynamicField name="*_fi" type="float" stored="false" indexed="true" multiValued="false"/>
294
+ <dynamicField name="*_fim" type="float" stored="false" indexed="true" multiValued="true"/>
295
+ <dynamicField name="*_fs" type="float" stored="true" indexed="false" multiValued="false"/>
296
+ <dynamicField name="*_fsm" type="float" stored="true" indexed="false" multiValued="true"/>
297
+ <dynamicField name="*_fsi" type="float" stored="true" indexed="true" multiValued="false"/>
298
+ <dynamicField name="*_fsim" type="float" stored="true" indexed="true" multiValued="true"/>
299
+
300
+ <!-- trie float (_ft...) (for faster range queries) -->
301
+ <dynamicField name="*_fti" type="tfloat" stored="false" indexed="true" multiValued="false"/>
302
+ <dynamicField name="*_ftim" type="tfloat" stored="false" indexed="true" multiValued="true"/>
303
+ <dynamicField name="*_fts" type="tfloat" stored="true" indexed="false" multiValued="false"/>
304
+ <dynamicField name="*_ftsm" type="tfloat" stored="true" indexed="false" multiValued="true"/>
305
+ <dynamicField name="*_ftsi" type="tfloat" stored="true" indexed="true" multiValued="false"/>
306
+ <dynamicField name="*_ftsim" type="tfloat" stored="true" indexed="true" multiValued="true"/>
307
+
308
+ <!-- boolean (_b...) -->
309
+ <dynamicField name="*_bi" type="boolean" stored="false" indexed="true" multiValued="false"/>
310
+ <dynamicField name="*_bs" type="boolean" stored="true" indexed="false" multiValued="false"/>
311
+ <dynamicField name="*_bsi" type="boolean" stored="true" indexed="true" multiValued="false"/>
312
+
313
+ <!-- Type used to index the lat and lon components for the "location" FieldType -->
314
+ <dynamicField name="*_coordinate" type="tdouble" indexed="true" stored="false" />
315
+
316
+ <!-- location (_ll...) -->
317
+ <dynamicField name="*_lli" type="location" stored="false" indexed="true" multiValued="false"/>
318
+ <dynamicField name="*_llim" type="location" stored="false" indexed="true" multiValued="true"/>
319
+ <dynamicField name="*_lls" type="location" stored="true" indexed="false" multiValued="false"/>
320
+ <dynamicField name="*_llsm" type="location" stored="true" indexed="false" multiValued="true"/>
321
+ <dynamicField name="*_llsi" type="location" stored="true" indexed="true" multiValued="false"/>
322
+ <dynamicField name="*_llsim" type="location" stored="true" indexed="true" multiValued="true"/>
323
+
324
+ <dynamicField name="*suggest" type="textSuggest" indexed="true" stored="false" multiValued="true" />
325
+
326
+ <!-- you must define copyField source and dest fields explicity or schemaBrowser doesn't work -->
327
+ <field name="all_text_timv" type="text" stored="false" indexed="true" multiValued="true" termVectors="true" termPositions="true" termOffsets="true"/>
328
+
329
+
330
+ </fields>
331
+
332
+ <!-- Field to use to determine and enforce document uniqueness.
333
+ Unless this field is marked with required="false", it will be a required field
334
+ -->
335
+ <uniqueKey>id</uniqueKey>
336
+
337
+ <!-- field for the QueryParser to use when an explicit fieldname is absent -->
338
+ <!-- <defaultSearchField>text</defaultSearchField> -->
339
+
340
+ <!-- SolrQueryParser configuration: defaultOperator="AND|OR" -->
341
+ <solrQueryParser defaultOperator="OR"/>
342
+
343
+ <!-- copyField commands copy one field to another at the time a document
344
+ is added to the index. It's used either to index the same field differently,
345
+ or to add multiple fields to the same field for easier/faster searching. -->
346
+ <!-- Copy Fields -->
347
+
348
+ <!-- Above, multiple source fields are copied to the [text] field.
349
+ Another way to map multiple source fields to the same
350
+ destination field is to use the dynamic field syntax.
351
+ copyField also supports a maxChars to copy setting. -->
352
+
353
+ <!-- <copyField source="*_tesim" dest="all_text_timv" maxChars="3000"/> -->
354
+ <!-- for suggestions -->
355
+ <copyField source="*_tesim" dest="suggest"/>
356
+ <copyField source="*_ssim" dest="suggest"/>
357
+
358
+ <!-- Similarity is the scoring routine for each document vs. a query.
359
+ A custom similarity may be specified here, but the default is fine
360
+ for most applications. -->
361
+ <!-- <similarity class="org.apache.lucene.search.DefaultSimilarity"/> -->
362
+ <!-- ... OR ...
363
+ Specify a SimilarityFactory class name implementation
364
+ allowing parameters to be used.
365
+ -->
366
+ <!--
367
+ <similarity class="com.example.solr.CustomSimilarityFactory">
368
+ <str name="paramkey">param value</str>
369
+ </similarity>
370
+ -->
371
+
372
+ </schema>
@@ -0,0 +1,24 @@
1
+ # Licensed to the Apache Software Foundation (ASF) under one or more
2
+ # contributor license agreements. See the NOTICE file distributed with
3
+ # this work for additional information regarding copyright ownership.
4
+ # The ASF licenses this file to You under the Apache License, Version 2.0
5
+ # (the "License"); you may not use this file except in compliance with
6
+ # the License. You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
15
+
16
+ user=
17
+ solr_hostname=localhost
18
+ solr_port=8983
19
+ rsyncd_port=18983
20
+ data_dir=
21
+ webapp_name=solr
22
+ master_host=
23
+ master_data_dir=
24
+ master_status_dir=
@@ -0,0 +1,311 @@
1
+ <?xml version="1.0" encoding="UTF-8" ?>
2
+ <!--
3
+ Licensed to the Apache Software Foundation (ASF) under one or more
4
+ contributor license agreements. See the NOTICE file distributed with
5
+ this work for additional information regarding copyright ownership.
6
+ The ASF licenses this file to You under the Apache License, Version 2.0
7
+ (the "License"); you may not use this file except in compliance with
8
+ the License. You may obtain a copy of the License at
9
+
10
+ http://www.apache.org/licenses/LICENSE-2.0
11
+
12
+ Unless required by applicable law or agreed to in writing, software
13
+ distributed under the License is distributed on an "AS IS" BASIS,
14
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
15
+ See the License for the specific language governing permissions and
16
+ limitations under the License.
17
+ -->
18
+
19
+ <!--
20
+ This is a stripped down config file used for a simple example...
21
+ It is *not* a good example to work from.
22
+ -->
23
+ <config>
24
+
25
+ <!-- Controls what version of Lucene various components of Solr
26
+ adhere to. Generally, you want to use the latest version to
27
+ get all bug fixes and improvements. It is highly recommended
28
+ that you fully re-index after changing this setting as it can
29
+ affect both how text is indexed and queried.
30
+ -->
31
+ <luceneMatchVersion>5.0.0</luceneMatchVersion>
32
+
33
+ <lib dir="${solr.install.dir:../../../..}/contrib/analysis-extras/lib" />
34
+ <lib dir="${solr.install.dir:../../../..}/contrib/analysis-extras/lucene-libs" />
35
+ <lib dir="${solr.install.dir:../../../..}/contrib/extraction/lib" regex=".*\.jar" />
36
+ <lib dir="${solr.install.dir:../../../..}/dist/" regex="solr-cell-\d.*\.jar" />
37
+
38
+ <directoryFactory name="DirectoryFactory"
39
+ class="${solr.directoryFactory:solr.NRTCachingDirectoryFactory}">
40
+ </directoryFactory>
41
+
42
+ <codecFactory class="solr.SchemaCodecFactory"/>
43
+
44
+ <schemaFactory class="ClassicIndexSchemaFactory"/>
45
+
46
+
47
+ <dataDir>${solr.blacklight-core.data.dir:}</dataDir>
48
+
49
+ <requestDispatcher handleSelect="true" >
50
+ <requestParsers enableRemoteStreaming="false" multipartUploadLimitInKB="2048000" />
51
+ </requestDispatcher>
52
+
53
+ <requestHandler name="/analysis/field" startup="lazy" class="solr.FieldAnalysisRequestHandler" />
54
+
55
+ <!-- config for the admin interface -->
56
+ <admin>
57
+ <defaultQuery>*:*</defaultQuery>
58
+ </admin>
59
+
60
+ <updateHandler class="solr.DirectUpdateHandler2">
61
+ <updateLog>
62
+ <str name="dir">${solr.ulog.dir:}</str>
63
+ </updateLog>
64
+
65
+ <autoCommit>
66
+ <maxTime>${solr.autoCommit.maxTime:15000}</maxTime>
67
+ <openSearcher>false</openSearcher>
68
+ </autoCommit>
69
+
70
+ <autoSoftCommit>
71
+ <maxTime>${solr.autoSoftCommit.maxTime:-1}</maxTime>
72
+ </autoSoftCommit>
73
+ </updateHandler>
74
+
75
+ <!-- SearchHandler
76
+
77
+ http://wiki.apache.org/solr/SearchHandler
78
+
79
+ For processing Search Queries, the primary Request Handler
80
+ provided with Solr is "SearchHandler" It delegates to a sequent
81
+ of SearchComponents (see below) and supports distributed
82
+ queries across multiple shards
83
+ -->
84
+ <requestHandler name="search" class="solr.SearchHandler" default="true">
85
+ <!-- default values for query parameters can be specified, these
86
+ will be overridden by parameters in the request
87
+ -->
88
+ <lst name="defaults">
89
+ <str name="defType">edismax</str>
90
+ <str name="echoParams">explicit</str>
91
+ <str name="q.alt">*:*</str>
92
+ <str name="mm">2&lt;-1 5&lt;-2 6&lt;90%</str>
93
+ <int name="qs">1</int>
94
+ <int name="ps">2</int>
95
+ <float name="tie">0.01</float>
96
+ <!-- this qf and pf are used by default, if not otherwise specified by
97
+ client. The default blacklight_config will use these for the
98
+ "keywords" search. See the author_qf/author_pf, title_qf, etc
99
+ below, which the default blacklight_config will specify for
100
+ those searches. You may also be interested in:
101
+ http://wiki.apache.org/solr/LocalParams
102
+ -->
103
+ <str name="qf">
104
+ id
105
+ title_tesim
106
+ author_tesim
107
+ subject_tesim
108
+ </str>
109
+ <str name="pf">
110
+ all_text_timv^10
111
+ </str>
112
+
113
+ <str name="author_qf">
114
+ author_tesim
115
+ </str>
116
+ <str name="author_pf">
117
+ </str>
118
+ <str name="title_qf">
119
+ title_tesim
120
+ </str>
121
+ <str name="title_pf">
122
+ </str>
123
+ <str name="subject_qf">
124
+ subject_tesim
125
+ </str>
126
+ <str name="subject_pf">
127
+ </str>
128
+
129
+ <str name="fl">
130
+ *,
131
+ score
132
+ </str>
133
+
134
+ <str name="facet">true</str>
135
+ <str name="facet.mincount">1</str>
136
+
137
+ <str name="spellcheck">true</str>
138
+ <str name="spellcheck.dictionary">default</str>
139
+ <str name="spellcheck.onlyMorePopular">true</str>
140
+ <str name="spellcheck.extendedResults">true</str>
141
+ <str name="spellcheck.collate">false</str>
142
+ <str name="spellcheck.count">5</str>
143
+
144
+ </lst>
145
+ <arr name="last-components">
146
+ <str>spellcheck</str>
147
+ </arr>
148
+ </requestHandler>
149
+
150
+ <requestHandler name="permissions" class="solr.SearchHandler" >
151
+ <lst name="defaults">
152
+ <str name="facet">off</str>
153
+ <str name="echoParams">all</str>
154
+ <str name="rows">1</str>
155
+ <str name="q">{!raw f=id v=$id}</str> <!-- use id=666 instead of q=id:666 -->
156
+ <str name="fl">
157
+ id,
158
+ access_ssim,
159
+ discover_access_group_ssim,discover_access_person_ssim,
160
+ read_access_group_ssim,read_access_person_ssim,
161
+ edit_access_group_ssim,edit_access_person_ssim,
162
+ depositor_ti,
163
+ embargo_release_date_dtsi
164
+ inheritable_access_ssim,
165
+ inheritable_discover_access_group_ssim,inheritable_discover_access_person_ssim,
166
+ inheritable_read_access_group_ssim,inheritable_read_access_person_ssim,
167
+ inheritable_edit_access_group_ssim,inheritable_edit_access_person_ssim,
168
+ inheritable_embargo_release_date_dtsi
169
+ </str>
170
+ </lst>
171
+ </requestHandler>
172
+
173
+ <requestHandler name="standard" class="solr.SearchHandler">
174
+ <lst name="defaults">
175
+ <str name="echoParams">explicit</str>
176
+ <str name="defType">lucene</str>
177
+ </lst>
178
+ </requestHandler>
179
+
180
+ <!-- for requests to get a single document; use id=666 instead of q=id:666 -->
181
+ <requestHandler name="document" class="solr.SearchHandler" >
182
+ <lst name="defaults">
183
+ <str name="echoParams">all</str>
184
+ <str name="fl">*</str>
185
+ <str name="rows">1</str>
186
+ <str name="q">{!term f=id v=$id}</str> <!-- use id=666 instead of q=id:666 -->
187
+ </lst>
188
+ </requestHandler>
189
+
190
+ <!-- Spell Check
191
+
192
+ The spell check component can return a list of alternative spelling
193
+ suggestions.
194
+
195
+ http://wiki.apache.org/solr/SpellCheckComponent
196
+ -->
197
+ <searchComponent name="spellcheck" class="solr.SpellCheckComponent">
198
+
199
+ <str name="queryAnalyzerFieldType">textSpell</str>
200
+
201
+ <!-- Multiple "Spell Checkers" can be declared and used by this
202
+ component
203
+ -->
204
+
205
+ <!-- a spellchecker built from a field of the main index, and
206
+ written to disk
207
+ -->
208
+ <lst name="spellchecker">
209
+ <str name="name">default</str>
210
+ <str name="field">spell</str>
211
+ <str name="spellcheckIndexDir">./spell</str>
212
+ <str name="buildOnOptimize">true</str>
213
+ </lst>
214
+ <lst name="spellchecker">
215
+ <str name="name">author</str>
216
+ <str name="field">author_spell</str>
217
+ <str name="spellcheckIndexDir">./spell_author</str>
218
+ <str name="accuracy">0.7</str>
219
+ <str name="buildOnOptimize">true</str>
220
+ </lst>
221
+ <lst name="spellchecker">
222
+ <str name="name">subject</str>
223
+ <str name="field">subject_spell</str>
224
+ <str name="spellcheckIndexDir">./spell_subject</str>
225
+ <str name="accuracy">0.7</str>
226
+ <str name="buildOnOptimize">true</str>
227
+ </lst>
228
+ <lst name="spellchecker">
229
+ <str name="name">title</str>
230
+ <str name="field">title_spell</str>
231
+ <str name="spellcheckIndexDir">./spell_title</str>
232
+ <str name="accuracy">0.7</str>
233
+ <str name="buildOnOptimize">true</str>
234
+ </lst>
235
+
236
+ <!-- a spellchecker that uses a different distance measure -->
237
+ <!--
238
+ <lst name="spellchecker">
239
+ <str name="name">jarowinkler</str>
240
+ <str name="field">spell</str>
241
+ <str name="distanceMeasure">
242
+ org.apache.lucene.search.spell.JaroWinklerDistance
243
+ </str>
244
+ <str name="spellcheckIndexDir">spellcheckerJaro</str>
245
+ </lst>
246
+ -->
247
+
248
+ <!-- a spellchecker that use an alternate comparator
249
+
250
+ comparatorClass be one of:
251
+ 1. score (default)
252
+ 2. freq (Frequency first, then score)
253
+ 3. A fully qualified class name
254
+ -->
255
+ <!--
256
+ <lst name="spellchecker">
257
+ <str name="name">freq</str>
258
+ <str name="field">lowerfilt</str>
259
+ <str name="spellcheckIndexDir">spellcheckerFreq</str>
260
+ <str name="comparatorClass">freq</str>
261
+ <str name="buildOnCommit">true</str>
262
+ -->
263
+
264
+ <!-- A spellchecker that reads the list of words from a file -->
265
+ <!--
266
+ <lst name="spellchecker">
267
+ <str name="classname">solr.FileBasedSpellChecker</str>
268
+ <str name="name">file</str>
269
+ <str name="sourceLocation">spellings.txt</str>
270
+ <str name="characterEncoding">UTF-8</str>
271
+ <str name="spellcheckIndexDir">spellcheckerFile</str>
272
+ </lst>
273
+ -->
274
+ </searchComponent>
275
+
276
+ <searchComponent name="suggest" class="solr.SuggestComponent">
277
+ <lst name="suggester">
278
+ <str name="name">mySuggester</str>
279
+ <str name="lookupImpl">FuzzyLookupFactory</str>
280
+ <str name="suggestAnalyzerFieldType">textSuggest</str>
281
+ <str name="buildOnCommit">true</str>
282
+ <str name="field">suggest</str>
283
+ </lst>
284
+ </searchComponent>
285
+
286
+ <requestHandler name="/suggest" class="solr.SearchHandler" startup="lazy">
287
+ <lst name="defaults">
288
+ <str name="suggest">true</str>
289
+ <str name="suggest.count">5</str>
290
+ <str name="suggest.dictionary">mySuggester</str>
291
+ </lst>
292
+ <arr name="components">
293
+ <str>suggest</str>
294
+ </arr>
295
+ </requestHandler>
296
+
297
+ <requestHandler name="/update/extract" class="org.apache.solr.handler.extraction.ExtractingRequestHandler">
298
+ <lst name="defaults">
299
+ <str name="fmap.Last-Modified">last_modified</str>
300
+ <str name="uprefix">ignored_</str>
301
+ </lst>
302
+ <!--Optional. Specify a path to a tika configuration file. See the Tika docs for details.-->
303
+ <!-- <str name="tika.config">/my/path/to/tika.config</str> -->
304
+ <!-- Optional. Specify one or more date formats to parse. See DateUtil.DEFAULT_DATE_FORMATS
305
+ for default date formats -->
306
+ <!-- <lst name="date.formats"> -->
307
+ <!-- <str>yyyy&#45;MM&#45;dd</str> -->
308
+ <!-- </lst> -->
309
+ </requestHandler>
310
+ </config>
311
+