activefedora-aggregation 0.8.1 → 0.9.0

Sign up to get free protection for your applications and to get access to all the features.
@@ -0,0 +1,21 @@
1
+ # The ASF licenses this file to You under the Apache License, Version 2.0
2
+ # (the "License"); you may not use this file except in compliance with
3
+ # the License. You may obtain a copy of the License at
4
+ #
5
+ # http://www.apache.org/licenses/LICENSE-2.0
6
+ #
7
+ # Unless required by applicable law or agreed to in writing, software
8
+ # distributed under the License is distributed on an "AS IS" BASIS,
9
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
10
+ # See the License for the specific language governing permissions and
11
+ # limitations under the License.
12
+
13
+ #-----------------------------------------------------------------------
14
+ # Use a protected word file to protect against the stemmer reducing two
15
+ # unrelated words to the same base word.
16
+
17
+ # Some non-words that normally won't be encountered,
18
+ # just to test that they won't be stemmed.
19
+ dontstems
20
+ zwhacky
21
+
@@ -0,0 +1,372 @@
1
+ <?xml version="1.0" encoding="UTF-8" ?>
2
+ <!--
3
+ Licensed to the Apache Software Foundation (ASF) under one or more
4
+ contributor license agreements. See the NOTICE file distributed with
5
+ this work for additional information regarding copyright ownership.
6
+ The ASF licenses this file to You under the Apache License, Version 2.0
7
+ (the "License"); you may not use this file except in compliance with
8
+ the License. You may obtain a copy of the License at
9
+
10
+ http://www.apache.org/licenses/LICENSE-2.0
11
+
12
+ Unless required by applicable law or agreed to in writing, software
13
+ distributed under the License is distributed on an "AS IS" BASIS,
14
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
15
+ See the License for the specific language governing permissions and
16
+ limitations under the License.
17
+ -->
18
+
19
+ <!--
20
+ This is the Solr schema file. This file should be named "schema.xml" and
21
+ should be in the conf directory under the solr home
22
+ (i.e. ./solr/conf/schema.xml by default)
23
+ or located where the classloader for the Solr webapp can find it.
24
+
25
+ This example schema is the recommended starting point for users.
26
+ It should be kept correct and concise, usable out-of-the-box.
27
+
28
+ For more information, on how to customize this file, please see
29
+ http://wiki.apache.org/solr/SchemaXml
30
+
31
+ PERFORMANCE NOTE: this schema includes many optional features and should not
32
+ be used for benchmarking. To improve performance one could
33
+ - set stored="false" for all fields possible (esp large fields) when you
34
+ only need to search on the field but don't need to return the original
35
+ value.
36
+ - set indexed="false" if you don't need to search on the field, but only
37
+ return the field as a result of searching on other indexed fields.
38
+ - remove all unneeded copyField statements
39
+ - for best index size and searching performance, set "index" to false
40
+ for all general text fields, use copyField to copy them to the
41
+ catchall "text" field, and use that for searching.
42
+ - For maximum indexing performance, use the StreamingUpdateSolrServer
43
+ java client.
44
+ - Remember to run the JVM in server mode, and use a higher logging level
45
+ that avoids logging every request
46
+ -->
47
+
48
+ <schema name="Hydra Demo Index" version="1.5">
49
+ <!-- attribute "name" is the name of this schema and is only used for display purposes.
50
+ Applications should change this to reflect the nature of the search collection.
51
+ version="1.4" is Solr's version number for the schema syntax and semantics. It should
52
+ not normally be changed by applications.
53
+ 1.0: multiValued attribute did not exist, all fields are multiValued by nature
54
+ 1.1: multiValued attribute introduced, false by default
55
+ 1.2: omitTermFreqAndPositions attribute introduced, true by default except for text fields.
56
+ 1.3: removed optional field compress feature
57
+ 1.4: default auto-phrase (QueryParser feature) to off
58
+ -->
59
+
60
+ <types>
61
+ <fieldType name="string" class="solr.StrField" sortMissingLast="true" />
62
+ <fieldType name="boolean" class="solr.BoolField" sortMissingLast="true"/>
63
+ <fieldType name="rand" class="solr.RandomSortField" omitNorms="true"/>
64
+
65
+ <!-- Default numeric field types. -->
66
+ <fieldType name="int" class="solr.TrieIntField" precisionStep="0" positionIncrementGap="0"/>
67
+ <fieldType name="float" class="solr.TrieFloatField" precisionStep="0" positionIncrementGap="0"/>
68
+ <fieldType name="long" class="solr.TrieLongField" precisionStep="0" positionIncrementGap="0"/>
69
+ <fieldType name="double" class="solr.TrieDoubleField" precisionStep="0" positionIncrementGap="0"/>
70
+
71
+ <!-- trie numeric field types for faster range queries -->
72
+ <fieldType name="tint" class="solr.TrieIntField" precisionStep="8" positionIncrementGap="0"/>
73
+ <fieldType name="tfloat" class="solr.TrieFloatField" precisionStep="8" positionIncrementGap="0"/>
74
+ <fieldType name="tlong" class="solr.TrieLongField" precisionStep="8" positionIncrementGap="0"/>
75
+ <fieldType name="tdouble" class="solr.TrieDoubleField" precisionStep="8" positionIncrementGap="0"/>
76
+
77
+ <!-- The format for this date field is of the form 1995-12-31T23:59:59Z
78
+ Optional fractional seconds are allowed: 1995-12-31T23:59:59.999Z
79
+ -->
80
+ <fieldType name="date" class="solr.TrieDateField" precisionStep="0" positionIncrementGap="0"/>
81
+ <!-- A Trie based date field for faster date range queries and date faceting. -->
82
+ <fieldType name="tdate" class="solr.TrieDateField" precisionStep="6" positionIncrementGap="0"/>
83
+
84
+
85
+ <!-- This point type indexes the coordinates as separate fields (subFields)
86
+ If subFieldType is defined, it references a type, and a dynamic field
87
+ definition is created matching *___<typename>. Alternately, if
88
+ subFieldSuffix is defined, that is used to create the subFields.
89
+ Example: if subFieldType="double", then the coordinates would be
90
+ indexed in fields myloc_0___double,myloc_1___double.
91
+ Example: if subFieldSuffix="_d" then the coordinates would be indexed
92
+ in fields myloc_0_d,myloc_1_d
93
+ The subFields are an implementation detail of the fieldType, and end
94
+ users normally should not need to know about them.
95
+ -->
96
+ <fieldType name="point" class="solr.PointType" dimension="2" subFieldSuffix="_d"/>
97
+
98
+ <!-- A specialized field for geospatial search. If indexed, this fieldType must not be multivalued. -->
99
+ <fieldType name="location" class="solr.LatLonType" subFieldSuffix="_coordinate"/>
100
+
101
+ <!-- An alternative geospatial field type new to Solr 4. It supports multiValued and polygon shapes.
102
+ For more information about this and other Spatial fields new to Solr 4, see:
103
+ http://wiki.apache.org/solr/SolrAdaptersForLuceneSpatial4
104
+ -->
105
+ <fieldType name="location_rpt" class="solr.SpatialRecursivePrefixTreeFieldType"
106
+ geo="true" distErrPct="0.025" maxDistErr="0.000009" units="degrees" />
107
+
108
+ <fieldType name="text" class="solr.TextField" omitNorms="false">
109
+ <analyzer>
110
+ <tokenizer class="solr.ICUTokenizerFactory"/>
111
+ <filter class="solr.ICUFoldingFilterFactory"/> <!-- NFKC, case folding, diacritics removed -->
112
+ <filter class="solr.TrimFilterFactory"/>
113
+ </analyzer>
114
+ </fieldType>
115
+
116
+ <!-- A text field that only splits on whitespace for exact matching of words -->
117
+ <fieldType name="text_ws" class="solr.TextField" positionIncrementGap="100">
118
+ <analyzer>
119
+ <tokenizer class="solr.WhitespaceTokenizerFactory"/>
120
+ <filter class="solr.TrimFilterFactory"/>
121
+ </analyzer>
122
+ </fieldType>
123
+
124
+ <!-- single token analyzed text, for sorting. Punctuation is significant. -->
125
+ <fieldtype name="alphaSort" class="solr.TextField" sortMissingLast="true" omitNorms="true">
126
+ <analyzer>
127
+ <tokenizer class="solr.KeywordTokenizerFactory" />
128
+ <filter class="solr.ICUFoldingFilterFactory"/>
129
+ <filter class="solr.TrimFilterFactory" />
130
+ </analyzer>
131
+ </fieldtype>
132
+
133
+ <!-- A text field with defaults appropriate for English -->
134
+ <fieldType name="text_en" class="solr.TextField" positionIncrementGap="100">
135
+ <analyzer>
136
+ <tokenizer class="solr.ICUTokenizerFactory"/>
137
+ <filter class="solr.ICUFoldingFilterFactory"/> <!-- NFKC, case folding, diacritics removed -->
138
+ <filter class="solr.EnglishPossessiveFilterFactory"/>
139
+ <!-- EnglishMinimalStemFilterFactory is less aggressive than PorterStemFilterFactory: -->
140
+ <filter class="solr.EnglishMinimalStemFilterFactory"/>
141
+ <!--
142
+ <filter class="solr.PorterStemFilterFactory"/>
143
+ -->
144
+ <filter class="solr.TrimFilterFactory"/>
145
+ </analyzer>
146
+ </fieldType>
147
+
148
+ <!-- queries for paths match documents at that path, or in descendent paths -->
149
+ <fieldType name="descendent_path" class="solr.TextField">
150
+ <analyzer type="index">
151
+ <tokenizer class="solr.PathHierarchyTokenizerFactory" delimiter="/" />
152
+ </analyzer>
153
+ <analyzer type="query">
154
+ <tokenizer class="solr.KeywordTokenizerFactory" />
155
+ </analyzer>
156
+ </fieldType>
157
+
158
+ <!-- queries for paths match documents at that path, or in ancestor paths -->
159
+ <fieldType name="ancestor_path" class="solr.TextField">
160
+ <analyzer type="index">
161
+ <tokenizer class="solr.KeywordTokenizerFactory" />
162
+ </analyzer>
163
+ <analyzer type="query">
164
+ <tokenizer class="solr.PathHierarchyTokenizerFactory" delimiter="/" />
165
+ </analyzer>
166
+ </fieldType>
167
+
168
+ <fieldType class="solr.TextField" name="textSuggest" positionIncrementGap="100">
169
+ <analyzer>
170
+ <tokenizer class="solr.KeywordTokenizerFactory"/>
171
+ <filter class="solr.StandardFilterFactory"/>
172
+ <filter class="solr.LowerCaseFilterFactory"/>
173
+ <filter class="solr.RemoveDuplicatesTokenFilterFactory"/>
174
+ </analyzer>
175
+ </fieldType>
176
+ </types>
177
+
178
+
179
+ <fields>
180
+ <!-- If you remove this field, you must _also_ disable the update log in solrconfig.xml
181
+ or Solr won't start. _version_ and update log are required for SolrCloud
182
+ -->
183
+ <field name="_version_" type="long" indexed="true" stored="true"/>
184
+
185
+ <field name="id" type="string" stored="true" indexed="true" multiValued="false" required="true"/>
186
+ <field name="timestamp" type="date" indexed="true" stored="true" default="NOW" multiValued="false"/>
187
+
188
+ <field name="lat" type="tdouble" stored="true" indexed="true" multiValued="false"/>
189
+ <field name="lng" type="tdouble" stored="true" indexed="true" multiValued="false"/>
190
+
191
+ <!-- NOTE: not all possible Solr field types are represented in the dynamic fields -->
192
+
193
+ <!-- text (_t...) -->
194
+ <dynamicField name="*_ti" type="text" stored="false" indexed="true" multiValued="false"/>
195
+ <dynamicField name="*_tim" type="text" stored="false" indexed="true" multiValued="true"/>
196
+ <dynamicField name="*_ts" type="text" stored="true" indexed="false" multiValued="false"/>
197
+ <dynamicField name="*_tsm" type="text" stored="true" indexed="false" multiValued="true"/>
198
+ <dynamicField name="*_tsi" type="text" stored="true" indexed="true" multiValued="false"/>
199
+ <dynamicField name="*_tsim" type="text" stored="true" indexed="true" multiValued="true"/>
200
+ <dynamicField name="*_tiv" type="text" stored="false" indexed="true" multiValued="false" termVectors="true" termPositions="true" termOffsets="true"/>
201
+ <dynamicField name="*_timv" type="text" stored="false" indexed="true" multiValued="true" termVectors="true" termPositions="true" termOffsets="true"/>
202
+ <dynamicField name="*_tsiv" type="text" stored="true" indexed="true" multiValued="false" termVectors="true" termPositions="true" termOffsets="true"/>
203
+ <dynamicField name="*_tsimv" type="text" stored="true" indexed="true" multiValued="true" termVectors="true" termPositions="true" termOffsets="true"/>
204
+
205
+ <!-- English text (_te...) -->
206
+ <dynamicField name="*_tei" type="text_en" stored="false" indexed="true" multiValued="false"/>
207
+ <dynamicField name="*_teim" type="text_en" stored="false" indexed="true" multiValued="true"/>
208
+ <dynamicField name="*_tes" type="text_en" stored="true" indexed="false" multiValued="false"/>
209
+ <dynamicField name="*_tesm" type="text_en" stored="true" indexed="false" multiValued="true"/>
210
+ <dynamicField name="*_tesi" type="text_en" stored="true" indexed="true" multiValued="false"/>
211
+ <dynamicField name="*_tesim" type="text_en" stored="true" indexed="true" multiValued="true"/>
212
+ <dynamicField name="*_teiv" type="text_en" stored="false" indexed="true" multiValued="false" termVectors="true" termPositions="true" termOffsets="true"/>
213
+ <dynamicField name="*_teimv" type="text_en" stored="false" indexed="true" multiValued="true" termVectors="true" termPositions="true" termOffsets="true"/>
214
+ <dynamicField name="*_tesiv" type="text_en" stored="true" indexed="true" multiValued="false" termVectors="true" termPositions="true" termOffsets="true"/>
215
+ <dynamicField name="*_tesimv" type="text_en" stored="true" indexed="true" multiValued="true" termVectors="true" termPositions="true" termOffsets="true"/>
216
+
217
+ <!-- string (_s...) -->
218
+ <dynamicField name="*_si" type="string" stored="false" indexed="true" multiValued="false"/>
219
+ <dynamicField name="*_sim" type="string" stored="false" indexed="true" multiValued="true"/>
220
+ <dynamicField name="*_ss" type="string" stored="true" indexed="false" multiValued="false"/>
221
+ <dynamicField name="*_ssm" type="string" stored="true" indexed="false" multiValued="true"/>
222
+ <dynamicField name="*_ssi" type="string" stored="true" indexed="true" multiValued="false"/>
223
+ <dynamicField name="*_ssim" type="string" stored="true" indexed="true" multiValued="true"/>
224
+ <dynamicField name="*_ssort" type="alphaSort" stored="false" indexed="true" multiValued="false"/>
225
+
226
+ <!-- integer (_i...) -->
227
+ <dynamicField name="*_ii" type="int" stored="false" indexed="true" multiValued="false"/>
228
+ <dynamicField name="*_iim" type="int" stored="false" indexed="true" multiValued="true"/>
229
+ <dynamicField name="*_is" type="int" stored="true" indexed="false" multiValued="false"/>
230
+ <dynamicField name="*_ism" type="int" stored="true" indexed="false" multiValued="true"/>
231
+ <dynamicField name="*_isi" type="int" stored="true" indexed="true" multiValued="false"/>
232
+ <dynamicField name="*_isim" type="int" stored="true" indexed="true" multiValued="true"/>
233
+
234
+ <!-- trie integer (_it...) (for faster range queries) -->
235
+ <dynamicField name="*_iti" type="tint" stored="false" indexed="true" multiValued="false"/>
236
+ <dynamicField name="*_itim" type="tint" stored="false" indexed="true" multiValued="true"/>
237
+ <dynamicField name="*_its" type="tint" stored="true" indexed="false" multiValued="false"/>
238
+ <dynamicField name="*_itsm" type="tint" stored="true" indexed="false" multiValued="true"/>
239
+ <dynamicField name="*_itsi" type="tint" stored="true" indexed="true" multiValued="false"/>
240
+ <dynamicField name="*_itsim" type="tint" stored="true" indexed="true" multiValued="true"/>
241
+
242
+ <!-- date (_dt...) -->
243
+ <!-- The format for this date field is of the form 1995-12-31T23:59:59Z
244
+ Optional fractional seconds are allowed: 1995-12-31T23:59:59.999Z -->
245
+ <dynamicField name="*_dti" type="date" stored="false" indexed="true" multiValued="false"/>
246
+ <dynamicField name="*_dtim" type="date" stored="false" indexed="true" multiValued="true"/>
247
+ <dynamicField name="*_dts" type="date" stored="true" indexed="false" multiValued="false"/>
248
+ <dynamicField name="*_dtsm" type="date" stored="true" indexed="false" multiValued="true"/>
249
+ <dynamicField name="*_dtsi" type="date" stored="true" indexed="true" multiValued="false"/>
250
+ <dynamicField name="*_dtsim" type="date" stored="true" indexed="true" multiValued="true"/>
251
+
252
+ <!-- trie date (_dtt...) (for faster range queries) -->
253
+ <dynamicField name="*_dtti" type="tdate" stored="false" indexed="true" multiValued="false"/>
254
+ <dynamicField name="*_dttim" type="tdate" stored="false" indexed="true" multiValued="true"/>
255
+ <dynamicField name="*_dtts" type="tdate" stored="true" indexed="false" multiValued="false"/>
256
+ <dynamicField name="*_dttsm" type="tdate" stored="true" indexed="false" multiValued="true"/>
257
+ <dynamicField name="*_dttsi" type="tdate" stored="true" indexed="true" multiValued="false"/>
258
+ <dynamicField name="*_dttsim" type="tdate" stored="true" indexed="true" multiValued="true"/>
259
+
260
+ <!-- long (_l...) -->
261
+ <dynamicField name="*_li" type="long" stored="false" indexed="true" multiValued="false"/>
262
+ <dynamicField name="*_lim" type="long" stored="false" indexed="true" multiValued="true"/>
263
+ <dynamicField name="*_ls" type="long" stored="true" indexed="false" multiValued="false"/>
264
+ <dynamicField name="*_lsm" type="long" stored="true" indexed="false" multiValued="true"/>
265
+ <dynamicField name="*_lsi" type="long" stored="true" indexed="true" multiValued="false"/>
266
+ <dynamicField name="*_lsim" type="long" stored="true" indexed="true" multiValued="true"/>
267
+
268
+ <!-- trie long (_lt...) (for faster range queries) -->
269
+ <dynamicField name="*_lti" type="tlong" stored="false" indexed="true" multiValued="false"/>
270
+ <dynamicField name="*_ltim" type="tlong" stored="false" indexed="true" multiValued="true"/>
271
+ <dynamicField name="*_lts" type="tlong" stored="true" indexed="false" multiValued="false"/>
272
+ <dynamicField name="*_ltsm" type="tlong" stored="true" indexed="false" multiValued="true"/>
273
+ <dynamicField name="*_ltsi" type="tlong" stored="true" indexed="true" multiValued="false"/>
274
+ <dynamicField name="*_ltsim" type="tlong" stored="true" indexed="true" multiValued="true"/>
275
+
276
+ <!-- double (_db...) -->
277
+ <dynamicField name="*_dbi" type="double" stored="false" indexed="true" multiValued="false"/>
278
+ <dynamicField name="*_dbim" type="double" stored="false" indexed="true" multiValued="true"/>
279
+ <dynamicField name="*_dbs" type="double" stored="true" indexed="false" multiValued="false"/>
280
+ <dynamicField name="*_dbsm" type="double" stored="true" indexed="false" multiValued="true"/>
281
+ <dynamicField name="*_dbsi" type="double" stored="true" indexed="true" multiValued="false"/>
282
+ <dynamicField name="*_dbsim" type="double" stored="true" indexed="true" multiValued="true"/>
283
+
284
+ <!-- trie double (_dbt...) (for faster range queries) -->
285
+ <dynamicField name="*_dbti" type="tdouble" stored="false" indexed="true" multiValued="false"/>
286
+ <dynamicField name="*_dbtim" type="tdouble" stored="false" indexed="true" multiValued="true"/>
287
+ <dynamicField name="*_dbts" type="tdouble" stored="true" indexed="false" multiValued="false"/>
288
+ <dynamicField name="*_dbtsm" type="tdouble" stored="true" indexed="false" multiValued="true"/>
289
+ <dynamicField name="*_dbtsi" type="tdouble" stored="true" indexed="true" multiValued="false"/>
290
+ <dynamicField name="*_dbtsim" type="tdouble" stored="true" indexed="true" multiValued="true"/>
291
+
292
+ <!-- float (_f...) -->
293
+ <dynamicField name="*_fi" type="float" stored="false" indexed="true" multiValued="false"/>
294
+ <dynamicField name="*_fim" type="float" stored="false" indexed="true" multiValued="true"/>
295
+ <dynamicField name="*_fs" type="float" stored="true" indexed="false" multiValued="false"/>
296
+ <dynamicField name="*_fsm" type="float" stored="true" indexed="false" multiValued="true"/>
297
+ <dynamicField name="*_fsi" type="float" stored="true" indexed="true" multiValued="false"/>
298
+ <dynamicField name="*_fsim" type="float" stored="true" indexed="true" multiValued="true"/>
299
+
300
+ <!-- trie float (_ft...) (for faster range queries) -->
301
+ <dynamicField name="*_fti" type="tfloat" stored="false" indexed="true" multiValued="false"/>
302
+ <dynamicField name="*_ftim" type="tfloat" stored="false" indexed="true" multiValued="true"/>
303
+ <dynamicField name="*_fts" type="tfloat" stored="true" indexed="false" multiValued="false"/>
304
+ <dynamicField name="*_ftsm" type="tfloat" stored="true" indexed="false" multiValued="true"/>
305
+ <dynamicField name="*_ftsi" type="tfloat" stored="true" indexed="true" multiValued="false"/>
306
+ <dynamicField name="*_ftsim" type="tfloat" stored="true" indexed="true" multiValued="true"/>
307
+
308
+ <!-- boolean (_b...) -->
309
+ <dynamicField name="*_bi" type="boolean" stored="false" indexed="true" multiValued="false"/>
310
+ <dynamicField name="*_bs" type="boolean" stored="true" indexed="false" multiValued="false"/>
311
+ <dynamicField name="*_bsi" type="boolean" stored="true" indexed="true" multiValued="false"/>
312
+
313
+ <!-- Type used to index the lat and lon components for the "location" FieldType -->
314
+ <dynamicField name="*_coordinate" type="tdouble" indexed="true" stored="false" />
315
+
316
+ <!-- location (_ll...) -->
317
+ <dynamicField name="*_lli" type="location" stored="false" indexed="true" multiValued="false"/>
318
+ <dynamicField name="*_llim" type="location" stored="false" indexed="true" multiValued="true"/>
319
+ <dynamicField name="*_lls" type="location" stored="true" indexed="false" multiValued="false"/>
320
+ <dynamicField name="*_llsm" type="location" stored="true" indexed="false" multiValued="true"/>
321
+ <dynamicField name="*_llsi" type="location" stored="true" indexed="true" multiValued="false"/>
322
+ <dynamicField name="*_llsim" type="location" stored="true" indexed="true" multiValued="true"/>
323
+
324
+ <dynamicField name="*suggest" type="textSuggest" indexed="true" stored="false" multiValued="true" />
325
+
326
+ <!-- you must define copyField source and dest fields explicity or schemaBrowser doesn't work -->
327
+ <field name="all_text_timv" type="text" stored="false" indexed="true" multiValued="true" termVectors="true" termPositions="true" termOffsets="true"/>
328
+
329
+
330
+ </fields>
331
+
332
+ <!-- Field to use to determine and enforce document uniqueness.
333
+ Unless this field is marked with required="false", it will be a required field
334
+ -->
335
+ <uniqueKey>id</uniqueKey>
336
+
337
+ <!-- field for the QueryParser to use when an explicit fieldname is absent -->
338
+ <!-- <defaultSearchField>text</defaultSearchField> -->
339
+
340
+ <!-- SolrQueryParser configuration: defaultOperator="AND|OR" -->
341
+ <solrQueryParser defaultOperator="OR"/>
342
+
343
+ <!-- copyField commands copy one field to another at the time a document
344
+ is added to the index. It's used either to index the same field differently,
345
+ or to add multiple fields to the same field for easier/faster searching. -->
346
+ <!-- Copy Fields -->
347
+
348
+ <!-- Above, multiple source fields are copied to the [text] field.
349
+ Another way to map multiple source fields to the same
350
+ destination field is to use the dynamic field syntax.
351
+ copyField also supports a maxChars to copy setting. -->
352
+
353
+ <!-- <copyField source="*_tesim" dest="all_text_timv" maxChars="3000"/> -->
354
+ <!-- for suggestions -->
355
+ <copyField source="*_tesim" dest="suggest"/>
356
+ <copyField source="*_ssim" dest="suggest"/>
357
+
358
+ <!-- Similarity is the scoring routine for each document vs. a query.
359
+ A custom similarity may be specified here, but the default is fine
360
+ for most applications. -->
361
+ <!-- <similarity class="org.apache.lucene.search.DefaultSimilarity"/> -->
362
+ <!-- ... OR ...
363
+ Specify a SimilarityFactory class name implementation
364
+ allowing parameters to be used.
365
+ -->
366
+ <!--
367
+ <similarity class="com.example.solr.CustomSimilarityFactory">
368
+ <str name="paramkey">param value</str>
369
+ </similarity>
370
+ -->
371
+
372
+ </schema>
@@ -0,0 +1,24 @@
1
+ # Licensed to the Apache Software Foundation (ASF) under one or more
2
+ # contributor license agreements. See the NOTICE file distributed with
3
+ # this work for additional information regarding copyright ownership.
4
+ # The ASF licenses this file to You under the Apache License, Version 2.0
5
+ # (the "License"); you may not use this file except in compliance with
6
+ # the License. You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
15
+
16
+ user=
17
+ solr_hostname=localhost
18
+ solr_port=8983
19
+ rsyncd_port=18983
20
+ data_dir=
21
+ webapp_name=solr
22
+ master_host=
23
+ master_data_dir=
24
+ master_status_dir=
@@ -0,0 +1,297 @@
1
+ <?xml version="1.0" encoding="UTF-8" ?>
2
+ <!--
3
+ Licensed to the Apache Software Foundation (ASF) under one or more
4
+ contributor license agreements. See the NOTICE file distributed with
5
+ this work for additional information regarding copyright ownership.
6
+ The ASF licenses this file to You under the Apache License, Version 2.0
7
+ (the "License"); you may not use this file except in compliance with
8
+ the License. You may obtain a copy of the License at
9
+
10
+ http://www.apache.org/licenses/LICENSE-2.0
11
+
12
+ Unless required by applicable law or agreed to in writing, software
13
+ distributed under the License is distributed on an "AS IS" BASIS,
14
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
15
+ See the License for the specific language governing permissions and
16
+ limitations under the License.
17
+ -->
18
+
19
+ <!--
20
+ This is a stripped down config file used for a simple example...
21
+ It is *not* a good example to work from.
22
+ -->
23
+ <config>
24
+
25
+ <!-- Controls what version of Lucene various components of Solr
26
+ adhere to. Generally, you want to use the latest version to
27
+ get all bug fixes and improvements. It is highly recommended
28
+ that you fully re-index after changing this setting as it can
29
+ affect both how text is indexed and queried.
30
+ -->
31
+ <luceneMatchVersion>5.0.0</luceneMatchVersion>
32
+
33
+ <lib dir="${solr.install.dir:../../../..}/contrib/analysis-extras/lib" />
34
+ <lib dir="${solr.install.dir:../../../..}/contrib/analysis-extras/lucene-libs" />
35
+ <lib dir="${solr.install.dir:../../../..}/contrib/extraction/lib" regex=".*\.jar" />
36
+ <lib dir="${solr.install.dir:../../../..}/dist/" regex="solr-cell-\d.*\.jar" />
37
+
38
+ <directoryFactory name="DirectoryFactory"
39
+ class="${solr.directoryFactory:solr.NRTCachingDirectoryFactory}">
40
+ </directoryFactory>
41
+
42
+ <codecFactory class="solr.SchemaCodecFactory"/>
43
+
44
+ <schemaFactory class="ClassicIndexSchemaFactory"/>
45
+
46
+
47
+ <dataDir>${solr.blacklight-core.data.dir:}</dataDir>
48
+
49
+ <requestDispatcher handleSelect="true" >
50
+ <requestParsers enableRemoteStreaming="false" multipartUploadLimitInKB="2048000" />
51
+ </requestDispatcher>
52
+
53
+ <requestHandler name="/analysis/field" startup="lazy" class="solr.FieldAnalysisRequestHandler" />
54
+
55
+ <!-- config for the admin interface -->
56
+ <admin>
57
+ <defaultQuery>*:*</defaultQuery>
58
+ </admin>
59
+
60
+ <!-- SearchHandler
61
+
62
+ http://wiki.apache.org/solr/SearchHandler
63
+
64
+ For processing Search Queries, the primary Request Handler
65
+ provided with Solr is "SearchHandler" It delegates to a sequent
66
+ of SearchComponents (see below) and supports distributed
67
+ queries across multiple shards
68
+ -->
69
+ <requestHandler name="search" class="solr.SearchHandler" default="true">
70
+ <!-- default values for query parameters can be specified, these
71
+ will be overridden by parameters in the request
72
+ -->
73
+ <lst name="defaults">
74
+ <str name="defType">edismax</str>
75
+ <str name="echoParams">explicit</str>
76
+ <str name="q.alt">*:*</str>
77
+ <str name="mm">2&lt;-1 5&lt;-2 6&lt;90%</str>
78
+ <int name="qs">1</int>
79
+ <int name="ps">2</int>
80
+ <float name="tie">0.01</float>
81
+ <!-- this qf and pf are used by default, if not otherwise specified by
82
+ client. The default blacklight_config will use these for the
83
+ "keywords" search. See the author_qf/author_pf, title_qf, etc
84
+ below, which the default blacklight_config will specify for
85
+ those searches. You may also be interested in:
86
+ http://wiki.apache.org/solr/LocalParams
87
+ -->
88
+ <str name="qf">
89
+ id
90
+ active_fedora_model_ssi
91
+ title_tesim
92
+ author_tesim
93
+ subject_tesim
94
+ </str>
95
+ <str name="pf">
96
+ all_text_timv^10
97
+ </str>
98
+
99
+ <str name="author_qf">
100
+ author_tesim
101
+ </str>
102
+ <str name="author_pf">
103
+ </str>
104
+ <str name="title_qf">
105
+ title_tesim
106
+ </str>
107
+ <str name="title_pf">
108
+ </str>
109
+ <str name="subject_qf">
110
+ subject_tesim
111
+ </str>
112
+ <str name="subject_pf">
113
+ </str>
114
+
115
+ <str name="fl">
116
+ *,
117
+ score
118
+ </str>
119
+
120
+ <str name="facet">true</str>
121
+ <str name="facet.mincount">1</str>
122
+
123
+ <str name="spellcheck">true</str>
124
+ <str name="spellcheck.dictionary">default</str>
125
+ <str name="spellcheck.onlyMorePopular">true</str>
126
+ <str name="spellcheck.extendedResults">true</str>
127
+ <str name="spellcheck.collate">false</str>
128
+ <str name="spellcheck.count">5</str>
129
+
130
+ </lst>
131
+ <arr name="last-components">
132
+ <str>spellcheck</str>
133
+ </arr>
134
+ </requestHandler>
135
+
136
+ <requestHandler name="permissions" class="solr.SearchHandler" >
137
+ <lst name="defaults">
138
+ <str name="facet">off</str>
139
+ <str name="echoParams">all</str>
140
+ <str name="rows">1</str>
141
+ <str name="q">{!raw f=id v=$id}</str> <!-- use id=666 instead of q=id:666 -->
142
+ <str name="fl">
143
+ id,
144
+ access_ssim,
145
+ discover_access_group_ssim,discover_access_person_ssim,
146
+ read_access_group_ssim,read_access_person_ssim,
147
+ edit_access_group_ssim,edit_access_person_ssim,
148
+ depositor_ti,
149
+ embargo_release_date_dtsi
150
+ inheritable_access_ssim,
151
+ inheritable_discover_access_group_ssim,inheritable_discover_access_person_ssim,
152
+ inheritable_read_access_group_ssim,inheritable_read_access_person_ssim,
153
+ inheritable_edit_access_group_ssim,inheritable_edit_access_person_ssim,
154
+ inheritable_embargo_release_date_dtsi
155
+ </str>
156
+ </lst>
157
+ </requestHandler>
158
+
159
+ <requestHandler name="standard" class="solr.SearchHandler">
160
+ <lst name="defaults">
161
+ <str name="echoParams">explicit</str>
162
+ <str name="defType">lucene</str>
163
+ </lst>
164
+ </requestHandler>
165
+
166
+ <!-- for requests to get a single document; use id=666 instead of q=id:666 -->
167
+ <requestHandler name="document" class="solr.SearchHandler" >
168
+ <lst name="defaults">
169
+ <str name="echoParams">all</str>
170
+ <str name="fl">*</str>
171
+ <str name="rows">1</str>
172
+ <str name="q">{!term f=id v=$id}</str> <!-- use id=666 instead of q=id:666 -->
173
+ </lst>
174
+ </requestHandler>
175
+
176
+ <!-- Spell Check
177
+
178
+ The spell check component can return a list of alternative spelling
179
+ suggestions.
180
+
181
+ http://wiki.apache.org/solr/SpellCheckComponent
182
+ -->
183
+ <searchComponent name="spellcheck" class="solr.SpellCheckComponent">
184
+
185
+ <str name="queryAnalyzerFieldType">textSpell</str>
186
+
187
+ <!-- Multiple "Spell Checkers" can be declared and used by this
188
+ component
189
+ -->
190
+
191
+ <!-- a spellchecker built from a field of the main index, and
192
+ written to disk
193
+ -->
194
+ <lst name="spellchecker">
195
+ <str name="name">default</str>
196
+ <str name="field">spell</str>
197
+ <str name="spellcheckIndexDir">./spell</str>
198
+ <str name="buildOnOptimize">true</str>
199
+ </lst>
200
+ <lst name="spellchecker">
201
+ <str name="name">author</str>
202
+ <str name="field">author_spell</str>
203
+ <str name="spellcheckIndexDir">./spell_author</str>
204
+ <str name="accuracy">0.7</str>
205
+ <str name="buildOnOptimize">true</str>
206
+ </lst>
207
+ <lst name="spellchecker">
208
+ <str name="name">subject</str>
209
+ <str name="field">subject_spell</str>
210
+ <str name="spellcheckIndexDir">./spell_subject</str>
211
+ <str name="accuracy">0.7</str>
212
+ <str name="buildOnOptimize">true</str>
213
+ </lst>
214
+ <lst name="spellchecker">
215
+ <str name="name">title</str>
216
+ <str name="field">title_spell</str>
217
+ <str name="spellcheckIndexDir">./spell_title</str>
218
+ <str name="accuracy">0.7</str>
219
+ <str name="buildOnOptimize">true</str>
220
+ </lst>
221
+
222
+ <!-- a spellchecker that uses a different distance measure -->
223
+ <!--
224
+ <lst name="spellchecker">
225
+ <str name="name">jarowinkler</str>
226
+ <str name="field">spell</str>
227
+ <str name="distanceMeasure">
228
+ org.apache.lucene.search.spell.JaroWinklerDistance
229
+ </str>
230
+ <str name="spellcheckIndexDir">spellcheckerJaro</str>
231
+ </lst>
232
+ -->
233
+
234
+ <!-- a spellchecker that use an alternate comparator
235
+
236
+ comparatorClass be one of:
237
+ 1. score (default)
238
+ 2. freq (Frequency first, then score)
239
+ 3. A fully qualified class name
240
+ -->
241
+ <!--
242
+ <lst name="spellchecker">
243
+ <str name="name">freq</str>
244
+ <str name="field">lowerfilt</str>
245
+ <str name="spellcheckIndexDir">spellcheckerFreq</str>
246
+ <str name="comparatorClass">freq</str>
247
+ <str name="buildOnCommit">true</str>
248
+ -->
249
+
250
+ <!-- A spellchecker that reads the list of words from a file -->
251
+ <!--
252
+ <lst name="spellchecker">
253
+ <str name="classname">solr.FileBasedSpellChecker</str>
254
+ <str name="name">file</str>
255
+ <str name="sourceLocation">spellings.txt</str>
256
+ <str name="characterEncoding">UTF-8</str>
257
+ <str name="spellcheckIndexDir">spellcheckerFile</str>
258
+ </lst>
259
+ -->
260
+ </searchComponent>
261
+
262
+ <searchComponent name="suggest" class="solr.SuggestComponent">
263
+ <lst name="suggester">
264
+ <str name="name">mySuggester</str>
265
+ <str name="lookupImpl">FuzzyLookupFactory</str>
266
+ <str name="suggestAnalyzerFieldType">textSuggest</str>
267
+ <str name="buildOnCommit">true</str>
268
+ <str name="field">suggest</str>
269
+ </lst>
270
+ </searchComponent>
271
+
272
+ <requestHandler name="/suggest" class="solr.SearchHandler" startup="lazy">
273
+ <lst name="defaults">
274
+ <str name="suggest">true</str>
275
+ <str name="suggest.count">5</str>
276
+ <str name="suggest.dictionary">mySuggester</str>
277
+ </lst>
278
+ <arr name="components">
279
+ <str>suggest</str>
280
+ </arr>
281
+ </requestHandler>
282
+
283
+ <requestHandler name="/update/extract" class="org.apache.solr.handler.extraction.ExtractingRequestHandler">
284
+ <lst name="defaults">
285
+ <str name="fmap.Last-Modified">last_modified</str>
286
+ <str name="uprefix">ignored_</str>
287
+ </lst>
288
+ <!--Optional. Specify a path to a tika configuration file. See the Tika docs for details.-->
289
+ <!-- <str name="tika.config">/my/path/to/tika.config</str> -->
290
+ <!-- Optional. Specify one or more date formats to parse. See DateUtil.DEFAULT_DATE_FORMATS
291
+ for default date formats -->
292
+ <!-- <lst name="date.formats"> -->
293
+ <!-- <str>yyyy&#45;MM&#45;dd</str> -->
294
+ <!-- </lst> -->
295
+ </requestHandler>
296
+ </config>
297
+