zizia 2.0.0.alpha.01 → 2.1.0.alpha.01

Sign up to get free protection for your applications and to get access to all the features.
@@ -0,0 +1,21 @@
1
+ # The ASF licenses this file to You under the Apache License, Version 2.0
2
+ # (the "License"); you may not use this file except in compliance with
3
+ # the License. You may obtain a copy of the License at
4
+ #
5
+ # http://www.apache.org/licenses/LICENSE-2.0
6
+ #
7
+ # Unless required by applicable law or agreed to in writing, software
8
+ # distributed under the License is distributed on an "AS IS" BASIS,
9
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
10
+ # See the License for the specific language governing permissions and
11
+ # limitations under the License.
12
+
13
+ #-----------------------------------------------------------------------
14
+ # Use a protected word file to protect against the stemmer reducing two
15
+ # unrelated words to the same base word.
16
+
17
+ # Some non-words that normally won't be encountered,
18
+ # just to test that they won't be stemmed.
19
+ dontstems
20
+ zwhacky
21
+
@@ -0,0 +1,9 @@
1
+ # frozen_string_literal: true
2
+ Zizia::Engine.routes.draw do
3
+ get 'importer_documentation/guide'
4
+ get 'importer_documentation/csv'
5
+
6
+ post 'csv_imports/preview', as: 'preview_csv_import'
7
+ get 'csv_imports/preview', to: redirect('csv_imports/new')
8
+ resources :csv_imports, only: [:index, :show, :new, :create]
9
+ end
@@ -0,0 +1,366 @@
1
+ <?xml version="1.0" encoding="UTF-8" ?>
2
+ <!--
3
+ Licensed to the Apache Software Foundation (ASF) under one or more
4
+ contributor license agreements. See the NOTICE file distributed with
5
+ this work for additional information regarding copyright ownership.
6
+ The ASF licenses this file to You under the Apache License, Version 2.0
7
+ (the "License"); you may not use this file except in compliance with
8
+ the License. You may obtain a copy of the License at
9
+
10
+ http://www.apache.org/licenses/LICENSE-2.0
11
+
12
+ Unless required by applicable law or agreed to in writing, software
13
+ distributed under the License is distributed on an "AS IS" BASIS,
14
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
15
+ See the License for the specific language governing permissions and
16
+ limitations under the License.
17
+ -->
18
+
19
+ <!--
20
+ This is the Solr schema file. This file should be named "schema.xml" and
21
+ should be in the conf directory under the solr home
22
+ (i.e. ./solr/conf/schema.xml by default)
23
+ or located where the classloader for the Solr webapp can find it.
24
+
25
+ This example schema is the recommended starting point for users.
26
+ It should be kept correct and concise, usable out-of-the-box.
27
+
28
+ For more information, on how to customize this file, please see
29
+ http://wiki.apache.org/solr/SchemaXml
30
+
31
+ PERFORMANCE NOTE: this schema includes many optional features and should not
32
+ be used for benchmarking. To improve performance one could
33
+ - set stored="false" for all fields possible (esp large fields) when you
34
+ only need to search on the field but don't need to return the original
35
+ value.
36
+ - set indexed="false" if you don't need to search on the field, but only
37
+ return the field as a result of searching on other indexed fields.
38
+ - remove all unneeded copyField statements
39
+ - for best index size and searching performance, set "index" to false
40
+ for all general text fields, use copyField to copy them to the
41
+ catchall "text" field, and use that for searching.
42
+ - For maximum indexing performance, use the StreamingUpdateSolrServer
43
+ java client.
44
+ - Remember to run the JVM in server mode, and use a higher logging level
45
+ that avoids logging every request
46
+ -->
47
+
48
+ <schema name="Hydra Demo Index" version="1.5">
49
+ <!-- attribute "name" is the name of this schema and is only used for display purposes.
50
+ Applications should change this to reflect the nature of the search collection.
51
+ version="1.4" is Solr's version number for the schema syntax and semantics. It should
52
+ not normally be changed by applications.
53
+ 1.0: multiValued attribute did not exist, all fields are multiValued by nature
54
+ 1.1: multiValued attribute introduced, false by default
55
+ 1.2: omitTermFreqAndPositions attribute introduced, true by default except for text fields.
56
+ 1.3: removed optional field compress feature
57
+ 1.4: default auto-phrase (QueryParser feature) to off
58
+ -->
59
+
60
+ <types>
61
+ <fieldType name="string" class="solr.StrField" sortMissingLast="true" />
62
+ <fieldType name="boolean" class="solr.BoolField" sortMissingLast="true"/>
63
+ <fieldType name="rand" class="solr.RandomSortField" omitNorms="true"/>
64
+
65
+ <!-- Default numeric field types. -->
66
+ <fieldType name="int" class="solr.TrieIntField" precisionStep="0" positionIncrementGap="0"/>
67
+ <fieldType name="float" class="solr.TrieFloatField" precisionStep="0" positionIncrementGap="0"/>
68
+ <fieldType name="long" class="solr.TrieLongField" precisionStep="0" positionIncrementGap="0"/>
69
+ <fieldType name="double" class="solr.TrieDoubleField" precisionStep="0" positionIncrementGap="0"/>
70
+
71
+ <!-- trie numeric field types for faster range queries -->
72
+ <fieldType name="tint" class="solr.TrieIntField" precisionStep="8" positionIncrementGap="0"/>
73
+ <fieldType name="tfloat" class="solr.TrieFloatField" precisionStep="8" positionIncrementGap="0"/>
74
+ <fieldType name="tlong" class="solr.TrieLongField" precisionStep="8" positionIncrementGap="0"/>
75
+ <fieldType name="tdouble" class="solr.TrieDoubleField" precisionStep="8" positionIncrementGap="0"/>
76
+
77
+ <!-- The format for this date field is of the form 1995-12-31T23:59:59Z
78
+ Optional fractional seconds are allowed: 1995-12-31T23:59:59.999Z
79
+ -->
80
+ <fieldType name="date" class="solr.TrieDateField" precisionStep="0" positionIncrementGap="0"/>
81
+ <!-- A Trie based date field for faster date range queries and date faceting. -->
82
+ <fieldType name="tdate" class="solr.TrieDateField" precisionStep="6" positionIncrementGap="0"/>
83
+
84
+
85
+ <!-- This point type indexes the coordinates as separate fields (subFields)
86
+ If subFieldType is defined, it references a type, and a dynamic field
87
+ definition is created matching *___<typename>. Alternately, if
88
+ subFieldSuffix is defined, that is used to create the subFields.
89
+ Example: if subFieldType="double", then the coordinates would be
90
+ indexed in fields myloc_0___double,myloc_1___double.
91
+ Example: if subFieldSuffix="_d" then the coordinates would be indexed
92
+ in fields myloc_0_d,myloc_1_d
93
+ The subFields are an implementation detail of the fieldType, and end
94
+ users normally should not need to know about them.
95
+ -->
96
+ <fieldType name="point" class="solr.PointType" dimension="2" subFieldSuffix="_d"/>
97
+
98
+ <!-- A specialized field for geospatial search. If indexed, this fieldType must not be multivalued. -->
99
+ <fieldType name="location" class="solr.LatLonType" subFieldSuffix="_coordinate"/>
100
+
101
+ <!-- An alternative geospatial field type new to Solr 4. It supports multiValued and polygon shapes.
102
+ For more information about this and other Spatial fields new to Solr 4, see:
103
+ http://wiki.apache.org/solr/SolrAdaptersForLuceneSpatial4
104
+ -->
105
+ <fieldType name="location_rpt" class="solr.SpatialRecursivePrefixTreeFieldType"
106
+ geo="true" distErrPct="0.025" maxDistErr="0.000009" distanceUnits="degrees" />
107
+
108
+ <fieldType name="text" class="solr.TextField" omitNorms="false">
109
+ <analyzer>
110
+ <tokenizer class="solr.ICUTokenizerFactory"/>
111
+ <filter class="solr.ICUFoldingFilterFactory"/> <!-- NFKC, case folding, diacritics removed -->
112
+ <filter class="solr.TrimFilterFactory"/>
113
+ </analyzer>
114
+ </fieldType>
115
+
116
+ <!-- A text field that only splits on whitespace for exact matching of words -->
117
+ <fieldType name="text_ws" class="solr.TextField" positionIncrementGap="100">
118
+ <analyzer>
119
+ <tokenizer class="solr.WhitespaceTokenizerFactory"/>
120
+ <filter class="solr.TrimFilterFactory"/>
121
+ </analyzer>
122
+ </fieldType>
123
+
124
+ <!-- single token analyzed text, for sorting. Punctuation is significant. -->
125
+ <fieldtype name="alphaSort" class="solr.TextField" sortMissingLast="true" omitNorms="true">
126
+ <analyzer>
127
+ <tokenizer class="solr.KeywordTokenizerFactory" />
128
+ <filter class="solr.ICUFoldingFilterFactory"/>
129
+ <filter class="solr.TrimFilterFactory" />
130
+ </analyzer>
131
+ </fieldtype>
132
+
133
+ <!-- A text field with defaults appropriate for English -->
134
+ <fieldType name="text_en" class="solr.TextField" positionIncrementGap="100">
135
+ <analyzer>
136
+ <tokenizer class="solr.ICUTokenizerFactory"/>
137
+ <filter class="solr.ICUFoldingFilterFactory"/> <!-- NFKC, case folding, diacritics removed -->
138
+ <filter class="solr.EnglishPossessiveFilterFactory"/>
139
+ <!-- EnglishMinimalStemFilterFactory is less aggressive than PorterStemFilterFactory: -->
140
+ <filter class="solr.EnglishMinimalStemFilterFactory"/>
141
+ <!--
142
+ <filter class="solr.PorterStemFilterFactory"/>
143
+ -->
144
+ <filter class="solr.TrimFilterFactory"/>
145
+ </analyzer>
146
+ </fieldType>
147
+
148
+ <!-- queries for paths match documents at that path, or in descendent paths -->
149
+ <fieldType name="descendent_path" class="solr.TextField">
150
+ <analyzer type="index">
151
+ <tokenizer class="solr.PathHierarchyTokenizerFactory" delimiter="/" />
152
+ </analyzer>
153
+ <analyzer type="query">
154
+ <tokenizer class="solr.KeywordTokenizerFactory" />
155
+ </analyzer>
156
+ </fieldType>
157
+
158
+ <!-- queries for paths match documents at that path, or in ancestor paths -->
159
+ <fieldType name="ancestor_path" class="solr.TextField">
160
+ <analyzer type="index">
161
+ <tokenizer class="solr.KeywordTokenizerFactory" />
162
+ </analyzer>
163
+ <analyzer type="query">
164
+ <tokenizer class="solr.PathHierarchyTokenizerFactory" delimiter="/" />
165
+ </analyzer>
166
+ </fieldType>
167
+
168
+ <fieldType class="solr.TextField" name="textSuggest" positionIncrementGap="100">
169
+ <analyzer>
170
+ <tokenizer class="solr.KeywordTokenizerFactory"/>
171
+ <filter class="solr.StandardFilterFactory"/>
172
+ <filter class="solr.LowerCaseFilterFactory"/>
173
+ <filter class="solr.RemoveDuplicatesTokenFilterFactory"/>
174
+ </analyzer>
175
+ </fieldType>
176
+ </types>
177
+
178
+
179
+ <fields>
180
+ <!-- If you remove this field, you must _also_ disable the update log in solrconfig.xml
181
+ or Solr won't start. _version_ and update log are required for SolrCloud
182
+ -->
183
+ <field name="_version_" type="long" indexed="true" stored="true"/>
184
+
185
+ <field name="id" type="string" stored="true" indexed="true" multiValued="false" required="true"/>
186
+ <field name="timestamp" type="date" indexed="true" stored="true" default="NOW" multiValued="false"/>
187
+
188
+ <field name="lat" type="tdouble" stored="true" indexed="true" multiValued="false"/>
189
+ <field name="lng" type="tdouble" stored="true" indexed="true" multiValued="false"/>
190
+
191
+ <!-- NOTE: not all possible Solr field types are represented in the dynamic fields -->
192
+
193
+ <!-- text (_t...) -->
194
+ <dynamicField name="*_ti" type="text" stored="false" indexed="true" multiValued="false"/>
195
+ <dynamicField name="*_tim" type="text" stored="false" indexed="true" multiValued="true"/>
196
+ <dynamicField name="*_ts" type="text" stored="true" indexed="false" multiValued="false"/>
197
+ <dynamicField name="*_tsm" type="text" stored="true" indexed="false" multiValued="true"/>
198
+ <dynamicField name="*_tsi" type="text" stored="true" indexed="true" multiValued="false"/>
199
+ <dynamicField name="*_tsim" type="text" stored="true" indexed="true" multiValued="true"/>
200
+ <dynamicField name="*_tiv" type="text" stored="false" indexed="true" multiValued="false" termVectors="true" termPositions="true" termOffsets="true"/>
201
+ <dynamicField name="*_timv" type="text" stored="false" indexed="true" multiValued="true" termVectors="true" termPositions="true" termOffsets="true"/>
202
+ <dynamicField name="*_tsiv" type="text" stored="true" indexed="true" multiValued="false" termVectors="true" termPositions="true" termOffsets="true"/>
203
+ <dynamicField name="*_tsimv" type="text" stored="true" indexed="true" multiValued="true" termVectors="true" termPositions="true" termOffsets="true"/>
204
+
205
+ <!-- English text (_te...) -->
206
+ <dynamicField name="*_tei" type="text_en" stored="false" indexed="true" multiValued="false"/>
207
+ <dynamicField name="*_teim" type="text_en" stored="false" indexed="true" multiValued="true"/>
208
+ <dynamicField name="*_tes" type="text_en" stored="true" indexed="false" multiValued="false"/>
209
+ <dynamicField name="*_tesm" type="text_en" stored="true" indexed="false" multiValued="true"/>
210
+ <dynamicField name="*_tesi" type="text_en" stored="true" indexed="true" multiValued="false"/>
211
+ <dynamicField name="*_tesim" type="text_en" stored="true" indexed="true" multiValued="true"/>
212
+ <dynamicField name="*_teiv" type="text_en" stored="false" indexed="true" multiValued="false" termVectors="true" termPositions="true" termOffsets="true"/>
213
+ <dynamicField name="*_teimv" type="text_en" stored="false" indexed="true" multiValued="true" termVectors="true" termPositions="true" termOffsets="true"/>
214
+ <dynamicField name="*_tesiv" type="text_en" stored="true" indexed="true" multiValued="false" termVectors="true" termPositions="true" termOffsets="true"/>
215
+ <dynamicField name="*_tesimv" type="text_en" stored="true" indexed="true" multiValued="true" termVectors="true" termPositions="true" termOffsets="true"/>
216
+
217
+ <!-- string (_s...) -->
218
+ <dynamicField name="*_si" type="string" stored="false" indexed="true" multiValued="false"/>
219
+ <dynamicField name="*_sim" type="string" stored="false" indexed="true" multiValued="true"/>
220
+ <dynamicField name="*_ss" type="string" stored="true" indexed="false" multiValued="false"/>
221
+ <dynamicField name="*_ssm" type="string" stored="true" indexed="false" multiValued="true"/>
222
+ <dynamicField name="*_ssi" type="string" stored="true" indexed="true" multiValued="false"/>
223
+ <dynamicField name="*_ssim" type="string" stored="true" indexed="true" multiValued="true"/>
224
+ <dynamicField name="*_ssort" type="alphaSort" stored="false" indexed="true" multiValued="false"/>
225
+
226
+ <!-- integer (_i...) -->
227
+ <dynamicField name="*_ii" type="int" stored="false" indexed="true" multiValued="false"/>
228
+ <dynamicField name="*_iim" type="int" stored="false" indexed="true" multiValued="true"/>
229
+ <dynamicField name="*_is" type="int" stored="true" indexed="false" multiValued="false"/>
230
+ <dynamicField name="*_ism" type="int" stored="true" indexed="false" multiValued="true"/>
231
+ <dynamicField name="*_isi" type="int" stored="true" indexed="true" multiValued="false"/>
232
+ <dynamicField name="*_isim" type="int" stored="true" indexed="true" multiValued="true"/>
233
+
234
+ <!-- trie integer (_it...) (for faster range queries) -->
235
+ <dynamicField name="*_iti" type="tint" stored="false" indexed="true" multiValued="false"/>
236
+ <dynamicField name="*_itim" type="tint" stored="false" indexed="true" multiValued="true"/>
237
+ <dynamicField name="*_its" type="tint" stored="true" indexed="false" multiValued="false"/>
238
+ <dynamicField name="*_itsm" type="tint" stored="true" indexed="false" multiValued="true"/>
239
+ <dynamicField name="*_itsi" type="tint" stored="true" indexed="true" multiValued="false"/>
240
+ <dynamicField name="*_itsim" type="tint" stored="true" indexed="true" multiValued="true"/>
241
+
242
+ <!-- date (_dt...) -->
243
+ <!-- The format for this date field is of the form 1995-12-31T23:59:59Z
244
+ Optional fractional seconds are allowed: 1995-12-31T23:59:59.999Z -->
245
+ <dynamicField name="*_dti" type="date" stored="false" indexed="true" multiValued="false"/>
246
+ <dynamicField name="*_dtim" type="date" stored="false" indexed="true" multiValued="true"/>
247
+ <dynamicField name="*_dts" type="date" stored="true" indexed="false" multiValued="false"/>
248
+ <dynamicField name="*_dtsm" type="date" stored="true" indexed="false" multiValued="true"/>
249
+ <dynamicField name="*_dtsi" type="date" stored="true" indexed="true" multiValued="false"/>
250
+ <dynamicField name="*_dtsim" type="date" stored="true" indexed="true" multiValued="true"/>
251
+
252
+ <!-- trie date (_dtt...) (for faster range queries) -->
253
+ <dynamicField name="*_dtti" type="tdate" stored="false" indexed="true" multiValued="false"/>
254
+ <dynamicField name="*_dttim" type="tdate" stored="false" indexed="true" multiValued="true"/>
255
+ <dynamicField name="*_dtts" type="tdate" stored="true" indexed="false" multiValued="false"/>
256
+ <dynamicField name="*_dttsm" type="tdate" stored="true" indexed="false" multiValued="true"/>
257
+ <dynamicField name="*_dttsi" type="tdate" stored="true" indexed="true" multiValued="false"/>
258
+ <dynamicField name="*_dttsim" type="tdate" stored="true" indexed="true" multiValued="true"/>
259
+
260
+ <!-- long (_l...) -->
261
+ <dynamicField name="*_li" type="long" stored="false" indexed="true" multiValued="false"/>
262
+ <dynamicField name="*_lim" type="long" stored="false" indexed="true" multiValued="true"/>
263
+ <dynamicField name="*_ls" type="long" stored="true" indexed="false" multiValued="false"/>
264
+ <dynamicField name="*_lsm" type="long" stored="true" indexed="false" multiValued="true"/>
265
+ <dynamicField name="*_lsi" type="long" stored="true" indexed="true" multiValued="false"/>
266
+ <dynamicField name="*_lsim" type="long" stored="true" indexed="true" multiValued="true"/>
267
+
268
+ <!-- trie long (_lt...) (for faster range queries) -->
269
+ <dynamicField name="*_lti" type="tlong" stored="false" indexed="true" multiValued="false"/>
270
+ <dynamicField name="*_ltim" type="tlong" stored="false" indexed="true" multiValued="true"/>
271
+ <dynamicField name="*_lts" type="tlong" stored="true" indexed="false" multiValued="false"/>
272
+ <dynamicField name="*_ltsm" type="tlong" stored="true" indexed="false" multiValued="true"/>
273
+ <dynamicField name="*_ltsi" type="tlong" stored="true" indexed="true" multiValued="false"/>
274
+ <dynamicField name="*_ltsim" type="tlong" stored="true" indexed="true" multiValued="true"/>
275
+
276
+ <!-- double (_db...) -->
277
+ <dynamicField name="*_dbi" type="double" stored="false" indexed="true" multiValued="false"/>
278
+ <dynamicField name="*_dbim" type="double" stored="false" indexed="true" multiValued="true"/>
279
+ <dynamicField name="*_dbs" type="double" stored="true" indexed="false" multiValued="false"/>
280
+ <dynamicField name="*_dbsm" type="double" stored="true" indexed="false" multiValued="true"/>
281
+ <dynamicField name="*_dbsi" type="double" stored="true" indexed="true" multiValued="false"/>
282
+ <dynamicField name="*_dbsim" type="double" stored="true" indexed="true" multiValued="true"/>
283
+
284
+ <!-- trie double (_dbt...) (for faster range queries) -->
285
+ <dynamicField name="*_dbti" type="tdouble" stored="false" indexed="true" multiValued="false"/>
286
+ <dynamicField name="*_dbtim" type="tdouble" stored="false" indexed="true" multiValued="true"/>
287
+ <dynamicField name="*_dbts" type="tdouble" stored="true" indexed="false" multiValued="false"/>
288
+ <dynamicField name="*_dbtsm" type="tdouble" stored="true" indexed="false" multiValued="true"/>
289
+ <dynamicField name="*_dbtsi" type="tdouble" stored="true" indexed="true" multiValued="false"/>
290
+ <dynamicField name="*_dbtsim" type="tdouble" stored="true" indexed="true" multiValued="true"/>
291
+
292
+ <!-- float (_f...) -->
293
+ <dynamicField name="*_fi" type="float" stored="false" indexed="true" multiValued="false"/>
294
+ <dynamicField name="*_fim" type="float" stored="false" indexed="true" multiValued="true"/>
295
+ <dynamicField name="*_fs" type="float" stored="true" indexed="false" multiValued="false"/>
296
+ <dynamicField name="*_fsm" type="float" stored="true" indexed="false" multiValued="true"/>
297
+ <dynamicField name="*_fsi" type="float" stored="true" indexed="true" multiValued="false"/>
298
+ <dynamicField name="*_fsim" type="float" stored="true" indexed="true" multiValued="true"/>
299
+
300
+ <!-- trie float (_ft...) (for faster range queries) -->
301
+ <dynamicField name="*_fti" type="tfloat" stored="false" indexed="true" multiValued="false"/>
302
+ <dynamicField name="*_ftim" type="tfloat" stored="false" indexed="true" multiValued="true"/>
303
+ <dynamicField name="*_fts" type="tfloat" stored="true" indexed="false" multiValued="false"/>
304
+ <dynamicField name="*_ftsm" type="tfloat" stored="true" indexed="false" multiValued="true"/>
305
+ <dynamicField name="*_ftsi" type="tfloat" stored="true" indexed="true" multiValued="false"/>
306
+ <dynamicField name="*_ftsim" type="tfloat" stored="true" indexed="true" multiValued="true"/>
307
+
308
+ <!-- boolean (_b...) -->
309
+ <dynamicField name="*_bi" type="boolean" stored="false" indexed="true" multiValued="false"/>
310
+ <dynamicField name="*_bs" type="boolean" stored="true" indexed="false" multiValued="false"/>
311
+ <dynamicField name="*_bsi" type="boolean" stored="true" indexed="true" multiValued="false"/>
312
+
313
+ <!-- Type used to index the lat and lon components for the "location" FieldType -->
314
+ <dynamicField name="*_coordinate" type="tdouble" indexed="true" stored="false" />
315
+
316
+ <!-- location (_ll...) -->
317
+ <dynamicField name="*_lli" type="location" stored="false" indexed="true" multiValued="false"/>
318
+ <dynamicField name="*_llim" type="location" stored="false" indexed="true" multiValued="true"/>
319
+ <dynamicField name="*_lls" type="location" stored="true" indexed="false" multiValued="false"/>
320
+ <dynamicField name="*_llsm" type="location" stored="true" indexed="false" multiValued="true"/>
321
+ <dynamicField name="*_llsi" type="location" stored="true" indexed="true" multiValued="false"/>
322
+ <dynamicField name="*_llsim" type="location" stored="true" indexed="true" multiValued="true"/>
323
+
324
+ <dynamicField name="*suggest" type="textSuggest" indexed="true" stored="false" multiValued="true" />
325
+
326
+ <!-- you must define copyField source and dest fields explicity or schemaBrowser doesn't work -->
327
+ <field name="all_text_timv" type="text" stored="false" indexed="true" multiValued="true" termVectors="true" termPositions="true" termOffsets="true"/>
328
+
329
+
330
+ </fields>
331
+
332
+ <!-- Field to use to determine and enforce document uniqueness.
333
+ Unless this field is marked with required="false", it will be a required field
334
+ -->
335
+ <uniqueKey>id</uniqueKey>
336
+
337
+ <!-- copyField commands copy one field to another at the time a document
338
+ is added to the index. It's used either to index the same field differently,
339
+ or to add multiple fields to the same field for easier/faster searching. -->
340
+ <!-- Copy Fields -->
341
+
342
+ <!-- Above, multiple source fields are copied to the [text] field.
343
+ Another way to map multiple source fields to the same
344
+ destination field is to use the dynamic field syntax.
345
+ copyField also supports a maxChars to copy setting. -->
346
+
347
+ <!-- <copyField source="*_tesim" dest="all_text_timv" maxChars="3000"/> -->
348
+ <!-- for suggestions -->
349
+ <copyField source="*_tesim" dest="suggest"/>
350
+ <copyField source="*_ssim" dest="suggest"/>
351
+
352
+ <!-- Similarity is the scoring routine for each document vs. a query.
353
+ A custom similarity may be specified here, but the default is fine
354
+ for most applications. -->
355
+ <!-- <similarity class="org.apache.lucene.search.DefaultSimilarity"/> -->
356
+ <!-- ... OR ...
357
+ Specify a SimilarityFactory class name implementation
358
+ allowing parameters to be used.
359
+ -->
360
+ <!--
361
+ <similarity class="com.example.solr.CustomSimilarityFactory">
362
+ <str name="paramkey">param value</str>
363
+ </similarity>
364
+ -->
365
+
366
+ </schema>
@@ -0,0 +1,24 @@
1
+ # Licensed to the Apache Software Foundation (ASF) under one or more
2
+ # contributor license agreements. See the NOTICE file distributed with
3
+ # this work for additional information regarding copyright ownership.
4
+ # The ASF licenses this file to You under the Apache License, Version 2.0
5
+ # (the "License"); you may not use this file except in compliance with
6
+ # the License. You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
15
+
16
+ user=
17
+ solr_hostname=localhost
18
+ solr_port=8983
19
+ rsyncd_port=18983
20
+ data_dir=
21
+ webapp_name=solr
22
+ master_host=
23
+ master_data_dir=
24
+ master_status_dir=
@@ -0,0 +1,322 @@
1
+ <?xml version="1.0" encoding="UTF-8" ?>
2
+ <!--
3
+ Licensed to the Apache Software Foundation (ASF) under one or more
4
+ contributor license agreements. See the NOTICE file distributed with
5
+ this work for additional information regarding copyright ownership.
6
+ The ASF licenses this file to You under the Apache License, Version 2.0
7
+ (the "License"); you may not use this file except in compliance with
8
+ the License. You may obtain a copy of the License at
9
+
10
+ http://www.apache.org/licenses/LICENSE-2.0
11
+
12
+ Unless required by applicable law or agreed to in writing, software
13
+ distributed under the License is distributed on an "AS IS" BASIS,
14
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
15
+ See the License for the specific language governing permissions and
16
+ limitations under the License.
17
+ -->
18
+
19
+ <!--
20
+ This is a stripped down config file used for a simple example...
21
+ It is *not* a good example to work from.
22
+ -->
23
+ <config>
24
+
25
+ <!-- Controls what version of Lucene various components of Solr
26
+ adhere to. Generally, you want to use the latest version to
27
+ get all bug fixes and improvements. It is highly recommended
28
+ that you fully re-index after changing this setting as it can
29
+ affect both how text is indexed and queried.
30
+ -->
31
+ <luceneMatchVersion>5.0.0</luceneMatchVersion>
32
+
33
+ <lib dir="${solr.install.dir:../../../..}/contrib/analysis-extras/lib" />
34
+ <lib dir="${solr.install.dir:../../../..}/contrib/analysis-extras/lucene-libs" />
35
+ <lib dir="${solr.install.dir:../../../..}/contrib/extraction/lib" regex=".*\.jar" />
36
+ <lib dir="${solr.install.dir:../../../..}/dist/" regex="solr-cell-\d.*\.jar" />
37
+
38
+ <directoryFactory name="DirectoryFactory"
39
+ class="${solr.directoryFactory:solr.NRTCachingDirectoryFactory}">
40
+ </directoryFactory>
41
+
42
+ <codecFactory class="solr.SchemaCodecFactory"/>
43
+
44
+ <schemaFactory class="ClassicIndexSchemaFactory"/>
45
+
46
+
47
+ <dataDir>${solr.blacklight-core.data.dir:}</dataDir>
48
+
49
+ <requestDispatcher handleSelect="true" >
50
+ <requestParsers enableRemoteStreaming="false" multipartUploadLimitInKB="2048000" />
51
+ </requestDispatcher>
52
+
53
+ <requestHandler name="/analysis/field" startup="lazy" class="solr.FieldAnalysisRequestHandler" />
54
+
55
+ <!-- config for the admin interface -->
56
+ <admin>
57
+ <defaultQuery>*:*</defaultQuery>
58
+ </admin>
59
+
60
+ <updateHandler class="solr.DirectUpdateHandler2">
61
+ <updateLog>
62
+ <str name="dir">${solr.ulog.dir:}</str>
63
+ </updateLog>
64
+
65
+ <autoCommit>
66
+ <maxTime>${solr.autoCommit.maxTime:15000}</maxTime>
67
+ <openSearcher>false</openSearcher>
68
+ </autoCommit>
69
+
70
+ <autoSoftCommit>
71
+ <maxTime>${solr.autoSoftCommit.maxTime:-1}</maxTime>
72
+ </autoSoftCommit>
73
+ </updateHandler>
74
+
75
+ <!-- SearchHandler
76
+
77
+ http://wiki.apache.org/solr/SearchHandler
78
+
79
+ For processing Search Queries, the primary Request Handler
80
+ provided with Solr is "SearchHandler" It delegates to a sequent
81
+ of SearchComponents (see below) and supports distributed
82
+ queries across multiple shards
83
+ -->
84
+ <requestHandler name="search" class="solr.SearchHandler" default="true">
85
+ <!-- default values for query parameters can be specified, these
86
+ will be overridden by parameters in the request
87
+ -->
88
+ <lst name="defaults">
89
+ <str name="defType">edismax</str>
90
+ <str name="echoParams">explicit</str>
91
+ <str name="q.alt">*:*</str>
92
+ <str name="mm">2&lt;-1 5&lt;-2 6&lt;90%</str>
93
+ <int name="qs">1</int>
94
+ <int name="ps">2</int>
95
+ <float name="tie">0.01</float>
96
+ <!-- this qf and pf are used by default, if not otherwise specified by
97
+ client. The default blacklight_config will use these for the
98
+ "keywords" search. See the author_qf/author_pf, title_qf, etc
99
+ below, which the default blacklight_config will specify for
100
+ those searches. You may also be interested in:
101
+ http://wiki.apache.org/solr/LocalParams
102
+ -->
103
+ <str name="qf">
104
+ id
105
+ title_tesim
106
+ author_tesim
107
+ subject_tesim
108
+ </str>
109
+ <str name="pf">
110
+ all_text_timv^10
111
+ </str>
112
+
113
+ <str name="author_qf">
114
+ author_tesim
115
+ </str>
116
+ <str name="author_pf">
117
+ </str>
118
+ <str name="title_qf">
119
+ title_tesim
120
+ </str>
121
+ <str name="title_pf">
122
+ </str>
123
+ <str name="subject_qf">
124
+ subject_tesim
125
+ </str>
126
+ <str name="subject_pf">
127
+ </str>
128
+
129
+ <str name="fl">
130
+ *,
131
+ score
132
+ </str>
133
+
134
+ <str name="facet">true</str>
135
+ <str name="facet.mincount">1</str>
136
+
137
+ <str name="spellcheck">true</str>
138
+ <str name="spellcheck.dictionary">default</str>
139
+ <str name="spellcheck.onlyMorePopular">true</str>
140
+ <str name="spellcheck.extendedResults">true</str>
141
+ <str name="spellcheck.collate">false</str>
142
+ <str name="spellcheck.count">5</str>
143
+
144
+ </lst>
145
+ <arr name="last-components">
146
+ <str>spellcheck</str>
147
+ </arr>
148
+ </requestHandler>
149
+
150
+ <requestHandler name="permissions" class="solr.SearchHandler" >
151
+ <lst name="defaults">
152
+ <str name="facet">off</str>
153
+ <str name="echoParams">all</str>
154
+ <str name="rows">1</str>
155
+ <str name="q">{!raw f=id v=$id}</str> <!-- use id=666 instead of q=id:666 -->
156
+ <str name="fl">
157
+ id,
158
+ access_ssim,
159
+ discover_access_group_ssim,discover_access_person_ssim,
160
+ read_access_group_ssim,read_access_person_ssim,
161
+ edit_access_group_ssim,edit_access_person_ssim,
162
+ depositor_ti,
163
+ embargo_release_date_dtsi
164
+ inheritable_access_ssim,
165
+ inheritable_discover_access_group_ssim,inheritable_discover_access_person_ssim,
166
+ inheritable_read_access_group_ssim,inheritable_read_access_person_ssim,
167
+ inheritable_edit_access_group_ssim,inheritable_edit_access_person_ssim,
168
+ inheritable_embargo_release_date_dtsi
169
+ </str>
170
+ </lst>
171
+ </requestHandler>
172
+
173
+ <requestHandler name="standard" class="solr.SearchHandler">
174
+ <lst name="defaults">
175
+ <str name="echoParams">explicit</str>
176
+ <str name="defType">lucene</str>
177
+ </lst>
178
+ </requestHandler>
179
+
180
+ <!-- for requests to get a single document; use id=666 instead of q=id:666 -->
181
+ <requestHandler name="document" class="solr.SearchHandler" >
182
+ <lst name="defaults">
183
+ <str name="echoParams">all</str>
184
+ <str name="fl">*</str>
185
+ <str name="rows">1</str>
186
+ <str name="q">{!term f=id v=$id}</str> <!-- use id=666 instead of q=id:666 -->
187
+ </lst>
188
+ </requestHandler>
189
+
190
+ <searchComponent name="termsComponent" class="solr.TermsComponent" />
191
+
192
+ <requestHandler name="/terms" class="solr.SearchHandler">
193
+ <lst name="defaults">
194
+ <bool name="terms">true</bool>
195
+ </lst>
196
+ <arr name="components">
197
+ <str>termsComponent</str>
198
+ </arr>
199
+ </requestHandler>
200
+
201
+ <!-- Spell Check
202
+
203
+ The spell check component can return a list of alternative spelling
204
+ suggestions.
205
+
206
+ http://wiki.apache.org/solr/SpellCheckComponent
207
+ -->
208
+ <searchComponent name="spellcheck" class="solr.SpellCheckComponent">
209
+
210
+ <str name="queryAnalyzerFieldType">textSpell</str>
211
+
212
+ <!-- Multiple "Spell Checkers" can be declared and used by this
213
+ component
214
+ -->
215
+
216
+ <!-- a spellchecker built from a field of the main index, and
217
+ written to disk
218
+ -->
219
+ <lst name="spellchecker">
220
+ <str name="name">default</str>
221
+ <str name="field">spell</str>
222
+ <str name="spellcheckIndexDir">./spell</str>
223
+ <str name="buildOnOptimize">true</str>
224
+ </lst>
225
+ <lst name="spellchecker">
226
+ <str name="name">author</str>
227
+ <str name="field">author_spell</str>
228
+ <str name="spellcheckIndexDir">./spell_author</str>
229
+ <str name="accuracy">0.7</str>
230
+ <str name="buildOnOptimize">true</str>
231
+ </lst>
232
+ <lst name="spellchecker">
233
+ <str name="name">subject</str>
234
+ <str name="field">subject_spell</str>
235
+ <str name="spellcheckIndexDir">./spell_subject</str>
236
+ <str name="accuracy">0.7</str>
237
+ <str name="buildOnOptimize">true</str>
238
+ </lst>
239
+ <lst name="spellchecker">
240
+ <str name="name">title</str>
241
+ <str name="field">title_spell</str>
242
+ <str name="spellcheckIndexDir">./spell_title</str>
243
+ <str name="accuracy">0.7</str>
244
+ <str name="buildOnOptimize">true</str>
245
+ </lst>
246
+
247
+ <!-- a spellchecker that uses a different distance measure -->
248
+ <!--
249
+ <lst name="spellchecker">
250
+ <str name="name">jarowinkler</str>
251
+ <str name="field">spell</str>
252
+ <str name="distanceMeasure">
253
+ org.apache.lucene.search.spell.JaroWinklerDistance
254
+ </str>
255
+ <str name="spellcheckIndexDir">spellcheckerJaro</str>
256
+ </lst>
257
+ -->
258
+
259
+ <!-- a spellchecker that use an alternate comparator
260
+
261
+ comparatorClass be one of:
262
+ 1. score (default)
263
+ 2. freq (Frequency first, then score)
264
+ 3. A fully qualified class name
265
+ -->
266
+ <!--
267
+ <lst name="spellchecker">
268
+ <str name="name">freq</str>
269
+ <str name="field">lowerfilt</str>
270
+ <str name="spellcheckIndexDir">spellcheckerFreq</str>
271
+ <str name="comparatorClass">freq</str>
272
+ <str name="buildOnCommit">true</str>
273
+ -->
274
+
275
+ <!-- A spellchecker that reads the list of words from a file -->
276
+ <!--
277
+ <lst name="spellchecker">
278
+ <str name="classname">solr.FileBasedSpellChecker</str>
279
+ <str name="name">file</str>
280
+ <str name="sourceLocation">spellings.txt</str>
281
+ <str name="characterEncoding">UTF-8</str>
282
+ <str name="spellcheckIndexDir">spellcheckerFile</str>
283
+ </lst>
284
+ -->
285
+ </searchComponent>
286
+
287
+ <searchComponent name="suggest" class="solr.SuggestComponent">
288
+ <lst name="suggester">
289
+ <str name="name">mySuggester</str>
290
+ <str name="lookupImpl">FuzzyLookupFactory</str>
291
+ <str name="suggestAnalyzerFieldType">textSuggest</str>
292
+ <str name="buildOnCommit">true</str>
293
+ <str name="field">suggest</str>
294
+ </lst>
295
+ </searchComponent>
296
+
297
+ <requestHandler name="/suggest" class="solr.SearchHandler" startup="lazy">
298
+ <lst name="defaults">
299
+ <str name="suggest">true</str>
300
+ <str name="suggest.count">5</str>
301
+ <str name="suggest.dictionary">mySuggester</str>
302
+ </lst>
303
+ <arr name="components">
304
+ <str>suggest</str>
305
+ </arr>
306
+ </requestHandler>
307
+
308
+ <requestHandler name="/update/extract" class="org.apache.solr.handler.extraction.ExtractingRequestHandler">
309
+ <lst name="defaults">
310
+ <str name="fmap.Last-Modified">last_modified</str>
311
+ <str name="uprefix">ignored_</str>
312
+ </lst>
313
+ <!--Optional. Specify a path to a tika configuration file. See the Tika docs for details.-->
314
+ <!-- <str name="tika.config">/my/path/to/tika.config</str> -->
315
+ <!-- Optional. Specify one or more date formats to parse. See DateUtil.DEFAULT_DATE_FORMATS
316
+ for default date formats -->
317
+ <!-- <lst name="date.formats"> -->
318
+ <!-- <str>yyyy&#45;MM&#45;dd</str> -->
319
+ <!-- </lst> -->
320
+ </requestHandler>
321
+ </config>
322
+