warclight 0.6.3 → 0.7.0

Sign up to get free protection for your applications and to get access to all the features.
@@ -1,4 +1,4 @@
1
- <?xml version="1.0" encoding="UTF-8"?>
1
+ <?xml version="1.0" encoding="UTF-8" ?>
2
2
  <!--
3
3
  Licensed to the Apache Software Foundation (ASF) under one or more
4
4
  contributor license agreements. See the NOTICE file distributed with
@@ -16,192 +16,1151 @@
16
16
  limitations under the License.
17
17
  -->
18
18
 
19
- <!-- Sample Warclight Solr config to work from. -->
19
+ <!--
20
+ For more details about configurations options that may appear in
21
+ this file, see http://wiki.apache.org/solr/SolrConfigXml.
22
+ -->
20
23
  <config>
21
- <luceneMatchVersion>6.6.0</luceneMatchVersion>
24
+ <!-- In all configuration below, a prefix of "solr." for class names
25
+ is an alias that causes solr to search appropriate packages,
26
+ including org.apache.solr.(search|update|request|core|analysis)
27
+
28
+ You may also specify a fully qualified Java classname if you
29
+ have your own custom plugins.
30
+ -->
31
+
32
+ <!-- Controls what version of Lucene various components of Solr
33
+ adhere to. Generally, you want to use the latest version to
34
+ get all bug fixes and improvements. It is highly recommended
35
+ that you fully re-index after changing this setting as it can
36
+ affect both how text is indexed and queried.
37
+ -->
38
+ <luceneMatchVersion>7.0.1</luceneMatchVersion>
39
+
40
+ <!-- <lib/> directives can be used to instruct Solr to load an Jars
41
+ identified and use them to resolve any "plugins" specified in
42
+ your solrconfig.xml or schema.xml (ie: Analyzers, Request
43
+ Handlers, etc...).
44
+
45
+ All directories and paths are resolved relative to the
46
+ instanceDir.
47
+
48
+ Please note that <lib/> directives are processed in the order
49
+ that they appear in your solrconfig.xml file, and are "stacked"
50
+ on top of each other when building a ClassLoader - so if you have
51
+ plugin jars with dependencies on other jars, the "lower level"
52
+ dependency jars should be loaded first.
53
+
54
+ If a "./lib" directory exists in your instanceDir, all files
55
+ found in it are included as if you had used the following
56
+ syntax...
57
+
58
+ <lib dir="./lib" />
59
+ -->
60
+
61
+ <!-- A 'dir' option by itself adds any files found in the directory
62
+ to the classpath, this is useful for including all jars in a
63
+ directory.
64
+
65
+ When a 'regex' is specified in addition to a 'dir', only the
66
+ files in that directory which completely match the regex
67
+ (anchored on both ends) will be included.
68
+
69
+ If a 'dir' option (with or without a regex) is used and nothing
70
+ is found that matches, a warning will be logged.
71
+
72
+ The examples below can be used to load some solr-contribs along
73
+ with their external dependencies.
74
+ -->
75
+ <!-- BL commented out jar libs
76
+ <lib dir="../../../contrib/extraction/lib" regex=".*\.jar" />
77
+ <lib dir="../../../dist/" regex="solr-cell-\d.*\.jar" />
78
+
79
+ <lib dir="../../../contrib/clustering/lib/" regex=".*\.jar" />
80
+ <lib dir="../../../dist/" regex="solr-clustering-\d.*\.jar" />
81
+
82
+ <lib dir="../../../contrib/langid/lib/" regex=".*\.jar" />
83
+ <lib dir="../../../dist/" regex="solr-langid-\d.*\.jar" />
84
+
85
+ <lib dir="../../../contrib/velocity/lib" regex=".*\.jar" />
86
+ <lib dir="../../../dist/" regex="solr-velocity-\d.*\.jar" />
87
+ BL -->
22
88
 
23
- <lib dir="${solr.install.dir:../../../..}/contrib/extraction/lib" regex=".*\.jar"/>
24
- <lib dir="${solr.install.dir:../../../..}/dist/" regex="solr-cell-\d.*\.jar"/>
25
- <lib dir="${solr.install.dir:../../../..}/contrib/clustering/lib/" regex=".*\.jar"/>
26
- <lib dir="${solr.install.dir:../../../..}/dist/" regex="solr-clustering-\d.*\.jar"/>
27
- <lib dir="${solr.install.dir:../../../..}/contrib/langid/lib/" regex=".*\.jar"/>
28
- <lib dir="${solr.install.dir:../../../..}/dist/" regex="solr-langid-\d.*\.jar"/>
29
- <lib dir="${solr.install.dir:../../../..}/contrib/velocity/lib" regex=".*\.jar"/>
30
- <lib dir="${solr.install.dir:../../../..}/dist/" regex="solr-velocity-\d.*\.jar"/>
89
+ <!-- an exact 'path' can be used instead of a 'dir' to specify a
90
+ specific jar file. This will cause a serious error to be logged
91
+ if it can't be loaded.
92
+ -->
93
+ <!--
94
+ <lib path="../a-jar-that-does-not-exist.jar" />
95
+ -->
96
+
97
+ <!-- Data Directory
31
98
 
99
+ Used to specify an alternate directory to hold all index data
100
+ other than the default ./data under the Solr home. If
101
+ replication is in use, this should match the replication
102
+ configuration.
103
+ -->
32
104
  <dataDir>${solr.data.dir:}</dataDir>
33
105
 
34
- <directoryFactory name="DirectoryFactory" class="${solr.directoryFactory:solr.NRTCachingDirectoryFactory}"/>
35
106
 
107
+ <!-- The DirectoryFactory to use for indexes.
108
+
109
+ solr.StandardDirectoryFactory is filesystem
110
+ based and tries to pick the best implementation for the current
111
+ JVM and platform. solr.NRTCachingDirectoryFactory, the default,
112
+ wraps solr.StandardDirectoryFactory and caches small files in memory
113
+ for better NRT performance.
114
+
115
+ One can force a particular implementation via solr.MMapDirectoryFactory,
116
+ solr.NIOFSDirectoryFactory, or solr.SimpleFSDirectoryFactory.
117
+
118
+ solr.RAMDirectoryFactory is memory based, not
119
+ persistent, and doesn't work with replication.
120
+ -->
121
+ <!-- BL changed directoryFactory to MMapDirectoryFactory -->
122
+ <directoryFactory name="DirectoryFactory"
123
+ class="${solr.directoryFactory:solr.NIOFSDirectoryFactory}">
124
+ <!-- BL -->
125
+
126
+
127
+ <!-- These will be used if you are using the solr.HdfsDirectoryFactory,
128
+ otherwise they will be ignored. If you don't plan on using hdfs,
129
+ you can safely remove this section. -->
130
+ <!-- The root directory that collection data should be written to. -->
131
+ <str name="solr.hdfs.home">${solr.hdfs.home:}</str>
132
+ <!-- The hadoop configuration files to use for the hdfs client. -->
133
+ <str name="solr.hdfs.confdir">${solr.hdfs.confdir:}</str>
134
+ <!-- Enable/Disable the hdfs cache. -->
135
+ <str name="solr.hdfs.blockcache.enabled">${solr.hdfs.blockcache.enabled:true}</str>
136
+
137
+ </directoryFactory>
138
+
139
+ <!-- The CodecFactory for defining the format of the inverted index.
140
+ The default implementation is SchemaCodecFactory, which is the official Lucene
141
+ index format, but hooks into the schema to provide per-field customization of
142
+ the postings lists and per-document values in the fieldType element
143
+ (postingsFormat/docValuesFormat). Note that most of the alternative implementations
144
+ are experimental, so if you choose to customize the index format, its a good
145
+ idea to convert back to the official format e.g. via IndexWriter.addIndexes(IndexReader)
146
+ before upgrading to a newer version to avoid unnecessary reindexing.
147
+ -->
36
148
  <codecFactory class="solr.SchemaCodecFactory"/>
37
149
 
150
+ <!-- To enable dynamic schema REST APIs, use the following for <schemaFactory>:
151
+
152
+ <schemaFactory class="ManagedIndexSchemaFactory">
153
+ <bool name="mutable">true</bool>
154
+ <str name="managedSchemaResourceName">managed-schema</str>
155
+ </schemaFactory>
156
+
157
+ When ManagedIndexSchemaFactory is specified, Solr will load the schema from
158
+ he resource named in 'managedSchemaResourceName', rather than from schema.xml.
159
+ Note that the managed schema resource CANNOT be named schema.xml. If the managed
160
+ schema does not exist, Solr will create it after reading schema.xml, then rename
161
+ 'schema.xml' to 'schema.xml.bak'.
162
+
163
+ Do NOT hand edit the managed schema - external modifications will be ignored and
164
+ overwritten as a result of schema modification REST API calls.
165
+
166
+ When ManagedIndexSchemaFactory is specified with mutable = true, schema
167
+ modification REST API calls will be allowed; otherwise, error responses will be
168
+ sent back for these requests.
169
+ -->
38
170
  <schemaFactory class="ClassicIndexSchemaFactory"/>
39
171
 
172
+ <!-- ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
173
+ Index Config - These settings control low-level behavior of indexing
174
+ Most example settings here show the default value, but are commented
175
+ out, to more easily see where customizations have been made.
176
+
177
+ Note: This replaces <indexDefaults> and <mainIndex> from older versions
178
+ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ -->
40
179
  <indexConfig>
180
+ <!-- maxFieldLength was removed in 4.0. To get similar behavior, include a
181
+ LimitTokenCountFilterFactory in your fieldType definition. E.g.
182
+ <filter class="solr.LimitTokenCountFilterFactory" maxTokenCount="10000"/>
183
+ -->
184
+ <!-- Maximum time to wait for a write lock (ms) for an IndexWriter. Default: 1000 -->
185
+ <!-- <writeLockTimeout>1000</writeLockTimeout> -->
186
+
187
+ <!-- The maximum number of simultaneous threads that may be
188
+ indexing documents at once in IndexWriter; if more than this
189
+ many threads arrive they will wait for others to finish.
190
+ Default in Solr/Lucene is 8. -->
191
+ <!-- <maxIndexingThreads>8</maxIndexingThreads> -->
192
+
193
+ <!-- Expert: Enabling compound file will use less files for the index,
194
+ using fewer file descriptors on the expense of performance decrease.
195
+ Default in Lucene is "true". Default in Solr is "false" (since 3.6) -->
196
+ <!-- <useCompoundFile>false</useCompoundFile> -->
197
+
198
+ <!-- ramBufferSizeMB sets the amount of RAM that may be used by Lucene
199
+ indexing for buffering added documents and deletions before they are
200
+ flushed to the Directory.
201
+ maxBufferedDocs sets a limit on the number of documents buffered
202
+ before flushing.
203
+ If both ramBufferSizeMB and maxBufferedDocs is set, then
204
+ Lucene will flush based on whichever limit is hit first.
205
+ The default is 100 MB. -->
206
+ <ramBufferSizeMB>500</ramBufferSizeMB>
207
+ <maxBufferedDocs>1000</maxBufferedDocs>
208
+
209
+
210
+
211
+ <mergeScheduler class="org.apache.lucene.index.ConcurrentMergeScheduler"/>
212
+
213
+ <mergePolicyFactory class="org.apache.solr.index.TieredMergePolicyFactory">
214
+ <int name="maxMergeAtOnce">10</int>
215
+ <int name="segmentsPerTier">10</int>
216
+ </mergePolicyFactory>
217
+
218
+
219
+
220
+ <!-- LockFactory
221
+
222
+ This option specifies which Lucene LockFactory implementation
223
+ to use.
224
+
225
+ single = SingleInstanceLockFactory - suggested for a
226
+ read-only index or when there is no possibility of
227
+ another process trying to modify the index.
228
+ native = NativeFSLockFactory - uses OS native file locking.
229
+ Do not use when multiple solr webapps in the same
230
+ JVM are attempting to share a single index.
231
+ simple = SimpleFSLockFactory - uses a plain file for locking
232
+
233
+ Defaults: 'native' is default for Solr3.6 and later, otherwise
234
+ 'simple' is the default
235
+
236
+ More details on the nuances of each LockFactory...
237
+ http://wiki.apache.org/lucene-java/AvailableLockFactories
238
+ -->
41
239
  <lockType>${solr.lock.type:native}</lockType>
240
+
241
+ <!-- Unlock On Startup
242
+
243
+ If true, unlock any held write or commit locks on startup.
244
+ This defeats the locking mechanism that allows multiple
245
+ processes to safely access a lucene index, and should be used
246
+ with care. Default is "false".
247
+
248
+ This is not needed if lock type is 'single'
249
+ -->
250
+ <!--
251
+ <unlockOnStartup>false</unlockOnStartup>
252
+ -->
253
+
254
+ <!-- Expert: Controls how often Lucene loads terms into memory
255
+ Default is 128 and is likely good for most everyone.
256
+ -->
257
+ <!-- <termIndexInterval>128</termIndexInterval> -->
258
+
259
+ <!-- If true, IndexReaders will be opened/reopened from the IndexWriter
260
+ instead of from the Directory. Hosts in a master/slave setup
261
+ should have this set to false while those in a SolrCloud
262
+ cluster need to be set to true. Default: true
263
+ -->
264
+ <!--
265
+ <nrtMode>true</nrtMode>
266
+ -->
267
+
268
+ <!-- Commit Deletion Policy
269
+ Custom deletion policies can be specified here. The class must
270
+ implement org.apache.lucene.index.IndexDeletionPolicy.
271
+
272
+ The default Solr IndexDeletionPolicy implementation supports
273
+ deleting index commit points on number of commits, age of
274
+ commit point and optimized status.
275
+
276
+ The latest commit point should always be preserved regardless
277
+ of the criteria.
278
+ -->
279
+ <!--
280
+ <deletionPolicy class="solr.SolrDeletionPolicy">
281
+ -->
282
+ <!-- The number of commit points to be kept -->
283
+ <!-- <str name="maxCommitsToKeep">1</str> -->
284
+ <!-- The number of optimized commit points to be kept -->
285
+ <!-- <str name="maxOptimizedCommitsToKeep">0</str> -->
286
+ <!--
287
+ Delete all commit points once they have reached the given age.
288
+ Supports DateMathParser syntax e.g.
289
+ -->
290
+ <!--
291
+ <str name="maxCommitAge">30MINUTES</str>
292
+ <str name="maxCommitAge">1DAY</str>
293
+ -->
294
+ <!--
295
+ </deletionPolicy>
296
+ -->
297
+
298
+ <!-- Lucene Infostream
299
+
300
+ To aid in advanced debugging, Lucene provides an "InfoStream"
301
+ of detailed information when indexing.
302
+
303
+ Setting the value to true will instruct the underlying Lucene
304
+ IndexWriter to write its info stream to solr's log. By default,
305
+ this is enabled here, and controlled through log4j.properties.
306
+ -->
307
+ <infoStream>true</infoStream>
42
308
  </indexConfig>
43
309
 
310
+
311
+ <!-- JMX
312
+
313
+ This example enables JMX if and only if an existing MBeanServer
314
+ is found, use this if you want to configure JMX through JVM
315
+ parameters. Remove this to disable exposing Solr configuration
316
+ and statistics to JMX.
317
+
318
+ For more details see http://wiki.apache.org/solr/SolrJmx
319
+ -->
320
+ <jmx />
321
+ <!-- If you want to connect to a particular server, specify the
322
+ agentId
323
+ -->
324
+ <!-- <jmx agentId="myAgent" /> -->
325
+ <!-- If you want to start a new MBeanServer, specify the serviceUrl -->
326
+ <!-- <jmx serviceUrl="service:jmx:rmi:///jndi/rmi://localhost:9999/solr"/>
327
+ -->
328
+
44
329
  <!-- The default high-performance update handler -->
45
330
  <updateHandler class="solr.DirectUpdateHandler2">
331
+
332
+ <!-- Enables a transaction log, used for real-time get, durability, and
333
+ and solr cloud replica recovery. The log can grow as big as
334
+ uncommitted changes to the index, so use of a hard autoCommit
335
+ is recommended (see below).
336
+ "dir" - the target directory for transaction logs, defaults to the
337
+ solr data directory. -->
46
338
  <updateLog>
47
339
  <str name="dir">${solr.ulog.dir:}</str>
48
- <int name="numVersionBuckets">${solr.ulog.numVersionBuckets:65536}</int>
49
340
  </updateLog>
50
- <autoCommit>
51
- <maxTime>${solr.autoCommit.maxTime:15000}</maxTime>
52
- <openSearcher>false</openSearcher>
53
- </autoCommit>
341
+
342
+ <!-- AutoCommit
343
+
344
+ Perform a hard commit automatically under certain conditions.
345
+ Instead of enabling autoCommit, consider using "commitWithin"
346
+ when adding documents.
347
+
348
+ http://wiki.apache.org/solr/UpdateXmlMessages
349
+
350
+ maxDocs - Maximum number of documents to add since the last
351
+ commit before automatically triggering a new commit.
352
+
353
+ maxTime - Maximum amount of time in ms that is allowed to pass
354
+ since a document was added before automatically
355
+ triggering a new commit.
356
+ openSearcher - if false, the commit causes recent index changes
357
+ to be flushed to stable storage, but does not cause a new
358
+ searcher to be opened to make those changes visible.
359
+
360
+ If the updateLog is enabled, then it's highly recommended to
361
+ have some sort of hard autoCommit to limit the log size.
362
+ -->
363
+ <!-- As openSearcher==false, this is a relatively light process -->
364
+ <autoCommit>
365
+ <maxTime>${solr.autoCommit.maxTime:60000}</maxTime>
366
+ <openSearcher>false</openSearcher>
367
+ </autoCommit>
368
+
369
+ <!-- softAutoCommit is like autoCommit except it causes a
370
+ 'soft' commit which only ensures that changes are visible
371
+ but does not ensure that data is synced to disk. This is
372
+ faster and more near-realtime friendly than a hard commit.
373
+ -->
374
+ <!-- Re-open each 100 minutes. Softcommits can be very heavy if the index
375
+ is queried while indexing (or warmup is used with facets), so we want
376
+ this to be conservative.
377
+ https://github.com/ukwa/webarchive-discovery/issues/130 -->
378
+ <autoSoftCommit>
379
+ <maxTime>${solr.autoSoftCommit.maxTime:6000000}</maxTime>
380
+ </autoSoftCommit>
381
+
382
+ <!-- Update Related Event Listeners
383
+
384
+ Various IndexWriter related events can trigger Listeners to
385
+ take actions.
386
+
387
+ postCommit - fired after every commit or optimize command
388
+ postOptimize - fired after every optimize command
389
+ -->
390
+ <!-- The RunExecutableListener executes an external command from a
391
+ hook such as postCommit or postOptimize.
392
+
393
+ exe - the name of the executable to run
394
+ dir - dir to use as the current working directory. (default=".")
395
+ wait - the calling thread waits until the executable returns.
396
+ (default="true")
397
+ args - the arguments to pass to the program. (default is none)
398
+ env - environment variables to set. (default is none)
399
+ -->
400
+ <!-- This example shows how RunExecutableListener could be used
401
+ with the script based replication...
402
+ http://wiki.apache.org/solr/CollectionDistribution
403
+ -->
404
+ <!--
405
+ <listener event="postCommit" class="solr.RunExecutableListener">
406
+ <str name="exe">solr/bin/snapshooter</str>
407
+ <str name="dir">.</str>
408
+ <bool name="wait">true</bool>
409
+ <arr name="args"> <str>arg1</str> <str>arg2</str> </arr>
410
+ <arr name="env"> <str>MYVAR=val1</str> </arr>
411
+ </listener>
412
+ -->
413
+
54
414
  </updateHandler>
415
+
416
+ <!-- IndexReaderFactory
417
+
418
+ Use the following format to specify a custom IndexReaderFactory,
419
+ which allows for alternate IndexReader implementations.
420
+
421
+ ** Experimental Feature **
422
+
423
+ Please note - Using a custom IndexReaderFactory may prevent
424
+ certain other features from working. The API to
425
+ IndexReaderFactory may change without warning or may even be
426
+ removed from future releases if the problems cannot be
427
+ resolved.
428
+
429
+
430
+ ** Features that may not work with custom IndexReaderFactory **
55
431
 
432
+ The ReplicationHandler assumes a disk-resident index. Using a
433
+ custom IndexReader implementation may cause incompatibility
434
+ with ReplicationHandler and may cause replication to not work
435
+ correctly. See SOLR-1366 for details.
436
+
437
+ -->
438
+ <!--
439
+ <indexReaderFactory name="IndexReaderFactory" class="package.class">
440
+ <str name="someArg">Some Value</str>
441
+ </indexReaderFactory >
442
+ -->
443
+ <!-- By explicitly declaring the Factory, the termIndexDivisor can
444
+ be specified.
445
+ -->
446
+ <!--
447
+ <indexReaderFactory name="IndexReaderFactory"
448
+ class="solr.StandardIndexReaderFactory">
449
+ <int name="setTermIndexDivisor">12</int>
450
+ </indexReaderFactory >
451
+ -->
452
+
453
+ <!-- ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
454
+ Query section - these settings control query time things like caches
455
+ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ -->
56
456
  <query>
457
+ <!-- Max Boolean Clauses
458
+
459
+ Maximum number of clauses in each BooleanQuery, an exception
460
+ is thrown if exceeded.
461
+
462
+ ** WARNING **
463
+
464
+ This option actually modifies a global Lucene property that
465
+ will affect all SolrCores. If multiple solrconfig.xml files
466
+ disagree on this property, the value at any given moment will
467
+ be based on the last SolrCore to be initialized.
468
+
469
+ -->
57
470
  <maxBooleanClauses>1024</maxBooleanClauses>
58
- <filterCache class="solr.FastLRUCache" size="512" initialSize="512" autowarmCount="0"/>
59
- <queryResultCache class="solr.LRUCache" size="512" initialSize="512" autowarmCount="0"/>
60
- <documentCache class="solr.LRUCache" size="512" initialSize="512" autowarmCount="0"/>
61
- <cache name="perSegFilter" class="solr.search.LRUCache" size="10" initialSize="0" autowarmCount="10" regenerator="solr.NoOpRegenerator"/>
471
+
472
+
473
+ <!-- Solr Internal Query Caches
474
+
475
+ There are two implementations of cache available for Solr,
476
+ LRUCache, based on a synchronized LinkedHashMap, and
477
+ FastLRUCache, based on a ConcurrentHashMap.
478
+
479
+ FastLRUCache has faster gets and slower puts in single
480
+ threaded operation and thus is generally faster than LRUCache
481
+ when the hit ratio of the cache is high (> 75%), and may be
482
+ faster under other scenarios on multi-cpu systems.
483
+ -->
484
+
485
+ <!-- Filter Cache
486
+
487
+ Cache used by SolrIndexSearcher for filters (DocSets),
488
+ unordered sets of *all* documents that match a query. When a
489
+ new searcher is opened, its caches may be prepopulated or
490
+ "autowarmed" using data from caches in the old searcher.
491
+ autowarmCount is the number of items to prepopulate. For
492
+ LRUCache, the autowarmed items will be the most recently
493
+ accessed items.
494
+
495
+ Parameters:
496
+ class - the SolrCache implementation LRUCache or
497
+ (LRUCache or FastLRUCache)
498
+ size - the maximum number of entries in the cache
499
+ initialSize - the initial capacity (number of entries) of
500
+ the cache. (see java.util.HashMap)
501
+ autowarmCount - the number of entries to prepopulate from
502
+ and old cache.
503
+ -->
504
+ <!-- Worst-case for a filter entry is #total_docs_in_index/8 bytes so we
505
+ keep it fairly low in expectation of tens or hundreds of millions of
506
+ documents/shard. -->
507
+ <filterCache class="solr.FastLRUCache"
508
+ size="32"
509
+ initialSize="32"
510
+ autowarmCount="0"/>
511
+
512
+ <!-- Query Result Cache
513
+
514
+ Caches results of searches - ordered lists of document ids
515
+ (DocList) based on a query, a sort, and the range of documents requested.
516
+ -->
517
+ <queryResultCache class="solr.LRUCache"
518
+ size="512"
519
+ initialSize="512"
520
+ autowarmCount="0"/>
521
+
522
+ <!-- Document Cache
523
+
524
+ Caches Lucene Document objects (the stored fields for each
525
+ document). Since Lucene internal document ids are transient,
526
+ this cache will not be autowarmed.
527
+ -->
528
+ <!-- This is independent of index size -->
529
+ <documentCache class="solr.LRUCache"
530
+ size="512"
531
+ initialSize="512"
532
+ autowarmCount="0"/>
533
+
534
+ <!-- custom cache currently used by block join -->
535
+ <cache name="perSegFilter"
536
+ class="solr.search.LRUCache"
537
+ size="10"
538
+ initialSize="0"
539
+ autowarmCount="10"
540
+ regenerator="solr.NoOpRegenerator" />
541
+
542
+ <!-- Field Value Cache
543
+
544
+ Cache used to hold field values that are quickly accessible
545
+ by document id. The fieldValueCache is created by default
546
+ even if not configured here.
547
+ -->
548
+ <!--
549
+ <fieldValueCache class="solr.FastLRUCache"
550
+ size="512"
551
+ autowarmCount="128"
552
+ showItems="32" />
553
+ -->
554
+
555
+ <!-- Custom Cache
556
+
557
+ Example of a generic cache. These caches may be accessed by
558
+ name through SolrIndexSearcher.getCache(),cacheLookup(), and
559
+ cacheInsert(). The purpose is to enable easy caching of
560
+ user/application level data. The regenerator argument should
561
+ be specified as an implementation of solr.CacheRegenerator
562
+ if autowarming is desired.
563
+ -->
564
+ <!--
565
+ <cache name="myUserCache"
566
+ class="solr.LRUCache"
567
+ size="4096"
568
+ initialSize="1024"
569
+ autowarmCount="1024"
570
+ regenerator="com.mycompany.MyRegenerator"
571
+ />
572
+ -->
573
+
574
+
575
+ <!-- Lazy Field Loading
576
+
577
+ If true, stored fields that are not requested will be loaded
578
+ lazily. This can result in a significant speed improvement
579
+ if the usual case is to not load all stored fields,
580
+ especially if the skipped fields are large compressed text
581
+ fields.
582
+ -->
62
583
  <enableLazyFieldLoading>true</enableLazyFieldLoading>
63
- <queryResultWindowSize>20</queryResultWindowSize>
64
- <queryResultMaxDocsCached>200</queryResultMaxDocsCached>
584
+
585
+ <!-- Use Filter For Sorted Query
586
+
587
+ A possible optimization that attempts to use a filter to
588
+ satisfy a search. If the requested sort does not include
589
+ score, then the filterCache will be checked for a filter
590
+ matching the query. If found, the filter will be used as the
591
+ source of document ids, and then the sort will be applied to
592
+ that.
593
+
594
+ For most situations, this will not be useful unless you
595
+ frequently get the same search repeatedly with different sort
596
+ options, and none of them ever use "score"
597
+ -->
598
+ <!--
599
+ <useFilterForSortedQuery>true</useFilterForSortedQuery>
600
+ -->
601
+
602
+ <!-- Result Window Size
603
+
604
+ An optimization for use with the queryResultCache. When a search
605
+ is requested, a superset of the requested number of document ids
606
+ are collected. For example, if a search for a particular query
607
+ requests matching documents 10 through 19, and queryWindowSize is 50,
608
+ then documents 0 through 49 will be collected and cached. Any further
609
+ requests in that range can be satisfied via the cache.
610
+ -->
611
+ <queryResultWindowSize>20</queryResultWindowSize>
612
+
613
+ <!-- Maximum number of documents to cache for any entry in the
614
+ queryResultCache.
615
+ -->
616
+ <queryResultMaxDocsCached>200</queryResultMaxDocsCached>
617
+
618
+ <!-- Query Related Event Listeners
619
+
620
+ Various IndexSearcher related events can trigger Listeners to
621
+ take actions.
622
+
623
+ newSearcher - fired whenever a new searcher is being prepared
624
+ and there is a current searcher handling requests (aka
625
+ registered). It can be used to prime certain caches to
626
+ prevent long request times for certain requests.
627
+
628
+ firstSearcher - fired whenever a new searcher is being
629
+ prepared but there is no current registered searcher to handle
630
+ requests or to gain autowarming data from.
631
+
632
+
633
+ -->
634
+ <!-- QuerySenderListener takes an array of NamedList and executes a
635
+ local query request for each NamedList in sequence.
636
+ -->
65
637
  <listener event="newSearcher" class="solr.QuerySenderListener">
66
638
  <arr name="queries">
639
+ <!-- We don't put anything here as default in order to make softCommits
640
+ as cheap as possible (indexing-optimization). When used for
641
+ searching (or a combined index/search setup), there should be
642
+ representative queries here: Remember to state requests involving
643
+ all facets, groupings & sorts that are used -->
644
+
645
+ <!--
646
+ <lst><str name="q">solr</str><str name="sort">price asc</str></lst>
647
+ <lst><str name="q">rocks</str><str name="sort">weight asc</str></lst>
648
+ -->
67
649
  </arr>
68
650
  </listener>
69
651
  <listener event="firstSearcher" class="solr.QuerySenderListener">
70
652
  <arr name="queries">
653
+ <lst>
654
+ <str name="q">*:*</str>
655
+ </lst>
71
656
  </arr>
72
657
  </listener>
658
+
659
+ <!-- Use Cold Searcher
660
+
661
+ If a search request comes in and there is no current
662
+ registered searcher, then immediately register the still
663
+ warming searcher and use it. If "false" then all requests
664
+ will block until the first searcher is done warming.
665
+ -->
73
666
  <useColdSearcher>false</useColdSearcher>
667
+
668
+ <!-- Max Warming Searchers
669
+
670
+ Maximum number of searchers that may be warming in the
671
+ background concurrently. An error is returned if this limit
672
+ is exceeded.
673
+
674
+ Recommend values of 1-2 for read-only slaves, higher for
675
+ masters w/o cache warming.
676
+ -->
677
+ <maxWarmingSearchers>1</maxWarmingSearchers>
678
+
74
679
  </query>
75
680
 
76
- <requestDispatcher handleSelect="true">
77
- <requestParsers enableRemoteStreaming="true" multipartUploadLimitInKB="2048000" formdataUploadLimitInKB="2048" addHttpRequestToContext="false"/>
78
- <httpCaching never304="true"/>
681
+
682
+ <!-- Request Dispatcher
683
+
684
+ This section contains instructions for how the SolrDispatchFilter
685
+ should behave when processing requests for this SolrCore.
686
+
687
+ handleSelect is a legacy option that affects the behavior of requests
688
+ such as /select?qt=XXX
689
+
690
+ handleSelect="true" will cause the SolrDispatchFilter to process
691
+ the request and dispatch the query to a handler specified by the
692
+ "qt" param, assuming "/select" isn't already registered.
693
+
694
+ handleSelect="false" will cause the SolrDispatchFilter to
695
+ ignore "/select" requests, resulting in a 404 unless a handler
696
+ is explicitly registered with the name "/select"
697
+
698
+ handleSelect="true" is not recommended for new users, but is the default
699
+ for backwards compatibility
700
+ -->
701
+ <requestDispatcher handleSelect="false" >
702
+ <!-- Request Parsing
703
+
704
+ These settings indicate how Solr Requests may be parsed, and
705
+ what restrictions may be placed on the ContentStreams from
706
+ those requests
707
+
708
+ enableRemoteStreaming - enables use of the stream.file
709
+ and stream.url parameters for specifying remote streams.
710
+
711
+ multipartUploadLimitInKB - specifies the max size (in KiB) of
712
+ Multipart File Uploads that Solr will allow in a Request.
713
+
714
+ formdataUploadLimitInKB - specifies the max size (in KiB) of
715
+ form data (application/x-www-form-urlencoded) sent via
716
+ POST. You can use POST to pass request parameters not
717
+ fitting into the URL.
718
+
719
+ addHttpRequestToContext - if set to true, it will instruct
720
+ the requestParsers to include the original HttpServletRequest
721
+ object in the context map of the SolrQueryRequest under the
722
+ key "httpRequest". It will not be used by any of the existing
723
+ Solr components, but may be useful when developing custom
724
+ plugins.
725
+
726
+ *** WARNING ***
727
+ The settings below authorize Solr to fetch remote files, You
728
+ should make sure your system has some authentication before
729
+ using enableRemoteStreaming="true"
730
+
731
+ -->
732
+ <requestParsers enableRemoteStreaming="true"
733
+ multipartUploadLimitInKB="2048000"
734
+ formdataUploadLimitInKB="2048"
735
+ addHttpRequestToContext="false"/>
736
+
737
+ <!-- HTTP Caching
738
+
739
+ Set HTTP caching related parameters (for proxy caches and clients).
740
+
741
+ The options below instruct Solr not to output any HTTP Caching
742
+ related headers
743
+ -->
744
+ <httpCaching never304="true" />
745
+ <!-- If you include a <cacheControl> directive, it will be used to
746
+ generate a Cache-Control header (as well as an Expires header
747
+ if the value contains "max-age=")
748
+
749
+ By default, no Cache-Control header is generated.
750
+
751
+ You can use the <cacheControl> option even if you have set
752
+ never304="true"
753
+ -->
754
+ <!--
755
+ <httpCaching never304="true" >
756
+ <cacheControl>max-age=30, public</cacheControl>
757
+ </httpCaching>
758
+ -->
759
+ <!-- To enable Solr to respond with automatically generated HTTP
760
+ Caching headers, and to response to Cache Validation requests
761
+ correctly, set the value of never304="false"
762
+
763
+ This will cause Solr to generate Last-Modified and ETag
764
+ headers based on the properties of the Index.
765
+
766
+ The following options can also be specified to affect the
767
+ values of these headers...
768
+
769
+ lastModFrom - the default value is "openTime" which means the
770
+ Last-Modified value (and validation against If-Modified-Since
771
+ requests) will all be relative to when the current Searcher
772
+ was opened. You can change it to lastModFrom="dirLastMod" if
773
+ you want the value to exactly correspond to when the physical
774
+ index was last modified.
775
+
776
+ etagSeed="..." is an option you can change to force the ETag
777
+ header (and validation against If-None-Match requests) to be
778
+ different even if the index has not changed (ie: when making
779
+ significant changes to your config file)
780
+
781
+ (lastModifiedFrom and etagSeed are both ignored if you use
782
+ the never304="true" option)
783
+ -->
784
+ <!--
785
+ <httpCaching lastModifiedFrom="openTime"
786
+ etagSeed="Solr">
787
+ <cacheControl>max-age=30, public</cacheControl>
788
+ </httpCaching>
789
+ -->
79
790
  </requestDispatcher>
80
791
 
81
- <requestHandler name="/analysis/field" startup="lazy" class="solr.FieldAnalysisRequestHandler" />
792
+ <!-- Request Handlers
82
793
 
83
- <!-- config for the admin interface -->
84
- <admin>
85
- <defaultQuery>*:*</defaultQuery>
86
- </admin>
794
+ http://wiki.apache.org/solr/SolrRequestHandler
87
795
 
88
- <requestHandler name="/select" class="solr.SearchHandler" default="true">
89
- <lst name="defaults">
90
- <str name="defType">edismax</str>
91
- <str name="echoParams">explicit</str>
92
- <int name="rows">10</int>
93
- <str name="q.alt">*:*</str>
94
- <str name="qf">
95
- title^10
96
- author^10
97
- keywords^9
98
- description^8.5
99
- wct_title_^10
100
- wct_description^8.5
101
- url^15
102
- content^5
103
- host^5
104
- </str>
105
- <str name="pf">
106
- title^10
107
- author^10
108
- keywords^9
109
- description^8.5
110
- wct_title^10
111
- wct_description^8.5
112
- url^15
113
- content^5
114
- host^5
115
- </str>
116
- <int name="ps">3</int>
117
- <float name="tie">0.01</float>
118
- <str name="fl">id access_terms author category collection collection_name collection_number collections comments content content_encoding content_ffb content_first_bytes content_language content_length content_metadata content_metadata_ss content_text_length content_type content_type_droid content_type_ext content_type_full content_type_norm content_type_served content_type_tika content_type_version crawl_date crawl_dates crawl_year crawl_year_month crawl_year_month_day crawl_years description domain elements_used generator hash hashes host host_surt id_long image_colours image_dominant_colour image_faces image_faces_count image_height image_size image_width institution keywords last_modified last_modified_year license_url links links_domains links_hosts links_hosts_surts links_norm links_public_suffixes locations parse_error pdf_pdfa_errors pdf_pdfa_is_valid postcode postcode_district public_suffix publication_date publication_year record_type referrer_url resourcename sentiment sentiment_score server source_file source_file_offset status_code subject text title type url url_norm url_path url_type wayback_date wct_agency wct_collections wct_description wct_instance_id wct_subjects wct_target_id wct_titlexml_root_ns</str>
119
- <str name="facet">true</str>
120
- <str name="facet.mincount">1</str>
121
- <str name="spellcheck">true</str>
122
- <str name="spellcheck.dictionary">default</str>
123
- <str name="spellcheck.onlyMorePopular">true</str>
124
- <str name="spellcheck.extendedResults">true</str>
125
- <str name="spellcheck.collate">false</str>
126
- <str name="spellcheck.count">5</str>
796
+ Incoming queries will be dispatched to a specific handler by name
797
+ based on the path specified in the request.
798
+
799
+ Legacy behavior: If the request path uses "/select" but no Request
800
+ Handler has that name, and if handleSelect="true" has been specified in
801
+ the requestDispatcher, then the Request Handler is dispatched based on
802
+ the qt parameter. Handlers without a leading '/' are accessed this way
803
+ like so: http://host/app/[core/]select?qt=name If no qt is
804
+ given, then the requestHandler that declares default="true" will be
805
+ used or the one named "standard".
806
+
807
+ If a Request Handler is declared with startup="lazy", then it will
808
+ not be initialized until the first request that uses it.
809
+
810
+ -->
811
+ <!-- SearchHandler
812
+
813
+ http://wiki.apache.org/solr/SearchHandler
814
+
815
+ For processing Search Queries, the primary Request Handler
816
+ provided with Solr is "SearchHandler" It delegates to a sequent
817
+ of SearchComponents (see below) and supports distributed
818
+ queries across multiple shards
819
+ -->
820
+ <requestHandler name="/select" class="solr.SearchHandler">
821
+ <!-- default values for query parameters can be specified, these
822
+ will be overridden by parameters in the request
823
+ -->
824
+ <lst name="defaults">
825
+ <str name="wt">json</str> <!-- -->
826
+ <str name="echoParams">explicit</str>
827
+ <int name="rows">10</int>
828
+ <str name="defType">edismax</str>
829
+ <str name="q.op">AND</str>
830
+ <str name="tie">0.1</str>
831
+
832
+ <!-- Do not set mm, as this breaks OR-queries: https://issues.apache.org/jira/browse/SOLR-8812 -->
833
+ <!-- <str name="mm">100%</str> -->
834
+
835
+ <str name="qf">
836
+ text
837
+ author^5.0
838
+ title^2.0
839
+ description^2.0
840
+ url_search^0.5
841
+ </str>
842
+ <str name="pf">
843
+ text
844
+ </str>
845
+ <!-- We really want http 200 first. 404 will be boosted too much if url/title match-->
846
+ <str name="bq">
847
+ status_code:200^100
848
+ </str>
849
+ <str name="fl">*,score</str>
850
+ <str name="facet">false</str>
851
+ <str name="facet.mincount">1</str>
852
+ <str name="facet.limit">10</str>
853
+
854
+ <!-- Although we don't show facets per default, we want easy enabling of the common ones when
855
+ turning on faceting in the query -->
856
+ <str name="facet.field">domain</str>
857
+ <str name="facet.field">crawl_year</str>
858
+ <str name="facet.field">public_suffix</str>
859
+ <str name="facet.field">content_type_norm</str>
860
+ <str name="facet.field">status_code</str>
861
+ <str name="facet.field">host</str>
862
+
863
+ <str name="hl">on</str>
864
+ <str name="hl.requireFieldMatch">false</str>
865
+ <str name="hl.encoder">html</str>
866
+ <str name="f.content.hl.preserveMulti">true</str>
867
+ <str name="hl.fl">content</str>
868
+
869
+ </lst>
870
+ <arr name="last-components">
871
+ <str>highlight</str>
872
+ </arr>
873
+
874
+ </requestHandler>
875
+
876
+
877
+ <!-- realtime get handler, guaranteed to return the latest stored fields of
878
+ any document, without the need to commit or open a new searcher. The
879
+ current implementation relies on the updateLog feature being enabled.
880
+
881
+ ** WARNING **
882
+ Do NOT disable the realtime get handler at /get if you are using
883
+ SolrCloud otherwise any leader election will cause a full sync in ALL
884
+ replicas for the shard in question. Similarly, a replica recovery will
885
+ also always fetch the complete index from the leader because a partial
886
+ sync will not be possible in the absence of this handler.
887
+ -->
888
+ <requestHandler name="/get" class="solr.RealTimeGetHandler">
889
+ <lst name="defaults">
890
+ <str name="omitHeader">true</str>
891
+ <str name="wt">json</str>
892
+ <str name="indent">true</str>
893
+ </lst>
894
+ </requestHandler>
895
+
896
+
897
+ <!-- Update Request Handler.
898
+
899
+ http://wiki.apache.org/solr/UpdateXmlMessages
900
+
901
+ The canonical Request Handler for Modifying the Index through
902
+ commands specified using XML, JSON, CSV, or JAVABIN
903
+
904
+ Note: Since solr1.1 requestHandlers requires a valid content
905
+ type header if posted in the body. For example, curl now
906
+ requires: -H 'Content-type:text/xml; charset=utf-8'
907
+
908
+ To override the request content type and force a specific
909
+ Content-type, use the request parameter:
910
+ ?update.contentType=text/csv
911
+
912
+ This handler will pick a response format to match the input
913
+ if the 'wt' parameter is not explicit
914
+ -->
915
+ <requestHandler name="/update" class="solr.UpdateRequestHandler">
916
+ <!-- See below for information on defining
917
+ updateRequestProcessorChains that can be used by name
918
+ on each Update Request
919
+ -->
920
+ <!--
921
+ <lst name="defaults">
922
+ <str name="update.chain">dedupe</str>
923
+ </lst>
924
+ -->
925
+ </requestHandler>
926
+
927
+ <!-- for back compat with clients using /update/json and /update/csv -->
928
+ <requestHandler name="/update/json" class="solr.UpdateRequestHandler">
929
+ <lst name="defaults">
930
+ <str name="stream.contentType">application/json</str>
931
+ </lst>
932
+ </requestHandler>
933
+ <requestHandler name="/update/csv" class="solr.UpdateRequestHandler">
934
+ <lst name="defaults">
935
+ <str name="stream.contentType">application/csv</str>
936
+ </lst>
937
+ </requestHandler>
938
+
939
+ <!-- Solr Cell Update Request Handler
940
+
941
+ http://wiki.apache.org/solr/ExtractingRequestHandler
942
+
943
+ -->
944
+ <requestHandler name="/update/extract"
945
+ startup="lazy"
946
+ class="solr.extraction.ExtractingRequestHandler" >
947
+ <lst name="defaults">
948
+ <str name="lowernames">true</str>
949
+ <str name="uprefix">ignored_</str>
950
+
951
+ <!-- capture link hrefs but ignore div attributes -->
952
+ <str name="captureAttr">true</str>
953
+ <str name="fmap.a">links</str>
954
+ <str name="fmap.div">ignored_</str>
127
955
  </lst>
128
- <arr name="last-components">
129
- <str>spellcheck</str>
130
- </arr>
131
956
  </requestHandler>
132
957
 
133
- <!-- START Warclight Field-based searches -->
134
- <requestHandler name="/title_search" class="solr.SearchHandler">
135
- <lst name="defaults">
136
- <str name="defType">edismax</str>
137
- <str name="echoParams">explicit</str>
138
- <int name="rows">10</int>
139
- <str name="q.alt">*:*</str>
140
- <str name="df">title</str>
141
- <str name="q.op">AND</str>
142
- <str name="qf">title</str>
143
- <str name="pf">title</str>
144
- <str name="fl">*</str>
145
- <str name="facet">true</str>
146
- <str name="facet.mincount">1</str>
147
- </lst>
148
- </requestHandler>
149
- <requestHandler name="/content_search" class="solr.SearchHandler">
150
- <lst name="defaults">
151
- <str name="defType">edismax</str>
152
- <str name="echoParams">explicit</str>
153
- <int name="rows">10</int>
154
- <str name="q.alt">*:*</str>
155
- <str name="df">content</str>
156
- <str name="q.op">AND</str>
157
- <str name="qf">content</str>
158
- <str name="pf">content</str>
159
- <str name="fl">*</str>
160
- <str name="facet">true</str>
161
- <str name="facet.mincount">1</str>
162
- </lst>
163
- </requestHandler>
164
- <requestHandler name="/url_search" class="solr.SearchHandler">
165
- <lst name="defaults">
166
- <str name="defType">edismax</str>
167
- <str name="echoParams">explicit</str>
168
- <int name="rows">10</int>
169
- <str name="q.alt">*:*</str>
170
- <str name="df">url</str>
171
- <str name="q.op">AND</str>
172
- <str name="qf">url</str>
173
- <str name="pf">url</str>
174
- <str name="fl">*</str>
175
- <str name="facet">true</str>
176
- <str name="facet.mincount">1</str>
177
- </lst>
178
- </requestHandler>
179
- <requestHandler name="/host_search" class="solr.SearchHandler">
180
- <lst name="defaults">
181
- <str name="defType">edismax</str>
182
- <str name="echoParams">explicit</str>
183
- <int name="rows">10</int>
184
- <str name="q.alt">*:*</str>
185
- <str name="df">host</str>
186
- <str name="q.op">AND</str>
187
- <str name="qf">host</str>
188
- <str name="pf">host</str>
189
- <str name="fl">*</str>
190
- <str name="facet">true</str>
191
- <str name="facet.mincount">1</str>
192
- </lst>
193
- </requestHandler>
194
- <!-- END Warclight Field-based searches -->
195
-
196
- <searchComponent name="spellcheck" class="solr.SpellCheckComponent">
197
- <str name="queryAnalyzerFieldType">text_general</str>
958
+
959
+ <!-- Field Analysis Request Handler
960
+
961
+ RequestHandler that provides much the same functionality as
962
+ analysis.jsp. Provides the ability to specify multiple field
963
+ types and field names in the same request and outputs
964
+ index-time and query-time analysis for each of them.
965
+
966
+ Request parameters are:
967
+ analysis.fieldname - field name whose analyzers are to be used
968
+
969
+ analysis.fieldtype - field type whose analyzers are to be used
970
+ analysis.fieldvalue - text for index-time analysis
971
+ q (or analysis.q) - text for query time analysis
972
+ analysis.showmatch (true|false) - When set to true and when
973
+ query analysis is performed, the produced tokens of the
974
+ field value analysis will be marked as "matched" for every
975
+ token that is produces by the query analysis
976
+ -->
977
+ <requestHandler name="/analysis/field"
978
+ startup="lazy"
979
+ class="solr.FieldAnalysisRequestHandler" />
980
+
981
+
982
+ <!-- Document Analysis Handler
983
+
984
+ http://wiki.apache.org/solr/AnalysisRequestHandler
985
+
986
+ An analysis handler that provides a breakdown of the analysis
987
+ process of provided documents. This handler expects a (single)
988
+ content stream with the following format:
989
+
990
+ <docs>
991
+ <doc>
992
+ <field name="id">1</field>
993
+ <field name="name">The Name</field>
994
+ <field name="text">The Text Value</field>
995
+ </doc>
996
+ <doc>...</doc>
997
+ <doc>...</doc>
998
+ ...
999
+ </docs>
1000
+
1001
+ Note: Each document must contain a field which serves as the
1002
+ unique key. This key is used in the returned response to associate
1003
+ an analysis breakdown to the analyzed document.
1004
+
1005
+ Like the FieldAnalysisRequestHandler, this handler also supports
1006
+ query analysis by sending either an "analysis.query" or "q"
1007
+ request parameter that holds the query text to be analyzed. It
1008
+ also supports the "analysis.showmatch" parameter which when set to
1009
+ true, all field tokens that match the query tokens will be marked
1010
+ as a "match".
1011
+ -->
1012
+ <requestHandler name="/analysis/document"
1013
+ class="solr.DocumentAnalysisRequestHandler"
1014
+ startup="lazy" />
1015
+
1016
+ <!-- If you wish to hide files under ${solr.home}/conf, explicitly
1017
+ register the ShowFileRequestHandler using the definition below.
1018
+ NOTE: The glob pattern ('*') is the only pattern supported at present, *.xml will
1019
+ not exclude all files ending in '.xml'. Use it to exclude _all_ updates
1020
+ -->
1021
+ <!--
1022
+ <requestHandler name="/admin/file"
1023
+ class="solr.admin.ShowFileRequestHandler" >
1024
+ <lst name="invariants">
1025
+ <str name="hidden">synonyms.txt</str>
1026
+ <str name="hidden">anotherfile.txt</str>
1027
+ <str name="hidden">*</str>
1028
+ </lst>
1029
+ </requestHandler>
1030
+ -->
1031
+
1032
+ <!--
1033
+ Enabling this request handler (which is NOT a default part of the admin handler) will allow the Solr UI to edit
1034
+ all the config files. This is intended for secure/development use ONLY! Leaving available and publically
1035
+ accessible is a security vulnerability and should be done with extreme caution!
1036
+ -->
1037
+ <!-- ping/healthcheck -->
1038
+ <requestHandler name="/admin/ping" class="solr.PingRequestHandler">
1039
+ <lst name="invariants">
1040
+ <str name="q">solrpingquery</str>
1041
+ </lst>
1042
+ <lst name="defaults">
1043
+ <str name="echoParams">all</str>
1044
+ </lst>
1045
+ <!-- An optional feature of the PingRequestHandler is to configure the
1046
+ handler with a "healthcheckFile" which can be used to enable/disable
1047
+ the PingRequestHandler.
1048
+ relative paths are resolved against the data dir
1049
+ -->
1050
+ <!-- <str name="healthcheckFile">server-enabled.txt</str> -->
1051
+ </requestHandler>
1052
+
1053
+ <!-- Echo the request contents back to the client -->
1054
+ <requestHandler name="/debug/dump" class="solr.DumpRequestHandler" >
1055
+ <lst name="defaults">
1056
+ <str name="echoParams">explicit</str>
1057
+ <str name="echoHandler">true</str>
1058
+ </lst>
1059
+ </requestHandler>
1060
+
1061
+ <!-- Solr Replication
1062
+
1063
+ The SolrReplicationHandler supports replicating indexes from a
1064
+ "master" used for indexing and "slaves" used for queries.
1065
+
1066
+ http://wiki.apache.org/solr/SolrReplication
1067
+
1068
+ It is also necessary for SolrCloud to function (in Cloud mode, the
1069
+ replication handler is used to bulk transfer segments when nodes
1070
+ are added or need to recover).
1071
+
1072
+ https://wiki.apache.org/solr/SolrCloud/
1073
+ -->
1074
+ <requestHandler name="/replication" class="solr.ReplicationHandler" >
1075
+ <!--
1076
+ To enable simple master/slave replication, uncomment one of the
1077
+ sections below, depending on whether this solr instance should be
1078
+ the "master" or a "slave". If this instance is a "slave" you will
1079
+ also need to fill in the masterUrl to point to a real machine.
1080
+ -->
1081
+ <!--
1082
+ <lst name="master">
1083
+ <str name="replicateAfter">commit</str>
1084
+ <str name="replicateAfter">startup</str>
1085
+ <str name="confFiles">schema.xml,stopwords.txt</str>
1086
+ </lst>
1087
+ -->
1088
+ <!--
1089
+ <lst name="slave">
1090
+ <str name="masterUrl">http://your-master-hostname:8983/solr</str>
1091
+ <str name="pollInterval">00:00:60</str>
1092
+ </lst>
1093
+ -->
1094
+ </requestHandler>
1095
+
1096
+ <!-- Search Components
1097
+
1098
+ Search components are registered to SolrCore and used by
1099
+ instances of SearchHandler (which can access them by name)
1100
+
1101
+ By default, the following components are available:
1102
+
1103
+ <searchComponent name="query" class="solr.QueryComponent" />
1104
+ <searchComponent name="facet" class="solr.FacetComponent" />
1105
+ <searchComponent name="mlt" class="solr.MoreLikeThisComponent" />
1106
+ <searchComponent name="highlight" class="solr.HighlightComponent" />
1107
+ <searchComponent name="stats" class="solr.StatsComponent" />
1108
+ <searchComponent name="debug" class="solr.DebugComponent" />
1109
+
1110
+ Default configuration in a requestHandler would look like:
1111
+
1112
+ <arr name="components">
1113
+ <str>query</str>
1114
+ <str>facet</str>
1115
+ <str>mlt</str>
1116
+ <str>highlight</str>
1117
+ <str>stats</str>
1118
+ <str>debug</str>
1119
+ </arr>
1120
+
1121
+ If you register a searchComponent to one of the standard names,
1122
+ that will be used instead of the default.
1123
+
1124
+ To insert components before or after the 'standard' components, use:
1125
+
1126
+ <arr name="first-components">
1127
+ <str>myFirstComponentName</str>
1128
+ </arr>
1129
+
1130
+ <arr name="last-components">
1131
+ <str>myLastComponentName</str>
1132
+ </arr>
1133
+
1134
+ NOTE: The component registered with the name "debug" will
1135
+ always be executed after the "last-components"
1136
+
1137
+ -->
1138
+
1139
+ <!-- Spell Check
1140
+
1141
+ The spell check component can return a list of alternative spelling
1142
+ suggestions.
1143
+
1144
+ http://wiki.apache.org/solr/SpellCheckComponent
1145
+ -->
1146
+ <searchComponent name="spellcheck" class="solr.SpellCheckComponent">
1147
+
1148
+ <!-- BL changed from text_general -->
1149
+ <str name="queryAnalyzerFieldType">textSpell</str>
1150
+ <!-- BL -->
1151
+
198
1152
  <!-- Multiple "Spell Checkers" can be declared and used by this
199
1153
  component
200
1154
  -->
1155
+
201
1156
  <!-- a spellchecker built from a field of the main index -->
202
1157
  <lst name="spellchecker">
203
1158
  <str name="name">default</str>
204
- <str name="field">text</str>
1159
+
1160
+ <!-- BL changed from text -->
1161
+ <str name="field">spell</str>
1162
+ <!-- BL -->
1163
+
205
1164
  <str name="classname">solr.DirectSolrSpellChecker</str>
206
1165
  <!-- the spellcheck distance measure used, the default is the internal levenshtein -->
207
1166
  <str name="distanceMeasure">internal</str>
@@ -218,8 +1177,842 @@
218
1177
  <!-- maximum threshold of documents a query term can appear to be considered for correction -->
219
1178
  <float name="maxQueryFrequency">0.01</float>
220
1179
  <!-- uncomment this to require suggestions to occur in 1% of the documents
221
- <float name="thresholdTokenFrequency">.01</float>
1180
+ <float name="thresholdTokenFrequency">.01</float>
1181
+ -->
1182
+ </lst>
1183
+
1184
+ <!-- a spellchecker that can break or combine words. See "/spell" handler below for usage -->
1185
+ <lst name="spellchecker">
1186
+ <str name="name">wordbreak</str>
1187
+ <str name="classname">solr.WordBreakSolrSpellChecker</str>
1188
+ <str name="field">name</str>
1189
+ <str name="combineWords">true</str>
1190
+ <str name="breakWords">true</str>
1191
+ <int name="maxChanges">10</int>
1192
+ </lst>
1193
+
1194
+ <!-- a spellchecker that uses a different distance measure -->
1195
+ <!--
1196
+ <lst name="spellchecker">
1197
+ <str name="name">jarowinkler</str>
1198
+ <str name="field">spell</str>
1199
+ <str name="classname">solr.DirectSolrSpellChecker</str>
1200
+ <str name="distanceMeasure">
1201
+ org.apache.lucene.search.spell.JaroWinklerDistance
1202
+ </str>
1203
+ </lst>
1204
+ -->
1205
+
1206
+ <!-- a spellchecker that use an alternate comparator
1207
+
1208
+ comparatorClass be one of:
1209
+ 1. score (default)
1210
+ 2. freq (Frequency first, then score)
1211
+ 3. A fully qualified class name
1212
+ -->
1213
+ <!--
1214
+ <lst name="spellchecker">
1215
+ <str name="name">freq</str>
1216
+ <str name="field">lowerfilt</str>
1217
+ <str name="classname">solr.DirectSolrSpellChecker</str>
1218
+ <str name="comparatorClass">freq</str>
222
1219
  -->
1220
+
1221
+ <!-- A spellchecker that reads the list of words from a file -->
1222
+ <!--
1223
+ <lst name="spellchecker">
1224
+ <str name="classname">solr.FileBasedSpellChecker</str>
1225
+ <str name="name">file</str>
1226
+ <str name="sourceLocation">spellings.txt</str>
1227
+ <str name="characterEncoding">UTF-8</str>
1228
+ <str name="spellcheckIndexDir">spellcheckerFile</str>
1229
+ </lst>
1230
+ -->
1231
+ </searchComponent>
1232
+
1233
+ <!-- A request handler for demonstrating the spellcheck component.
1234
+
1235
+ NOTE: This is purely as an example. The whole purpose of the
1236
+ SpellCheckComponent is to hook it into the request handler that
1237
+ handles your normal user queries so that a separate request is
1238
+ not needed to get suggestions.
1239
+
1240
+ IN OTHER WORDS, THERE IS REALLY GOOD CHANCE THE SETUP BELOW IS
1241
+ NOT WHAT YOU WANT FOR YOUR PRODUCTION SYSTEM!
1242
+
1243
+ See http://wiki.apache.org/solr/SpellCheckComponent for details
1244
+ on the request parameters.
1245
+ -->
1246
+ <requestHandler name="/spell" class="solr.SearchHandler" startup="lazy">
1247
+ <lst name="defaults">
1248
+ <str name="df">text</str>
1249
+ <!-- Solr will use suggestions from both the 'default' spellchecker
1250
+ and from the 'wordbreak' spellchecker and combine them.
1251
+ collations (re-written queries) can include a combination of
1252
+ corrections from both spellcheckers -->
1253
+ <str name="spellcheck.dictionary">default</str>
1254
+ <str name="spellcheck.dictionary">wordbreak</str>
1255
+ <str name="spellcheck">on</str>
1256
+ <str name="spellcheck.extendedResults">true</str>
1257
+ <str name="spellcheck.count">10</str>
1258
+ <str name="spellcheck.alternativeTermCount">5</str>
1259
+ <str name="spellcheck.maxResultsForSuggest">5</str>
1260
+ <str name="spellcheck.collate">true</str>
1261
+ <str name="spellcheck.collateExtendedResults">true</str>
1262
+ <str name="spellcheck.maxCollationTries">10</str>
1263
+ <str name="spellcheck.maxCollations">5</str>
1264
+ </lst>
1265
+ <arr name="last-components">
1266
+ <str>spellcheck</str>
1267
+ </arr>
1268
+ </requestHandler>
1269
+
1270
+ <!-- Term Vector Component
1271
+
1272
+ http://wiki.apache.org/solr/TermVectorComponent
1273
+ -->
1274
+ <searchComponent name="tvComponent" class="solr.TermVectorComponent"/>
1275
+
1276
+ <!-- A request handler for demonstrating the term vector component
1277
+
1278
+ This is purely as an example.
1279
+
1280
+ In reality you will likely want to add the component to your
1281
+ already specified request handlers.
1282
+ -->
1283
+ <requestHandler name="/tvrh" class="solr.SearchHandler" startup="lazy">
1284
+ <lst name="defaults">
1285
+ <str name="df">text</str>
1286
+ <bool name="tv">true</bool>
1287
+ </lst>
1288
+ <arr name="last-components">
1289
+ <str>tvComponent</str>
1290
+ </arr>
1291
+ </requestHandler>
1292
+
1293
+ <!-- Clustering Component
1294
+
1295
+ You'll need to set the solr.clustering.enabled system property
1296
+ when running solr to run with clustering enabled:
1297
+
1298
+ java -Dsolr.clustering.enabled=true -jar start.jar
1299
+
1300
+ http://wiki.apache.org/solr/ClusteringComponent
1301
+ http://carrot2.github.io/solr-integration-strategies/
1302
+ -->
1303
+ <searchComponent name="clustering"
1304
+ enable="${solr.clustering.enabled:false}"
1305
+ class="solr.clustering.ClusteringComponent" >
1306
+ <lst name="engine">
1307
+ <str name="name">lingo</str>
1308
+
1309
+ <!-- Class name of a clustering algorithm compatible with the Carrot2 framework.
1310
+
1311
+ Currently available open source algorithms are:
1312
+ * org.carrot2.clustering.lingo.LingoClusteringAlgorithm
1313
+ * org.carrot2.clustering.stc.STCClusteringAlgorithm
1314
+ * org.carrot2.clustering.kmeans.BisectingKMeansClusteringAlgorithm
1315
+
1316
+ See http://project.carrot2.org/algorithms.html for more information.
1317
+
1318
+ A commercial algorithm Lingo3G (needs to be installed separately) is defined as:
1319
+ * com.carrotsearch.lingo3g.Lingo3GClusteringAlgorithm
1320
+ -->
1321
+ <str name="carrot.algorithm">org.carrot2.clustering.lingo.LingoClusteringAlgorithm</str>
1322
+
1323
+ <!-- Override location of the clustering algorithm's resources
1324
+ (attribute definitions and lexical resources).
1325
+
1326
+ A directory from which to load algorithm-specific stop words,
1327
+ stop labels and attribute definition XMLs.
1328
+
1329
+ For an overview of Carrot2 lexical resources, see:
1330
+ http://download.carrot2.org/head/manual/#chapter.lexical-resources
1331
+
1332
+ For an overview of Lingo3G lexical resources, see:
1333
+ http://download.carrotsearch.com/lingo3g/manual/#chapter.lexical-resources
1334
+ -->
1335
+ <str name="carrot.resourcesDir">clustering/carrot2</str>
1336
+ </lst>
1337
+
1338
+ <!-- An example definition for the STC clustering algorithm. -->
1339
+ <lst name="engine">
1340
+ <str name="name">stc</str>
1341
+ <str name="carrot.algorithm">org.carrot2.clustering.stc.STCClusteringAlgorithm</str>
1342
+ </lst>
1343
+
1344
+ <!-- An example definition for the bisecting kmeans clustering algorithm. -->
1345
+ <lst name="engine">
1346
+ <str name="name">kmeans</str>
1347
+ <str name="carrot.algorithm">org.carrot2.clustering.kmeans.BisectingKMeansClusteringAlgorithm</str>
1348
+ </lst>
1349
+ </searchComponent>
1350
+
1351
+ <!-- Terms Component
1352
+
1353
+ http://wiki.apache.org/solr/TermsComponent
1354
+
1355
+ A component to return terms and document frequency of those
1356
+ terms
1357
+ -->
1358
+ <searchComponent name="terms" class="solr.TermsComponent"/>
1359
+
1360
+ <!-- A request handler for demonstrating the terms component -->
1361
+ <requestHandler name="/terms" class="solr.SearchHandler" startup="lazy">
1362
+ <lst name="defaults">
1363
+ <bool name="terms">true</bool>
1364
+ <bool name="distrib">false</bool>
1365
+ </lst>
1366
+ <arr name="components">
1367
+ <str>terms</str>
1368
+ </arr>
1369
+ </requestHandler>
1370
+
1371
+
1372
+
1373
+ <!-- Highlighting Component
1374
+
1375
+ http://wiki.apache.org/solr/HighlightingParameters
1376
+ -->
1377
+ <searchComponent class="solr.HighlightComponent" name="highlight">
1378
+ <highlighting>
1379
+ <!-- Configure the standard fragmenter -->
1380
+ <!-- This could most likely be commented out in the "default" case -->
1381
+ <fragmenter name="gap"
1382
+ default="true"
1383
+ class="solr.highlight.GapFragmenter">
1384
+ <lst name="defaults">
1385
+ <int name="hl.fragsize">100</int>
1386
+ </lst>
1387
+ </fragmenter>
1388
+
1389
+ <!-- A regular-expression-based fragmenter
1390
+ (for sentence extraction)
1391
+ -->
1392
+ <fragmenter name="regex"
1393
+ class="solr.highlight.RegexFragmenter">
1394
+ <lst name="defaults">
1395
+ <!-- slightly smaller fragsizes work better because of slop -->
1396
+ <int name="hl.fragsize">70</int>
1397
+ <!-- allow 50% slop on fragment sizes -->
1398
+ <float name="hl.regex.slop">0.5</float>
1399
+ <!-- a basic sentence pattern -->
1400
+ <str name="hl.regex.pattern">[-\w ,/\n\&quot;&apos;]{20,200}</str>
1401
+ </lst>
1402
+ </fragmenter>
1403
+
1404
+ <!-- Configure the standard formatter -->
1405
+ <formatter name="html"
1406
+ default="true"
1407
+ class="solr.highlight.HtmlFormatter">
1408
+ <lst name="defaults">
1409
+ <str name="hl.simple.pre"><![CDATA[<em>]]></str>
1410
+ <str name="hl.simple.post"><![CDATA[</em>]]></str>
1411
+ </lst>
1412
+ </formatter>
1413
+
1414
+ <!-- Configure the standard encoder -->
1415
+ <encoder name="html"
1416
+ class="solr.highlight.HtmlEncoder" />
1417
+
1418
+ <!-- Configure the standard fragListBuilder -->
1419
+ <fragListBuilder name="simple"
1420
+ class="solr.highlight.SimpleFragListBuilder"/>
1421
+
1422
+ <!-- Configure the single fragListBuilder -->
1423
+ <fragListBuilder name="single"
1424
+ class="solr.highlight.SingleFragListBuilder"/>
1425
+
1426
+ <!-- Configure the weighted fragListBuilder -->
1427
+ <fragListBuilder name="weighted"
1428
+ default="true"
1429
+ class="solr.highlight.WeightedFragListBuilder"/>
1430
+
1431
+ <!-- default tag FragmentsBuilder -->
1432
+ <fragmentsBuilder name="default"
1433
+ default="true"
1434
+ class="solr.highlight.ScoreOrderFragmentsBuilder">
1435
+ <!--
1436
+ <lst name="defaults">
1437
+ <str name="hl.multiValuedSeparatorChar">/</str>
1438
+ </lst>
1439
+ -->
1440
+ </fragmentsBuilder>
1441
+
1442
+ <!-- multi-colored tag FragmentsBuilder -->
1443
+ <fragmentsBuilder name="colored"
1444
+ class="solr.highlight.ScoreOrderFragmentsBuilder">
1445
+ <lst name="defaults">
1446
+ <str name="hl.tag.pre"><![CDATA[
1447
+ <b style="background:yellow">,<b style="background:lawgreen">,
1448
+ <b style="background:aquamarine">,<b style="background:magenta">,
1449
+ <b style="background:palegreen">,<b style="background:coral">,
1450
+ <b style="background:wheat">,<b style="background:khaki">,
1451
+ <b style="background:lime">,<b style="background:deepskyblue">]]></str>
1452
+ <str name="hl.tag.post"><![CDATA[</b>]]></str>
1453
+ </lst>
1454
+ </fragmentsBuilder>
1455
+
1456
+ <boundaryScanner name="default"
1457
+ default="true"
1458
+ class="solr.highlight.SimpleBoundaryScanner">
1459
+ <lst name="defaults">
1460
+ <str name="hl.bs.maxScan">10</str>
1461
+ <str name="hl.bs.chars">.,!? &#9;&#10;&#13;</str>
1462
+ </lst>
1463
+ </boundaryScanner>
1464
+
1465
+ <boundaryScanner name="breakIterator"
1466
+ class="solr.highlight.BreakIteratorBoundaryScanner">
1467
+ <lst name="defaults">
1468
+ <!-- type should be one of CHARACTER, WORD(default), LINE and SENTENCE -->
1469
+ <str name="hl.bs.type">WORD</str>
1470
+ <!-- language and country are used when constructing Locale object. -->
1471
+ <!-- And the Locale object will be used when getting instance of BreakIterator -->
1472
+ <str name="hl.bs.language">en</str>
1473
+ <str name="hl.bs.country">US</str>
1474
+ </lst>
1475
+ </boundaryScanner>
1476
+ </highlighting>
1477
+ </searchComponent>
1478
+
1479
+ <!-- Update Processors
1480
+
1481
+ Chains of Update Processor Factories for dealing with Update
1482
+ Requests can be declared, and then used by name in Update
1483
+ Request Processors
1484
+
1485
+ http://wiki.apache.org/solr/UpdateRequestProcessor
1486
+
1487
+ -->
1488
+ <!-- Deduplication
1489
+
1490
+ An example dedup update processor that creates the "id" field
1491
+ on the fly based on the hash code of some other fields. This
1492
+ example has overwriteDupes set to false since we are using the
1493
+ id field as the signatureField and Solr will maintain
1494
+ uniqueness based on that anyway.
1495
+
1496
+ -->
1497
+ <!--
1498
+ <updateRequestProcessorChain name="dedupe">
1499
+ <processor class="solr.processor.SignatureUpdateProcessorFactory">
1500
+ <bool name="enabled">true</bool>
1501
+ <str name="signatureField">id</str>
1502
+ <bool name="overwriteDupes">false</bool>
1503
+ <str name="fields">name,features,cat</str>
1504
+ <str name="signatureClass">solr.processor.Lookup3Signature</str>
1505
+ </processor>
1506
+ <processor class="solr.LogUpdateProcessorFactory" />
1507
+ <processor class="solr.RunUpdateProcessorFactory" />
1508
+ </updateRequestProcessorChain>
1509
+ -->
1510
+
1511
+ <!-- Language identification
1512
+
1513
+ This example update chain identifies the language of the incoming
1514
+ documents using the langid contrib. The detected language is
1515
+ written to field language_s. No field name mapping is done.
1516
+ The fields used for detection are text, title, subject and description,
1517
+ making this example suitable for detecting languages form full-text
1518
+ rich documents injected via ExtractingRequestHandler.
1519
+ See more about langId at http://wiki.apache.org/solr/LanguageDetection
1520
+ -->
1521
+ <!--
1522
+ <updateRequestProcessorChain name="langid">
1523
+ <processor class="org.apache.solr.update.processor.TikaLanguageIdentifierUpdateProcessorFactory">
1524
+ <str name="langid.fl">text,title,subject,description</str>
1525
+ <str name="langid.langField">language_s</str>
1526
+ <str name="langid.fallback">en</str>
1527
+ </processor>
1528
+ <processor class="solr.LogUpdateProcessorFactory" />
1529
+ <processor class="solr.RunUpdateProcessorFactory" />
1530
+ </updateRequestProcessorChain>
1531
+ -->
1532
+
1533
+ <!-- Script update processor
1534
+
1535
+ This example hooks in an update processor implemented using JavaScript.
1536
+
1537
+ See more about the script update processor at http://wiki.apache.org/solr/ScriptUpdateProcessor
1538
+ -->
1539
+ <!--
1540
+ <updateRequestProcessorChain name="script">
1541
+ <processor class="solr.StatelessScriptUpdateProcessorFactory">
1542
+ <str name="script">update-script.js</str>
1543
+ <lst name="params">
1544
+ <str name="config_param">example config parameter</str>
1545
+ </lst>
1546
+ </processor>
1547
+ <processor class="solr.RunUpdateProcessorFactory" />
1548
+ </updateRequestProcessorChain>
1549
+ -->
1550
+
1551
+ <!-- Response Writers
1552
+
1553
+ http://wiki.apache.org/solr/QueryResponseWriter
1554
+
1555
+ Request responses will be written using the writer specified by
1556
+ the 'wt' request parameter matching the name of a registered
1557
+ writer.
1558
+
1559
+ The "default" writer is the default and will be used if 'wt' is
1560
+ not specified in the request.
1561
+ -->
1562
+ <!-- The following response writers are implicitly configured unless
1563
+ overridden...
1564
+ -->
1565
+ <!--
1566
+ <queryResponseWriter name="xml"
1567
+ default="true"
1568
+ class="solr.XMLResponseWriter" />
1569
+ <queryResponseWriter name="json" class="solr.JSONResponseWriter"/>
1570
+ <queryResponseWriter name="python" class="solr.PythonResponseWriter"/>
1571
+ <queryResponseWriter name="ruby" class="solr.RubyResponseWriter"/>
1572
+ <queryResponseWriter name="php" class="solr.PHPResponseWriter"/>
1573
+ <queryResponseWriter name="phps" class="solr.PHPSerializedResponseWriter"/>
1574
+ <queryResponseWriter name="csv" class="solr.CSVResponseWriter"/>
1575
+ <queryResponseWriter name="schema.xml" class="solr.SchemaXmlResponseWriter"/>
1576
+ -->
1577
+
1578
+ <queryResponseWriter name="json" class="solr.JSONResponseWriter">
1579
+ <!-- For the purposes of the tutorial, JSON responses are written as
1580
+ plain text so that they are easy to read in *any* browser.
1581
+ If you expect a MIME type of "application/json" just remove this override.
1582
+ -->
1583
+ <str name="content-type">text/plain; charset=UTF-8</str>
1584
+ </queryResponseWriter>
1585
+
1586
+ <!--
1587
+ Custom response writers can be declared as needed...
1588
+ -->
1589
+ <queryResponseWriter name="velocity" class="solr.VelocityResponseWriter" startup="lazy"/>
1590
+
1591
+
1592
+ <!-- XSLT response writer transforms the XML output by any xslt file found
1593
+ in Solr's conf/xslt directory. Changes to xslt files are checked for
1594
+ every xsltCacheLifetimeSeconds.
1595
+ -->
1596
+ <queryResponseWriter name="xslt" class="solr.XSLTResponseWriter">
1597
+ <int name="xsltCacheLifetimeSeconds">5</int>
1598
+ </queryResponseWriter>
1599
+
1600
+ <!-- Query Parsers
1601
+
1602
+ http://wiki.apache.org/solr/SolrQuerySyntax
1603
+
1604
+ Multiple QParserPlugins can be registered by name, and then
1605
+ used in either the "defType" param for the QueryComponent (used
1606
+ by SearchHandler) or in LocalParams
1607
+ -->
1608
+ <!-- example of registering a query parser -->
1609
+ <!--
1610
+ <queryParser name="myparser" class="com.mycompany.MyQParserPlugin"/>
1611
+ -->
1612
+
1613
+ <!-- Function Parsers
1614
+
1615
+ http://wiki.apache.org/solr/FunctionQuery
1616
+
1617
+ Multiple ValueSourceParsers can be registered by name, and then
1618
+ used as function names when using the "func" QParser.
1619
+ -->
1620
+ <!-- example of registering a custom function parser -->
1621
+ <!--
1622
+ <valueSourceParser name="myfunc"
1623
+ class="com.mycompany.MyValueSourceParser" />
1624
+ -->
1625
+
1626
+
1627
+ <!-- Document Transformers
1628
+ http://wiki.apache.org/solr/DocTransformers
1629
+ -->
1630
+ <!--
1631
+ Could be something like:
1632
+ <transformer name="db" class="com.mycompany.LoadFromDatabaseTransformer" >
1633
+ <int name="connection">jdbc://....</int>
1634
+ </transformer>
1635
+
1636
+ To add a constant value to all docs, use:
1637
+ <transformer name="mytrans2" class="org.apache.solr.response.transform.ValueAugmenterFactory" >
1638
+ <int name="value">5</int>
1639
+ </transformer>
1640
+
1641
+ If you want the user to still be able to change it with _value:something_ use this:
1642
+ <transformer name="mytrans3" class="org.apache.solr.response.transform.ValueAugmenterFactory" >
1643
+ <double name="defaultValue">5</double>
1644
+ </transformer>
1645
+
1646
+ If you are using the QueryElevationComponent, you may wish to mark documents that get boosted. The
1647
+ EditorialMarkerFactory will do exactly that:
1648
+ <transformer name="qecBooster" class="org.apache.solr.response.transform.EditorialMarkerFactory" />
1649
+ -->
1650
+
1651
+ <!-- BL autosuggest from Kinman -->
1652
+ <searchComponent class="solr.SpellCheckComponent" name="suggestTitle">
1653
+ <lst name="spellchecker">
1654
+ <str name="name">suggest</str>
1655
+ <str name="classname">org.apache.solr.spelling.suggest.Suggester</str>
1656
+ <str name="lookupImpl">org.apache.solr.spelling.suggest.tst.TSTLookupFactory</str>
1657
+ <!-- Alternatives to lookupImpl: org.apache.solr.spelling.suggest.fst.FSTLookupFactory
1658
+ [finite state automaton] org.apache.solr.spelling.suggest.fst.WFSTLookupFactory
1659
+ [weighted finite state automaton] org.apache.solr.spelling.suggest.jaspell.JaspellLookupFactory
1660
+ [default, jaspell-based] org.apache.solr.spelling.suggest.tst.TSTLookupFactory
1661
+ [ternary trees] -->
1662
+ <str name="field">title</str> <!-- the indexed field to derive suggestions from -->
1663
+ <float name="threshold">0.005</float>
1664
+ <str name="buildOnCommit">true</str>
1665
+ <!-- <str name="sourceLocation">american-english</str> -->
1666
+ </lst>
1667
+ </searchComponent>
1668
+
1669
+ <requestHandler class="org.apache.solr.handler.component.SearchHandler" name="/suggestTitle">
1670
+ <lst name="defaults">
1671
+ <str name="spellcheck">true</str>
1672
+ <str name="spellcheck.dictionary">suggest</str>
1673
+ <str name="spellcheck.onlyMorePopular">true</str>
1674
+ <str name="spellcheck.count">5</str>
1675
+ <str name="spellcheck.collate">true</str>
1676
+ </lst>
1677
+ <arr name="components">
1678
+ <str>suggestTitle</str>
1679
+ </arr>
1680
+ </requestHandler>
1681
+
1682
+ <searchComponent class="solr.SpellCheckComponent" name="suggestUrl">
1683
+ <lst name="spellchecker">
1684
+ <str name="name">suggest</str>
1685
+ <str name="classname">org.apache.solr.spelling.suggest.Suggester</str>
1686
+ <str name="lookupImpl">org.apache.solr.spelling.suggest.tst.TSTLookupFactory</str>
1687
+ <!-- Alternatives to lookupImpl: org.apache.solr.spelling.suggest.fst.FSTLookupFactory
1688
+ [finite state automaton] org.apache.solr.spelling.suggest.fst.WFSTLookupFactory
1689
+ [weighted finite state automaton] org.apache.solr.spelling.suggest.jaspell.JaspellLookupFactory
1690
+ [default, jaspell-based] org.apache.solr.spelling.suggest.tst.TSTLookupFactory
1691
+ [ternary trees] -->
1692
+ <str name="field">url</str> <!-- the indexed field to derive suggestions from -->
1693
+ <float name="threshold">0.005</float>
1694
+ <str name="buildOnCommit">true</str>
1695
+ <!-- <str name="sourceLocation">american-english</str> -->
223
1696
  </lst>
224
1697
  </searchComponent>
1698
+
1699
+ <requestHandler class="org.apache.solr.handler.component.SearchHandler" name="/suggestUrl">
1700
+ <lst name="defaults">
1701
+ <str name="spellcheck">true</str>
1702
+ <str name="spellcheck.dictionary">suggest</str>
1703
+ <str name="spellcheck.onlyMorePopular">true</str>
1704
+ <str name="spellcheck.count">5</str>
1705
+ <str name="spellcheck.collate">true</str>
1706
+ </lst>
1707
+ <arr name="components">
1708
+ <str>suggestUrl</str>
1709
+ </arr>
1710
+ </requestHandler>
1711
+
1712
+ <searchComponent class="solr.SpellCheckComponent" name="suggestFileFormat">
1713
+ <lst name="spellchecker">
1714
+ <str name="name">suggest</str>
1715
+ <str name="classname">org.apache.solr.spelling.suggest.Suggester</str>
1716
+ <str name="lookupImpl">org.apache.solr.spelling.suggest.tst.TSTLookupFactory</str>
1717
+ <!-- Alternatives to lookupImpl: org.apache.solr.spelling.suggest.fst.FSTLookupFactory
1718
+ [finite state automaton] org.apache.solr.spelling.suggest.fst.WFSTLookupFactory
1719
+ [weighted finite state automaton] org.apache.solr.spelling.suggest.jaspell.JaspellLookupFactory
1720
+ [default, jaspell-based] org.apache.solr.spelling.suggest.tst.TSTLookupFactory
1721
+ [ternary trees] -->
1722
+ <str name="field">content_type_ext</str> <!-- the indexed field to derive suggestions from -->
1723
+ <float name="threshold">0.005</float>
1724
+ <str name="buildOnCommit">true</str>
1725
+ <!-- <str name="sourceLocation">american-english</str> -->
1726
+ </lst>
1727
+ </searchComponent>
1728
+
1729
+ <requestHandler class="org.apache.solr.handler.component.SearchHandler" name="/suggestFileFormat">
1730
+ <lst name="defaults">
1731
+ <str name="spellcheck">true</str>
1732
+ <str name="spellcheck.dictionary">suggest</str>
1733
+ <str name="spellcheck.onlyMorePopular">true</str>
1734
+ <str name="spellcheck.count">5</str>
1735
+ <str name="spellcheck.collate">true</str>
1736
+ </lst>
1737
+ <arr name="components">
1738
+ <str>suggestFileFormat</str>
1739
+ </arr>
1740
+ </requestHandler>
1741
+
1742
+ <searchComponent class="solr.SpellCheckComponent" name="suggestLinksHosts">
1743
+ <lst name="spellchecker">
1744
+ <str name="name">suggest</str>
1745
+ <str name="classname">org.apache.solr.spelling.suggest.Suggester</str>
1746
+ <str name="lookupImpl">org.apache.solr.spelling.suggest.tst.TSTLookupFactory</str>
1747
+ <!-- Alternatives to lookupImpl: org.apache.solr.spelling.suggest.fst.FSTLookupFactory
1748
+ [finite state automaton] org.apache.solr.spelling.suggest.fst.WFSTLookupFactory
1749
+ [weighted finite state automaton] org.apache.solr.spelling.suggest.jaspell.JaspellLookupFactory
1750
+ [default, jaspell-based] org.apache.solr.spelling.suggest.tst.TSTLookupFactory
1751
+ [ternary trees] -->
1752
+ <str name="field">links_hosts</str> <!-- the indexed field to derive suggestions from -->
1753
+ <float name="threshold">0.005</float>
1754
+ <str name="buildOnCommit">true</str>
1755
+ <!-- <str name="sourceLocation">american-english</str> -->
1756
+ </lst>
1757
+ </searchComponent>
1758
+
1759
+ <requestHandler class="org.apache.solr.handler.component.SearchHandler" name="/suggestLinksHosts">
1760
+ <lst name="defaults">
1761
+ <str name="spellcheck">true</str>
1762
+ <str name="spellcheck.dictionary">suggest</str>
1763
+ <str name="spellcheck.onlyMorePopular">true</str>
1764
+ <str name="spellcheck.count">5</str>
1765
+ <str name="spellcheck.collate">true</str>
1766
+ </lst>
1767
+ <arr name="components">
1768
+ <str>suggestLinksHosts</str>
1769
+ </arr>
1770
+ </requestHandler>
1771
+
1772
+ <searchComponent class="solr.SpellCheckComponent" name="suggestLinksDomains">
1773
+ <lst name="spellchecker">
1774
+ <str name="name">suggest</str>
1775
+ <str name="classname">org.apache.solr.spelling.suggest.Suggester</str>
1776
+ <str name="lookupImpl">org.apache.solr.spelling.suggest.tst.TSTLookupFactory</str>
1777
+ <!-- Alternatives to lookupImpl: org.apache.solr.spelling.suggest.fst.FSTLookupFactory
1778
+ [finite state automaton] org.apache.solr.spelling.suggest.fst.WFSTLookupFactory
1779
+ [weighted finite state automaton] org.apache.solr.spelling.suggest.jaspell.JaspellLookupFactory
1780
+ [default, jaspell-based] org.apache.solr.spelling.suggest.tst.TSTLookupFactory
1781
+ [ternary trees] -->
1782
+ <str name="field">links_domains</str> <!-- the indexed field to derive suggestions from -->
1783
+ <float name="threshold">0.005</float>
1784
+ <str name="buildOnCommit">true</str>
1785
+ <!-- <str name="sourceLocation">american-english</str> -->
1786
+ </lst>
1787
+ </searchComponent>
1788
+
1789
+ <requestHandler class="org.apache.solr.handler.component.SearchHandler" name="/suggestLinksDomains">
1790
+ <lst name="defaults">
1791
+ <str name="spellcheck">true</str>
1792
+ <str name="spellcheck.dictionary">suggest</str>
1793
+ <str name="spellcheck.onlyMorePopular">true</str>
1794
+ <str name="spellcheck.count">5</str>
1795
+ <str name="spellcheck.collate">true</str>
1796
+ </lst>
1797
+ <arr name="components">
1798
+ <str>suggestLinksDomains</str>
1799
+ </arr>
1800
+ </requestHandler>
1801
+
1802
+ <searchComponent class="solr.SpellCheckComponent" name="suggestLinksPublicSuffixes">
1803
+ <lst name="spellchecker">
1804
+ <str name="name">suggest</str>
1805
+ <str name="classname">org.apache.solr.spelling.suggest.Suggester</str>
1806
+ <str name="lookupImpl">org.apache.solr.spelling.suggest.tst.TSTLookupFactory</str>
1807
+ <!-- Alternatives to lookupImpl: org.apache.solr.spelling.suggest.fst.FSTLookupFactory
1808
+ [finite state automaton] org.apache.solr.spelling.suggest.fst.WFSTLookupFactory
1809
+ [weighted finite state automaton] org.apache.solr.spelling.suggest.jaspell.JaspellLookupFactory
1810
+ [default, jaspell-based] org.apache.solr.spelling.suggest.tst.TSTLookupFactory
1811
+ [ternary trees] -->
1812
+ <str name="field">links_public_suffixes</str> <!-- the indexed field to derive suggestions from -->
1813
+ <float name="threshold">0.005</float>
1814
+ <str name="buildOnCommit">true</str>
1815
+ <!-- <str name="sourceLocation">american-english</str> -->
1816
+ </lst>
1817
+ </searchComponent>
1818
+
1819
+ <requestHandler class="org.apache.solr.handler.component.SearchHandler" name="/suggestLinksPublicSuffixes">
1820
+ <lst name="defaults">
1821
+ <str name="spellcheck">true</str>
1822
+ <str name="spellcheck.dictionary">suggest</str>
1823
+ <str name="spellcheck.onlyMorePopular">true</str>
1824
+ <str name="spellcheck.count">5</str>
1825
+ <str name="spellcheck.collate">true</str>
1826
+ </lst>
1827
+ <arr name="components">
1828
+ <str>suggestLinksPublicSuffixes</str>
1829
+ </arr>
1830
+ </requestHandler>
1831
+
1832
+ <searchComponent class="solr.SpellCheckComponent" name="suggestHost">
1833
+ <lst name="spellchecker">
1834
+ <str name="name">suggest</str>
1835
+ <str name="classname">org.apache.solr.spelling.suggest.Suggester</str>
1836
+ <str name="lookupImpl">org.apache.solr.spelling.suggest.tst.TSTLookupFactory</str>
1837
+ <!-- Alternatives to lookupImpl: org.apache.solr.spelling.suggest.fst.FSTLookupFactory
1838
+ [finite state automaton] org.apache.solr.spelling.suggest.fst.WFSTLookupFactory
1839
+ [weighted finite state automaton] org.apache.solr.spelling.suggest.jaspell.JaspellLookupFactory
1840
+ [default, jaspell-based] org.apache.solr.spelling.suggest.tst.TSTLookupFactory
1841
+ [ternary trees] -->
1842
+ <str name="field">host</str> <!-- the indexed field to derive suggestions from -->
1843
+ <float name="threshold">0.005</float>
1844
+ <str name="buildOnCommit">true</str>
1845
+ <!-- <str name="sourceLocation">american-english</str> -->
1846
+ </lst>
1847
+ </searchComponent>
1848
+
1849
+ <requestHandler class="org.apache.solr.handler.component.SearchHandler" name="/suggestHost">
1850
+ <lst name="defaults">
1851
+ <str name="spellcheck">true</str>
1852
+ <str name="spellcheck.dictionary">suggest</str>
1853
+ <str name="spellcheck.onlyMorePopular">true</str>
1854
+ <str name="spellcheck.count">5</str>
1855
+ <str name="spellcheck.collate">true</str>
1856
+ </lst>
1857
+ <arr name="components">
1858
+ <str>suggestHost</str>
1859
+ </arr>
1860
+ </requestHandler>
1861
+
1862
+ <searchComponent class="solr.SpellCheckComponent" name="suggestDomain">
1863
+ <lst name="spellchecker">
1864
+ <str name="name">suggest</str>
1865
+ <str name="classname">org.apache.solr.spelling.suggest.Suggester</str>
1866
+ <str name="lookupImpl">org.apache.solr.spelling.suggest.tst.TSTLookupFactory</str>
1867
+ <!-- Alternatives to lookupImpl: org.apache.solr.spelling.suggest.fst.FSTLookupFactory
1868
+ [finite state automaton] org.apache.solr.spelling.suggest.fst.WFSTLookupFactory
1869
+ [weighted finite state automaton] org.apache.solr.spelling.suggest.jaspell.JaspellLookupFactory
1870
+ [default, jaspell-based] org.apache.solr.spelling.suggest.tst.TSTLookupFactory
1871
+ [ternary trees] -->
1872
+ <str name="field">domain</str> <!-- the indexed field to derive suggestions from -->
1873
+ <float name="threshold">0.005</float>
1874
+ <str name="buildOnCommit">true</str>
1875
+ <!-- <str name="sourceLocation">american-english</str> -->
1876
+ </lst>
1877
+ </searchComponent>
1878
+
1879
+ <requestHandler class="org.apache.solr.handler.component.SearchHandler" name="/suggestDomain">
1880
+ <lst name="defaults">
1881
+ <str name="spellcheck">true</str>
1882
+ <str name="spellcheck.dictionary">suggest</str>
1883
+ <str name="spellcheck.onlyMorePopular">true</str>
1884
+ <str name="spellcheck.count">5</str>
1885
+ <str name="spellcheck.collate">true</str>
1886
+ </lst>
1887
+ <arr name="components">
1888
+ <str>suggestDomain</str>
1889
+ </arr>
1890
+ </requestHandler>
1891
+
1892
+ <searchComponent class="solr.SpellCheckComponent" name="suggestPublicSuffix">
1893
+ <lst name="spellchecker">
1894
+ <str name="name">suggest</str>
1895
+ <str name="classname">org.apache.solr.spelling.suggest.Suggester</str>
1896
+ <str name="lookupImpl">org.apache.solr.spelling.suggest.tst.TSTLookupFactory</str>
1897
+ <!-- Alternatives to lookupImpl: org.apache.solr.spelling.suggest.fst.FSTLookupFactory
1898
+ [finite state automaton] org.apache.solr.spelling.suggest.fst.WFSTLookupFactory
1899
+ [weighted finite state automaton] org.apache.solr.spelling.suggest.jaspell.JaspellLookupFactory
1900
+ [default, jaspell-based] org.apache.solr.spelling.suggest.tst.TSTLookupFactory
1901
+ [ternary trees] -->
1902
+ <str name="field">public_suffix</str> <!-- the indexed field to derive suggestions from -->
1903
+ <float name="threshold">0.005</float>
1904
+ <str name="buildOnCommit">true</str>
1905
+ <!-- <str name="sourceLocation">american-english</str> -->
1906
+ </lst>
1907
+ </searchComponent>
1908
+
1909
+ <requestHandler class="org.apache.solr.handler.component.SearchHandler" name="/suggestPublicSuffix">
1910
+ <lst name="defaults">
1911
+ <str name="spellcheck">true</str>
1912
+ <str name="spellcheck.dictionary">suggest</str>
1913
+ <str name="spellcheck.onlyMorePopular">true</str>
1914
+ <str name="spellcheck.count">5</str>
1915
+ <str name="spellcheck.collate">true</str>
1916
+ </lst>
1917
+ <arr name="components">
1918
+ <str>suggestPublicSuffix</str>
1919
+ </arr>
1920
+ </requestHandler>
1921
+
1922
+ <searchComponent class="solr.SpellCheckComponent" name="suggestAuthor">
1923
+ <lst name="spellchecker">
1924
+ <str name="name">suggest</str>
1925
+ <str name="classname">org.apache.solr.spelling.suggest.Suggester</str>
1926
+ <str name="lookupImpl">org.apache.solr.spelling.suggest.tst.TSTLookupFactory</str>
1927
+ <!-- Alternatives to lookupImpl: org.apache.solr.spelling.suggest.fst.FSTLookupFactory
1928
+ [finite state automaton] org.apache.solr.spelling.suggest.fst.WFSTLookupFactory
1929
+ [weighted finite state automaton] org.apache.solr.spelling.suggest.jaspell.JaspellLookupFactory
1930
+ [default, jaspell-based] org.apache.solr.spelling.suggest.tst.TSTLookupFactory
1931
+ [ternary trees] -->
1932
+ <str name="field">author</str> <!-- the indexed field to derive suggestions from -->
1933
+ <float name="threshold">0.005</float>
1934
+ <str name="buildOnCommit">true</str>
1935
+ <!-- <str name="sourceLocation">american-english</str> -->
1936
+ </lst>
1937
+ </searchComponent>
1938
+
1939
+ <requestHandler class="org.apache.solr.handler.component.SearchHandler" name="/suggestAuthor">
1940
+ <lst name="defaults">
1941
+ <str name="spellcheck">true</str>
1942
+ <str name="spellcheck.dictionary">suggest</str>
1943
+ <str name="spellcheck.onlyMorePopular">true</str>
1944
+ <str name="spellcheck.count">5</str>
1945
+ <str name="spellcheck.collate">true</str>
1946
+ </lst>
1947
+ <arr name="components">
1948
+ <str>suggestAuthor</str>
1949
+ </arr>
1950
+ </requestHandler>
1951
+
1952
+ <searchComponent class="solr.SpellCheckComponent" name="suggestCollection">
1953
+ <lst name="spellchecker">
1954
+ <str name="name">suggest</str>
1955
+ <str name="classname">org.apache.solr.spelling.suggest.Suggester</str>
1956
+ <str name="lookupImpl">org.apache.solr.spelling.suggest.tst.TSTLookupFactory</str>
1957
+ <!-- Alternatives to lookupImpl: org.apache.solr.spelling.suggest.fst.FSTLookupFactory
1958
+ [finite state automaton] org.apache.solr.spelling.suggest.fst.WFSTLookupFactory
1959
+ [weighted finite state automaton] org.apache.solr.spelling.suggest.jaspell.JaspellLookupFactory
1960
+ [default, jaspell-based] org.apache.solr.spelling.suggest.tst.TSTLookupFactory
1961
+ [ternary trees] -->
1962
+ <str name="field">collection</str> <!-- the indexed field to derive suggestions from -->
1963
+ <float name="threshold">0.005</float>
1964
+ <str name="buildOnCommit">true</str>
1965
+ <!-- <str name="sourceLocation">american-english</str> -->
1966
+ </lst>
1967
+ </searchComponent>
1968
+
1969
+ <requestHandler class="org.apache.solr.handler.component.SearchHandler" name="/suggestCollection">
1970
+ <lst name="defaults">
1971
+ <str name="spellcheck">true</str>
1972
+ <str name="spellcheck.dictionary">suggest</str>
1973
+ <str name="spellcheck.onlyMorePopular">true</str>
1974
+ <str name="spellcheck.count">5</str>
1975
+ <str name="spellcheck.collate">true</str>
1976
+ </lst>
1977
+ <arr name="components">
1978
+ <str>suggestCollection</str>
1979
+ </arr>
1980
+ </requestHandler>
1981
+
1982
+ <searchComponent class="solr.SpellCheckComponent" name="suggestCollections">
1983
+ <lst name="spellchecker">
1984
+ <str name="name">suggest</str>
1985
+ <str name="classname">org.apache.solr.spelling.suggest.Suggester</str>
1986
+ <str name="lookupImpl">org.apache.solr.spelling.suggest.tst.TSTLookupFactory</str>
1987
+ <!-- Alternatives to lookupImpl: org.apache.solr.spelling.suggest.fst.FSTLookupFactory
1988
+ [finite state automaton] org.apache.solr.spelling.suggest.fst.WFSTLookupFactory
1989
+ [weighted finite state automaton] org.apache.solr.spelling.suggest.jaspell.JaspellLookupFactory
1990
+ [default, jaspell-based] org.apache.solr.spelling.suggest.tst.TSTLookupFactory
1991
+ [ternary trees] -->
1992
+ <str name="field">collections</str> <!-- the indexed field to derive suggestions from -->
1993
+ <float name="threshold">0.005</float>
1994
+ <str name="buildOnCommit">true</str>
1995
+ <!-- <str name="sourceLocation">american-english</str> -->
1996
+ </lst>
1997
+ </searchComponent>
1998
+
1999
+ <requestHandler class="org.apache.solr.handler.component.SearchHandler" name="/suggestCollections">
2000
+ <lst name="defaults">
2001
+ <str name="spellcheck">true</str>
2002
+ <str name="spellcheck.dictionary">suggest</str>
2003
+ <str name="spellcheck.onlyMorePopular">true</str>
2004
+ <str name="spellcheck.count">5</str>
2005
+ <str name="spellcheck.collate">true</str>
2006
+ </lst>
2007
+ <arr name="components">
2008
+ <str>suggestCollections</str>
2009
+ </arr>
2010
+ </requestHandler>
2011
+ <!-- BL -->
2012
+
2013
+ <!-- Legacy config for the admin interface -->
2014
+ <admin>
2015
+ <defaultQuery>*:*</defaultQuery>
2016
+ </admin>
2017
+
225
2018
  </config>