geoblacklight-schema 0.2.0
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +7 -0
- data/.gitignore +3 -0
- data/LICENSE +14 -0
- data/README.md +44 -0
- data/bin/fgdc2mods.rb +5 -0
- data/bin/mods2geoblacklight.rb +5 -0
- data/bin/xsltproc-saxon +14 -0
- data/conf/protwords.txt +21 -0
- data/conf/schema.xml +158 -0
- data/conf/solrconfig.xml +160 -0
- data/conf/stopwords_en.txt +34 -0
- data/conf/synonyms.txt +29 -0
- data/examples/Gemfile +4 -0
- data/examples/generate-example-doc.rb +42 -0
- data/examples/selected.json +5787 -0
- data/examples/upload-to-solr.rb +50 -0
- data/geoblacklight-schema.gemspec +23 -0
- data/lib/geoblacklight/gazetteer.csv +1011 -0
- data/lib/geoblacklight/gazetteer.rb +104 -0
- data/lib/xslt/arcgis_to_iso19110.xsl +364 -0
- data/lib/xslt/fgdc2mods.xsl +1007 -0
- data/lib/xslt/iso2mods.xsl +939 -0
- data/lib/xslt/mods2geoblacklight.xsl +268 -0
- data/lib/xslt/mods2ogp.xsl +195 -0
- data/tools/fgdc2html/Gemfile +2 -0
- data/tools/fgdc2html/fgdc2html.css +71 -0
- data/tools/fgdc2html/fgdc2html.js +6 -0
- data/tools/fgdc2html/fgdc2html.xsl +1034 -0
- data/tools/fgdc2html/render.rb +30 -0
- data/tools/iso2html/Gemfile +2 -0
- data/tools/iso2html/iso-html.xsl +1745 -0
- data/tools/iso2html/render.rb +24 -0
- data/tools/iso2html/utils/convert-enumerations.xsl +97 -0
- data/tools/iso2html/utils/convert-latlong.xsl +73 -0
- data/tools/iso2html/utils/decode-uri/base.css +408 -0
- data/tools/iso2html/utils/decode-uri/index.html +29 -0
- data/tools/iso2html/utils/elements-fgdc.xml +824 -0
- data/tools/iso2html/utils/elements-iso.xml +636 -0
- data/tools/iso2html/utils/printFormatted.xsl +267 -0
- data/tools/iso2html/utils/printTextLines.xsl +192 -0
- data/tools/iso2html/utils/replace-newlines.xsl +97 -0
- data/tools/iso2html/utils/replace-string.xsl +80 -0
- data/tools/iso2html/utils/strip-digits.xsl +60 -0
- data/tools/iso2html/utils/url-decode.xsl +87 -0
- data/tools/iso2html/utils/wrap-text.xsl +174 -0
- data/tools/ogp/0_download.rb +96 -0
- data/tools/ogp/1_validate.rb +225 -0
- data/tools/ogp/2_transform.rb +438 -0
- data/tools/ogp/3_stanford.rb +35 -0
- data/tools/ogp/4_select.rb +189 -0
- data/tools/ogp/5_ingest.rb +55 -0
- data/tools/ogp/Gemfile +2 -0
- data/tools/solr/Gemfile +3 -0
- data/tools/solr/purge.rb +33 -0
- data/tools/solr/upload.rb +35 -0
- data/vendor/.keep +0 -0
- metadata +131 -0
checksums.yaml
ADDED
@@ -0,0 +1,7 @@
|
|
1
|
+
---
|
2
|
+
SHA1:
|
3
|
+
metadata.gz: 9ff360f9e0d93b2b8973cb0b7a698a83ed7df395
|
4
|
+
data.tar.gz: 214fe068e10569e722f8659815216dd4829f45a3
|
5
|
+
SHA512:
|
6
|
+
metadata.gz: de1dde11f1a3f1f622d1bc7a84c1f863a244e14cd7a055c012cb0f5d2b97ba447132dc01763988f6fca1fb7a35bd9df74697017806fa8fc9ad6b844693b37020
|
7
|
+
data.tar.gz: bd45f44fe4f4bf18c1e8372ad53ad9414204be49f4cb0844b8421575c072e9ce69e4d76babc9f0a18bc8bd9bbece2a645c2b77b1e9dc2da178696071f6ddaa4a
|
data/.gitignore
ADDED
data/LICENSE
ADDED
@@ -0,0 +1,14 @@
|
|
1
|
+
Copyright (c) 2014 by The Board of Trustees of the Leland Stanford
|
2
|
+
Junior University. All rights reserved.
|
3
|
+
|
4
|
+
Licensed under the Apache License, Version 2.0 (the "License"); you
|
5
|
+
may not use this file except in compliance with the License. You
|
6
|
+
may obtain a copy of the License at
|
7
|
+
|
8
|
+
http://www.apache.org/licenses/LICENSE-2.0
|
9
|
+
|
10
|
+
Unless required by applicable law or agreed to in writing, software
|
11
|
+
distributed under the License is distributed on an "AS IS" BASIS,
|
12
|
+
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
|
13
|
+
implied. See the License for the specific language governing
|
14
|
+
permissions and limitations under the License.
|
data/README.md
ADDED
@@ -0,0 +1,44 @@
|
|
1
|
+
#### Introduction
|
2
|
+
|
3
|
+
This schema focuses on discovery use cases for patrons and analysts in a
|
4
|
+
research library setting, although it is likely useful in other settings. Text
|
5
|
+
search, faceted search and refinement, and spatial search and relevancy are
|
6
|
+
among the primary features that the schema enables. The schema design supports
|
7
|
+
a variety of discovery applications and GIS data types. We especially wanted to
|
8
|
+
provide for contextual collection-oriented discovery applications as well as
|
9
|
+
traditional portal applications.
|
10
|
+
|
11
|
+
The source code for the Solr implementation and the design document are on
|
12
|
+
Github:
|
13
|
+
|
14
|
+
http://github.com/geoblacklight/geoblacklight-schema
|
15
|
+
|
16
|
+
The conf/ folder has everything you need to implement the schema in Solr 4.7,
|
17
|
+
and the examples/ folder has 100 example Solr documents that you can use. The
|
18
|
+
lib/ folder has some initial, but incomplete, implementations for metadata
|
19
|
+
format conversions (e.g., FGDC -> MODS, OGP -> GeoBlacklight, etc.).
|
20
|
+
|
21
|
+
#### Example
|
22
|
+
|
23
|
+
The `examples` folder has some Solr documents that uses this schema. First,
|
24
|
+
install the schema into a Solr 4 instance, then upload the documents.
|
25
|
+
|
26
|
+
```bash
|
27
|
+
% cd examples
|
28
|
+
% ruby upload-to-solr.rb your-collection-name http://localhost:8080/solr
|
29
|
+
```
|
30
|
+
|
31
|
+
## Requirements
|
32
|
+
|
33
|
+
* Saxon-HE v9, the Home Edition from http://saxon.sourceforge.net installed as
|
34
|
+
`vendor/saxon9he.jar`
|
35
|
+
|
36
|
+
# Schema for GeoBlacklight
|
37
|
+
|
38
|
+
Please refer to http://journal.code4lib.org/articles/9710 which describes the schema in detail.
|
39
|
+
|
40
|
+
* Hardy, D., K. Durante. 2014. A Metadata Schema for Geospatial Resource Discovery Use Cases. _code4lib_ 25.
|
41
|
+
|
42
|
+
Abstract: We introduce a metadata schema that focuses on GIS discovery use cases for patrons in a research library setting. Text search, faceted refinement, and spatial search and relevancy are among GeoBlacklight’s primary use cases for federated geospatial holdings. The schema supports a variety of GIS data types and enables contextual, collection-oriented discovery applications as well as traditional portal applications. One key limitation of GIS resource discovery is the general lack of normative metadata practices, which has led to a proliferation of metadata schemas and duplicate records. The ISO 19115/19139 and FGDC standards specify metadata formats, but are intricate, lengthy, and not focused on discovery. Moreover, they require sophisticated authoring environments and cataloging expertise. Geographic metadata standards target preservation and quality measure use cases, but they do not provide for simple inter-institutional sharing of metadata for discovery use cases. To this end, our schema reuses elements from Dublin Core and GeoRSS to leverage their normative semantics, community best practices, open-source software implementations, and extensive examples already deployed in discovery contexts such as web search and mapping. Finally, we discuss a Solr implementation of the schema using a “geo” extension to MODS.
|
43
|
+
|
44
|
+
|
data/bin/fgdc2mods.rb
ADDED
data/bin/xsltproc-saxon
ADDED
@@ -0,0 +1,14 @@
|
|
1
|
+
#!/bin/bash
|
2
|
+
#
|
3
|
+
# Usage: xsltproc-saxon stylesheet.xsl input.xml [output.xml [flags or params]]
|
4
|
+
#
|
5
|
+
# See http://saxonica.com/documentation/html/using-xsl/commandline.html
|
6
|
+
#
|
7
|
+
s=$1; shift
|
8
|
+
i=$1; shift
|
9
|
+
o=$1; shift
|
10
|
+
if [ -n "$o" ]; then
|
11
|
+
o="-o:$o"
|
12
|
+
fi
|
13
|
+
|
14
|
+
java -jar ../vendor/saxon9he.jar "-s:$i" "-xsl:$s" $o $*
|
data/conf/protwords.txt
ADDED
@@ -0,0 +1,21 @@
|
|
1
|
+
# The ASF licenses this file to You under the Apache License, Version 2.0
|
2
|
+
# (the "License"); you may not use this file except in compliance with
|
3
|
+
# the License. You may obtain a copy of the License at
|
4
|
+
#
|
5
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
6
|
+
#
|
7
|
+
# Unless required by applicable law or agreed to in writing, software
|
8
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
9
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
10
|
+
# See the License for the specific language governing permissions and
|
11
|
+
# limitations under the License.
|
12
|
+
|
13
|
+
#-----------------------------------------------------------------------
|
14
|
+
# Use a protected word file to protect against the stemmer reducing two
|
15
|
+
# unrelated words to the same base word.
|
16
|
+
|
17
|
+
# Some non-words that normally won't be encountered,
|
18
|
+
# just to test that they won't be stemmed.
|
19
|
+
dontstems
|
20
|
+
zwhacky
|
21
|
+
|
data/conf/schema.xml
ADDED
@@ -0,0 +1,158 @@
|
|
1
|
+
<?xml version="1.0" encoding="UTF-8"?>
|
2
|
+
<schema name="geoblacklight-schema" version="1.5">
|
3
|
+
<uniqueKey>uuid</uniqueKey>
|
4
|
+
<fields>
|
5
|
+
<field name="_version_" type="long" stored="true" indexed="true"/>
|
6
|
+
<field name="timestamp" type="date" stored="true" indexed="true" default="NOW"/>
|
7
|
+
<field name="uuid" type="string" stored="true" indexed="true" required="true"/>
|
8
|
+
|
9
|
+
<!-- core generated fields -->
|
10
|
+
<field name="text" type="text_en" stored="false" indexed="true" multiValued="true"
|
11
|
+
termVectors="true" termPositions="true" termOffsets="true" />
|
12
|
+
|
13
|
+
<!-- dynamic field with simple types by suffix -->
|
14
|
+
<dynamicField name="*_b" type="boolean" stored="true" indexed="true"/>
|
15
|
+
<dynamicField name="*_d" type="double" stored="true" indexed="true"/>
|
16
|
+
<dynamicField name="*_dt" type="date" stored="true" indexed="true"/>
|
17
|
+
<dynamicField name="*_f" type="float" stored="true" indexed="true"/>
|
18
|
+
<dynamicField name="*_i" type="int" stored="true" indexed="true"/>
|
19
|
+
<dynamicField name="*_l" type="long" stored="true" indexed="true"/>
|
20
|
+
<dynamicField name="*_s" type="string" stored="true" indexed="true"/>
|
21
|
+
<dynamicField name="*_ss" type="string" stored="true" indexed="false"/>
|
22
|
+
<dynamicField name="*_si" type="string" stored="false" indexed="true"/>
|
23
|
+
<dynamicField name="*_sim" type="string" stored="false" indexed="true" multiValued="true" />
|
24
|
+
<dynamicField name="*_sm" type="string" stored="true" indexed="true" multiValued="true" />
|
25
|
+
<dynamicField name="*_url" type="string" stored="true" indexed="false"/>
|
26
|
+
<dynamicField name="*_blob" type="binary" stored="true" indexed="false"/>
|
27
|
+
|
28
|
+
<!-- dynamic Text fields by suffix without storage -->
|
29
|
+
<dynamicField name="*_t" type="text_en" stored="false" indexed="true"
|
30
|
+
termVectors="true" termPositions="true" termOffsets="true"/>
|
31
|
+
<dynamicField name="*_tm" type="text_en" stored="false" indexed="true" multiValued="true"
|
32
|
+
termVectors="true" termPositions="true" termOffsets="true"/>
|
33
|
+
<dynamicField name="*_ti" type="text_en" stored="false" indexed="true"
|
34
|
+
termVectors="true" termPositions="true" termOffsets="true"/>
|
35
|
+
<dynamicField name="*_tmi" type="text_en" stored="false" indexed="true" multiValued="true"
|
36
|
+
termVectors="true" termPositions="true" termOffsets="true"/>
|
37
|
+
<dynamicField name="*_sort" type="text_sort" stored="false" indexed="true" multiValued="false"/>
|
38
|
+
|
39
|
+
<!-- Spatial field types:
|
40
|
+
|
41
|
+
Solr3:
|
42
|
+
<field name="my_pt">83.1,-117.312</field>
|
43
|
+
as (y,x)
|
44
|
+
|
45
|
+
Solr4:
|
46
|
+
|
47
|
+
<field name="my_bbox">-117.312 83.1 -115.39 84.31</field>
|
48
|
+
as (W S E N)
|
49
|
+
|
50
|
+
<field name="my_geom">ENVELOPE(-117.312, -115.39, 84.31, 83.1)</field>
|
51
|
+
as (W E N S)
|
52
|
+
|
53
|
+
<field name="my_jts">POLYGON((1 8, 1 9, 2 9, 2 8, 1 8))</field>
|
54
|
+
as WKT for point, linestring, polygon
|
55
|
+
|
56
|
+
-->
|
57
|
+
<dynamicField name="*_pt" type="location" stored="true" indexed="true"/>
|
58
|
+
<dynamicField name="*_bbox" type="location_rpt" stored="true" indexed="true"/>
|
59
|
+
<dynamicField name="*_geom" type="location_rpt" stored="true" indexed="true"/>
|
60
|
+
<!-- <dynamicField name="*_jts" type="location_jts" stored="true" indexed="true"/> -->
|
61
|
+
</fields>
|
62
|
+
|
63
|
+
<types>
|
64
|
+
<fieldType name="string" class="solr.StrField" sortMissingLast="true" />
|
65
|
+
<fieldType name="boolean" class="solr.BoolField" sortMissingLast="true"/>
|
66
|
+
|
67
|
+
<fieldType name="int" class="solr.TrieIntField" precisionStep="8" positionIncrementGap="0"/>
|
68
|
+
<fieldType name="float" class="solr.TrieFloatField" precisionStep="8" positionIncrementGap="0"/>
|
69
|
+
<fieldType name="long" class="solr.TrieLongField" precisionStep="8" positionIncrementGap="0"/>
|
70
|
+
<fieldType name="double" class="solr.TrieDoubleField" precisionStep="8" positionIncrementGap="0"/>
|
71
|
+
|
72
|
+
<!-- The format for this date field is of the form 1995-12-31T23:59:59Z.
|
73
|
+
The trailing "Z" designates UTC time and is mandatory.
|
74
|
+
A Trie based date field for faster date range queries and date faceting. -->
|
75
|
+
<fieldType name="date" class="solr.TrieDateField" precisionStep="6" positionIncrementGap="0"/>
|
76
|
+
|
77
|
+
<!--Binary data type. The data should be sent/retrieved in as Base64 encoded Strings -->
|
78
|
+
<fieldtype name="binary" class="solr.BinaryField"/>
|
79
|
+
|
80
|
+
<!-- A text field with defaults appropriate for English: it
|
81
|
+
tokenizes with StandardTokenizer, removes English stop words
|
82
|
+
(lang/stopwords_en.txt), down cases, protects words from protwords.txt, and
|
83
|
+
finally applies Porter's stemming. The query time analyzer
|
84
|
+
also applies synonyms from synonyms.txt. -->
|
85
|
+
<fieldType name="text_en" class="solr.TextField" positionIncrementGap="100">
|
86
|
+
<analyzer type="index">
|
87
|
+
<tokenizer class="solr.StandardTokenizerFactory"/>
|
88
|
+
<filter class="solr.StopFilterFactory" ignoreCase="true" words="stopwords_en.txt"/>
|
89
|
+
<filter class="solr.LowerCaseFilterFactory"/>
|
90
|
+
<filter class="solr.EnglishPossessiveFilterFactory"/>
|
91
|
+
<filter class="solr.KeywordMarkerFilterFactory" protected="protwords.txt"/>
|
92
|
+
<filter class="solr.PorterStemFilterFactory"/>
|
93
|
+
</analyzer>
|
94
|
+
<analyzer type="query">
|
95
|
+
<tokenizer class="solr.StandardTokenizerFactory"/>
|
96
|
+
<filter class="solr.SynonymFilterFactory" synonyms="synonyms.txt" ignoreCase="true" expand="true"/>
|
97
|
+
<filter class="solr.StopFilterFactory" ignoreCase="true" words="stopwords_en.txt"/>
|
98
|
+
<filter class="solr.LowerCaseFilterFactory"/>
|
99
|
+
<filter class="solr.EnglishPossessiveFilterFactory"/>
|
100
|
+
<filter class="solr.KeywordMarkerFilterFactory" protected="protwords.txt"/>
|
101
|
+
<filter class="solr.PorterStemFilterFactory"/>
|
102
|
+
</analyzer>
|
103
|
+
</fieldType>
|
104
|
+
|
105
|
+
<!-- for alpha sorting as a single token -->
|
106
|
+
<fieldType name="text_sort" class="solr.TextField" sortMissingLast="true" omitNorms="true">
|
107
|
+
<analyzer>
|
108
|
+
<tokenizer class="solr.KeywordTokenizerFactory"/>
|
109
|
+
<filter class="solr.LowerCaseFilterFactory" />
|
110
|
+
<filter class="solr.TrimFilterFactory" />
|
111
|
+
<filter class="solr.PatternReplaceFilterFactory" pattern="([^a-z0-9 ])" replacement="" replace="all"/>
|
112
|
+
</analyzer>
|
113
|
+
</fieldType>
|
114
|
+
|
115
|
+
<!-- Spatial field types -->
|
116
|
+
<fieldType name="location" class="solr.LatLonType" subFieldSuffix="_d"/>
|
117
|
+
|
118
|
+
<fieldType name="location_rpt" class="solr.SpatialRecursivePrefixTreeFieldType"
|
119
|
+
distErrPct="0.025"
|
120
|
+
maxDistErr="0.000009"
|
121
|
+
units="degrees"
|
122
|
+
/>
|
123
|
+
|
124
|
+
<!-- JTS-enabled spatial predicates; requires JTS installation -->
|
125
|
+
<!-- <fieldType name="location_jts" class="solr.SpatialRecursivePrefixTreeFieldType"
|
126
|
+
spatialContextFactory="com.spatial4j.core.context.jts.JtsSpatialContextFactory"
|
127
|
+
distErrPct="0.025"
|
128
|
+
maxDistErr="0.000009"
|
129
|
+
units="degrees"
|
130
|
+
/> -->
|
131
|
+
</types>
|
132
|
+
|
133
|
+
<!-- for scoring formula -->
|
134
|
+
<copyField source="dct_spatial_sm" dest="dct_spatial_tmi" maxChars="10000"/>
|
135
|
+
<copyField source="dct_temporal_sm" dest="dct_temporal_tmi" maxChars="10000"/>
|
136
|
+
<copyField source="dc_creator_sm" dest="dc_creator_tmi" maxChars="1000"/>
|
137
|
+
<copyField source="dc_description_s" dest="dc_description_ti" maxChars="10000"/>
|
138
|
+
<copyField source="dc_format_s" dest="dc_format_ti" maxChars="100"/>
|
139
|
+
<copyField source="dc_identifier_s" dest="dc_identifier_ti" maxChars="100"/>
|
140
|
+
<copyField source="dc_publisher_s" dest="dc_publisher_ti" maxChars="1000"/>
|
141
|
+
<copyField source="dc_rights_s" dest="dc_rights_ti" maxChars="100"/>
|
142
|
+
<copyField source="dct_provenance_s" dest="dct_provenance_ti" maxChars="1000"/>
|
143
|
+
<copyField source="dc_subject_sm" dest="dc_subject_tmi" maxChars="10000"/>
|
144
|
+
<copyField source="dc_title_s" dest="dc_title_ti" maxChars="1000"/>
|
145
|
+
<copyField source="dct_isPartOf_sm" dest="dct_isPartOf_tmi" maxChars="1000"/>
|
146
|
+
<copyField source="layer_geom_type_s" dest="layer_geom_type_ti" maxChars="100"/>
|
147
|
+
<copyField source="layer_slug_s" dest="layer_slug_ti" maxChars="100"/>
|
148
|
+
|
149
|
+
<!-- core text search -->
|
150
|
+
<copyField source="*_ti" dest="text" />
|
151
|
+
<copyField source="*_tmi" dest="text" />
|
152
|
+
|
153
|
+
<!-- for sorting text fields -->
|
154
|
+
<copyField source="dct_provenance_s" dest="dct_provenance_sort"/>
|
155
|
+
<copyField source="dc_publisher_s" dest="dc_publisher_sort"/>
|
156
|
+
<copyField source="dc_title_s" dest="dc_title_sort"/>
|
157
|
+
|
158
|
+
</schema>
|
data/conf/solrconfig.xml
ADDED
@@ -0,0 +1,160 @@
|
|
1
|
+
<?xml version="1.0" encoding="UTF-8"?>
|
2
|
+
<!--
|
3
|
+
Licensed to the Apache Software Foundation (ASF) under one or more
|
4
|
+
contributor license agreements. See the NOTICE file distributed with
|
5
|
+
this work for additional information regarding copyright ownership.
|
6
|
+
The ASF licenses this file to You under the Apache License, Version 2.0
|
7
|
+
(the "License"); you may not use this file except in compliance with
|
8
|
+
the License. You may obtain a copy of the License at
|
9
|
+
|
10
|
+
http://www.apache.org/licenses/LICENSE-2.0
|
11
|
+
|
12
|
+
Unless required by applicable law or agreed to in writing, software
|
13
|
+
distributed under the License is distributed on an "AS IS" BASIS,
|
14
|
+
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
15
|
+
See the License for the specific language governing permissions and
|
16
|
+
limitations under the License.
|
17
|
+
-->
|
18
|
+
<!--
|
19
|
+
For more details about configurations options that may appear in
|
20
|
+
this file, see http://wiki.apache.org/solr/SolrConfigXml.
|
21
|
+
-->
|
22
|
+
<config>
|
23
|
+
<luceneMatchVersion>4.7</luceneMatchVersion>
|
24
|
+
<dataDir>${solr.data.dir:}</dataDir>
|
25
|
+
<directoryFactory name="DirectoryFactory" class="${solr.directoryFactory:solr.NRTCachingDirectoryFactory}"/>
|
26
|
+
<codecFactory class="solr.SchemaCodecFactory"/>
|
27
|
+
<schemaFactory class="ClassicIndexSchemaFactory"/>
|
28
|
+
<indexConfig>
|
29
|
+
<lockType>${solr.lock.type:native}</lockType>
|
30
|
+
</indexConfig>
|
31
|
+
|
32
|
+
<!-- The default high-performance update handler -->
|
33
|
+
<updateHandler class="solr.DirectUpdateHandler2">
|
34
|
+
<updateLog>
|
35
|
+
<str name="dir">${solr.ulog.dir:}</str>
|
36
|
+
</updateLog>
|
37
|
+
<autoCommit>
|
38
|
+
<maxTime>15000</maxTime>
|
39
|
+
<openSearcher>false</openSearcher>
|
40
|
+
</autoCommit>
|
41
|
+
</updateHandler>
|
42
|
+
|
43
|
+
<!-- realtime get handler, guaranteed to return the latest stored fields
|
44
|
+
of any document, without the need to commit or open a new searcher. The current
|
45
|
+
implementation relies on the updateLog feature being enabled. -->
|
46
|
+
<requestHandler name="/get" class="solr.RealTimeGetHandler">
|
47
|
+
<lst name="defaults">
|
48
|
+
<str name="omitHeader">true</str>
|
49
|
+
</lst>
|
50
|
+
</requestHandler>
|
51
|
+
|
52
|
+
<requestHandler name="/replication" class="solr.ReplicationHandler" startup="lazy" />
|
53
|
+
|
54
|
+
<!-- ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
|
55
|
+
Query section - these settings control query time things like caches
|
56
|
+
~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ -->
|
57
|
+
<query>
|
58
|
+
<maxBooleanClauses>1024</maxBooleanClauses>
|
59
|
+
<filterCache class="solr.FastLRUCache" size="512" initialSize="512" autowarmCount="0"/>
|
60
|
+
<queryResultCache class="solr.LRUCache" size="512" initialSize="512" autowarmCount="0"/>
|
61
|
+
<documentCache class="solr.LRUCache" size="512" initialSize="512" autowarmCount="0"/>
|
62
|
+
<enableLazyFieldLoading>true</enableLazyFieldLoading>
|
63
|
+
<queryResultWindowSize>20</queryResultWindowSize>
|
64
|
+
<queryResultMaxDocsCached>200</queryResultMaxDocsCached>
|
65
|
+
<listener event="newSearcher" class="solr.QuerySenderListener">
|
66
|
+
<arr name="queries">
|
67
|
+
<lst><str name="q">stanford</str></lst>
|
68
|
+
<lst><str name="q">polygon</str></lst>
|
69
|
+
</arr>
|
70
|
+
</listener>
|
71
|
+
<listener event="firstSearcher" class="solr.QuerySenderListener">
|
72
|
+
<arr name="queries">
|
73
|
+
<lst>
|
74
|
+
<str name="q">static firstSearcher warming in solrconfig.xml</str>
|
75
|
+
</lst>
|
76
|
+
</arr>
|
77
|
+
</listener>
|
78
|
+
<useColdSearcher>false</useColdSearcher>
|
79
|
+
<maxWarmingSearchers>2</maxWarmingSearchers>
|
80
|
+
</query>
|
81
|
+
|
82
|
+
<requestDispatcher handleSelect="false">
|
83
|
+
<requestParsers enableRemoteStreaming="true" multipartUploadLimitInKB="2048000" formdataUploadLimitInKB="2048"/>
|
84
|
+
<httpCaching never304="true"/>
|
85
|
+
</requestDispatcher>
|
86
|
+
|
87
|
+
<requestHandler name="/search" class="solr.SearchHandler"/>
|
88
|
+
|
89
|
+
<requestHandler name="/select" class="solr.SearchHandler">
|
90
|
+
<lst name="defaults">
|
91
|
+
<int name="start">0</int>
|
92
|
+
<int name="rows">10</int>
|
93
|
+
<str name="wt">json</str>
|
94
|
+
<int name="indent">2</int>
|
95
|
+
<str name="defType">edismax</str>
|
96
|
+
<str name="echoParams">all</str>
|
97
|
+
<str name="fl">*,score</str>
|
98
|
+
<str name="sort">score desc, dc_title_sort asc</str>
|
99
|
+
<str name="q.alt">*:*</str>
|
100
|
+
<str name="qf">
|
101
|
+
text^1
|
102
|
+
dc_description_ti^2
|
103
|
+
dc_creator_tmi^3
|
104
|
+
dc_publisher_ti^3
|
105
|
+
dct_isPartOf_tmi^4
|
106
|
+
dc_subject_tmi^5
|
107
|
+
dct_spatial_tmi^5
|
108
|
+
dct_temporal_tmi^5
|
109
|
+
dc_title_ti^6
|
110
|
+
dc_rights_ti^7
|
111
|
+
dct_provenance_ti^8
|
112
|
+
layer_geom_type_ti^9
|
113
|
+
layer_slug_ti^10
|
114
|
+
dc_identifier_ti^10
|
115
|
+
</str>
|
116
|
+
<bool name="facet">true</bool>
|
117
|
+
<int name="facet.mincount">1</int>
|
118
|
+
<int name="facet.limit">10</int>
|
119
|
+
<str name="facet.field">dct_isPartOf_sm</str>
|
120
|
+
<str name="facet.field">dct_provenance_s</str>
|
121
|
+
<str name="facet.field">dct_spatial_sm</str>
|
122
|
+
<str name="facet.field">dc_creator_sm</str>
|
123
|
+
<str name="facet.field">dc_format_s</str>
|
124
|
+
<str name="facet.field">dc_language_s</str>
|
125
|
+
<str name="facet.field">dc_publisher_s</str>
|
126
|
+
<str name="facet.field">dc_rights_s</str>
|
127
|
+
<str name="facet.field">dc_subject_sm</str>
|
128
|
+
<str name="facet.field">layer_geom_type_s</str>
|
129
|
+
<str name="facet.field">solr_year_i</str>
|
130
|
+
</lst>
|
131
|
+
</requestHandler>
|
132
|
+
|
133
|
+
<requestHandler name="/update" class="solr.UpdateRequestHandler"/>
|
134
|
+
<requestHandler name="/admin/" class="solr.admin.AdminHandlers"/>
|
135
|
+
|
136
|
+
<!-- ping/healthcheck -->
|
137
|
+
<requestHandler name="/admin/ping" class="solr.PingRequestHandler">
|
138
|
+
<lst name="invariants">
|
139
|
+
<str name="q">solrpingquery</str>
|
140
|
+
</lst>
|
141
|
+
<lst name="defaults">
|
142
|
+
<str name="echoParams">all</str>
|
143
|
+
</lst>
|
144
|
+
<!-- An optional feature of the PingRequestHandler is to configure the
|
145
|
+
handler with a "healthcheckFile" which can be used to enable/disable
|
146
|
+
the PingRequestHandler.
|
147
|
+
relative paths are resolved against the data dir
|
148
|
+
-->
|
149
|
+
<str name="healthcheckFile">server-enabled.txt</str>
|
150
|
+
</requestHandler>
|
151
|
+
|
152
|
+
<requestHandler name="/analysis/field"
|
153
|
+
startup="lazy"
|
154
|
+
class="solr.FieldAnalysisRequestHandler" />
|
155
|
+
|
156
|
+
<!-- Legacy config for the admin interface -->
|
157
|
+
<admin>
|
158
|
+
<defaultQuery>*:*</defaultQuery>
|
159
|
+
</admin>
|
160
|
+
</config>
|
@@ -0,0 +1,34 @@
|
|
1
|
+
# Standard english stop words taken from Lucene's StopAnalyzer
|
2
|
+
a
|
3
|
+
an
|
4
|
+
and
|
5
|
+
are
|
6
|
+
as
|
7
|
+
at
|
8
|
+
be
|
9
|
+
but
|
10
|
+
by
|
11
|
+
for
|
12
|
+
if
|
13
|
+
in
|
14
|
+
into
|
15
|
+
is
|
16
|
+
it
|
17
|
+
no
|
18
|
+
not
|
19
|
+
of
|
20
|
+
on
|
21
|
+
or
|
22
|
+
such
|
23
|
+
that
|
24
|
+
the
|
25
|
+
their
|
26
|
+
then
|
27
|
+
there
|
28
|
+
these
|
29
|
+
they
|
30
|
+
this
|
31
|
+
to
|
32
|
+
was
|
33
|
+
will
|
34
|
+
with
|