geoblacklight-schema 0.2.0

Sign up to get free protection for your applications and to get access to all the features.
Files changed (57) hide show
  1. checksums.yaml +7 -0
  2. data/.gitignore +3 -0
  3. data/LICENSE +14 -0
  4. data/README.md +44 -0
  5. data/bin/fgdc2mods.rb +5 -0
  6. data/bin/mods2geoblacklight.rb +5 -0
  7. data/bin/xsltproc-saxon +14 -0
  8. data/conf/protwords.txt +21 -0
  9. data/conf/schema.xml +158 -0
  10. data/conf/solrconfig.xml +160 -0
  11. data/conf/stopwords_en.txt +34 -0
  12. data/conf/synonyms.txt +29 -0
  13. data/examples/Gemfile +4 -0
  14. data/examples/generate-example-doc.rb +42 -0
  15. data/examples/selected.json +5787 -0
  16. data/examples/upload-to-solr.rb +50 -0
  17. data/geoblacklight-schema.gemspec +23 -0
  18. data/lib/geoblacklight/gazetteer.csv +1011 -0
  19. data/lib/geoblacklight/gazetteer.rb +104 -0
  20. data/lib/xslt/arcgis_to_iso19110.xsl +364 -0
  21. data/lib/xslt/fgdc2mods.xsl +1007 -0
  22. data/lib/xslt/iso2mods.xsl +939 -0
  23. data/lib/xslt/mods2geoblacklight.xsl +268 -0
  24. data/lib/xslt/mods2ogp.xsl +195 -0
  25. data/tools/fgdc2html/Gemfile +2 -0
  26. data/tools/fgdc2html/fgdc2html.css +71 -0
  27. data/tools/fgdc2html/fgdc2html.js +6 -0
  28. data/tools/fgdc2html/fgdc2html.xsl +1034 -0
  29. data/tools/fgdc2html/render.rb +30 -0
  30. data/tools/iso2html/Gemfile +2 -0
  31. data/tools/iso2html/iso-html.xsl +1745 -0
  32. data/tools/iso2html/render.rb +24 -0
  33. data/tools/iso2html/utils/convert-enumerations.xsl +97 -0
  34. data/tools/iso2html/utils/convert-latlong.xsl +73 -0
  35. data/tools/iso2html/utils/decode-uri/base.css +408 -0
  36. data/tools/iso2html/utils/decode-uri/index.html +29 -0
  37. data/tools/iso2html/utils/elements-fgdc.xml +824 -0
  38. data/tools/iso2html/utils/elements-iso.xml +636 -0
  39. data/tools/iso2html/utils/printFormatted.xsl +267 -0
  40. data/tools/iso2html/utils/printTextLines.xsl +192 -0
  41. data/tools/iso2html/utils/replace-newlines.xsl +97 -0
  42. data/tools/iso2html/utils/replace-string.xsl +80 -0
  43. data/tools/iso2html/utils/strip-digits.xsl +60 -0
  44. data/tools/iso2html/utils/url-decode.xsl +87 -0
  45. data/tools/iso2html/utils/wrap-text.xsl +174 -0
  46. data/tools/ogp/0_download.rb +96 -0
  47. data/tools/ogp/1_validate.rb +225 -0
  48. data/tools/ogp/2_transform.rb +438 -0
  49. data/tools/ogp/3_stanford.rb +35 -0
  50. data/tools/ogp/4_select.rb +189 -0
  51. data/tools/ogp/5_ingest.rb +55 -0
  52. data/tools/ogp/Gemfile +2 -0
  53. data/tools/solr/Gemfile +3 -0
  54. data/tools/solr/purge.rb +33 -0
  55. data/tools/solr/upload.rb +35 -0
  56. data/vendor/.keep +0 -0
  57. metadata +131 -0
@@ -0,0 +1,7 @@
1
+ ---
2
+ SHA1:
3
+ metadata.gz: 9ff360f9e0d93b2b8973cb0b7a698a83ed7df395
4
+ data.tar.gz: 214fe068e10569e722f8659815216dd4829f45a3
5
+ SHA512:
6
+ metadata.gz: de1dde11f1a3f1f622d1bc7a84c1f863a244e14cd7a055c012cb0f5d2b97ba447132dc01763988f6fca1fb7a35bd9df74697017806fa8fc9ad6b844693b37020
7
+ data.tar.gz: bd45f44fe4f4bf18c1e8372ad53ad9414204be49f4cb0844b8421575c072e9ce69e4d76babc9f0a18bc8bd9bbece2a645c2b77b1e9dc2da178696071f6ddaa4a
@@ -0,0 +1,3 @@
1
+ Gemfile.lock
2
+ data
3
+ vendor/*.jar
data/LICENSE ADDED
@@ -0,0 +1,14 @@
1
+ Copyright (c) 2014 by The Board of Trustees of the Leland Stanford
2
+ Junior University. All rights reserved.
3
+
4
+ Licensed under the Apache License, Version 2.0 (the "License"); you
5
+ may not use this file except in compliance with the License. You
6
+ may obtain a copy of the License at
7
+
8
+ http://www.apache.org/licenses/LICENSE-2.0
9
+
10
+ Unless required by applicable law or agreed to in writing, software
11
+ distributed under the License is distributed on an "AS IS" BASIS,
12
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
13
+ implied. See the License for the specific language governing
14
+ permissions and limitations under the License.
@@ -0,0 +1,44 @@
1
+ #### Introduction
2
+
3
+ This schema focuses on discovery use cases for patrons and analysts in a
4
+ research library setting, although it is likely useful in other settings. Text
5
+ search, faceted search and refinement, and spatial search and relevancy are
6
+ among the primary features that the schema enables. The schema design supports
7
+ a variety of discovery applications and GIS data types. We especially wanted to
8
+ provide for contextual collection-oriented discovery applications as well as
9
+ traditional portal applications.
10
+
11
+ The source code for the Solr implementation and the design document are on
12
+ Github:
13
+
14
+ http://github.com/geoblacklight/geoblacklight-schema
15
+
16
+ The conf/ folder has everything you need to implement the schema in Solr 4.7,
17
+ and the examples/ folder has 100 example Solr documents that you can use. The
18
+ lib/ folder has some initial, but incomplete, implementations for metadata
19
+ format conversions (e.g., FGDC -> MODS, OGP -> GeoBlacklight, etc.).
20
+
21
+ #### Example
22
+
23
+ The `examples` folder has some Solr documents that uses this schema. First,
24
+ install the schema into a Solr 4 instance, then upload the documents.
25
+
26
+ ```bash
27
+ % cd examples
28
+ % ruby upload-to-solr.rb your-collection-name http://localhost:8080/solr
29
+ ```
30
+
31
+ ## Requirements
32
+
33
+ * Saxon-HE v9, the Home Edition from http://saxon.sourceforge.net installed as
34
+ `vendor/saxon9he.jar`
35
+
36
+ # Schema for GeoBlacklight
37
+
38
+ Please refer to http://journal.code4lib.org/articles/9710 which describes the schema in detail.
39
+
40
+ * Hardy, D., K. Durante. 2014. A Metadata Schema for Geospatial Resource Discovery Use Cases. _code4lib_ 25.
41
+
42
+ Abstract: We introduce a metadata schema that focuses on GIS discovery use cases for patrons in a research library setting. Text search, faceted refinement, and spatial search and relevancy are among GeoBlacklight’s primary use cases for federated geospatial holdings. The schema supports a variety of GIS data types and enables contextual, collection-oriented discovery applications as well as traditional portal applications. One key limitation of GIS resource discovery is the general lack of normative metadata practices, which has led to a proliferation of metadata schemas and duplicate records. The ISO 19115/19139 and FGDC standards specify metadata formats, but are intricate, lengthy, and not focused on discovery. Moreover, they require sophisticated authoring environments and cataloging expertise. Geographic metadata standards target preservation and quality measure use cases, but they do not provide for simple inter-institutional sharing of metadata for discovery use cases. To this end, our schema reuses elements from Dublin Core and GeoRSS to leverage their normative semantics, community best practices, open-source software implementations, and extensive examples already deployed in discovery contexts such as web search and mapping. Finally, we discuss a Solr implementation of the schema using a “geo” extension to MODS.
43
+
44
+
@@ -0,0 +1,5 @@
1
+ #!/usr/bin/env ruby
2
+
3
+ cmd = "bin/xsltproc-saxon lib/xslt/fgdc2mods.xsl #{ARGV[0]}"
4
+ # puts cmd
5
+ system cmd
@@ -0,0 +1,5 @@
1
+ #!/usr/bin/env ruby
2
+
3
+ cmd = "bin/xsltproc-saxon lib/xslt/mods2geoblacklight.xsl #{ARGV[0]}"
4
+ # puts cmd
5
+ system cmd
@@ -0,0 +1,14 @@
1
+ #!/bin/bash
2
+ #
3
+ # Usage: xsltproc-saxon stylesheet.xsl input.xml [output.xml [flags or params]]
4
+ #
5
+ # See http://saxonica.com/documentation/html/using-xsl/commandline.html
6
+ #
7
+ s=$1; shift
8
+ i=$1; shift
9
+ o=$1; shift
10
+ if [ -n "$o" ]; then
11
+ o="-o:$o"
12
+ fi
13
+
14
+ java -jar ../vendor/saxon9he.jar "-s:$i" "-xsl:$s" $o $*
@@ -0,0 +1,21 @@
1
+ # The ASF licenses this file to You under the Apache License, Version 2.0
2
+ # (the "License"); you may not use this file except in compliance with
3
+ # the License. You may obtain a copy of the License at
4
+ #
5
+ # http://www.apache.org/licenses/LICENSE-2.0
6
+ #
7
+ # Unless required by applicable law or agreed to in writing, software
8
+ # distributed under the License is distributed on an "AS IS" BASIS,
9
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
10
+ # See the License for the specific language governing permissions and
11
+ # limitations under the License.
12
+
13
+ #-----------------------------------------------------------------------
14
+ # Use a protected word file to protect against the stemmer reducing two
15
+ # unrelated words to the same base word.
16
+
17
+ # Some non-words that normally won't be encountered,
18
+ # just to test that they won't be stemmed.
19
+ dontstems
20
+ zwhacky
21
+
@@ -0,0 +1,158 @@
1
+ <?xml version="1.0" encoding="UTF-8"?>
2
+ <schema name="geoblacklight-schema" version="1.5">
3
+ <uniqueKey>uuid</uniqueKey>
4
+ <fields>
5
+ <field name="_version_" type="long" stored="true" indexed="true"/>
6
+ <field name="timestamp" type="date" stored="true" indexed="true" default="NOW"/>
7
+ <field name="uuid" type="string" stored="true" indexed="true" required="true"/>
8
+
9
+ <!-- core generated fields -->
10
+ <field name="text" type="text_en" stored="false" indexed="true" multiValued="true"
11
+ termVectors="true" termPositions="true" termOffsets="true" />
12
+
13
+ <!-- dynamic field with simple types by suffix -->
14
+ <dynamicField name="*_b" type="boolean" stored="true" indexed="true"/>
15
+ <dynamicField name="*_d" type="double" stored="true" indexed="true"/>
16
+ <dynamicField name="*_dt" type="date" stored="true" indexed="true"/>
17
+ <dynamicField name="*_f" type="float" stored="true" indexed="true"/>
18
+ <dynamicField name="*_i" type="int" stored="true" indexed="true"/>
19
+ <dynamicField name="*_l" type="long" stored="true" indexed="true"/>
20
+ <dynamicField name="*_s" type="string" stored="true" indexed="true"/>
21
+ <dynamicField name="*_ss" type="string" stored="true" indexed="false"/>
22
+ <dynamicField name="*_si" type="string" stored="false" indexed="true"/>
23
+ <dynamicField name="*_sim" type="string" stored="false" indexed="true" multiValued="true" />
24
+ <dynamicField name="*_sm" type="string" stored="true" indexed="true" multiValued="true" />
25
+ <dynamicField name="*_url" type="string" stored="true" indexed="false"/>
26
+ <dynamicField name="*_blob" type="binary" stored="true" indexed="false"/>
27
+
28
+ <!-- dynamic Text fields by suffix without storage -->
29
+ <dynamicField name="*_t" type="text_en" stored="false" indexed="true"
30
+ termVectors="true" termPositions="true" termOffsets="true"/>
31
+ <dynamicField name="*_tm" type="text_en" stored="false" indexed="true" multiValued="true"
32
+ termVectors="true" termPositions="true" termOffsets="true"/>
33
+ <dynamicField name="*_ti" type="text_en" stored="false" indexed="true"
34
+ termVectors="true" termPositions="true" termOffsets="true"/>
35
+ <dynamicField name="*_tmi" type="text_en" stored="false" indexed="true" multiValued="true"
36
+ termVectors="true" termPositions="true" termOffsets="true"/>
37
+ <dynamicField name="*_sort" type="text_sort" stored="false" indexed="true" multiValued="false"/>
38
+
39
+ <!-- Spatial field types:
40
+
41
+ Solr3:
42
+ <field name="my_pt">83.1,-117.312</field>
43
+ as (y,x)
44
+
45
+ Solr4:
46
+
47
+ <field name="my_bbox">-117.312 83.1 -115.39 84.31</field>
48
+ as (W S E N)
49
+
50
+ <field name="my_geom">ENVELOPE(-117.312, -115.39, 84.31, 83.1)</field>
51
+ as (W E N S)
52
+
53
+ <field name="my_jts">POLYGON((1 8, 1 9, 2 9, 2 8, 1 8))</field>
54
+ as WKT for point, linestring, polygon
55
+
56
+ -->
57
+ <dynamicField name="*_pt" type="location" stored="true" indexed="true"/>
58
+ <dynamicField name="*_bbox" type="location_rpt" stored="true" indexed="true"/>
59
+ <dynamicField name="*_geom" type="location_rpt" stored="true" indexed="true"/>
60
+ <!-- <dynamicField name="*_jts" type="location_jts" stored="true" indexed="true"/> -->
61
+ </fields>
62
+
63
+ <types>
64
+ <fieldType name="string" class="solr.StrField" sortMissingLast="true" />
65
+ <fieldType name="boolean" class="solr.BoolField" sortMissingLast="true"/>
66
+
67
+ <fieldType name="int" class="solr.TrieIntField" precisionStep="8" positionIncrementGap="0"/>
68
+ <fieldType name="float" class="solr.TrieFloatField" precisionStep="8" positionIncrementGap="0"/>
69
+ <fieldType name="long" class="solr.TrieLongField" precisionStep="8" positionIncrementGap="0"/>
70
+ <fieldType name="double" class="solr.TrieDoubleField" precisionStep="8" positionIncrementGap="0"/>
71
+
72
+ <!-- The format for this date field is of the form 1995-12-31T23:59:59Z.
73
+ The trailing "Z" designates UTC time and is mandatory.
74
+ A Trie based date field for faster date range queries and date faceting. -->
75
+ <fieldType name="date" class="solr.TrieDateField" precisionStep="6" positionIncrementGap="0"/>
76
+
77
+ <!--Binary data type. The data should be sent/retrieved in as Base64 encoded Strings -->
78
+ <fieldtype name="binary" class="solr.BinaryField"/>
79
+
80
+ <!-- A text field with defaults appropriate for English: it
81
+ tokenizes with StandardTokenizer, removes English stop words
82
+ (lang/stopwords_en.txt), down cases, protects words from protwords.txt, and
83
+ finally applies Porter's stemming. The query time analyzer
84
+ also applies synonyms from synonyms.txt. -->
85
+ <fieldType name="text_en" class="solr.TextField" positionIncrementGap="100">
86
+ <analyzer type="index">
87
+ <tokenizer class="solr.StandardTokenizerFactory"/>
88
+ <filter class="solr.StopFilterFactory" ignoreCase="true" words="stopwords_en.txt"/>
89
+ <filter class="solr.LowerCaseFilterFactory"/>
90
+ <filter class="solr.EnglishPossessiveFilterFactory"/>
91
+ <filter class="solr.KeywordMarkerFilterFactory" protected="protwords.txt"/>
92
+ <filter class="solr.PorterStemFilterFactory"/>
93
+ </analyzer>
94
+ <analyzer type="query">
95
+ <tokenizer class="solr.StandardTokenizerFactory"/>
96
+ <filter class="solr.SynonymFilterFactory" synonyms="synonyms.txt" ignoreCase="true" expand="true"/>
97
+ <filter class="solr.StopFilterFactory" ignoreCase="true" words="stopwords_en.txt"/>
98
+ <filter class="solr.LowerCaseFilterFactory"/>
99
+ <filter class="solr.EnglishPossessiveFilterFactory"/>
100
+ <filter class="solr.KeywordMarkerFilterFactory" protected="protwords.txt"/>
101
+ <filter class="solr.PorterStemFilterFactory"/>
102
+ </analyzer>
103
+ </fieldType>
104
+
105
+ <!-- for alpha sorting as a single token -->
106
+ <fieldType name="text_sort" class="solr.TextField" sortMissingLast="true" omitNorms="true">
107
+ <analyzer>
108
+ <tokenizer class="solr.KeywordTokenizerFactory"/>
109
+ <filter class="solr.LowerCaseFilterFactory" />
110
+ <filter class="solr.TrimFilterFactory" />
111
+ <filter class="solr.PatternReplaceFilterFactory" pattern="([^a-z0-9 ])" replacement="" replace="all"/>
112
+ </analyzer>
113
+ </fieldType>
114
+
115
+ <!-- Spatial field types -->
116
+ <fieldType name="location" class="solr.LatLonType" subFieldSuffix="_d"/>
117
+
118
+ <fieldType name="location_rpt" class="solr.SpatialRecursivePrefixTreeFieldType"
119
+ distErrPct="0.025"
120
+ maxDistErr="0.000009"
121
+ units="degrees"
122
+ />
123
+
124
+ <!-- JTS-enabled spatial predicates; requires JTS installation -->
125
+ <!-- <fieldType name="location_jts" class="solr.SpatialRecursivePrefixTreeFieldType"
126
+ spatialContextFactory="com.spatial4j.core.context.jts.JtsSpatialContextFactory"
127
+ distErrPct="0.025"
128
+ maxDistErr="0.000009"
129
+ units="degrees"
130
+ /> -->
131
+ </types>
132
+
133
+ <!-- for scoring formula -->
134
+ <copyField source="dct_spatial_sm" dest="dct_spatial_tmi" maxChars="10000"/>
135
+ <copyField source="dct_temporal_sm" dest="dct_temporal_tmi" maxChars="10000"/>
136
+ <copyField source="dc_creator_sm" dest="dc_creator_tmi" maxChars="1000"/>
137
+ <copyField source="dc_description_s" dest="dc_description_ti" maxChars="10000"/>
138
+ <copyField source="dc_format_s" dest="dc_format_ti" maxChars="100"/>
139
+ <copyField source="dc_identifier_s" dest="dc_identifier_ti" maxChars="100"/>
140
+ <copyField source="dc_publisher_s" dest="dc_publisher_ti" maxChars="1000"/>
141
+ <copyField source="dc_rights_s" dest="dc_rights_ti" maxChars="100"/>
142
+ <copyField source="dct_provenance_s" dest="dct_provenance_ti" maxChars="1000"/>
143
+ <copyField source="dc_subject_sm" dest="dc_subject_tmi" maxChars="10000"/>
144
+ <copyField source="dc_title_s" dest="dc_title_ti" maxChars="1000"/>
145
+ <copyField source="dct_isPartOf_sm" dest="dct_isPartOf_tmi" maxChars="1000"/>
146
+ <copyField source="layer_geom_type_s" dest="layer_geom_type_ti" maxChars="100"/>
147
+ <copyField source="layer_slug_s" dest="layer_slug_ti" maxChars="100"/>
148
+
149
+ <!-- core text search -->
150
+ <copyField source="*_ti" dest="text" />
151
+ <copyField source="*_tmi" dest="text" />
152
+
153
+ <!-- for sorting text fields -->
154
+ <copyField source="dct_provenance_s" dest="dct_provenance_sort"/>
155
+ <copyField source="dc_publisher_s" dest="dc_publisher_sort"/>
156
+ <copyField source="dc_title_s" dest="dc_title_sort"/>
157
+
158
+ </schema>
@@ -0,0 +1,160 @@
1
+ <?xml version="1.0" encoding="UTF-8"?>
2
+ <!--
3
+ Licensed to the Apache Software Foundation (ASF) under one or more
4
+ contributor license agreements. See the NOTICE file distributed with
5
+ this work for additional information regarding copyright ownership.
6
+ The ASF licenses this file to You under the Apache License, Version 2.0
7
+ (the "License"); you may not use this file except in compliance with
8
+ the License. You may obtain a copy of the License at
9
+
10
+ http://www.apache.org/licenses/LICENSE-2.0
11
+
12
+ Unless required by applicable law or agreed to in writing, software
13
+ distributed under the License is distributed on an "AS IS" BASIS,
14
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
15
+ See the License for the specific language governing permissions and
16
+ limitations under the License.
17
+ -->
18
+ <!--
19
+ For more details about configurations options that may appear in
20
+ this file, see http://wiki.apache.org/solr/SolrConfigXml.
21
+ -->
22
+ <config>
23
+ <luceneMatchVersion>4.7</luceneMatchVersion>
24
+ <dataDir>${solr.data.dir:}</dataDir>
25
+ <directoryFactory name="DirectoryFactory" class="${solr.directoryFactory:solr.NRTCachingDirectoryFactory}"/>
26
+ <codecFactory class="solr.SchemaCodecFactory"/>
27
+ <schemaFactory class="ClassicIndexSchemaFactory"/>
28
+ <indexConfig>
29
+ <lockType>${solr.lock.type:native}</lockType>
30
+ </indexConfig>
31
+
32
+ <!-- The default high-performance update handler -->
33
+ <updateHandler class="solr.DirectUpdateHandler2">
34
+ <updateLog>
35
+ <str name="dir">${solr.ulog.dir:}</str>
36
+ </updateLog>
37
+ <autoCommit>
38
+ <maxTime>15000</maxTime>
39
+ <openSearcher>false</openSearcher>
40
+ </autoCommit>
41
+ </updateHandler>
42
+
43
+ <!-- realtime get handler, guaranteed to return the latest stored fields
44
+ of any document, without the need to commit or open a new searcher. The current
45
+ implementation relies on the updateLog feature being enabled. -->
46
+ <requestHandler name="/get" class="solr.RealTimeGetHandler">
47
+ <lst name="defaults">
48
+ <str name="omitHeader">true</str>
49
+ </lst>
50
+ </requestHandler>
51
+
52
+ <requestHandler name="/replication" class="solr.ReplicationHandler" startup="lazy" />
53
+
54
+ <!-- ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
55
+ Query section - these settings control query time things like caches
56
+ ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ -->
57
+ <query>
58
+ <maxBooleanClauses>1024</maxBooleanClauses>
59
+ <filterCache class="solr.FastLRUCache" size="512" initialSize="512" autowarmCount="0"/>
60
+ <queryResultCache class="solr.LRUCache" size="512" initialSize="512" autowarmCount="0"/>
61
+ <documentCache class="solr.LRUCache" size="512" initialSize="512" autowarmCount="0"/>
62
+ <enableLazyFieldLoading>true</enableLazyFieldLoading>
63
+ <queryResultWindowSize>20</queryResultWindowSize>
64
+ <queryResultMaxDocsCached>200</queryResultMaxDocsCached>
65
+ <listener event="newSearcher" class="solr.QuerySenderListener">
66
+ <arr name="queries">
67
+ <lst><str name="q">stanford</str></lst>
68
+ <lst><str name="q">polygon</str></lst>
69
+ </arr>
70
+ </listener>
71
+ <listener event="firstSearcher" class="solr.QuerySenderListener">
72
+ <arr name="queries">
73
+ <lst>
74
+ <str name="q">static firstSearcher warming in solrconfig.xml</str>
75
+ </lst>
76
+ </arr>
77
+ </listener>
78
+ <useColdSearcher>false</useColdSearcher>
79
+ <maxWarmingSearchers>2</maxWarmingSearchers>
80
+ </query>
81
+
82
+ <requestDispatcher handleSelect="false">
83
+ <requestParsers enableRemoteStreaming="true" multipartUploadLimitInKB="2048000" formdataUploadLimitInKB="2048"/>
84
+ <httpCaching never304="true"/>
85
+ </requestDispatcher>
86
+
87
+ <requestHandler name="/search" class="solr.SearchHandler"/>
88
+
89
+ <requestHandler name="/select" class="solr.SearchHandler">
90
+ <lst name="defaults">
91
+ <int name="start">0</int>
92
+ <int name="rows">10</int>
93
+ <str name="wt">json</str>
94
+ <int name="indent">2</int>
95
+ <str name="defType">edismax</str>
96
+ <str name="echoParams">all</str>
97
+ <str name="fl">*,score</str>
98
+ <str name="sort">score desc, dc_title_sort asc</str>
99
+ <str name="q.alt">*:*</str>
100
+ <str name="qf">
101
+ text^1
102
+ dc_description_ti^2
103
+ dc_creator_tmi^3
104
+ dc_publisher_ti^3
105
+ dct_isPartOf_tmi^4
106
+ dc_subject_tmi^5
107
+ dct_spatial_tmi^5
108
+ dct_temporal_tmi^5
109
+ dc_title_ti^6
110
+ dc_rights_ti^7
111
+ dct_provenance_ti^8
112
+ layer_geom_type_ti^9
113
+ layer_slug_ti^10
114
+ dc_identifier_ti^10
115
+ </str>
116
+ <bool name="facet">true</bool>
117
+ <int name="facet.mincount">1</int>
118
+ <int name="facet.limit">10</int>
119
+ <str name="facet.field">dct_isPartOf_sm</str>
120
+ <str name="facet.field">dct_provenance_s</str>
121
+ <str name="facet.field">dct_spatial_sm</str>
122
+ <str name="facet.field">dc_creator_sm</str>
123
+ <str name="facet.field">dc_format_s</str>
124
+ <str name="facet.field">dc_language_s</str>
125
+ <str name="facet.field">dc_publisher_s</str>
126
+ <str name="facet.field">dc_rights_s</str>
127
+ <str name="facet.field">dc_subject_sm</str>
128
+ <str name="facet.field">layer_geom_type_s</str>
129
+ <str name="facet.field">solr_year_i</str>
130
+ </lst>
131
+ </requestHandler>
132
+
133
+ <requestHandler name="/update" class="solr.UpdateRequestHandler"/>
134
+ <requestHandler name="/admin/" class="solr.admin.AdminHandlers"/>
135
+
136
+ <!-- ping/healthcheck -->
137
+ <requestHandler name="/admin/ping" class="solr.PingRequestHandler">
138
+ <lst name="invariants">
139
+ <str name="q">solrpingquery</str>
140
+ </lst>
141
+ <lst name="defaults">
142
+ <str name="echoParams">all</str>
143
+ </lst>
144
+ <!-- An optional feature of the PingRequestHandler is to configure the
145
+ handler with a "healthcheckFile" which can be used to enable/disable
146
+ the PingRequestHandler.
147
+ relative paths are resolved against the data dir
148
+ -->
149
+ <str name="healthcheckFile">server-enabled.txt</str>
150
+ </requestHandler>
151
+
152
+ <requestHandler name="/analysis/field"
153
+ startup="lazy"
154
+ class="solr.FieldAnalysisRequestHandler" />
155
+
156
+ <!-- Legacy config for the admin interface -->
157
+ <admin>
158
+ <defaultQuery>*:*</defaultQuery>
159
+ </admin>
160
+ </config>
@@ -0,0 +1,34 @@
1
+ # Standard english stop words taken from Lucene's StopAnalyzer
2
+ a
3
+ an
4
+ and
5
+ are
6
+ as
7
+ at
8
+ be
9
+ but
10
+ by
11
+ for
12
+ if
13
+ in
14
+ into
15
+ is
16
+ it
17
+ no
18
+ not
19
+ of
20
+ on
21
+ or
22
+ such
23
+ that
24
+ the
25
+ their
26
+ then
27
+ there
28
+ these
29
+ they
30
+ this
31
+ to
32
+ was
33
+ will
34
+ with