exhibits_solr_conf 0.0.4 → 0.0.5

Sign up to get free protection for your applications and to get access to all the features.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  SHA1:
3
- metadata.gz: 6337dd6836fbc0642a72a9ff44b4cb71c9a48f44
4
- data.tar.gz: cdaf04b4c6df1837f134fe7f6d5e054c650aa4b0
3
+ metadata.gz: 0c7734c926440e3f699e3fb7915583a3e8c1361c
4
+ data.tar.gz: 0c607b6fbc7c3bf27acae92ea79fb68d797edf0c
5
5
  SHA512:
6
- metadata.gz: 5c401f6625e5199b6ca090d5f19d82354ac81ef9799530bded3372e9a330fe9f6f17bf8b1faf782a3a8e4b491e0a1c1c8fdaf1969bf972587aeebde8736f890a
7
- data.tar.gz: 414d25ae01c3d15f19bef2adc3a2d4a665056bb96e570c5ca2ac381810b256de8b658514e0385bec79b68bc4fdb953b6f5e5f5915c0258b7b6f0619e782ef0e3
6
+ metadata.gz: 124f53f6dc327f40268013d68d6ff2a0ee4a304dd662495cfc8a2ff06bb6b67568150bd892cbfd19db14b6f6dd72876bd1a7328a5fdf8fdfc0591570e2013c93
7
+ data.tar.gz: c3d3e7b938387081b892697dcedf5bbd536116323d91ce0cf1077d69ff9854caf407314a241894461d31cdf7919ce61c8e47130bdcc1d1c7c049a2eaacd01492
@@ -1,3 +1,3 @@
1
1
  module ExhibitsSolrConf
2
- VERSION = '0.0.4'
2
+ VERSION = '0.0.5'
3
3
  end
@@ -1,5 +1,5 @@
1
1
  <?xml version="1.0" encoding="UTF-8" ?>
2
- <schema name="Stanford Searchworks" version="1.5">
2
+ <schema name="Stanford Exhibits based on SearchWorks" version="1.5">
3
3
  <uniqueKey>id</uniqueKey>
4
4
 
5
5
  <fields>
@@ -12,7 +12,7 @@
12
12
  <field name="last_updated" type="date" indexed="true" stored="true" default="NOW/SECOND" />
13
13
  <!-- entire marc bib record -->
14
14
  <field name="marcxml" type="string" indexed="false" stored="true" />
15
- <!-- all_search: catch-all field for searchable text; stored for hit highlighting />-->
15
+ <!-- all_search: catch-all field for metadata text; stored for hit highlighting -->
16
16
  <field name="all_search" type="text" indexed="true" stored="true" termVectors="true" termPositions="true" termOffsets="true" multiValued="true" />
17
17
  <field name="all_unstem_search" type="textNoStem" indexed="true" stored="true" multiValued="true" />
18
18
  <field name="vern_all_search" type="text" indexed="true" stored="true" multiValued="true" />
@@ -235,8 +235,6 @@
235
235
  <dynamicField name="*_facet" type="string" stored="true" indexed="true" multiValued="true" />
236
236
  <dynamicField name="*_display" type="string" stored="true" indexed="false" multiValued="true"/>
237
237
  -->
238
- <dynamicField name="*_si" type="string" stored="true" indexed="true" omitNorms="true" />
239
- <dynamicField name="*_sim" type="string" stored="true" indexed="true" multiValued="true" omitNorms="true" />
240
238
  <dynamicField name="*_ss" type="string" stored="true" indexed="false" omitNorms="true" />
241
239
  <dynamicField name="*_ssm" type="string" stored="true" indexed="false" multiValued="true" omitNorms="true" />
242
240
  <dynamicField name="*_ssi" type="string" stored="true" indexed="true" omitNorms="true" />
@@ -247,11 +245,18 @@
247
245
  <dynamicField name="*_xml" type="string" stored="true" indexed="false" omitNorms="true" />
248
246
  <dynamicField name="cjk_*" type="text_cjk" stored="true" indexed="true" multiValued="true" />
249
247
  <dynamicField name="*_hsim" type="string_hierarch" stored="true" indexed="true" multiValued="true" />
248
+
249
+ <!-- exhibits fields -->
250
+ <field name="full_text_search" type="text" indexed="true" stored="true" termVectors="true" termPositions="true" termOffsets="true" multiValued="true" />
251
+ <field name="full_text_unstem_search" type="textNoStem" indexed="true" stored="true" multiValued="true" />
252
+ <!-- NOTE: *_tesim fields are copied into all_search which is meant for metadata, not full text. Use _tesimv for full text -->
250
253
  <dynamicField name="*_tesim" type="text" stored="true" indexed="true" multiValued="true" omitNorms="true" />
254
+ <!-- NOTE: *_tesimv fields are copied into full_text_search which is meant for full text, not metadata. Use _tesim for metadata -->
255
+ <dynamicField name="*_tesimv" type="text" stored="true" indexed="true" multiValued="true" termVectors="true" termPositions="true" termOffsets="true"/>
251
256
  <dynamicField name="*_bsi" type="boolean" stored="true" indexed="true" multiValued="true" omitNorms="true" />
252
257
  <dynamicField name="*_ng" type="text_en_ng" stored="false" indexed="true" multiValued="true"/>
253
- <dynamicField name="*_pt" type="location" stored="true" indexed="true"/>
254
- <dynamicField name="*_bbox" type="location_rpt" stored="true" indexed="true" multiValued="true"/>
258
+ <dynamicField name="*_pt" type="location" stored="true" indexed="true"/>
259
+ <dynamicField name="*_bbox" type="location_rpt" stored="true" indexed="true" multiValued="true"/>
255
260
  </fields>
256
261
 
257
262
  <!-- copy fields -->
@@ -324,11 +329,15 @@
324
329
  <copyField source="vern_summary_search" dest="cjk_summary_search" />
325
330
  <copyField source="vern_all_search" dest="cjk_all_search" />
326
331
 
327
- <!-- Spotlight fields -->
332
+ <!-- exhibits fields -->
328
333
  <copyField source="id" dest="id_ng" maxChars="3000"/>
329
334
  <copyField source="title_full_display" dest="full_title_ng" maxChars="3000"/>
335
+ <!-- NOTE: all_search is meant for metadata -->
330
336
  <copyField source="*_tesim" dest="all_search" />
331
337
  <copyField source="*_tesim" dest="all_unstem_search" />
338
+ <!-- NOTE: full_text_search is meant for full text -->
339
+ <copyField source="*_tesimv" dest="full_text_search" />
340
+ <copyField source="*_tesimv" dest="full_text_unstem_search" /> <!-- copyFields do not chain, so copy from the original *_tesimv source rather than from full_text_search -->
332
341
 
333
342
  <types>
334
343
  <fieldType name="string" class="solr.StrField" sortMissingLast="true" />
@@ -479,7 +488,9 @@
479
488
  </fieldType>
480
489
 
481
490
 
482
- <!-- A text field with defaults appropriate for English an NGrams -->
491
+ <!-- exhibits fieldTypes below -->
492
+
493
+ <!-- A text field with defaults appropriate for English and NGrams -->
483
494
  <fieldType name="text_en_ng" class="solr.TextField" positionIncrementGap="100">
484
495
  <analyzer type="index">
485
496
  <tokenizer class="solr.ICUTokenizerFactory"/>
@@ -490,12 +501,10 @@
490
501
  <filter class="solr.TrimFilterFactory"/>
491
502
  <filter class="solr.EdgeNGramFilterFactory" minGramSize="3" maxGramSize="15" />
492
503
  </analyzer>
493
-
494
- <analyzer type="index">
504
+ <analyzer type="query">
495
505
  <tokenizer class="solr.ICUTokenizerFactory"/>
496
- <filter class="solr.ICUFoldingFilterFactory"/> <!-- NFKC, case folding, diacritics removed -->
506
+ <filter class="solr.ICUFoldingFilterFactory"/>
497
507
  <filter class="solr.EnglishPossessiveFilterFactory"/>
498
- <!-- EnglishMinimalStemFilterFactory is less aggressive than PorterStemFilterFactory: -->
499
508
  <filter class="solr.EnglishMinimalStemFilterFactory"/>
500
509
  <filter class="solr.TrimFilterFactory"/>
501
510
  </analyzer>
@@ -503,7 +512,7 @@
503
512
 
504
513
  <!-- This point type indexes the coordinates as separate fields (subFields)
505
514
  If subFieldType is defined, it references a type, and a dynamic field
506
- definition is created matching *___<typename>. Alternately, if
515
+ definition is created matching *___<typename>. Alternately, if
507
516
  subFieldSuffix is defined, that is used to create the subFields.
508
517
  Example: if subFieldType="double", then the coordinates would be
509
518
  indexed in fields myloc_0___double,myloc_1___double.
@@ -513,10 +522,10 @@
513
522
  users normally should not need to know about them.
514
523
  -->
515
524
  <fieldType name="point" class="solr.PointType" dimension="2" subFieldSuffix="_d"/>
516
-
525
+
517
526
  <!-- A specialized field for geospatial search. If indexed, this fieldType must not be multivalued. -->
518
527
  <fieldType name="location" class="solr.LatLonType" subFieldSuffix="_coordinate"/>
519
-
528
+
520
529
  <!-- An alternative geospatial field type new to Solr 4. It supports multiValued and polygon shapes.
521
530
  For more information about this and other Spatial fields new to Solr 4, see:
522
531
  http://wiki.apache.org/solr/SolrAdaptersForLuceneSpatial4
@@ -107,6 +107,8 @@
107
107
  collection_search
108
108
  all_unstem_search^5
109
109
  all_search vern_all_search
110
+ full_text_unstem_search^2.5
111
+ full_text_search^0.5
110
112
  </str>
111
113
  <str name="pf"> <!-- (phrase boost within result set) -->
112
114
  title_245a_exact_search^5000
@@ -161,6 +163,8 @@
161
163
  collection_search^5
162
164
  all_unstem_search^25
163
165
  all_search^5 vern_all_search^5
166
+ full_text_unstem_search^12.5
167
+ full_text_search^2.5
164
168
  </str>
165
169
  <str name="pf3"> <!-- (token trigrams boost within result set) -->
166
170
  title_245a_search^1500 vern_title_245a_search^1500
@@ -190,6 +194,7 @@
190
194
  award_search^3
191
195
  collection_search^3
192
196
  all_search^3 vern_all_search^3
197
+ full_text_search^1.5
193
198
  </str>
194
199
  <str name="pf2"> <!--(token bigrams boost within result set) -->
195
200
  title_245a_search^1000 vern_title_245a_search^1000
@@ -219,6 +224,7 @@
219
224
  award_search^2
220
225
  collection_search^2
221
226
  all_search^2 vern_all_search^2
227
+ full_text_search
222
228
  </str>
223
229
 
224
230
  <str name="qf_cjk">
@@ -757,7 +763,7 @@
757
763
  <str name="facet.field">topic_facet</str>
758
764
 
759
765
  <!-- Highlighting defaults -->
760
- <str name="hl.fl">all_search</str>
766
+ <str name="hl.fl">all_search full_text_search</str>
761
767
 
762
768
  <str name="fl">
763
769
  score,
metadata CHANGED
@@ -1,14 +1,14 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: exhibits_solr_conf
3
3
  version: !ruby/object:Gem::Version
4
- version: 0.0.4
4
+ version: 0.0.5
5
5
  platform: ruby
6
6
  authors:
7
7
  - Naomi Dushay
8
8
  autorequire:
9
9
  bindir: exe
10
10
  cert_chain: []
11
- date: 2015-11-12 00:00:00.000000000 Z
11
+ date: 2015-11-13 00:00:00.000000000 Z
12
12
  dependencies:
13
13
  - !ruby/object:Gem::Dependency
14
14
  name: bundler