enju_ndl 0.3.0 → 0.3.1

Sign up to get free protection for your applications and to get access to all the features.
Files changed (121) hide show
  1. checksums.yaml +5 -5
  2. data/app/models/ndl_book.rb +9 -1
  3. data/app/views/ndl_books/index.html.erb +1 -1
  4. data/lib/enju_ndl/engine.rb +1 -1
  5. data/lib/enju_ndl/ndl_search.rb +3 -3
  6. data/lib/enju_ndl/version.rb +1 -1
  7. data/spec/cassette_library/ImportRequest/should_import_a_foreign_book.yml +121 -0
  8. data/spec/cassette_library/ImportRequest/should_import_isbn.yml +49 -492
  9. data/spec/cassette_library/Manifestation/should_import_a_bibliographic_record.yml +121 -0
  10. data/spec/cassette_library/Manifestation/should_import_dcterms_issued.yml +121 -0
  11. data/spec/cassette_library/Manifestation/should_import_isbn.yml +52 -495
  12. data/spec/cassette_library/Manifestation/should_import_series_statement.yml +48 -1121
  13. data/spec/cassette_library/Manifestation/should_import_with_ndl_bib_id.yml +20 -23
  14. data/spec/cassette_library/NdlBook/import/should_get_author_IDs_from_NDLA.yml +62 -0
  15. data/spec/cassette_library/NdlBook/import/should_get_series_title.yml +24 -111
  16. data/spec/cassette_library/NdlBook/import/should_get_subject_IDs_from_NDLA.yml +62 -0
  17. data/spec/cassette_library/NdlBook/import/should_get_volume_number.yml +28 -92
  18. data/spec/cassette_library/NdlBook/import/should_import_audio_cd.yml +26 -126
  19. data/spec/cassette_library/NdlBook/import/should_import_bibliographic_record.yml +28 -166
  20. data/spec/cassette_library/NdlBook/import/should_import_bibliographic_record_that_does_not_have_any_classifications.yml +25 -155
  21. data/spec/cassette_library/NdlBook/import/should_import_edition.yml +25 -154
  22. data/spec/cassette_library/NdlBook/import/should_import_even_with_invalid_url.yml +25 -137
  23. data/spec/cassette_library/NdlBook/import/should_import_map.yml +25 -140
  24. data/spec/cassette_library/NdlBook/import/should_import_ndc8_classification.yml +26 -214
  25. data/spec/cassette_library/NdlBook/import/should_import_notated_music.yml +27 -125
  26. data/spec/cassette_library/NdlBook/import/should_import_painting.yml +26 -114
  27. data/spec/cassette_library/NdlBook/import/should_import_photograph.yml +26 -116
  28. data/spec/cassette_library/NdlBook/import/should_import_picture_postcard.yml +26 -136
  29. data/spec/cassette_library/NdlBook/import/should_import_publication_place.yml +28 -192
  30. data/spec/cassette_library/NdlBook/import/should_import_pud_date_is_nil.yml +25 -107
  31. data/spec/cassette_library/NdlBook/import/should_import_series_statement.yml +27 -194
  32. data/spec/cassette_library/NdlBook/import/should_import_series_statement_if_the_resource_is_serial.yml +24 -216
  33. data/spec/cassette_library/NdlBook/import/should_import_series_statement_s_creator.yml +27 -241
  34. data/spec/cassette_library/NdlBook/import/should_import_series_statement_transctiption.yml +27 -207
  35. data/spec/cassette_library/NdlBook/import/should_import_still_image.yml +26 -133
  36. data/spec/cassette_library/NdlBook/import/should_import_tactile_text.yml +28 -121
  37. data/spec/cassette_library/NdlBook/import/should_import_title_alternative.yml +27 -200
  38. data/spec/cassette_library/NdlBook/import/should_import_url_contain_whitespace.yml +24 -177
  39. data/spec/cassette_library/NdlBook/import/should_import_video_dvd.yml +25 -111
  40. data/spec/cassette_library/NdlBook/import/should_import_volume_number_string.yml +24 -193
  41. data/spec/cassette_library/NdlBook/import/should_import_volume_title.yml +25 -145
  42. data/spec/cassette_library/NdlBook/import/should_import_with_DDC_Fic_.yml +21 -24
  43. data/spec/cassette_library/NdlBook/import/should_not_get_series_title_if_book_has_not_series_title.yml +26 -124
  44. data/spec/cassette_library/NdlBook/import/should_not_get_volume_number_if_book_has_not_volume.yml +24 -105
  45. data/spec/cassette_library/NdlBook/search/should_not_distinguish_double_byte_space_from_one-byte_space_in_a_query.yml +53 -785
  46. data/spec/cassette_library/NdlBook/search/should_search_bibliographic_record.yml +26 -386
  47. data/spec/cassette_library/NdlBooksController/GET_index/should_get_index.yml +24 -463
  48. data/spec/cassette_library/NdlBooksController/POST_create/should_create_a_bibliographic_record_if_jpno_is_set.yml +24 -213
  49. data/spec/cassette_library/NdlBooksController/POST_create/should_create_a_serial_record.yml +28 -143
  50. data/spec/cassette_library/NdlBooksController/POST_create/should_not_create_a_bibliographic_record_if_jpno_is_not_set.yml +27 -22
  51. data/spec/cassette_library/Question/should_respond_to_search_crd.yml +12 -220
  52. data/spec/cassette_library/ndl_books/index/ndl_search_menu/should_reflect_query_params_for_views.yml +24 -384
  53. data/spec/dummy/db/schema.rb +920 -1004
  54. data/spec/dummy/db/test.sqlite3 +0 -0
  55. data/spec/dummy/solr/configsets/sunspot/conf/_rest_managed.json +1 -0
  56. data/spec/dummy/solr/configsets/sunspot/conf/admin-extra.html +31 -0
  57. data/spec/dummy/solr/configsets/sunspot/conf/currency.xml +67 -0
  58. data/spec/dummy/solr/configsets/sunspot/conf/elevate.xml +36 -0
  59. data/spec/dummy/solr/configsets/sunspot/conf/lang/stopwords_en.txt +54 -0
  60. data/spec/dummy/solr/configsets/sunspot/conf/mapping-ISOLatin1Accent.txt +246 -0
  61. data/spec/dummy/solr/configsets/sunspot/conf/protwords.txt +21 -0
  62. data/spec/dummy/solr/configsets/sunspot/conf/schema.xml +278 -0
  63. data/spec/dummy/solr/configsets/sunspot/conf/scripts.conf +24 -0
  64. data/spec/dummy/solr/configsets/sunspot/conf/solrconfig.xml +631 -0
  65. data/spec/dummy/solr/configsets/sunspot/conf/spellings.txt +2 -0
  66. data/spec/dummy/solr/configsets/sunspot/conf/synonyms.txt +29 -0
  67. data/spec/dummy/solr/default/data/index/segments_1 +0 -0
  68. data/spec/dummy/solr/default/data/index/write.lock +0 -0
  69. data/spec/dummy/solr/development/data/index/segments_1 +0 -0
  70. data/spec/dummy/solr/development/data/index/write.lock +0 -0
  71. data/spec/dummy/solr/pids/test/sunspot-solr-test.pid +1 -0
  72. data/spec/dummy/solr/solr.xml +51 -0
  73. data/spec/dummy/solr/test/data/index/_1p8.fdt +0 -0
  74. data/spec/dummy/solr/test/data/index/_1p8.fdx +0 -0
  75. data/spec/dummy/solr/test/data/index/_1p8.fnm +0 -0
  76. data/spec/dummy/solr/test/data/index/_1p8.nvd +0 -0
  77. data/spec/dummy/solr/test/data/index/_1p8.nvm +0 -0
  78. data/spec/dummy/solr/test/data/index/_1p8.si +0 -0
  79. data/spec/dummy/solr/test/data/index/_1p8_2.liv +0 -0
  80. data/spec/dummy/solr/test/data/index/_1p8_Lucene50_0.doc +0 -0
  81. data/spec/dummy/solr/test/data/index/_1p8_Lucene50_0.pos +0 -0
  82. data/spec/dummy/solr/test/data/index/_1p8_Lucene50_0.tim +0 -0
  83. data/spec/dummy/solr/test/data/index/_1p8_Lucene50_0.tip +0 -0
  84. data/spec/dummy/solr/test/data/index/_1pe.fdt +0 -0
  85. data/spec/dummy/solr/test/data/index/_1pe.fdx +0 -0
  86. data/spec/dummy/solr/test/data/index/_1pe.fnm +0 -0
  87. data/spec/dummy/solr/test/data/index/_1pe.nvd +0 -0
  88. data/spec/dummy/solr/test/data/index/_1pe.nvm +0 -0
  89. data/spec/dummy/solr/test/data/index/_1pe.si +0 -0
  90. data/spec/dummy/solr/test/data/index/_1pe_Lucene50_0.doc +0 -0
  91. data/spec/dummy/solr/test/data/index/_1pe_Lucene50_0.pos +0 -0
  92. data/spec/dummy/solr/test/data/index/_1pe_Lucene50_0.tim +0 -0
  93. data/spec/dummy/solr/test/data/index/_1pe_Lucene50_0.tip +0 -0
  94. data/spec/dummy/solr/test/data/index/_1pf.fdt +0 -0
  95. data/spec/dummy/solr/test/data/index/_1pf.fdx +0 -0
  96. data/spec/dummy/solr/test/data/index/_1pf.fnm +0 -0
  97. data/spec/dummy/solr/test/data/index/_1pf.nvd +0 -0
  98. data/spec/dummy/solr/test/data/index/_1pf.nvm +0 -0
  99. data/spec/dummy/solr/test/data/index/_1pf.si +0 -0
  100. data/spec/dummy/solr/test/data/index/_1pf_Lucene50_0.doc +0 -0
  101. data/spec/dummy/solr/test/data/index/_1pf_Lucene50_0.pos +0 -0
  102. data/spec/dummy/solr/test/data/index/_1pf_Lucene50_0.tim +0 -0
  103. data/spec/dummy/solr/test/data/index/_1pf_Lucene50_0.tip +0 -0
  104. data/spec/dummy/solr/test/data/index/segments_1p0 +0 -0
  105. data/spec/dummy/solr/test/data/index/write.lock +0 -0
  106. data/spec/dummy/solr/test/data/tlog/tlog.0000000000000002916 +0 -0
  107. data/spec/dummy/solr/test/data/tlog/tlog.0000000000000002918 +0 -0
  108. data/spec/dummy/solr/test/data/tlog/tlog.0000000000000002919 +0 -0
  109. data/spec/dummy/solr/test/data/tlog/tlog.0000000000000002920 +0 -0
  110. data/spec/dummy/solr/test/data/tlog/tlog.0000000000000002921 +0 -0
  111. data/spec/dummy/solr/test/data/tlog/tlog.0000000000000002922 +0 -0
  112. data/spec/dummy/solr/test/data/tlog/tlog.0000000000000002924 +0 -0
  113. data/spec/dummy/solr/test/data/tlog/tlog.0000000000000002925 +0 -0
  114. data/spec/dummy/solr/test/data/tlog/tlog.0000000000000002926 +0 -0
  115. data/spec/dummy/solr/test/data/tlog/tlog.0000000000000002927 +0 -0
  116. data/spec/models/import_request_spec.rb +4 -0
  117. data/spec/models/manifestation_spec.rb +9 -1
  118. data/spec/models/ndl_book_spec.rb +20 -5
  119. data/spec/views/ndl_books/index.html.erb_spec.rb +1 -1
  120. metadata +472 -340
  121. data/spec/cassette_library/Manifestation/should_imporrt_a_bibliographic_record.yml +0 -1211
@@ -0,0 +1 @@
1
+ {"initArgs":{},"managedList":[]}
@@ -0,0 +1,31 @@
1
+ <!--
2
+ Licensed to the Apache Software Foundation (ASF) under one or more
3
+ contributor license agreements. See the NOTICE file distributed with
4
+ this work for additional information regarding copyright ownership.
5
+ The ASF licenses this file to You under the Apache License, Version 2.0
6
+ (the "License"); you may not use this file except in compliance with
7
+ the License. You may obtain a copy of the License at
8
+
9
+ http://www.apache.org/licenses/LICENSE-2.0
10
+
11
+ Unless required by applicable law or agreed to in writing, software
12
+ distributed under the License is distributed on an "AS IS" BASIS,
13
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
14
+ See the License for the specific language governing permissions and
15
+ limitations under the License.
16
+ -->
17
+
18
+ <!-- The content of this page will be statically included into the top
19
+ of the admin page. Uncomment this as an example to see where the content
20
+ will show up.
21
+
22
+ <hr>
23
+ <i>This line will appear before the first table</i>
24
+ <tr>
25
+ <td colspan="2">
26
+ This row will be appended to the end of the first table
27
+ </td>
28
+ </tr>
29
+ <hr>
30
+
31
+ -->
@@ -0,0 +1,67 @@
1
+ <?xml version="1.0" ?>
2
+ <!--
3
+ Licensed to the Apache Software Foundation (ASF) under one or more
4
+ contributor license agreements. See the NOTICE file distributed with
5
+ this work for additional information regarding copyright ownership.
6
+ The ASF licenses this file to You under the Apache License, Version 2.0
7
+ (the "License"); you may not use this file except in compliance with
8
+ the License. You may obtain a copy of the License at
9
+
10
+ http://www.apache.org/licenses/LICENSE-2.0
11
+
12
+ Unless required by applicable law or agreed to in writing, software
13
+ distributed under the License is distributed on an "AS IS" BASIS,
14
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
15
+ See the License for the specific language governing permissions and
16
+ limitations under the License.
17
+ -->
18
+
19
+ <!-- Example exchange rates file for CurrencyField type named "currency" in example schema -->
20
+
21
+ <currencyConfig version="1.0">
22
+ <rates>
23
+ <!-- Updated from http://www.exchangerate.com/ at 2011-09-27 -->
24
+ <rate from="USD" to="ARS" rate="4.333871" comment="ARGENTINA Peso" />
25
+ <rate from="USD" to="AUD" rate="1.025768" comment="AUSTRALIA Dollar" />
26
+ <rate from="USD" to="EUR" rate="0.743676" comment="European Euro" />
27
+ <rate from="USD" to="BRL" rate="1.881093" comment="BRAZIL Real" />
28
+ <rate from="USD" to="CAD" rate="1.030815" comment="CANADA Dollar" />
29
+ <rate from="USD" to="CLP" rate="519.0996" comment="CHILE Peso" />
30
+ <rate from="USD" to="CNY" rate="6.387310" comment="CHINA Yuan" />
31
+ <rate from="USD" to="CZK" rate="18.47134" comment="CZECH REP. Koruna" />
32
+ <rate from="USD" to="DKK" rate="5.515436" comment="DENMARK Krone" />
33
+ <rate from="USD" to="HKD" rate="7.801922" comment="HONG KONG Dollar" />
34
+ <rate from="USD" to="HUF" rate="215.6169" comment="HUNGARY Forint" />
35
+ <rate from="USD" to="ISK" rate="118.1280" comment="ICELAND Krona" />
36
+ <rate from="USD" to="INR" rate="49.49088" comment="INDIA Rupee" />
37
+ <rate from="USD" to="XDR" rate="0.641358" comment="INTNL MON. FUND SDR" />
38
+ <rate from="USD" to="ILS" rate="3.709739" comment="ISRAEL Sheqel" />
39
+ <rate from="USD" to="JPY" rate="76.32419" comment="JAPAN Yen" />
40
+ <rate from="USD" to="KRW" rate="1169.173" comment="KOREA (SOUTH) Won" />
41
+ <rate from="USD" to="KWD" rate="0.275142" comment="KUWAIT Dinar" />
42
+ <rate from="USD" to="MXN" rate="13.85895" comment="MEXICO Peso" />
43
+ <rate from="USD" to="NZD" rate="1.285159" comment="NEW ZEALAND Dollar" />
44
+ <rate from="USD" to="NOK" rate="5.859035" comment="NORWAY Krone" />
45
+ <rate from="USD" to="PKR" rate="87.57007" comment="PAKISTAN Rupee" />
46
+ <rate from="USD" to="PEN" rate="2.730683" comment="PERU Sol" />
47
+ <rate from="USD" to="PHP" rate="43.62039" comment="PHILIPPINES Peso" />
48
+ <rate from="USD" to="PLN" rate="3.310139" comment="POLAND Zloty" />
49
+ <rate from="USD" to="RON" rate="3.100932" comment="ROMANIA Leu" />
50
+ <rate from="USD" to="RUB" rate="32.14663" comment="RUSSIA Ruble" />
51
+ <rate from="USD" to="SAR" rate="3.750465" comment="SAUDI ARABIA Riyal" />
52
+ <rate from="USD" to="SGD" rate="1.299352" comment="SINGAPORE Dollar" />
53
+ <rate from="USD" to="ZAR" rate="8.329761" comment="SOUTH AFRICA Rand" />
54
+ <rate from="USD" to="SEK" rate="6.883442" comment="SWEDEN Krona" />
55
+ <rate from="USD" to="CHF" rate="0.906035" comment="SWITZERLAND Franc" />
56
+ <rate from="USD" to="TWD" rate="30.40283" comment="TAIWAN Dollar" />
57
+ <rate from="USD" to="THB" rate="30.89487" comment="THAILAND Baht" />
58
+ <rate from="USD" to="AED" rate="3.672955" comment="U.A.E. Dirham" />
59
+ <rate from="USD" to="UAH" rate="7.988582" comment="UKRAINE Hryvnia" />
60
+ <rate from="USD" to="GBP" rate="0.647910" comment="UNITED KINGDOM Pound" />
61
+
62
+ <!-- Cross-rates for some common currencies -->
63
+ <rate from="EUR" to="GBP" rate="0.869914" />
64
+ <rate from="EUR" to="NOK" rate="7.800095" />
65
+ <rate from="GBP" to="NOK" rate="8.966508" />
66
+ </rates>
67
+ </currencyConfig>
@@ -0,0 +1,36 @@
1
+ <?xml version="1.0" encoding="UTF-8" ?>
2
+ <!--
3
+ Licensed to the Apache Software Foundation (ASF) under one or more
4
+ contributor license agreements. See the NOTICE file distributed with
5
+ this work for additional information regarding copyright ownership.
6
+ The ASF licenses this file to You under the Apache License, Version 2.0
7
+ (the "License"); you may not use this file except in compliance with
8
+ the License. You may obtain a copy of the License at
9
+
10
+ http://www.apache.org/licenses/LICENSE-2.0
11
+
12
+ Unless required by applicable law or agreed to in writing, software
13
+ distributed under the License is distributed on an "AS IS" BASIS,
14
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
15
+ See the License for the specific language governing permissions and
16
+ limitations under the License.
17
+ -->
18
+
19
+ <!-- If this file is found in the config directory, it will only be
20
+ loaded once at startup. If it is found in Solr's data
21
+ directory, it will be re-loaded every commit.
22
+ -->
23
+
24
+ <elevate>
25
+ <query text="foo bar">
26
+ <doc id="1" />
27
+ <doc id="2" />
28
+ <doc id="3" />
29
+ </query>
30
+
31
+ <query text="ipod">
32
+ <doc id="MA147LL/A" /> <!-- put the actual ipod at the top -->
33
+ <doc id="IW-02" exclude="true" /> <!-- exclude this cable -->
34
+ </query>
35
+
36
+ </elevate>
@@ -0,0 +1,54 @@
1
+ # Licensed to the Apache Software Foundation (ASF) under one or more
2
+ # contributor license agreements. See the NOTICE file distributed with
3
+ # this work for additional information regarding copyright ownership.
4
+ # The ASF licenses this file to You under the Apache License, Version 2.0
5
+ # (the "License"); you may not use this file except in compliance with
6
+ # the License. You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
15
+
16
+ # a couple of test stopwords to test that the words are really being
17
+ # configured from this file:
18
+ stopworda
19
+ stopwordb
20
+
21
+ # Standard english stop words taken from Lucene's StopAnalyzer
22
+ a
23
+ an
24
+ and
25
+ are
26
+ as
27
+ at
28
+ be
29
+ but
30
+ by
31
+ for
32
+ if
33
+ in
34
+ into
35
+ is
36
+ it
37
+ no
38
+ not
39
+ of
40
+ on
41
+ or
42
+ such
43
+ that
44
+ the
45
+ their
46
+ then
47
+ there
48
+ these
49
+ they
50
+ this
51
+ to
52
+ was
53
+ will
54
+ with
@@ -0,0 +1,246 @@
1
+ # The ASF licenses this file to You under the Apache License, Version 2.0
2
+ # (the "License"); you may not use this file except in compliance with
3
+ # the License. You may obtain a copy of the License at
4
+ #
5
+ # http://www.apache.org/licenses/LICENSE-2.0
6
+ #
7
+ # Unless required by applicable law or agreed to in writing, software
8
+ # distributed under the License is distributed on an "AS IS" BASIS,
9
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
10
+ # See the License for the specific language governing permissions and
11
+ # limitations under the License.
12
+
13
+ # Syntax:
14
+ # "source" => "target"
15
+ # "source".length() > 0 (source cannot be empty.)
16
+ # "target".length() >= 0 (target can be empty.)
17
+
18
+ # example:
19
+ # "À" => "A"
20
+ # "\u00C0" => "A"
21
+ # "\u00C0" => "\u0041"
22
+ # "ß" => "ss"
23
+ # "\t" => " "
24
+ # "\n" => ""
25
+
26
+ # À => A
27
+ "\u00C0" => "A"
28
+
29
+ # Á => A
30
+ "\u00C1" => "A"
31
+
32
+ # Â => A
33
+ "\u00C2" => "A"
34
+
35
+ # Ã => A
36
+ "\u00C3" => "A"
37
+
38
+ # Ä => A
39
+ "\u00C4" => "A"
40
+
41
+ # Å => A
42
+ "\u00C5" => "A"
43
+
44
+ # Æ => AE
45
+ "\u00C6" => "AE"
46
+
47
+ # Ç => C
48
+ "\u00C7" => "C"
49
+
50
+ # È => E
51
+ "\u00C8" => "E"
52
+
53
+ # É => E
54
+ "\u00C9" => "E"
55
+
56
+ # Ê => E
57
+ "\u00CA" => "E"
58
+
59
+ # Ë => E
60
+ "\u00CB" => "E"
61
+
62
+ # Ì => I
63
+ "\u00CC" => "I"
64
+
65
+ # Í => I
66
+ "\u00CD" => "I"
67
+
68
+ # Î => I
69
+ "\u00CE" => "I"
70
+
71
+ # Ï => I
72
+ "\u00CF" => "I"
73
+
74
+ # Ĳ => IJ
75
+ "\u0132" => "IJ"
76
+
77
+ # Ð => D
78
+ "\u00D0" => "D"
79
+
80
+ # Ñ => N
81
+ "\u00D1" => "N"
82
+
83
+ # Ò => O
84
+ "\u00D2" => "O"
85
+
86
+ # Ó => O
87
+ "\u00D3" => "O"
88
+
89
+ # Ô => O
90
+ "\u00D4" => "O"
91
+
92
+ # Õ => O
93
+ "\u00D5" => "O"
94
+
95
+ # Ö => O
96
+ "\u00D6" => "O"
97
+
98
+ # Ø => O
99
+ "\u00D8" => "O"
100
+
101
+ # Œ => OE
102
+ "\u0152" => "OE"
103
+
104
+ # Þ => TH
105
+ "\u00DE" => "TH"
106
+
107
+ # Ù => U
108
+ "\u00D9" => "U"
109
+
110
+ # Ú => U
111
+ "\u00DA" => "U"
112
+
113
+ # Û => U
114
+ "\u00DB" => "U"
115
+
116
+ # Ü => U
117
+ "\u00DC" => "U"
118
+
119
+ # Ý => Y
120
+ "\u00DD" => "Y"
121
+
122
+ # Ÿ => Y
123
+ "\u0178" => "Y"
124
+
125
+ # à => a
126
+ "\u00E0" => "a"
127
+
128
+ # á => a
129
+ "\u00E1" => "a"
130
+
131
+ # â => a
132
+ "\u00E2" => "a"
133
+
134
+ # ã => a
135
+ "\u00E3" => "a"
136
+
137
+ # ä => a
138
+ "\u00E4" => "a"
139
+
140
+ # å => a
141
+ "\u00E5" => "a"
142
+
143
+ # æ => ae
144
+ "\u00E6" => "ae"
145
+
146
+ # ç => c
147
+ "\u00E7" => "c"
148
+
149
+ # è => e
150
+ "\u00E8" => "e"
151
+
152
+ # é => e
153
+ "\u00E9" => "e"
154
+
155
+ # ê => e
156
+ "\u00EA" => "e"
157
+
158
+ # ë => e
159
+ "\u00EB" => "e"
160
+
161
+ # ì => i
162
+ "\u00EC" => "i"
163
+
164
+ # í => i
165
+ "\u00ED" => "i"
166
+
167
+ # î => i
168
+ "\u00EE" => "i"
169
+
170
+ # ï => i
171
+ "\u00EF" => "i"
172
+
173
+ # ĳ => ij
174
+ "\u0133" => "ij"
175
+
176
+ # ð => d
177
+ "\u00F0" => "d"
178
+
179
+ # ñ => n
180
+ "\u00F1" => "n"
181
+
182
+ # ò => o
183
+ "\u00F2" => "o"
184
+
185
+ # ó => o
186
+ "\u00F3" => "o"
187
+
188
+ # ô => o
189
+ "\u00F4" => "o"
190
+
191
+ # õ => o
192
+ "\u00F5" => "o"
193
+
194
+ # ö => o
195
+ "\u00F6" => "o"
196
+
197
+ # ø => o
198
+ "\u00F8" => "o"
199
+
200
+ # œ => oe
201
+ "\u0153" => "oe"
202
+
203
+ # ß => ss
204
+ "\u00DF" => "ss"
205
+
206
+ # þ => th
207
+ "\u00FE" => "th"
208
+
209
+ # ù => u
210
+ "\u00F9" => "u"
211
+
212
+ # ú => u
213
+ "\u00FA" => "u"
214
+
215
+ # û => u
216
+ "\u00FB" => "u"
217
+
218
+ # ü => u
219
+ "\u00FC" => "u"
220
+
221
+ # ý => y
222
+ "\u00FD" => "y"
223
+
224
+ # ÿ => y
225
+ "\u00FF" => "y"
226
+
227
+ # ﬀ => ff
228
+ "\uFB00" => "ff"
229
+
230
+ # ﬁ => fi
231
+ "\uFB01" => "fi"
232
+
233
+ # ﬂ => fl
234
+ "\uFB02" => "fl"
235
+
236
+ # ﬃ => ffi
237
+ "\uFB03" => "ffi"
238
+
239
+ # ﬄ => ffl
240
+ "\uFB04" => "ffl"
241
+
242
+ # ﬅ => ft
243
+ "\uFB05" => "ft"
244
+
245
+ # ﬆ => st
246
+ "\uFB06" => "st"
@@ -0,0 +1,21 @@
1
+ # The ASF licenses this file to You under the Apache License, Version 2.0
2
+ # (the "License"); you may not use this file except in compliance with
3
+ # the License. You may obtain a copy of the License at
4
+ #
5
+ # http://www.apache.org/licenses/LICENSE-2.0
6
+ #
7
+ # Unless required by applicable law or agreed to in writing, software
8
+ # distributed under the License is distributed on an "AS IS" BASIS,
9
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
10
+ # See the License for the specific language governing permissions and
11
+ # limitations under the License.
12
+
13
+ #-----------------------------------------------------------------------
14
+ # Use a protected word file to protect against the stemmer reducing two
15
+ # unrelated words to the same base word.
16
+
17
+ # Some non-words that normally won't be encountered,
18
+ # just to test that they won't be stemmed.
19
+ dontstems
20
+ zwhacky
21
+