hydra-works 2.1.0 → 2.3.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/.circleci/config.yml +100 -111
- data/CONTRIBUTING.md +23 -1
- data/hydra-works.gemspec +2 -2
- data/lib/hydra/works/version.rb +1 -1
- data/solr/conf/_rest_managed.json +3 -0
- data/solr/conf/admin-extra.html +31 -0
- data/solr/conf/elevate.xml +36 -0
- data/solr/conf/mapping-ISOLatin1Accent.txt +246 -0
- data/solr/conf/protwords.txt +21 -0
- data/solr/conf/schema.xml +367 -0
- data/solr/conf/scripts.conf +24 -0
- data/solr/conf/solrconfig.xml +327 -0
- data/solr/conf/spellings.txt +2 -0
- data/solr/conf/stopwords.txt +58 -0
- data/solr/conf/stopwords_en.txt +58 -0
- data/solr/conf/synonyms.txt +31 -0
- data/solr/conf/xslt/example.xsl +132 -0
- data/solr/conf/xslt/example_atom.xsl +67 -0
- data/solr/conf/xslt/example_rss.xsl +66 -0
- data/solr/conf/xslt/luke.xsl +337 -0
- metadata +23 -7
checksums.yaml
CHANGED
|
@@ -1,7 +1,7 @@
|
|
|
1
1
|
---
|
|
2
2
|
SHA256:
|
|
3
|
-
metadata.gz:
|
|
4
|
-
data.tar.gz:
|
|
3
|
+
metadata.gz: 9deacc2e32feacbc584f092c9d135b0948bb64ed4f7cdd64dc8d4caa439c15f9
|
|
4
|
+
data.tar.gz: 0f65c6d092513d7ef0eff6973b3c89dc9e094d02876a45d0ddfc7e78551b819c
|
|
5
5
|
SHA512:
|
|
6
|
-
metadata.gz:
|
|
7
|
-
data.tar.gz:
|
|
6
|
+
metadata.gz: 2d4cbcec78178a7909174a536a791075d8e7aec6fd4e3f47d2a6fc5a257781e2f1dccba82c04fb9c260d04c69f06f701fa10b7b9dbf50d44c9b55d50654daf1e
|
|
7
|
+
data.tar.gz: 3bdc1a0dcfe3afed1b1b5e59028a9581ecb5689d68139487483772d55e574fdc5078fbc269ecf77f37a182f16c6f4903a0a97df7f33e77b68ced7b90b5fa0542
|
data/.circleci/config.yml
CHANGED
|
@@ -3,22 +3,49 @@ version: 2.1
|
|
|
3
3
|
orbs:
|
|
4
4
|
samvera: samvera/circleci-orb@1.0
|
|
5
5
|
jobs:
|
|
6
|
-
|
|
6
|
+
bundle_lint_test:
|
|
7
7
|
parameters:
|
|
8
8
|
ruby_version:
|
|
9
9
|
type: string
|
|
10
10
|
bundler_version:
|
|
11
11
|
type: string
|
|
12
|
-
default: 2.
|
|
12
|
+
default: 2.4.5
|
|
13
13
|
rails_version:
|
|
14
14
|
type: string
|
|
15
|
+
solr_config_path:
|
|
16
|
+
type: string
|
|
17
|
+
default: solr/conf
|
|
18
|
+
ruby_type:
|
|
19
|
+
type: string
|
|
20
|
+
default: 'ruby'
|
|
21
|
+
solr_port:
|
|
22
|
+
type: string
|
|
23
|
+
default: '8985'
|
|
24
|
+
fcrepo_version:
|
|
25
|
+
type: string
|
|
26
|
+
default: "4.7.5"
|
|
27
|
+
solr_version:
|
|
28
|
+
type: string
|
|
29
|
+
default: "9.5"
|
|
30
|
+
docker:
|
|
31
|
+
- image: cimg/<< parameters.ruby_type >>:<< parameters.ruby_version >>-browsers
|
|
32
|
+
- image: samvera/fcrepo4:<< parameters.fcrepo_version >>
|
|
33
|
+
environment:
|
|
34
|
+
CATALINA_OPTS: "-Djava.awt.headless=true -Dfile.encoding=UTF-8 -server -Xms512m -Xmx1024m -XX:NewSize=256m -XX:MaxNewSize=256m -XX:PermSize=256m -XX:MaxPermSize=256m -XX:+DisableExplicitGC"
|
|
35
|
+
- image: zookeeper:3.9
|
|
36
|
+
environment:
|
|
37
|
+
ZOO_ADMINSERVER_ENABLED: false
|
|
38
|
+
- image: solr:<< parameters.solr_version >>
|
|
39
|
+
environment:
|
|
40
|
+
VERBOSE: yes
|
|
41
|
+
SECURITY_JSON: '{"authentication":{"blockUnknown": false, "class":"solr.BasicAuthPlugin", "credentials":{"solr":"IV0EHq1OnNrj6gvRCwvFwTrZ1+z1oBbnQdiVC3otuq0= Ndd7LKvVBAaZIF0QAVi1ekCfAJXr1GGfLtRUXhgrF8c="}, "realm":"My Solr users", "forwardCredentials": false}, "authorization":{ "class":"solr.RuleBasedAuthorizationPlugin", "permissions":[{"name":"security-edit", "role":"admin"}], "user-role":{"solr":"admin"}}}'
|
|
42
|
+
command: sh -c "server/scripts/cloud-scripts/zkcli.sh -zkhost localhost:2181 -cmd put /security.json \"${SECURITY_JSON}\" && solr-fg -cloud -noprompt -p << parameters.solr_port >> -z localhost:2181"
|
|
15
43
|
environment:
|
|
16
44
|
RAILS_VERSION: << parameters.rails_version >>
|
|
17
45
|
NOKOGIRI_USE_SYSTEM_LIBRARIES: true
|
|
18
|
-
|
|
19
|
-
name: 'samvera/ruby_fcrepo_solr_redis_postgres'
|
|
20
|
-
ruby_version: << parameters.ruby_version >>
|
|
46
|
+
FCREPO_TEST_PORT: 8080
|
|
21
47
|
steps:
|
|
48
|
+
- run: 'wget -q -O - https://dl.google.com/linux/linux_signing_key.pub | sudo apt-key add -'
|
|
22
49
|
- run: 'sudo apt-get update'
|
|
23
50
|
- run: 'sudo apt-get install -y clamav libsqlite3-dev'
|
|
24
51
|
- run: 'sudo freshclam'
|
|
@@ -30,66 +57,50 @@ jobs:
|
|
|
30
57
|
bundler_version: << parameters.bundler_version >>
|
|
31
58
|
project: hydra-works
|
|
32
59
|
|
|
33
|
-
-
|
|
60
|
+
- run:
|
|
61
|
+
name: Install solr core
|
|
62
|
+
command: |
|
|
63
|
+
cd << parameters.solr_config_path >>
|
|
64
|
+
zip -1 -r solr_conf.zip ./*
|
|
65
|
+
curl -H "Content-type:application/octet-stream" --data-binary @solr_conf.zip "http://solr:SolrRocks@127.0.0.1:8985/solr/admin/configs?action=UPLOAD&name=solrconfig"
|
|
66
|
+
curl "http://solr:SolrRocks@127.0.0.1:8985/solr/admin/collections?action=CREATE&name=hydra-test&numShards=1&collection.configName=solrconfig"
|
|
34
67
|
|
|
35
68
|
- samvera/parallel_rspec
|
|
36
69
|
|
|
37
70
|
workflows:
|
|
38
|
-
version: 2
|
|
39
71
|
ci:
|
|
40
72
|
jobs:
|
|
41
|
-
#
|
|
42
|
-
-
|
|
43
|
-
name: ruby3-
|
|
44
|
-
ruby_version: 3.
|
|
45
|
-
rails_version:
|
|
46
|
-
-
|
|
47
|
-
name: ruby3-
|
|
48
|
-
ruby_version: 3.
|
|
49
|
-
rails_version:
|
|
50
|
-
-
|
|
51
|
-
name: ruby3-
|
|
52
|
-
ruby_version: 3.
|
|
53
|
-
rails_version: 7.0
|
|
54
|
-
#
|
|
55
|
-
-
|
|
56
|
-
name: ruby3-
|
|
57
|
-
ruby_version: 3.2.
|
|
58
|
-
rails_version:
|
|
59
|
-
-
|
|
60
|
-
name: ruby3-
|
|
61
|
-
ruby_version: 3.
|
|
62
|
-
rails_version:
|
|
63
|
-
-
|
|
64
|
-
name: ruby3-
|
|
65
|
-
ruby_version: 3.
|
|
66
|
-
rails_version:
|
|
67
|
-
|
|
68
|
-
|
|
69
|
-
|
|
70
|
-
|
|
71
|
-
|
|
72
|
-
- test:
|
|
73
|
-
name: ruby3-2_rails6-0
|
|
74
|
-
ruby_version: 3.2.0
|
|
75
|
-
rails_version: 6.0.6.1
|
|
76
|
-
- test:
|
|
77
|
-
name: ruby3-1_rails6-0
|
|
78
|
-
ruby_version: 3.1.3
|
|
79
|
-
rails_version: 6.0.6.1
|
|
80
|
-
- test:
|
|
81
|
-
name: ruby3-0_rails6-0
|
|
82
|
-
ruby_version: 3.0.5
|
|
83
|
-
rails_version: 6.0.6.1
|
|
84
|
-
- test:
|
|
85
|
-
name: ruby2-7_rails6-0
|
|
86
|
-
ruby_version: 2.7.7
|
|
87
|
-
rails_version: 6.0.6.1
|
|
88
|
-
# Rails 5.2
|
|
89
|
-
- test:
|
|
90
|
-
name: ruby2-7_rails5-2
|
|
91
|
-
ruby_version: 2.7.7
|
|
92
|
-
rails_version: 5.2.8.1
|
|
73
|
+
# Ruby 3.3 releases
|
|
74
|
+
- bundle_lint_test:
|
|
75
|
+
name: ruby3-3_rails8-1
|
|
76
|
+
ruby_version: 3.3.4
|
|
77
|
+
rails_version: 8.1.1
|
|
78
|
+
- bundle_lint_test:
|
|
79
|
+
name: ruby3-3_rails8-0
|
|
80
|
+
ruby_version: 3.3.4
|
|
81
|
+
rails_version: 8.0.4
|
|
82
|
+
- bundle_lint_test:
|
|
83
|
+
name: ruby3-3_rails7-2
|
|
84
|
+
ruby_version: 3.3.4
|
|
85
|
+
rails_version: 7.2.0
|
|
86
|
+
# Ruby 3.2 releases
|
|
87
|
+
- bundle_lint_test:
|
|
88
|
+
name: ruby3-2_rails8-1
|
|
89
|
+
ruby_version: 3.2.5
|
|
90
|
+
rails_version: 8.1.1
|
|
91
|
+
- bundle_lint_test:
|
|
92
|
+
name: ruby3-2_rails8-0
|
|
93
|
+
ruby_version: 3.2.5
|
|
94
|
+
rails_version: 8.0.4
|
|
95
|
+
- bundle_lint_test:
|
|
96
|
+
name: ruby3-2_rails7-2
|
|
97
|
+
ruby_version: 3.2.5
|
|
98
|
+
rails_version: 7.2.0
|
|
99
|
+
# Ruby 3.1 releases
|
|
100
|
+
- bundle_lint_test:
|
|
101
|
+
name: ruby3-1_rails7-2
|
|
102
|
+
ruby_version: 3.1.6
|
|
103
|
+
rails_version: 7.2.0
|
|
93
104
|
|
|
94
105
|
nightly:
|
|
95
106
|
triggers:
|
|
@@ -100,55 +111,33 @@ workflows:
|
|
|
100
111
|
only:
|
|
101
112
|
- main
|
|
102
113
|
jobs:
|
|
103
|
-
#
|
|
104
|
-
-
|
|
105
|
-
name: ruby3-
|
|
106
|
-
ruby_version: 3.
|
|
107
|
-
rails_version:
|
|
108
|
-
-
|
|
109
|
-
name: ruby3-
|
|
110
|
-
ruby_version: 3.
|
|
111
|
-
rails_version:
|
|
112
|
-
-
|
|
113
|
-
name: ruby3-
|
|
114
|
-
ruby_version: 3.
|
|
115
|
-
rails_version: 7.0
|
|
116
|
-
#
|
|
117
|
-
-
|
|
118
|
-
name: ruby3-
|
|
119
|
-
ruby_version: 3.2.
|
|
120
|
-
rails_version:
|
|
121
|
-
-
|
|
122
|
-
name: ruby3-
|
|
123
|
-
ruby_version: 3.
|
|
124
|
-
rails_version:
|
|
125
|
-
-
|
|
126
|
-
name: ruby3-
|
|
127
|
-
ruby_version: 3.
|
|
128
|
-
rails_version:
|
|
129
|
-
-
|
|
130
|
-
name:
|
|
131
|
-
ruby_version:
|
|
132
|
-
rails_version:
|
|
133
|
-
# Rails 6.0
|
|
134
|
-
- test:
|
|
135
|
-
name: ruby3-2_rails6-0
|
|
136
|
-
ruby_version: 3.2.0
|
|
137
|
-
rails_version: 6.0.6.1
|
|
138
|
-
- test:
|
|
139
|
-
name: ruby3-1_rails6-0
|
|
140
|
-
ruby_version: 3.1.3
|
|
141
|
-
rails_version: 6.0.6.1
|
|
142
|
-
- test:
|
|
143
|
-
name: ruby3-0_rails6-0
|
|
144
|
-
ruby_version: 3.0.5
|
|
145
|
-
rails_version: 6.0.6.1
|
|
146
|
-
- test:
|
|
147
|
-
name: ruby2-7_rails6-0
|
|
148
|
-
ruby_version: 2.7.7
|
|
149
|
-
rails_version: 6.0.6.1
|
|
150
|
-
# Rails 5.2
|
|
151
|
-
- test:
|
|
152
|
-
name: ruby2-7_rails5-2
|
|
153
|
-
ruby_version: 2.7.7
|
|
154
|
-
rails_version: 5.2.8.1
|
|
114
|
+
# Ruby 3.3 releases
|
|
115
|
+
- bundle_lint_test:
|
|
116
|
+
name: ruby3-3_rails8-1
|
|
117
|
+
ruby_version: 3.3.4
|
|
118
|
+
rails_version: 8.1.1
|
|
119
|
+
- bundle_lint_test:
|
|
120
|
+
name: ruby3-3_rails8-0
|
|
121
|
+
ruby_version: 3.3.4
|
|
122
|
+
rails_version: 8.0.4
|
|
123
|
+
- bundle_lint_test:
|
|
124
|
+
name: ruby3-3_rails7-2
|
|
125
|
+
ruby_version: 3.3.4
|
|
126
|
+
rails_version: 7.2.0
|
|
127
|
+
# Ruby 3.2 releases
|
|
128
|
+
- bundle_lint_test:
|
|
129
|
+
name: ruby3-2_rails8-1
|
|
130
|
+
ruby_version: 3.2.5
|
|
131
|
+
rails_version: 8.1.1
|
|
132
|
+
- bundle_lint_test:
|
|
133
|
+
name: ruby3-2_rails8-0
|
|
134
|
+
ruby_version: 3.2.5
|
|
135
|
+
rails_version: 8.0.4
|
|
136
|
+
- bundle_lint_test:
|
|
137
|
+
name: ruby3-2_rails7-2
|
|
138
|
+
ruby_version: 3.2.5
|
|
139
|
+
rails_version: 7.2.0
|
|
140
|
+
- bundle_lint_test:
|
|
141
|
+
name: ruby3-1_rails7-2
|
|
142
|
+
ruby_version: 3.1.6
|
|
143
|
+
rails_version: 7.2.0
|
data/CONTRIBUTING.md
CHANGED
|
@@ -22,6 +22,28 @@ https://wiki.duraspace.org/display/samvera/Samvera+Community+Intellectual+Proper
|
|
|
22
22
|
|
|
23
23
|
You should also add yourself to the `CONTRIBUTORS.md` file in the root of the project.
|
|
24
24
|
|
|
25
|
+
## Language
|
|
26
|
+
|
|
27
|
+
The language we use matters. Today, tomorrow, and for years to come
|
|
28
|
+
people will read the code we write. They will judge us for our
|
|
29
|
+
design, logic, and the words we use to describe the system.
|
|
30
|
+
|
|
31
|
+
Our words should be accessible. Favor descriptive words that give
|
|
32
|
+
meaning while avoiding reinforcing systemic inequities. For example,
|
|
33
|
+
in the Samvera community, we should favor using allowed\_list instead
|
|
34
|
+
of whitelist, denied\_list instead of blacklist, or source/copy
|
|
35
|
+
instead of master/slave.
|
|
36
|
+
|
|
37
|
+
We're going to get it wrong, but this is a call to keep working to
|
|
38
|
+
make it right. View our code and the words we choose as a chance to
|
|
39
|
+
have a conversation. A chance to grow an understanding of the systems
|
|
40
|
+
we develop as well as the systems in which we live.
|
|
41
|
+
|
|
42
|
+
See [“Blacklists” and “whitelists”: a salutary warning concerning the
|
|
43
|
+
prevalence of racist language in discussions of predatory
|
|
44
|
+
publishing](https://www.ncbi.nlm.nih.gov/pmc/articles/PMC6148600/) for
|
|
45
|
+
further details.
|
|
46
|
+
|
|
25
47
|
## Contribution Tasks
|
|
26
48
|
|
|
27
49
|
* Reporting Issues
|
|
@@ -34,7 +56,7 @@ You should also add yourself to the `CONTRIBUTORS.md` file in the root of the pr
|
|
|
34
56
|
### Reporting Issues
|
|
35
57
|
|
|
36
58
|
* Make sure you have a [GitHub account](https://github.com/signup/free)
|
|
37
|
-
* Submit a [Github issue](https://github.com/samvera/
|
|
59
|
+
* Submit a [GitHub issue](https://github.com/samvera/hydra-works/issues/) by:
|
|
38
60
|
* Clearly describing the issue
|
|
39
61
|
* Provide a descriptive summary
|
|
40
62
|
* Explain the expected behavior
|
data/hydra-works.gemspec
CHANGED
|
@@ -20,8 +20,8 @@ Gem::Specification.new do |spec|
|
|
|
20
20
|
spec.test_files = spec.files.grep(%r{^(test|spec|features)/})
|
|
21
21
|
spec.require_paths = ['lib']
|
|
22
22
|
|
|
23
|
-
spec.add_dependency 'activesupport', '>= 5.2', '<
|
|
24
|
-
spec.add_dependency 'hydra-derivatives', '
|
|
23
|
+
spec.add_dependency 'activesupport', '>= 5.2', '< 9.0'
|
|
24
|
+
spec.add_dependency 'hydra-derivatives', '>= 3.6'
|
|
25
25
|
spec.add_dependency 'hydra-file_characterization', '~> 1.0'
|
|
26
26
|
spec.add_dependency 'hydra-pcdm', '>= 0.9'
|
|
27
27
|
|
data/lib/hydra/works/version.rb
CHANGED
|
@@ -0,0 +1,31 @@
|
|
|
1
|
+
<!--
|
|
2
|
+
Licensed to the Apache Software Foundation (ASF) under one or more
|
|
3
|
+
contributor license agreements. See the NOTICE file distributed with
|
|
4
|
+
this work for additional information regarding copyright ownership.
|
|
5
|
+
The ASF licenses this file to You under the Apache License, Version 2.0
|
|
6
|
+
(the "License"); you may not use this file except in compliance with
|
|
7
|
+
the License. You may obtain a copy of the License at
|
|
8
|
+
|
|
9
|
+
http://www.apache.org/licenses/LICENSE-2.0
|
|
10
|
+
|
|
11
|
+
Unless required by applicable law or agreed to in writing, software
|
|
12
|
+
distributed under the License is distributed on an "AS IS" BASIS,
|
|
13
|
+
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
14
|
+
See the License for the specific language governing permissions and
|
|
15
|
+
limitations under the License.
|
|
16
|
+
-->
|
|
17
|
+
|
|
18
|
+
<!-- The content of this page will be statically included into the top
|
|
19
|
+
of the admin page. Uncomment this as an example to see there the content
|
|
20
|
+
will show up.
|
|
21
|
+
|
|
22
|
+
<hr>
|
|
23
|
+
<i>This line will appear before the first table</i>
|
|
24
|
+
<tr>
|
|
25
|
+
<td colspan="2">
|
|
26
|
+
This row will be appended to the end of the first table
|
|
27
|
+
</td>
|
|
28
|
+
</tr>
|
|
29
|
+
<hr>
|
|
30
|
+
|
|
31
|
+
-->
|
|
@@ -0,0 +1,36 @@
|
|
|
1
|
+
<?xml version="1.0" encoding="UTF-8" ?>
|
|
2
|
+
<!--
|
|
3
|
+
Licensed to the Apache Software Foundation (ASF) under one or more
|
|
4
|
+
contributor license agreements. See the NOTICE file distributed with
|
|
5
|
+
this work for additional information regarding copyright ownership.
|
|
6
|
+
The ASF licenses this file to You under the Apache License, Version 2.0
|
|
7
|
+
(the "License"); you may not use this file except in compliance with
|
|
8
|
+
the License. You may obtain a copy of the License at
|
|
9
|
+
|
|
10
|
+
http://www.apache.org/licenses/LICENSE-2.0
|
|
11
|
+
|
|
12
|
+
Unless required by applicable law or agreed to in writing, software
|
|
13
|
+
distributed under the License is distributed on an "AS IS" BASIS,
|
|
14
|
+
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
15
|
+
See the License for the specific language governing permissions and
|
|
16
|
+
limitations under the License.
|
|
17
|
+
-->
|
|
18
|
+
|
|
19
|
+
<!-- If this file is found in the config directory, it will only be
|
|
20
|
+
loaded once at startup. If it is found in Solr's data
|
|
21
|
+
directory, it will be re-loaded every commit.
|
|
22
|
+
-->
|
|
23
|
+
|
|
24
|
+
<elevate>
|
|
25
|
+
<query text="foo bar">
|
|
26
|
+
<doc id="1" />
|
|
27
|
+
<doc id="2" />
|
|
28
|
+
<doc id="3" />
|
|
29
|
+
</query>
|
|
30
|
+
|
|
31
|
+
<query text="ipod">
|
|
32
|
+
<doc id="MA147LL/A" /> <!-- put the actual ipod at the top -->
|
|
33
|
+
<doc id="IW-02" exclude="true" /> <!-- exclude this cable -->
|
|
34
|
+
</query>
|
|
35
|
+
|
|
36
|
+
</elevate>
|
|
@@ -0,0 +1,246 @@
|
|
|
1
|
+
# The ASF licenses this file to You under the Apache License, Version 2.0
|
|
2
|
+
# (the "License"); you may not use this file except in compliance with
|
|
3
|
+
# the License. You may obtain a copy of the License at
|
|
4
|
+
#
|
|
5
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
6
|
+
#
|
|
7
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
8
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
9
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
10
|
+
# See the License for the specific language governing permissions and
|
|
11
|
+
# limitations under the License.
|
|
12
|
+
|
|
13
|
+
# Syntax:
|
|
14
|
+
# "source" => "target"
|
|
15
|
+
# "source".length() > 0 (source cannot be empty.)
|
|
16
|
+
# "target".length() >= 0 (target can be empty.)
|
|
17
|
+
|
|
18
|
+
# example:
|
|
19
|
+
# "À" => "A"
|
|
20
|
+
# "\u00C0" => "A"
|
|
21
|
+
# "\u00C0" => "\u0041"
|
|
22
|
+
# "ß" => "ss"
|
|
23
|
+
# "\t" => " "
|
|
24
|
+
# "\n" => ""
|
|
25
|
+
|
|
26
|
+
# À => A
|
|
27
|
+
"\u00C0" => "A"
|
|
28
|
+
|
|
29
|
+
# Á => A
|
|
30
|
+
"\u00C1" => "A"
|
|
31
|
+
|
|
32
|
+
# Â => A
|
|
33
|
+
"\u00C2" => "A"
|
|
34
|
+
|
|
35
|
+
# Ã => A
|
|
36
|
+
"\u00C3" => "A"
|
|
37
|
+
|
|
38
|
+
# Ä => A
|
|
39
|
+
"\u00C4" => "A"
|
|
40
|
+
|
|
41
|
+
# Å => A
|
|
42
|
+
"\u00C5" => "A"
|
|
43
|
+
|
|
44
|
+
# Æ => AE
|
|
45
|
+
"\u00C6" => "AE"
|
|
46
|
+
|
|
47
|
+
# Ç => C
|
|
48
|
+
"\u00C7" => "C"
|
|
49
|
+
|
|
50
|
+
# È => E
|
|
51
|
+
"\u00C8" => "E"
|
|
52
|
+
|
|
53
|
+
# É => E
|
|
54
|
+
"\u00C9" => "E"
|
|
55
|
+
|
|
56
|
+
# Ê => E
|
|
57
|
+
"\u00CA" => "E"
|
|
58
|
+
|
|
59
|
+
# Ë => E
|
|
60
|
+
"\u00CB" => "E"
|
|
61
|
+
|
|
62
|
+
# Ì => I
|
|
63
|
+
"\u00CC" => "I"
|
|
64
|
+
|
|
65
|
+
# Í => I
|
|
66
|
+
"\u00CD" => "I"
|
|
67
|
+
|
|
68
|
+
# Î => I
|
|
69
|
+
"\u00CE" => "I"
|
|
70
|
+
|
|
71
|
+
# Ï => I
|
|
72
|
+
"\u00CF" => "I"
|
|
73
|
+
|
|
74
|
+
# Ĳ => IJ
|
|
75
|
+
"\u0132" => "IJ"
|
|
76
|
+
|
|
77
|
+
# Ð => D
|
|
78
|
+
"\u00D0" => "D"
|
|
79
|
+
|
|
80
|
+
# Ñ => N
|
|
81
|
+
"\u00D1" => "N"
|
|
82
|
+
|
|
83
|
+
# Ò => O
|
|
84
|
+
"\u00D2" => "O"
|
|
85
|
+
|
|
86
|
+
# Ó => O
|
|
87
|
+
"\u00D3" => "O"
|
|
88
|
+
|
|
89
|
+
# Ô => O
|
|
90
|
+
"\u00D4" => "O"
|
|
91
|
+
|
|
92
|
+
# Õ => O
|
|
93
|
+
"\u00D5" => "O"
|
|
94
|
+
|
|
95
|
+
# Ö => O
|
|
96
|
+
"\u00D6" => "O"
|
|
97
|
+
|
|
98
|
+
# Ø => O
|
|
99
|
+
"\u00D8" => "O"
|
|
100
|
+
|
|
101
|
+
# Œ => OE
|
|
102
|
+
"\u0152" => "OE"
|
|
103
|
+
|
|
104
|
+
# Þ => TH
|
|
105
|
+
"\u00DE" => "TH"
|
|
106
|
+
|
|
107
|
+
# Ù => U
|
|
108
|
+
"\u00D9" => "U"
|
|
109
|
+
|
|
110
|
+
# Ú => U
|
|
111
|
+
"\u00DA" => "U"
|
|
112
|
+
|
|
113
|
+
# Û => U
|
|
114
|
+
"\u00DB" => "U"
|
|
115
|
+
|
|
116
|
+
# Ü => U
|
|
117
|
+
"\u00DC" => "U"
|
|
118
|
+
|
|
119
|
+
# Ý => Y
|
|
120
|
+
"\u00DD" => "Y"
|
|
121
|
+
|
|
122
|
+
# Ÿ => Y
|
|
123
|
+
"\u0178" => "Y"
|
|
124
|
+
|
|
125
|
+
# à => a
|
|
126
|
+
"\u00E0" => "a"
|
|
127
|
+
|
|
128
|
+
# á => a
|
|
129
|
+
"\u00E1" => "a"
|
|
130
|
+
|
|
131
|
+
# â => a
|
|
132
|
+
"\u00E2" => "a"
|
|
133
|
+
|
|
134
|
+
# ã => a
|
|
135
|
+
"\u00E3" => "a"
|
|
136
|
+
|
|
137
|
+
# ä => a
|
|
138
|
+
"\u00E4" => "a"
|
|
139
|
+
|
|
140
|
+
# å => a
|
|
141
|
+
"\u00E5" => "a"
|
|
142
|
+
|
|
143
|
+
# æ => ae
|
|
144
|
+
"\u00E6" => "ae"
|
|
145
|
+
|
|
146
|
+
# ç => c
|
|
147
|
+
"\u00E7" => "c"
|
|
148
|
+
|
|
149
|
+
# è => e
|
|
150
|
+
"\u00E8" => "e"
|
|
151
|
+
|
|
152
|
+
# é => e
|
|
153
|
+
"\u00E9" => "e"
|
|
154
|
+
|
|
155
|
+
# ê => e
|
|
156
|
+
"\u00EA" => "e"
|
|
157
|
+
|
|
158
|
+
# ë => e
|
|
159
|
+
"\u00EB" => "e"
|
|
160
|
+
|
|
161
|
+
# ì => i
|
|
162
|
+
"\u00EC" => "i"
|
|
163
|
+
|
|
164
|
+
# í => i
|
|
165
|
+
"\u00ED" => "i"
|
|
166
|
+
|
|
167
|
+
# î => i
|
|
168
|
+
"\u00EE" => "i"
|
|
169
|
+
|
|
170
|
+
# ï => i
|
|
171
|
+
"\u00EF" => "i"
|
|
172
|
+
|
|
173
|
+
# ĳ => ij
|
|
174
|
+
"\u0133" => "ij"
|
|
175
|
+
|
|
176
|
+
# ð => d
|
|
177
|
+
"\u00F0" => "d"
|
|
178
|
+
|
|
179
|
+
# ñ => n
|
|
180
|
+
"\u00F1" => "n"
|
|
181
|
+
|
|
182
|
+
# ò => o
|
|
183
|
+
"\u00F2" => "o"
|
|
184
|
+
|
|
185
|
+
# ó => o
|
|
186
|
+
"\u00F3" => "o"
|
|
187
|
+
|
|
188
|
+
# ô => o
|
|
189
|
+
"\u00F4" => "o"
|
|
190
|
+
|
|
191
|
+
# õ => o
|
|
192
|
+
"\u00F5" => "o"
|
|
193
|
+
|
|
194
|
+
# ö => o
|
|
195
|
+
"\u00F6" => "o"
|
|
196
|
+
|
|
197
|
+
# ø => o
|
|
198
|
+
"\u00F8" => "o"
|
|
199
|
+
|
|
200
|
+
# œ => oe
|
|
201
|
+
"\u0153" => "oe"
|
|
202
|
+
|
|
203
|
+
# ß => ss
|
|
204
|
+
"\u00DF" => "ss"
|
|
205
|
+
|
|
206
|
+
# þ => th
|
|
207
|
+
"\u00FE" => "th"
|
|
208
|
+
|
|
209
|
+
# ù => u
|
|
210
|
+
"\u00F9" => "u"
|
|
211
|
+
|
|
212
|
+
# ú => u
|
|
213
|
+
"\u00FA" => "u"
|
|
214
|
+
|
|
215
|
+
# û => u
|
|
216
|
+
"\u00FB" => "u"
|
|
217
|
+
|
|
218
|
+
# ü => u
|
|
219
|
+
"\u00FC" => "u"
|
|
220
|
+
|
|
221
|
+
# ý => y
|
|
222
|
+
"\u00FD" => "y"
|
|
223
|
+
|
|
224
|
+
# ÿ => y
|
|
225
|
+
"\u00FF" => "y"
|
|
226
|
+
|
|
227
|
+
# ﬀ => ff
|
|
228
|
+
"\uFB00" => "ff"
|
|
229
|
+
|
|
230
|
+
# ﬁ => fi
|
|
231
|
+
"\uFB01" => "fi"
|
|
232
|
+
|
|
233
|
+
# ﬂ => fl
|
|
234
|
+
"\uFB02" => "fl"
|
|
235
|
+
|
|
236
|
+
# ﬃ => ffi
|
|
237
|
+
"\uFB03" => "ffi"
|
|
238
|
+
|
|
239
|
+
# ﬄ => ffl
|
|
240
|
+
"\uFB04" => "ffl"
|
|
241
|
+
|
|
242
|
+
# ﬅ => ft
|
|
243
|
+
"\uFB05" => "ft"
|
|
244
|
+
|
|
245
|
+
# ﬆ => st
|
|
246
|
+
"\uFB06" => "st"
|
|
@@ -0,0 +1,21 @@
|
|
|
1
|
+
# The ASF licenses this file to You under the Apache License, Version 2.0
|
|
2
|
+
# (the "License"); you may not use this file except in compliance with
|
|
3
|
+
# the License. You may obtain a copy of the License at
|
|
4
|
+
#
|
|
5
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
6
|
+
#
|
|
7
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
8
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
9
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
10
|
+
# See the License for the specific language governing permissions and
|
|
11
|
+
# limitations under the License.
|
|
12
|
+
|
|
13
|
+
#-----------------------------------------------------------------------
|
|
14
|
+
# Use a protected word file to protect against the stemmer reducing two
|
|
15
|
+
# unrelated words to the same base word.
|
|
16
|
+
|
|
17
|
+
# Some non-words that normally won't be encountered,
|
|
18
|
+
# just to test that they won't be stemmed.
|
|
19
|
+
dontstems
|
|
20
|
+
zwhacky
|
|
21
|
+
|