blacklight-citeproc 0.0.4 → 0.2.0

Sign up to get free protection for your applications and to get access to all the features.
Files changed (98) hide show
  1. checksums.yaml +4 -4
  2. data/.env +3 -0
  3. data/.github/workflows/test.yml +25 -0
  4. data/.internal_test_app/solr/conf/_rest_managed.json +3 -0
  5. data/.internal_test_app/solr/conf/admin-extra.html +31 -0
  6. data/.internal_test_app/solr/conf/currency.xml +67 -0
  7. data/.internal_test_app/solr/conf/email_url_types.txt +2 -0
  8. data/.internal_test_app/solr/conf/lang/contractions_ca.txt +8 -0
  9. data/.internal_test_app/solr/conf/lang/contractions_fr.txt +15 -0
  10. data/.internal_test_app/solr/conf/lang/contractions_ga.txt +5 -0
  11. data/.internal_test_app/solr/conf/lang/contractions_it.txt +23 -0
  12. data/.internal_test_app/solr/conf/lang/hyphenations_ga.txt +5 -0
  13. data/.internal_test_app/solr/conf/lang/stemdict_nl.txt +6 -0
  14. data/.internal_test_app/solr/conf/lang/stoptags_ja.txt +420 -0
  15. data/.internal_test_app/solr/conf/lang/stopwords_ar.txt +125 -0
  16. data/.internal_test_app/solr/conf/lang/stopwords_bg.txt +193 -0
  17. data/.internal_test_app/solr/conf/lang/stopwords_ca.txt +220 -0
  18. data/.internal_test_app/solr/conf/lang/stopwords_cz.txt +172 -0
  19. data/.internal_test_app/solr/conf/lang/stopwords_da.txt +110 -0
  20. data/.internal_test_app/solr/conf/lang/stopwords_de.txt +294 -0
  21. data/.internal_test_app/solr/conf/lang/stopwords_el.txt +78 -0
  22. data/.internal_test_app/solr/conf/lang/stopwords_en.txt +54 -0
  23. data/.internal_test_app/solr/conf/lang/stopwords_es.txt +356 -0
  24. data/.internal_test_app/solr/conf/lang/stopwords_eu.txt +99 -0
  25. data/.internal_test_app/solr/conf/lang/stopwords_fa.txt +313 -0
  26. data/.internal_test_app/solr/conf/lang/stopwords_fi.txt +97 -0
  27. data/.internal_test_app/solr/conf/lang/stopwords_fr.txt +186 -0
  28. data/.internal_test_app/solr/conf/lang/stopwords_ga.txt +110 -0
  29. data/.internal_test_app/solr/conf/lang/stopwords_gl.txt +161 -0
  30. data/.internal_test_app/solr/conf/lang/stopwords_hi.txt +235 -0
  31. data/.internal_test_app/solr/conf/lang/stopwords_hu.txt +211 -0
  32. data/.internal_test_app/solr/conf/lang/stopwords_hy.txt +46 -0
  33. data/.internal_test_app/solr/conf/lang/stopwords_id.txt +359 -0
  34. data/.internal_test_app/solr/conf/lang/stopwords_it.txt +303 -0
  35. data/.internal_test_app/solr/conf/lang/stopwords_ja.txt +127 -0
  36. data/.internal_test_app/solr/conf/lang/stopwords_lv.txt +172 -0
  37. data/.internal_test_app/solr/conf/lang/stopwords_nl.txt +119 -0
  38. data/.internal_test_app/solr/conf/lang/stopwords_no.txt +194 -0
  39. data/.internal_test_app/solr/conf/lang/stopwords_pt.txt +253 -0
  40. data/.internal_test_app/solr/conf/lang/stopwords_ro.txt +233 -0
  41. data/.internal_test_app/solr/conf/lang/stopwords_ru.txt +243 -0
  42. data/.internal_test_app/solr/conf/lang/stopwords_sv.txt +133 -0
  43. data/.internal_test_app/solr/conf/lang/stopwords_th.txt +119 -0
  44. data/.internal_test_app/solr/conf/lang/stopwords_tr.txt +212 -0
  45. data/.internal_test_app/solr/conf/lang/userdict_ja.txt +29 -0
  46. data/.internal_test_app/solr/conf/mapping-ISOLatin1Accent.txt +246 -0
  47. data/.internal_test_app/solr/conf/protwords.txt +21 -0
  48. data/.internal_test_app/solr/conf/schema.xml +408 -0
  49. data/.internal_test_app/solr/conf/scripts.conf +24 -0
  50. data/.internal_test_app/solr/conf/solrconfig.xml +1287 -0
  51. data/.internal_test_app/solr/conf/spellings.txt +2 -0
  52. data/.internal_test_app/solr/conf/stopwords.txt +14 -0
  53. data/.internal_test_app/solr/conf/stopwords_en.txt +58 -0
  54. data/.internal_test_app/solr/conf/synonyms.txt +13 -0
  55. data/.internal_test_app/solr/conf/update-script.js +115 -0
  56. data/.internal_test_app/solr/conf/velocity/browse.vm +32 -0
  57. data/.internal_test_app/solr/conf/velocity/dropit.js +0 -0
  58. data/.internal_test_app/solr/conf/velocity/facet_doc_type.vm +2 -0
  59. data/.internal_test_app/solr/conf/velocity/facet_text_shingles.vm +12 -0
  60. data/.internal_test_app/solr/conf/velocity/facets.vm +24 -0
  61. data/.internal_test_app/solr/conf/velocity/footer.vm +29 -0
  62. data/.internal_test_app/solr/conf/velocity/head.vm +290 -0
  63. data/.internal_test_app/solr/conf/velocity/hit.vm +77 -0
  64. data/.internal_test_app/solr/conf/velocity/img/english_640.png +0 -0
  65. data/.internal_test_app/solr/conf/velocity/img/france_640.png +0 -0
  66. data/.internal_test_app/solr/conf/velocity/img/germany_640.png +0 -0
  67. data/.internal_test_app/solr/conf/velocity/img/globe_256.png +0 -0
  68. data/.internal_test_app/solr/conf/velocity/jquery.tx3-tag-cloud.js +0 -0
  69. data/.internal_test_app/solr/conf/velocity/js/dropit.js +97 -0
  70. data/.internal_test_app/solr/conf/velocity/js/jquery.autocomplete.js +763 -0
  71. data/.internal_test_app/solr/conf/velocity/js/jquery.tx3-tag-cloud.js +70 -0
  72. data/.internal_test_app/solr/conf/velocity/layout.vm +42 -0
  73. data/.internal_test_app/solr/conf/velocity/macros.vm +16 -0
  74. data/.internal_test_app/solr/conf/velocity/mime_type_lists.vm +68 -0
  75. data/.internal_test_app/solr/conf/velocity/results.vm +20 -0
  76. data/.internal_test_app/solr/conf/velocity/results_list.vm +21 -0
  77. data/.internal_test_app/solr/conf/xslt/example.xsl +132 -0
  78. data/.internal_test_app/solr/conf/xslt/example_atom.xsl +67 -0
  79. data/.internal_test_app/solr/conf/xslt/example_rss.xsl +66 -0
  80. data/.internal_test_app/solr/conf/xslt/luke.xsl +337 -0
  81. data/.rubocop.yml +4 -0
  82. data/.rubocop_todo.yml +40 -0
  83. data/Dockerfile +43 -0
  84. data/Gemfile +5 -0
  85. data/LICENSE.md +21 -0
  86. data/README.md +3 -0
  87. data/Rakefile +8 -0
  88. data/app/controllers/blacklight/citeproc/citation_controller.rb +45 -40
  89. data/app/models/concerns/blacklight/document/bibtex.rb +37 -35
  90. data/bin/entrypoint.sh +8 -0
  91. data/blacklight-citeproc.gemspec +19 -19
  92. data/config/routes.rb +2 -0
  93. data/docker-compose.yml +33 -0
  94. data/lib/blacklight/citeproc/engine.rb +2 -0
  95. data/lib/blacklight/citeproc/version.rb +3 -1
  96. data/lib/blacklight/citeproc.rb +2 -0
  97. data/lib/generators/blacklight/citeproc/install_generator.rb +20 -15
  98. metadata +119 -40
@@ -0,0 +1,133 @@
1
+ | From svn.tartarus.org/snowball/trunk/website/algorithms/swedish/stop.txt
2
+ | This file is distributed under the BSD License.
3
+ | See http://snowball.tartarus.org/license.php
4
+ | Also see http://www.opensource.org/licenses/bsd-license.html
5
+ | - Encoding was converted to UTF-8.
6
+ | - This notice was added.
7
+ |
8
+ | NOTE: To use this file with StopFilterFactory, you must specify format="snowball"
9
+
10
+ | A Swedish stop word list. Comments begin with vertical bar. Each stop
11
+ | word is at the start of a line.
12
+
13
+ | This is a ranked list (commonest to rarest) of stopwords derived from
14
+ | a large text sample.
15
+
16
+ | Swedish stop words occasionally exhibit homonym clashes. For example
17
+ | så = so, but also seed. These are indicated clearly below.
18
+
19
+ och | and
20
+ det | it, this/that
21
+ att | to (with infinitive)
22
+ i | in, at
23
+ en | a
24
+ jag | I
25
+ hon | she
26
+ som | who, that
27
+ han | he
28
+ på | on
29
+ den | it, this/that
30
+ med | with
31
+ var | where, each
32
+ sig | him(self) etc
33
+ för | for
34
+ så | so (also: seed)
35
+ till | to
36
+ är | is
37
+ men | but
38
+ ett | a
39
+ om | if; around, about
40
+ hade | had
41
+ de | they, these/those
42
+ av | of
43
+ icke | not, no
44
+ mig | me
45
+ du | you
46
+ henne | her
47
+ då | then, when
48
+ sin | his
49
+ nu | now
50
+ har | have
51
+ inte | inte någon = no one
52
+ hans | his
53
+ honom | him
54
+ skulle | 'sake'
55
+ hennes | her
56
+ där | there
57
+ min | my
58
+ man | one (pronoun)
59
+ ej | nor
60
+ vid | at, by, on (also: vast)
61
+ kunde | could
62
+ något | some etc
63
+ från | from, off
64
+ ut | out
65
+ när | when
66
+ efter | after, behind
67
+ upp | up
68
+ vi | we
69
+ dem | them
70
+ vara | be
71
+ vad | what
72
+ över | over
73
+ än | than
74
+ dig | you
75
+ kan | can
76
+ sina | his
77
+ här | here
78
+ ha | have
79
+ mot | towards
80
+ alla | all
81
+ under | under (also: wonder)
82
+ någon | some etc
83
+ eller | or (else)
84
+ allt | all
85
+ mycket | much
86
+ sedan | since
87
+ ju | why
88
+ denna | this/that
89
+ själv | myself, yourself etc
90
+ detta | this/that
91
+ åt | to
92
+ utan | without
93
+ varit | was
94
+ hur | how
95
+ ingen | no
96
+ mitt | my
97
+ ni | you
98
+ bli | to be, become
99
+ blev | from bli
100
+ oss | us
101
+ din | thy
102
+ dessa | these/those
103
+ några | some etc
104
+ deras | their
105
+ blir | from bli
106
+ mina | my
107
+ samma | (the) same
108
+ vilken | who, that
109
+ er | you, your
110
+ sådan | such a
111
+ vår | our
112
+ blivit | from bli
113
+ dess | its
114
+ inom | within
115
+ mellan | between
116
+ sådant | such a
117
+ varför | why
118
+ varje | each
119
+ vilka | who, that
120
+ ditt | thy
121
+ vem | who
122
+ vilket | who, that
123
+ sitta | his
124
+ sådana | such a
125
+ vart | each
126
+ dina | thy
127
+ vars | whose
128
+ vårt | our
129
+ våra | our
130
+ ert | your
131
+ era | your
132
+ vilkas | whose
133
+
@@ -0,0 +1,119 @@
1
+ # Thai stopwords from:
2
+ # "Opinion Detection in Thai Political News Columns
3
+ # Based on Subjectivity Analysis"
4
+ # Khampol Sukhum, Supot Nitsuwat, and Choochart Haruechaiyasak
5
+ ไว้
6
+ ไม่
7
+ ไป
8
+ ได้
9
+ ให้
10
+ ใน
11
+ โดย
12
+ แห่ง
13
+ แล้ว
14
+ และ
15
+ แรก
16
+ แบบ
17
+ แต่
18
+ เอง
19
+ เห็น
20
+ เลย
21
+ เริ่ม
22
+ เรา
23
+ เมื่อ
24
+ เพื่อ
25
+ เพราะ
26
+ เป็นการ
27
+ เป็น
28
+ เปิดเผย
29
+ เปิด
30
+ เนื่องจาก
31
+ เดียวกัน
32
+ เดียว
33
+ เช่น
34
+ เฉพาะ
35
+ เคย
36
+ เข้า
37
+ เขา
38
+ อีก
39
+ อาจ
40
+ อะไร
41
+ ออก
42
+ อย่าง
43
+ อยู่
44
+ อยาก
45
+ หาก
46
+ หลาย
47
+ หลังจาก
48
+ หลัง
49
+ หรือ
50
+ หนึ่ง
51
+ ส่วน
52
+ ส่ง
53
+ สุด
54
+ สําหรับ
55
+ ว่า
56
+ วัน
57
+ ลง
58
+ ร่วม
59
+ ราย
60
+ รับ
61
+ ระหว่าง
62
+ รวม
63
+ ยัง
64
+ มี
65
+ มาก
66
+ มา
67
+ พร้อม
68
+ พบ
69
+ ผ่าน
70
+ ผล
71
+ บาง
72
+ น่า
73
+ นี้
74
+ นํา
75
+ นั้น
76
+ นัก
77
+ นอกจาก
78
+ ทุก
79
+ ที่สุด
80
+ ที่
81
+ ทําให้
82
+ ทํา
83
+ ทาง
84
+ ทั้งนี้
85
+ ทั้ง
86
+ ถ้า
87
+ ถูก
88
+ ถึง
89
+ ต้อง
90
+ ต่างๆ
91
+ ต่าง
92
+ ต่อ
93
+ ตาม
94
+ ตั้งแต่
95
+ ตั้ง
96
+ ด้าน
97
+ ด้วย
98
+ ดัง
99
+ ซึ่ง
100
+ ช่วง
101
+ จึง
102
+ จาก
103
+ จัด
104
+ จะ
105
+ คือ
106
+ ความ
107
+ ครั้ง
108
+ คง
109
+ ขึ้น
110
+ ของ
111
+ ขอ
112
+ ขณะ
113
+ ก่อน
114
+ ก็
115
+ การ
116
+ กับ
117
+ กัน
118
+ กว่า
119
+ กล่าว
@@ -0,0 +1,212 @@
1
+ # Turkish stopwords from LUCENE-559
2
+ # merged with the list from "Information Retrieval on Turkish Texts"
3
+ # (http://www.users.muohio.edu/canf/papers/JASIST2008offPrint.pdf)
4
+ acaba
5
+ altmış
6
+ altı
7
+ ama
8
+ ancak
9
+ arada
10
+ aslında
11
+ ayrıca
12
+ bana
13
+ bazı
14
+ belki
15
+ ben
16
+ benden
17
+ beni
18
+ benim
19
+ beri
20
+ beş
21
+ bile
22
+ bin
23
+ bir
24
+ birçok
25
+ biri
26
+ birkaç
27
+ birkez
28
+ birşey
29
+ birşeyi
30
+ biz
31
+ bize
32
+ bizden
33
+ bizi
34
+ bizim
35
+ böyle
36
+ böylece
37
+ bu
38
+ buna
39
+ bunda
40
+ bundan
41
+ bunlar
42
+ bunları
43
+ bunların
44
+ bunu
45
+ bunun
46
+ burada
47
+ çok
48
+ çünkü
49
+ da
50
+ daha
51
+ dahi
52
+ de
53
+ defa
54
+ değil
55
+ diğer
56
+ diye
57
+ doksan
58
+ dokuz
59
+ dolayı
60
+ dolayısıyla
61
+ dört
62
+ edecek
63
+ eden
64
+ ederek
65
+ edilecek
66
+ ediliyor
67
+ edilmesi
68
+ ediyor
69
+ eğer
70
+ elli
71
+ en
72
+ etmesi
73
+ etti
74
+ ettiği
75
+ ettiğini
76
+ gibi
77
+ göre
78
+ halen
79
+ hangi
80
+ hatta
81
+ hem
82
+ henüz
83
+ hep
84
+ hepsi
85
+ her
86
+ herhangi
87
+ herkesin
88
+ hiç
89
+ hiçbir
90
+ için
91
+ iki
92
+ ile
93
+ ilgili
94
+ ise
95
+ işte
96
+ itibaren
97
+ itibariyle
98
+ kadar
99
+ karşın
100
+ katrilyon
101
+ kendi
102
+ kendilerine
103
+ kendini
104
+ kendisi
105
+ kendisine
106
+ kendisini
107
+ kez
108
+ ki
109
+ kim
110
+ kimden
111
+ kime
112
+ kimi
113
+ kimse
114
+ kırk
115
+ milyar
116
+ milyon
117
+ mu
118
+
119
+
120
+ nasıl
121
+ ne
122
+ neden
123
+ nedenle
124
+ nerde
125
+ nerede
126
+ nereye
127
+ niye
128
+ niçin
129
+ o
130
+ olan
131
+ olarak
132
+ oldu
133
+ olduğu
134
+ olduğunu
135
+ olduklarını
136
+ olmadı
137
+ olmadığı
138
+ olmak
139
+ olması
140
+ olmayan
141
+ olmaz
142
+ olsa
143
+ olsun
144
+ olup
145
+ olur
146
+ olursa
147
+ oluyor
148
+ on
149
+ ona
150
+ ondan
151
+ onlar
152
+ onlardan
153
+ onları
154
+ onların
155
+ onu
156
+ onun
157
+ otuz
158
+ oysa
159
+ öyle
160
+ pek
161
+ rağmen
162
+ sadece
163
+ sanki
164
+ sekiz
165
+ seksen
166
+ sen
167
+ senden
168
+ seni
169
+ senin
170
+ siz
171
+ sizden
172
+ sizi
173
+ sizin
174
+ şey
175
+ şeyden
176
+ şeyi
177
+ şeyler
178
+ şöyle
179
+ şu
180
+ şuna
181
+ şunda
182
+ şundan
183
+ şunları
184
+ şunu
185
+ tarafından
186
+ trilyon
187
+ tüm
188
+ üç
189
+ üzere
190
+ var
191
+ vardı
192
+ ve
193
+ veya
194
+ ya
195
+ yani
196
+ yapacak
197
+ yapılan
198
+ yapılması
199
+ yapıyor
200
+ yapmak
201
+ yaptı
202
+ yaptığı
203
+ yaptığını
204
+ yaptıkları
205
+ yedi
206
+ yerine
207
+ yetmiş
208
+ yine
209
+ yirmi
210
+ yoksa
211
+ yüz
212
+ zaten
@@ -0,0 +1,29 @@
1
+ #
2
+ # This is a sample user dictionary for Kuromoji (JapaneseTokenizer)
3
+ #
4
+ # Add entries to this file in order to override the statistical model in terms
5
+ # of segmentation, readings and part-of-speech tags. Notice that entries do
6
+ # not have weights since they are always used when found. This is by-design
7
+ # in order to maximize ease-of-use.
8
+ #
9
+ # Entries are defined using the following CSV format:
10
+ # <text>,<token 1> ... <token n>,<reading 1> ... <reading n>,<part-of-speech tag>
11
+ #
12
+ # Notice that a single half-width space separates tokens and readings, and
13
+ # that the number of tokens and readings must match exactly.
14
+ #
15
+ # Also notice that the behavior of multiple entries with the same <text> is undefined.
16
+ #
17
+ # Whitespace only lines are ignored. Comments are not allowed on entry lines.
18
+ #
19
+
20
+ # Custom segmentation for kanji compounds
21
+ 日本経済新聞,日本 経済 新聞,ニホン ケイザイ シンブン,カスタム名詞
22
+ 関西国際空港,関西 国際 空港,カンサイ コクサイ クウコウ,カスタム名詞
23
+
24
+ # Custom segmentation for compound katakana
25
+ トートバッグ,トート バッグ,トート バッグ,かずカナ名詞
26
+ ショルダーバッグ,ショルダー バッグ,ショルダー バッグ,かずカナ名詞
27
+
28
+ # Custom reading for former sumo wrestler
29
+ 朝青龍,朝青龍,アサショウリュウ,カスタム人名
@@ -0,0 +1,246 @@
1
+ # The ASF licenses this file to You under the Apache License, Version 2.0
2
+ # (the "License"); you may not use this file except in compliance with
3
+ # the License. You may obtain a copy of the License at
4
+ #
5
+ # http://www.apache.org/licenses/LICENSE-2.0
6
+ #
7
+ # Unless required by applicable law or agreed to in writing, software
8
+ # distributed under the License is distributed on an "AS IS" BASIS,
9
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
10
+ # See the License for the specific language governing permissions and
11
+ # limitations under the License.
12
+
13
+ # Syntax:
14
+ # "source" => "target"
15
+ # "source".length() > 0 (source cannot be empty.)
16
+ # "target".length() >= 0 (target can be empty.)
17
+
18
+ # example:
19
+ # "À" => "A"
20
+ # "\u00C0" => "A"
21
+ # "\u00C0" => "\u0041"
22
+ # "ß" => "ss"
23
+ # "\t" => " "
24
+ # "\n" => ""
25
+
26
+ # À => A
27
+ "\u00C0" => "A"
28
+
29
+ # Á => A
30
+ "\u00C1" => "A"
31
+
32
+ # Â => A
33
+ "\u00C2" => "A"
34
+
35
+ # Ã => A
36
+ "\u00C3" => "A"
37
+
38
+ # Ä => A
39
+ "\u00C4" => "A"
40
+
41
+ # Å => A
42
+ "\u00C5" => "A"
43
+
44
+ # Æ => AE
45
+ "\u00C6" => "AE"
46
+
47
+ # Ç => C
48
+ "\u00C7" => "C"
49
+
50
+ # È => E
51
+ "\u00C8" => "E"
52
+
53
+ # É => E
54
+ "\u00C9" => "E"
55
+
56
+ # Ê => E
57
+ "\u00CA" => "E"
58
+
59
+ # Ë => E
60
+ "\u00CB" => "E"
61
+
62
+ # Ì => I
63
+ "\u00CC" => "I"
64
+
65
+ # Í => I
66
+ "\u00CD" => "I"
67
+
68
+ # Î => I
69
+ "\u00CE" => "I"
70
+
71
+ # Ï => I
72
+ "\u00CF" => "I"
73
+
74
+ # Ĳ => IJ
75
+ "\u0132" => "IJ"
76
+
77
+ # Ð => D
78
+ "\u00D0" => "D"
79
+
80
+ # Ñ => N
81
+ "\u00D1" => "N"
82
+
83
+ # Ò => O
84
+ "\u00D2" => "O"
85
+
86
+ # Ó => O
87
+ "\u00D3" => "O"
88
+
89
+ # Ô => O
90
+ "\u00D4" => "O"
91
+
92
+ # Õ => O
93
+ "\u00D5" => "O"
94
+
95
+ # Ö => O
96
+ "\u00D6" => "O"
97
+
98
+ # Ø => O
99
+ "\u00D8" => "O"
100
+
101
+ # Œ => OE
102
+ "\u0152" => "OE"
103
+
104
+ # Þ => TH
105
+ "\u00DE" => "TH"
106
+
107
+ # Ù => U
108
+ "\u00D9" => "U"
109
+
110
+ # Ú => U
111
+ "\u00DA" => "U"
112
+
113
+ # Û => U
114
+ "\u00DB" => "U"
115
+
116
+ # Ü => U
117
+ "\u00DC" => "U"
118
+
119
+ # Ý => Y
120
+ "\u00DD" => "Y"
121
+
122
+ # Ÿ => Y
123
+ "\u0178" => "Y"
124
+
125
+ # à => a
126
+ "\u00E0" => "a"
127
+
128
+ # á => a
129
+ "\u00E1" => "a"
130
+
131
+ # â => a
132
+ "\u00E2" => "a"
133
+
134
+ # ã => a
135
+ "\u00E3" => "a"
136
+
137
+ # ä => a
138
+ "\u00E4" => "a"
139
+
140
+ # å => a
141
+ "\u00E5" => "a"
142
+
143
+ # æ => ae
144
+ "\u00E6" => "ae"
145
+
146
+ # ç => c
147
+ "\u00E7" => "c"
148
+
149
+ # è => e
150
+ "\u00E8" => "e"
151
+
152
+ # é => e
153
+ "\u00E9" => "e"
154
+
155
+ # ê => e
156
+ "\u00EA" => "e"
157
+
158
+ # ë => e
159
+ "\u00EB" => "e"
160
+
161
+ # ì => i
162
+ "\u00EC" => "i"
163
+
164
+ # í => i
165
+ "\u00ED" => "i"
166
+
167
+ # î => i
168
+ "\u00EE" => "i"
169
+
170
+ # ï => i
171
+ "\u00EF" => "i"
172
+
173
+ # ĳ => ij
174
+ "\u0133" => "ij"
175
+
176
+ # ð => d
177
+ "\u00F0" => "d"
178
+
179
+ # ñ => n
180
+ "\u00F1" => "n"
181
+
182
+ # ò => o
183
+ "\u00F2" => "o"
184
+
185
+ # ó => o
186
+ "\u00F3" => "o"
187
+
188
+ # ô => o
189
+ "\u00F4" => "o"
190
+
191
+ # õ => o
192
+ "\u00F5" => "o"
193
+
194
+ # ö => o
195
+ "\u00F6" => "o"
196
+
197
+ # ø => o
198
+ "\u00F8" => "o"
199
+
200
+ # œ => oe
201
+ "\u0153" => "oe"
202
+
203
+ # ß => ss
204
+ "\u00DF" => "ss"
205
+
206
+ # þ => th
207
+ "\u00FE" => "th"
208
+
209
+ # ù => u
210
+ "\u00F9" => "u"
211
+
212
+ # ú => u
213
+ "\u00FA" => "u"
214
+
215
+ # û => u
216
+ "\u00FB" => "u"
217
+
218
+ # ü => u
219
+ "\u00FC" => "u"
220
+
221
+ # ý => y
222
+ "\u00FD" => "y"
223
+
224
+ # ÿ => y
225
+ "\u00FF" => "y"
226
+
227
+ # ﬀ => ff
228
+ "\uFB00" => "ff"
229
+
230
+ # ﬁ => fi
231
+ "\uFB01" => "fi"
232
+
233
+ # ﬂ => fl
234
+ "\uFB02" => "fl"
235
+
236
+ # ﬃ => ffi
237
+ "\uFB03" => "ffi"
238
+
239
+ # ﬄ => ffl
240
+ "\uFB04" => "ffl"
241
+
242
+ # ﬅ => ft
243
+ "\uFB05" => "ft"
244
+
245
+ # ﬆ => st
246
+ "\uFB06" => "st"