blacklight-citeproc 0.0.5 → 0.1.0
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +4 -4
- data/.env +3 -0
- data/.internal_test_app/solr/conf/_rest_managed.json +3 -0
- data/.internal_test_app/solr/conf/admin-extra.html +31 -0
- data/.internal_test_app/solr/conf/currency.xml +67 -0
- data/.internal_test_app/solr/conf/email_url_types.txt +2 -0
- data/.internal_test_app/solr/conf/lang/contractions_ca.txt +8 -0
- data/.internal_test_app/solr/conf/lang/contractions_fr.txt +15 -0
- data/.internal_test_app/solr/conf/lang/contractions_ga.txt +5 -0
- data/.internal_test_app/solr/conf/lang/contractions_it.txt +23 -0
- data/.internal_test_app/solr/conf/lang/hyphenations_ga.txt +5 -0
- data/.internal_test_app/solr/conf/lang/stemdict_nl.txt +6 -0
- data/.internal_test_app/solr/conf/lang/stoptags_ja.txt +420 -0
- data/.internal_test_app/solr/conf/lang/stopwords_ar.txt +125 -0
- data/.internal_test_app/solr/conf/lang/stopwords_bg.txt +193 -0
- data/.internal_test_app/solr/conf/lang/stopwords_ca.txt +220 -0
- data/.internal_test_app/solr/conf/lang/stopwords_cz.txt +172 -0
- data/.internal_test_app/solr/conf/lang/stopwords_da.txt +110 -0
- data/.internal_test_app/solr/conf/lang/stopwords_de.txt +294 -0
- data/.internal_test_app/solr/conf/lang/stopwords_el.txt +78 -0
- data/.internal_test_app/solr/conf/lang/stopwords_en.txt +54 -0
- data/.internal_test_app/solr/conf/lang/stopwords_es.txt +356 -0
- data/.internal_test_app/solr/conf/lang/stopwords_eu.txt +99 -0
- data/.internal_test_app/solr/conf/lang/stopwords_fa.txt +313 -0
- data/.internal_test_app/solr/conf/lang/stopwords_fi.txt +97 -0
- data/.internal_test_app/solr/conf/lang/stopwords_fr.txt +186 -0
- data/.internal_test_app/solr/conf/lang/stopwords_ga.txt +110 -0
- data/.internal_test_app/solr/conf/lang/stopwords_gl.txt +161 -0
- data/.internal_test_app/solr/conf/lang/stopwords_hi.txt +235 -0
- data/.internal_test_app/solr/conf/lang/stopwords_hu.txt +211 -0
- data/.internal_test_app/solr/conf/lang/stopwords_hy.txt +46 -0
- data/.internal_test_app/solr/conf/lang/stopwords_id.txt +359 -0
- data/.internal_test_app/solr/conf/lang/stopwords_it.txt +303 -0
- data/.internal_test_app/solr/conf/lang/stopwords_ja.txt +127 -0
- data/.internal_test_app/solr/conf/lang/stopwords_lv.txt +172 -0
- data/.internal_test_app/solr/conf/lang/stopwords_nl.txt +119 -0
- data/.internal_test_app/solr/conf/lang/stopwords_no.txt +194 -0
- data/.internal_test_app/solr/conf/lang/stopwords_pt.txt +253 -0
- data/.internal_test_app/solr/conf/lang/stopwords_ro.txt +233 -0
- data/.internal_test_app/solr/conf/lang/stopwords_ru.txt +243 -0
- data/.internal_test_app/solr/conf/lang/stopwords_sv.txt +133 -0
- data/.internal_test_app/solr/conf/lang/stopwords_th.txt +119 -0
- data/.internal_test_app/solr/conf/lang/stopwords_tr.txt +212 -0
- data/.internal_test_app/solr/conf/lang/userdict_ja.txt +29 -0
- data/.internal_test_app/solr/conf/mapping-ISOLatin1Accent.txt +246 -0
- data/.internal_test_app/solr/conf/protwords.txt +21 -0
- data/.internal_test_app/solr/conf/schema.xml +408 -0
- data/.internal_test_app/solr/conf/scripts.conf +24 -0
- data/.internal_test_app/solr/conf/solrconfig.xml +1287 -0
- data/.internal_test_app/solr/conf/spellings.txt +2 -0
- data/.internal_test_app/solr/conf/stopwords.txt +14 -0
- data/.internal_test_app/solr/conf/stopwords_en.txt +58 -0
- data/.internal_test_app/solr/conf/synonyms.txt +13 -0
- data/.internal_test_app/solr/conf/update-script.js +115 -0
- data/.internal_test_app/solr/conf/velocity/browse.vm +32 -0
- data/.internal_test_app/solr/conf/velocity/dropit.js +0 -0
- data/.internal_test_app/solr/conf/velocity/facet_doc_type.vm +2 -0
- data/.internal_test_app/solr/conf/velocity/facet_text_shingles.vm +12 -0
- data/.internal_test_app/solr/conf/velocity/facets.vm +24 -0
- data/.internal_test_app/solr/conf/velocity/footer.vm +29 -0
- data/.internal_test_app/solr/conf/velocity/head.vm +290 -0
- data/.internal_test_app/solr/conf/velocity/hit.vm +77 -0
- data/.internal_test_app/solr/conf/velocity/img/english_640.png +0 -0
- data/.internal_test_app/solr/conf/velocity/img/france_640.png +0 -0
- data/.internal_test_app/solr/conf/velocity/img/germany_640.png +0 -0
- data/.internal_test_app/solr/conf/velocity/img/globe_256.png +0 -0
- data/.internal_test_app/solr/conf/velocity/jquery.tx3-tag-cloud.js +0 -0
- data/.internal_test_app/solr/conf/velocity/js/dropit.js +97 -0
- data/.internal_test_app/solr/conf/velocity/js/jquery.autocomplete.js +763 -0
- data/.internal_test_app/solr/conf/velocity/js/jquery.tx3-tag-cloud.js +70 -0
- data/.internal_test_app/solr/conf/velocity/layout.vm +42 -0
- data/.internal_test_app/solr/conf/velocity/macros.vm +16 -0
- data/.internal_test_app/solr/conf/velocity/mime_type_lists.vm +68 -0
- data/.internal_test_app/solr/conf/velocity/results.vm +20 -0
- data/.internal_test_app/solr/conf/velocity/results_list.vm +21 -0
- data/.internal_test_app/solr/conf/xslt/example.xsl +132 -0
- data/.internal_test_app/solr/conf/xslt/example_atom.xsl +67 -0
- data/.internal_test_app/solr/conf/xslt/example_rss.xsl +66 -0
- data/.internal_test_app/solr/conf/xslt/luke.xsl +337 -0
- data/Dockerfile +43 -0
- data/README.md +3 -0
- data/bin/entrypoint.sh +8 -0
- data/docker-compose.yml +33 -0
- data/lib/blacklight/citeproc/version.rb +1 -1
- metadata +83 -2
@@ -0,0 +1,356 @@
|
|
1
|
+
| From svn.tartarus.org/snowball/trunk/website/algorithms/spanish/stop.txt
|
2
|
+
| This file is distributed under the BSD License.
|
3
|
+
| See http://snowball.tartarus.org/license.php
|
4
|
+
| Also see http://www.opensource.org/licenses/bsd-license.html
|
5
|
+
| - Encoding was converted to UTF-8.
|
6
|
+
| - This notice was added.
|
7
|
+
|
|
8
|
+
| NOTE: To use this file with StopFilterFactory, you must specify format="snowball"
|
9
|
+
|
10
|
+
| A Spanish stop word list. Comments begin with vertical bar. Each stop
|
11
|
+
| word is at the start of a line.
|
12
|
+
|
13
|
+
|
14
|
+
| The following is a ranked list (commonest to rarest) of stopwords
|
15
|
+
| deriving from a large sample of text.
|
16
|
+
|
17
|
+
| Extra words have been added at the end.
|
18
|
+
|
19
|
+
de | from, of
|
20
|
+
la | the, her
|
21
|
+
que | who, that
|
22
|
+
el | the
|
23
|
+
en | in
|
24
|
+
y | and
|
25
|
+
a | to
|
26
|
+
los | the, them
|
27
|
+
del | de + el
|
28
|
+
se | himself, from him etc
|
29
|
+
las | the, them
|
30
|
+
por | for, by, etc
|
31
|
+
un | a
|
32
|
+
para | for
|
33
|
+
con | with
|
34
|
+
no | no
|
35
|
+
una | a
|
36
|
+
su | his, her
|
37
|
+
al | a + el
|
38
|
+
| es from SER
|
39
|
+
lo | him
|
40
|
+
como | how
|
41
|
+
más | more
|
42
|
+
pero | but
|
43
|
+
sus | su plural
|
44
|
+
le | to him, her
|
45
|
+
ya | already
|
46
|
+
o | or
|
47
|
+
| fue from SER
|
48
|
+
este | this
|
49
|
+
| ha from HABER
|
50
|
+
sí | himself etc
|
51
|
+
porque | because
|
52
|
+
esta | this
|
53
|
+
| son from SER
|
54
|
+
entre | between
|
55
|
+
| está from ESTAR
|
56
|
+
cuando | when
|
57
|
+
muy | very
|
58
|
+
sin | without
|
59
|
+
sobre | on
|
60
|
+
| ser from SER
|
61
|
+
| tiene from TENER
|
62
|
+
también | also
|
63
|
+
me | me
|
64
|
+
hasta | until
|
65
|
+
hay | there is/are
|
66
|
+
donde | where
|
67
|
+
| han from HABER
|
68
|
+
quien | whom, that
|
69
|
+
| están from ESTAR
|
70
|
+
| estado from ESTAR
|
71
|
+
desde | from
|
72
|
+
todo | all
|
73
|
+
nos | us
|
74
|
+
durante | during
|
75
|
+
| estados from ESTAR
|
76
|
+
todos | all
|
77
|
+
uno | a
|
78
|
+
les | to them
|
79
|
+
ni | nor
|
80
|
+
contra | against
|
81
|
+
otros | other
|
82
|
+
| fueron from SER
|
83
|
+
ese | that
|
84
|
+
eso | that
|
85
|
+
| había from HABER
|
86
|
+
ante | before
|
87
|
+
ellos | they
|
88
|
+
e | and (variant of y)
|
89
|
+
esto | this
|
90
|
+
mí | me
|
91
|
+
antes | before
|
92
|
+
algunos | some
|
93
|
+
qué | what?
|
94
|
+
unos | a
|
95
|
+
yo | I
|
96
|
+
otro | other
|
97
|
+
otras | other
|
98
|
+
otra | other
|
99
|
+
él | he
|
100
|
+
tanto | so much, many
|
101
|
+
esa | that
|
102
|
+
estos | these
|
103
|
+
mucho | much, many
|
104
|
+
quienes | who
|
105
|
+
nada | nothing
|
106
|
+
muchos | many
|
107
|
+
cual | who
|
108
|
+
| sea from SER
|
109
|
+
poco | few
|
110
|
+
ella | she
|
111
|
+
estar | to be
|
112
|
+
| haber from HABER
|
113
|
+
estas | these
|
114
|
+
| estaba from ESTAR
|
115
|
+
| estamos from ESTAR
|
116
|
+
algunas | some
|
117
|
+
algo | something
|
118
|
+
nosotros | we
|
119
|
+
|
120
|
+
| other forms
|
121
|
+
|
122
|
+
mi | my
|
123
|
+
mis | mi plural
|
124
|
+
tú | thou
|
125
|
+
te | thee
|
126
|
+
ti | thee
|
127
|
+
tu | thy
|
128
|
+
tus | tu plural
|
129
|
+
ellas | they
|
130
|
+
nosotras | we
|
131
|
+
vosotros | you
|
132
|
+
vosotras | you
|
133
|
+
os | you
|
134
|
+
mío | mine
|
135
|
+
mía |
|
136
|
+
míos |
|
137
|
+
mías |
|
138
|
+
tuyo | thine
|
139
|
+
tuya |
|
140
|
+
tuyos |
|
141
|
+
tuyas |
|
142
|
+
suyo | his, hers, theirs
|
143
|
+
suya |
|
144
|
+
suyos |
|
145
|
+
suyas |
|
146
|
+
nuestro | ours
|
147
|
+
nuestra |
|
148
|
+
nuestros |
|
149
|
+
nuestras |
|
150
|
+
vuestro | yours
|
151
|
+
vuestra |
|
152
|
+
vuestros |
|
153
|
+
vuestras |
|
154
|
+
esos | those
|
155
|
+
esas | those
|
156
|
+
|
157
|
+
| forms of estar, to be (not including the infinitive):
|
158
|
+
estoy
|
159
|
+
estás
|
160
|
+
está
|
161
|
+
estamos
|
162
|
+
estáis
|
163
|
+
están
|
164
|
+
esté
|
165
|
+
estés
|
166
|
+
estemos
|
167
|
+
estéis
|
168
|
+
estén
|
169
|
+
estaré
|
170
|
+
estarás
|
171
|
+
estará
|
172
|
+
estaremos
|
173
|
+
estaréis
|
174
|
+
estarán
|
175
|
+
estaría
|
176
|
+
estarías
|
177
|
+
estaríamos
|
178
|
+
estaríais
|
179
|
+
estarían
|
180
|
+
estaba
|
181
|
+
estabas
|
182
|
+
estábamos
|
183
|
+
estabais
|
184
|
+
estaban
|
185
|
+
estuve
|
186
|
+
estuviste
|
187
|
+
estuvo
|
188
|
+
estuvimos
|
189
|
+
estuvisteis
|
190
|
+
estuvieron
|
191
|
+
estuviera
|
192
|
+
estuvieras
|
193
|
+
estuviéramos
|
194
|
+
estuvierais
|
195
|
+
estuvieran
|
196
|
+
estuviese
|
197
|
+
estuvieses
|
198
|
+
estuviésemos
|
199
|
+
estuvieseis
|
200
|
+
estuviesen
|
201
|
+
estando
|
202
|
+
estado
|
203
|
+
estada
|
204
|
+
estados
|
205
|
+
estadas
|
206
|
+
estad
|
207
|
+
|
208
|
+
| forms of haber, to have (not including the infinitive):
|
209
|
+
he
|
210
|
+
has
|
211
|
+
ha
|
212
|
+
hemos
|
213
|
+
habéis
|
214
|
+
han
|
215
|
+
haya
|
216
|
+
hayas
|
217
|
+
hayamos
|
218
|
+
hayáis
|
219
|
+
hayan
|
220
|
+
habré
|
221
|
+
habrás
|
222
|
+
habrá
|
223
|
+
habremos
|
224
|
+
habréis
|
225
|
+
habrán
|
226
|
+
habría
|
227
|
+
habrías
|
228
|
+
habríamos
|
229
|
+
habríais
|
230
|
+
habrían
|
231
|
+
había
|
232
|
+
habías
|
233
|
+
habíamos
|
234
|
+
habíais
|
235
|
+
habían
|
236
|
+
hube
|
237
|
+
hubiste
|
238
|
+
hubo
|
239
|
+
hubimos
|
240
|
+
hubisteis
|
241
|
+
hubieron
|
242
|
+
hubiera
|
243
|
+
hubieras
|
244
|
+
hubiéramos
|
245
|
+
hubierais
|
246
|
+
hubieran
|
247
|
+
hubiese
|
248
|
+
hubieses
|
249
|
+
hubiésemos
|
250
|
+
hubieseis
|
251
|
+
hubiesen
|
252
|
+
habiendo
|
253
|
+
habido
|
254
|
+
habida
|
255
|
+
habidos
|
256
|
+
habidas
|
257
|
+
|
258
|
+
| forms of ser, to be (not including the infinitive):
|
259
|
+
soy
|
260
|
+
eres
|
261
|
+
es
|
262
|
+
somos
|
263
|
+
sois
|
264
|
+
son
|
265
|
+
sea
|
266
|
+
seas
|
267
|
+
seamos
|
268
|
+
seáis
|
269
|
+
sean
|
270
|
+
seré
|
271
|
+
serás
|
272
|
+
será
|
273
|
+
seremos
|
274
|
+
seréis
|
275
|
+
serán
|
276
|
+
sería
|
277
|
+
serías
|
278
|
+
seríamos
|
279
|
+
seríais
|
280
|
+
serían
|
281
|
+
era
|
282
|
+
eras
|
283
|
+
éramos
|
284
|
+
erais
|
285
|
+
eran
|
286
|
+
fui
|
287
|
+
fuiste
|
288
|
+
fue
|
289
|
+
fuimos
|
290
|
+
fuisteis
|
291
|
+
fueron
|
292
|
+
fuera
|
293
|
+
fueras
|
294
|
+
fuéramos
|
295
|
+
fuerais
|
296
|
+
fueran
|
297
|
+
fuese
|
298
|
+
fueses
|
299
|
+
fuésemos
|
300
|
+
fueseis
|
301
|
+
fuesen
|
302
|
+
siendo
|
303
|
+
sido
|
304
|
+
| sed also means 'thirst'
|
305
|
+
|
306
|
+
| forms of tener, to have (not including the infinitive):
|
307
|
+
tengo
|
308
|
+
tienes
|
309
|
+
tiene
|
310
|
+
tenemos
|
311
|
+
tenéis
|
312
|
+
tienen
|
313
|
+
tenga
|
314
|
+
tengas
|
315
|
+
tengamos
|
316
|
+
tengáis
|
317
|
+
tengan
|
318
|
+
tendré
|
319
|
+
tendrás
|
320
|
+
tendrá
|
321
|
+
tendremos
|
322
|
+
tendréis
|
323
|
+
tendrán
|
324
|
+
tendría
|
325
|
+
tendrías
|
326
|
+
tendríamos
|
327
|
+
tendríais
|
328
|
+
tendrían
|
329
|
+
tenía
|
330
|
+
tenías
|
331
|
+
teníamos
|
332
|
+
teníais
|
333
|
+
tenían
|
334
|
+
tuve
|
335
|
+
tuviste
|
336
|
+
tuvo
|
337
|
+
tuvimos
|
338
|
+
tuvisteis
|
339
|
+
tuvieron
|
340
|
+
tuviera
|
341
|
+
tuvieras
|
342
|
+
tuviéramos
|
343
|
+
tuvierais
|
344
|
+
tuvieran
|
345
|
+
tuviese
|
346
|
+
tuvieses
|
347
|
+
tuviésemos
|
348
|
+
tuvieseis
|
349
|
+
tuviesen
|
350
|
+
teniendo
|
351
|
+
tenido
|
352
|
+
tenida
|
353
|
+
tenidos
|
354
|
+
tenidas
|
355
|
+
tened
|
356
|
+
|
@@ -0,0 +1,99 @@
|
|
1
|
+
# example set of Basque stopwords
|
2
|
+
al
|
3
|
+
anitz
|
4
|
+
arabera
|
5
|
+
asko
|
6
|
+
baina
|
7
|
+
bat
|
8
|
+
batean
|
9
|
+
batek
|
10
|
+
bati
|
11
|
+
batzuei
|
12
|
+
batzuek
|
13
|
+
batzuetan
|
14
|
+
batzuk
|
15
|
+
bera
|
16
|
+
beraiek
|
17
|
+
berau
|
18
|
+
berauek
|
19
|
+
bere
|
20
|
+
berori
|
21
|
+
beroriek
|
22
|
+
beste
|
23
|
+
bezala
|
24
|
+
da
|
25
|
+
dago
|
26
|
+
dira
|
27
|
+
ditu
|
28
|
+
du
|
29
|
+
dute
|
30
|
+
edo
|
31
|
+
egin
|
32
|
+
ere
|
33
|
+
eta
|
34
|
+
eurak
|
35
|
+
ez
|
36
|
+
gainera
|
37
|
+
gu
|
38
|
+
gutxi
|
39
|
+
guzti
|
40
|
+
haiei
|
41
|
+
haiek
|
42
|
+
haietan
|
43
|
+
hainbeste
|
44
|
+
hala
|
45
|
+
han
|
46
|
+
handik
|
47
|
+
hango
|
48
|
+
hara
|
49
|
+
hari
|
50
|
+
hark
|
51
|
+
hartan
|
52
|
+
hau
|
53
|
+
hauei
|
54
|
+
hauek
|
55
|
+
hauetan
|
56
|
+
hemen
|
57
|
+
hemendik
|
58
|
+
hemengo
|
59
|
+
hi
|
60
|
+
hona
|
61
|
+
honek
|
62
|
+
honela
|
63
|
+
honetan
|
64
|
+
honi
|
65
|
+
hor
|
66
|
+
hori
|
67
|
+
horiei
|
68
|
+
horiek
|
69
|
+
horietan
|
70
|
+
horko
|
71
|
+
horra
|
72
|
+
horrek
|
73
|
+
horrela
|
74
|
+
horretan
|
75
|
+
horri
|
76
|
+
hortik
|
77
|
+
hura
|
78
|
+
izan
|
79
|
+
ni
|
80
|
+
noiz
|
81
|
+
nola
|
82
|
+
non
|
83
|
+
nondik
|
84
|
+
nongo
|
85
|
+
nor
|
86
|
+
nora
|
87
|
+
ze
|
88
|
+
zein
|
89
|
+
zen
|
90
|
+
zenbait
|
91
|
+
zenbat
|
92
|
+
zer
|
93
|
+
zergatik
|
94
|
+
ziren
|
95
|
+
zituen
|
96
|
+
zu
|
97
|
+
zuek
|
98
|
+
zuen
|
99
|
+
zuten
|