stopwords-filter2 0.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (46) hide show
  1. checksums.yaml +7 -0
  2. data/CHANGELOG.md +7 -0
  3. data/Gemfile +8 -0
  4. data/Gemfile.lock +38 -0
  5. data/LICENSE.txt +20 -0
  6. data/README.md +184 -0
  7. data/VERSION +1 -0
  8. data/lib/stopwords/filter.rb +21 -0
  9. data/lib/stopwords/snowball/filter.rb +16 -0
  10. data/lib/stopwords/snowball/locales/af.csv +1 -0
  11. data/lib/stopwords/snowball/locales/ar.csv +1 -0
  12. data/lib/stopwords/snowball/locales/bg.csv +1 -0
  13. data/lib/stopwords/snowball/locales/bn.csv +1 -0
  14. data/lib/stopwords/snowball/locales/br.csv +1 -0
  15. data/lib/stopwords/snowball/locales/ca.csv +1 -0
  16. data/lib/stopwords/snowball/locales/cs.csv +1 -0
  17. data/lib/stopwords/snowball/locales/da.csv +1 -0
  18. data/lib/stopwords/snowball/locales/de.csv +1 -0
  19. data/lib/stopwords/snowball/locales/el.csv +1 -0
  20. data/lib/stopwords/snowball/locales/en.csv +1 -0
  21. data/lib/stopwords/snowball/locales/es.csv +1 -0
  22. data/lib/stopwords/snowball/locales/fi.csv +1 -0
  23. data/lib/stopwords/snowball/locales/fn.csv +1 -0
  24. data/lib/stopwords/snowball/locales/fr.csv +1 -0
  25. data/lib/stopwords/snowball/locales/he.csv +1 -0
  26. data/lib/stopwords/snowball/locales/hu.csv +1 -0
  27. data/lib/stopwords/snowball/locales/id.csv +1 -0
  28. data/lib/stopwords/snowball/locales/it.csv +1 -0
  29. data/lib/stopwords/snowball/locales/ko.csv +1 -0
  30. data/lib/stopwords/snowball/locales/nl.csv +1 -0
  31. data/lib/stopwords/snowball/locales/pl.csv +1 -0
  32. data/lib/stopwords/snowball/locales/pt.csv +1 -0
  33. data/lib/stopwords/snowball/locales/ro.csv +1 -0
  34. data/lib/stopwords/snowball/locales/ru.csv +1 -0
  35. data/lib/stopwords/snowball/locales/sv.csv +1 -0
  36. data/lib/stopwords/snowball/locales/th.csv +1 -0
  37. data/lib/stopwords/snowball/locales/tr.csv +1 -0
  38. data/lib/stopwords/snowball/locales/vi.csv +1 -0
  39. data/lib/stopwords/snowball/locales/zh.csv +1 -0
  40. data/lib/stopwords/snowball/wordsieve.rb +20 -0
  41. data/lib/stopwords/snowball.rb +4 -0
  42. data/lib/stopwords.rb +4 -0
  43. data/spec/lib/filter_spec.rb +18 -0
  44. data/spec/lib/snowball_filter_spec.rb +40 -0
  45. data/spec/spec_helper.rb +1 -0
  46. metadata +91 -0
checksums.yaml ADDED
@@ -0,0 +1,7 @@
1
+ ---
2
+ SHA256:
3
+ metadata.gz: eda276cb0f1bc6ea398a56a79df0ed323076a0ec5e88a0dda8013c91e2c79416
4
+ data.tar.gz: 279865db59b5cd5d3b68187abf3037ebcf2edbd610cbb124f756f4ae4e3d8de9
5
+ SHA512:
6
+ metadata.gz: 4f52ec84821ac4ea97e1b1ee727a3d3caba73398e14170e308286b7706013557768660a5d4c93f2cc96148418527f2c47392ef5e4b2c692f7159ac21d8d46260
7
+ data.tar.gz: 506e1fc9c66ef5fa72b516ce8e7ac8a1931e4da85fe678a940de3e3fb899fb83f7b45d725abf89560b9c0c08cb2434181db664b90f9919de831d90a119bf5c83
data/CHANGELOG.md ADDED
@@ -0,0 +1,7 @@
1
+ # Changelog
2
+
3
+ ## v0.1.0
4
+ * Support Ruby 3.2
5
+ * Requires Ruby >= 2.4
6
+ * Update bundler to 2.1.4
7
+ * Remove calls to the deprecated `File.exists?`. Thanks to [@mgmodell] for the original submission.
data/Gemfile ADDED
@@ -0,0 +1,8 @@
1
+ # A sample Gemfile
2
+ source "https://rubygems.org"
3
+
4
+ group :test do
5
+ gem "rspec"
6
+ gem "rspec_junit_formatter", require: false
7
+ gem "jeweler", "1.8.4"
8
+ end
data/Gemfile.lock ADDED
@@ -0,0 +1,38 @@
1
+ GEM
2
+ remote: https://rubygems.org/
3
+ specs:
4
+ diff-lcs (1.3)
5
+ git (1.3.0)
6
+ jeweler (1.8.4)
7
+ bundler (~> 1.0)
8
+ git (>= 1.2.5)
9
+ rake
10
+ rdoc
11
+ rake (13.0.3)
12
+ rdoc (6.3.2)
13
+ rspec (3.5.0)
14
+ rspec-core (~> 3.5.0)
15
+ rspec-expectations (~> 3.5.0)
16
+ rspec-mocks (~> 3.5.0)
17
+ rspec-core (3.5.4)
18
+ rspec-support (~> 3.5.0)
19
+ rspec-expectations (3.5.0)
20
+ diff-lcs (>= 1.2.0, < 2.0)
21
+ rspec-support (~> 3.5.0)
22
+ rspec-mocks (3.5.0)
23
+ diff-lcs (>= 1.2.0, < 2.0)
24
+ rspec-support (~> 3.5.0)
25
+ rspec-support (3.5.0)
26
+ rspec_junit_formatter (0.6.0)
27
+ rspec-core (>= 2, < 4, != 2.12.0)
28
+
29
+ PLATFORMS
30
+ ruby
31
+
32
+ DEPENDENCIES
33
+ jeweler (= 1.8.4)
34
+ rspec
35
+ rspec_junit_formatter
36
+
37
+ BUNDLED WITH
38
+ 2.1.4
data/LICENSE.txt ADDED
@@ -0,0 +1,20 @@
1
+ Copyright (c) 2012 David J. Brenes
2
+
3
+ Permission is hereby granted, free of charge, to any person obtaining
4
+ a copy of this software and associated documentation files (the
5
+ "Software"), to deal in the Software without restriction, including
6
+ without limitation the rights to use, copy, modify, merge, publish,
7
+ distribute, sublicense, and/or sell copies of the Software, and to
8
+ permit persons to whom the Software is furnished to do so, subject to
9
+ the following conditions:
10
+
11
+ The above copyright notice and this permission notice shall be
12
+ included in all copies or substantial portions of the Software.
13
+
14
+ THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
15
+ EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
16
+ MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
17
+ NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE
18
+ LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
19
+ OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
20
+ WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
data/README.md ADDED
@@ -0,0 +1,184 @@
1
+ Stopwords Filter (2)
2
+ ================
3
+
4
+ This project is a fork of a very simple and naive implementation of a stopwords filter by @brenes. It removes a list of banned words (stopwords) from a sentence.
5
+
6
+ Since the original repository appears to be no longer maintained, this fork aims to keep the project maintained and usable across current and future ruby versions.
7
+
8
+ Quick guide
9
+ -----------
10
+
11
+ * Install
12
+
13
+ just type
14
+
15
+ ```
16
+ gem install stopwords-filter2
17
+ ```
18
+
19
+ or
20
+
21
+ ```
22
+ # Don't forget the 'require:'
23
+ gem 'stopwords-filter2', require: 'stopwords'
24
+ ```
25
+
26
+ in your Gemfile.
27
+
28
+ * Use it
29
+
30
+ 1. Simple version
31
+
32
+ ```
33
+ stopwords = ['by', 'written', 'from']
34
+ filter = Stopwords::Filter.new stopwords
35
+
36
+ filter.filter 'guide by douglas adams'.split
37
+ # ['guide', 'douglas', 'adams']
38
+
39
+ filter.stopword? 'by'
40
+ # true
41
+ ```
42
+
43
+ 2. Snowball version
44
+
45
+
46
+ ```
47
+ filter = Stopwords::Snowball::Filter.new "en"
48
+ filter.filter 'guide by douglas adams'.split
49
+ # ['guide', 'douglas', 'adams']
50
+
51
+ filter.stopword? 'by'
52
+ # true
53
+ ```
54
+
55
+ 2.1 Snowball version with Sieve class (thanks to @s2gatev)
56
+
57
+ ```ruby
58
+ sieve = Stopwords::Snowball::WordSieve.new
59
+
60
+ filtered = sieve.filter lang: :en, words: 'guide by douglas adams'.split
61
+ # filtered = ['guide', 'douglas', 'adams']
62
+
63
+ sieve.stopword? lang: :en, word: 'by'
64
+ # true
65
+ ```
66
+
67
+
68
+
69
+ What is a Stopword?
70
+ -------------------
71
+
72
+ According to [Wikipedia][wikipedia_stopwords]
73
+
74
+ > In computing, stop words are words which are filtered out prior to, or after, processing of natural language data (text).
75
+
76
+ And that's it. Words that are removed before you perform some task on the rest of them.
77
+
78
+ Why would I want to remove anything?
79
+ ------------------------------------
80
+
81
+ Imagine you have a database of products and you want your customers to search on them. You can't use a proper search engine (such as [Solr][solr], [Sphinx][sphinx] or even [Google][google]), nor the full-text search systems of popular databases such as [PostgreSQL][postgre]. You are left alone with LIKEs and %.
82
+
83
+ You have your fake search engine working. Someone searches 'Guide Douglas Adams' and you find 'Douglas Adams - Hitchhiker's guide to the galaxy'. Everything is perfect.
84
+
85
+ But then someone searches 'guide by douglas adams' and you don't find anything. You don't have any 'by' in the description or title of the book! Most importantly, you don't need that 'by'!
86
+
87
+ You wish you could get rid of all those 'by' or 'written' or 'from', huh? That's why we are here!
88
+
89
+ How does this thing work?
90
+ ---------------------
91
+
92
+ The main class of this 'library' is `Stopwords::Filter`. You just create a new object with an array of stopwords:
93
+
94
+ ```
95
+ stopwords = ['by', 'written', 'from']
96
+ filter = Stopwords::Filter.new stopwords
97
+ ```
98
+
99
+ And then you have it; you can just filter:
100
+
101
+ ```
102
+ filter.filter 'guide by douglas adams'.split #-> ['guide', 'douglas', 'adams']
103
+ ```
104
+
105
+ That's all?
106
+ -----------
107
+
108
+ I know what you're thinking: it takes a line of Ruby code to filter one array from another. That's why we have added an extra functionality, [Snowball][wikipedia_snowball] stopwords lists, already built for you and ready to use.
109
+
110
+ At least, in the beginning we were using Snowball stopwords, but several collaborators have improved this humble gem by including new languages or adding new stopwords. So now, the Snowball version is more of a "Snowball and friends" version.
111
+
112
+ How do I use that snowball thing?
113
+ ---------------------------------
114
+
115
+ You just create the filter with the locale you want to use
116
+
117
+ ```
118
+ filter = Stopwords::Snowball::Filter.new "en"
119
+ ```
120
+
121
+ And then you filter without worrying about the exact stopwords used
122
+
123
+ ```
124
+ filter.filter 'guide by douglas adams'.split #-> ['guide', 'douglas', 'adams']
125
+ ```
126
+
127
+ Which languages are supported with snowball?
128
+ -------------------------------------------
129
+
130
+ Currently we have support for:
131
+
132
+ * Afrikaans (af)
133
+ * Arabic (ar)
134
+ * Bengali (bn)
135
+ * Breton (br)
136
+ * Catalan (ca)
137
+ * Chinese (zh)
138
+ * Czech (cs)
139
+ * Danish (da)
140
+ * German (de)
141
+ * Greek (el)
142
+ * English (en)
143
+ * Spanish (es)
144
+ * Finnish (fi): due to an earlier error, it can also be selected with the `fn` locale
145
+ * French (fr)
146
+ * Hebrew (he)
147
+ * Hungarian (hu)
148
+ * Indonesian (id)
149
+ * Italian (it)
150
+ * Korean (ko)
151
+ * Dutch (nl)
152
+ * Polish (pl)
153
+ * Portuguese (pt)
154
+ * Romanian (ro)
155
+ * Russian (ru)
156
+ * Swedish (sv)
157
+ * Thai (th)
158
+ * Turkish (tr)
159
+ * Vietnamese (vi)
160
+
161
+ In the changelog you can see the collaborators for each language.
162
+
163
+ Anything else?
164
+ --------------
165
+
166
+ In a future version I would like to include a chaining filter where you include a series of operations and they are executed in linear order, just like the [Pipes and Filters design pattern][wikipedia_pipes_filters].
167
+
168
+ Acknowledgments
169
+ ----------------
170
+
171
+ Thanks to @brenes who is the author of the [original gem](https://github.com/brenes/stopwords-filter) (published under `stopwords-filter`).
172
+
173
+ Thanks to @s2gatev who added the `stopword?` method and the sieve class to this gem
174
+
175
+ Thanks to @bettysteger, @fauno, @vrypan, @woto, @grzegorzblaszczyk, @nerde, @sbeckeriv and @zackxu1 for language support and other features.
176
+
177
+ [wikipedia_stopwords]: http://en.wikipedia.org/wiki/Stopword
178
+ [solr]: https://github.com/sunspot/sunspot
179
+ [sphinx]: https://github.com/freelancing-god/thinking-sphinx
180
+ [google]: https://github.com/alexreisner/google_custom_search
181
+ [postgre]: https://github.com/Casecommons/pg_search
182
+ [wikipedia_snowball]: http://en.wikipedia.org/wiki/Snowball_programming_language
183
+ [wikipedia_pipes_filters]: http://en.wikipedia.org/wiki/Pipes_and_filters
184
+
data/VERSION ADDED
@@ -0,0 +1 @@
1
+ 0.1.0
@@ -0,0 +1,21 @@
1
module Stopwords
  # Removes a fixed list of stopwords from collections of words.
  #
  # The list handed to the constructor is stored downcased. A lookup first
  # tries the word exactly as given and then its downcased form.
  class Filter
    # @return [Array<String>] the stopword list, downcased at construction
    attr_reader :stopwords

    # @param stopwords [Array<String>] words to treat as stopwords
    def initialize(stopwords)
      @stopwords = stopwords.map { |entry| entry.downcase }
    end

    # Returns the given words without the ones that are stopwords.
    #
    # @param words [Array<String>] words to filter
    # @return [Array<String>] the non-stopwords, in their original order
    def filter(words)
      words.reject do |candidate|
        stopword?(candidate)
      end
    end

    # Tells whether a word is in the stopword list.
    #
    # @param word [String] word to look up
    # @return [Boolean] true when the word, as given or downcased, is listed
    def stopword?(word)
      # Exact match first; the downcased form is only computed when needed.
      return true if stopwords.include?(word)

      stopwords.include?(word.downcase)
    end
  end
end
@@ -0,0 +1,16 @@
1
module Stopwords
  module Snowball
    # Stopword filter whose list is read from a per-locale CSV file in the
    # `locales` directory next to this source file.
    class Filter < Stopwords::Filter
      # @return [String] the locale with any "-XX" country appendix removed
      attr_reader :locale
      # @return [String] path of the CSV file the stopwords were read from
      attr_reader :locale_filename

      # @param locale [String, Symbol] locale code such as "en" or "en-US"
      # @param custom_list [Array<String>] extra stopwords appended to the
      #   list read from the CSV file
      # @raise [ArgumentError] if no CSV file exists for the locale
      def initialize(locale, custom_list = [])
        @locale = locale.to_s.gsub(/-\w+/, '') # remove country appendix
        # The path must be built from the stripped code; using the raw
        # argument made "en-US" look for "en-US.csv" and fail.
        @locale_filename = File.join(File.dirname(__FILE__), 'locales', "#{@locale}.csv")

        raise ArgumentError, "Unknown locale: #{locale.inspect}" unless File.exist?(@locale_filename)

        # Read explicitly as UTF-8 so the non-ASCII lists do not depend on the
        # process's default external encoding.
        super(File.read(@locale_filename, encoding: 'UTF-8').split(',') + custom_list)
      end
    end
  end
end
@@ -0,0 +1 @@
1
+ die,het,en,sy,nie,was,hy,te,is,ek,om,hulle,in,my,'n,vir,toe,haar,van,dit,op,se,wat,met,gaan,baie,ons,jy,na,maar,hom,so,n,huis,kan,aan,dat,daar,sal,jou,gesê,by,kom,een,ma,as,son,groot,begin,al
@@ -0,0 +1 @@
1
+ ،,آض,آمينَ,آه,آهاً,آي,أ,أب,أجل,أجمع,أخ,أخذ,أصبح,أضحى,أقبل,أقل,أكثر,ألا,أم,أما,أمامك,أمامكَ,أمسى,أمّا,أن,أنا,أنت,أنتم,أنتما,أنتن,أنتِ,أنشأ,أنّى,أو,أوشك,أولئك,أولئكم,أولاء,أولالك,أوّهْ,أي,أيا,أين,أينما,أيّ,أَنَّ,أََيُّ,أُفٍّ,إذ,إذا,إذاً,إذما,إذن,إلى,إليكم,إليكما,إليكنّ,إليكَ,إلَيْكَ,إلّا,إمّا,إن,إنّما,إي,إياك,إياكم,إياكما,إياكن,إيانا,إياه,إياها,إياهم,إياهما,إياهن,إياي,إيهٍ,إِنَّ,ا,ابتدأ,اثر,اجل,احد,اخرى,اخلولق,اذا,اربعة,ارتدّ,استحال,اطار,اعادة,اعلنت,اف,اكثر,اكد,الألاء,الألى,الا,الاخيرة,الان,الاول,الاولى,التى,التي,الثاني,الثانية,الذاتي,الذى,الذي,الذين,السابق,الف,اللائي,اللاتي,اللتان,اللتيا,اللتين,اللذان,اللذين,اللواتي,الماضي,المقبل,الوقت,الى,اليوم,اما,امام,امس,ان,انبرى,انقلب,انه,انها,او,اول,اي,ايار,ايام,ايضا,ب,بات,باسم,بان,بخٍ,برس,بسبب,بسّ,بشكل,بضع,بطآن,بعد,بعض,بك,بكم,بكما,بكن,بل,بلى,بما,بماذا,بمن,بن,بنا,به,بها,بي,بيد,بين,بَسْ,بَلْهَ,بِئْسَ,تانِ,تانِك,تبدّل,تجاه,تحوّل,تلقاء,تلك,تلكم,تلكما,تم,تينك,تَيْنِ,تِه,تِي,ثلاثة,ثم,ثمّ,ثمّة,ثُمَّ,جعل,جلل,جميع,جير,حار,حاشا,حاليا,حاي,حتى,حرى,حسب,حم,حوالى,حول,حيث,حيثما,حين,حيَّ,حَبَّذَا,حَتَّى,حَذارِ,خلا,خلال,دون,دونك,ذا,ذات,ذاك,ذانك,ذانِ,ذلك,ذلكم,ذلكما,ذلكن,ذو,ذوا,ذواتا,ذواتي,ذيت,ذينك,ذَيْنِ,ذِه,ذِي,راح,رجع,رويدك,ريث,رُبَّ,زيارة,سبحان,سرعان,سنة,سنوات,سوف,سوى,سَاءَ,سَاءَمَا,شبه,شخصا,شرع,شَتَّانَ,صار,صباح,صفر,صهٍ,صهْ,ضد,ضمن,طاق,طالما,طفق,طَق,ظلّ,عاد,عام,عاما,عامة,عدا,عدة,عدد,عدم,عسى,عشر,عشرة,علق,على,عليك,عليه,عليها,علًّ,عن,عند,عندما,عوض,عين,عَدَسْ,عَمَّا,غدا,غير,ـ,ف,فان,فلان,فو,فى,في,فيم,فيما,فيه,فيها,قال,قام,قبل,قد,قطّ,قلما,قوة,كأنّما,كأين,كأيّ,كأيّن,كاد,كان,كانت,كذا,كذلك,كرب,كل,كلا,كلاهما,كلتا,كلم,كليكما,كليهما,كلّما,كلَّا,كم,كما,كي,كيت,كيف,كيفما,كَأَنَّ,كِخ,لئن,لا,لات,لاسيما,لدن,لدى,لعمر,لقاء,لك,لكم,لكما,لكن,لكنَّما,لكي,لكيلا,للامم,لم,لما,لمّا,لن,لنا,له,لها,لو,لوكالة,لولا,لوما,لي,لَسْتَ,لَسْتُ,لَسْتُم,لَسْتُمَا,لَسْتُنَّ,لَسْتِ,لَسْنَ,لَعَلَّ,لَكِنَّ,لَيْتَ,لَيْسَ,لَيْسَا,لَيْسَتَا,لَيْسَتْ,لَيْسُوا,لَِسْنَا,ما,ماانفك,مابرح,مادام,ماذا,مازال,مافتئ,مايو,متى,مثل,مذ,مساء,مع,معاذ,مقابل,مكانكم,مكانكما,مكانكنّ,مكانَك,مليار,مليون,مما,ممن
,من,منذ,منها,مه,مهما,مَنْ,مِن,نحن,نحو,نعم,نفس,نفسه,نهاية,نَخْ,نِعِمّا,نِعْمَ,ها,هاؤم,هاكَ,هاهنا,هبّ,هذا,هذه,هكذا,هل,هلمَّ,هلّا,هم,هما,هن,هنا,هناك,هنالك,هو,هي,هيا,هيت,هيّا,هَؤلاء,هَاتانِ,هَاتَيْنِ,هَاتِه,هَاتِي,هَجْ,هَذا,هَذانِ,هَذَيْنِ,هَذِه,هَذِي,هَيْهَاتَ,و,و6,وا,واحد,واضاف,واضافت,واكد,وان,واهاً,واوضح,وراءَك,وفي,وقال,وقالت,وقد,وقف,وكان,وكانت,ولا,ولم,ومن,وهو,وهي,ويكأنّ,وَيْ,وُشْكَانََ,يكون,يمكن,يوم,ّأيّان
@@ -0,0 +1 @@
1
+ а,автентичен,аз,ако,ала,бе,без,беше,би,бивш,бивша,бившо,бил,била,били,било,благодаря,близо,бъдат,бъде,бяха,в,вас,ваш,ваша,вероятно,вече,взема,ви,вие,винаги,внимава,време,все,всеки,всички,всичко,всяка,във,въпреки,върху,г,ги,главен,главна,главно,глас,го,година,години,годишен,д,да,дали,два,двама,двамата,две,двете,ден,днес,дни,до,добра,добре,добро,добър,докато,докога,дори,досега,доста,друг,друга,други,е,евтин,едва,един,една,еднаква,еднакви,еднакъв,едно,екип,ето,живот,за,забавям,зад,заедно,заради,засега,заспал,затова,защо,защото,и,из,или,им,има,имат,иска,й,каза,как,каква,какво,както,какъв,като,кога,когато,което,които,кой,който,колко,която,къде,където,към,лесен,лесно,ли,лош,м,май,малко,ме,между,мек,мен,месец,ми,много,мнозина,мога,могат,може,мокър,моля,момента,му,н,на,над,назад,най,направи,напред,например,нас,не,него,нещо,нея,ни,ние,никой,нито,нищо,но,нов,нова,нови,новина,някои,някой,няколко,няма,обаче,около,освен,особено,от,отгоре,отново,още,пак,по,повече,повечето,под,поне,поради,после,почти,прави,пред,преди,през,при,пък,първата,първи,първо,пъти,равен,равна,с,са,сам,само,се,сега,си,син,скоро,след,следващ,сме,смях,според,сред,срещу,сте,съм,със,също,т,тази,така,такива,такъв,там,твой,те,тези,ти,т.н.,то,това,тогава,този,той,толкова,точно,три,трябва,тук,тъй,тя,тях,у,утре,харесва,хиляди,ч,часа,че,често,чрез,ще,щом,юмрук,я,як
@@ -0,0 +1 @@
1
+ অতএব,অথচ,অথবা,অনুযায়ী,অনেক,অনেকে,অনেকেই,অন্তত,অন্য,অবধি,অবশ্য,অর্থাত,আই,আগামী,আগে,আগেই,আছে,আজ,আদ্যভাগে,আপনার,আপনি,আবার,আমরা,আমাকে,আমাদের,আমার,আমি,আর,আরও,ই,ইত্যাদি,ইহা,উচিত,উত্তর,উনি,উপর,উপরে,এ,এঁদের,এঁরা,এই,একই,একটি,একবার,একে,এক্,এখন,এখনও,এখানে,এখানেই,এটা,এটাই,এটি,এত,এতটাই,এতে,এদের,এব,এবং,এবার,এমন,এমনকী,এমনি,এর,এরা,এল,এস,এসে,ঐ,ও,ওঁদের,ওঁর,ওঁরা,ওই,ওকে,ওখানে,ওদের,ওর,ওরা,কখনও,কত,কবে,কমনে,কয়েক,কয়েকটি,করছে,করছেন,করতে,করবে,করবেন,করলে,করলেন,করা,করাই,করায়,করার,করি,করিতে,করিয়া,করিয়ে,করে,করেই,করেছিলেন,করেছে,করেছেন,করেন,কাউকে,কাছ,কাছে,কাজ,কাজে,কারও,কারণ,কি,কিংবা,কিছু,কিছুই,কিন্তু,কী,কে,কেউ,কেউই,কেখা,কেন,কোটি,কোন,কোনও,কোনো,ক্ষেত্রে,কয়েক,খুব,গিয়ে,গিয়েছে,গিয়ে,গুলি,গেছে,গেল,গেলে,গোটা,চলে,চান,চায়,চার,চালু,চেয়ে,চেষ্টা,ছাড়া,ছাড়াও,ছিল,ছিলেন,জন,জনকে,জনের,জন্য,জন্যওজে,জানতে,জানা,জানানো,জানায়,জানিয়ে,জানিয়েছে,জে,জ্নজন,টি,ঠিক,তখন,তত,তথা,তবু,তবে,তা,তাঁকে,তাঁদের,তাঁর,তাঁরা,তাঁাহারা,তাই,তাও,তাকে,তাতে,তাদের,তার,তারপর,তারা,তারৈ,তাহলে,তাহা,তাহাতে,তাহার,তিনঐ,তিনি,তিনিও,তুমি,তুলে,তেমন,তো,তোমার,থাকবে,থাকবেন,থাকা,থাকায়,থাকে,থাকেন,থেকে,থেকেই,থেকেও,দিকে,দিতে,দিন,দিয়ে,দিয়েছে,দিয়েছেন,দিলেন,দু,দুই,দুটি,দুটো,দেওয়া,দেওয়ার,দেওয়া,দেখতে,দেখা,দেখে,দেন,দেয়,দ্বারা,ধরা,ধরে,ধামার,নতুন,নয়,না,নাই,নাকি,নাগাদ,নানা,নিজে,নিজেই,নিজেদের,নিজের,নিতে,নিয়ে,নিয়ে,নেই,নেওয়া,নেওয়ার,নেওয়া,নয়,পক্ষে,পর,পরে,পরেই,পরেও,পর্যন্ত,পাওয়া,পাচ,পারি,পারে,পারেন,পি,পেয়ে,পেয়্র্,প্রতি,প্রথম,প্রভৃতি,প্রযন্ত,প্রাথমিক,প্রায়,প্রায়,ফলে,ফিরে,ফের,বক্তব্য,বদলে,বন,বরং,বলতে,বলল,বললেন,বলা,বলে,বলেছেন,বলেন,বসে,বহু,বা,বাদে,বার,বি,বিনা,বিভিন্ন,বিশেষ,বিষয়টি,বেশ,বেশি,ব্যবহার,ব্যাপারে,ভাবে,ভাবেই,মতো,মতোই,মধ্যভাগে,মধ্যে,মধ্যেই,মধ্যেও,মনে,মাত্র,মাধ্যমে,মোট,মোটেই,যখন,যত,যতটা,যথেষ্ট,যদি,যদিও,যা,যাঁর,যাঁরা,যাওয়া,যাওয়ার,যাওয়া,যাকে,যাচ্ছে,যাতে,যাদের,যান,যাবে,যায়,যার,যারা,যিনি,যে,যেখানে,যেতে,যেন,যেমন,র,রকম,রয়েছে,রাখা,রেখে,লক্ষ,শুধু,শুরু,সঙ্গে,সঙ্গেও,সব,সবার,সমস্ত,সম্প্রতি,সহ,সহিত,সাধারণ,সামনে,সি,সুতরাং,সে,সেই,সেখান,সেখানে,সেটা,সেটাই,সেটাও,সেটি,স্পষ্ট,স্বয়ং,হইতে,হইবে,হইয়া,হওয়া,হওয়ায়,হওয়ার,হচ্ছে,হত,হতে,হতেই,হন,হবে,হবেন,হয়,হ
য়তো,হয়নি,হয়ে,হয়েই,হয়েছিল,হয়েছে,হয়েছেন,হল,হলে,হলেই,হলেও,হলো,হাজার,হিসাবে,হৈলে,হোক,হয়
@@ -0,0 +1 @@
1
+ a,ainda,alem,ambas,ambos,antes,ao,aonde,aos,apos,aquele,aqueles,as,assim,com,como,contra,contudo,cuja,cujas,cujo,cujos,da,das,de,dela,dele,deles,demais,depois,desde,desta,deste,dispoe,dispoem,diversa,diversas,diversos,do,dos,durante,e,ela,elas,ele,eles,em,entao,entre,essa,essas,esse,esses,esta,estas,este,estes,ha,isso,isto,logo,mais,mas,mediante,menos,mesma,mesmas,mesmo,mesmos,na,nao,nas,nem,nesse,neste,nos,o,os,ou,outra,outras,outro,outros,pelas,pelo,pelos,perante,pois,por,porque,portanto,propios,proprio,quais,qual,qualquer,quando,quanto,que,quem,quer,se,seja,sem,sendo,seu,seus,sob,sobre,sua,suas,tal,tambem,teu,teus,toda,todas,todo,todos,tua,tuas,tudo,um,uma,umas,uns
@@ -0,0 +1 @@
1
+ a,abans,ací,ah,així,això,al,aleshores,algun,alguna,algunes,alguns,alhora,allà,allí,allò,als,altra,altre,altres,amb,ambdues,ambdós,apa,aquell,aquella,aquelles,aquells,aquest,aquesta,aquestes,aquests,aquí,baix,cada,cadascuna,cadascunes,cadascuns,cadascú,com,contra,d'un,d'una,d'unes,d'uns,dalt,de,del,dels,des,després,dins,dintre,donat,doncs,durant,e,eh,el,els,em,en,encara,ens,entre,eren,es,esta,estaven,esteu,està,estàvem,estàveu,et,etc,ets,fins,fora,gairebé,ha,han,has,havia,he,hem,heu,hi,ho,i,igual,iguals,ja,l'hi,la,les,li,li'n,llavors,m'he,ma,mal,malgrat,mateix,mateixa,mateixes,mateixos,me,mentre,meu,meus,meva,meves,molt,molta,moltes,molts,mon,mons,més,n'he,n'hi,ne,ni,no,nogensmenys,només,nosaltres,nostra,nostre,nostres,o,oh,oi,on,pas,pel,pels,per,perquè,però,poc,poca,pocs,poques,potser,propi,qual,quals,quan,quant,que,quelcom,qui,quin,quina,quines,quins,què,s'ha,s'han,sa,semblant,semblants,ses,seu,seus,seva,seves,si,sobre,sobretot,solament,sols,son,sons,sota,sou,sóc,són,t'ha,t'han,t'he,ta,tal,també,tampoc,tan,tant,tanta,tantes,teu,teus,teva,teves,ton,tons,tot,tota,totes,tots,un,una,unes,uns,us,va,vaig,vam,van,vas,veu,vosaltres,vostra,vostre,vostres,érem,éreu,és
@@ -0,0 +1 @@
1
+ a,aby,ahoj,aj,ale,anebo,ani,ano,asi,aspoň,atd,atp,ačkoli,až,bez,beze,blízko,bohužel,brzo,bude,budem,budeme,budete,budeš,budou,budu,by,byl,byla,byli,bylo,byly,bys,být,během,chce,chceme,chcete,chceš,chci,chtít,chtějí,chut',chuti,co,což,cz,daleko,další,den,deset,devatenáct,devět,dnes,do,dobrý,docela,dva,dvacet,dvanáct,dvě,dál,dále,děkovat,děkujeme,děkuji,ho,hodně,i,jak,jakmile,jako,jakož,jde,je,jeden,jedenáct,jedna,jedno,jednou,jedou,jeho,jehož,jej,jejich,její,jelikož,jemu,jen,jenom,jestli,jestliže,ještě,jež,ji,jich,jimi,jinak,jiné,již,jsem,jseš,jsi,jsme,jsou,jste,já,jí,jím,jíž,k,kam,kde,kdo,kdy,když,ke,kolik,kromě,kterou,která,které,který,kteří,kvůli,mají,mezi,mi,mne,mnou,mně,moc,mohl,mohou,moje,moji,možná,musí,my,má,málo,mám,máme,máte,máš,mé,mí,mít,mě,můj,může,na,nad,nade,napište,naproti,načež,naše,naši,ne,nebo,nebyl,nebyla,nebyli,nebyly,nedělají,nedělá,nedělám,neděláme,neděláte,neděláš,neg,nejsi,nejsou,nemají,nemáme,nemáte,neměl,není,nestačí,nevadí,než,nic,nich,nimi,nové,nový,nula,nám,námi,nás,náš,ním,ně,něco,nějak,někde,někdo,němu,němuž,o,od,ode,on,ona,oni,ono,ony,osm,osmnáct,pak,patnáct,po,pod,podle,pokud,potom,pouze,pozdě,pořád,pravé,pro,prostě,prosím,proti,proto,protože,proč,první,pta,pět,před,přes,přese,při,přičemž,re,rovně,s,se,sedm,sedmnáct,si,skoro,smí,smějí,snad,spolu,sta,sto,strana,sté,své,svých,svým,svými,ta,tady,tak,takhle,taky,také,takže,tam,tamhle,tamhleto,tamto,tato,tebe,tebou,ted',tedy,ten,tento,teto,ti,tipy,tisíc,tisíce,to,tobě,tohle,toho,tohoto,tom,tomto,tomu,tomuto,toto,trošku,tu,tuto,tvoje,tvá,tvé,tvůj,ty,tyto,téma,tím,tímto,tě,těm,těmu,třeba,tři,třináct,u,určitě,už,v,vaše,vaši,ve,vedle,večer,vlastně,vy,vám,vámi,vás,váš,více,však,všechno,všichni,vůbec,vždy,z,za,zatímco,zač,zda,zde,ze,zprávy,zpět,čau,či,článku,články,čtrnáct,čtyři,šest,šestnáct,že
@@ -0,0 +1 @@
1
+ og,i,jeg,det,at,en,den,til,er,som,på,de,med,han,af,for,ikke,der,var,mig,sig,men,et,har,om,vi,min,havde,ham,hun,nu,over,da,fra,du,ud,sin,dem,os,op,man,hans,hvor,eller,hvad,skal,selv,her,alle,vil,blev,kunne,ind,når,være,dog,noget,ville,jo,deres,efter,ned,skulle,denne,end,dette,mit,også,under,have,dig,anden,hende,mine,alt,meget,sit,sine,vor,mod,disse,hvis,din,nogle,hos,blive,mange,ad,bliver,hendes,været,thi,jer,sådan
@@ -0,0 +1 @@
1
+ a,ab,aber,ach,acht,achte,achten,achter,achtes,ag,alle,allein,allem,allen,aller,allerdings,alles,allgemeinen,als,also,am,an,ander,andere,anderem,anderen,anderer,anderes,anderm,andern,anderr,anders,au,auch,auf,aus,ausser,ausserdem,außer,außerdem,b,bald,bei,beide,beiden,beim,beispiel,bekannt,bereits,besonders,besser,besten,bin,bis,bisher,bist,c,d,d.h,da,dabei,dadurch,dafür,dagegen,daher,dahin,dahinter,damals,damit,danach,daneben,dank,dann,daran,darauf,daraus,darf,darfst,darin,darum,darunter,darüber,das,dasein,daselbst,dass,dasselbe,davon,davor,dazu,dazwischen,daß,dein,deine,deinem,deinen,deiner,deines,dem,dementsprechend,demgegenüber,demgemäss,demgemäß,demselben,demzufolge,den,denen,denn,denselben,der,deren,derer,derjenige,derjenigen,dermassen,dermaßen,derselbe,derselben,des,deshalb,desselben,dessen,deswegen,dich,die,diejenige,diejenigen,dies,diese,dieselbe,dieselben,diesem,diesen,dieser,dieses,dir,doch,dort,drei,drin,dritte,dritten,dritter,drittes,du,durch,durchaus,durfte,durften,dürfen,dürft,e,eben,ebenso,ehrlich,ei,ei,,eigen,eigene,eigenen,eigener,eigenes,ein,einander,eine,einem,einen,einer,eines,einig,einige,einigem,einigen,einiger,einiges,einmal,eins,elf,en,ende,endlich,entweder,er,ernst,erst,erste,ersten,erster,erstes,es,etwa,etwas,euch,euer,eure,eurem,euren,eurer,eures,f,folgende,früher,fünf,fünfte,fünften,fünfter,fünftes,für,g,gab,ganz,ganze,ganzen,ganzer,ganzes,gar,gedurft,gegen,gegenüber,gehabt,gehen,geht,gekannt,gekonnt,gemacht,gemocht,gemusst,genug,gerade,gern,gesagt,geschweige,gewesen,gewollt,geworden,gibt,ging,gleich,gott,gross,grosse,grossen,grosser,grosses,groß,große,großen,großer,großes,gut,gute,guter,gutes,h,hab,habe,haben,habt,hast,hat,hatte,hatten,hattest,hattet,heisst,her,heute,hier,hin,hinter,hoch,hätte,hätten,i,ich,ihm,ihn,ihnen,ihr,ihre,ihrem,ihren,ihrer,ihres,im,immer,in,indem,infolgedessen,ins,irgend,ist,j,ja,jahr,jahre,jahren,je,jede,jedem,jeden,jeder,jedermann,jedermanns,jedes,jedoch,jemand,jemandem,jemanden,jene,jenem,jenen,jener,jenes,je
tzt,k,kam,kann,kannst,kaum,kein,keine,keinem,keinen,keiner,keines,kleine,kleinen,kleiner,kleines,kommen,kommt,konnte,konnten,kurz,können,könnt,könnte,l,lang,lange,leicht,leide,lieber,los,m,machen,macht,machte,mag,magst,mahn,mal,man,manche,manchem,manchen,mancher,manches,mann,mehr,mein,meine,meinem,meinen,meiner,meines,mensch,menschen,mich,mir,mit,mittel,mochte,mochten,morgen,muss,musst,musste,mussten,muß,mußt,möchte,mögen,möglich,mögt,müssen,müsst,müßt,n,na,nach,nachdem,nahm,natürlich,neben,nein,neue,neuen,neun,neunte,neunten,neunter,neuntes,nicht,nichts,nie,niemand,niemandem,niemanden,noch,nun,nur,o,ob,oben,oder,offen,oft,ohne,ordnung,p,q,r,recht,rechte,rechten,rechter,rechtes,richtig,rund,s,sa,sache,sagt,sagte,sah,satt,schlecht,schluss,schon,sechs,sechste,sechsten,sechster,sechstes,sehr,sei,seid,seien,sein,seine,seinem,seinen,seiner,seines,seit,seitdem,selbst,sich,sie,sieben,siebente,siebenten,siebenter,siebentes,sind,so,solang,solche,solchem,solchen,solcher,solches,soll,sollen,sollst,sollt,sollte,sollten,sondern,sonst,soweit,sowie,später,startseite,statt,steht,suche,t,tag,tage,tagen,tat,teil,tel,tritt,trotzdem,tun,u,uhr,um,und,und?,uns,unse,unsem,unsen,unser,unsere,unserer,unses,unter,v,vergangenen,viel,viele,vielem,vielen,vielleicht,vier,vierte,vierten,vierter,viertes,vom,von,vor,w,wahr?,wann,war,waren,warst,wart,warum,was,weg,wegen,weil,weit,weiter,weitere,weiteren,weiteres,welche,welchem,welchen,welcher,welches,wem,wen,wenig,wenige,weniger,weniges,wenigstens,wenn,wer,werde,werden,werdet,weshalb,wessen,wie,wieder,wieso,will,willst,wir,wird,wirklich,wirst,wissen,wo,woher,wohin,wohl,wollen,wollt,wollte,wollten,worden,wurde,wurden,während,währenddem,währenddessen,wäre,würde,würden,x,y,z,z.b,zehn,zehnte,zehnten,zehnter,zehntes,zeit,zu,zuerst,zugleich,zum,zunächst,zur,zurück,zusammen,zwanzig,zwar,zwei,zweite,zweiten,zweiter,zweites,zwischen,zwölf,über,überhaupt,übrigens
@@ -0,0 +1 @@
1
+ ο,η,το,οι,τα,του,τησ,των,τον,την,και,κι,κ,ειμαι,εισαι,ειναι,ειμαστε,ειστε,στο,στον,στη,στην,μα,αλλα,απο,για,προσ,με,σε,ωσ,παρα,αντι,κατα,μετα,θα,να,δε,δεν,μη,μην,επι,ενω,εαν,αν,τοτε,που,πωσ,ποιοσ,ποια,ποιο,ποιοι,ποιεσ,ποιων,ποιουσ,αυτοσ,αυτη,αυτο,αυτοι,αυτων,αυτουσ,αυτεσ,αυτα,εκεινοσ,εκεινη,εκεινο,εκεινοι,εκεινεσ,εκεινα,εκεινων,εκεινουσ,οπωσ,ομωσ,ισωσ,οσο,οτι
@@ -0,0 +1 @@
1
+ i,me,my,myself,we,our,ours,ourselves,you,your,yours,yourself,yourselves,he,him,his,himself,she,her,hers,herself,it,its,itself,they,them,their,theirs,themselves,what,which,who,whom,this,that,these,those,am,is,are,was,were,be,been,being,have,has,had,having,do,does,did,doing,would,should,could,ought,i'm,you're,he's,she's,it's,we're,they're,i've,you've,we've,they've,i'd,you'd,he'd,she'd,we'd,they'd,i'll,you'll,he'll,she'll,we'll,they'll,isn't,aren't,wasn't,weren't,hasn't,haven't,hadn't,doesn't,don't,didn't,won't,wouldn't,shan't,shouldn't,can't,cannot,couldn't,mustn't,let's,that's,who's,what's,here's,there's,when's,where's,why's,how's,a,an,the,and,but,if,or,because,as,until,while,of,at,by,for,with,about,against,between,into,through,during,before,after,above,below,to,from,up,down,in,out,on,off,over,under,again,further,then,once,here,there,when,where,why,how,all,any,both,each,few,more,most,other,some,such,no,nor,not,only,own,same,so,than,too,very,us,really,also,already,even,although,much,bit,many
@@ -0,0 +1 @@
1
+ de,la,que,el,en,y,a,los,del,se,las,por,un,para,con,no,una,su,al,lo,como,más,pero,sus,le,ya,o,este,sí,porque,esta,entre,cuando,muy,sin,sobre,también,me,hasta,hay,donde,quien,desde,todo,nos,durante,todos,uno,les,ni,contra,otros,ese,eso,ante,ellos,e,esto,mí,antes,algunos,qué,unos,yo,otro,otras,otra,él,tanto,esa,estos,mucho,quienes,nada,muchos,cual,poco,ella,estar,estas,algunas,algo,nosotros,mi,mis,tú,te,ti,tu,tus,ellas,nosotras,vosotros,vosotras,os,mío,mía,míos,mías,tuyo,tuya,tuyos,tuyas,suyo,suya,suyos,suyas,nuestro,nuestra,nuestros,nuestras,vuestro,vuestra,vuestros,vuestras,esos,esas,estoy,estás,está,estamos,estáis,están,esté,estés,estemos,estéis,estén,estaré,estarás,estará,estaremos,estaréis,estarán,estaría,estarías,estaríamos,estaríais,estarían,estaba,estabas,estábamos,estabais,estaban,estuve,estuviste,estuvo,estuvimos,estuvisteis,estuvieron,estuviera,estuvieras,estuviéramos,estuvierais,estuvieran,estuviese,estuvieses,estuviésemos,estuvieseis,estuviesen,estando,estada,estadas,estad,he,has,ha,hemos,habéis,han,haya,hayas,hayamos,hayáis,hayan,habré,habrás,habrá,habremos,habréis,habrán,habría,habrías,habríamos,habríais,habrían,había,habías,habíamos,habíais,habían,hube,hubiste,hubo,hubimos,hubisteis,hubieron,hubiera,hubieras,hubiéramos,hubierais,hubieran,hubiese,hubieses,hubiésemos,hubieseis,hubiesen,habiendo,habido,habida,habidos,habidas,soy,eres,es,somos,sois,son,sea,seas,seamos,seáis,sean,seré,serás,será,seremos,seréis,serán,sería,serías,seríamos,seríais,serían,era,eras,éramos,erais,eran,fui,fuiste,fue,fuimos,fuisteis,fueron,fuera,fueras,fuéramos,fuerais,fueran,fuese,fueses,fuésemos,fueseis,fuesen,siendo,sido,tengo,tienes,tiene,tenemos,tenéis,tienen,tenga,tengas,tengamos,tengáis,tengan,tendré,tendrás,tendrá,tendremos,tendréis,tendrán,tendría,tendrías,tendríamos,tendríais,tendrían,tenía,tenías,teníamos,teníais,tenían,tuve,tuviste,tuvo,tuvimos,tuvisteis,tuvieron,tuviera,tuvieras,tuviéramos,tuvierais,tuvieran,tuviese,tuvieses,tuviésemos,tuvieseis,tuviesen,teniendo,ten
ido,tenida,tenidos,tenidas,tened,algunes,algunxs,elle,ellx,elles,ellxs,ese,esx,eses,esxs,estes,este,estxs,estx,lx,le,lxs,les,mucha,muchas,muches,muchxs,míe,míes,míx,míxs,nosotres,nosotrxs,nuestre,nuestres,nuestrx,nuestrxs,otre,otrx,otres,otrxs,poca,poque,pocx,suye,suyx,suyes,suyxs,tantas,tantxs,tantes,tenide,tenides,tenidx,tenidxs,toda,todas,tode,todes,todx,todxs,tuye,tuyes,tuyx,tuyxs,une,unx,unxs,unes,vosotrxs,vosotres,vuestre,vuestres,vuestrx,vuestrxs
@@ -0,0 +1 @@
1
+ olla,olen,olet,on,olemme,olette,ovat,ole,oli,olisi,olisit,olisin,olisimme,olisitte,olisivat,olit,olin,olimme,olitte,olivat,ollut,olleet,en,et,ei,emme,ette,eivät,minä,minun,minut,minua,minussa,minusta,minuun,minulla,minulta,minulle,sinä,sinun,sinut,sinua,sinussa,sinusta,sinuun,sinulla,sinulta,sinulle,hän,hänen,hänet,häntä,hänessä,hänestä,häneen,hänellä,häneltä,hänelle,me,meidän,meidät,meitä,meissä,meistä,meihin,meillä,meiltä,meille,te,teidän,teidät,teitä,teissä,teistä,teihin,teillä,teiltä,teille,he,heidän,heidät,heitä,heissä,heistä,heihin,heillä,heiltä,heille,tämä,tämän,tätä,tässä,tästä,tähän,tällä,tältä,tälle,tänä,täksi,tuo,tuon,tuota,tuossa,tuosta,tuohon,tuolla,tuolta,tuolle,tuona,tuoksi,se,sen,sitä,siinä,siitä,siihen,sillä,siltä,sille,sinä,siksi,nämä,näiden,näitä,näissä,näistä,näihin,näillä,näiltä,näille,näinä,näiksi,nuo,noiden,noita,noissa,noista,noihin,noilla,noilta,noille,noina,noiksi,ne,niiden,niitä,niissä,niistä,niihin,niillä,niiltä,niille,niinä,niiksi,kuka,kenen,kenet,ketä,kenessä,kenestä,keneen,kenellä,keneltä,kenelle,kenenä,keneksi,ketkä,keiden,ketkä,keitä,keissä,keistä,keihin,keillä,keiltä,keille,keinä,keiksi,mikä,minkä,minkä,mitä,missä,mistä,mihin,millä,miltä,mille,minä,miksi,mitkä,joka,jonka,jota,jossa,josta,johon,jolla,jolta,jolle,jona,joksi,jotka,joiden,joita,joissa,joista,joihin,joilla,joilta,joille,joina,joiksi,että,ja,jos,koska,kuin,mutta,niin,sekä,sillä,tai,vaan,vai,vaikka,kanssa,mukaan,noin,poikki,yli,kun,niin,nyt,itse
@@ -0,0 +1 @@
1
+ fi.csv
@@ -0,0 +1 @@
1
+ au,aux,avec,ce,ces,dans,de,des,du,elle,en,et,eux,il,je,la,le,leur,lui,ma,mais,me,même,mes,moi,mon,ne,nos,notre,nous,on,ou,par,pas,pour,qu,que,qui,sa,se,ses,son,sur,ta,te,tes,toi,ton,tu,un,une,vos,votre,vous,c,d,j,l,à,m,n,s,t,y,été,étée,étées,étés,étant,suis,es,est,sommes,êtes,sont,serai,seras,sera,serons,serez,seront,serais,serait,serions,seriez,seraient,étais,était,étions,étiez,étaient,fus,fut,fûmes,fûtes,furent,sois,soit,soyons,soyez,soient,fusse,fusses,fût,fussions,fussiez,fussent,ayant,eu,eue,eues,eus,ai,as,avons,avez,ont,aurai,auras,aura,aurons,aurez,auront,aurais,aurait,aurions,auriez,auraient,avais,avait,avions,aviez,avaient,eut,eûmes,eûtes,eurent,aie,aies,ait,ayons,ayez,aient,eusse,eusses,eût,eussions,eussiez,eussent,ceci,celà,cet,cette,ici,ils,les,leurs,quel,quels,quelle,quelles,sans,soi
@@ -0,0 +1 @@
1
+ אבל,או,אולי,אותה,אותו,אותי,אותך,אותם,אותן,אותנו,אז,אחר,אחרות,אחרי,אחריכן,אחרים,אחרת,אי,איזה,איך,אין,איפה,איתה,איתו,איתי,איתך,איתכם,איתכן,איתם,איתן,איתנו,אך,אל,אלה,אלו,אם,אנחנו,אני,אס,אף,אצל,אשר,את,אתה,אתכם,אתכן,אתם,אתן,באיזומידה,באמצע,באמצעות,בגלל,בין,בלי,במידה,במקוםשבו,ברם,בשביל,בשעהש,בתוך,גם,דרך,הוא,היא,היה,היכן,היתה,היתי,הם,הן,הנה,הסיבהשבגללה,הרי,ואילו,ואת,זאת,זה,זות,יהיה,יוכל,יוכלו,יותרמדי,יכול,יכולה,יכולות,יכולים,יכל,יכלה,יכלו,יש,כאן,כאשר,כולם,כולן,כזה,כי,כיצד,כך,ככה,כל,כלל,כמו,כן,כפי,כש,לא,לאו,לאיזותכלית,לאן,לבין,לה,להיות,להם,להן,לו,לי,לכם,לכן,למה,למטה,למעלה,למקוםשבו,למרות,לנו,לעבר,לעיכן,לפיכך,לפני,מאד,מאחורי,מאיזוסיבה,מאין,מאיפה,מבלי,מבעד,מדוע,מה,מהיכן,מול,מחוץ,מי,מכאן,מכיוון,מלבד,מן,מנין,מסוגל,מעט,מעטים,מעל,מצד,מקוםבו,מתחת,מתי,נגד,נגר,נו,עד,עז,על,עלי,עליה,עליהם,עליהן,עליו,עליך,עליכם,עלינו,עם,עצמה,עצמהם,עצמהן,עצמו,עצמי,עצמם,עצמן,עצמנו,פה,רק,שוב,של,שלה,שלהם,שלהן,שלו,שלי,שלך,שלכה,שלכם,שלכן,שלנו,שם,תהיה,תחת
@@ -0,0 +1 @@
1
+ a,ahogy,ahol,aki,akik,akkor,alatt,által,általában,amely,amelyek,amelyekben,amelyeket,amelyet,amelynek,ami,amit,amolyan,amíg,amikor,át,abban,ahhoz,annak,arra,arról,az,azok,azon,azt,azzal,azért,aztán,azután,azonban,bár,be,belül,benne,cikk,cikkek,cikkeket,csak,de,e,eddig,egész,egy,egyes,egyetlen,egyéb,egyik,egyre,ekkor,el,elég,ellen,elõ,elõször,elõtt,elsõ,én,éppen,ebben,ehhez,emilyen,ennek,erre,ez,ezt,ezek,ezen,ezzel,ezért,és,fel,felé,hanem,hiszen,hogy,hogyan,igen,így,illetve,ill.,ill,ilyen,ilyenkor,ison,ismét,itt,jó,jól,jobban,kell,kellett,keresztül,keressünk,ki,kívül,között,közül,legalább,lehet,lehetett,legyen,lenne,lenni,lesz,lett,maga,magát,majd,majd,már,más,másik,meg,még,mellett,mert,mely,melyek,mi,mit,míg,miért,milyen,mikor,minden,mindent,mindenki,mindig,mint,mintha,mivel,most,nagy,nagyobb,nagyon,ne,néha,nekem,neki,nem,néhány,nélkül,nincs,olyan,ott,össze,õ,õk,õket,pedig,persze,rá,s,saját,sem,semmi,sok,sokat,sokkal,számára,szemben,szerint,szinte,talán,tehát,teljes,tovább,továbbá,több,úgy,ugyanis,új,újabb,újra,után,utána,utolsó,vagy,vagyis,valaki,valami,valamint,való,vagyok,van,vannak,volt,voltam,voltak,voltunk,vissza,vele,viszont,volna
@@ -0,0 +1 @@
1
+ ada,adalah,adanya,adapun,agak,agaknya,agar,akan,akankah,akhir,akhiri,akhirnya,aku,akulah,amat,amatlah,anda,andalah,antar,antara,antaranya,apa,apaan,apabila,apakah,apalagi,apatah,artinya,asal,asalkan,atas,atau,ataukah,ataupun,awal,awalnya,bagai,bagaikan,bagaimana,bagaimanakah,bagaimanapun,bagi,bagian,bahkan,bahwa,bahwasanya,bakal,bakalan,balik,banyak,bapak,baru,bawah,beberapa,begini,beginian,beginikah,beginilah,begitu,begitukah,begitulah,begitupun,bekerja,belakang,belakangan,belum,belumlah,benar,benarkah,benarlah,berada,berakhir,berakhirlah,berakhirnya,berapa,berapakah,berapalah,berapapun,berarti,berawal,berbagai,berdatangan,beri,berikan,berikut,berikutnya,berjumlah,berkali-kali,berkata,berkehendak,berkeinginan,berkenaan,berlainan,berlalu,berlangsung,berlebihan,bermacam,bermacam-macam,bermaksud,bermula,bersama,bersama-sama,bersiap,bersiap-siap,bertanya,bertanya-tanya,berturut,berturut-turut,bertutur,berujar,berupa,besar,betul,betulkah,biasa,biasanya,bila,bilakah,bisa,bisakah,boleh,bolehkah,bolehlah,buat,bukan,bukankah,bukanlah,bukannya,bulan,bung,cara,caranya,cukup,cukupkah,cukuplah,cuma,dahulu,dalam,dan,dapat,dari,daripada,datang,dekat,demi,demikian,demikianlah,dengan,depan,di,dia,diakhiri,diakhirinya,dialah,diantara,diantaranya,diberi,diberikan,diberikannya,dibuat,dibuatnya,didapat,didatangkan,digunakan,diibaratkan,diibaratkannya,diingat,diingatkan,diinginkan,dijawab,dijelaskan,dijelaskannya,dikarenakan,dikatakan,dikatakannya,dikerjakan,diketahui,diketahuinya,dikira,dilakukan,dilalui,dilihat,dimaksud,dimaksudkan,dimaksudkannya,dimaksudnya,diminta,dimintai,dimisalkan,dimulai,dimulailah,dimulainya,dimungkinkan,dini,dipastikan,diperbuat,diperbuatnya,dipergunakan,diperkirakan,diperlihatkan,diperlukan,diperlukannya,dipersoalkan,dipertanyakan,dipunyai,diri,dirinya,disampaikan,disebut,disebutkan,disebutkannya,disini,disinilah,ditambahkan,ditandaskan,ditanya,ditanyai,ditanyakan,ditegaskan,ditujukan,ditunjuk,ditunjuki,ditunjukkan,ditunjukkannya,ditunjuknya,dituturkan,ditu
turkannya,diucapkan,diucapkannya,diungkapkan,dong,dulu,empat,enggak,enggaknya,entah,entahlah,guna,gunakan,hal,hampir,hanya,hanyalah,harus,haruslah,harusnya,hendak,hendaklah,hendaknya,hingga,ia,ialah,ibarat,ibaratkan,ibaratnya,ikut,ingat,ingat-ingat,ingin,inginkah,inginkan,ini,inikah,inilah,itu,itukah,itulah,jadi,jadilah,jadinya,jangan,jangankan,janganlah,jauh,jawab,jawaban,jawabnya,jelas,jelaskan,jelaslah,jelasnya,jika,jikalau,juga,jumlah,jumlahnya,justru,kala,kalau,kalaulah,kalaupun,kalian,kami,kamilah,kamu,kamulah,kan,kapan,kapankah,kapanpun,karena,karenanya,kasus,kata,katakan,katakanlah,katanya,ke,keadaan,kebetulan,kecil,kedua,keduanya,keinginan,kelamaan,kelihatan,kelihatannya,kelima,keluar,kembali,kemudian,kemungkinan,kemungkinannya,kenapa,kepada,kepadanya,kesampaian,keseluruhan,keseluruhannya,keterlaluan,ketika,khususnya,kini,kinilah,kira,kira-kira,kiranya,kita,kitalah,kok,kurang,lagi,lagian,lah,lain,lainnya,lalu,lama,lamanya,lanjut,lanjutnya,lebih,lewat,lima,luar,macam,maka,makanya,makin,malah,malahan,mampu,mampukah,mana,manakala,manalagi,masa,masalah,masalahnya,masih,masihkah,masing,masing-masing,mau,maupun,melainkan,melakukan,melalui,melihat,melihatnya,memang,memastikan,memberi,memberikan,membuat,memerlukan,memihak,meminta,memintakan,memisalkan,memperbuat,mempergunakan,memperkirakan,memperlihatkan,mempersiapkan,mempersoalkan,mempertanyakan,mempunyai,memulai,memungkinkan,menaiki,menambahkan,menandaskan,menanti,menanti-nanti,menantikan,menanya,menanyai,menanyakan,mendapat,mendapatkan,mendatang,mendatangi,mendatangkan,menegaskan,mengakhiri,mengapa,mengatakan,mengatakannya,mengenai,mengerjakan,mengetahui,menggunakan,menghendaki,mengibaratkan,mengibaratkannya,mengingat,mengingatkan,menginginkan,mengira,mengucapkan,mengucapkannya,mengungkapkan,menjadi,menjawab,menjelaskan,menuju,menunjuk,menunjuki,menunjukkan,menunjuknya,menurut,menuturkan,menyampaikan,menyangkut,menyatakan,menyebutkan,menyeluruh,menyiapkan,merasa,mereka,merekalah,merupakan,meski,meskipun,meyakini
,meyakinkan,minta,mirip,misal,misalkan,misalnya,mula,mulai,mulailah,mulanya,mungkin,mungkinkah,nah,naik,namun,nanti,nantinya,nyaris,nyatanya,oleh,olehnya,pada,padahal,padanya,paling,panjang,pantas,para,pasti,pastilah,penting,pentingnya,per,percuma,perlu,perlukah,perlunya,pernah,persoalan,pertama,pertama-tama,pertanyaan,pertanyakan,pihak,pihaknya,pukul,pula,pun,punya,rasa,rasanya,rata,rupanya,saat,saatnya,saja,sajalah,saling,sama,sama-sama,sambil,sampai,sampai-sampai,sampaikan,sana,sangat,sangatlah,satu,saya,sayalah,se,sebab,sebabnya,sebagai,sebagaimana,sebagainya,sebagian,sebaik,sebaik-baiknya,sebaiknya,sebaliknya,sebanyak,sebegini,sebegitu,sebelum,sebelumnya,sebenarnya,seberapa,sebesar,sebetulnya,sebisanya,sebuah,sebut,sebutlah,sebutnya,secara,secukupnya,sedang,sedangkan,sedemikian,sedikit,sedikitnya,seenaknya,segala,segalanya,segera,seharusnya,sehingga,seingat,sejak,sejauh,sejenak,sejumlah,sekadar,sekadarnya,sekali,sekali-kali,sekalian,sekaligus,sekalipun,sekarang,sekarang,sekecil,seketika,sekiranya,sekitar,sekitarnya,sekurang-kurangnya,sekurangnya,sela,selain,selaku,selalu,selama,selama-lamanya,selamanya,selanjutnya,seluruh,seluruhnya,semacam,semakin,semampu,semampunya,semasa,semasih,semata,semata-mata,semaunya,sementara,semisal,semisalnya,sempat,semua,semuanya,semula,sendiri,sendirian,sendirinya,seolah,seolah-olah,seorang,sepanjang,sepantasnya,sepantasnyalah,seperlunya,seperti,sepertinya,sepihak,sering,seringnya,serta,serupa,sesaat,sesama,sesampai,sesegera,sesekali,seseorang,sesuatu,sesuatunya,sesudah,sesudahnya,setelah,setempat,setengah,seterusnya,setiap,setiba,setibanya,setidak-tidaknya,setidaknya,setinggi,seusai,sewaktu,siap,siapa,siapakah,siapapun,sini,sinilah,soal,soalnya,suatu,sudah,sudahkah,sudahlah,supaya,tadi,tadinya,tahu,tahun,tak,tambah,tambahnya,tampak,tampaknya,tandas,tandasnya,tanpa,tanya,tanyakan,tanyanya,tapi,tegas,tegasnya,telah,tempat,tengah,tentang,tentu,tentulah,tentunya,tepat,terakhir,terasa,terbanyak,terdahulu,terdapat,terdiri,terhadap,terh
adapnya,teringat,teringat-ingat,terjadi,terjadilah,terjadinya,terkira,terlalu,terlebih,terlihat,termasuk,ternyata,tersampaikan,tersebut,tersebutlah,tertentu,tertuju,terus,terutama,tetap,tetapi,tiap,tiba,tiba-tiba,tidak,tidakkah,tidaklah,tiga,tinggi,toh,tunjuk,turut,tutur,tuturnya,ucap,ucapnya,ujar,ujarnya,umum,umumnya,ungkap,ungkapnya,untuk,usah,usai,waduh,wah,wahai,waktu,waktunya,walau,walaupun,wong,yaitu,yakin,yakni,yang
@@ -0,0 +1 @@
1
+ ad,al,allo,ai,agli,all,agl,alla,alle,con,col,coi,da,dal,dallo,dai,dagli,dall,dagl,dalla,dalle,di,del,dello,dei,degli,dell,degl,della,delle,in,nel,nello,nei,negli,nell,negl,nella,nelle,su,sul,sullo,sui,sugli,sull,sugl,sulla,sulle,per,tra,contro,io,tu,lui,lei,noi,voi,loro,mio,mia,miei,mie,tuo,tua,tuoi,tue,suo,sua,suoi,sue,nostro,nostra,nostri,nostre,vostro,vostra,vostri,vostre,mi,ti,ci,vi,lo,la,li,le,gli,ne,il,un,uno,una,ma,ed,se,perché,anche,come,dov,dove,che,chi,cui,non,più,quale,quanto,quanti,quanta,quante,quello,quelli,quella,quelle,questo,questi,questa,queste,si,tutto,tutti,a,c,e,i,l,o,ho,hai,ha,abbiamo,avete,hanno,abbia,abbiate,abbiano,avrò,avrai,avrà,avremo,avrete,avranno,avrei,avresti,avrebbe,avremmo,avreste,avrebbero,avevo,avevi,aveva,avevamo,avevate,avevano,ebbi,avesti,ebbe,avemmo,aveste,ebbero,avessi,avesse,avessimo,avessero,avendo,avuto,avuta,avuti,avute,sono,sei,è,siamo,siete,sia,siate,siano,sarò,sarai,sarà,saremo,sarete,saranno,sarei,saresti,sarebbe,saremmo,sareste,sarebbero,ero,eri,era,eravamo,eravate,erano,fui,fosti,fu,fummo,foste,furono,fossi,fosse,fossimo,fossero,essendo,faccio,fai,facciamo,fanno,faccia,facciate,facciano,farò,farai,farà,faremo,farete,faranno,farei,faresti,farebbe,faremmo,fareste,farebbero,facevo,facevi,faceva,facevamo,facevate,facevano,feci,facesti,fece,facemmo,faceste,fecero,facessi,facesse,facessimo,facessero,facendo,sto,stai,sta,stiamo,stanno,stia,stiate,stiano,starò,starai,starà,staremo,starete,staranno,starei,staresti,starebbe,staremmo,stareste,starebbero,stavo,stavi,stava,stavamo,stavate,stavano,stetti,stesti,stette,stemmo,steste,stettero,stessi,stesse,stessimo,stessero,stando
@@ -0,0 +1 @@
1
+ 0,1,2,3,4,5,6,7,8,9,0,1,2,3,4,5,6,7,8,9,가,가까스로,가령,각,각각,각자,각종,갖고말하자면,같다,같이,개의치않고,거니와,거바,거의,것,것과 같이,것들,게다가,게우다,겨우,견지에서,결과에 이르다,결국,결론을 낼 수 있다,겸사겸사,고려하면,고로,곧,공동으로,과,과연,관계가 있다,관계없이,관련이 있다,관하여,관한,관해서는,구,구체적으로,구토하다,그,그들,그때,그래,그래도,그래서,그러나,그러니,그러니까,그러면,그러므로,그러한즉,그런 까닭에,그런데,그런즉,그럼,그럼에도 불구하고,그렇게 함으로써,그렇지,그렇지 않다면,그렇지 않으면,그렇지만,그렇지않으면,그리고,그리하여,그만이다,그에 따르는,그위에,그저,그중에서,그치지 않다,근거로,근거하여,기대여,기점으로,기준으로,기타,까닭으로,까악,까지,까지 미치다,까지도,꽈당,끙끙,끼익,나,나머지는,남들,남짓,너,너희,너희들,네,넷,년,논하지 않다,놀라다,누가 알겠는가,누구,다른,다른 방면으로,다만,다섯,다소,다수,다시 말하자면,다시말하면,다음,다음에,다음으로,단지,답다,당신,당장,대로 하다,대하면,대하여,대해 말하자면,대해서,댕그,더구나,더군다나,더라도,더불어,더욱더,더욱이는,도달하다,도착하다,동시에,동안,된바에야,된이상,두번째로,둘,둥둥,뒤따라,뒤이어,든간에,들,등,등등,딩동,따라,따라서,따위,따지지 않다,딱,때,때가 되어,때문에,또,또한,뚝뚝,라 해도,령,로,로 인하여,로부터,로써,륙,를,마음대로,마저,마저도,마치,막론하고,만 못하다,만약,만약에,만은 아니다,만이 아니다,만일,만큼,말하자면,말할것도 없고,매,매번,메쓰겁다,몇,모,모두,무렵,무릎쓰고,무슨,무엇,무엇때문에,물론,및,바꾸어말하면,바꾸어말하자면,바꾸어서 말하면,바꾸어서 한다면,바꿔 말하면,바로,바와같이,밖에 안된다,반대로,반대로 말하자면,반드시,버금,보는데서,보다더,보드득,본대로,봐,봐라,부류의 사람들,부터,불구하고,불문하고,붕붕,비걱거리다,비교적,비길수 없다,비로소,비록,비슷하다,비추어 보아,비하면,뿐만 아니라,뿐만아니라,뿐이다,삐걱,삐걱거리다,사,삼,상대적으로 말하자면,생각한대로,설령,설마,설사,셋,소생,소인,솨,쉿,습니까,습니다,시각,시간,시작하여,시초에,시키다,실로,심지어,아,아니,아니나다를가,아니라면,아니면,아니었다면,아래윗,아무거나,아무도,아야,아울러,아이,아이고,아이구,아이야,아이쿠,아하,아홉,안 그러면,않기 위하여,않기 위해서,알 수 있다,알았어,앗,앞에서,앞의것,야,약간,양자,어,어기여차,어느,어느 년도,어느것,어느곳,어느때,어느쪽,어느해,어디,어때,어떠한,어떤,어떤것,어떤것들,어떻게,어떻해,어이,어째서,어쨋든,어쩔수 없다,어찌,어찌됏든,어찌됏어,어찌하든지,어찌하여,언제,언젠가,얼마,얼마 안 되는 것,얼마간,얼마나,얼마든지,얼마만큼,얼마큼,엉엉,에,에 가서,에 달려 있다,에 대해,에 있다,에 한하다,에게,에서,여,여기,여덟,여러분,여보시오,여부,여섯,여전히,여차,연관되다,연이서,영,영차,옆사람,예,예를 들면,예를 들자면,예컨대,예하면,오,오로지,오르다,오자마자,오직,오호,오히려,와,와 같은 사람들,와르르,와아,왜,왜냐하면,외에도,요만큼,요만한 것,요만한걸,요컨대,우르르,우리,우리들,우선,우에 종합한것과같이,운운,월,위에서 서술한바와같이,위하여,위해서,윙윙,육,으로,으로 인하여,으로서,으로써,을,응,응당,의,의거하여,의지하여,의해,의해되다,의해서,이,이 되다,이 때문에,이 밖에,이 외에,이 정도의,이것,이곳,이때,이라면,이래,이러이러하다,이러한,이런,이럴정도로,이렇게 많은 것,이렇게되면,이렇게말하자면,이렇구나,이로 인하여,이르기까지,이리하여,이만큼,이번,이봐,이상,이어서,이었다,이와 같다,이와 같은,이와 반대로,이와같다면,이외에도,이용하여,이유만으로,이젠,이지만,이쪽,이천구,이천육,이천칠,이천팔,인 듯하다,인젠,일,일것이다,일곱,일단,일때,일반적으로,일지라도,임에 틀림없다,입각하여,입장에서,잇따라,있다,자,자기,자기집,자마자,자신,잠깐,잠시,저,저것,저것만큼,저기,저쪽,저희,전부,전자,전후,점에서 보아,정도에 
이르다,제,제각기,제외하고,조금,조차,조차도,졸졸,좀,좋아,좍좍,주룩주룩,주저하지 않고,줄은 몰랏다,줄은모른다,중에서,중의하나,즈음하여,즉,즉시,지든지,지만,지말고,진짜로,쪽으로,차라리,참,참나,첫번째로,쳇,총적으로,총적으로 말하면,총적으로 보면,칠,콸콸,쾅쾅,쿵,타다,타인,탕탕,토하다,통하여,툭,퉤,틈타,팍,팔,퍽,펄렁,하,하게될것이다,하게하다,하겠는가,하고 있다,하고있었다,하곤하였다,하구나,하기 때문에,하기 위하여,하기는한데,하기만 하면,하기보다는,하기에,하나,하느니,하는 김에,하는 편이 낫다,하는것도,하는것만 못하다,하는것이 낫다,하는바,하더라도,하도다,하도록시키다,하도록하다,하든지,하려고하다,하마터면,하면 할수록,하면된다,하면서,하물며,하여금,하여야,하자마자,하지 않는다면,하지 않도록,하지마,하지마라,하지만,하하,한 까닭에,한 이유는,한 후,한다면,한다면 몰라도,한데,한마디,한적이있다,한켠으로는,한항목,할 따름이다,할 생각이다,할 줄 안다,할 지경이다,할 힘이 있다,할때,할만하다,할망정,할뿐,할수있다,할수있어,할줄알다,할지라도,할지언정,함께,해도된다,해도좋다,해봐요,해서는 안된다,해야한다,해요,했어요,향하다,향하여,향해서,허,허걱,허허,헉,헉헉,헐떡헐떡,형식으로 쓰여,혹시,혹은,혼자,훨씬,휘익,휴,흐흐,흥,힘입어,︿,~,¥
@@ -0,0 +1 @@
1
+ de,en,van,ik,te,dat,die,in,een,hij,het,niet,zijn,is,was,op,aan,met,als,voor,had,er,maar,om,hem,dan,zou,of,wat,mijn,men,dit,zo,door,over,ze,zich,bij,ook,tot,je,mij,uit,der,daar,haar,naar,heb,hoe,heeft,hebben,deze,u,want,nog,zal,me,zij,nu,ge,geen,omdat,iets,worden,toch,al,waren,veel,meer,doen,toen,moet,ben,zonder,kan,hun,dus,alles,onder,ja,eens,hier,wie,werd,altijd,doch,wordt,wezen,kunnen,ons,zelf,tegen,na,reeds,wil,kon,niets,uw,iemand,geweest,andere
@@ -0,0 +1 @@
1
+ a,aby,ach,acz,aczkolwiek,aj,albo,ale,ależ,ani,aż,bardziej,bardzo,bo,bowiem,by,byli,bynajmniej,być,był,była,było,były,będzie,będą,cali,cała,cały,ci,cię,ciebie,co,cokolwiek,coś,czasami,czasem,czemu,czy,czyli,daleko,dla,dlaczego,dlatego,do,dobrze,dokąd,dość,dużo,dwa,dwaj,dwie,dwoje,dziś,dzisiaj,gdy,gdyby,gdyż,gdzie,gdziekolwiek,gdzieś,i,ich,ile,im,inna,inne,inny,innych,iż,ja,ją,jak,jakaś,jakby,jaki,jakichś,jakie,jakiś,jakiż,jakkolwiek,jako,jakoś,je,jeden,jedna,jedno,jednak,jednakże,jego,jej,jemu,jest,jestem,jeszcze,jeśli,jeżeli,już,ją,każdy,kiedy,kilka,kimś,kto,ktokolwiek,ktoś,która,które,którego,której,który,których,którym,którzy,ku,lat,lecz,lub,ma,mają,mało,mam,mi,mimo,między,mną,mnie,mogą,moi,moim,moja,moje,może,możliwe,można,mój,mu,musi,my,na,nad,nam,nami,nas,nasi,nasz,nasza,nasze,naszego,naszych,natomiast,natychmiast,nawet,nią,nic,nich,nie,niech,niego,niej,niemu,nigdy,nim,nimi,niż,no,o,obok,od,około,on,ona,one,oni,ono,oraz,oto,owszem,pan,pana,pani,po,pod,podczas,pomimo,ponad,ponieważ,powinien,powinna,powinni,powinno,poza,prawie,przecież,przed,przede,przedtem,przez,przy,roku,również,sama,są,się,skąd,sobie,sobą,sposób,swoje,ta,tak,taka,taki,takie,także,tam,te,tego,tej,temu,ten,teraz,też,to,tobą,tobie,toteż,trzeba,tu,tutaj,twoi,twoim,twoja,twoje,twym,twój,ty,tych,tylko,tym,u,w,wam,wami,was,wasz,wasza,wasze,we,według,wiele,wielu,więc,więcej,wszyscy,wszystkich,wszystkie,wszystkim,wszystko,wtedy,wy,właśnie,z,za,zapewne,zawsze,ze,zł,znowu,znów,został,żaden,żadna,żadne,żadnych,że,żeby
@@ -0,0 +1 @@
1
+ de,a,o,que,e,do,da,em,um,para,com,não,uma,os,no,se,na,por,mais,as,dos,como,mas,ao,ele,das,à,seu,sua,ou,quando,muito,nos,já,eu,também,só,pelo,pela,até,isso,ela,entre,depois,sem,mesmo,aos,seus,quem,nas,me,esse,eles,você,essa,num,nem,suas,meu,às,minha,numa,pelos,elas,qual,nós,lhe,deles,essas,esses,pelas,este,dele,tu,te,vocês,vos,lhes,meus,minhas,teu,tua,teus,tuas,nosso,nossa,nossos,nossas,dela,delas,esta,estes,estas,aquele,aquela,aqueles,aquelas,isto,aquilo,estou,está,estamos,estão,estive,esteve,estivemos,estiveram,estava,estávamos,estavam,estivera,estivéramos,esteja,estejamos,estejam,estivesse,estivéssemos,estivessem,estiver,estivermos,estiverem,hei,há,havemos,hão,houve,houvemos,houveram,houvera,houvéramos,haja,hajamos,hajam,houvesse,houvéssemos,houvessem,houver,houvermos,houverem,houverei,houverá,houveremos,houverão,houveria,houveríamos,houveriam,sou,somos,são,era,éramos,eram,fui,foi,fomos,foram,fora,fôramos,seja,sejamos,sejam,fosse,fôssemos,fossem,for,formos,forem,serei,será,seremos,serão,seria,seríamos,seriam,tenho,tem,temos,tém,tinha,tínhamos,tinham,tive,teve,tivemos,tiveram,tivera,tivéramos,tenha,tenhamos,tenham,tivesse,tivéssemos,tivessem,tiver,tivermos,tiverem,terei,terá,teremos,terão,teria,teríamos,teriam
@@ -0,0 +1 @@
1
+ acea,aceasta,această,aceea,acei,aceia,acel,acela,acele,acelea,acest,acesta,aceste,acestea,aceşti,aceştia,acolo,acord,acum,ai,aia,aibă,aici,al,ăla,ale,alea,ălea,altceva,altcineva,am,ar,are,aş,aşadar,asemenea,asta,ăsta,astăzi,astea,ăstea,ăştia,asupra,aţi,au,avea,avem,aveţi,azi,bine,bucur,bună,ca,că,căci,când,care,cărei,căror,cărui,cât,câte,câţi,către,câtva,caut,ce,cel,ceva,chiar,cinci,cînd,cine,cineva,cît,cîte,cîţi,cîtva,contra,cu,cum,cumva,curând,curînd,da,dă,dacă,dar,dată,datorită,dau,de,deci,deja,deoarece,departe,deşi,din,dinaintea,dintr-,dintre,doi,doilea,două,drept,după,ea,ei,el,ele,eram,este,eşti,eu,face,fără,fata,fi,fie,fiecare,fii,fim,fiţi,fiu,frumos,graţie,halbă,iar,ieri,îi,îl,îmi,împotriva,în,înainte,înaintea,încât,încît,încotro,între,întrucât,întrucît,îţi,la,lângă,le,li,lîngă,lor,lui,mă,mai,mâine,mea,mei,mele,mereu,meu,mi,mie,mîine,mine,mult,multă,mulţi,mulţumesc,ne,nevoie,nicăieri,nici,nimeni,nimeri,nimic,nişte,noastră,noastre,noi,noroc,noştri,nostru,nouă,nu,opt,ori,oricând,oricare,oricât,orice,oricînd,oricine,oricît,oricum,oriunde,până,patra,patru,patrulea,pe,pentru,peste,pic,pînă,poate,pot,prea,prima,primul,prin,puţin,puţina,puţină,rog,sa,să,săi,sale,şapte,şase,sau,său,se,şi,sînt,sîntem,sînteţi,spate,spre,ştiu,sub,sunt,suntem,sunteţi,sută,ta,tăi,tale,tău,te,ţi,ţie,timp,tine,toată,toate,tot,toţi,totuşi,trei,treia,treilea,tu,un,una,unde,undeva,unei,uneia,unele,uneori,unii,unor,unora,unu,unui,unuia,unul,vă,vi,voastră,voastre,voi,voştri,vostru,vouă,vreme,vreo,vreun,zece,zero,zi,zice
@@ -0,0 +1 @@
1
+ и,в,во,не,что,он,на,я,с,со,как,а,то,все,она,так,его,но,да,ты,к,у,же,вы,за,бы,по,только,ее,мне,было,вот,от,меня,еще,нет,о,из,ему,теперь,когда,даже,ну,вдруг,ли,если,уже,или,ни,быть,был,него,до,вас,нибудь,опять,уж,вам,сказал,ведь,там,потом,себя,ничего,ей,может,они,тут,где,есть,надо,ней,для,мы,тебя,их,чем,была,сам,чтоб,без,будто,человек,чего,раз,тоже,себе,под,жизнь,будет,ж,тогда,кто,этот,говорил,того,потому,этого,какой,совсем,ним,здесь,этом,один,почти,мой,тем,чтобы,нее,кажется,сейчас,были,куда,зачем,сказать,всех,никогда,сегодня,можно,при,наконец,два,об,другой,хоть,после,над,больше,тот,через,эти,нас,про,всего,них,какая,много,разве,сказала,три,эту,моя,впрочем,хорошо,свою,этой,перед,иногда,лучше,чуть,том,нельзя,такой,им,более,всегда,конечно,всю,между
@@ -0,0 +1 @@
1
+ och,det,att,i,en,jag,hon,som,han,på,den,med,var,sig,för,så,till,är,men,ett,om,hade,de,av,icke,mig,du,henne,då,sin,nu,har,inte,hans,honom,skulle,hennes,där,min,man,ej,vid,kunde,något,från,ut,när,efter,upp,vi,dem,vara,vad,över,än,dig,kan,sina,här,ha,mot,alla,under,någon,eller,allt,mycket,sedan,ju,denna,själv,detta,åt,utan,varit,hur,ingen,mitt,ni,bli,blev,oss,din,dessa,några,deras,blir,mina,samma,vilken,er,sådan,vår,blivit,dess,inom,mellan,sådant,varför,varje,vilka,ditt,vem,vilket,sitta,sådana,vart,dina,vars,vårt,våra,ert,era,vilkas
@@ -0,0 +1 @@
1
+ กล่าว,กว่า,กัน,กับ,การ,ก็,ก่อน,ขณะ,ขอ,ของ,ขึ้น,คง,ครั้ง,ความ,คือ,จะ,จัด,จาก,จึง,ช่วง,ซึ่ง,ดัง,ด้วย,ด้าน,ตั้ง,ตั้งแต่,ตาม,ต่อ,ต่าง,ต่างๆ,ต้อง,ถึง,ถูก,ถ้า,ทั้ง,ทั้งนี้,ทาง,ที่,ที่สุด,ทุก,ทํา,ทําให้,นอกจาก,นัก,นั้น,นี้,น่า,นํา,บาง,ผล,ผ่าน,พบ,พร้อม,มา,มาก,มี,ยัง,รวม,ระหว่าง,รับ,ราย,ร่วม,ลง,วัน,ว่า,สุด,ส่ง,ส่วน,สําหรับ,หนึ่ง,หรือ,หลัง,หลังจาก,หลาย,หาก,อยาก,อยู่,อย่าง,ออก,อะไร,อาจ,อีก,เขา,เข้า,เคย,เฉพาะ,เช่น,เดียว,เดียวกัน,เนื่องจาก,เปิด,เปิดเผย,เป็น,เป็นการ,เพราะ,เพื่อ,เมื่อ,เรา,เริ่ม,เลย,เห็น,เอง,แต่,แบบ,แรก,และ,แล้ว,แห่ง,โดย,ใน,ให้,ได้,ไป,ไม่,ไว้
@@ -0,0 +1 @@
1
+ acaba,acep,adeta,altmış,altmış,altı,altı,ama,ancak,arada,artık,aslında,aynen,ayrıca,az,bana,bari,bazen,bazı,bazı,başka,belki,ben,benden,beni,benim,beri,beş,beş,beş,bile,bin,bir,biraz,biri,birkaç,birkez,birçok,birşey,birşeyi,birşey,birşeyi,birşey,biz,bizden,bize,bizi,bizim,bu,buna,bunda,bundan,bunlar,bunları,bunların,bunu,bunun,burada,böyle,böylece,bütün,da,daha,dahi,dahil,daima,dair,dayanarak,de,defa,deđil,değil,diye,diđer,diğer,doksan,dokuz,dolayı,dolayısıyla,dört,edecek,eden,ederek,edilecek,ediliyor,edilmesi,ediyor,elli,en,etmesi,etti,ettiği,ettiğini,eđer,eğer,fakat,gibi,göre,halbuki,halen,hangi,hani,hariç,hatta,hele,hem,henüz,hep,hepsi,her,herhangi,herkes,herkesin,hiç,hiçbir,iken,iki,ila,ile,ilgili,ilk,illa,ise,itibaren,itibariyle,iyi,iyice,için,işte,işte,kadar,kanımca,karşın,katrilyon,kendi,kendilerine,kendini,kendisi,kendisine,kendisini,kere,kez,keşke,ki,kim,kimden,kime,kimi,kimse,kırk,kısaca,kırk,lakin,madem,međer,milyar,milyon,mu,mü,mı,mı,nasıl,nasıl,ne,neden,nedenle,nerde,nere,nerede,nereye,nitekim,niye,niçin,o,olan,olarak,oldu,olduklarını,olduğu,olduğunu,olmadı,olmadığı,olmak,olması,olmayan,olmaz,olsa,olsun,olup,olur,olursa,oluyor,on,ona,ondan,onlar,onlardan,onlari,onların,onları,onların,onu,onun,otuz,oysa,pek,rağmen,sadece,sanki,sekiz,seksen,sen,senden,seni,senin,siz,sizden,sizi,sizin,sonra,tarafından,trilyon,tüm,var,vardı,ve,veya,veyahut,ya,yahut,yani,yapacak,yapmak,yaptı,yaptıkları,yaptığı,yaptığını,yapılan,yapılması,yapıyor,yedi,yerine,yetmiş,yetmiş,yetmiş,yine,yirmi,yoksa,yüz,zaten,çok,çünkü,öyle,üzere,üç,şey,şeyden,şeyi,şeyler,şu,şuna,şunda,şundan,şunu,şey,şeyden,şeyi,şeyler,şu,şuna,şunda,şundan,şunları,şunu,şöyle,şayet,şimdi,şu,şöyle
@@ -0,0 +1 @@
1
+ bị,bởi,cả,các,cái,cần,càng,chỉ,chiếc,cho,chứ,chưa,chuyện,có,có thể,cứ,của,cùng,cũng,đã,đang,để,đến nỗi,đều,điều,do,đó,được,dưới,gì,khi,không,là,lại,lên,lúc,mà,mỗi,một cách,này,nên,nếu,ngay,nhiều,như,nhưng,những,nơi,nữa,phải,qua,ra,rằng,rất,rồi,sau,sẽ,so,sự,tại,theo,thì,trên,trước,từ,từng,và,vẫn,vào,vậy,vì,việc,với,vừa,vâng,à,ừ,từ
@@ -0,0 +1 @@
1
+ 的,地,得,和,跟,与,及,向,并,等,更,已,含,做,我,你,他,她,们,某,该,各,每,这,那,哪,什,么,谁,年,月,日,时,分,秒,几,多,来,在,就,又,很,呢,吧,吗,了,嘛,哇,儿,哼,啊,嗯,是,着,都,不,说,也,看,把,还,个,有,小,到,一,为,中,于,对,会,之,第,此,或,共,按,请
@@ -0,0 +1,20 @@
1
module Stopwords
  module Snowball
    # Language-dispatching front end: holds one Stopwords::Snowball::Filter per
    # bundled locale and forwards each query to the filter of the requested
    # language.
    #
    # Both query methods take an options hash. The language may be given as a
    # Symbol (+:es+) or a String (+"es"+). When the language is missing or no
    # locale file exists for it, the query is answered without filtering
    # (+false+ / the words unchanged) instead of failing on a nil filter.
    class WordSieve
      # Builds a filter for every +locales/*.csv+ file found next to this
      # source file, keyed by the file's base name as a Symbol.
      #
      # @param custom_list [Array] passed through unchanged as the second
      #   argument of every Stopwords::Snowball::Filter.new call
      def initialize(custom_list = [])
        @filters = Dir["#{File.dirname(__FILE__)}/locales/*.csv"].each_with_object({}) do |file, filters|
          lang = File.basename(file, '.csv')
          filters[lang.to_sym] = Stopwords::Snowball::Filter.new lang, custom_list
        end
      end

      # Asks the filter of the given language whether a word is a stopword.
      #
      # @param args [Hash] +:lang+ (Symbol or String) and +:word+
      # @return the language filter's +stopword?+ answer, or +false+ when
      #   +:lang+ is absent or no filter is registered for it
      def stopword?(args = {})
        language_filter = filter_for(args[:lang])
        language_filter ? language_filter.stopword?(args[:word]) : false
      end

      # Runs a list of words through the filter of the given language.
      #
      # @param args [Hash] +:lang+ (Symbol or String) and +:words+
      # @return the language filter's +filter+ result, or +args[:words]+
      #   untouched when +:lang+ is absent or no filter is registered for it
      def filter(args = {})
        language_filter = filter_for(args[:lang])
        language_filter ? language_filter.filter(args[:words]) : args[:words]
      end

      private

      # Looks up the filter registered for +lang+.
      #
      # Filters are stored under Symbol keys, so the language is normalised
      # with +to_sym+; anything that cannot be converted (nil, false, ...)
      # simply has no filter.
      #
      # @return the matching filter, or nil when there is none
      def filter_for(lang)
        return unless lang.respond_to?(:to_sym)

        @filters[lang.to_sym]
      end
    end
  end
end
@@ -0,0 +1,4 @@
1
+ module Stopwords::Snowball
2
+ require_relative 'snowball/filter'
3
+ require_relative 'snowball/wordsieve'
4
+ end
data/lib/stopwords.rb ADDED
@@ -0,0 +1,4 @@
1
+ module Stopwords
2
+ require_relative 'stopwords/filter.rb'
3
+ require_relative 'stopwords/snowball'
4
+ end
@@ -0,0 +1,18 @@
1
+ require_relative("../spec_helper.rb")
2
+
3
# Examples for the plain, list-driven filter: the filter is built from an
# explicit stopword list and is expected to drop those words from an input
# list, regardless of letter case.
describe Stopwords::Filter do
  context "when fed with a list of arbitrary words" do
    let(:stopwords) { %w[A desde] }
    let(:filter) { Stopwords::Filter.new(stopwords) }

    subject { filter }

    it "should remove the stopwords for the list of words to be filtered" do
      remaining = filter.filter(%w[desde Santurce A Bilbao])
      expect(remaining).to eq %w[Santurce Bilbao]
    end

    # The input's casing is the opposite of the casing in the stopword list.
    it "should remove stopwords even if upcase and downcases doesn't match" do
      remaining = filter.filter(%w[Desde Santurce a Bilbao])
      expect(remaining).to eq %w[Santurce Bilbao]
    end
  end
end
@@ -0,0 +1,40 @@
1
+ # encoding: utf-8
2
+ require_relative("../spec_helper.rb")
3
+
4
# Examples for the locale-backed filter: it is built from a locale code (plus
# an optional custom word list) and is expected to expose that locale's
# stopwords, filter word lists with them, and reject unknown locales.
describe Stopwords::Snowball::Filter do
  context "when pointed to a valid locale" do
    let(:filter) { Stopwords::Snowball::Filter.new("es") }

    subject { filter }

    it "should have the appropiate stopwords" do
      # Complete expected list for the "es" locale, in order.
      expected = %w[
        de la que el en y a los del se las por un para con no una su al lo
        como más pero sus le ya o este sí porque esta entre cuando muy sin
        sobre también me hasta hay donde quien desde todo nos durante todos
        uno les ni contra otros ese eso ante ellos e esto mí antes algunos
        qué unos yo otro otras otra él tanto esa estos mucho quienes nada
        muchos cual poco ella estar estas algunas algo nosotros mi mis tú te
        ti tu tus ellas nosotras vosotros vosotras os mío mía míos mías tuyo
        tuya tuyos tuyas suyo suya suyos suyas nuestro nuestra nuestros
        nuestras vuestro vuestra vuestros vuestras esos esas
        estoy estás está estamos estáis están esté estés estemos estéis estén
        estaré estarás estará estaremos estaréis estarán
        estaría estarías estaríamos estaríais estarían
        estaba estabas estábamos estabais estaban
        estuve estuviste estuvo estuvimos estuvisteis estuvieron
        estuviera estuvieras estuviéramos estuvierais estuvieran
        estuviese estuvieses estuviésemos estuvieseis estuviesen
        estando estada estadas estad
        he has ha hemos habéis han haya hayas hayamos hayáis hayan
        habré habrás habrá habremos habréis habrán
        habría habrías habríamos habríais habrían
        había habías habíamos habíais habían
        hube hubiste hubo hubimos hubisteis hubieron
        hubiera hubieras hubiéramos hubierais hubieran
        hubiese hubieses hubiésemos hubieseis hubiesen
        habiendo habido habida habidos habidas
        soy eres es somos sois son sea seas seamos seáis sean
        seré serás será seremos seréis serán
        sería serías seríamos seríais serían
        era eras éramos erais eran
        fui fuiste fue fuimos fuisteis fueron
        fuera fueras fuéramos fuerais fueran
        fuese fueses fuésemos fueseis fuesen
        siendo sido
        tengo tienes tiene tenemos tenéis tienen
        tenga tengas tengamos tengáis tengan
        tendré tendrás tendrá tendremos tendréis tendrán
        tendría tendrías tendríamos tendríais tendrían
        tenía tenías teníamos teníais tenían
        tuve tuviste tuvo tuvimos tuvisteis tuvieron
        tuviera tuvieras tuviéramos tuvierais tuvieran
        tuviese tuvieses tuviésemos tuvieseis tuviesen
        teniendo tenido tenida tenidos tenidas tened
        algunes algunxs elle ellx elles ellxs ese esx eses esxs
        estes este estxs estx lx le lxs les
        mucha muchas muches muchxs míe míes míx míxs
        nosotres nosotrxs nuestre nuestres nuestrx nuestrxs
        otre otrx otres otrxs poca poque pocx
        suye suyx suyes suyxs tantas tantxs tantes
        tenide tenides tenidx tenidxs
        toda todas tode todes todx todxs
        tuye tuyes tuyx tuyxs une unx unxs unes
        vosotrxs vosotres vuestre vuestres vuestrx vuestrxs
      ]

      expect(subject.stopwords).to eq expected
    end

    it "should remove the stopwords for the list of words to be filtered" do
      remaining = filter.filter(%w[desde Santurce a Bilbao])
      expect(remaining).to eq %w[Santurce Bilbao]
    end
  end

  context "when custom list" do
    let(:filter) { Stopwords::Snowball::Filter.new("es", %w[Santurce]) }

    subject { filter }

    # "Santurce" is only in the custom list, so it must be dropped as well.
    it "should remove the stopwords for the list of words to be filtered" do
      remaining = filter.filter(%w[desde Santurce a Bilbao])
      expect(remaining).to eq %w[Bilbao]
    end
  end

  context "when locale is not found" do
    let(:filter) { Stopwords::Snowball::Filter.new("no-real") }

    subject { filter }

    # `filter` is lazy, so the constructor only runs inside the expect block.
    it "should throw an error explaining the locale not found" do
      expect { filter }.to raise_error(ArgumentError)
    end
  end
end
@@ -0,0 +1 @@
1
+ require_relative '../lib/stopwords'
metadata ADDED
@@ -0,0 +1,91 @@
1
+ --- !ruby/object:Gem::Specification
2
+ name: stopwords-filter2
3
+ version: !ruby/object:Gem::Version
4
+ version: 0.1.0
5
+ platform: ruby
6
+ authors:
7
+ - Aaron Stillwell
8
+ - David J. Brenes
9
+ autorequire:
10
+ bindir: bin
11
+ cert_chain: []
12
+ date: 2023-02-04 00:00:00.000000000 Z
13
+ dependencies: []
14
+ description: Small library that allows you to create a simple stopwords filter or
15
+ use some based on Snowball stopwords lists
16
+ email: stillwell.mailbox@gmail.com
17
+ executables: []
18
+ extensions: []
19
+ extra_rdoc_files:
20
+ - CHANGELOG.md
21
+ - LICENSE.txt
22
+ - README.md
23
+ files:
24
+ - CHANGELOG.md
25
+ - Gemfile
26
+ - Gemfile.lock
27
+ - LICENSE.txt
28
+ - README.md
29
+ - VERSION
30
+ - lib/stopwords.rb
31
+ - lib/stopwords/filter.rb
32
+ - lib/stopwords/snowball.rb
33
+ - lib/stopwords/snowball/filter.rb
34
+ - lib/stopwords/snowball/locales/af.csv
35
+ - lib/stopwords/snowball/locales/ar.csv
36
+ - lib/stopwords/snowball/locales/bg.csv
37
+ - lib/stopwords/snowball/locales/bn.csv
38
+ - lib/stopwords/snowball/locales/br.csv
39
+ - lib/stopwords/snowball/locales/ca.csv
40
+ - lib/stopwords/snowball/locales/cs.csv
41
+ - lib/stopwords/snowball/locales/da.csv
42
+ - lib/stopwords/snowball/locales/de.csv
43
+ - lib/stopwords/snowball/locales/el.csv
44
+ - lib/stopwords/snowball/locales/en.csv
45
+ - lib/stopwords/snowball/locales/es.csv
46
+ - lib/stopwords/snowball/locales/fi.csv
47
+ - lib/stopwords/snowball/locales/fn.csv
48
+ - lib/stopwords/snowball/locales/fr.csv
49
+ - lib/stopwords/snowball/locales/he.csv
50
+ - lib/stopwords/snowball/locales/hu.csv
51
+ - lib/stopwords/snowball/locales/id.csv
52
+ - lib/stopwords/snowball/locales/it.csv
53
+ - lib/stopwords/snowball/locales/ko.csv
54
+ - lib/stopwords/snowball/locales/nl.csv
55
+ - lib/stopwords/snowball/locales/pl.csv
56
+ - lib/stopwords/snowball/locales/pt.csv
57
+ - lib/stopwords/snowball/locales/ro.csv
58
+ - lib/stopwords/snowball/locales/ru.csv
59
+ - lib/stopwords/snowball/locales/sv.csv
60
+ - lib/stopwords/snowball/locales/th.csv
61
+ - lib/stopwords/snowball/locales/tr.csv
62
+ - lib/stopwords/snowball/locales/vi.csv
63
+ - lib/stopwords/snowball/locales/zh.csv
64
+ - lib/stopwords/snowball/wordsieve.rb
65
+ - spec/lib/filter_spec.rb
66
+ - spec/lib/snowball_filter_spec.rb
67
+ - spec/spec_helper.rb
68
+ homepage: http://github.com/aaronstillwell/stopwords-filter2
69
+ licenses:
70
+ - MIT
71
+ metadata: {}
72
+ post_install_message:
73
+ rdoc_options: []
74
+ require_paths:
75
+ - lib
76
+ required_ruby_version: !ruby/object:Gem::Requirement
77
+ requirements:
78
+ - - ">="
79
+ - !ruby/object:Gem::Version
80
+ version: '2.4'
81
+ required_rubygems_version: !ruby/object:Gem::Requirement
82
+ requirements:
83
+ - - ">="
84
+ - !ruby/object:Gem::Version
85
+ version: '0'
86
+ requirements: []
87
+ rubygems_version: 3.4.1
88
+ signing_key:
89
+ specification_version: 4
90
+ summary: Snowball based filters for stopwords
91
+ test_files: []