stopwords-filters 1.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (66) hide show
  1. checksums.yaml +7 -0
  2. data/CHANGELOG +75 -0
  3. data/Gemfile +6 -0
  4. data/Gemfile.lock +27 -0
  5. data/LICENSE.txt +20 -0
  6. data/README.md +182 -0
  7. data/VERSION +1 -0
  8. data/lib/stopwords/filter.rb +20 -0
  9. data/lib/stopwords/snowball/filter.rb +22 -0
  10. data/lib/stopwords/snowball/locales/af +1 -0
  11. data/lib/stopwords/snowball/locales/ar +1 -0
  12. data/lib/stopwords/snowball/locales/bg +1 -0
  13. data/lib/stopwords/snowball/locales/bn +1 -0
  14. data/lib/stopwords/snowball/locales/ca +1 -0
  15. data/lib/stopwords/snowball/locales/ckb +1 -0
  16. data/lib/stopwords/snowball/locales/cz +1 -0
  17. data/lib/stopwords/snowball/locales/da +1 -0
  18. data/lib/stopwords/snowball/locales/de +1 -0
  19. data/lib/stopwords/snowball/locales/el +1 -0
  20. data/lib/stopwords/snowball/locales/en +1 -0
  21. data/lib/stopwords/snowball/locales/eo +1 -0
  22. data/lib/stopwords/snowball/locales/es +1 -0
  23. data/lib/stopwords/snowball/locales/et +1 -0
  24. data/lib/stopwords/snowball/locales/eu +1 -0
  25. data/lib/stopwords/snowball/locales/fa +1 -0
  26. data/lib/stopwords/snowball/locales/fi +1 -0
  27. data/lib/stopwords/snowball/locales/fr +1 -0
  28. data/lib/stopwords/snowball/locales/ga +1 -0
  29. data/lib/stopwords/snowball/locales/gl +1 -0
  30. data/lib/stopwords/snowball/locales/he +1 -0
  31. data/lib/stopwords/snowball/locales/hi +1 -0
  32. data/lib/stopwords/snowball/locales/hr +1 -0
  33. data/lib/stopwords/snowball/locales/hu +1 -0
  34. data/lib/stopwords/snowball/locales/hy +1 -0
  35. data/lib/stopwords/snowball/locales/id +1 -0
  36. data/lib/stopwords/snowball/locales/it +1 -0
  37. data/lib/stopwords/snowball/locales/ja +1 -0
  38. data/lib/stopwords/snowball/locales/ko +1 -0
  39. data/lib/stopwords/snowball/locales/la +1 -0
  40. data/lib/stopwords/snowball/locales/lt +1 -0
  41. data/lib/stopwords/snowball/locales/lv +1 -0
  42. data/lib/stopwords/snowball/locales/mr +1 -0
  43. data/lib/stopwords/snowball/locales/nl +1 -0
  44. data/lib/stopwords/snowball/locales/no +1 -0
  45. data/lib/stopwords/snowball/locales/pl +1 -0
  46. data/lib/stopwords/snowball/locales/pt +1 -0
  47. data/lib/stopwords/snowball/locales/ro +1 -0
  48. data/lib/stopwords/snowball/locales/ru +1 -0
  49. data/lib/stopwords/snowball/locales/sk +1 -0
  50. data/lib/stopwords/snowball/locales/sl +1 -0
  51. data/lib/stopwords/snowball/locales/so +1 -0
  52. data/lib/stopwords/snowball/locales/st +1 -0
  53. data/lib/stopwords/snowball/locales/sv +1 -0
  54. data/lib/stopwords/snowball/locales/sw +1 -0
  55. data/lib/stopwords/snowball/locales/th +1 -0
  56. data/lib/stopwords/snowball/locales/tr +1 -0
  57. data/lib/stopwords/snowball/locales/yo +1 -0
  58. data/lib/stopwords/snowball/locales/zh +1 -0
  59. data/lib/stopwords/snowball/locales/zu +1 -0
  60. data/lib/stopwords/snowball/wordsieve.rb +21 -0
  61. data/lib/stopwords/snowball.rb +7 -0
  62. data/lib/stopwords.rb +7 -0
  63. data/spec/lib/filter_spec.rb +19 -0
  64. data/spec/lib/snowball_filter_spec.rb +40 -0
  65. data/spec/spec_helper.rb +3 -0
  66. metadata +110 -0
checksums.yaml ADDED
@@ -0,0 +1,7 @@
1
+ ---
2
+ SHA256:
3
+ metadata.gz: c4bb71d8681c57c1e30c987d017207a62a5032e3980c81283ac1e646f5ab432e
4
+ data.tar.gz: 2b03009e17c188ae050ce8a276a15b50c7930cf866815a87e9dcefeec45c0707
5
+ SHA512:
6
+ metadata.gz: 84ca8d38c1d46f391dedc9685249954f9bf6fa6d31aec29b08115ff14e32c099c5158c1d5aac93c6867a5d52120adcb5d2d378426f82bbdb4e96e14e3b936b38
7
+ data.tar.gz: 15120d3995de807b8ea8de59b04a51ecd5afb233310658472e7ad5b633b6ff31249a88c0f449ad09eed5cb849c1c7b7d94fd662b82d1539343e076a035bdcfac
data/CHANGELOG ADDED
@@ -0,0 +1,75 @@
1
+ 1.0.0:
2
+ * Updated language files to use ManticoreSearch stopwords
3
+ * Added support for the following languages:
4
+ * Afrikaans (af)
5
+ * Arabic (ar)
6
+ * Bengali (bn)
7
+ * Breton (br)
8
+ * Catalán (ca)
9
+ * Chinese (zh)
10
+ * Czech (cs)
11
+ * Danish (da)
12
+ * German (de)
13
+ * Greek (el)
14
+ * English (en)
15
+ * Spanish (es)
16
+ * Finnish (fi)
17
+ * French (fr)
18
+ * Hebrew (he)
19
+ * Hungarian (hu)
20
+ * Indonesian (id)
21
+ * Italian (it)
22
+ * Korean (ko)
23
+ * Dutch (nl)
24
+ * Polish (pl)
25
+ * Portuguese (pt)
26
+ * Romanian (ro)
27
+ * Russian (ru)
28
+ * Swedish (sv)
29
+ * Thai (th)
30
+ * Turkish (tr)
31
+ * Vietnamese (vi)
32
+ * Tested the gem with Ruby 3.2 to ensure compatibility
33
+
34
+ 0.7.0:
35
+ * Fixed WordSieve class [@hmaack] [#19]
36
+ * Added support for Chinese (zh) [@bettysteger] [#20]
37
+
38
+ 0.6.0:
39
+ * Added support for: [@bettysteger] [#16]
40
+ * Afrikaans (af)
41
+ * Arabic (ar)
42
+ * Bengali (bn)
43
+ * Breton (br)
44
+ * Catalán (ca)
45
+ * Czech (cs)
46
+ * Hebrew (he)
47
+ * Indonesian (id)
48
+ * Korean (ko)
49
+ * Thai (th)
50
+ * Turkish (tr)
51
+ * Vietnamese (vi)
52
+ * Added keywords for English and German [@bettysteger] [#16]
53
+ * Fixed upcase/downcase behaviour [@bettysteger] [#16]
54
+ * Added gender neutral versions of some words in spanish [@fauno] [#17]
55
+ * Bumped rdoc version [@dependabot] [#18]
56
+ * Fixed Finnish locale code from `fn` to `fi`
57
+ 0.5.0:
58
+ * Added Greek stopwords based on Lucene [@vrypan] [#13]
59
+ * Fixed CSV format for sv and ru locales [@woto] [#14]
60
+ * Fixed romanian and polish CSV not being included in the gemspec.
61
+ 0.4.1:
62
+ * Dummy version to fix metadata in gemspec
63
+ 0.4.0:
64
+ * Added Polish stopwords based on https://pl.wikipedia.org/wiki/Wikipedia:Stopwords [@grzegorzblaszczyk] [#9]
65
+ * Added info when no locale is found on snowball filter [@nerde] [#10]
66
+ 0.3.0:
67
+ * Added custom words list to snowball filter [@sbeckeriv]
68
+ * Fixed problem about initialization: https://github.com/brenes//issues/3 [@zackxu1]
69
+ 0.2.0:
70
+ * Added stopword? method [@s2gatev]
71
+ * Added Sieve class [@s2gatev]
72
+ * Added bulgarian language [@s2gatev]
73
+ 0.1.0:
74
+ * Added simple filter [@brenes]
75
+ * Added snowball filter [@brenes]
data/Gemfile ADDED
@@ -0,0 +1,6 @@
1
+ # A sample Gemfile
2
+ source 'https://rubygems.org'
3
+
4
+ group :test do
5
+ gem 'rspec'
6
+ end
data/Gemfile.lock ADDED
@@ -0,0 +1,27 @@
1
+ GEM
2
+ remote: https://rubygems.org/
3
+ specs:
4
+ diff-lcs (1.5.1)
5
+ rspec (3.13.0)
6
+ rspec-core (~> 3.13.0)
7
+ rspec-expectations (~> 3.13.0)
8
+ rspec-mocks (~> 3.13.0)
9
+ rspec-core (3.13.1)
10
+ rspec-support (~> 3.13.0)
11
+ rspec-expectations (3.13.2)
12
+ diff-lcs (>= 1.2.0, < 2.0)
13
+ rspec-support (~> 3.13.0)
14
+ rspec-mocks (3.13.1)
15
+ diff-lcs (>= 1.2.0, < 2.0)
16
+ rspec-support (~> 3.13.0)
17
+ rspec-support (3.13.1)
18
+
19
+ PLATFORMS
20
+ arm64-darwin-23
21
+ ruby
22
+
23
+ DEPENDENCIES
24
+ rspec
25
+
26
+ BUNDLED WITH
27
+ 2.5.6
data/LICENSE.txt ADDED
@@ -0,0 +1,20 @@
1
+ Copyright (c) 2012 David J. Brenes
2
+
3
+ Permission is hereby granted, free of charge, to any person obtaining
4
+ a copy of this software and associated documentation files (the
5
+ "Software"), to deal in the Software without restriction, including
6
+ without limitation the rights to use, copy, modify, merge, publish,
7
+ distribute, sublicense, and/or sell copies of the Software, and to
8
+ permit persons to whom the Software is furnished to do so, subject to
9
+ the following conditions:
10
+
11
+ The above copyright notice and this permission notice shall be
12
+ included in all copies or substantial portions of the Software.
13
+
14
+ THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
15
+ EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
16
+ MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
17
+ NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE
18
+ LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
19
+ OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
20
+ WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
data/README.md ADDED
@@ -0,0 +1,182 @@
1
+ Stopwords Filter
2
+ ================
3
+
4
+ [![Build Status](https://travis-ci.org/brenes/.svg?branch=master)](https://travis-ci.org/brenes/)
5
+
6
+ This project is a very simple and naive implementation of a stopwords filter that removes a list of banned words (stopwords) from a sentence.
7
+
8
+ Quick guide
9
+ -----------
10
+
11
+ * Install
12
+
13
+ just type
14
+
15
+ ```
16
+ gem install stopwords-filters
17
+ ```
18
+
19
+ or
20
+
21
+ ```
22
+ # Don't forget the 'require:'
23
+ gem 'stopwords-filters', require: 'stopwords'
24
+ ```
25
+
26
+ in your Gemfile.
27
+
28
+ * Use it
29
+
30
+ 1. Simple version
31
+
32
+ ```
33
+ stopwords = ['by', 'written', 'from']
34
+ filter = Stopwords::Filter.new stopwords
35
+
36
+ filter.filter 'guide by douglas adams'.split
37
+ # ['guide', 'douglas', 'adams']
38
+
39
+ filter.stopword? 'by'
40
+ # true
41
+ ```
42
+
43
+ 2. Snowball version
44
+
45
+
46
+ ```
47
+ filter = Stopwords::Snowball::Filter.new "en"
48
+ filter.filter 'guide by douglas adams'.split
49
+ # ['guide', 'douglas', 'adams']
50
+
51
+ filter.stopword? 'by'
52
+ # true
53
+ ```
54
+
55
+ 2.1 Snowball version with Sieve class (thanks to @s2gatev)
56
+
57
+ ```ruby
58
+ sieve = Stopwords::Snowball::WordSieve.new
59
+
60
+ filtered = sieve.filter lang: :en, words: 'guide by douglas adams'.split
61
+ # filtered = ['guide', 'douglas', 'adams']
62
+
63
+ sieve.stopword? lang: :en, word: 'by'
64
+ # true
65
+ ```
66
+
67
+
68
+
69
+ What is a Stopword?
70
+ -------------------
71
+
72
+ According to [Wikipedia][wikipedia_stopwords]
73
+
74
+ > In computing, stop words are words which are filtered out prior to, or after, processing of natural language data (text).
75
+
76
+ And that's it. Words that are removed before you perform some task on the rest of them.
77
+
78
+ Why would I want to remove anything?
79
+ ------------------------------------
80
+
81
+ Imagine you have a database of products and you want your customers to search on them. You can't use a proper search engine (such as [Solr][solr], [Sphinx][sphinx] or even [Google][google]), nor the full-text search features of popular database systems such as [PostgreSQL][postgre]. You are left alone with LIKEs and %.
82
+
83
+ You have your fake search engine working. Someone searches 'Guide Douglas Adams' and you find 'Douglas Adams - Hitchhiker's guide to the galaxy'. Everything is perfect.
84
+
85
+ But then someone searches 'guide by douglas adams' and you don't find anything. You don't have any 'by' in the description or title of the book! Most importantly, you don't need that 'by'!
86
+
87
+ You wish you could get rid of all those 'by' or 'written' or 'from', huh? That's why we are here!
88
+
89
+ How does this thing work?
90
+ ---------------------
91
+
92
+ The main class of this 'library' is `Stopwords::Filter`. You just create a new object with an array of stopwords:
93
+
94
+ ```
95
+ stopwords = ['by', 'written', 'from']
96
+ filter = Stopwords::Filter.new stopwords
97
+ ```
98
+
99
+ And then you have it: you can just filter
100
+
101
+ ```
102
+ filter.filter 'guide by douglas adams'.split #-> ['guide', 'douglas', 'adams']
103
+ ```
104
+
105
+ That's all?
106
+ -----------
107
+
108
+ I know what you're thinking: it takes a single line of Ruby code to filter one array from another. That's why we have added an extra feature: [Snowball][wikipedia_snowball] stopwords lists, already built for you and ready to use.
109
+
110
+ At least, in the beginning we were using Snowball stopwords, but several collaborators have improved this humble gem by including new languages or adding new stopwords. So now the Snowball version is more of a "Snowball and friends" version.
111
+
112
+ How do I use that snowball thing?
113
+ ---------------------------------
114
+
115
+ You just create the filter with the locale you want to use
116
+
117
+ ```
118
+ filter = Stopwords::Snowball::Filter.new "en"
119
+ ```
120
+
121
+ And then you filter without worrying about the exact stopwords used
122
+
123
+ ```
124
+ filter.filter 'guide by douglas adams'.split #-> ['guide', 'douglas', 'adams']
125
+ ```
126
+
127
+ Which languages are supported with snowball?
128
+ -------------------------------------------
129
+
130
+ Currently we have support for:
131
+
132
+ * Afrikaans (af)
133
+ * Arabic (ar)
134
+ * Bengali (bn)
135
+ * Breton (br)
136
+ * Catalán (ca)
137
+ * Chinese (zh)
138
+ * Czech (cs)
139
+ * Danish (da)
140
+ * German (de)
141
+ * Greek (el)
142
+ * English (en)
143
+ * Spanish (es)
144
+ * Finnish (fi): Due to an error it can also be used referring to the `fn` locale
145
+ * French (fr)
146
+ * Hebrew (he)
147
+ * Hungarian (hu)
148
+ * Indonesian (id)
149
+ * Italian (it)
150
+ * Korean (ko)
151
+ * Dutch (nl)
152
+ * Polish (pl)
153
+ * Portuguese (pt)
154
+ * Romanian (ro)
155
+ * Russian (ru)
156
+ * Swedish (sv)
157
+ * Thai (th)
158
+ * Turkish (tr)
159
+ * Vietnamese (vi)
160
+
161
+ In the changelog you can see the collaborators for each language.
162
+
163
+ Anything else?
164
+ --------------
165
+
166
+ In a future version I would like to include a chaining filter where you include a series of operations and they are executed in linear order, just like the [Pipes and Filters design pattern][wikipedia_pipes_filters].
167
+
168
+ Acknowledgments
169
+ ----------------
170
+
171
+ Thanks to @s2gatev who added the `stopword?` method and the sieve class to this gem
172
+
173
+ Thanks to @bettysteger, @fauno, @vrypan, @woto, @grzegorzblaszczyk, @nerde, @sbeckeriv and @zackxu1 for language support and other features.
174
+
175
+ [wikipedia_stopwords]: http://en.wikipedia.org/wiki/Stopword
176
+ [solr]: https://github.com/sunspot/sunspot
177
+ [sphinx]: https://github.com/freelancing-god/thinking-sphinx
178
+ [google]: https://github.com/alexreisner/google_custom_search
179
+ [postgre]: https://github.com/Casecommons/pg_search
180
+ [wikipedia_snowball]: http://en.wikipedia.org/wiki/Snowball_programming_language
181
+ [wikipedia_pipes_filters]: http://en.wikipedia.org/wiki/Pipes_and_filters
182
+
data/VERSION ADDED
@@ -0,0 +1 @@
1
+ 1.0.0
@@ -0,0 +1,20 @@
# frozen_string_literal: true

module Stopwords
  # Removes a caller-supplied list of stopwords from collections of words.
  #
  # The list is lower-cased once at construction time; lookups then try the
  # word as given and, failing that, its lower-cased form.
  class Filter
    # @return [Array<String>] the lower-cased stopword list
    attr_reader :stopwords

    # @param stopwords [Array<String>] words to treat as stopwords
    def initialize(stopwords)
      @stopwords = stopwords.map { |entry| entry.downcase }
    end

    # Returns the given words with every stopword removed.
    #
    # @param words [Array<String>] words to filter
    # @return [Array<String>] the words that are not stopwords
    def filter(words)
      words.reject do |candidate|
        stopword?(candidate)
      end
    end

    # Tells whether +word+ is in the stopword list (case-insensitively).
    #
    # @param word [String] the word to look up
    # @return [Boolean]
    def stopword?(word)
      # Exact match first, so the lower-cased copy is only built on a miss.
      return true if stopwords.include?(word)

      stopwords.include?(word.downcase)
    end
  end
end
@@ -0,0 +1,22 @@
# frozen_string_literal: true

module Stopwords
  module Snowball
    # A filter for removing stopwords from a text, using a Snowball-based stopword list.
    #
    # The list is read from the comma-separated file named after the locale in
    # the +locales+ directory next to this file; +custom_list+ entries are
    # appended to it.
    class Filter < Stopwords::Filter
      # @return [String] the locale with any "-REGION" suffix removed
      # @return [String] absolute path of the stopword file that was loaded
      attr_reader :locale, :locale_filename

      # @param locale [String, Symbol] language code, optionally with a country
      #   suffix (e.g. "en", :en, "en-US")
      # @param custom_list [Array<String>] extra stopwords to add to the bundled list
      # @raise [ArgumentError] if +locale+ is nil or no stopword file exists for it
      def initialize(locale, custom_list = [])
        raise ArgumentError, 'Locale cannot be nil' if locale.nil?

        # to_s lets Symbol locales through (Symbol has no #gsub).
        @locale = locale.to_s.gsub(/-\w+/, '') # remove country appendix
        # Build the path from the normalised locale so "en-US" resolves to "en".
        @locale_filename = File.join(File.dirname(__FILE__), 'locales', @locale)

        # File.file? (not exist?) so an empty locale cannot match the directory itself.
        raise ArgumentError, "Unknown locale: #{locale.inspect}" unless File.file?(@locale_filename)

        # Read as UTF-8 regardless of the process default encoding, and drop
        # surrounding whitespace / empty entries left by trailing commas or a
        # final newline.
        bundled = File.read(@locale_filename, encoding: 'UTF-8')
                      .split(',')
                      .map(&:strip)
                      .reject(&:empty?)

        super((bundled + custom_list).map(&:downcase))
      end
    end
  end
end
@@ -0,0 +1 @@
1
+ 'n,aan,af,al,as,baie,by,daar,dag,dat,die,dit,een,ek,en,gaan,gesê,haar,het,hom,hulle,hy,in,is,jou,jy,kan,kom,ma,maar,met,my,na,nie,om,ons,op,saam,sal,se,sien,so,sy,te,toe,uit,van,vir,was,wat,ʼn
@@ -0,0 +1 @@
1
+ من,ومن,منها,منه,في,وفي,فيها,فيه,و,ف,ثم,او,أو,ب,بها,به,ا,أ,اى,اي,أي,أى,لا,ولا,الا,ألا,إلا,لكن,ما,وما,كما,فما,عن,مع,اذا,إذا,ان,أن,إن,انها,أنها,إنها,انه,أنه,إنه,بان,بأن,فان,فأن,وان,وأن,وإن,التى,التي,الذى,الذي,الذين,الى,الي,إلى,إلي,على,عليها,عليه,اما,أما,إما,ايضا,أيضا,كل,وكل,لم,ولم,لن,ولن,هى,هي,هو,وهى,وهي,وهو,فهى,فهي,فهو,انت,أنت,لك,لها,له,هذه,هذا,تلك,ذلك,هناك,كانت,كان,يكون,تكون,وكانت,وكان,غير,بعض,قد,نحو,بين,بينما,منذ,ضمن,حيث,الان,الآن,خلال,بعد,قبل,حتى,عند,عندما,لدى,جميع,
@@ -0,0 +1 @@
1
+ а,аз,ако,ала,бе,без,беше,би,бил,била,били,било,близо,бъдат,бъде,бяха,в,вас,ваш,ваша,вероятно,вече,взема,ви,вие,винаги,все,всеки,всички,всичко,всяка,във,въпреки,върху,г,ги,главно,го,д,да,дали,до,докато,докога,дори,досега,доста,е,едва,един,ето,за,зад,заедно,заради,засега,затова,защо,защото,и,из,или,им,има,имат,иска,й,каза,как,каква,какво,както,какъв,като,кога,когато,което,които,кой,който,колко,която,къде,където,към,ли,м,ме,между,мен,ми,мнозина,мога,могат,може,моля,момента,му,н,на,над,назад,най,направи,напред,например,нас,не,него,нея,ни,ние,никой,нито,но,някои,някой,няма,обаче,около,освен,особено,от,отгоре,отново,още,пак,по,повече,повечето,под,поне,поради,после,почти,прави,пред,преди,през,при,пък,първо,с,са,само,се,сега,си,скоро,след,сме,според,сред,срещу,сте,съм,със,също,т,тази,така,такива,такъв,там,твой,те,тези,ти,тн,то,това,тогава,този,той,толкова,точно,трябва,тук,тъй,тя,тях,у,харесва,ч,че,често,чрез,ще,щом,я,
@@ -0,0 +1 @@
1
+ এই,ও,থেকে,করে,এ,না,ওই,এক্,নিয়ে,করা,বলেন,সঙ্গে,যে,এব,তা,আর,কোনো,বলে,সেই,দিন,হয়,কি,দু,পরে,সব,দেওয়া,মধ্যে,এর,সি,শুরু,কাজ,কিছু,কাছে,সে,তবে,বা,বন,আগে,জ্নজন,পি,পর,তো,ছিল,এখন,আমরা,প্রায়,দুই,আমাদের,তাই,অন্য,গিয়ে,প্রযন্ত,মনে,নতুন,মতো,কেখা,প্রথম,আজ,টি,ধামার,অনেক,বিভিন্ন,র,হাজার,জানা,নয়,অবশ্য,বেশি,এস,করে,কে,হতে,বি,কয়েক,সহ,বেশ,এমন,এমনি,কেন,কেউ,নেওয়া,চেষ্টা,লক্ষ,বলা,কারণ,আছে,শুধু,তখন,যা,এসে,চার,ছিল,যদি,আবার,কোটি,উত্তর,সামনে,উপর,বক্তব্য,এত,প্রাথমিক,উপরে,আছে,প্রতি,কাজে,যখন,খুব,বহু,গেল,পেয়্র্,চালু,ই,নাগাদ,থাকা,পাচ,যাওয়া,রকম,সাধারণ,কমনে,
@@ -0,0 +1 @@
1
+ a,abans,ací,ah,així,això,al,als,aleshores,algun,alguna,algunes,alguns,alhora,allà,allí,allò,altra,altre,altres,amb,ambdós,ambdues,apa,aquell,aquella,aquelles,aquells,aquest,aquesta,aquestes,aquests,aquí,baix,cada,cadascú,cadascuna,cadascunes,cadascuns,com,contra,d'un,d'una,d'unes,d'uns,dalt,de,del,dels,des,després,dins,dintre,donat,doncs,durant,e,eh,el,els,em,en,encara,ens,entre,érem,eren,éreu,es,és,esta,està,estàvem,estaven,estàveu,esteu,et,etc,ets,fins,fora,gairebé,ha,han,has,havia,he,hem,heu,hi,ho,i,igual,iguals,ja,l'hi,la,les,li,li'n,llavors,m'he,ma,mal,malgrat,mateix,mateixa,mateixes,mateixos,me,mentre,més,meu,meus,meva,meves,molt,molta,moltes,molts,mon,mons,n'he,n'hi,ne,ni,no,nogensmenys,només,nosaltres,nostra,nostre,nostres,o,oh,oi,on,pas,pel,pels,per,però,perquè,poc,poca,pocs,poques,potser,propi,qual,quals,quan,quant,que,què,quelcom,qui,quin,quina,quines,quins,s'ha,s'han,sa,semblant,semblants,ses,seu,seus,seva,seva,seves,si,sobre,sobretot,sóc,solament,sols,son,són,sons,sota,sou,t'ha,t'han,t'he,ta,tal,també,tampoc,tan,tant,tanta,tantes,teu,teus,teva,teves,ton,tons,tot,tota,totes,tots,un,una,unes,uns,us,va,vaig,vam,van,vas,veu,vosaltres,vostra,vostre,vostres,
@@ -0,0 +1 @@
1
+ و,کە,ی,کرد,ئەوەی,سەر,دوو,هەروەها,لەو,دەکات,چەند,هەر,ئەو,ئەم,من,ئێمە,تۆ,ئێوە,ئەو,ئەوان,بە,پێ,بەبێ,بەدەم,بەلای,بەپێی,بەرلە,بەرەوی,بەرەوە,بەردەم,بێ,بێجگە,بۆ,دە,تێ,دەگەڵ,دوای,جگە,لە,لێ,لەبەر,لەبەینی,لەبابەت,لەبارەی,لەباتی,لەبن,لەبرێتی,لەدەم,لەگەڵ,لەلایەن,لەناو,لەنێو,لەپێناوی,لەرەوی,لەرێ,لەرێگا,لەسەر,لەژێر,ناو,نێوان,پاش,پێش,وەک,
@@ -0,0 +1 @@
1
+ a,s,k,o,i,u,v,z,dnes,cz,tímto,budeš,budem,byli,jseš,můj,svým,ta,tomto,tohle,tuto,tyto,jej,zda,proč,máte,tato,kam,tohoto,kdo,kteří,mi,nám,tom,tomuto,mít,nic,proto,kterou,byla,toho,protože,asi,ho,naši,napište,re,což,tím,takže,svých,její,svými,jste,aj,tu,tedy,teto,bylo,kde,ke,pravé,ji,nad,nejsou,či,pod,téma,mezi,přes,ty,pak,vám,ani,když,však,neg,jsem,tento,článku,články,aby,jsme,před,pta,jejich,byl,ještě,až,bez,také,pouze,první,vaše,která,nás,nový,tipy,pokud,může,strana,jeho,své,jiné,zprávy,nové,není,vás,jen,podle,zde,už,být,více,bude,již,než,který,by,které,co,nebo,ten,tak,má,při,od,po,jsou,jak,další,ale,si,se,ve,to,jako,za,zpět,ze,do,pro,je,na,atd,atp,jakmile,přičemž,já,on,ona,ono,oni,ony,my,vy,jí,ji,mě,mne,jemu,tomu,těm,těmu,němu,němuž,jehož,jíž,jelikož,jež,jakož,načež,
@@ -0,0 +1 @@
1
+ og,i,jeg,det,at,en,den,til,er,som,på,de,med,han,af,for,ikke,der,var,mig,sig,men,et,har,om,vi,min,havde,ham,hun,nu,over,da,fra,du,ud,sin,dem,os,op,man,hans,hvor,eller,hvad,skal,selv,her,alle,vil,blev,kunne,ind,når,være,dog,noget,ville,jo,deres,efter,ned,skulle,denne,end,dette,mit,også,under,have,dig,anden,hende,mine,alt,meget,sit,sine,vor,mod,disse,hvis,din,nogle,hos,blive,mange,ad,bliver,hendes,været,thi,jer,sådan,
@@ -0,0 +1 @@
1
+ aber,alle,allem,allen,aller,alles,als,also,am,an,ander,andere,anderem,anderen,anderer,anderes,anderm,andern,anderr,anders,auch,auf,aus,bei,bin,bis,bist,da,damit,dann,der,den,des,dem,die,das,daß,derselbe,derselben,denselben,desselben,demselben,dieselbe,dieselben,dasselbe,dazu,dein,deine,deinem,deinen,deiner,deines,denn,derer,dessen,dich,dir,du,dies,diese,diesem,diesen,dieser,dieses,doch,dort,durch,ein,eine,einem,einen,einer,eines,einig,einige,einigem,einigen,einiger,einiges,einmal,er,ihn,ihm,es,etwas,euer,eure,eurem,euren,eurer,eures,für,gegen,gewesen,hab,habe,haben,hat,hatte,hatten,hier,hin,hinter,ich,mich,mir,ihr,ihre,ihrem,ihren,ihrer,ihres,euch,im,in,indem,ins,ist,jede,jedem,jeden,jeder,jedes,jene,jenem,jenen,jener,jenes,jetzt,kann,kein,keine,keinem,keinen,keiner,keines,können,könnte,machen,man,manche,manchem,manchen,mancher,manches,mein,meine,meinem,meinen,meiner,meines,mit,muss,musste,nach,nicht,nichts,noch,nun,nur,ob,oder,ohne,sehr,sein,seine,seinem,seinen,seiner,seines,selbst,sich,sie,ihnen,sind,so,solche,solchem,solchen,solcher,solches,soll,sollte,sondern,sonst,über,um,und,uns,unse,unsem,unsen,unser,unses,unter,viel,vom,von,vor,während,war,waren,warst,was,weg,weil,weiter,welche,welchem,welchen,welcher,welches,wenn,werde,werden,wie,wieder,will,wir,wird,wirst,wo,wollen,wollte,würde,würden,zu,zum,zur,zwar,zwischen,
@@ -0,0 +1 @@
1
+ ο,η,το,οι,τα,του,τησ,των,τον,την,και,κι,κ,ειμαι,εισαι,ειναι,ειμαστε,ειστε,στο,στον,στη,στην,μα,αλλα,απο,για,προσ,με,σε,ωσ,παρα,αντι,κατα,μετα,θα,να,δε,δεν,μη,μην,επι,ενω,εαν,αν,τοτε,που,πωσ,ποιοσ,ποια,ποιο,ποιοι,ποιεσ,ποιων,ποιουσ,αυτοσ,αυτη,αυτο,αυτοι,αυτων,αυτουσ,αυτεσ,αυτα,εκεινοσ,εκεινη,εκεινο,εκεινοι,εκεινεσ,εκεινα,εκεινων,εκεινουσ,οπωσ,ομωσ,ισωσ,οσο,οτι,
@@ -0,0 +1 @@
1
+ i,me,my,myself,we,our,ours,ourselves,you,your,yours,yourself,yourselves,he,him,his,himself,she,her,hers,herself,it,its,itself,they,them,their,theirs,themselves,what,which,who,whom,this,that,these,those,am,is,are,was,were,be,been,being,have,has,had,having,do,does,did,doing,would,should,could,ought,i'm,you're,he's,she's,it's,we're,they're,i've,you've,we've,they've,i'd,you'd,he'd,she'd,we'd,they'd,i'll,you'll,he'll,she'll,we'll,they'll,isn't,aren't,wasn't,weren't,hasn't,haven't,hadn't,doesn't,don't,didn't,won't,wouldn't,shan't,shouldn't,can't,cannot,couldn't,mustn't,let's,that's,who's,what's,here's,there's,when's,where's,why's,how's,a,an,the,and,but,if,or,because,as,until,while,of,at,by,for,with,about,against,between,into,through,during,before,after,above,below,to,from,up,down,in,out,on,off,over,under,again,further,then,once,here,there,when,where,why,how,all,any,both,each,few,more,most,other,some,such,no,nor,not,only,own,same,so,than,too,very,
@@ -0,0 +1 @@
1
+ adiaŭ,ajn,al,ankoraŭ,antaŭ,aŭ,bonan,bonvole,bonvolu,bv,ci,cia,cian,cin,d-ro,da,de,dek,deka,do,doktor',doktoro,du,dua,dum,eble,ekz,ekzemple,en,estas,estis,estos,estu,estus,eĉ,f-no,feliĉan,for,fraŭlino,ha,havas,havis,havos,havu,havus,he,ho,hu,ili,ilia,ilian,ilin,inter,io,ion,iu,iujn,iun,ja,jam,je,jes,k,kaj,ke,kio,kion,kiu,kiujn,kiun,kvankam,kvar,kvara,kvazaŭ,kvin,kvina,la,li,lia,lian,lin,malantaŭ,male,malgraŭ,mem,mi,mia,mian,min,minus,naŭ,naŭa,ne,nek,nenio,nenion,neniu,neniun,nepre,ni,nia,nian,nin,nu,nun,nur,ok,oka,oni,onia,onian,onin,plej,pli,plu,plus,por,post,preter,s-no,s-ro,se,sed,sep,sepa,ses,sesa,si,sia,sian,sin,sinjor',sinjorino,sinjoro,sub,super,supren,sur,tamen,tio,tion,tiu,tiujn,tiun,tra,tri,tria,tuj,tute,unu,unua,ve,verŝajne,vi,via,vian,vin,ĉi,ĉio,ĉion,ĉiu,ĉiujn,ĉiun,ĉu,ĝi,ĝia,ĝian,ĝin,ĝis,ĵus,ŝi,ŝia,ŝin
@@ -0,0 +1 @@
1
+ de,la,que,el,en,y,a,los,del,se,las,por,un,para,con,no,una,su,al,lo,como,más,pero,sus,le,ya,o,este,sí,porque,esta,entre,cuando,muy,sin,sobre,también,me,hasta,hay,donde,quien,desde,todo,nos,durante,todos,uno,les,ni,contra,otros,ese,eso,ante,ellos,e,esto,mí,antes,algunos,qué,unos,yo,otro,otras,otra,él,tanto,esa,estos,mucho,quienes,nada,muchos,cual,poco,ella,estar,estas,algunas,algo,nosotros,mi,mis,tú,te,ti,tu,tus,ellas,nosotras,vosotros,vosotras,os,mío,mía,míos,mías,tuyo,tuya,tuyos,tuyas,suyo,suya,suyos,suyas,nuestro,nuestra,nuestros,nuestras,vuestro,vuestra,vuestros,vuestras,esos,esas,estoy,estás,está,estamos,estáis,están,esté,estés,estemos,estéis,estén,estaré,estarás,estará,estaremos,estaréis,estarán,estaría,estarías,estaríamos,estaríais,estarían,estaba,estabas,estábamos,estabais,estaban,estuve,estuviste,estuvo,estuvimos,estuvisteis,estuvieron,estuviera,estuvieras,estuviéramos,estuvierais,estuvieran,estuviese,estuvieses,estuviésemos,estuvieseis,estuviesen,estando,estado,estada,estados,estadas,estad,he,has,ha,hemos,habéis,han,haya,hayas,hayamos,hayáis,hayan,habré,habrás,habrá,habremos,habréis,habrán,habría,habrías,habríamos,habríais,habrían,había,habías,habíamos,habíais,habían,hube,hubiste,hubo,hubimos,hubisteis,hubieron,hubiera,hubieras,hubiéramos,hubierais,hubieran,hubiese,hubieses,hubiésemos,hubieseis,hubiesen,habiendo,habido,habida,habidos,habidas,soy,eres,es,somos,sois,son,sea,seas,seamos,seáis,sean,seré,serás,será,seremos,seréis,serán,sería,serías,seríamos,seríais,serían,era,eras,éramos,erais,eran,fui,fuiste,fue,fuimos,fuisteis,fueron,fuera,fueras,fuéramos,fuerais,fueran,fuese,fueses,fuésemos,fueseis,fuesen,siendo,sido,tengo,tienes,tiene,tenemos,tenéis,tienen,tenga,tengas,tengamos,tengáis,tengan,tendré,tendrás,tendrá,tendremos,tendréis,tendrán,tendría,tendrías,tendríamos,tendríais,tendrían,tenía,tenías,teníamos,teníais,tenían,tuve,tuviste,tuvo,tuvimos,tuvisteis,tuvieron,tuviera,tuvieras,tuviéramos,tuvierais,tuvieran,tuviese,tuvieses,tuviésemos,tuvieseis,tuvies
en,teniendo,tenido,tenida,tenidos,tenidas,tened
@@ -0,0 +1 @@
1
+ aga,ei,et,ja,jah,kas,kui,kõik,ma,me,mida,midagi,mind,minu,mis,mu,mul,mulle,nad,nii,oled,olen,oli,oma,on,pole,sa,seda,see,selle,siin,siis,ta,te,ära
@@ -0,0 +1 @@
1
+ al,anitz,arabera,asko,baina,bat,batean,batek,bati,batzuei,batzuek,batzuetan,batzuk,bera,beraiek,berau,berauek,bere,berori,beroriek,beste,bezala,da,dago,dira,ditu,du,dute,edo,egin,ere,eta,eurak,ez,gainera,gu,gutxi,guzti,haiei,haiek,haietan,hainbeste,hala,han,handik,hango,hara,hari,hark,hartan,hau,hauei,hauek,hauetan,hemen,hemendik,hemengo,hi,hona,honek,honela,honetan,honi,hor,hori,horiei,horiek,horietan,horko,horra,horrek,horrela,horretan,horri,hortik,hura,izan,ni,noiz,nola,non,nondik,nongo,nor,nora,ze,zein,zen,zenbait,zenbat,zer,zergatik,ziren,zituen,zu,zuek,zuen,zuten,
@@ -0,0 +1 @@
1
+ انان,نداشته,سراسر,خياه,ايشان,وي,تاكنون,بيشتري,دوم,پس,ناشي,وگو,يا,داشتند,سپس,هنگام,هرگز,پنج,نشان,امسال,ديگر,گروهي,شدند,چطور,ده,و,دو,نخستين,ولي,چرا,چه,وسط,ه,كدام,قابل,يك,رفت,هفت,همچنين,در,هزار,بله,بلي,شايد,اما,شناسي,گرفته,دهد,داشته,دانست,داشتن,خواهيم,ميليارد,وقتيكه,امد,خواهد,جز,اورده,شده,بلكه,خدمات,شدن,برخي,نبود,بسياري,جلوگيري,حق,كردند,نوعي,بعري,نكرده,نظير,نبايد,بوده,بودن,داد,اورد,هست,جايي,شود,دنبال,داده,بايد,سابق,هيچ,همان,انجا,كمتر,كجاست,گردد,كسي,تر,مردم,تان,دادن,بودند,سري,جدا,ندارند,مگر,يكديگر,دارد,دهند,بنابراين,هنگامي,سمت,جا,انچه,خود,دادند,زياد,دارند,اثر,بدون,بهترين,بيشتر,البته,به,براساس,بيرون,كرد,بعضي,گرفت,توي,اي,ميليون,او,جريان,تول,بر,مانند,برابر,باشيم,مدتي,گويند,اكنون,تا,تنها,جديد,چند,بي,نشده,كردن,كردم,گويد,كرده,كنيم,نمي,نزد,روي,قصد,فقط,بالاي,ديگران,اين,ديروز,توسط,سوم,ايم,دانند,سوي,استفاده,شما,كنار,داريم,ساخته,طور,امده,رفته,نخست,بيست,نزديك,طي,كنيد,از,انها,تمامي,داشت,يكي,طريق,اش,چيست,روب,نمايد,گفت,چندين,چيزي,تواند,ام,ايا,با,ان,ايد,ترين,اينكه,ديگري,راه,هايي,بروز,همچنان,پاعين,كس,حدود,مختلف,مقابل,چيز,گيرد,ندارد,ضد,همچون,سازي,شان,مورد,باره,مرسي,خويش,برخوردار,چون,خارج,شش,هنوز,تحت,ضمن,هستيم,گفته,فكر,بسيار,پيش,براي,روزهاي,انكه,نخواهد,بالا,كل,وقتي,كي,چنين,كه,گيري,نيست,است,كجا,كند,نيز,يابد,بندي,حتي,توانند,عقب,خواست,كنند,بين,تمام,همه,ما,باشند,مثل,شد,اري,باشد,اره,طبق,بعد,اگر,صورت,غير,جاي,بيش,ريزي,اند,زيرا,چگونه,بار,لطفا,مي,درباره,من,ديده,همين,گذاري,برداري,علت,گذاشته,هم,فوق,نه,ها,شوند,اباد,همواره,هر,اول,خواهند,چهار,نام,امروز,مان,هاي,قبل,كنم,سعي,تازه,را,هستند,زير,جلوي,عنوان,بود,
@@ -0,0 +1 @@
1
+ olla,olen,olet,on,olemme,olette,ovat,ole,oli,olisi,olisit,olisin,olisimme,olisitte,olisivat,olit,olin,olimme,olitte,olivat,ollut,olleet,en,et,ei,emme,ette,eivät,minä,minun,minut,minua,minussa,minusta,minuun,minulla,minulta,minulle,sinä,sinun,sinut,sinua,sinussa,sinusta,sinuun,sinulla,sinulta,sinulle,hän,hänen,hänet,häntä,hänessä,hänestä,häneen,hänellä,häneltä,hänelle,me,meidän,meidät,meitä,meissä,meistä,meihin,meillä,meiltä,meille,te,teidän,teidät,teitä,teissä,teistä,teihin,teillä,teiltä,teille,he,heidän,heidät,heitä,heissä,heistä,heihin,heillä,heiltä,heille,tämä,tämän,tätä,tässä,tästä,tähän,tallä,tältä,tälle,tänä,täksi,tuo,tuon,tuotä,tuossa,tuosta,tuohon,tuolla,tuolta,tuolle,tuona,tuoksi,se,sen,sitä,siinä,siitä,siihen,sillä,siltä,sille,sinä,siksi,nämä,näiden,näitä,näissä,näistä,näihin,näillä,näiltä,näille,näinä,näiksi,nuo,noiden,noita,noissa,noista,noihin,noilla,noilta,noille,noina,noiksi,ne,niiden,niitä,niissä,niistä,niihin,niillä,niiltä,niille,niinä,niiksi,kuka,kenen,kenet,ketä,kenessä,kenestä,keneen,kenellä,keneltä,kenelle,kenenä,keneksi,ketkä,keiden,ketkä,keitä,keissä,keistä,keihin,keillä,keiltä,keille,keinä,keiksi,mikä,minkä,minkä,mitä,missä,mistä,mihin,millä,miltä,mille,minä,miksi,mitkä,joka,jonka,jota,jossa,josta,johon,jolla,jolta,jolle,jona,joksi,jotka,joiden,joita,joissa,joista,joihin,joilla,joilta,joille,joina,joiksi,että,ja,jos,koska,kuin,mutta,niin,sekä,sillä,tai,vaan,vai,vaikka,kanssa,mukaan,noin,poikki,yli,kun,niin,nyt,itse,
@@ -0,0 +1 @@
1
+ au,aux,avec,ce,ces,dans,de,des,du,elle,en,et,eux,il,je,la,le,leur,lui,ma,mais,me,même,mes,moi,mon,ne,nos,notre,nous,on,ou,par,pas,pour,qu,que,qui,sa,se,ses,son,sur,ta,te,tes,toi,ton,tu,un,une,vos,votre,vous,c,d,j,l,à,m,n,s,t,y,été,étée,étées,étés,étant,suis,es,est,sommes,êtes,sont,serai,seras,sera,serons,serez,seront,serais,serait,serions,seriez,seraient,étais,était,étions,étiez,étaient,fus,fut,fûmes,fûtes,furent,sois,soit,soyons,soyez,soient,fusse,fusses,fût,fussions,fussiez,fussent,ayant,eu,eue,eues,eus,ai,as,avons,avez,ont,aurai,auras,aura,aurons,aurez,auront,aurais,aurait,aurions,auriez,auraient,avais,avait,avions,aviez,avaient,eut,eûmes,eûtes,eurent,aie,aies,ait,ayons,ayez,aient,eusse,eusses,eût,eussions,eussiez,eussent,ceci,cela,celà,cet,cette,ici,ils,les,leurs,quel,quels,quelle,quelles,sans,soi,
@@ -0,0 +1 @@
1
+ a,ach,ag,agus,an,aon,ar,arna,as,b',ba,beirt,bhúr,caoga,ceathair,ceathrar,chomh,chtó,chuig,chun,cois,céad,cúig,cúigear,d',daichead,dar,de,deich,deichniúr,den,dhá,do,don,dtí,dá,dár,dó,faoi,faoin,faoina,faoinár,fara,fiche,gach,gan,go,gur,haon,hocht,i,iad,idir,in,ina,ins,inár,is,le,leis,lena,lenár,m',mar,mo,mé,na,nach,naoi,naonúr,ná,ní,níor,nó,nócha,ocht,ochtar,os,roimh,sa,seacht,seachtar,seachtó,seasca,seisear,siad,sibh,sinn,sna,sé,sí,tar,thar,thú,triúr,trí,trína,trínár,tríocha,tú,um,ár,é,éis,í,ó,ón,óna,ónár,
@@ -0,0 +1 @@
1
+ a,aínda,alí,aquel,aquela,aquelas,aqueles,aquilo,aquí,ao,aos,as,así,á,ben,cando,che,co,coa,comigo,con,connosco,contigo,convosco,coas,cos,cun,cuns,cunha,cunhas,da,dalgunha,dalgunhas,dalgún,dalgúns,das,de,del,dela,delas,deles,desde,deste,do,dos,dun,duns,dunha,dunhas,e,el,ela,elas,eles,en,era,eran,esa,esas,ese,eses,esta,estar,estaba,está,están,este,estes,estiven,estou,eu,é,facer,foi,foron,fun,había,hai,iso,isto,la,las,lle,lles,lo,los,mais,me,meu,meus,min,miña,miñas,moi,na,nas,neste,nin,no,non,nos,nosa,nosas,noso,nosos,nós,nun,nunha,nuns,nunhas,o,os,ou,ó,ós,para,pero,pode,pois,pola,polas,polo,polos,por,que,se,senón,ser,seu,seus,sexa,sido,sobre,súa,súas,tamén,tan,te,ten,teñen,teño,ter,teu,teus,ti,tido,tiña,tiven,túa,túas,un,unha,unhas,uns,vos,vosa,vosas,voso,vosos,vós,
@@ -0,0 +1 @@
1
+ אבל,או,אולי,אותה,אותו,אותי,אותך,אותם,אותן,אותנו,אז,אחר,אחרות,אחרי,אחריכן,אחרים,אחרת,אי,איזה,איך,אין,איפה,איתה,איתו,איתי,איתך,איתכם,איתכן,איתם,איתן,איתנו,אך,אל,אלה,אלו,אם,אנחנו,אני,אף,אצל,אשר,את,אתה,אתכם,אתכן,אתם,אתן,באמצע,באמצעות,בגלל,בין,בלי,במידה,ברם,בשביל,בתוך,גם,דרך,הוא,היא,היה,היכן,היתה,היתי,הם,הן,הנה,הרי,ואילו,ואת,זאת,זה,זות,יהיה,יוכל,יוכלו,יותר,יכול,יכולה,יכולות,יכולים,יכל,יכלה,יכלו,יש,כאן,כאשר,כולם,כולן,כזה,כי,כיצד,כך,ככה,כל,כלל,כמו,כן,כפי,לא,לאו,לאן,לבין,לה,להיות,להם,להן,לו,לי,לכם,לכן,למה,למטה,למעלה,למרות,לנו,לעבר,לעיכן,לפיכך,לפני,מאד,מאחורי,מאין,מאיפה,מבלי,מבעד,מדוע,מה,מהיכן,מול,מחוץ,מי,מכאן,מכיוון,מלבד,מן,מנין,מסוגל,מעט,מעטים,מעל,מצד,מתחת,מתי,נגד,נגר,נו,עד,עז,על,עלי,עליה,עליהם,עליהן,עליו,עליך,עליכם,עלינו,עם,עצמה,עצמהם,עצמהן,עצמו,עצמי,עצמם,עצמן,עצמנו,פה,רק,שוב,של,שלה,שלהם,שלהן,שלו,שלי,שלך,שלכה,שלכם,שלכן,שלנו,שם,תהיה,תחת,לאחר,זו,תוך,
@@ -0,0 +1 @@
1
+ अंदर,अत,अपना,अपनी,अपने,अभी,आदि,आप,इत्यादि,इन,इनका,इन्हीं,इन्हें,इन्हों,इस,इसका,इसकी,इसके,इसमें,इसी,इसे,उन,उनका,उनकी,उनके,उनको,उन्हीं,उन्हें,उन्हों,उस,उसके,उसी,उसे,एक,एवं,एस,ऐसे,और,कई,कर,करता,करते,करना,करने,करें,कहते,कहा,का,काफ़ी,कि,कितना,किन्हें,किन्हों,किया,किर,किस,किसी,किसे,की,कुछ,कुल,के,को,कोई,कौन,कौनसा,गया,घर,जब,जहाँ,जा,जितना,जिन,जिन्हें,जिन्हों,जिस,जिसे,जीधर,जैसा,जैसे,जो,तक,तब,तरह,तिन,तिन्हें,तिन्हों,तिस,तिसे,तो,था,थी,थे,दबारा,दिया,दुसरा,दूसरे,दो,द्वारा,न,नहीं,ना,निहायत,नीचे,ने,पर,पर,पहले,पूरा,पे,फिर,बनी,बही,बहुत,बाद,बाला,बिलकुल,भी,भीतर,मगर,मानो,मे,में,यदि,यह,यहाँ,यही,या,यिह,ये,रखें,रहा,रहे,ऱ्वासा,लिए,लिये,लेकिन,व,वर्ग,वह,वह,वहाँ,वहीं,वाले,वुह,वे,वग़ैरह,संग,सकता,सकते,सबसे,सभी,साथ,साबुत,साभ,सारा,से,सो,ही,हुआ,हुई,हुए,है,हैं,हो,होता,होती,होते,होना,होने,अपनि,जेसे,होति,सभि,तिंहों,इंहों,दवारा,इसि,किंहें,थि,उंहों,ओर,जिंहें,वहिं,अभि,बनि,हि,उंहिं,उंहें,हें,वगेरह,एसे,रवासा,कोन,निचे,काफि,उसि,पुरा,भितर,हे,बहि,वहां,कोइ,यहां,जिंहों,तिंहें,किसि,कइ,यहि,इंहिं,जिधर,इंहें,अदि,इतयादि,हुइ,कोनसा,इसकि,दुसरे,जहां,अप,किंहों,उनकि,भि,वरग,हुअ,जेसा,नहिं,
@@ -0,0 +1 @@
1
+ a,ako,ali,bi,bih,bila,bili,bilo,bio,bismo,biste,biti,bumo,da,do,duž,ga,hoće,hoćemo,hoćete,hoćeš,hoću,i,iako,ih,ili,iz,ja,je,jedna,jedne,jedno,jer,jesam,jesi,jesmo,jest,jeste,jesu,jim,joj,još,ju,kada,kako,kao,koja,koje,koji,kojima,koju,kroz,li,me,mene,meni,mi,mimo,moj,moja,moje,mu,na,nad,nakon,nam,nama,nas,naš,naša,naše,našeg,ne,nego,neka,neki,nekog,neku,nema,netko,neće,nećemo,nećete,nećeš,neću,nešto,ni,nije,nikoga,nikoje,nikoju,nisam,nisi,nismo,niste,nisu,njega,njegov,njegova,njegovo,njemu,njezin,njezina,njezino,njih,njihov,njihova,njihovo,njim,njima,njoj,nju,no,o,od,odmah,on,ona,oni,ono,ova,pa,pak,po,pod,pored,prije,s,sa,sam,samo,se,sebe,sebi,si,smo,ste,su,sve,svi,svog,svoj,svoja,svoje,svom,ta,tada,taj,tako,te,tebe,tebi,ti,to,toj,tome,tu,tvoj,tvoja,tvoje,u,uz,vam,vama,vas,vaš,vaša,vaše,već,vi,vrlo,za,zar,će,ćemo,ćete,ćeš,ću,što
@@ -0,0 +1 @@
1
+ a,ahogy,ahol,aki,akik,akkor,alatt,által,általában,amely,amelyek,amelyekben,amelyeket,amelyet,amelynek,ami,amit,amolyan,amíg,amikor,át,abban,ahhoz,annak,arra,arról,az,azok,azon,azt,azzal,azért,aztán,azután,azonban,bár,be,belül,benne,cikk,cikkek,cikkeket,csak,de,e,eddig,egész,egy,egyes,egyetlen,egyéb,egyik,egyre,ekkor,el,elég,ellen,elő,először,előtt,első,én,éppen,ebben,ehhez,emilyen,ennek,erre,ez,ezt,ezek,ezen,ezzel,ezért,és,fel,felé,hanem,hiszen,hogy,hogyan,igen,így,illetve,ill.,ill,ilyen,ilyenkor,ison,ismét,itt,jó,jól,jobban,kell,kellett,keresztül,keressünk,ki,kívül,között,közül,legalább,lehet,lehetett,legyen,lenne,lenni,lesz,lett,maga,magát,majd,majd,már,más,másik,meg,még,mellett,mert,mely,melyek,mi,mit,míg,miért,milyen,mikor,minden,mindent,mindenki,mindig,mint,mintha,mivel,most,nagy,nagyobb,nagyon,ne,néha,nekem,neki,nem,néhány,nélkül,nincs,olyan,ott,össze,ő,ők,őket,pedig,persze,rá,s,saját,sem,semmi,sok,sokat,sokkal,számára,szemben,szerint,szinte,talán,tehát,teljes,tovább,továbbá,több,úgy,ugyanis,új,újabb,újra,után,utána,utolsó,vagy,vagyis,valaki,valami,valamint,való,vagyok,van,vannak,volt,voltam,voltak,voltunk,vissza,vele,viszont,volna,
@@ -0,0 +1 @@
1
+ այդ,այլ,այն,այս,դու,դուք,եմ,են,ենք,ես,եք,է,էի,էին,էինք,էիր,էիք,էր,ըստ,թ,ի,ին,իսկ,իր,կամ,համար,հետ,հետո,մենք,մեջ,մի,ն,նա,նաև,նրա,նրանք,որ,որը,որոնք,որպես,ու,ում,պիտի,վրա,և,
@@ -0,0 +1 @@
1
+ ada,adanya,adalah,adapun,agak,agaknya,agar,akan,akankah,akhirnya,aku,akulah,amat,amatlah,anda,andalah,antar,diantaranya,antara,antaranya,diantara,apa,apaan,mengapa,apabila,apakah,apalagi,apatah,atau,ataukah,ataupun,bagai,bagaikan,sebagai,sebagainya,bagaimana,bagaimanapun,sebagaimana,bagaimanakah,bagi,bahkan,bahwa,bahwasanya,sebaliknya,banyak,sebanyak,beberapa,seberapa,begini,beginian,beginikah,beginilah,sebegini,begitu,begitukah,begitulah,begitupun,sebegitu,belum,belumlah,sebelum,sebelumnya,sebenarnya,berapa,berapakah,berapalah,berapapun,betulkah,sebetulnya,biasa,biasanya,bila,bilakah,bisa,bisakah,sebisanya,boleh,bolehkah,bolehlah,buat,bukan,bukankah,bukanlah,bukannya,cuma,percuma,dahulu,dalam,dan,dapat,dari,daripada,dekat,demi,demikian,demikianlah,sedemikian,dengan,depan,di,dia,dialah,dini,diri,dirinya,terdiri,dong,dulu,enggak,enggaknya,entah,entahlah,terhadap,terhadapnya,hal,hampir,hanya,hanyalah,harus,haruslah,harusnya,seharusnya,hendak,hendaklah,hendaknya,hingga,sehingga,ia,ialah,ibarat,ingin,inginkah,inginkan,ini,inikah,inilah,itu,itukah,itulah,jangan,jangankan,janganlah,jika,jikalau,juga,justru,kala,kalau,kalaulah,kalaupun,kalian,kami,kamilah,kamu,kamulah,kan,kapan,kapankah,kapanpun,dikarenakan,karena,karenanya,ke,kecil,kemudian,kenapa,kepada,kepadanya,ketika,seketika,khususnya,kini,kinilah,kiranya,sekiranya,kita,kitalah,kok,lagi,lagian,selagi,lah,lain,lainnya,melainkan,selaku,lalu,melalui,terlalu,lama,lamanya,selama,selama,selamanya,lebih,terlebih,bermacam,macam,semacam,maka,makanya,makin,malah,malahan,mampu,mampukah,mana,manakala,manalagi,masih,masihkah,semasih,masing,mau,maupun,semaunya,memang,mereka,merekalah,meski,meskipun,semula,mungkin,mungkinkah,nah,namun,nanti,nantinya,nyaris,oleh,olehnya,seorang,seseorang,pada,padanya,padahal,paling,sepanjang,pantas,sepantasnya,sepantasnyalah,para,pasti,pastilah,per,pernah,pula,pun,merupakan,rupanya,serupa,saat,saatnya,sesaat,saja,sajalah,saling,bersama,sama,sesama,sambil,sampai,sana,sangat,sangatlah,saya,sayalah,s
e,sebab,sebabnya,sebuah,tersebut,tersebutlah,sedang,sedangkan,sedikit,sedikitnya,segala,segalanya,segera,sesegera,sejak,sejenak,sekali,sekalian,sekalipun,sesekali,sekaligus,sekarang,sekarang,sekitar,sekitarnya,sela,selain,selalu,seluruh,seluruhnya,semakin,sementara,sempat,semua,semuanya,sendiri,sendirinya,seolah,seperti,sepertinya,sering,seringnya,serta,siapa,siapakah,siapapun,disini,disinilah,sini,sinilah,sesuatu,sesuatunya,suatu,sesudah,sesudahnya,sudah,sudahkah,sudahlah,supaya,tadi,tadinya,tak,tanpa,setelah,telah,tentang,tentu,tentulah,tentunya,tertentu,seterusnya,tapi,tetapi,setiap,tiap,setidaknya,tidak,tidakkah,tidaklah,toh,waduh,wah,wahai,sewaktu,walau,walaupun,wong,yaitu,yakni,yang,
@@ -0,0 +1 @@
1
+ ad,al,allo,ai,agli,all,agl,alla,alle,con,col,coi,da,dal,dallo,dai,dagli,dall,dagl,dalla,dalle,di,del,dello,dei,degli,dell,degl,della,delle,in,nel,nello,nei,negli,nell,negl,nella,nelle,su,sul,sullo,sui,sugli,sull,sugl,sulla,sulle,per,tra,contro,io,tu,lui,lei,noi,voi,loro,mio,mia,miei,mie,tuo,tua,tuoi,tue,suo,sua,suoi,sue,nostro,nostra,nostri,nostre,vostro,vostra,vostri,vostre,mi,ti,ci,vi,lo,la,li,le,gli,ne,il,un,uno,una,ma,ed,se,perché,anche,come,dov,dove,che,chi,cui,non,più,quale,quanto,quanti,quanta,quante,quello,quelli,quella,quelle,questo,questi,questa,queste,si,tutto,tutti,a,c,e,i,l,o,ho,hai,ha,abbiamo,avete,hanno,abbia,abbiate,abbiano,avrò,avrai,avrà,avremo,avrete,avranno,avrei,avresti,avrebbe,avremmo,avreste,avrebbero,avevo,avevi,aveva,avevamo,avevate,avevano,ebbi,avesti,ebbe,avemmo,aveste,ebbero,avessi,avesse,avessimo,avessero,avendo,avuto,avuta,avuti,avute,sono,sei,è,siamo,siete,sia,siate,siano,sarò,sarai,sarà,saremo,sarete,saranno,sarei,saresti,sarebbe,saremmo,sareste,sarebbero,ero,eri,era,eravamo,eravate,erano,fui,fosti,fu,fummo,foste,furono,fossi,fosse,fossimo,fossero,essendo,faccio,fai,facciamo,fanno,faccia,facciate,facciano,farò,farai,farà,faremo,farete,faranno,farei,faresti,farebbe,faremmo,fareste,farebbero,facevo,facevi,faceva,facevamo,facevate,facevano,feci,facesti,fece,facemmo,faceste,fecero,facessi,facesse,facessimo,facessero,facendo,sto,stai,sta,stiamo,stanno,stia,stiate,stiano,starò,starai,starà,staremo,starete,staranno,starei,staresti,starebbe,staremmo,stareste,starebbero,stavo,stavi,stava,stavamo,stavate,stavano,stetti,stesti,stette,stemmo,steste,stettero,stessi,stesse,stessimo,stessero,stando,
@@ -0,0 +1 @@
1
+ あっ,あり,ある,い,いう,いる,う,うち,お,および,おり,か,かつて,から,が,き,ここ,こと,この,これ,これら,さ,さらに,し,しかし,する,ず,せ,せる,そして,その,その他,その後,それ,それぞれ,た,ただし,たち,ため,たり,だ,だっ,つ,て,で,でき,できる,です,では,でも,と,という,といった,とき,ところ,として,とともに,とも,と共に,な,ない,なお,なかっ,ながら,なく,なっ,など,なら,なり,なる,に,において,における,について,にて,によって,により,による,に対して,に対する,に関する,の,ので,のみ,は,ば,へ,ほか,ほとんど,ほど,ます,また,または,まで,も,もの,ものの,や,よう,より,ら,られ,られる,れ,れる,を,ん,及び,特に
@@ -0,0 +1 @@
1
+ !,",$,%,&,',(,),*,+,,,-,.,...,0,1,2,3,4,5,6,7,8,9,;,<,=,>,?,@,\,^,_,`,~,·,—,——,‘,’,“,”,…,、,。,〈,〉,《,》,가,가까스로,가령,각,각각,각자,각종,갖고말하자면,같다,같이,개의치않고,거니와,거바,거의,것,것과,같이,것들,게다가,게우다,겨우,견지에서,결과에,이르다,결국,결론을,낼,수,있다,겸사겸사,고려하면,고로,곧,공동으로,과,과연,관계가,있다,관계없이,관련이,있다,관하여,관한,관해서는,구,구체적으로,구토하다,그,그들,그때,그래,그래도,그래서,그러나,그러니,그러니까,그러면,그러므로,그러한즉,그런,까닭에,그런데,그런즉,그럼,그럼에도,불구하고,그렇게,함으로써,그렇지,그렇지,않다면,그렇지,않으면,그렇지만,그렇지않으면,그리고,그리하여,그만이다,그에,따르는,그위에,그저,그중에서,그치지,않다,근거로,근거하여,기대여,기점으로,기준으로,기타,까닭으로,까악,까지,까지,미치다,까지도,꽈당,끙끙,끼익,나,나머지는,남들,남짓,너,너희,너희들,네,넷,년,논하지,않다,놀라다,누가,알겠는가,누구,다른,다른,방면으로,다만,다섯,다소,다수,다시,말하자면,다시말하면,다음,다음에,다음으로,단지,답다,당신,당장,대로,하다,대하면,대하여,대해,말하자면,대해서,댕그,더구나,더군다나,더라도,더불어,더욱더,더욱이는,도달하다,도착하다,동시에,동안,된바에야,된이상,두번째로,둘,둥둥,뒤따라,뒤이어,든간에,들,등,등등,딩동,따라,따라서,따위,따지지,않다,딱,때,때가,되어,때문에,또,또한,뚝뚝,라,해도,령,로,로,인하여,로부터,로써,륙,를,마음대로,마저,마저도,마치,막론하고,만,못하다,만약,만약에,만은,아니다,만이,아니다,만일,만큼,말하자면,말할것도,없고,매,매번,메쓰겁다,몇,모,모두,무렵,무릎쓰고,무슨,무엇,무엇때문에,물론,및,바꾸어말하면,바꾸어말하자면,바꾸어서,말하면,바꾸어서,한다면,바꿔,말하면,바로,바와같이,밖에,안된다,반대로,반대로,말하자면,반드시,버금,보는데서,보다더,보드득,본대로,봐,봐라,부류의,사람들,부터,불구하고,불문하고,붕붕,비걱거리다,비교적,비길수,없다,비로소,비록,비슷하다,비추어,보아,비하면,뿐만,아니라,뿐만아니라,뿐이다,삐걱,삐걱거리다,사,삼,상대적으로,말하자면,생각한대로,설령,설마,설사,셋,소생,소인,솨,쉿,습니까,습니다,시각,시간,시작하여,시초에,시키다,실로,심지어,아,아니,아니나다를가,아니라면,아니면,아니었다면,아래윗,아무거나,아무도,아야,아울러,아이,아이고,아이구,아이야,아이쿠,아하,아홉,안,그러면,않기,위하여,않기,위해서,알,수,있다,알았어,앗,앞에서,앞의것,야,약간,양자,어,어기여차,어느,어느,년도,어느것,어느곳,어느때,어느쪽,어느해,어디,어때,어떠한,어떤,어떤것,어떤것들,어떻게,어떻해,어이,어째서,어쨋든,어쩔수,없다,어찌,어찌됏든,어찌됏어,어찌하든지,어찌하여,언제,언젠가,얼마,얼마,안,되는,것,얼마간,얼마나,얼마든지,얼마만큼,얼마큼,엉엉,에,에,가서,에,달려,있다,에,대해,에,있다,에,한하다,에게,에서,여,여기,여덟,여러분,여보시오,여부,여섯,여전히,여차,연관되다,연이서,영,영차,옆사람,예,예를,들면,예를,들자면,예컨대,예하면,오,오로지,오르다,오자마자,오직,오호,오히려,와,와,같은,사람들,와르르,와아,왜,왜냐하면,외에도,요만큼,요만한,것,요만한걸,요컨대,우르르,우리,우리들,우선,우에,종합한것과같이,운운,월,위에서,서술한바와같이,위하여,위해서,윙윙,육,으로,으로,인하여,으로서,으로써,을,응,응당,의,의거하여,의지하여,의해,의해되다,의해서,이,이,되다,이,때문에,이,밖에,이,외에,이,정도의,이것,이곳,이때,이라면,이래,이러이러하다,이러한,이런,이럴정도로,이렇게,많은,것,이렇게되면,이렇게말하자면,이렇구나,이로,인하여,이르기까지,이리하여,이만큼,이번,이봐,이상,이어서,이었다,이와,같다,이와,같은,이와,반대로,이와같다면,이외에도,이용하여,이유만으로,이젠,이지만,이쪽,이천구,이천육,이천칠,이천팔,인,듯하다,인젠,일,일것이다,일곱,일단,일때,일반적으로,일지라도,임에,틀림없다,입각하여,입장에서,잇따라,있다,자,자기,자기집,자마자,자신,잠깐,잠시,저,저것,저것만큼,저기,저쪽,
저희,전부,전자,전후,점에서,보아,정도에,이르다,제,제각기,제외하고,조금,조차,조차도,졸졸,좀,좋아,좍좍,주룩주룩,주저하지,않고,줄은,몰랏다,줄은모른다,중에서,중의하나,즈음하여,즉,즉시,지든지,지만,지말고,진짜로,쪽으로,차라리,참,참나,첫번째로,쳇,총적으로,총적으로,말하면,총적으로,보면,칠,콸콸,쾅쾅,쿵,타다,타인,탕탕,토하다,통하여,툭,퉤,틈타,팍,팔,퍽,펄렁,하,하게될것이다,하게하다,하겠는가,하고,있다,하고있었다,하곤하였다,하구나,하기,때문에,하기,위하여,하기는한데,하기만,하면,하기보다는,하기에,하나,하느니,하는,김에,하는,편이,낫다,하는것도,하는것만,못하다,하는것이,낫다,하는바,하더라도,하도다,하도록시키다,하도록하다,하든지,하려고하다,하마터면,하면,할수록,하면된다,하면서,하물며,하여금,하여야,하자마자,하지,않는다면,하지,않도록,하지마,하지마라,하지만,하하,한,까닭에,한,이유는,한,후,한다면,한다면,몰라도,한데,한마디,한적이있다,한켠으로는,한항목,할,따름이다,할,생각이다,할,줄,안다,할,지경이다,할,힘이,있다,할때,할만하다,할망정,할뿐,할수있다,할수있어,할줄알다,할지라도,할지언정,함께,해도된다,해도좋다,해봐요,해서는,안된다,해야한다,해요,했어요,향하다,향하여,향해서,허,허걱,허허,헉,헉헉,헐떡헐떡,형식으로,쓰여,혹시,혹은,혼자,훨씬,휘익,휴,흐흐,흥,힘입어,︿,!,#,$,%,&,(,),*,+,,,0,1,2,3,4,5,6,7,8,9,:,;,<,>,?,@,[,],{,|,},~,¥
@@ -0,0 +1 @@
1
+ a,ab,ac,ad,at,atque,aut,autem,cum,de,dum,e,erant,erat,est,et,etiam,ex,haec,hic,hoc,in,ita,me,nec,neque,non,per,qua,quae,quam,qui,quibus,quidem,quo,quod,re,rebus,rem,res,sed,si,sic,sunt,tamen,tandem,te,ut,vel
@@ -0,0 +1 @@
1
+ ant,apie,ar,arba,aš,be,bei,bet,bus,būti,būtų,buvo,dėl,gali,į,iki,ir,iš,ja,ją,jai,jais,jam,jame,jas,jei,ji,jį,jie,jiedu,jiedvi,jiedviem,jiedviese,jiems,jis,jo,jodviem,jog,joje,jomis,joms,jos,jose,jų,judu,judvi,judviejų,jųdviejų,judviem,judviese,jumis,jums,jumyse,juo,juodu,juodviese,juos,juose,jus,jūs,jūsų,ką,kad,kai,kaip,kas,kiek,kol,kur,kurie,kuris,man,mane,manęs,manimi,mano,manyje,mes,metu,mudu,mudvi,mudviejų,mudviem,mudviese,mumis,mums,mumyse,mus,mūsų,nei,nes,net,nors,nuo,o,pat,per,po,prie,prieš,sau,save,savęs,savimi,savo,savyje,su,tačiau,tada,tai,taip,tas,tau,tave,tavęs,tavimi,tavyje,ten,to,todėl,tu,tuo,už,visi,yra,
@@ -0,0 +1 @@
1
+ aiz,ap,ar,apakš,ārpus,augšpus,bez,caur,dēļ,gar,iekš,iz,kopš,labad,lejpus,līdz,no,otrpus,pa,par,pār,pēc,pie,pirms,pret,priekš,starp,šaipus,uz,viņpus,virs,virspus,zem,apakšpus,un,bet,jo,ja,ka,lai,tomēr,tikko,turpretī,arī,kaut,gan,tādēļ,tā,ne,tikvien,vien,kā,ir,te,vai,kamēr,ar,diezin,droši,diemžēl,nebūt,ik,it,taču,nu,pat,tiklab,iekšpus,nedz,tik,nevis,turpretim,jeb,iekam,iekām,iekāms,kolīdz,līdzko,tiklīdz,jebšu,tālab,tāpēc,nekā,itin,jā,jau,jel,nē,nezin,tad,tikai,vis,tak,iekams,vien,būt,biju,biji,bija,bijām,bijāt,esmu,esi,esam,esat,būšu,būsi,būs,būsim,būsiet,tikt,tiku,tiki,tika,tikām,tikāt,tieku,tiec,tiek,tiekam,tiekat,tikšu,tiks,tiksim,tiksiet,tapt,tapi,tapāt,topat,tapšu,tapsi,taps,tapsim,tapsiet,kļūt,kļuvu,kļuvi,kļuva,kļuvām,kļuvāt,kļūstu,kļūsti,kļūst,kļūstam,kļūstat,kļūšu,kļūsi,kļūs,kļūsim,kļūsiet,varēt,varēju,varējām,varēšu,varēsim,var,varēji,varējāt,varēsi,varēsiet,varat,varēja,varēs,
@@ -0,0 +1 @@
1
+ अधिक,अनेक,अशी,असलयाचे,असलेल्या,असा,असून,असे,आज,आणि,आता,आपल्या,आला,आली,आले,आहे,आहेत,एक,एका,कमी,करणयात,करून,का,काम,काय,काही,किवा,की,केला,केली,केले,कोटी,गेल्या,घेऊन,जात,झाला,झाली,झाले,झालेल्या,टा,डॉ,तर,तरी,तसेच,ता,ती,तीन,ते,तो,त्या,त्याचा,त्याची,त्याच्या,त्याना,त्यानी,त्यामुळे,त्री,दिली,दोन,न,नाही,निर्ण्य,पण,पम,परयतन,पाटील,म,मात्र,माहिती,मी,मुबी,म्हणजे,म्हणाले,म्हणून,या,याचा,याची,याच्या,याना,यानी,येणार,येत,येथील,येथे,लाख,व,व्यकत,सर्व,सागित्ले,सुरू,हजार,हा,ही,हे,होणार,होत,होता,होती,होते
@@ -0,0 +1 @@
1
+ de,en,van,ik,te,dat,die,in,een,hij,het,niet,zijn,is,was,op,aan,met,als,voor,had,er,maar,om,hem,dan,zou,of,wat,mijn,men,dit,zo,door,over,ze,zich,bij,ook,tot,je,mij,uit,der,daar,haar,naar,heb,hoe,heeft,hebben,deze,u,want,nog,zal,me,zij,nu,ge,geen,omdat,iets,worden,toch,al,waren,veel,meer,doen,toen,moet,ben,zonder,kan,hun,dus,alles,onder,ja,eens,hier,wie,werd,altijd,doch,wordt,wezen,kunnen,ons,zelf,tegen,na,reeds,wil,kon,niets,uw,iemand,geweest,andere,
@@ -0,0 +1 @@
1
+ og,i,jeg,det,at,en,et,den,til,er,som,på,de,med,han,av,ikke,ikkje,der,så,var,meg,seg,men,ett,har,om,vi,min,mitt,ha,hadde,hun,nå,over,da,ved,fra,du,ut,sin,dem,oss,opp,man,kan,hans,hvor,eller,hva,skal,selv,sjøl,her,alle,vil,bli,ble,blei,blitt,kunne,inn,når,være,kom,noen,noe,ville,dere,som,deres,kun,ja,etter,ned,skulle,denne,for,deg,si,sine,sitt,mot,å,meget,hvorfor,dette,disse,uten,hvordan,ingen,din,ditt,blir,samme,hvilken,hvilke,sånn,inni,mellom,vår,hver,hvem,vors,hvis,både,bare,enn,fordi,før,mange,også,slik,vært,være,båe,begge,siden,dykk,dykkar,dei,deira,deires,deim,di,då,eg,ein,eit,eitt,elles,honom,hjå,ho,hoe,henne,hennar,hennes,hoss,hossen,ikkje,ingi,inkje,korleis,korso,kva,kvar,kvarhelst,kven,kvi,kvifor,me,medan,mi,mine,mykje,no,nokon,noka,nokor,noko,nokre,si,sia,sidan,so,somt,somme,um,upp,vere,vore,verte,vort,varte,vart,
@@ -0,0 +1 @@
1
+ aby,ach,aj,albo,ale,ani,aż,bardzo,bez,bo,bowiem,by,byli,bym,być,był,była,było,były,będzie,będą,chce,choć,ci,ciebie,cię,co,coraz,coś,czy,czyli,często,daleko,dla,dlaczego,dlatego,do,dobrze,dokąd,dość,dr,dużo,dwa,dwaj,dwie,dwoje,dzisiaj,dziś,gdy,gdyby,gdyż,gdzie,go,godz,hab,i,ich,ii,iii,ile,im,inne,inny,inż,iv,ix,iż,ja,jak,jakby,jaki,jakie,jako,je,jeden,jedna,jednak,jedno,jednym,jedynie,jego,jej,jemu,jest,jestem,jeszcze,jeśli,jeżeli,już,ją,każdy,kiedy,kierunku,kilku,kto,która,które,którego,której,który,których,którym,którzy,ku,lat,lecz,lub,ma,mają,mam,mamy,mgr,mi,miał,mimo,mnie,mną,mogą,moi,moja,moje,może,można,mu,musi,my,mój,na,nad,nam,nami,nas,nasi,nasz,nasza,nasze,natychmiast,nawet,nic,nich,nie,niego,niej,niemu,nigdy,nim,nimi,nią,niż,no,nowe,np,nr,o,o.o.,obok,od,ok,około,on,ona,one,oni,ono,oraz,owszem,pan,pl,po,pod,ponad,ponieważ,poza,prof,przed,przede,przedtem,przez,przy,raz,razie,roku,również,sam,sama,się,skąd,sobie,sposób,swoje,są,ta,tak,taki,takich,takie,także,tam,te,tego,tej,tel,temu,ten,teraz,też,to,tobie,tobą,trzeba,tu,tutaj,twoi,twoja,twoje,twój,ty,tych,tylko,tym,tys,tzw,tę,u,ul,vi,vii,viii,vol,w,wam,wami,was,wasi,wasz,wasza,wasze,we,wie,więc,wszystko,wtedy,www,wy,właśnie,wśród,xi,xii,xiii,xiv,xv,z,za,zawsze,zaś,ze,zł,żaden,że,żeby
@@ -0,0 +1 @@
1
+ de,a,o,que,e,do,da,em,um,para,com,não,uma,os,no,se,na,por,mais,as,dos,como,mas,ao,ele,das,à,seu,sua,ou,quando,muito,nos,já,eu,também,só,pelo,pela,até,isso,ela,entre,depois,sem,mesmo,aos,seus,quem,nas,me,esse,eles,você,essa,num,nem,suas,meu,às,minha,numa,pelos,elas,qual,nós,lhe,deles,essas,esses,pelas,este,dele,tu,te,vocês,vos,lhes,meus,minhas,teu,tua,teus,tuas,nosso,nossa,nossos,nossas,dela,delas,esta,estes,estas,aquele,aquela,aqueles,aquelas,isto,aquilo,estou,está,estamos,estão,estive,esteve,estivemos,estiveram,estava,estávamos,estavam,estivera,estivéramos,esteja,estejamos,estejam,estivesse,estivéssemos,estivessem,estiver,estivermos,estiverem,hei,há,havemos,hão,houve,houvemos,houveram,houvera,houvéramos,haja,hajamos,hajam,houvesse,houvéssemos,houvessem,houver,houvermos,houverem,houverei,houverá,houveremos,houverão,houveria,houveríamos,houveriam,sou,somos,são,era,éramos,eram,fui,foi,fomos,foram,fora,fôramos,seja,sejamos,sejam,fosse,fôssemos,fossem,for,formos,forem,serei,será,seremos,serão,seria,seríamos,seriam,tenho,tem,temos,tém,tinha,tínhamos,tinham,tive,teve,tivemos,tiveram,tivera,tivéramos,tenha,tenhamos,tenham,tivesse,tivéssemos,tivessem,tiver,tivermos,tiverem,terei,terá,teremos,terão,teria,teríamos,teriam,
@@ -0,0 +1 @@
1
+ acea,aceasta,această,aceea,acei,aceia,acel,acela,acele,acelea,acest,acesta,aceste,acestea,aceşti,aceştia,acolo,acum,ai,aia,aibă,aici,al,ăla,ale,alea,ălea,altceva,altcineva,am,ar,are,aş,aşadar,asemenea,asta,ăsta,astăzi,astea,ăstea,ăştia,asupra,aţi,au,avea,avem,aveţi,azi,bine,bucur,bună,ca,că,căci,când,care,cărei,căror,cărui,cât,câte,câţi,către,câtva,ce,cel,ceva,chiar,cînd,cine,cineva,cît,cîte,cîţi,cîtva,contra,cu,cum,cumva,curând,curînd,da,dă,dacă,dar,datorită,de,deci,deja,deoarece,departe,deşi,din,dinaintea,dintr,dintre,drept,după,ea,ei,el,ele,eram,este,eşti,eu,face,fără,fi,fie,fiecare,fii,fim,fiţi,iar,ieri,îi,îl,îmi,împotriva,în,înainte,înaintea,încât,încît,încotro,între,întrucât,întrucît,îţi,la,lângă,le,li,lîngă,lor,lui,mă,mâine,mea,mei,mele,mereu,meu,mi,mine,mult,multă,mulţi,ne,nicăieri,nici,nimeni,nişte,noastră,noastre,noi,noştri,nostru,nu,ori,oricând,oricare,oricât,orice,oricînd,oricine,oricît,oricum,oriunde,până,pe,pentru,peste,pînă,poate,pot,prea,prima,primul,prin,printr,sa,să,săi,sale,sau,său,se,şi,sînt,sîntem,sînteţi,spre,sub,sunt,suntem,sunteţi,ta,tăi,tale,tău,te,ţi,ţie,tine,toată,toate,tot,toţi,totuşi,tu,un,una,unde,undeva,unei,unele,uneori,unor,vă,vi,voastră,voastre,voi,voştri,vostru,vouă,vreo,vreun
@@ -0,0 +1 @@
1
+ и,в,во,не,что,он,на,я,с,со,как,а,то,все,она,так,его,но,да,ты,к,у,же,вы,за,бы,по,только,ее,мне,было,вот,от,меня,еще,нет,о,из,ему,теперь,когда,даже,ну,вдруг,ли,если,уже,или,ни,быть,был,него,до,вас,нибудь,опять,уж,вам,сказал,ведь,там,потом,себя,ничего,ей,может,они,тут,где,есть,надо,ней,для,мы,тебя,их,чем,была,сам,чтоб,без,будто,человек,чего,раз,тоже,себе,под,жизнь,будет,ж,тогда,кто,этот,говорил,того,потому,этого,какой,совсем,ним,здесь,этом,один,почти,мой,тем,чтобы,нее,кажется,сейчас,были,куда,зачем,сказать,всех,никогда,сегодня,можно,при,наконец,два,об,другой,хоть,после,над,больше,тот,через,эти,нас,про,всего,них,какая,много,разве,сказала,три,эту,моя,впрочем,хорошо,свою,этой,перед,иногда,лучше,чуть,том,нельзя,такой,им,более,всегда,конечно,всю,между,
@@ -0,0 +1 @@
1
+ a,aby,aj,ako,aký,ale,alebo,ani,avšak,ba,bez,buď,cez,do,ho,hoci,i,ich,im,ja,jeho,jej,jemu,ju,k,kam,kde,kedže,keď,kto,ktorý,ku,lebo,ma,mi,mne,mnou,mu,my,mňa,môj,na,nad,nami,neho,nej,nemu,nich,nielen,nim,no,nám,nás,náš,ním,o,od,on,ona,oni,ono,ony,po,pod,pre,pred,pri,s,sa,seba,sem,so,svoj,taký,tam,teba,tebe,tebou,tej,ten,ti,tie,to,toho,tomu,tou,tvoj,ty,tá,tým,v,vami,veď,vo,vy,vám,vás,váš,však,z,za,zo,a,či,čo,čí,ňom,ňou,ňu,že
@@ -0,0 +1 @@
1
+ a,ali,april,avgust,b,bi,bil,bila,bile,bili,bilo,biti,blizu,bo,bodo,bojo,bolj,bom,bomo,boste,bova,boš,brez,c,cel,cela,celi,celo,d,da,daleč,dan,danes,datum,december,deset,deseta,deseti,deseto,devet,deveta,deveti,deveto,do,dober,dobra,dobri,dobro,dokler,dol,dolg,dolga,dolgi,dovolj,drug,druga,drugi,drugo,dva,dve,e,eden,en,ena,ene,eni,enkrat,eno,etc.,f,februar,g,g.,ga,ga.,gor,gospa,gospod,h,halo,i,idr.,ii,iii,in,iv,ix,iz,j,januar,jaz,je,ji,jih,jim,jo,julij,junij,jutri,k,kadarkoli,kaj,kajti,kako,kakor,kamor,kamorkoli,kar,karkoli,katerikoli,kdaj,kdo,kdorkoli,ker,ki,kje,kjer,kjerkoli,ko,koder,koderkoli,koga,komu,kot,kratek,kratka,kratke,kratki,l,lahka,lahke,lahki,lahko,le,lep,lepa,lepe,lepi,lepo,leto,m,maj,majhen,majhna,majhni,malce,malo,manj,marec,me,med,medtem,mene,mesec,mi,midva,midve,mnogo,moj,moja,moje,mora,morajo,moram,moramo,morate,moraš,morem,mu,n,na,nad,naj,najina,najino,najmanj,naju,največ,nam,narobe,nas,nato,nazaj,naš,naša,naše,ne,nedavno,nedelja,nek,neka,nekaj,nekatere,nekateri,nekatero,nekdo,neke,nekega,neki,nekje,neko,nekoga,nekoč,ni,nikamor,nikdar,nikjer,nikoli,nič,nje,njega,njegov,njegova,njegovo,njej,njemu,njen,njena,njeno,nji,njih,njihov,njihova,njihovo,njiju,njim,njo,njun,njuna,njuno,no,nocoj,november,npr.,o,ob,oba,obe,oboje,od,odprt,odprta,odprti,okoli,oktober,on,onadva,one,oni,onidve,osem,osma,osmi,osmo,oz.,p,pa,pet,peta,petek,peti,peto,po,pod,pogosto,poleg,poln,polna,polni,polno,ponavadi,ponedeljek,ponovno,potem,povsod,pozdravljen,pozdravljeni,prav,prava,prave,pravi,pravo,prazen,prazna,prazno,prbl.,precej,pred,prej,preko,pri,pribl.,približno,primer,pripravljen,pripravljena,pripravljeni,proti,prva,prvi,prvo,r,ravno,redko,res,reč,s,saj,sam,sama,same,sami,samo,se,sebe,sebi,sedaj,sedem,sedma,sedmi,sedmo,sem,september,seveda,si,sicer,skoraj,skozi,slab,smo,so,sobota,spet,sreda,srednja,srednji,sta,ste,stran,stvar,sva,t,ta,tak,taka,take,taki,tako,takoj,tam,te,tebe,tebi,tega,težak,težka,težki,težko,ti,tista,tiste,tisti,tisto,tj.,tja,to,toda,torek,tretja,tretj
e,tretji,tri,tu,tudi,tukaj,tvoj,tvoja,tvoje,u,v,vaju,vam,vas,vaš,vaša,vaše,ve,vedno,velik,velika,veliki,veliko,vendar,ves,več,vi,vidva,vii,viii,visok,visoka,visoke,visoki,vsa,vsaj,vsak,vsaka,vsakdo,vsake,vsaki,vsakomur,vse,vsega,vsi,vso,včasih,včeraj,x,z,za,zadaj,zadnji,zakaj,zaprta,zaprti,zaprto,zdaj,zelo,zunaj,č,če,često,četrta,četrtek,četrti,četrto,čez,čigav,š,šest,šesta,šesti,šesto,štiri,ž,že
@@ -0,0 +1 @@
1
+ aad,albaabkii,atabo,ay,ayaa,ayee,ayuu,dhan,hadana,in,inuu,isku,jiray,jirtay,ka,kale,kasoo,ku,kuu,lakin,markii,oo,si,soo,uga,ugu,uu,waa,waxa,waxuu
@@ -0,0 +1 @@
1
+ a,ba,bane,bona,e,ea,eaba,empa,ena,ha,hae,hape,ho,hore,ka,ke,la,le,li,me,mo,moo,ne,o,oa,re,sa,se,tloha,tsa,tse
@@ -0,0 +1 @@
1
+ och,det,att,i,en,jag,hon,som,han,på,den,med,var,sig,för,så,till,är,men,ett,om,hade,de,av,icke,mig,du,henne,då,sin,nu,har,inte,hans,honom,skulle,hennes,där,min,man,ej,vid,kunde,något,från,ut,när,efter,upp,vi,dem,vara,vad,över,än,dig,kan,sina,här,ha,mot,alla,under,någon,eller,allt,mycket,sedan,ju,denna,själv,detta,åt,utan,varit,hur,ingen,mitt,ni,bli,blev,oss,din,dessa,några,deras,blir,mina,samma,vilken,er,sådan,vår,blivit,dess,inom,mellan,sådant,varför,varje,vilka,ditt,vem,vilket,sitta,sådana,vart,dina,vars,vårt,våra,ert,era,vilkas,
@@ -0,0 +1 @@
1
+ akasema,alikuwa,alisema,baada,basi,bila,cha,chini,hadi,hapo,hata,hivyo,hiyo,huku,huo,ili,ilikuwa,juu,kama,karibu,katika,kila,kima,kisha,kubwa,kutoka,kuwa,kwa,kwamba,kwenda,kwenye,la,lakini,mara,mdogo,mimi,mkubwa,mmoja,moja,muda,mwenye,na,naye,ndani,ng,ni,nini,nonkungu,pamoja,pia,sana,sasa,sauti,tafadhali,tena,tu,vile,wa,wakati,wake,walikuwa,wao,watu,wengine,wote,ya,yake,yangu,yao,yeye,yule,za,zaidi,zake
@@ -0,0 +1 @@
1
+ ไว้,ไม่,ไป,ได้,ให้,ใน,โดย,แห่ง,แล้ว,และ,แรก,แบบ,แต่,เอง,เห็น,เลย,เริ่ม,เรา,เมื่อ,เพื่อ,เพราะ,เป็นการ,เป็น,เปิดเผย,เปิด,เนื่องจาก,เดียวกัน,เดียว,เช่น,เฉพาะ,เคย,เข้า,เขา,อีก,อาจ,อะไร,ออก,อย่าง,อยู่,อยาก,หาก,หลาย,หลังจาก,หลัง,หรือ,หนึ่ง,ส่วน,ส่ง,สุด,สําหรับ,ว่า,วัน,ลง,ร่วม,ราย,รับ,ระหว่าง,รวม,ยัง,มี,มาก,มา,พร้อม,พบ,ผ่าน,ผล,บาง,น่า,นี้,นํา,นั้น,นัก,นอกจาก,ทุก,ที่สุด,ที่,ทําให้,ทํา,ทาง,ทั้งนี้,ทั้ง,ถ้า,ถูก,ถึง,ต้อง,ต่างๆ,ต่าง,ต่อ,ตาม,ตั้งแต่,ตั้ง,ด้าน,ด้วย,ดัง,ซึ่ง,ช่วง,จึง,จาก,จัด,จะ,คือ,ความ,ครั้ง,คง,ขึ้น,ของ,ขอ,ขณะ,ก่อน,ก็,การ,กับ,กัน,กว่า,กล่าว,
@@ -0,0 +1 @@
1
+ acaba,altmış,altı,ama,ancak,arada,aslında,ayrıca,bana,bazı,belki,ben,benden,beni,benim,beri,beş,bile,bin,bir,birçok,biri,birkaç,birkez,birşey,birşeyi,biz,bize,bizden,bizi,bizim,böyle,böylece,bu,buna,bunda,bundan,bunlar,bunları,bunların,bunu,bunun,burada,çok,çünkü,da,daha,dahi,de,defa,değil,diğer,diye,doksan,dokuz,dolayı,dolayısıyla,dört,edecek,eden,ederek,edilecek,ediliyor,edilmesi,ediyor,eğer,elli,en,etmesi,etti,ettiği,ettiğini,gibi,göre,halen,hangi,hatta,hem,henüz,hep,hepsi,her,herhangi,herkesin,hiç,hiçbir,için,iki,ile,ilgili,ise,işte,itibaren,itibariyle,kadar,karşın,katrilyon,kendi,kendilerine,kendini,kendisi,kendisine,kendisini,kez,ki,kim,kimden,kime,kimi,kimse,kırk,milyar,milyon,mu,mü,mı,nasıl,ne,neden,nedenle,nerde,nerede,nereye,niye,niçin,o,olan,olarak,oldu,olduğu,olduğunu,olduklarını,olmadı,olmadığı,olmak,olması,olmayan,olmaz,olsa,olsun,olup,olur,olursa,oluyor,on,ona,ondan,onlar,onlardan,onları,onların,onu,onun,otuz,oysa,öyle,pek,rağmen,sadece,sanki,sekiz,seksen,sen,senden,seni,senin,siz,sizden,sizi,sizin,şey,şeyden,şeyi,şeyler,şöyle,şu,şuna,şunda,şundan,şunları,şunu,tarafından,trilyon,tüm,üç,üzere,var,vardı,ve,veya,ya,yani,yapacak,yapılan,yapılması,yapıyor,yapmak,yaptı,yaptığı,yaptığını,yaptıkları,yedi,yerine,yetmiş,yine,yirmi,yoksa,yüz,zaten,
@@ -0,0 +1 @@
1
+ a,an,bá,bí,bẹ̀rẹ̀,fún,fẹ́,gbogbo,inú,jù,jẹ,jẹ́,kan,kì,kí,kò,láti,lè,lọ,mi,mo,máa,mọ̀,ni,náà,ní,nígbà,nítorí,nǹkan,o,padà,pé,púpọ̀,pẹ̀lú,rẹ̀,sì,sí,sínú,ṣ,ti,tí,wà,wá,wọn,wọ́n,yìí,àti,àwọn,é,í,òun,ó,ń,ńlá,ṣe,ṣé,ṣùgbọ́n,ẹmọ́,ọjọ́,ọ̀pọ̀lọpọ̀
@@ -0,0 +1 @@
1
+ 、,。,〈,〉,《,》,一,一切,一则,一方面,一旦,一来,一样,一般,七,万一,三,上下,不仅,不但,不光,不单,不只,不如,不怕,不惟,不成,不拘,不比,不然,不特,不独,不管,不论,不过,不问,与,与其,与否,与此同时,且,两者,个,临,为,为了,为什么,为何,为着,乃,乃至,么,之,之一,之所以,之类,乌乎,乎,乘,九,也,也好,也罢,了,二,于,于是,于是乎,云云,五,人家,什么,什么样,从,从而,他,他人,他们,以,以便,以免,以及,以至,以至于,以致,们,任,任何,任凭,似的,但,但是,何,何况,何处,何时,作为,你,你们,使得,例如,依,依照,俺,俺们,倘,倘使,倘或,倘然,倘若,借,假使,假如,假若,像,八,六,兮,关于,其,其一,其中,其二,其他,其余,其它,其次,具体地说,具体说来,再者,再说,冒,冲,况且,几,几时,凭,凭借,则,别,别的,别说,到,前后,前者,加之,即,即令,即使,即便,即或,即若,又,及,及其,及至,反之,反过来,反过来说,另,另一方面,另外,只是,只有,只要,只限,叫,叮咚,可,可以,可是,可见,各,各个,各位,各种,各自,同,同时,向,向着,吓,吗,否则,吧,吧哒,吱,呀,呃,呕,呗,呜,呜呼,呢,呵,呸,呼哧,咋,和,咚,咦,咱,咱们,咳,哇,哈,哈哈,哉,哎,哎呀,哎哟,哗,哟,哦,哩,哪,哪个,哪些,哪儿,哪天,哪年,哪怕,哪样,哪边,哪里,哼,哼唷,唉,啊,啐,啥,啦,啪达,喂,喏,喔唷,嗡嗡,嗬,嗯,嗳,嘎,嘎登,嘘,嘛,嘻,嘿,四,因,因为,因此,因而,固然,在,在下,地,多,多少,她,她们,如,如上所述,如何,如其,如果,如此,如若,宁,宁可,宁愿,宁肯,它,它们,对,对于,将,尔后,尚且,就,就是,就是说,尽,尽管,岂但,己,并,并且,开外,开始,归,当,当着,彼,彼此,往,待,得,怎,怎么,怎么办,怎么样,怎样,总之,总的来看,总的来说,总的说来,总而言之,恰恰相反,您,慢说,我,我们,或,或是,或者,所,所以,打,把,抑或,拿,按,按照,换句话说,换言之,据,接着,故,故此,旁人,无宁,无论,既,既是,既然,时候,是,是的,替,有,有些,有关,有的,望,朝,朝着,本,本着,来,来着,极了,果然,果真,某,某个,某些,根据,正如,此,此外,此间,毋宁,每,每当,比,比如,比方,沿,沿着,漫说,焉,然则,然后,然而,照,照着,甚么,甚而,甚至,用,由,由于,由此可见,的,的话,相对而言,省得,着,着呢,矣,离,第,等,等等,管,紧接着,纵,纵令,纵使,纵然,经,经过,结果,给,继而,综上所述,罢了,者,而,而且,而况,而外,而已,而是,而言,能,腾,自,自个儿,自从,自各儿,自家,自己,自身,至,至于,若,若是,若非,莫若,虽,虽则,虽然,虽说,被,要,要不,要不是,要不然,要么,要是,让,论,设使,设若,该,诸位,谁,谁知,赶,起,起见,趁,趁着,越是,跟,较,较之,边,过,还是,还有,这,这个,这么,这么些,这么样,这么点儿,这些,这会儿,这儿,这就是说,这时,这样,这边,这里,进而,连,连同,通过,遵照,那,那个,那么,那么些,那么样,那些,那会儿,那儿,那时,那样,那边,那里,鄙人,鉴于,阿,除,除了,除此之外,除非,随,随着,零,非但,非徒,靠,顺,顺着,首先,︿,!,#,$,%,&,(,),*,+,,,0,1,2,3,4,5,6,7,8,9,:,;,<,>,?,@,[,],{,|,},~,¥
@@ -0,0 +1 @@
1
+ futhi,kahle,kakhulu,kanye,khona,kodwa,kungani,kusho,la,lakhe,lapho,mina,ngesikhathi,nje,phansi,phezulu,u,ukuba,ukuthi,ukuze,uma,wahamba,wakhe,wami,wase,wathi,yakhe,zakhe,zonke
@@ -0,0 +1,21 @@
1
module Stopwords
  module Snowball
    # Keeps one Stopwords::Snowball::Filter per file found in the sibling
    # `locales/` directory and dispatches stopword checks by language.
    class WordSieve
      # Builds a filter for every entry under `locales/`, keyed by the
      # entry's basename converted to a Symbol.
      #
      # @param custom_list [Array] forwarded unchanged as the second argument
      #   of every Stopwords::Snowball::Filter.new call
      def initialize(custom_list = [])
        locale_files = Dir["#{File.dirname(__FILE__)}/locales/*"]
        @filters = locale_files.each_with_object({}) do |file, filters|
          lang = File.basename(file)
          filters[lang.to_sym] = Stopwords::Snowball::Filter.new lang, custom_list
        end
      end

      # Tells whether a word is a stopword in the given language.
      #
      # @param args [Hash] `:lang` (Symbol or String locale name) and `:word`
      # @return the locale filter's `stopword?` answer, or `false` when
      #   `:lang` is missing or no filter is loaded for it
      def stopword?(args = {})
        locale_filter = filter_for(args[:lang])
        locale_filter ? locale_filter.stopword?(args[:word]) : false
      end

      # Removes the stopwords of the given language from a list of words.
      #
      # @param args [Hash] `:lang` (Symbol or String locale name) and `:words`
      # @return the locale filter's `filter` result, or `args[:words]`
      #   untouched when `:lang` is missing or no filter is loaded for it
      def filter(args = {})
        locale_filter = filter_for(args[:lang])
        locale_filter ? locale_filter.filter(args[:words]) : args[:words]
      end

      private

      # Looks up the filter registered for +lang+. Filters are keyed by
      # Symbol, so String names are converted first; anything that cannot be
      # turned into a Symbol (nil, false, ...) yields nil instead of raising.
      def filter_for(lang)
        return nil unless lang.respond_to?(:to_sym)

        @filters[lang.to_sym]
      end
    end
  end
end
@@ -0,0 +1,7 @@
1
+ # frozen_string_literal: true
2
+
3
+ # Stopword filtering backed by the per-locale word lists shipped under snowball/locales.
4
# Namespace for the locale-based stopword filters; loading this file pulls in
# the filter and word-sieve implementations that live under `snowball/`.
#
# The modules are opened in nested form (rather than the compact
# `Stopwords::Snowball`) so that this file can be loaded even when the
# top-level `Stopwords` module has not been defined yet.
module Stopwords
  module Snowball
    require_relative 'snowball/filter'
    require_relative 'snowball/wordsieve'
  end
end
data/lib/stopwords.rb ADDED
@@ -0,0 +1,7 @@
1
+ # frozen_string_literal: true
2
+
3
+ # A module for filtering stopwords from text.
4
+ module Stopwords
5
+ require_relative 'stopwords/filter'
6
+ require_relative 'stopwords/snowball'
7
+ end
@@ -0,0 +1,19 @@
1
+ # frozen_string_literal: true
2
+
3
+ require_relative('../spec_helper')
4
+
5
# Exercises a Stopwords::Filter built from an explicit word list and checks
# that those words are dropped from the token arrays handed to #filter.
describe Stopwords::Filter do
  context 'when fed with a list of arbitrary words' do
    let(:stopwords) { %w[A desde] }
    let(:filter) { Stopwords::Filter.new stopwords }

    subject { filter }

    it 'should remove the stopwords for the list of words to be filtered' do
      remaining = filter.filter('desde Santurce A Bilbao'.split)
      expect(remaining).to eq %w[Santurce Bilbao]
    end

    # Same sentence, but the casing of the stopwords differs from the list.
    it "should remove stopwords even if upcase and downcases doesn't match" do
      remaining = filter.filter('Desde Santurce a Bilbao'.split)
      expect(remaining).to eq %w[Santurce Bilbao]
    end
  end
end
@@ -0,0 +1,40 @@
1
+ # frozen_string_literal: true
2
+
3
+ require_relative('../spec_helper')
4
+
5
+ describe Stopwords::Snowball::Filter do
6
+ context 'when pointed to a valid locale' do
7
+ let(:filter) { Stopwords::Snowball::Filter.new 'es' } # 'es' is one of the locale files shipped with the gem
8
+
9
+ subject { filter }
10
+
11
+ it('should have the appropriate stopwords') do # pins the complete 'es' list, including its order (Array equality)
12
+ expect(subject.stopwords).to eq %w[
13
+ de la que el en y a los del se las por un para con no una su al lo como más
14
+ pero sus le ya o este sí porque esta entre cuando muy sin sobre también me hasta hay donde quien desde todo nos durante todos uno les ni contra otros ese eso ante ellos e esto mí antes algunos qué unos yo otro otras otra él tanto esa estos mucho quienes nada muchos cual poco ella estar estas algunas algo nosotros mi mis tú te ti tu tus ellas nosotras vosotros vosotras os mío mía míos mías tuyo tuya tuyos tuyas suyo suya suyos suyas nuestro nuestra nuestros nuestras vuestro vuestra vuestros vuestras esos esas estoy estás está estamos estáis están esté estés estemos estéis estén estaré estarás estará estaremos estaréis estarán estaría estarías estaríamos estaríais estarían estaba estabas estábamos estabais estaban estuve estuviste estuvo estuvimos estuvisteis estuvieron estuviera estuvieras estuviéramos estuvierais estuvieran estuviese estuvieses estuviésemos estuvieseis estuviesen estando estado estada estados estadas estad he has ha hemos habéis han haya hayas hayamos hayáis hayan habré habrás habrá habremos habréis habrán habría habrías habríamos habríais habrían había habías habíamos habíais habían hube hubiste hubo hubimos hubisteis hubieron hubiera hubieras hubiéramos hubierais hubieran hubiese hubieses hubiésemos hubieseis hubiesen habiendo habido habida habidos habidas soy eres es somos sois son sea seas seamos seáis sean seré serás será seremos seréis serán sería serías seríamos seríais serían era eras éramos erais eran fui fuiste fue fuimos fuisteis fueron fuera fueras fuéramos fuerais fueran fuese fueses fuésemos fueseis fuesen siendo sido tengo tienes tiene tenemos tenéis tienen tenga tengas tengamos tengáis tengan tendré tendrás tendrá tendremos tendréis tendrán tendría tendrías tendríamos tendríais tendrían tenía tenías teníamos teníais tenían tuve tuviste tuvo tuvimos tuvisteis tuvieron tuviera tuvieras tuviéramos tuvierais tuvieran tuviese tuvieses tuviésemos tuvieseis tuviesen teniendo tenido tenida tenidos tenidas tened
15
+ ]
16
+ end
17
+
18
+ it('should remove the stopwords for the list of words to be filtered') { # 'desde' and 'a' are both in the list above
19
+ expect(filter.filter('desde Santurce a Bilbao'.split)).to eq %w[Santurce Bilbao]
20
+ }
21
+ end
22
+
23
+ context 'when custom list' do
24
+ let(:filter) { Stopwords::Snowball::Filter.new('es', ['Santurce']) } # second argument: extra words filtered in addition to the locale list
25
+
26
+ subject { filter }
27
+
28
+ it('should remove the stopwords for the list of words to be filtered') { # custom word and locale stopwords are all removed
29
+ expect(filter.filter('desde Santurce a Bilbao'.split)).to eq ['Bilbao']
30
+ }
31
+ end
32
+
33
+ context 'when locale is not found' do
34
+ let(:filter) { Stopwords::Snowball::Filter.new 'no-real' } # no locale file by this name ships with the gem
35
+
36
+ subject { filter }
37
+
38
+ it('should throw an error explaining the locale not found') { expect { filter }.to raise_error(ArgumentError) }
39
+ end
40
+ end
@@ -0,0 +1,3 @@
1
+ # frozen_string_literal: true
2
+
3
+ require_relative '../lib/stopwords'
metadata ADDED
@@ -0,0 +1,110 @@
1
+ --- !ruby/object:Gem::Specification
2
+ name: stopwords-filters
3
+ version: !ruby/object:Gem::Version
4
+ version: 1.0.0
5
+ platform: ruby
6
+ authors:
7
+ - Silviu Panaite
8
+ autorequire:
9
+ bindir: bin
10
+ cert_chain: []
11
+ date: 2024-09-06 00:00:00.000000000 Z
12
+ dependencies: []
13
+ description: Small library that allows you to create a simple stopwords filter or
14
+ use some based on Snowball stopwords lists
15
+ email: silviu.panaite@gmail.com
16
+ executables: []
17
+ extensions: []
18
+ extra_rdoc_files:
19
+ - CHANGELOG
20
+ - LICENSE.txt
21
+ - README.md
22
+ files:
23
+ - CHANGELOG
24
+ - Gemfile
25
+ - Gemfile.lock
26
+ - LICENSE.txt
27
+ - README.md
28
+ - VERSION
29
+ - lib/stopwords.rb
30
+ - lib/stopwords/filter.rb
31
+ - lib/stopwords/snowball.rb
32
+ - lib/stopwords/snowball/filter.rb
33
+ - lib/stopwords/snowball/locales/af
34
+ - lib/stopwords/snowball/locales/ar
35
+ - lib/stopwords/snowball/locales/bg
36
+ - lib/stopwords/snowball/locales/bn
37
+ - lib/stopwords/snowball/locales/ca
38
+ - lib/stopwords/snowball/locales/ckb
39
+ - lib/stopwords/snowball/locales/cz
40
+ - lib/stopwords/snowball/locales/da
41
+ - lib/stopwords/snowball/locales/de
42
+ - lib/stopwords/snowball/locales/el
43
+ - lib/stopwords/snowball/locales/en
44
+ - lib/stopwords/snowball/locales/eo
45
+ - lib/stopwords/snowball/locales/es
46
+ - lib/stopwords/snowball/locales/et
47
+ - lib/stopwords/snowball/locales/eu
48
+ - lib/stopwords/snowball/locales/fa
49
+ - lib/stopwords/snowball/locales/fi
50
+ - lib/stopwords/snowball/locales/fr
51
+ - lib/stopwords/snowball/locales/ga
52
+ - lib/stopwords/snowball/locales/gl
53
+ - lib/stopwords/snowball/locales/he
54
+ - lib/stopwords/snowball/locales/hi
55
+ - lib/stopwords/snowball/locales/hr
56
+ - lib/stopwords/snowball/locales/hu
57
+ - lib/stopwords/snowball/locales/hy
58
+ - lib/stopwords/snowball/locales/id
59
+ - lib/stopwords/snowball/locales/it
60
+ - lib/stopwords/snowball/locales/ja
61
+ - lib/stopwords/snowball/locales/ko
62
+ - lib/stopwords/snowball/locales/la
63
+ - lib/stopwords/snowball/locales/lt
64
+ - lib/stopwords/snowball/locales/lv
65
+ - lib/stopwords/snowball/locales/mr
66
+ - lib/stopwords/snowball/locales/nl
67
+ - lib/stopwords/snowball/locales/no
68
+ - lib/stopwords/snowball/locales/pl
69
+ - lib/stopwords/snowball/locales/pt
70
+ - lib/stopwords/snowball/locales/ro
71
+ - lib/stopwords/snowball/locales/ru
72
+ - lib/stopwords/snowball/locales/sk
73
+ - lib/stopwords/snowball/locales/sl
74
+ - lib/stopwords/snowball/locales/so
75
+ - lib/stopwords/snowball/locales/st
76
+ - lib/stopwords/snowball/locales/sv
77
+ - lib/stopwords/snowball/locales/sw
78
+ - lib/stopwords/snowball/locales/th
79
+ - lib/stopwords/snowball/locales/tr
80
+ - lib/stopwords/snowball/locales/yo
81
+ - lib/stopwords/snowball/locales/zh
82
+ - lib/stopwords/snowball/locales/zu
83
+ - lib/stopwords/snowball/wordsieve.rb
84
+ - spec/lib/filter_spec.rb
85
+ - spec/lib/snowball_filter_spec.rb
86
+ - spec/spec_helper.rb
87
+ homepage: http://github.com/brenes/stopwords-filters
88
+ licenses:
89
+ - MIT
90
+ metadata: {}
91
+ post_install_message:
92
+ rdoc_options: []
93
+ require_paths:
94
+ - lib
95
+ required_ruby_version: !ruby/object:Gem::Requirement
96
+ requirements:
97
+ - - ">="
98
+ - !ruby/object:Gem::Version
99
+ version: '0'
100
+ required_rubygems_version: !ruby/object:Gem::Requirement
101
+ requirements:
102
+ - - ">="
103
+ - !ruby/object:Gem::Version
104
+ version: '0'
105
+ requirements: []
106
+ rubygems_version: 3.5.6
107
+ signing_key:
108
+ specification_version: 4
109
+ summary: Snowball based filters for stopwords
110
+ test_files: []