rere 0.0.1

Sign up to get free protection for your applications and to get access to all the features.
Files changed (168) hide show
  1. data/.classpath +260 -0
  2. data/.gitignore +28 -0
  3. data/.project +14 -0
  4. data/.ruby-version +1 -0
  5. data/.settings/org.eclim.prefs +3 -0
  6. data/.settings/org.eclipse.jdt.core.prefs +5 -0
  7. data/.settings/org.eclipse.jdt.ui.prefs +2 -0
  8. data/Gemfile +7 -0
  9. data/LICENSE +22 -0
  10. data/README.md +44 -0
  11. data/Rakefile +65 -0
  12. data/bin/solr +61 -0
  13. data/example/config/solr.yml +23 -0
  14. data/example/log/.gitkeep +0 -0
  15. data/example/solr/README.txt +63 -0
  16. data/example/solr/collection1/README.txt +50 -0
  17. data/example/solr/collection1/conf/admin-extra.html +24 -0
  18. data/example/solr/collection1/conf/admin-extra.menu-bottom.html +25 -0
  19. data/example/solr/collection1/conf/admin-extra.menu-top.html +25 -0
  20. data/example/solr/collection1/conf/currency.xml +67 -0
  21. data/example/solr/collection1/conf/elevate.xml +38 -0
  22. data/example/solr/collection1/conf/lang/contractions_ca.txt +8 -0
  23. data/example/solr/collection1/conf/lang/contractions_fr.txt +15 -0
  24. data/example/solr/collection1/conf/lang/contractions_ga.txt +5 -0
  25. data/example/solr/collection1/conf/lang/contractions_it.txt +23 -0
  26. data/example/solr/collection1/conf/lang/hyphenations_ga.txt +5 -0
  27. data/example/solr/collection1/conf/lang/stemdict_nl.txt +6 -0
  28. data/example/solr/collection1/conf/lang/stoptags_ja.txt +420 -0
  29. data/example/solr/collection1/conf/lang/stopwords_ar.txt +125 -0
  30. data/example/solr/collection1/conf/lang/stopwords_bg.txt +193 -0
  31. data/example/solr/collection1/conf/lang/stopwords_ca.txt +220 -0
  32. data/example/solr/collection1/conf/lang/stopwords_cz.txt +172 -0
  33. data/example/solr/collection1/conf/lang/stopwords_da.txt +108 -0
  34. data/example/solr/collection1/conf/lang/stopwords_de.txt +292 -0
  35. data/example/solr/collection1/conf/lang/stopwords_el.txt +78 -0
  36. data/example/solr/collection1/conf/lang/stopwords_en.txt +54 -0
  37. data/example/solr/collection1/conf/lang/stopwords_es.txt +354 -0
  38. data/example/solr/collection1/conf/lang/stopwords_eu.txt +99 -0
  39. data/example/solr/collection1/conf/lang/stopwords_fa.txt +313 -0
  40. data/example/solr/collection1/conf/lang/stopwords_fi.txt +95 -0
  41. data/example/solr/collection1/conf/lang/stopwords_fr.txt +184 -0
  42. data/example/solr/collection1/conf/lang/stopwords_ga.txt +110 -0
  43. data/example/solr/collection1/conf/lang/stopwords_gl.txt +161 -0
  44. data/example/solr/collection1/conf/lang/stopwords_hi.txt +235 -0
  45. data/example/solr/collection1/conf/lang/stopwords_hu.txt +209 -0
  46. data/example/solr/collection1/conf/lang/stopwords_hy.txt +46 -0
  47. data/example/solr/collection1/conf/lang/stopwords_id.txt +359 -0
  48. data/example/solr/collection1/conf/lang/stopwords_it.txt +301 -0
  49. data/example/solr/collection1/conf/lang/stopwords_ja.txt +127 -0
  50. data/example/solr/collection1/conf/lang/stopwords_lv.txt +172 -0
  51. data/example/solr/collection1/conf/lang/stopwords_nl.txt +117 -0
  52. data/example/solr/collection1/conf/lang/stopwords_no.txt +192 -0
  53. data/example/solr/collection1/conf/lang/stopwords_pt.txt +251 -0
  54. data/example/solr/collection1/conf/lang/stopwords_ro.txt +233 -0
  55. data/example/solr/collection1/conf/lang/stopwords_ru.txt +241 -0
  56. data/example/solr/collection1/conf/lang/stopwords_sv.txt +131 -0
  57. data/example/solr/collection1/conf/lang/stopwords_th.txt +119 -0
  58. data/example/solr/collection1/conf/lang/stopwords_tr.txt +212 -0
  59. data/example/solr/collection1/conf/lang/userdict_ja.txt +29 -0
  60. data/example/solr/collection1/conf/mapping-FoldToASCII.txt +3813 -0
  61. data/example/solr/collection1/conf/mapping-ISOLatin1Accent.txt +246 -0
  62. data/example/solr/collection1/conf/protwords.txt +21 -0
  63. data/example/solr/collection1/conf/schema.xml +1125 -0
  64. data/example/solr/collection1/conf/scripts.conf +24 -0
  65. data/example/solr/collection1/conf/solrconfig.xml +1816 -0
  66. data/example/solr/collection1/conf/spellings.txt +2 -0
  67. data/example/solr/collection1/conf/stopwords.txt +14 -0
  68. data/example/solr/collection1/conf/synonyms.txt +29 -0
  69. data/example/solr/collection1/conf/update-script.js +53 -0
  70. data/example/solr/collection1/conf/velocity/VM_global_library.vm +170 -0
  71. data/example/solr/collection1/conf/velocity/browse.vm +50 -0
  72. data/example/solr/collection1/conf/velocity/cluster.vm +9 -0
  73. data/example/solr/collection1/conf/velocity/clusterResults.vm +12 -0
  74. data/example/solr/collection1/conf/velocity/debug.vm +17 -0
  75. data/example/solr/collection1/conf/velocity/did_you_mean.vm +4 -0
  76. data/example/solr/collection1/conf/velocity/facet_fields.vm +15 -0
  77. data/example/solr/collection1/conf/velocity/facet_pivot.vm +3 -0
  78. data/example/solr/collection1/conf/velocity/facet_queries.vm +3 -0
  79. data/example/solr/collection1/conf/velocity/facet_ranges.vm +15 -0
  80. data/example/solr/collection1/conf/velocity/facets.vm +5 -0
  81. data/example/solr/collection1/conf/velocity/footer.vm +17 -0
  82. data/example/solr/collection1/conf/velocity/head.vm +32 -0
  83. data/example/solr/collection1/conf/velocity/header.vm +3 -0
  84. data/example/solr/collection1/conf/velocity/hit.vm +11 -0
  85. data/example/solr/collection1/conf/velocity/hitGrouped.vm +24 -0
  86. data/example/solr/collection1/conf/velocity/join-doc.vm +4 -0
  87. data/example/solr/collection1/conf/velocity/jquery.autocomplete.css +48 -0
  88. data/example/solr/collection1/conf/velocity/jquery.autocomplete.js +763 -0
  89. data/example/solr/collection1/conf/velocity/layout.vm +20 -0
  90. data/example/solr/collection1/conf/velocity/main.css +208 -0
  91. data/example/solr/collection1/conf/velocity/product-doc.vm +27 -0
  92. data/example/solr/collection1/conf/velocity/query.vm +42 -0
  93. data/example/solr/collection1/conf/velocity/queryGroup.vm +19 -0
  94. data/example/solr/collection1/conf/velocity/querySpatial.vm +40 -0
  95. data/example/solr/collection1/conf/velocity/richtext-doc.vm +114 -0
  96. data/example/solr/collection1/conf/velocity/suggest.vm +3 -0
  97. data/example/solr/collection1/conf/velocity/tabs.vm +6 -0
  98. data/example/solr/collection1/conf/xslt/example.xsl +132 -0
  99. data/example/solr/collection1/conf/xslt/example_atom.xsl +67 -0
  100. data/example/solr/collection1/conf/xslt/example_rss.xsl +66 -0
  101. data/example/solr/collection1/conf/xslt/luke.xsl +337 -0
  102. data/example/solr/collection1/conf/xslt/updateXml.xsl +70 -0
  103. data/example/solr/collection1/data/index/segments.gen +0 -0
  104. data/example/solr/collection1/data/index/segments_1 +0 -0
  105. data/example/solr/data/development/index/segments.gen +0 -0
  106. data/example/solr/data/development/index/segments_1 +0 -0
  107. data/example/solr/solr.xml +53 -0
  108. data/example/solr/zoo.cfg +17 -0
  109. data/lib/rere.rb +66 -0
  110. data/lib/rere/railtie.rb +8 -0
  111. data/lib/rere/server.rb +380 -0
  112. data/lib/rere/tasks/solr.rake +47 -0
  113. data/lib/rere/version.rb +3 -0
  114. data/pom.xml +168 -0
  115. data/rere.gemspec +26 -0
  116. data/server/README.txt +78 -0
  117. data/server/cloud-scripts/zkcli.bat +12 -0
  118. data/server/cloud-scripts/zkcli.sh +14 -0
  119. data/server/contexts/solr-jetty-context.xml +8 -0
  120. data/server/etc/create-solrtest.keystore.sh +37 -0
  121. data/server/etc/jetty.xml +205 -0
  122. data/server/etc/logging.properties +38 -0
  123. data/server/etc/solrtest.keystore +0 -0
  124. data/server/etc/webdefault.xml +527 -0
  125. data/server/exampledocs/books.csv +11 -0
  126. data/server/exampledocs/books.json +51 -0
  127. data/server/exampledocs/gb18030-example.xml +32 -0
  128. data/server/exampledocs/hd.xml +56 -0
  129. data/server/exampledocs/ipod_other.xml +60 -0
  130. data/server/exampledocs/ipod_video.xml +40 -0
  131. data/server/exampledocs/manufacturers.xml +75 -0
  132. data/server/exampledocs/mem.xml +77 -0
  133. data/server/exampledocs/money.xml +65 -0
  134. data/server/exampledocs/monitor.xml +35 -0
  135. data/server/exampledocs/monitor2.xml +34 -0
  136. data/server/exampledocs/mp500.xml +43 -0
  137. data/server/exampledocs/post.jar +0 -0
  138. data/server/exampledocs/post.sh +30 -0
  139. data/server/exampledocs/sd500.xml +38 -0
  140. data/server/exampledocs/solr.xml +38 -0
  141. data/server/exampledocs/test_utf8.sh +93 -0
  142. data/server/exampledocs/utf8-example.xml +42 -0
  143. data/server/exampledocs/vidcard.xml +62 -0
  144. data/server/lib/ext/jcl-over-slf4j-1.6.6.jar +0 -0
  145. data/server/lib/ext/jul-to-slf4j-1.6.6.jar +0 -0
  146. data/server/lib/ext/log4j-1.2.16.jar +0 -0
  147. data/server/lib/ext/slf4j-api-1.6.6.jar +0 -0
  148. data/server/lib/ext/slf4j-log4j12-1.6.6.jar +0 -0
  149. data/server/lib/jetty-continuation-8.1.8.v20121106.jar +0 -0
  150. data/server/lib/jetty-deploy-8.1.8.v20121106.jar +0 -0
  151. data/server/lib/jetty-http-8.1.8.v20121106.jar +0 -0
  152. data/server/lib/jetty-io-8.1.8.v20121106.jar +0 -0
  153. data/server/lib/jetty-jmx-8.1.8.v20121106.jar +0 -0
  154. data/server/lib/jetty-security-8.1.8.v20121106.jar +0 -0
  155. data/server/lib/jetty-server-8.1.8.v20121106.jar +0 -0
  156. data/server/lib/jetty-servlet-8.1.8.v20121106.jar +0 -0
  157. data/server/lib/jetty-util-8.1.8.v20121106.jar +0 -0
  158. data/server/lib/jetty-webapp-8.1.8.v20121106.jar +0 -0
  159. data/server/lib/jetty-xml-8.1.8.v20121106.jar +0 -0
  160. data/server/lib/servlet-api-3.0.jar +0 -0
  161. data/server/resources/log4j.properties +19 -0
  162. data/server/solr/README.txt +63 -0
  163. data/server/solr/solr.xml +53 -0
  164. data/server/solr/zoo.cfg +17 -0
  165. data/server/start.jar +0 -0
  166. data/server/webapps/solr.war +0 -0
  167. data/solr/lib/solr-winds-0.1.jar +0 -0
  168. metadata +284 -0
@@ -0,0 +1,131 @@
1
+ | From svn.tartarus.org/snowball/trunk/website/algorithms/swedish/stop.txt
2
+ | This file is distributed under the BSD License.
3
+ | See http://snowball.tartarus.org/license.php
4
+ | Also see http://www.opensource.org/licenses/bsd-license.html
5
+ | - Encoding was converted to UTF-8.
6
+ | - This notice was added.
7
+
8
+ | A Swedish stop word list. Comments begin with vertical bar. Each stop
9
+ | word is at the start of a line.
10
+
11
+ | This is a ranked list (commonest to rarest) of stopwords derived from
12
+ | a large text sample.
13
+
14
+ | Swedish stop words occasionally exhibit homonym clashes. For example
15
+ | så = so, but also seed. These are indicated clearly below.
16
+
17
+ och | and
18
+ det | it, this/that
19
+ att | to (with infinitive)
20
+ i | in, at
21
+ en | a
22
+ jag | I
23
+ hon | she
24
+ som | who, that
25
+ han | he
26
+ på | on
27
+ den | it, this/that
28
+ med | with
29
+ var | where, each
30
+ sig | him(self) etc
31
+ för | for
32
+ så | so (also: seed)
33
+ till | to
34
+ är | is
35
+ men | but
36
+ ett | a
37
+ om | if; around, about
38
+ hade | had
39
+ de | they, these/those
40
+ av | of
41
+ icke | not, no
42
+ mig | me
43
+ du | you
44
+ henne | her
45
+ då | then, when
46
+ sin | his
47
+ nu | now
48
+ har | have
49
+ inte | inte någon = no one
50
+ hans | his
51
+ honom | him
52
+ skulle | 'sake'
53
+ hennes | her
54
+ där | there
55
+ min | my
56
+ man | one (pronoun)
57
+ ej | nor
58
+ vid | at, by, on (also: vast)
59
+ kunde | could
60
+ något | some etc
61
+ från | from, off
62
+ ut | out
63
+ när | when
64
+ efter | after, behind
65
+ upp | up
66
+ vi | we
67
+ dem | them
68
+ vara | be
69
+ vad | what
70
+ över | over
71
+ än | than
72
+ dig | you
73
+ kan | can
74
+ sina | his
75
+ här | here
76
+ ha | have
77
+ mot | towards
78
+ alla | all
79
+ under | under (also: wonder)
80
+ någon | some etc
81
+ eller | or (else)
82
+ allt | all
83
+ mycket | much
84
+ sedan | since
85
+ ju | why
86
+ denna | this/that
87
+ själv | myself, yourself etc
88
+ detta | this/that
89
+ åt | to
90
+ utan | without
91
+ varit | was
92
+ hur | how
93
+ ingen | no
94
+ mitt | my
95
+ ni | you
96
+ bli | to be, become
97
+ blev | from bli
98
+ oss | us
99
+ din | thy
100
+ dessa | these/those
101
+ några | some etc
102
+ deras | their
103
+ blir | from bli
104
+ mina | my
105
+ samma | (the) same
106
+ vilken | who, that
107
+ er | you, your
108
+ sådan | such a
109
+ vår | our
110
+ blivit | from bli
111
+ dess | its
112
+ inom | within
113
+ mellan | between
114
+ sådant | such a
115
+ varför | why
116
+ varje | each
117
+ vilka | who, that
118
+ ditt | thy
119
+ vem | who
120
+ vilket | who, that
121
+ sitta | his
122
+ sådana | such a
123
+ vart | each
124
+ dina | thy
125
+ vars | whose
126
+ vårt | our
127
+ våra | our
128
+ ert | your
129
+ era | your
130
+ vilkas | whose
131
+
@@ -0,0 +1,119 @@
1
+ # Thai stopwords from:
2
+ # "Opinion Detection in Thai Political News Columns
3
+ # Based on Subjectivity Analysis"
4
+ # Khampol Sukhum, Supot Nitsuwat, and Choochart Haruechaiyasak
5
+ ไว้
6
+ ไม่
7
+ ไป
8
+ ได้
9
+ ให้
10
+ ใน
11
+ โดย
12
+ แห่ง
13
+ แล้ว
14
+ และ
15
+ แรก
16
+ แบบ
17
+ แต่
18
+ เอง
19
+ เห็น
20
+ เลย
21
+ เริ่ม
22
+ เรา
23
+ เมื่อ
24
+ เพื่อ
25
+ เพราะ
26
+ เป็นการ
27
+ เป็น
28
+ เปิดเผย
29
+ เปิด
30
+ เนื่องจาก
31
+ เดียวกัน
32
+ เดียว
33
+ เช่น
34
+ เฉพาะ
35
+ เคย
36
+ เข้า
37
+ เขา
38
+ อีก
39
+ อาจ
40
+ อะไร
41
+ ออก
42
+ อย่าง
43
+ อยู่
44
+ อยาก
45
+ หาก
46
+ หลาย
47
+ หลังจาก
48
+ หลัง
49
+ หรือ
50
+ หนึ่ง
51
+ ส่วน
52
+ ส่ง
53
+ สุด
54
+ สําหรับ
55
+ ว่า
56
+ วัน
57
+ ลง
58
+ ร่วม
59
+ ราย
60
+ รับ
61
+ ระหว่าง
62
+ รวม
63
+ ยัง
64
+ มี
65
+ มาก
66
+ มา
67
+ พร้อม
68
+ พบ
69
+ ผ่าน
70
+ ผล
71
+ บาง
72
+ น่า
73
+ นี้
74
+ นํา
75
+ นั้น
76
+ นัก
77
+ นอกจาก
78
+ ทุก
79
+ ที่สุด
80
+ ที่
81
+ ทําให้
82
+ ทํา
83
+ ทาง
84
+ ทั้งนี้
85
+ ทั้ง
86
+ ถ้า
87
+ ถูก
88
+ ถึง
89
+ ต้อง
90
+ ต่างๆ
91
+ ต่าง
92
+ ต่อ
93
+ ตาม
94
+ ตั้งแต่
95
+ ตั้ง
96
+ ด้าน
97
+ ด้วย
98
+ ดัง
99
+ ซึ่ง
100
+ ช่วง
101
+ จึง
102
+ จาก
103
+ จัด
104
+ จะ
105
+ คือ
106
+ ความ
107
+ ครั้ง
108
+ คง
109
+ ขึ้น
110
+ ของ
111
+ ขอ
112
+ ขณะ
113
+ ก่อน
114
+ ก็
115
+ การ
116
+ กับ
117
+ กัน
118
+ กว่า
119
+ กล่าว
@@ -0,0 +1,212 @@
1
+ # Turkish stopwords from LUCENE-559
2
+ # merged with the list from "Information Retrieval on Turkish Texts"
3
+ # (http://www.users.muohio.edu/canf/papers/JASIST2008offPrint.pdf)
4
+ acaba
5
+ altmış
6
+ altı
7
+ ama
8
+ ancak
9
+ arada
10
+ aslında
11
+ ayrıca
12
+ bana
13
+ bazı
14
+ belki
15
+ ben
16
+ benden
17
+ beni
18
+ benim
19
+ beri
20
+ beş
21
+ bile
22
+ bin
23
+ bir
24
+ birçok
25
+ biri
26
+ birkaç
27
+ birkez
28
+ birşey
29
+ birşeyi
30
+ biz
31
+ bize
32
+ bizden
33
+ bizi
34
+ bizim
35
+ böyle
36
+ böylece
37
+ bu
38
+ buna
39
+ bunda
40
+ bundan
41
+ bunlar
42
+ bunları
43
+ bunların
44
+ bunu
45
+ bunun
46
+ burada
47
+ çok
48
+ çünkü
49
+ da
50
+ daha
51
+ dahi
52
+ de
53
+ defa
54
+ değil
55
+ diğer
56
+ diye
57
+ doksan
58
+ dokuz
59
+ dolayı
60
+ dolayısıyla
61
+ dört
62
+ edecek
63
+ eden
64
+ ederek
65
+ edilecek
66
+ ediliyor
67
+ edilmesi
68
+ ediyor
69
+ eğer
70
+ elli
71
+ en
72
+ etmesi
73
+ etti
74
+ ettiği
75
+ ettiğini
76
+ gibi
77
+ göre
78
+ halen
79
+ hangi
80
+ hatta
81
+ hem
82
+ henüz
83
+ hep
84
+ hepsi
85
+ her
86
+ herhangi
87
+ herkesin
88
+ hiç
89
+ hiçbir
90
+ için
91
+ iki
92
+ ile
93
+ ilgili
94
+ ise
95
+ işte
96
+ itibaren
97
+ itibariyle
98
+ kadar
99
+ karşın
100
+ katrilyon
101
+ kendi
102
+ kendilerine
103
+ kendini
104
+ kendisi
105
+ kendisine
106
+ kendisini
107
+ kez
108
+ ki
109
+ kim
110
+ kimden
111
+ kime
112
+ kimi
113
+ kimse
114
+ kırk
115
+ milyar
116
+ milyon
117
+ mu
118
+ mü
119
+ mı
120
+ nasıl
121
+ ne
122
+ neden
123
+ nedenle
124
+ nerde
125
+ nerede
126
+ nereye
127
+ niye
128
+ niçin
129
+ o
130
+ olan
131
+ olarak
132
+ oldu
133
+ olduğu
134
+ olduğunu
135
+ olduklarını
136
+ olmadı
137
+ olmadığı
138
+ olmak
139
+ olması
140
+ olmayan
141
+ olmaz
142
+ olsa
143
+ olsun
144
+ olup
145
+ olur
146
+ olursa
147
+ oluyor
148
+ on
149
+ ona
150
+ ondan
151
+ onlar
152
+ onlardan
153
+ onları
154
+ onların
155
+ onu
156
+ onun
157
+ otuz
158
+ oysa
159
+ öyle
160
+ pek
161
+ rağmen
162
+ sadece
163
+ sanki
164
+ sekiz
165
+ seksen
166
+ sen
167
+ senden
168
+ seni
169
+ senin
170
+ siz
171
+ sizden
172
+ sizi
173
+ sizin
174
+ şey
175
+ şeyden
176
+ şeyi
177
+ şeyler
178
+ şöyle
179
+ şu
180
+ şuna
181
+ şunda
182
+ şundan
183
+ şunları
184
+ şunu
185
+ tarafından
186
+ trilyon
187
+ tüm
188
+ üç
189
+ üzere
190
+ var
191
+ vardı
192
+ ve
193
+ veya
194
+ ya
195
+ yani
196
+ yapacak
197
+ yapılan
198
+ yapılması
199
+ yapıyor
200
+ yapmak
201
+ yaptı
202
+ yaptığı
203
+ yaptığını
204
+ yaptıkları
205
+ yedi
206
+ yerine
207
+ yetmiş
208
+ yine
209
+ yirmi
210
+ yoksa
211
+ yüz
212
+ zaten