ruby-spark 1.1.0.1-java

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (180)
  1. checksums.yaml +7 -0
  2. data/.gitignore +37 -0
  3. data/Gemfile +47 -0
  4. data/Guardfile +5 -0
  5. data/LICENSE.txt +22 -0
  6. data/README.md +252 -0
  7. data/Rakefile +35 -0
  8. data/TODO.md +6 -0
  9. data/benchmark/aggregate.rb +33 -0
  10. data/benchmark/bisect.rb +88 -0
  11. data/benchmark/comparison/prepare.sh +18 -0
  12. data/benchmark/comparison/python.py +156 -0
  13. data/benchmark/comparison/r.r +69 -0
  14. data/benchmark/comparison/ruby.rb +167 -0
  15. data/benchmark/comparison/run-all.sh +160 -0
  16. data/benchmark/comparison/scala.scala +181 -0
  17. data/benchmark/custom_marshal.rb +94 -0
  18. data/benchmark/digest.rb +150 -0
  19. data/benchmark/enumerator.rb +88 -0
  20. data/benchmark/serializer.rb +82 -0
  21. data/benchmark/sort.rb +43 -0
  22. data/benchmark/sort2.rb +164 -0
  23. data/benchmark/take.rb +28 -0
  24. data/bin/ruby-spark +8 -0
  25. data/example/pi.rb +28 -0
  26. data/example/website_search.rb +83 -0
  27. data/ext/ruby_c/extconf.rb +3 -0
  28. data/ext/ruby_c/murmur.c +158 -0
  29. data/ext/ruby_c/murmur.h +9 -0
  30. data/ext/ruby_c/ruby-spark.c +18 -0
  31. data/ext/ruby_java/Digest.java +36 -0
  32. data/ext/ruby_java/Murmur2.java +98 -0
  33. data/ext/ruby_java/RubySparkExtService.java +28 -0
  34. data/ext/ruby_java/extconf.rb +3 -0
  35. data/ext/spark/build.sbt +73 -0
  36. data/ext/spark/project/plugins.sbt +9 -0
  37. data/ext/spark/sbt/sbt +34 -0
  38. data/ext/spark/src/main/scala/Exec.scala +91 -0
  39. data/ext/spark/src/main/scala/MLLibAPI.scala +4 -0
  40. data/ext/spark/src/main/scala/Marshal.scala +52 -0
  41. data/ext/spark/src/main/scala/MarshalDump.scala +113 -0
  42. data/ext/spark/src/main/scala/MarshalLoad.scala +220 -0
  43. data/ext/spark/src/main/scala/RubyAccumulatorParam.scala +69 -0
  44. data/ext/spark/src/main/scala/RubyBroadcast.scala +13 -0
  45. data/ext/spark/src/main/scala/RubyConstant.scala +13 -0
  46. data/ext/spark/src/main/scala/RubyMLLibAPI.scala +55 -0
  47. data/ext/spark/src/main/scala/RubyMLLibUtilAPI.scala +21 -0
  48. data/ext/spark/src/main/scala/RubyPage.scala +34 -0
  49. data/ext/spark/src/main/scala/RubyRDD.scala +392 -0
  50. data/ext/spark/src/main/scala/RubySerializer.scala +14 -0
  51. data/ext/spark/src/main/scala/RubyTab.scala +11 -0
  52. data/ext/spark/src/main/scala/RubyUtils.scala +15 -0
  53. data/ext/spark/src/main/scala/RubyWorker.scala +257 -0
  54. data/ext/spark/src/test/scala/MarshalSpec.scala +84 -0
  55. data/lib/ruby-spark.rb +1 -0
  56. data/lib/spark.rb +198 -0
  57. data/lib/spark/accumulator.rb +260 -0
  58. data/lib/spark/broadcast.rb +98 -0
  59. data/lib/spark/build.rb +43 -0
  60. data/lib/spark/cli.rb +169 -0
  61. data/lib/spark/command.rb +86 -0
  62. data/lib/spark/command/base.rb +158 -0
  63. data/lib/spark/command/basic.rb +345 -0
  64. data/lib/spark/command/pair.rb +124 -0
  65. data/lib/spark/command/sort.rb +51 -0
  66. data/lib/spark/command/statistic.rb +144 -0
  67. data/lib/spark/command_builder.rb +141 -0
  68. data/lib/spark/command_validator.rb +34 -0
  69. data/lib/spark/config.rb +238 -0
  70. data/lib/spark/constant.rb +14 -0
  71. data/lib/spark/context.rb +322 -0
  72. data/lib/spark/error.rb +50 -0
  73. data/lib/spark/ext/hash.rb +41 -0
  74. data/lib/spark/ext/integer.rb +25 -0
  75. data/lib/spark/ext/io.rb +67 -0
  76. data/lib/spark/ext/ip_socket.rb +29 -0
  77. data/lib/spark/ext/module.rb +58 -0
  78. data/lib/spark/ext/object.rb +24 -0
  79. data/lib/spark/ext/string.rb +24 -0
  80. data/lib/spark/helper.rb +10 -0
  81. data/lib/spark/helper/logger.rb +40 -0
  82. data/lib/spark/helper/parser.rb +85 -0
  83. data/lib/spark/helper/serialize.rb +71 -0
  84. data/lib/spark/helper/statistic.rb +93 -0
  85. data/lib/spark/helper/system.rb +42 -0
  86. data/lib/spark/java_bridge.rb +19 -0
  87. data/lib/spark/java_bridge/base.rb +203 -0
  88. data/lib/spark/java_bridge/jruby.rb +23 -0
  89. data/lib/spark/java_bridge/rjb.rb +41 -0
  90. data/lib/spark/logger.rb +76 -0
  91. data/lib/spark/mllib.rb +100 -0
  92. data/lib/spark/mllib/classification/common.rb +31 -0
  93. data/lib/spark/mllib/classification/logistic_regression.rb +223 -0
  94. data/lib/spark/mllib/classification/naive_bayes.rb +97 -0
  95. data/lib/spark/mllib/classification/svm.rb +135 -0
  96. data/lib/spark/mllib/clustering/gaussian_mixture.rb +82 -0
  97. data/lib/spark/mllib/clustering/kmeans.rb +118 -0
  98. data/lib/spark/mllib/matrix.rb +120 -0
  99. data/lib/spark/mllib/regression/common.rb +73 -0
  100. data/lib/spark/mllib/regression/labeled_point.rb +41 -0
  101. data/lib/spark/mllib/regression/lasso.rb +100 -0
  102. data/lib/spark/mllib/regression/linear.rb +124 -0
  103. data/lib/spark/mllib/regression/ridge.rb +97 -0
  104. data/lib/spark/mllib/ruby_matrix/matrix_adapter.rb +53 -0
  105. data/lib/spark/mllib/ruby_matrix/vector_adapter.rb +57 -0
  106. data/lib/spark/mllib/stat/distribution.rb +12 -0
  107. data/lib/spark/mllib/vector.rb +185 -0
  108. data/lib/spark/rdd.rb +1377 -0
  109. data/lib/spark/sampler.rb +92 -0
  110. data/lib/spark/serializer.rb +79 -0
  111. data/lib/spark/serializer/auto_batched.rb +59 -0
  112. data/lib/spark/serializer/base.rb +63 -0
  113. data/lib/spark/serializer/batched.rb +84 -0
  114. data/lib/spark/serializer/cartesian.rb +13 -0
  115. data/lib/spark/serializer/compressed.rb +27 -0
  116. data/lib/spark/serializer/marshal.rb +17 -0
  117. data/lib/spark/serializer/message_pack.rb +23 -0
  118. data/lib/spark/serializer/oj.rb +23 -0
  119. data/lib/spark/serializer/pair.rb +41 -0
  120. data/lib/spark/serializer/text.rb +25 -0
  121. data/lib/spark/sort.rb +189 -0
  122. data/lib/spark/stat_counter.rb +125 -0
  123. data/lib/spark/storage_level.rb +39 -0
  124. data/lib/spark/version.rb +3 -0
  125. data/lib/spark/worker/master.rb +144 -0
  126. data/lib/spark/worker/spark_files.rb +15 -0
  127. data/lib/spark/worker/worker.rb +200 -0
  128. data/ruby-spark.gemspec +47 -0
  129. data/spec/generator.rb +37 -0
  130. data/spec/inputs/lorem_300.txt +316 -0
  131. data/spec/inputs/numbers/1.txt +50 -0
  132. data/spec/inputs/numbers/10.txt +50 -0
  133. data/spec/inputs/numbers/11.txt +50 -0
  134. data/spec/inputs/numbers/12.txt +50 -0
  135. data/spec/inputs/numbers/13.txt +50 -0
  136. data/spec/inputs/numbers/14.txt +50 -0
  137. data/spec/inputs/numbers/15.txt +50 -0
  138. data/spec/inputs/numbers/16.txt +50 -0
  139. data/spec/inputs/numbers/17.txt +50 -0
  140. data/spec/inputs/numbers/18.txt +50 -0
  141. data/spec/inputs/numbers/19.txt +50 -0
  142. data/spec/inputs/numbers/2.txt +50 -0
  143. data/spec/inputs/numbers/20.txt +50 -0
  144. data/spec/inputs/numbers/3.txt +50 -0
  145. data/spec/inputs/numbers/4.txt +50 -0
  146. data/spec/inputs/numbers/5.txt +50 -0
  147. data/spec/inputs/numbers/6.txt +50 -0
  148. data/spec/inputs/numbers/7.txt +50 -0
  149. data/spec/inputs/numbers/8.txt +50 -0
  150. data/spec/inputs/numbers/9.txt +50 -0
  151. data/spec/inputs/numbers_0_100.txt +101 -0
  152. data/spec/inputs/numbers_1_100.txt +100 -0
  153. data/spec/lib/collect_spec.rb +42 -0
  154. data/spec/lib/command_spec.rb +68 -0
  155. data/spec/lib/config_spec.rb +64 -0
  156. data/spec/lib/context_spec.rb +165 -0
  157. data/spec/lib/ext_spec.rb +72 -0
  158. data/spec/lib/external_apps_spec.rb +45 -0
  159. data/spec/lib/filter_spec.rb +80 -0
  160. data/spec/lib/flat_map_spec.rb +100 -0
  161. data/spec/lib/group_spec.rb +109 -0
  162. data/spec/lib/helper_spec.rb +19 -0
  163. data/spec/lib/key_spec.rb +41 -0
  164. data/spec/lib/manipulation_spec.rb +122 -0
  165. data/spec/lib/map_partitions_spec.rb +87 -0
  166. data/spec/lib/map_spec.rb +91 -0
  167. data/spec/lib/mllib/classification_spec.rb +54 -0
  168. data/spec/lib/mllib/clustering_spec.rb +35 -0
  169. data/spec/lib/mllib/matrix_spec.rb +32 -0
  170. data/spec/lib/mllib/regression_spec.rb +116 -0
  171. data/spec/lib/mllib/vector_spec.rb +77 -0
  172. data/spec/lib/reduce_by_key_spec.rb +118 -0
  173. data/spec/lib/reduce_spec.rb +131 -0
  174. data/spec/lib/sample_spec.rb +46 -0
  175. data/spec/lib/serializer_spec.rb +88 -0
  176. data/spec/lib/sort_spec.rb +58 -0
  177. data/spec/lib/statistic_spec.rb +170 -0
  178. data/spec/lib/whole_text_files_spec.rb +33 -0
  179. data/spec/spec_helper.rb +38 -0
  180. metadata +389 -0
data/spec/lib/whole_text_files_spec.rb ADDED
@@ -0,0 +1,33 @@
1
+ require "spec_helper"
2
+
3
+ RSpec::shared_examples "a whole_text_files" do |workers|
4
+ it "with #{workers || 'default'} worker" do
5
+ rdd2 = rdd(workers).map(get_numbers)
6
+ result = files.size
7
+
8
+ expect(rdd2.collect.size).to eql(result)
9
+
10
+ rdd3 = rdd(workers)
11
+ rdd3 = rdd3.flat_map(get_numbers)
12
+
13
+ result = 0
14
+ files.each{|f| result += File.read(f).split.map(&:to_i).reduce(:+)}
15
+
16
+ expect(rdd3.sum).to eql(result)
17
+ end
18
+ end
19
+
20
+ RSpec::describe "Spark::Context" do
21
+ let(:get_numbers) { lambda{|file, content| content.split.map(&:to_i)} }
22
+
23
+ let(:dir) { File.join("spec", "inputs", "numbers") }
24
+ let(:files) { Dir.glob(File.join(dir, "*")) }
25
+
26
+ def rdd(workers)
27
+ $sc.whole_text_files(dir, workers)
28
+ end
29
+
30
+ it_behaves_like "a whole_text_files", nil
31
+ it_behaves_like "a whole_text_files", 1
32
+ it_behaves_like "a whole_text_files", rand(2..10)
33
+ end
data/spec/spec_helper.rb ADDED
@@ -0,0 +1,38 @@
1
+ # require 'simplecov'
2
+ # SimpleCov.start
3
+
4
+ $LOAD_PATH.unshift File.dirname(__FILE__) + '/../lib'
5
+ require 'ruby-spark'
6
+ require 'generator'
7
+
8
+ # Loading
9
+ Spark.load_lib
10
+ Spark.jb.load_test
11
+ Spark::Mllib.import
12
+
13
+ # Keep this in a method because it's called from the config test
14
+ def spark_start
15
+ Spark.logger.disable
16
+ Spark.config do
17
+ set 'spark.ruby.serializer.batch_size', 100
18
+ end
19
+ Spark.start
20
+ $sc = Spark.context
21
+ end
22
+
23
+ def windows?
24
+ RbConfig::CONFIG['host_os'] =~ /mswin|mingw/
25
+ end
26
+
27
+ RSpec.configure do |config|
28
+ config.default_formatter = 'doc'
29
+ config.color = true
30
+ config.tty = true
31
+
32
+ config.before(:suite) do
33
+ spark_start
34
+ end
35
+ config.after(:suite) do
36
+ Spark.stop
37
+ end
38
+ end
metadata ADDED
@@ -0,0 +1,389 @@
1
+ --- !ruby/object:Gem::Specification
2
+ name: ruby-spark
3
+ version: !ruby/object:Gem::Version
4
+ version: 1.1.0.1
5
+ platform: java
6
+ authors:
7
+ - Ondřej Moravčík
8
+ autorequire:
9
+ bindir: bin
10
+ cert_chain: []
11
+ date: 2015-05-16 00:00:00.000000000 Z
12
+ dependencies:
13
+ - !ruby/object:Gem::Dependency
14
+ name: sourcify
15
+ version_requirements: !ruby/object:Gem::Requirement
16
+ requirements:
17
+ - - '='
18
+ - !ruby/object:Gem::Version
19
+ version: 0.6.0.rc4
20
+ requirement: !ruby/object:Gem::Requirement
21
+ requirements:
22
+ - - '='
23
+ - !ruby/object:Gem::Version
24
+ version: 0.6.0.rc4
25
+ prerelease: false
26
+ type: :runtime
27
+ - !ruby/object:Gem::Dependency
28
+ name: method_source
29
+ version_requirements: !ruby/object:Gem::Requirement
30
+ requirements:
31
+ - - ">="
32
+ - !ruby/object:Gem::Version
33
+ version: '0'
34
+ requirement: !ruby/object:Gem::Requirement
35
+ requirements:
36
+ - - ">="
37
+ - !ruby/object:Gem::Version
38
+ version: '0'
39
+ prerelease: false
40
+ type: :runtime
41
+ - !ruby/object:Gem::Dependency
42
+ name: commander
43
+ version_requirements: !ruby/object:Gem::Requirement
44
+ requirements:
45
+ - - ">="
46
+ - !ruby/object:Gem::Version
47
+ version: '0'
48
+ requirement: !ruby/object:Gem::Requirement
49
+ requirements:
50
+ - - ">="
51
+ - !ruby/object:Gem::Version
52
+ version: '0'
53
+ prerelease: false
54
+ type: :runtime
55
+ - !ruby/object:Gem::Dependency
56
+ name: pry
57
+ version_requirements: !ruby/object:Gem::Requirement
58
+ requirements:
59
+ - - ">="
60
+ - !ruby/object:Gem::Version
61
+ version: '0'
62
+ requirement: !ruby/object:Gem::Requirement
63
+ requirements:
64
+ - - ">="
65
+ - !ruby/object:Gem::Version
66
+ version: '0'
67
+ prerelease: false
68
+ type: :runtime
69
+ - !ruby/object:Gem::Dependency
70
+ name: nio4r
71
+ version_requirements: !ruby/object:Gem::Requirement
72
+ requirements:
73
+ - - ">="
74
+ - !ruby/object:Gem::Version
75
+ version: '0'
76
+ requirement: !ruby/object:Gem::Requirement
77
+ requirements:
78
+ - - ">="
79
+ - !ruby/object:Gem::Version
80
+ version: '0'
81
+ prerelease: false
82
+ type: :runtime
83
+ - !ruby/object:Gem::Dependency
84
+ name: distribution
85
+ version_requirements: !ruby/object:Gem::Requirement
86
+ requirements:
87
+ - - ">="
88
+ - !ruby/object:Gem::Version
89
+ version: '0'
90
+ requirement: !ruby/object:Gem::Requirement
91
+ requirements:
92
+ - - ">="
93
+ - !ruby/object:Gem::Version
94
+ version: '0'
95
+ prerelease: false
96
+ type: :runtime
97
+ - !ruby/object:Gem::Dependency
98
+ name: bundler
99
+ version_requirements: !ruby/object:Gem::Requirement
100
+ requirements:
101
+ - - "~>"
102
+ - !ruby/object:Gem::Version
103
+ version: '1.6'
104
+ requirement: !ruby/object:Gem::Requirement
105
+ requirements:
106
+ - - "~>"
107
+ - !ruby/object:Gem::Version
108
+ version: '1.6'
109
+ prerelease: false
110
+ type: :development
111
+ - !ruby/object:Gem::Dependency
112
+ name: rake
113
+ version_requirements: !ruby/object:Gem::Requirement
114
+ requirements:
115
+ - - ">="
116
+ - !ruby/object:Gem::Version
117
+ version: '0'
118
+ requirement: !ruby/object:Gem::Requirement
119
+ requirements:
120
+ - - ">="
121
+ - !ruby/object:Gem::Version
122
+ version: '0'
123
+ prerelease: false
124
+ type: :development
125
+ description: ''
126
+ email:
127
+ - moravcik.ondrej@gmail.com
128
+ executables:
129
+ - ruby-spark
130
+ extensions:
131
+ - ext/ruby_java/extconf.rb
132
+ extra_rdoc_files: []
133
+ files:
134
+ - ".gitignore"
135
+ - Gemfile
136
+ - Guardfile
137
+ - LICENSE.txt
138
+ - README.md
139
+ - Rakefile
140
+ - TODO.md
141
+ - benchmark/aggregate.rb
142
+ - benchmark/bisect.rb
143
+ - benchmark/comparison/prepare.sh
144
+ - benchmark/comparison/python.py
145
+ - benchmark/comparison/r.r
146
+ - benchmark/comparison/ruby.rb
147
+ - benchmark/comparison/run-all.sh
148
+ - benchmark/comparison/scala.scala
149
+ - benchmark/custom_marshal.rb
150
+ - benchmark/digest.rb
151
+ - benchmark/enumerator.rb
152
+ - benchmark/serializer.rb
153
+ - benchmark/sort.rb
154
+ - benchmark/sort2.rb
155
+ - benchmark/take.rb
156
+ - bin/ruby-spark
157
+ - example/pi.rb
158
+ - example/website_search.rb
159
+ - ext/ruby_c/extconf.rb
160
+ - ext/ruby_c/murmur.c
161
+ - ext/ruby_c/murmur.h
162
+ - ext/ruby_c/ruby-spark.c
163
+ - ext/ruby_java/Digest.java
164
+ - ext/ruby_java/Murmur2.java
165
+ - ext/ruby_java/RubySparkExtService.java
166
+ - ext/ruby_java/extconf.rb
167
+ - ext/spark/build.sbt
168
+ - ext/spark/project/plugins.sbt
169
+ - ext/spark/sbt/sbt
170
+ - ext/spark/src/main/scala/Exec.scala
171
+ - ext/spark/src/main/scala/MLLibAPI.scala
172
+ - ext/spark/src/main/scala/Marshal.scala
173
+ - ext/spark/src/main/scala/MarshalDump.scala
174
+ - ext/spark/src/main/scala/MarshalLoad.scala
175
+ - ext/spark/src/main/scala/RubyAccumulatorParam.scala
176
+ - ext/spark/src/main/scala/RubyBroadcast.scala
177
+ - ext/spark/src/main/scala/RubyConstant.scala
178
+ - ext/spark/src/main/scala/RubyMLLibAPI.scala
179
+ - ext/spark/src/main/scala/RubyMLLibUtilAPI.scala
180
+ - ext/spark/src/main/scala/RubyPage.scala
181
+ - ext/spark/src/main/scala/RubyRDD.scala
182
+ - ext/spark/src/main/scala/RubySerializer.scala
183
+ - ext/spark/src/main/scala/RubyTab.scala
184
+ - ext/spark/src/main/scala/RubyUtils.scala
185
+ - ext/spark/src/main/scala/RubyWorker.scala
186
+ - ext/spark/src/test/scala/MarshalSpec.scala
187
+ - lib/ruby-spark.rb
188
+ - lib/spark.rb
189
+ - lib/spark/accumulator.rb
190
+ - lib/spark/broadcast.rb
191
+ - lib/spark/build.rb
192
+ - lib/spark/cli.rb
193
+ - lib/spark/command.rb
194
+ - lib/spark/command/base.rb
195
+ - lib/spark/command/basic.rb
196
+ - lib/spark/command/pair.rb
197
+ - lib/spark/command/sort.rb
198
+ - lib/spark/command/statistic.rb
199
+ - lib/spark/command_builder.rb
200
+ - lib/spark/command_validator.rb
201
+ - lib/spark/config.rb
202
+ - lib/spark/constant.rb
203
+ - lib/spark/context.rb
204
+ - lib/spark/error.rb
205
+ - lib/spark/ext/hash.rb
206
+ - lib/spark/ext/integer.rb
207
+ - lib/spark/ext/io.rb
208
+ - lib/spark/ext/ip_socket.rb
209
+ - lib/spark/ext/module.rb
210
+ - lib/spark/ext/object.rb
211
+ - lib/spark/ext/string.rb
212
+ - lib/spark/helper.rb
213
+ - lib/spark/helper/logger.rb
214
+ - lib/spark/helper/parser.rb
215
+ - lib/spark/helper/serialize.rb
216
+ - lib/spark/helper/statistic.rb
217
+ - lib/spark/helper/system.rb
218
+ - lib/spark/java_bridge.rb
219
+ - lib/spark/java_bridge/base.rb
220
+ - lib/spark/java_bridge/jruby.rb
221
+ - lib/spark/java_bridge/rjb.rb
222
+ - lib/spark/logger.rb
223
+ - lib/spark/mllib.rb
224
+ - lib/spark/mllib/classification/common.rb
225
+ - lib/spark/mllib/classification/logistic_regression.rb
226
+ - lib/spark/mllib/classification/naive_bayes.rb
227
+ - lib/spark/mllib/classification/svm.rb
228
+ - lib/spark/mllib/clustering/gaussian_mixture.rb
229
+ - lib/spark/mllib/clustering/kmeans.rb
230
+ - lib/spark/mllib/matrix.rb
231
+ - lib/spark/mllib/regression/common.rb
232
+ - lib/spark/mllib/regression/labeled_point.rb
233
+ - lib/spark/mllib/regression/lasso.rb
234
+ - lib/spark/mllib/regression/linear.rb
235
+ - lib/spark/mllib/regression/ridge.rb
236
+ - lib/spark/mllib/ruby_matrix/matrix_adapter.rb
237
+ - lib/spark/mllib/ruby_matrix/vector_adapter.rb
238
+ - lib/spark/mllib/stat/distribution.rb
239
+ - lib/spark/mllib/vector.rb
240
+ - lib/spark/rdd.rb
241
+ - lib/spark/sampler.rb
242
+ - lib/spark/serializer.rb
243
+ - lib/spark/serializer/auto_batched.rb
244
+ - lib/spark/serializer/base.rb
245
+ - lib/spark/serializer/batched.rb
246
+ - lib/spark/serializer/cartesian.rb
247
+ - lib/spark/serializer/compressed.rb
248
+ - lib/spark/serializer/marshal.rb
249
+ - lib/spark/serializer/message_pack.rb
250
+ - lib/spark/serializer/oj.rb
251
+ - lib/spark/serializer/pair.rb
252
+ - lib/spark/serializer/text.rb
253
+ - lib/spark/sort.rb
254
+ - lib/spark/stat_counter.rb
255
+ - lib/spark/storage_level.rb
256
+ - lib/spark/version.rb
257
+ - lib/spark/worker/master.rb
258
+ - lib/spark/worker/spark_files.rb
259
+ - lib/spark/worker/worker.rb
260
+ - ruby-spark.gemspec
261
+ - spec/generator.rb
262
+ - spec/inputs/lorem_300.txt
263
+ - spec/inputs/numbers/1.txt
264
+ - spec/inputs/numbers/10.txt
265
+ - spec/inputs/numbers/11.txt
266
+ - spec/inputs/numbers/12.txt
267
+ - spec/inputs/numbers/13.txt
268
+ - spec/inputs/numbers/14.txt
269
+ - spec/inputs/numbers/15.txt
270
+ - spec/inputs/numbers/16.txt
271
+ - spec/inputs/numbers/17.txt
272
+ - spec/inputs/numbers/18.txt
273
+ - spec/inputs/numbers/19.txt
274
+ - spec/inputs/numbers/2.txt
275
+ - spec/inputs/numbers/20.txt
276
+ - spec/inputs/numbers/3.txt
277
+ - spec/inputs/numbers/4.txt
278
+ - spec/inputs/numbers/5.txt
279
+ - spec/inputs/numbers/6.txt
280
+ - spec/inputs/numbers/7.txt
281
+ - spec/inputs/numbers/8.txt
282
+ - spec/inputs/numbers/9.txt
283
+ - spec/inputs/numbers_0_100.txt
284
+ - spec/inputs/numbers_1_100.txt
285
+ - spec/lib/collect_spec.rb
286
+ - spec/lib/command_spec.rb
287
+ - spec/lib/config_spec.rb
288
+ - spec/lib/context_spec.rb
289
+ - spec/lib/ext_spec.rb
290
+ - spec/lib/external_apps_spec.rb
291
+ - spec/lib/filter_spec.rb
292
+ - spec/lib/flat_map_spec.rb
293
+ - spec/lib/group_spec.rb
294
+ - spec/lib/helper_spec.rb
295
+ - spec/lib/key_spec.rb
296
+ - spec/lib/manipulation_spec.rb
297
+ - spec/lib/map_partitions_spec.rb
298
+ - spec/lib/map_spec.rb
299
+ - spec/lib/mllib/classification_spec.rb
300
+ - spec/lib/mllib/clustering_spec.rb
301
+ - spec/lib/mllib/matrix_spec.rb
302
+ - spec/lib/mllib/regression_spec.rb
303
+ - spec/lib/mllib/vector_spec.rb
304
+ - spec/lib/reduce_by_key_spec.rb
305
+ - spec/lib/reduce_spec.rb
306
+ - spec/lib/sample_spec.rb
307
+ - spec/lib/serializer_spec.rb
308
+ - spec/lib/sort_spec.rb
309
+ - spec/lib/statistic_spec.rb
310
+ - spec/lib/whole_text_files_spec.rb
311
+ - spec/spec_helper.rb
312
+ homepage: ''
313
+ licenses:
314
+ - MIT
315
+ metadata: {}
316
+ post_install_message:
317
+ rdoc_options: []
318
+ require_paths:
319
+ - lib
320
+ required_ruby_version: !ruby/object:Gem::Requirement
321
+ requirements:
322
+ - - ">="
323
+ - !ruby/object:Gem::Version
324
+ version: '2.0'
325
+ required_rubygems_version: !ruby/object:Gem::Requirement
326
+ requirements:
327
+ - - ">="
328
+ - !ruby/object:Gem::Version
329
+ version: '0'
330
+ requirements:
331
+ - java, scala
332
+ rubyforge_project:
333
+ rubygems_version: 2.4.5
334
+ signing_key:
335
+ specification_version: 4
336
+ summary: Ruby wrapper for Apache Spark
337
+ test_files:
338
+ - spec/generator.rb
339
+ - spec/inputs/lorem_300.txt
340
+ - spec/inputs/numbers/1.txt
341
+ - spec/inputs/numbers/10.txt
342
+ - spec/inputs/numbers/11.txt
343
+ - spec/inputs/numbers/12.txt
344
+ - spec/inputs/numbers/13.txt
345
+ - spec/inputs/numbers/14.txt
346
+ - spec/inputs/numbers/15.txt
347
+ - spec/inputs/numbers/16.txt
348
+ - spec/inputs/numbers/17.txt
349
+ - spec/inputs/numbers/18.txt
350
+ - spec/inputs/numbers/19.txt
351
+ - spec/inputs/numbers/2.txt
352
+ - spec/inputs/numbers/20.txt
353
+ - spec/inputs/numbers/3.txt
354
+ - spec/inputs/numbers/4.txt
355
+ - spec/inputs/numbers/5.txt
356
+ - spec/inputs/numbers/6.txt
357
+ - spec/inputs/numbers/7.txt
358
+ - spec/inputs/numbers/8.txt
359
+ - spec/inputs/numbers/9.txt
360
+ - spec/inputs/numbers_0_100.txt
361
+ - spec/inputs/numbers_1_100.txt
362
+ - spec/lib/collect_spec.rb
363
+ - spec/lib/command_spec.rb
364
+ - spec/lib/config_spec.rb
365
+ - spec/lib/context_spec.rb
366
+ - spec/lib/ext_spec.rb
367
+ - spec/lib/external_apps_spec.rb
368
+ - spec/lib/filter_spec.rb
369
+ - spec/lib/flat_map_spec.rb
370
+ - spec/lib/group_spec.rb
371
+ - spec/lib/helper_spec.rb
372
+ - spec/lib/key_spec.rb
373
+ - spec/lib/manipulation_spec.rb
374
+ - spec/lib/map_partitions_spec.rb
375
+ - spec/lib/map_spec.rb
376
+ - spec/lib/mllib/classification_spec.rb
377
+ - spec/lib/mllib/clustering_spec.rb
378
+ - spec/lib/mllib/matrix_spec.rb
379
+ - spec/lib/mllib/regression_spec.rb
380
+ - spec/lib/mllib/vector_spec.rb
381
+ - spec/lib/reduce_by_key_spec.rb
382
+ - spec/lib/reduce_spec.rb
383
+ - spec/lib/sample_spec.rb
384
+ - spec/lib/serializer_spec.rb
385
+ - spec/lib/sort_spec.rb
386
+ - spec/lib/statistic_spec.rb
387
+ - spec/lib/whole_text_files_spec.rb
388
+ - spec/spec_helper.rb
389
+ has_rdoc: