rp-emr 1.0.3

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -0,0 +1,23 @@
1
+ require 'spec_helper'
2
+
3
+ describe RP::EMR::Instances do
4
+ describe "#to_hash" do
5
+ let(:instances_args) { {} }
6
+
7
+ let(:instances) do
8
+ RP::EMR::Instances.new(instances_args)
9
+ end
10
+
11
+ it "returns a hash" do
12
+ expect(instances.to_hash).to eq({})
13
+ end
14
+
15
+ context "with stuff specified" do
16
+ let(:instances_args) { {master_instance_type: 'master_instance_type'} }
17
+
18
+ it "adds stuff to hash" do
19
+ expect(instances.to_hash).to eq(master_instance_type: 'master_instance_type')
20
+ end
21
+ end
22
+ end
23
+ end
@@ -0,0 +1,31 @@
1
+ require 'spec_helper'
2
+
3
+ describe RP::EMR::Job do
4
+ describe "#to_hash" do
5
+ let(:instances_args) { {} }
6
+
7
+ let(:instances) do
8
+ RP::EMR::Instances.new(instances_args)
9
+ end
10
+
11
+ let(:job_args) { {} }
12
+
13
+ let(:job) do
14
+ RP::EMR::Job.new(job_args) do |j|
15
+ j.instances = instances.to_hash
16
+ end
17
+ end
18
+
19
+ it "returns a hash" do
20
+ expect(job.to_hash).to eq(ami_version: 'latest', visible_to_all_users: true)
21
+ end
22
+
23
+ context "with stuff specified" do
24
+ let(:job_args) { {ami_version: 'ami_version'} }
25
+
26
+ it "adds stuff to hash" do
27
+ expect(job.to_hash[:ami_version]).to eq('ami_version')
28
+ end
29
+ end
30
+ end
31
+ end
@@ -0,0 +1,136 @@
1
+ require 'spec_helper'
2
+
3
+ describe RP::EMR::Step::Pig do
4
+ describe "#to_hash" do
5
+ let(:written) { [] }
6
+
7
+ before(:each) do
8
+ allow_any_instance_of(AWS::S3::S3Object).to receive(:write) do |data|
9
+ written << data
10
+ end
11
+ end
12
+
13
+ after(:each) do
14
+ script.delete
15
+ end
16
+
17
+ let(:script_contents) { 'script_contents' }
18
+
19
+ let(:script) do
20
+ script = Tempfile.new('pig_step_test')
21
+ script.write(script_contents)
22
+ script.close
23
+ script
24
+ end
25
+
26
+ let(:expected_script_path) do
27
+ hash = Digest::MD5.hexdigest(script_contents)
28
+ "scripts/emr_gem/#{File.basename(script.path, '.pig')}_#{hash}.pig"
29
+ end
30
+
31
+ let(:step_args) { {} }
32
+
33
+ let(:step) do
34
+ RP::EMR::Step::Pig.new(step_args) do |s|
35
+ s.name = 'step_name'
36
+ s.script_path = script.path
37
+ s.script_bucket = 'script_bucket'
38
+ end
39
+ end
40
+
41
+ it "writes script to expected path" do
42
+ expect_any_instance_of(AWS::S3::ObjectCollection).to receive(:[]).with(expected_script_path).and_call_original
43
+
44
+ step.to_hash
45
+ end
46
+
47
+ it "uploads pig script contents" do
48
+ pending "Strange behavior with test setup?"
49
+ step.to_hash
50
+
51
+ expect(written).to eq(['script_contents'])
52
+ end
53
+
54
+ it "returns hash" do
55
+ expect(step.to_hash).to eq(
56
+ :name=>"step_name",
57
+ :hadoop_jar_step=>{
58
+ :jar=>"s3://us-east-1.elasticmapreduce/libs/script-runner/script-runner.jar",
59
+ :args=>[
60
+ "s3://us-east-1.elasticmapreduce/libs/pig/pig-script",
61
+ "--base-path", "s3://us-east-1.elasticmapreduce/libs/pig/",
62
+ "--pig-versions", "0.11.1.1",
63
+ "--run-pig-script",
64
+ "--args",
65
+ "-f", "s3://script_bucket/#{expected_script_path}",
66
+ ]
67
+ }
68
+ )
69
+ end
70
+
71
+ context "with args" do
72
+ let(:step_args) { {args: ['foo', 'bar']} }
73
+
74
+ it "adds to the args array" do
75
+ expect(step.to_hash[:hadoop_jar_step][:args]).to eq([
76
+ "s3://us-east-1.elasticmapreduce/libs/pig/pig-script",
77
+ "--base-path", "s3://us-east-1.elasticmapreduce/libs/pig/",
78
+ "--pig-versions", "0.11.1.1",
79
+ "--run-pig-script",
80
+ "foo", "bar",
81
+ "--args",
82
+ "-f", "s3://script_bucket/#{expected_script_path}",
83
+ ])
84
+ end
85
+ end
86
+
87
+ context "with pig_params" do
88
+ let(:step_args) { {pig_params: {foo: 'bar'}} }
89
+
90
+ it "adds to the args array" do
91
+ expect(step.to_hash[:hadoop_jar_step][:args]).to eq([
92
+ "s3://us-east-1.elasticmapreduce/libs/pig/pig-script",
93
+ "--base-path", "s3://us-east-1.elasticmapreduce/libs/pig/",
94
+ "--pig-versions", "0.11.1.1",
95
+ "--run-pig-script",
96
+ "--args",
97
+ "-f", "s3://script_bucket/#{expected_script_path}",
98
+ "-p", "foo=bar",
99
+ ])
100
+ end
101
+ end
102
+
103
+ context "with pig_version" do
104
+ let(:step_args) { {pig_version: 'pig_version'} }
105
+
106
+ it "adds to the args array" do
107
+ expect(step.to_hash[:hadoop_jar_step][:args]).to eq([
108
+ "s3://us-east-1.elasticmapreduce/libs/pig/pig-script",
109
+ "--base-path", "s3://us-east-1.elasticmapreduce/libs/pig/",
110
+ "--pig-versions", "pig_version",
111
+ "--run-pig-script",
112
+ "--args",
113
+ "-f", "s3://script_bucket/#{expected_script_path}",
114
+ ])
115
+ end
116
+ end
117
+
118
+ context "with action_on_failure" do
119
+ let(:step_args) { {action_on_failure: 'action_on_failure'} }
120
+
121
+ it "sets the step action on failure" do
122
+ expect(step.to_hash[:action_on_failure]).to eq('action_on_failure')
123
+ end
124
+ end
125
+
126
+ context "with dry_run" do
127
+ let(:step_args) { {dry_run: true} }
128
+
129
+ it "doesn't upload pig script" do
130
+ step.to_hash
131
+
132
+ expect(written).to eq([])
133
+ end
134
+ end
135
+ end
136
+ end
@@ -0,0 +1,83 @@
1
+ require 'spec_helper'
2
+
3
+ describe RP::EMR::Step::S3DistCp do
4
+ describe "#to_hash" do
5
+ let(:step_args) { {} }
6
+
7
+ let(:step) do
8
+ RP::EMR::Step::S3DistCp.new(step_args)
9
+ end
10
+
11
+ it "returns hash" do
12
+ expect(step.to_hash).to eq(
13
+ :name=>"S3DistCp",
14
+ :hadoop_jar_step=>{
15
+ :jar=>"/home/hadoop/lib/emr-s3distcp-1.0.jar",
16
+ :args=>[]
17
+ }
18
+ )
19
+ end
20
+
21
+ context "with hash args" do
22
+ let(:step_args) do
23
+ {
24
+ src: 'src',
25
+ dest: 'dest',
26
+ groupBy: '.*',
27
+ outputCodec: nil,
28
+ }
29
+ end
30
+
31
+ it "returns hash" do
32
+ expect(step.to_hash[:hadoop_jar_step][:args]).to eq([
33
+ '--src', 'src',
34
+ '--dest', 'dest',
35
+ '--groupBy', '.*',
36
+ ])
37
+ end
38
+ end
39
+
40
+ context "with numeric hash args" do
41
+ let(:step_args) do
42
+ {targetSize: 100}
43
+ end
44
+
45
+ it "converts to strings" do
46
+ expect(step.to_hash[:hadoop_jar_step][:args]).to eq([
47
+ '--targetSize', '100',
48
+ ])
49
+ end
50
+ end
51
+
52
+ context "with boolean args" do
53
+ let(:step_args) do
54
+ {
55
+ deleteOnSuccess: true,
56
+ numberFiles: false,
57
+ }
58
+ end
59
+
60
+ it "returns hash" do
61
+ expect(step.to_hash[:hadoop_jar_step][:args]).to eq([
62
+ '--deleteOnSuccess',
63
+ ])
64
+ end
65
+ end
66
+
67
+ context "with action_on_failure" do
68
+ let(:step_args) { {action_on_failure: 'action_on_failure'} }
69
+
70
+ it "sets the step action on failure" do
71
+ expect(step.to_hash[:action_on_failure]).to eq('action_on_failure')
72
+ end
73
+ end
74
+
75
+ context "with name" do
76
+ let(:step_args) { {name: 'name'} }
77
+
78
+ it "sets the step name" do
79
+ expect(step.to_hash[:name]).to eq('name')
80
+ end
81
+ end
82
+ end
83
+ end
@@ -0,0 +1,29 @@
1
+ require 'spec_helper'
2
+
3
+ describe RP::EMR::Step::SetupDebugging do
4
+ describe "#to_hash" do
5
+ let(:step_args) { {} }
6
+
7
+ let(:step) do
8
+ RP::EMR::Step::SetupDebugging.new(step_args)
9
+ end
10
+
11
+ it "returns hash" do
12
+ expect(step.to_hash).to eq(
13
+ :name=>"Setup Hadoop Debugging",
14
+ :hadoop_jar_step=>{
15
+ :jar=>"s3://us-east-1.elasticmapreduce/libs/script-runner/script-runner.jar",
16
+ :args=>["s3://us-east-1.elasticmapreduce/libs/state-pusher/0.1/fetch"]
17
+ }
18
+ )
19
+ end
20
+
21
+ context "with action_on_failure" do
22
+ let(:step_args) { {action_on_failure: 'action_on_failure'} }
23
+
24
+ it "sets the step action on failure" do
25
+ expect(step.to_hash[:action_on_failure]).to eq('action_on_failure')
26
+ end
27
+ end
28
+ end
29
+ end
@@ -0,0 +1,47 @@
1
+ require 'spec_helper'
2
+
3
+ describe RP::EMR::Step::SetupPig do
4
+ describe "#to_hash" do
5
+ let(:step_args) { {} }
6
+
7
+ let(:step) do
8
+ RP::EMR::Step::SetupPig.new(step_args)
9
+ end
10
+
11
+ it "returns hash" do
12
+ expect(step.to_hash).to eq(
13
+ :name=>"Setup Pig",
14
+ :hadoop_jar_step=>{
15
+ :jar=>"s3://us-east-1.elasticmapreduce/libs/script-runner/script-runner.jar",
16
+ :args=>[
17
+ "s3://us-east-1.elasticmapreduce/libs/pig/pig-script",
18
+ "--base-path", "s3://us-east-1.elasticmapreduce/libs/pig/",
19
+ "--install-pig",
20
+ "--pig-versions", "0.11.1.1"
21
+ ]
22
+ }
23
+ )
24
+ end
25
+
26
+ context "with pig_version" do
27
+ let(:step_args) { {pig_version: 'pig_version'} }
28
+
29
+ it "sets the pig version" do
30
+ expect(step.to_hash[:hadoop_jar_step][:args]).to eq([
31
+ "s3://us-east-1.elasticmapreduce/libs/pig/pig-script",
32
+ "--base-path", "s3://us-east-1.elasticmapreduce/libs/pig/",
33
+ "--install-pig",
34
+ "--pig-versions", "pig_version"
35
+ ])
36
+ end
37
+ end
38
+
39
+ context "with action_on_failure" do
40
+ let(:step_args) { {action_on_failure: 'action_on_failure'} }
41
+
42
+ it "sets the step action on failure" do
43
+ expect(step.to_hash[:action_on_failure]).to eq('action_on_failure')
44
+ end
45
+ end
46
+ end
47
+ end
@@ -0,0 +1,33 @@
1
+ require 'spec_helper'
2
+
3
+ describe RP::EMR::Step do
4
+ describe "#to_hash" do
5
+ let(:step_args) { {} }
6
+
7
+ let(:step) do
8
+ RP::EMR::Step.new(step_args) do |s|
9
+ s.name = 'name'
10
+ end
11
+ end
12
+
13
+ it "returns a hash" do
14
+ expect(step.to_hash).to eq(name: 'name')
15
+ end
16
+
17
+ context "with action_on_failure" do
18
+ let(:step_args) { {action_on_failure: 'action_on_failure'} }
19
+
20
+ it "sets action on failure" do
21
+ expect(step.to_hash[:action_on_failure]).to eq('action_on_failure')
22
+ end
23
+ end
24
+
25
+ context "with hadoop_jar_step" do
26
+ let(:step_args) { {hadoop_jar_step: 'hadoop_jar_step'} }
27
+
28
+ it "sets hadoop jar step" do
29
+ expect(step.to_hash[:hadoop_jar_step]).to eq('hadoop_jar_step')
30
+ end
31
+ end
32
+ end
33
+ end
@@ -0,0 +1,5 @@
1
+ require 'spec_helper'
2
+
3
+ describe RP::EMR do
4
+ end
5
+
@@ -0,0 +1,10 @@
1
+ require 'rubygems'
2
+ require 'rspec'
3
+ require 'pry'
4
+
5
+ require 'rp/emr'
6
+
7
+ RSpec.configure do |config|
8
+ config.order = "random"
9
+ end
10
+
metadata ADDED
@@ -0,0 +1,221 @@
1
+ --- !ruby/object:Gem::Specification
2
+ name: rp-emr
3
+ version: !ruby/object:Gem::Version
4
+ version: 1.0.3
5
+ platform: ruby
6
+ authors:
7
+ - Ryan Michael
8
+ - Andrew Harrison
9
+ autorequire:
10
+ bindir: bin
11
+ cert_chain: []
12
+ date: 2014-09-12 00:00:00.000000000 Z
13
+ dependencies:
14
+ - !ruby/object:Gem::Dependency
15
+ name: activesupport
16
+ requirement: !ruby/object:Gem::Requirement
17
+ requirements:
18
+ - - ">="
19
+ - !ruby/object:Gem::Version
20
+ version: '0'
21
+ type: :runtime
22
+ prerelease: false
23
+ version_requirements: !ruby/object:Gem::Requirement
24
+ requirements:
25
+ - - ">="
26
+ - !ruby/object:Gem::Version
27
+ version: '0'
28
+ - !ruby/object:Gem::Dependency
29
+ name: aws-sdk
30
+ requirement: !ruby/object:Gem::Requirement
31
+ requirements:
32
+ - - ">="
33
+ - !ruby/object:Gem::Version
34
+ version: '0'
35
+ type: :runtime
36
+ prerelease: false
37
+ version_requirements: !ruby/object:Gem::Requirement
38
+ requirements:
39
+ - - ">="
40
+ - !ruby/object:Gem::Version
41
+ version: '0'
42
+ - !ruby/object:Gem::Dependency
43
+ name: assembler
44
+ requirement: !ruby/object:Gem::Requirement
45
+ requirements:
46
+ - - ">="
47
+ - !ruby/object:Gem::Version
48
+ version: '0'
49
+ type: :runtime
50
+ prerelease: false
51
+ version_requirements: !ruby/object:Gem::Requirement
52
+ requirements:
53
+ - - ">="
54
+ - !ruby/object:Gem::Version
55
+ version: '0'
56
+ - !ruby/object:Gem::Dependency
57
+ name: thor
58
+ requirement: !ruby/object:Gem::Requirement
59
+ requirements:
60
+ - - ">="
61
+ - !ruby/object:Gem::Version
62
+ version: '0'
63
+ type: :runtime
64
+ prerelease: false
65
+ version_requirements: !ruby/object:Gem::Requirement
66
+ requirements:
67
+ - - ">="
68
+ - !ruby/object:Gem::Version
69
+ version: '0'
70
+ - !ruby/object:Gem::Dependency
71
+ name: bundler
72
+ requirement: !ruby/object:Gem::Requirement
73
+ requirements:
74
+ - - ">="
75
+ - !ruby/object:Gem::Version
76
+ version: '0'
77
+ type: :development
78
+ prerelease: false
79
+ version_requirements: !ruby/object:Gem::Requirement
80
+ requirements:
81
+ - - ">="
82
+ - !ruby/object:Gem::Version
83
+ version: '0'
84
+ - !ruby/object:Gem::Dependency
85
+ name: rake
86
+ requirement: !ruby/object:Gem::Requirement
87
+ requirements:
88
+ - - ">="
89
+ - !ruby/object:Gem::Version
90
+ version: '0'
91
+ type: :development
92
+ prerelease: false
93
+ version_requirements: !ruby/object:Gem::Requirement
94
+ requirements:
95
+ - - ">="
96
+ - !ruby/object:Gem::Version
97
+ version: '0'
98
+ - !ruby/object:Gem::Dependency
99
+ name: rspec
100
+ requirement: !ruby/object:Gem::Requirement
101
+ requirements:
102
+ - - ">="
103
+ - !ruby/object:Gem::Version
104
+ version: '0'
105
+ type: :development
106
+ prerelease: false
107
+ version_requirements: !ruby/object:Gem::Requirement
108
+ requirements:
109
+ - - ">="
110
+ - !ruby/object:Gem::Version
111
+ version: '0'
112
+ - !ruby/object:Gem::Dependency
113
+ name: pry
114
+ requirement: !ruby/object:Gem::Requirement
115
+ requirements:
116
+ - - ">="
117
+ - !ruby/object:Gem::Version
118
+ version: '0'
119
+ type: :development
120
+ prerelease: false
121
+ version_requirements: !ruby/object:Gem::Requirement
122
+ requirements:
123
+ - - ">="
124
+ - !ruby/object:Gem::Version
125
+ version: '0'
126
+ - !ruby/object:Gem::Dependency
127
+ name: fuubar
128
+ requirement: !ruby/object:Gem::Requirement
129
+ requirements:
130
+ - - ">="
131
+ - !ruby/object:Gem::Version
132
+ version: '0'
133
+ type: :development
134
+ prerelease: false
135
+ version_requirements: !ruby/object:Gem::Requirement
136
+ requirements:
137
+ - - ">="
138
+ - !ruby/object:Gem::Version
139
+ version: '0'
140
+ description: Framework for launching EMR job flows
141
+ email:
142
+ - ryanmichael@otherinbox.com
143
+ - andrew.harrison@returnpath.com
144
+ executables:
145
+ - emr
146
+ extensions: []
147
+ extra_rdoc_files: []
148
+ files:
149
+ - ".gitignore"
150
+ - ".rspec"
151
+ - CHANGELOG.md
152
+ - Gemfile
153
+ - LICENSE.txt
154
+ - README.md
155
+ - Rakefile
156
+ - bin/emr
157
+ - lib/rp/emr.rb
158
+ - lib/rp/emr/bootstrap_action.rb
159
+ - lib/rp/emr/cli.rb
160
+ - lib/rp/emr/instance_group.rb
161
+ - lib/rp/emr/instance_groups.rb
162
+ - lib/rp/emr/instances.rb
163
+ - lib/rp/emr/job.rb
164
+ - lib/rp/emr/step.rb
165
+ - lib/rp/emr/step/pig.rb
166
+ - lib/rp/emr/step/s3_dist_cp.rb
167
+ - lib/rp/emr/step/setup_debugging.rb
168
+ - lib/rp/emr/step/setup_hive.rb
169
+ - lib/rp/emr/step/setup_pig.rb
170
+ - lib/rp/emr/version.rb
171
+ - rp-emr.gemspec
172
+ - spec/rp/emr/bootstrap_action_spec.rb
173
+ - spec/rp/emr/instance_group_spec.rb
174
+ - spec/rp/emr/instance_groups_spec.rb
175
+ - spec/rp/emr/instances_spec.rb
176
+ - spec/rp/emr/job_spec.rb
177
+ - spec/rp/emr/step/pig_spec.rb
178
+ - spec/rp/emr/step/s3_dist_cp_step_spec.rb
179
+ - spec/rp/emr/step/setup_debugging_spec.rb
180
+ - spec/rp/emr/step/setup_pig_spec.rb
181
+ - spec/rp/emr/step_spec.rb
182
+ - spec/rp/emr_spec.rb
183
+ - spec/spec_helper.rb
184
+ homepage: ''
185
+ licenses:
186
+ - MIT
187
+ metadata: {}
188
+ post_install_message:
189
+ rdoc_options: []
190
+ require_paths:
191
+ - lib
192
+ required_ruby_version: !ruby/object:Gem::Requirement
193
+ requirements:
194
+ - - ">="
195
+ - !ruby/object:Gem::Version
196
+ version: '0'
197
+ required_rubygems_version: !ruby/object:Gem::Requirement
198
+ requirements:
199
+ - - ">="
200
+ - !ruby/object:Gem::Version
201
+ version: '0'
202
+ requirements: []
203
+ rubyforge_project:
204
+ rubygems_version: 2.4.1
205
+ signing_key:
206
+ specification_version: 4
207
+ summary: EMR Helpers
208
+ test_files:
209
+ - spec/rp/emr/bootstrap_action_spec.rb
210
+ - spec/rp/emr/instance_group_spec.rb
211
+ - spec/rp/emr/instance_groups_spec.rb
212
+ - spec/rp/emr/instances_spec.rb
213
+ - spec/rp/emr/job_spec.rb
214
+ - spec/rp/emr/step/pig_spec.rb
215
+ - spec/rp/emr/step/s3_dist_cp_step_spec.rb
216
+ - spec/rp/emr/step/setup_debugging_spec.rb
217
+ - spec/rp/emr/step/setup_pig_spec.rb
218
+ - spec/rp/emr/step_spec.rb
219
+ - spec/rp/emr_spec.rb
220
+ - spec/spec_helper.rb
221
+ has_rdoc: