masamune 0.11.0

Sign up to get free protection for your applications and to get access to all the features.
Files changed (185) hide show
  1. checksums.yaml +7 -0
  2. data/LICENSE.txt +21 -0
  3. data/README.md +54 -0
  4. data/Rakefile +15 -0
  5. data/bin/masamune-elastic-mapreduce +4 -0
  6. data/bin/masamune-hive +4 -0
  7. data/bin/masamune-psql +4 -0
  8. data/bin/masamune-shell +4 -0
  9. data/lib/masamune.rb +56 -0
  10. data/lib/masamune/accumulate.rb +60 -0
  11. data/lib/masamune/actions.rb +38 -0
  12. data/lib/masamune/actions/data_flow.rb +131 -0
  13. data/lib/masamune/actions/date_parse.rb +75 -0
  14. data/lib/masamune/actions/elastic_mapreduce.rb +68 -0
  15. data/lib/masamune/actions/execute.rb +52 -0
  16. data/lib/masamune/actions/filesystem.rb +37 -0
  17. data/lib/masamune/actions/hadoop_filesystem.rb +40 -0
  18. data/lib/masamune/actions/hadoop_streaming.rb +41 -0
  19. data/lib/masamune/actions/hive.rb +74 -0
  20. data/lib/masamune/actions/postgres.rb +76 -0
  21. data/lib/masamune/actions/postgres_admin.rb +34 -0
  22. data/lib/masamune/actions/s3cmd.rb +44 -0
  23. data/lib/masamune/actions/transform.rb +89 -0
  24. data/lib/masamune/after_initialize_callbacks.rb +55 -0
  25. data/lib/masamune/cached_filesystem.rb +110 -0
  26. data/lib/masamune/commands.rb +37 -0
  27. data/lib/masamune/commands/elastic_mapreduce.rb +119 -0
  28. data/lib/masamune/commands/hadoop_filesystem.rb +57 -0
  29. data/lib/masamune/commands/hadoop_streaming.rb +116 -0
  30. data/lib/masamune/commands/hive.rb +178 -0
  31. data/lib/masamune/commands/interactive.rb +37 -0
  32. data/lib/masamune/commands/postgres.rb +128 -0
  33. data/lib/masamune/commands/postgres_admin.rb +72 -0
  34. data/lib/masamune/commands/postgres_common.rb +33 -0
  35. data/lib/masamune/commands/retry_with_backoff.rb +60 -0
  36. data/lib/masamune/commands/s3cmd.rb +70 -0
  37. data/lib/masamune/commands/shell.rb +202 -0
  38. data/lib/masamune/configuration.rb +195 -0
  39. data/lib/masamune/data_plan.rb +31 -0
  40. data/lib/masamune/data_plan/builder.rb +66 -0
  41. data/lib/masamune/data_plan/elem.rb +190 -0
  42. data/lib/masamune/data_plan/engine.rb +162 -0
  43. data/lib/masamune/data_plan/rule.rb +292 -0
  44. data/lib/masamune/data_plan/set.rb +176 -0
  45. data/lib/masamune/environment.rb +164 -0
  46. data/lib/masamune/filesystem.rb +567 -0
  47. data/lib/masamune/has_environment.rb +40 -0
  48. data/lib/masamune/helpers.rb +27 -0
  49. data/lib/masamune/helpers/postgres.rb +84 -0
  50. data/lib/masamune/io.rb +33 -0
  51. data/lib/masamune/last_element.rb +53 -0
  52. data/lib/masamune/method_logger.rb +41 -0
  53. data/lib/masamune/multi_io.rb +39 -0
  54. data/lib/masamune/schema.rb +36 -0
  55. data/lib/masamune/schema/catalog.rb +233 -0
  56. data/lib/masamune/schema/column.rb +527 -0
  57. data/lib/masamune/schema/dimension.rb +133 -0
  58. data/lib/masamune/schema/event.rb +121 -0
  59. data/lib/masamune/schema/fact.rb +133 -0
  60. data/lib/masamune/schema/map.rb +265 -0
  61. data/lib/masamune/schema/row.rb +133 -0
  62. data/lib/masamune/schema/store.rb +115 -0
  63. data/lib/masamune/schema/table.rb +308 -0
  64. data/lib/masamune/schema/table_reference.rb +76 -0
  65. data/lib/masamune/spec_helper.rb +23 -0
  66. data/lib/masamune/string_format.rb +34 -0
  67. data/lib/masamune/tasks/elastic_mapreduce_thor.rb +60 -0
  68. data/lib/masamune/tasks/hive_thor.rb +55 -0
  69. data/lib/masamune/tasks/postgres_thor.rb +47 -0
  70. data/lib/masamune/tasks/shell_thor.rb +63 -0
  71. data/lib/masamune/template.rb +77 -0
  72. data/lib/masamune/thor.rb +186 -0
  73. data/lib/masamune/thor_loader.rb +38 -0
  74. data/lib/masamune/topological_hash.rb +34 -0
  75. data/lib/masamune/transform.rb +47 -0
  76. data/lib/masamune/transform/bulk_upsert.psql.erb +64 -0
  77. data/lib/masamune/transform/bulk_upsert.rb +52 -0
  78. data/lib/masamune/transform/consolidate_dimension.rb +54 -0
  79. data/lib/masamune/transform/deduplicate_dimension.psql.erb +52 -0
  80. data/lib/masamune/transform/deduplicate_dimension.rb +53 -0
  81. data/lib/masamune/transform/define_event_view.hql.erb +51 -0
  82. data/lib/masamune/transform/define_event_view.rb +60 -0
  83. data/lib/masamune/transform/define_index.psql.erb +34 -0
  84. data/lib/masamune/transform/define_schema.hql.erb +23 -0
  85. data/lib/masamune/transform/define_schema.psql.erb +79 -0
  86. data/lib/masamune/transform/define_schema.rb +56 -0
  87. data/lib/masamune/transform/define_table.hql.erb +34 -0
  88. data/lib/masamune/transform/define_table.psql.erb +95 -0
  89. data/lib/masamune/transform/define_table.rb +40 -0
  90. data/lib/masamune/transform/define_unique.psql.erb +30 -0
  91. data/lib/masamune/transform/insert_reference_values.psql.erb +43 -0
  92. data/lib/masamune/transform/insert_reference_values.rb +64 -0
  93. data/lib/masamune/transform/load_dimension.rb +47 -0
  94. data/lib/masamune/transform/load_fact.rb +45 -0
  95. data/lib/masamune/transform/operator.rb +96 -0
  96. data/lib/masamune/transform/relabel_dimension.psql.erb +76 -0
  97. data/lib/masamune/transform/relabel_dimension.rb +39 -0
  98. data/lib/masamune/transform/rollup_fact.psql.erb +79 -0
  99. data/lib/masamune/transform/rollup_fact.rb +149 -0
  100. data/lib/masamune/transform/snapshot_dimension.psql.erb +75 -0
  101. data/lib/masamune/transform/snapshot_dimension.rb +74 -0
  102. data/lib/masamune/transform/stage_dimension.psql.erb +39 -0
  103. data/lib/masamune/transform/stage_dimension.rb +83 -0
  104. data/lib/masamune/transform/stage_fact.psql.erb +80 -0
  105. data/lib/masamune/transform/stage_fact.rb +111 -0
  106. data/lib/masamune/version.rb +25 -0
  107. data/spec/fixtures/aggregate.sql.erb +25 -0
  108. data/spec/fixtures/comment.sql.erb +27 -0
  109. data/spec/fixtures/invalid.sql.erb +23 -0
  110. data/spec/fixtures/relative.sql.erb +23 -0
  111. data/spec/fixtures/simple.sql.erb +28 -0
  112. data/spec/fixtures/whitespace.sql.erb +30 -0
  113. data/spec/masamune/actions/elastic_mapreduce_spec.rb +108 -0
  114. data/spec/masamune/actions/execute_spec.rb +50 -0
  115. data/spec/masamune/actions/hadoop_filesystem_spec.rb +44 -0
  116. data/spec/masamune/actions/hadoop_streaming_spec.rb +74 -0
  117. data/spec/masamune/actions/hive_spec.rb +117 -0
  118. data/spec/masamune/actions/postgres_admin_spec.rb +58 -0
  119. data/spec/masamune/actions/postgres_spec.rb +134 -0
  120. data/spec/masamune/actions/s3cmd_spec.rb +44 -0
  121. data/spec/masamune/actions/transform_spec.rb +144 -0
  122. data/spec/masamune/after_initialization_callbacks_spec.rb +61 -0
  123. data/spec/masamune/cached_filesystem_spec.rb +167 -0
  124. data/spec/masamune/commands/hadoop_filesystem_spec.rb +50 -0
  125. data/spec/masamune/commands/hadoop_streaming_spec.rb +106 -0
  126. data/spec/masamune/commands/hive_spec.rb +117 -0
  127. data/spec/masamune/commands/postgres_admin_spec.rb +69 -0
  128. data/spec/masamune/commands/postgres_spec.rb +100 -0
  129. data/spec/masamune/commands/retry_with_backoff_spec.rb +116 -0
  130. data/spec/masamune/commands/s3cmd_spec.rb +50 -0
  131. data/spec/masamune/commands/shell_spec.rb +101 -0
  132. data/spec/masamune/configuration_spec.rb +102 -0
  133. data/spec/masamune/data_plan/builder_spec.rb +91 -0
  134. data/spec/masamune/data_plan/elem_spec.rb +102 -0
  135. data/spec/masamune/data_plan/engine_spec.rb +356 -0
  136. data/spec/masamune/data_plan/rule_spec.rb +407 -0
  137. data/spec/masamune/data_plan/set_spec.rb +517 -0
  138. data/spec/masamune/environment_spec.rb +65 -0
  139. data/spec/masamune/filesystem_spec.rb +1421 -0
  140. data/spec/masamune/helpers/postgres_spec.rb +95 -0
  141. data/spec/masamune/schema/catalog_spec.rb +613 -0
  142. data/spec/masamune/schema/column_spec.rb +696 -0
  143. data/spec/masamune/schema/dimension_spec.rb +137 -0
  144. data/spec/masamune/schema/event_spec.rb +75 -0
  145. data/spec/masamune/schema/fact_spec.rb +117 -0
  146. data/spec/masamune/schema/map_spec.rb +593 -0
  147. data/spec/masamune/schema/row_spec.rb +28 -0
  148. data/spec/masamune/schema/store_spec.rb +49 -0
  149. data/spec/masamune/schema/table_spec.rb +395 -0
  150. data/spec/masamune/string_format_spec.rb +60 -0
  151. data/spec/masamune/tasks/elastic_mapreduce_thor_spec.rb +57 -0
  152. data/spec/masamune/tasks/hive_thor_spec.rb +75 -0
  153. data/spec/masamune/tasks/postgres_thor_spec.rb +42 -0
  154. data/spec/masamune/tasks/shell_thor_spec.rb +51 -0
  155. data/spec/masamune/template_spec.rb +77 -0
  156. data/spec/masamune/thor_spec.rb +238 -0
  157. data/spec/masamune/transform/bulk_upsert.dimension_spec.rb +200 -0
  158. data/spec/masamune/transform/consolidate_dimension_spec.rb +62 -0
  159. data/spec/masamune/transform/deduplicate_dimension_spec.rb +84 -0
  160. data/spec/masamune/transform/define_event_view_spec.rb +84 -0
  161. data/spec/masamune/transform/define_schema_spec.rb +83 -0
  162. data/spec/masamune/transform/define_table.dimension_spec.rb +306 -0
  163. data/spec/masamune/transform/define_table.fact_spec.rb +291 -0
  164. data/spec/masamune/transform/define_table.table_spec.rb +525 -0
  165. data/spec/masamune/transform/insert_reference_values.dimension_spec.rb +111 -0
  166. data/spec/masamune/transform/insert_reference_values.fact_spec.rb +149 -0
  167. data/spec/masamune/transform/load_dimension_spec.rb +76 -0
  168. data/spec/masamune/transform/load_fact_spec.rb +89 -0
  169. data/spec/masamune/transform/relabel_dimension_spec.rb +102 -0
  170. data/spec/masamune/transform/rollup_fact_spec.rb +333 -0
  171. data/spec/masamune/transform/snapshot_dimension_spec.rb +103 -0
  172. data/spec/masamune/transform/stage_dimension_spec.rb +115 -0
  173. data/spec/masamune/transform/stage_fact_spec.rb +204 -0
  174. data/spec/masamune_spec.rb +32 -0
  175. data/spec/spec_helper.rb +41 -0
  176. data/spec/support/masamune/example_group.rb +36 -0
  177. data/spec/support/masamune/mock_command.rb +99 -0
  178. data/spec/support/masamune/mock_delegate.rb +51 -0
  179. data/spec/support/masamune/mock_filesystem.rb +96 -0
  180. data/spec/support/masamune/thor_mute.rb +35 -0
  181. data/spec/support/rspec/example/action_example_group.rb +34 -0
  182. data/spec/support/rspec/example/task_example_group.rb +80 -0
  183. data/spec/support/rspec/example/transform_example_group.rb +36 -0
  184. data/spec/support/shared_examples/postgres_common_examples.rb +53 -0
  185. metadata +462 -0
@@ -0,0 +1,517 @@
1
+ # The MIT License (MIT)
2
+ #
3
+ # Copyright (c) 2014-2015, VMware, Inc. All Rights Reserved.
4
+ #
5
+ # Permission is hereby granted, free of charge, to any person obtaining a copy
6
+ # of this software and associated documentation files (the "Software"), to deal
7
+ # in the Software without restriction, including without limitation the rights
8
+ # to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
9
+ # copies of the Software, and to permit persons to whom the Software is
10
+ # furnished to do so, subject to the following conditions:
11
+ #
12
+ # The above copyright notice and this permission notice shall be included in
13
+ # all copies or substantial portions of the Software.
14
+ #
15
+ # THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16
+ # IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17
+ # FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
18
+ # AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19
+ # LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20
+ # OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
21
+ # THE SOFTWARE.
22
+
23
+ require 'spec_helper'
24
+
# Specs for Masamune::DataPlan::Set.
#
# Every example builds a Set from a rule registered on a fresh engine plus a
# list of paths, and backs the engine with a Masamune::MockFilesystem so that
# "existing" files are whatever the example has touched.
describe Masamune::DataPlan::Set do
  let(:fs) { Masamune::MockFilesystem.new }
  let!(:engine) { Masamune::DataPlan::Engine.new }

  # Source paths carry a %Y%m%d date plus a wildcard segment; target paths are
  # y=/m=/d= partitions. Both rules are registered under the name 'primary'.
  let!(:source_rule) { engine.add_source_rule('primary', path: '/log/%Y%m%d.*.log') }
  let!(:target_rule) { engine.add_target_rule('primary', path: '/table/y=%Y/m=%m/d=%d') }

  before do
    engine.filesystem = fs
  end

  describe '#missing' do
    let(:paths) { ['/table/y=2013/m=01/d=01', '/table/y=2013/m=01/d=02', '/table/y=2013/m=01/d=03'] }

    let(:instance) { described_class.new(target_rule, paths) }

    subject(:missing) do
      instance.missing
    end

    context 'when all missing' do
      it { expect(missing.size).to eq(3) }
      it { expect(missing).to include '/table/y=2013/m=01/d=01' }
      it { expect(missing).to include '/table/y=2013/m=01/d=02' }
      it { expect(missing).to include '/table/y=2013/m=01/d=03' }
    end

    # Touching the partition path itself (no entry beneath it) is expected to
    # leave the partition reported as missing.
    context 'when files missing' do
      before do
        fs.touch!('/table/y=2013/m=01/d=01', '/table/y=2013/m=01/d=02')
      end

      it { expect(missing.size).to eq(3) }
      it { expect(missing).to include '/table/y=2013/m=01/d=01' }
      it { expect(missing).to include '/table/y=2013/m=01/d=02' }
      it { expect(missing).to include '/table/y=2013/m=01/d=03' }
    end

    context 'when some missing' do
      before do
        fs.touch!('/table/y=2013/m=01/d=01/0000', '/table/y=2013/m=01/d=02/0000')
      end

      it { expect(missing.size).to eq(1) }
      it { expect(missing).to include '/table/y=2013/m=01/d=03' }
    end

    context 'when none missing' do
      before do
        fs.touch!('/table/y=2013/m=01/d=01/0000', '/table/y=2013/m=01/d=02/0000', '/table/y=2013/m=01/d=03/0000')
      end

      it { expect(missing).to be_empty }
    end
  end

  describe '#existing' do
    let(:instance) { described_class.new(source_rule, paths) }

    subject(:existing) do
      instance.existing
    end

    # Literal paths: only the exact paths in the set may be reported, even if
    # sibling files for the same day exist.
    context 'with basic paths' do
      let(:paths) { ['/log/20130101.random_1.log', '/log/20130102.random_1.log'] }

      context 'when none existing' do
        it { expect(existing).to be_empty }
      end

      context 'when some existing' do
        before do
          fs.touch!('/log/20130101.random_1.log', '/log/20130101.random_2.log')
        end

        it { expect(existing.size).to eq(1) }
        it { expect(existing).to include '/log/20130101.random_1.log' }
      end

      context 'when all existing' do
        before do
          fs.touch!('/log/20130101.random_1.log', '/log/20130101.random_2.log')
          fs.touch!('/log/20130102.random_1.log', '/log/20130102.random_2.log')
        end

        it { expect(existing.size).to eq(2) }
        it { expect(existing).to include '/log/20130101.random_1.log' }
        it { expect(existing).to include '/log/20130102.random_1.log' }
      end
    end

    # Wildcard paths: every touched file matching the pattern is expected back.
    context 'with wildcard paths' do
      let(:paths) { ['/log/20130101.*.log', '/log/20130102.*.log'] }

      context 'when none existing' do
        it { expect(existing).to be_empty }
      end

      context 'when some existing' do
        before do
          fs.touch!('/log/20130101.random_1.log', '/log/20130101.random_2.log')
        end

        it { expect(existing.size).to eq(2) }
        it { expect(existing).to include '/log/20130101.random_1.log' }
        it { expect(existing).to include '/log/20130101.random_2.log' }
      end

      context 'when all existing' do
        before do
          fs.touch!('/log/20130101.random_1.log', '/log/20130101.random_2.log')
          fs.touch!('/log/20130102.random_1.log', '/log/20130102.random_2.log')
        end

        it { expect(existing.size).to eq(4) }
        it { expect(existing).to include '/log/20130101.random_1.log' }
        it { expect(existing).to include '/log/20130101.random_2.log' }
        it { expect(existing).to include '/log/20130102.random_1.log' }
        it { expect(existing).to include '/log/20130102.random_2.log' }
      end
    end
  end

  describe '#adjacent' do
    let(:instance) { described_class.new(source_rule, paths) }

    # A plain helper rather than a second `subject`, so that the group has a
    # single, unambiguous subject.
    let(:sources) { instance.adjacent }

    subject(:existing) do
      instance.adjacent.existing
    end

    context 'with window of 1 time_step' do
      let(:paths) { ['/log/20130101.*.log'] }

      before do
        allow(instance.rule).to receive(:window) { 1 }
      end

      # With the window stubbed to 1, the day before and the day after are
      # expected alongside the original path.
      it { expect(sources.size).to eq(3) }
      it { expect(sources).to include '/log/20121231.*.log' }
      it { expect(sources).to include '/log/20130101.*.log' }
      it { expect(sources).to include '/log/20130102.*.log' }

      context 'when none existing' do
        it { expect(existing).to be_empty }
      end

      context 'when some existing' do
        before do
          fs.touch!('/log/20130101.random_1.log', '/log/20130101.random_2.log')
        end

        it { expect(existing.size).to eq(2) }
        it { expect(existing).to include '/log/20130101.random_1.log' }
        it { expect(existing).to include '/log/20130101.random_2.log' }
      end

      context 'when all existing' do
        before do
          fs.touch!('/log/20121231.random_1.log', '/log/20121231.random_2.log')
          fs.touch!('/log/20130101.random_1.log', '/log/20130101.random_2.log')
          fs.touch!('/log/20130102.random_1.log', '/log/20130102.random_2.log')
          # 20130103 is touched as well but is not among the expected results.
          fs.touch!('/log/20130103.random_1.log', '/log/20130103.random_2.log')
        end

        it { expect(existing.size).to eq(6) }
        it { expect(existing).to include '/log/20121231.random_1.log' }
        it { expect(existing).to include '/log/20121231.random_2.log' }
        it { expect(existing).to include '/log/20130101.random_1.log' }
        it { expect(existing).to include '/log/20130101.random_2.log' }
        it { expect(existing).to include '/log/20130102.random_1.log' }
        it { expect(existing).to include '/log/20130102.random_2.log' }
      end
    end
  end

  describe '#stale' do
    # A set built from the source rule is expected to have no stale elements.
    context 'when source rule' do
      let(:paths) { ['/log/20130101.random_1.log', '/log/20130102.random_1.log'] }
      let(:instance) { described_class.new(source_rule, paths) }

      subject(:stale_sources) do
        instance.stale
      end

      it { expect(stale_sources).to be_empty }
    end

    let(:paths) { ['/table/y=2013/m=01/d=01', '/table/y=2013/m=01/d=02', '/table/y=2013/m=01/d=03'] }
    let(:instance) { described_class.new(target_rule, paths) }
    let(:past_time) { Time.parse('2013-01-01 09:00:00 +0000') }
    let(:present_time) { Time.parse('2013-01-01 09:30:00 +0000') }
    let(:future_time) { Time.parse('2013-01-01 10:00:00 +0000') }

    # Baseline: every source carries past_time and every target present_time.
    before do
      fs.touch!('/log/20130101.random_1.log', '/log/20130101.random_2.log', mtime: past_time)
      fs.touch!('/log/20130102.random_1.log', '/log/20130102.random_2.log', mtime: past_time)
      fs.touch!('/log/20130103.random_1.log', '/log/20130103.random_2.log', mtime: past_time)
      fs.touch!('/table/y=2013/m=01/d=01', '/table/y=2013/m=01/d=02', '/table/y=2013/m=01/d=03', mtime: present_time)
    end

    subject(:stale_targets) do
      instance.stale
    end

    context 'when none stale targets' do
      it { expect(stale_targets).to be_empty }
    end

    context 'when some stale targets (first source)' do
      before do
        fs.touch!('/log/20130101.random_1.log', mtime: future_time)
      end

      it { expect(stale_targets.size).to eq(1) }
      it { expect(stale_targets).to include '/table/y=2013/m=01/d=01' }
    end

    context 'when some stale targets (second source)' do
      before do
        fs.touch!('/log/20130101.random_2.log', mtime: future_time)
      end

      it { expect(stale_targets.size).to eq(1) }
      it { expect(stale_targets).to include '/table/y=2013/m=01/d=01' }
    end

    # A source whose mtime equals the target's mtime is expected to make the
    # target stale.
    context 'when some stale targets (tie breaker)' do
      before do
        fs.touch!('/log/20130101.random_1.log', mtime: present_time)
      end

      it { expect(stale_targets.size).to eq(1) }
      it { expect(stale_targets).to include '/table/y=2013/m=01/d=01' }
    end

    context 'when all stale targets' do
      before do
        fs.touch!('/log/20130101.random_1.log', mtime: future_time)
        fs.touch!('/log/20130102.random_2.log', mtime: future_time)
        fs.touch!('/log/20130103.random_1.log', mtime: future_time)
        fs.touch!('/log/20130103.random_2.log', mtime: future_time)
      end

      it { expect(stale_targets.size).to eq(3) }
      it { expect(stale_targets).to include '/table/y=2013/m=01/d=01' }
      it { expect(stale_targets).to include '/table/y=2013/m=01/d=02' }
      it { expect(stale_targets).to include '/table/y=2013/m=01/d=03' }
    end

    # A source stamped with the MISSING_MODIFIED_AT sentinel is expected not to
    # mark its target stale.
    context 'when missing source last_modified_at' do
      before do
        fs.touch!('/log/20130101.random_1.log', mtime: Masamune::DataPlan::Elem::MISSING_MODIFIED_AT)
      end

      it { expect(stale_targets).to be_empty }
    end
  end

  describe '#with_grain' do
    let(:paths) do
      [
        '/table/y=2012/m=12/d=29', '/table/y=2012/m=12/d=30', '/table/y=2012/m=12/d=31',
        '/table/y=2013/m=01/d=01', '/table/y=2013/m=01/d=02', '/table/y=2013/m=02/d=01'
      ]
    end

    let(:instance) { described_class.new(target_rule, paths) }

    subject(:granular_targets) do
      instance.with_grain(grain)
    end

    context 'when :day' do
      let(:grain) { :day }

      it 'has 6 items' do
        expect(subject.size).to eq(6)
      end
      it { is_expected.to include '/table/y=2012/m=12/d=29' }
      it { is_expected.to include '/table/y=2012/m=12/d=30' }
      it { is_expected.to include '/table/y=2012/m=12/d=31' }
      it { is_expected.to include '/table/y=2013/m=01/d=01' }
      it { is_expected.to include '/table/y=2013/m=01/d=02' }
      it { is_expected.to include '/table/y=2013/m=02/d=01' }
    end

    context 'when :month' do
      let(:grain) { :month }

      it 'has 3 items' do
        expect(subject.size).to eq(3)
      end
      it { is_expected.to include '/table/y=2012/m=12' }
      it { is_expected.to include '/table/y=2013/m=01' }
      it { is_expected.to include '/table/y=2013/m=02' }
    end

    context 'when :year' do
      let(:grain) { :year }

      it 'has 2 items' do
        expect(subject.size).to eq(2)
      end
      it { is_expected.to include '/table/y=2012' }
      it { is_expected.to include '/table/y=2013' }
    end
  end

  # Membership is expected to compare paths literally: a wildcard only matches
  # the identical wildcard string, never a concrete file name (or vice versa).
  describe '#include?' do
    let(:instance) { described_class.new(source_rule, enum) }

    subject do
      instance.include?(elem)
    end

    context 'with basic enum and basic elem' do
      let(:enum) { ['/log/20130101.random_1.log', '/log/20130102.random_2.log'] }
      let(:elem) { '/log/20130101.random_1.log' }

      it { is_expected.to eq(true) }
    end

    context 'with basic enum and wildcard elem' do
      let(:enum) { ['/log/20130101.random_1.log', '/log/20130102.random_2.log'] }
      let(:elem) { '/log/20130101.*.log' }

      it { is_expected.to eq(false) }
    end

    context 'with wildcard enum and wildcard elem' do
      let(:enum) { ['/log/20130101.*.log', '/log/20130102.*.log'] }
      let(:elem) { '/log/20130101.*.log' }

      it { is_expected.to eq(true) }
    end

    context 'with wildcard enum and basic elem' do
      let(:enum) { ['/log/20130101.*.log', '/log/20130102.*.log'] }
      let(:elem) { '/log/20130101.random_1.log' }

      it { is_expected.to eq(false) }
    end
  end

  describe '#incomplete' do
    # Re-registers the rules so that the target path is a y=/m= partition.
    let!(:source_rule) { engine.add_source_rule('primary', path: '/log/%Y%m%d.*.log') }
    let!(:target_rule) { engine.add_target_rule('primary', path: '/table/y=%Y/m=%m') }

    let(:paths) { ['/log/20140101.random_1.log', '/log/20140102.random_1.log', '/log/20140201.random_1.log', '/log/20140202.random_1.log'] }

    let(:instance) { described_class.new(source_rule, paths) }

    subject(:incomplete) do
      instance.targets.incomplete
    end

    context 'when all incomplete' do
      it { expect(incomplete.size).to eq(2) }
      it { expect(incomplete).to include '/table/y=2014/m=01' }
      it { expect(incomplete).to include '/table/y=2014/m=02' }
    end

    context 'when some incomplete' do
      before do
        (1..31).each do |day|
          fs.touch!(format('/log/201401%02d.random_1.log', day))
        end
      end

      it { expect(incomplete.size).to eq(1) }
      it { expect(incomplete).to include '/table/y=2014/m=02' }
    end

    context 'when none incomplete' do
      before do
        # NOTE(review): for February this also touches paths for days 29-31,
        # which are not calendar dates in 2014; presumably they are simply
        # never looked up - confirm before tightening the range.
        (1..31).each do |day|
          fs.touch!(format('/log/201401%02d.random_1.log', day))
          fs.touch!(format('/log/201402%02d.random_1.log', day))
        end
      end

      it { expect(incomplete.size).to eq(0) }
    end
  end

  # Covers both #actionable and #updateable on a target set.
  describe '#updateable' do
    let(:paths) { ['/table/y=2013/m=01/d=01', '/table/y=2013/m=01/d=02', '/table/y=2013/m=01/d=03'] }

    let(:instance) { described_class.new(target_rule, paths) }

    let(:past_time) { Time.parse('2013-01-01 09:00:00 +0000') }
    let(:present_time) { Time.parse('2013-01-01 09:30:00 +0000') }
    let(:future_time) { Time.parse('2013-01-01 10:00:00 +0000') }

    # A plain helper rather than a second `subject`, so that the group has a
    # single, unambiguous subject.
    let(:actionable) { instance.actionable }

    subject(:updateable) do
      instance.updateable
    end

    context 'when targets are existing' do
      before do
        fs.touch!(
          '/table/y=2013/m=01/d=01/0000',
          '/table/y=2013/m=01/d=02/0000',
          '/table/y=2013/m=01/d=03/0000',
          mtime: present_time
        )
      end

      context 'when all sources missing' do
        it 'actionable is equivalent to incomplete' do
          expect(actionable).to eq(instance.incomplete)
        end
        it { expect(updateable).to be_empty }
      end

      context 'when all sources existing (stale)' do
        before do
          fs.touch!('/log/20130101.random_1.log', '/log/20130101.random_2.log', mtime: future_time)
          fs.touch!('/log/20130102.random_1.log', '/log/20130102.random_2.log', mtime: future_time)
          fs.touch!('/log/20130103.random_1.log', '/log/20130103.random_2.log', mtime: future_time)
        end

        it 'actionable is equivalent to stale' do
          expect(actionable).to eq(instance.stale)
        end
        it { expect(updateable.size).to eq(3) }
        it { expect(updateable).to include '/table/y=2013/m=01/d=01' }
        it { expect(updateable).to include '/table/y=2013/m=01/d=02' }
        it { expect(updateable).to include '/table/y=2013/m=01/d=03' }
      end

      context 'when all sources existing (fresh)' do
        before do
          fs.touch!('/log/20130101.random_1.log', '/log/20130101.random_2.log', mtime: past_time)
          fs.touch!('/log/20130102.random_1.log', '/log/20130102.random_2.log', mtime: past_time)
          fs.touch!('/log/20130103.random_1.log', '/log/20130103.random_2.log', mtime: past_time)
        end

        it { expect(actionable).to be_empty }
        it { expect(updateable).to be_empty }
      end
    end

    context 'when targets are missing' do
      context 'when all sources missing' do
        it 'actionable is equivalent to incomplete' do
          expect(actionable).to eq(instance.incomplete)
        end
        it { expect(updateable).to be_empty }
      end

      context 'when some sources missing' do
        before do
          fs.touch!('/log/20130101.random_1.log', '/log/20130101.random_2.log')
        end

        it 'actionable is equivalent to missing' do
          expect(actionable).to eq(instance.missing)
        end
        it { expect(updateable.size).to eq(1) }
        it { expect(updateable).to include '/table/y=2013/m=01/d=01' }
      end

      context 'when all sources existing' do
        before do
          fs.touch!('/log/20130101.random_1.log', '/log/20130101.random_2.log')
          fs.touch!('/log/20130102.random_1.log', '/log/20130102.random_2.log')
          fs.touch!('/log/20130103.random_1.log', '/log/20130103.random_2.log')
        end

        it 'actionable is equivalent to missing' do
          expect(actionable).to eq(instance.missing)
        end
        it { expect(updateable.size).to eq(3) }
        it { expect(updateable).to include '/table/y=2013/m=01/d=01' }
        it { expect(updateable).to include '/table/y=2013/m=01/d=02' }
        it { expect(updateable).to include '/table/y=2013/m=01/d=03' }
      end
    end
  end

  # Walks back and forth between sources and targets through chained calls.
  context 'when sets are chained together' do
    let!(:source_rule) { engine.add_source_rule('primary', path: '/log/%Y%m%d.*.log') }
    let!(:target_rule) { engine.add_target_rule('primary', path: '/table/y=%Y/m=%m') }

    let(:paths) { ['/log/20140101.random_1.log', '/log/20140102.random_1.log', '/log/20140201.random_1.log', '/log/20140202.random_1.log'] }

    let(:instance) { described_class.new(source_rule, paths) }

    context 'when sources are missing' do
      it 'should chain expectedly' do
        expect(instance.targets.size).to eq(2)
        expect(instance.targets.sources.existing.size).to eq(0)
        expect(instance.targets.sources.existing.targets.size).to eq(0)
      end
    end

    context 'when sources are present' do
      before do
        fs.touch!(*paths)
      end

      it 'should chain expectedly' do
        expect(instance.targets.size).to eq(2)
        expect(instance.targets.sources.existing.size).to eq(4)
        expect(instance.targets.sources.existing.targets.size).to eq(2)
        expect(instance.targets.sources.existing.targets.sources.existing.size).to eq(4)
      end
    end
  end
end