masamune 0.11.0

Sign up to get free protection for your applications and to get access to all the features.
Files changed (185) hide show
  1. checksums.yaml +7 -0
  2. data/LICENSE.txt +21 -0
  3. data/README.md +54 -0
  4. data/Rakefile +15 -0
  5. data/bin/masamune-elastic-mapreduce +4 -0
  6. data/bin/masamune-hive +4 -0
  7. data/bin/masamune-psql +4 -0
  8. data/bin/masamune-shell +4 -0
  9. data/lib/masamune.rb +56 -0
  10. data/lib/masamune/accumulate.rb +60 -0
  11. data/lib/masamune/actions.rb +38 -0
  12. data/lib/masamune/actions/data_flow.rb +131 -0
  13. data/lib/masamune/actions/date_parse.rb +75 -0
  14. data/lib/masamune/actions/elastic_mapreduce.rb +68 -0
  15. data/lib/masamune/actions/execute.rb +52 -0
  16. data/lib/masamune/actions/filesystem.rb +37 -0
  17. data/lib/masamune/actions/hadoop_filesystem.rb +40 -0
  18. data/lib/masamune/actions/hadoop_streaming.rb +41 -0
  19. data/lib/masamune/actions/hive.rb +74 -0
  20. data/lib/masamune/actions/postgres.rb +76 -0
  21. data/lib/masamune/actions/postgres_admin.rb +34 -0
  22. data/lib/masamune/actions/s3cmd.rb +44 -0
  23. data/lib/masamune/actions/transform.rb +89 -0
  24. data/lib/masamune/after_initialize_callbacks.rb +55 -0
  25. data/lib/masamune/cached_filesystem.rb +110 -0
  26. data/lib/masamune/commands.rb +37 -0
  27. data/lib/masamune/commands/elastic_mapreduce.rb +119 -0
  28. data/lib/masamune/commands/hadoop_filesystem.rb +57 -0
  29. data/lib/masamune/commands/hadoop_streaming.rb +116 -0
  30. data/lib/masamune/commands/hive.rb +178 -0
  31. data/lib/masamune/commands/interactive.rb +37 -0
  32. data/lib/masamune/commands/postgres.rb +128 -0
  33. data/lib/masamune/commands/postgres_admin.rb +72 -0
  34. data/lib/masamune/commands/postgres_common.rb +33 -0
  35. data/lib/masamune/commands/retry_with_backoff.rb +60 -0
  36. data/lib/masamune/commands/s3cmd.rb +70 -0
  37. data/lib/masamune/commands/shell.rb +202 -0
  38. data/lib/masamune/configuration.rb +195 -0
  39. data/lib/masamune/data_plan.rb +31 -0
  40. data/lib/masamune/data_plan/builder.rb +66 -0
  41. data/lib/masamune/data_plan/elem.rb +190 -0
  42. data/lib/masamune/data_plan/engine.rb +162 -0
  43. data/lib/masamune/data_plan/rule.rb +292 -0
  44. data/lib/masamune/data_plan/set.rb +176 -0
  45. data/lib/masamune/environment.rb +164 -0
  46. data/lib/masamune/filesystem.rb +567 -0
  47. data/lib/masamune/has_environment.rb +40 -0
  48. data/lib/masamune/helpers.rb +27 -0
  49. data/lib/masamune/helpers/postgres.rb +84 -0
  50. data/lib/masamune/io.rb +33 -0
  51. data/lib/masamune/last_element.rb +53 -0
  52. data/lib/masamune/method_logger.rb +41 -0
  53. data/lib/masamune/multi_io.rb +39 -0
  54. data/lib/masamune/schema.rb +36 -0
  55. data/lib/masamune/schema/catalog.rb +233 -0
  56. data/lib/masamune/schema/column.rb +527 -0
  57. data/lib/masamune/schema/dimension.rb +133 -0
  58. data/lib/masamune/schema/event.rb +121 -0
  59. data/lib/masamune/schema/fact.rb +133 -0
  60. data/lib/masamune/schema/map.rb +265 -0
  61. data/lib/masamune/schema/row.rb +133 -0
  62. data/lib/masamune/schema/store.rb +115 -0
  63. data/lib/masamune/schema/table.rb +308 -0
  64. data/lib/masamune/schema/table_reference.rb +76 -0
  65. data/lib/masamune/spec_helper.rb +23 -0
  66. data/lib/masamune/string_format.rb +34 -0
  67. data/lib/masamune/tasks/elastic_mapreduce_thor.rb +60 -0
  68. data/lib/masamune/tasks/hive_thor.rb +55 -0
  69. data/lib/masamune/tasks/postgres_thor.rb +47 -0
  70. data/lib/masamune/tasks/shell_thor.rb +63 -0
  71. data/lib/masamune/template.rb +77 -0
  72. data/lib/masamune/thor.rb +186 -0
  73. data/lib/masamune/thor_loader.rb +38 -0
  74. data/lib/masamune/topological_hash.rb +34 -0
  75. data/lib/masamune/transform.rb +47 -0
  76. data/lib/masamune/transform/bulk_upsert.psql.erb +64 -0
  77. data/lib/masamune/transform/bulk_upsert.rb +52 -0
  78. data/lib/masamune/transform/consolidate_dimension.rb +54 -0
  79. data/lib/masamune/transform/deduplicate_dimension.psql.erb +52 -0
  80. data/lib/masamune/transform/deduplicate_dimension.rb +53 -0
  81. data/lib/masamune/transform/define_event_view.hql.erb +51 -0
  82. data/lib/masamune/transform/define_event_view.rb +60 -0
  83. data/lib/masamune/transform/define_index.psql.erb +34 -0
  84. data/lib/masamune/transform/define_schema.hql.erb +23 -0
  85. data/lib/masamune/transform/define_schema.psql.erb +79 -0
  86. data/lib/masamune/transform/define_schema.rb +56 -0
  87. data/lib/masamune/transform/define_table.hql.erb +34 -0
  88. data/lib/masamune/transform/define_table.psql.erb +95 -0
  89. data/lib/masamune/transform/define_table.rb +40 -0
  90. data/lib/masamune/transform/define_unique.psql.erb +30 -0
  91. data/lib/masamune/transform/insert_reference_values.psql.erb +43 -0
  92. data/lib/masamune/transform/insert_reference_values.rb +64 -0
  93. data/lib/masamune/transform/load_dimension.rb +47 -0
  94. data/lib/masamune/transform/load_fact.rb +45 -0
  95. data/lib/masamune/transform/operator.rb +96 -0
  96. data/lib/masamune/transform/relabel_dimension.psql.erb +76 -0
  97. data/lib/masamune/transform/relabel_dimension.rb +39 -0
  98. data/lib/masamune/transform/rollup_fact.psql.erb +79 -0
  99. data/lib/masamune/transform/rollup_fact.rb +149 -0
  100. data/lib/masamune/transform/snapshot_dimension.psql.erb +75 -0
  101. data/lib/masamune/transform/snapshot_dimension.rb +74 -0
  102. data/lib/masamune/transform/stage_dimension.psql.erb +39 -0
  103. data/lib/masamune/transform/stage_dimension.rb +83 -0
  104. data/lib/masamune/transform/stage_fact.psql.erb +80 -0
  105. data/lib/masamune/transform/stage_fact.rb +111 -0
  106. data/lib/masamune/version.rb +25 -0
  107. data/spec/fixtures/aggregate.sql.erb +25 -0
  108. data/spec/fixtures/comment.sql.erb +27 -0
  109. data/spec/fixtures/invalid.sql.erb +23 -0
  110. data/spec/fixtures/relative.sql.erb +23 -0
  111. data/spec/fixtures/simple.sql.erb +28 -0
  112. data/spec/fixtures/whitespace.sql.erb +30 -0
  113. data/spec/masamune/actions/elastic_mapreduce_spec.rb +108 -0
  114. data/spec/masamune/actions/execute_spec.rb +50 -0
  115. data/spec/masamune/actions/hadoop_filesystem_spec.rb +44 -0
  116. data/spec/masamune/actions/hadoop_streaming_spec.rb +74 -0
  117. data/spec/masamune/actions/hive_spec.rb +117 -0
  118. data/spec/masamune/actions/postgres_admin_spec.rb +58 -0
  119. data/spec/masamune/actions/postgres_spec.rb +134 -0
  120. data/spec/masamune/actions/s3cmd_spec.rb +44 -0
  121. data/spec/masamune/actions/transform_spec.rb +144 -0
  122. data/spec/masamune/after_initialization_callbacks_spec.rb +61 -0
  123. data/spec/masamune/cached_filesystem_spec.rb +167 -0
  124. data/spec/masamune/commands/hadoop_filesystem_spec.rb +50 -0
  125. data/spec/masamune/commands/hadoop_streaming_spec.rb +106 -0
  126. data/spec/masamune/commands/hive_spec.rb +117 -0
  127. data/spec/masamune/commands/postgres_admin_spec.rb +69 -0
  128. data/spec/masamune/commands/postgres_spec.rb +100 -0
  129. data/spec/masamune/commands/retry_with_backoff_spec.rb +116 -0
  130. data/spec/masamune/commands/s3cmd_spec.rb +50 -0
  131. data/spec/masamune/commands/shell_spec.rb +101 -0
  132. data/spec/masamune/configuration_spec.rb +102 -0
  133. data/spec/masamune/data_plan/builder_spec.rb +91 -0
  134. data/spec/masamune/data_plan/elem_spec.rb +102 -0
  135. data/spec/masamune/data_plan/engine_spec.rb +356 -0
  136. data/spec/masamune/data_plan/rule_spec.rb +407 -0
  137. data/spec/masamune/data_plan/set_spec.rb +517 -0
  138. data/spec/masamune/environment_spec.rb +65 -0
  139. data/spec/masamune/filesystem_spec.rb +1421 -0
  140. data/spec/masamune/helpers/postgres_spec.rb +95 -0
  141. data/spec/masamune/schema/catalog_spec.rb +613 -0
  142. data/spec/masamune/schema/column_spec.rb +696 -0
  143. data/spec/masamune/schema/dimension_spec.rb +137 -0
  144. data/spec/masamune/schema/event_spec.rb +75 -0
  145. data/spec/masamune/schema/fact_spec.rb +117 -0
  146. data/spec/masamune/schema/map_spec.rb +593 -0
  147. data/spec/masamune/schema/row_spec.rb +28 -0
  148. data/spec/masamune/schema/store_spec.rb +49 -0
  149. data/spec/masamune/schema/table_spec.rb +395 -0
  150. data/spec/masamune/string_format_spec.rb +60 -0
  151. data/spec/masamune/tasks/elastic_mapreduce_thor_spec.rb +57 -0
  152. data/spec/masamune/tasks/hive_thor_spec.rb +75 -0
  153. data/spec/masamune/tasks/postgres_thor_spec.rb +42 -0
  154. data/spec/masamune/tasks/shell_thor_spec.rb +51 -0
  155. data/spec/masamune/template_spec.rb +77 -0
  156. data/spec/masamune/thor_spec.rb +238 -0
  157. data/spec/masamune/transform/bulk_upsert.dimension_spec.rb +200 -0
  158. data/spec/masamune/transform/consolidate_dimension_spec.rb +62 -0
  159. data/spec/masamune/transform/deduplicate_dimension_spec.rb +84 -0
  160. data/spec/masamune/transform/define_event_view_spec.rb +84 -0
  161. data/spec/masamune/transform/define_schema_spec.rb +83 -0
  162. data/spec/masamune/transform/define_table.dimension_spec.rb +306 -0
  163. data/spec/masamune/transform/define_table.fact_spec.rb +291 -0
  164. data/spec/masamune/transform/define_table.table_spec.rb +525 -0
  165. data/spec/masamune/transform/insert_reference_values.dimension_spec.rb +111 -0
  166. data/spec/masamune/transform/insert_reference_values.fact_spec.rb +149 -0
  167. data/spec/masamune/transform/load_dimension_spec.rb +76 -0
  168. data/spec/masamune/transform/load_fact_spec.rb +89 -0
  169. data/spec/masamune/transform/relabel_dimension_spec.rb +102 -0
  170. data/spec/masamune/transform/rollup_fact_spec.rb +333 -0
  171. data/spec/masamune/transform/snapshot_dimension_spec.rb +103 -0
  172. data/spec/masamune/transform/stage_dimension_spec.rb +115 -0
  173. data/spec/masamune/transform/stage_fact_spec.rb +204 -0
  174. data/spec/masamune_spec.rb +32 -0
  175. data/spec/spec_helper.rb +41 -0
  176. data/spec/support/masamune/example_group.rb +36 -0
  177. data/spec/support/masamune/mock_command.rb +99 -0
  178. data/spec/support/masamune/mock_delegate.rb +51 -0
  179. data/spec/support/masamune/mock_filesystem.rb +96 -0
  180. data/spec/support/masamune/thor_mute.rb +35 -0
  181. data/spec/support/rspec/example/action_example_group.rb +34 -0
  182. data/spec/support/rspec/example/task_example_group.rb +80 -0
  183. data/spec/support/rspec/example/transform_example_group.rb +36 -0
  184. data/spec/support/shared_examples/postgres_common_examples.rb +53 -0
  185. metadata +462 -0
@@ -0,0 +1,292 @@
1
+ # The MIT License (MIT)
2
+ #
3
+ # Copyright (c) 2014-2015, VMware, Inc. All Rights Reserved.
4
+ #
5
+ # Permission is hereby granted, free of charge, to any person obtaining a copy
6
+ # of this software and associated documentation files (the "Software"), to deal
7
+ # in the Software without restriction, including without limitation the rights
8
+ # to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
9
+ # copies of the Software, and to permit persons to whom the Software is
10
+ # furnished to do so, subject to the following conditions:
11
+ #
12
+ # The above copyright notice and this permission notice shall be included in
13
+ # all copies or substantial portions of the Software.
14
+ #
15
+ # THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16
+ # IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17
+ # FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
18
+ # AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19
+ # LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20
+ # OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
21
+ # THE SOFTWARE.
22
+
23
+ require 'active_support'
24
+ require 'active_support/duration'
25
+ require 'active_support/values/time_zone'
26
+ require 'active_support/core_ext/time/calculations'
27
+ require 'active_support/core_ext/date/calculations'
28
+ require 'active_support/core_ext/date_time/calculations'
29
+ require 'date'
30
+
31
+ class Masamune::DataPlan::Rule
32
+ TERMINAL = nil
33
+
34
+ include Masamune::Accumulate
35
+
36
+ attr_reader :engine, :name, :type, :options
37
+
38
# Builds a rule.
#
# @param engine owning engine; #pattern may ask it for its filesystem
# @param name identifier of the rule
# @param type rule kind, compared against :target / :source by the predicates
# @param options [Hash] rule settings; keys read by this class include
#   :path, :table, :partition, :primary, :tz and :window
def initialize(engine, name, type, options = {})
  @engine, @name, @type, @options = engine, name, type, options
end
44
+
45
# @return [Boolean] true when this rule was declared with type :target
def for_targets?
  :target == @type
end
48
+
49
# @return [Boolean] true when this rule was declared with type :source
def for_sources?
  :source == @type
end
52
+
53
# @return [Boolean] true when the options carry a :path entry (even a nil one)
def for_path?
  @options.include?(:path)
end
56
+
57
# @return [Boolean] true when the options carry a :table entry
def for_table?
  @options.include?(:table)
end
60
+
61
# @return [Boolean] true only when both :table and :partition are present
#   in the options
def for_table_with_partition?
  %i[table partition].all? { |key| @options.key?(key) }
end
64
+
65
# @return the raw :path option (may be nil; #pattern also accepts a callable)
def path
  configured_path = @options[:path]
  configured_path
end
68
+
69
# @return the raw :table option, or nil when none was given
def table
  configured_table = @options[:table]
  configured_table
end
72
+
73
# @return the raw :partition option, or nil when none was given
def partition
  configured_partition = @options[:partition]
  configured_partition
end
76
+
77
# Value equality: two rules are equal when engine, name, type, pattern and
# options all match.
#
# Objects that are not rules (including TERMINAL, which is nil) compare as
# unequal instead of raising NoMethodError on the missing readers.
#
# @param other [Object] object to compare against
# @return [Boolean]
def ==(other)
  return false unless other.is_a?(Masamune::DataPlan::Rule)

  engine == other.engine &&
    name == other.name &&
    type == other.type &&
    pattern == other.pattern &&
    options == other.options
end
84
+
85
# Hash-key equality; answers exactly what #== answers for the same argument.
#
# @param other [Object]
# @return [Boolean]
def eql?(other)
  same = (self == other)
  same
end
88
+
89
# Hash code built from the same five attributes that #== compares.
#
# @return [Integer]
def hash
  identity = [engine, name, type, pattern, options]
  identity.hash
end
92
+
93
# String pattern describing what this rule matches; computed once and cached.
#
# * path rules: the :path option, or the result of calling it with the
#   engine's filesystem when it responds to #call
# * table rules with a partition: table and partition joined by "_"
# * table rules: the table name
# * anything else: the empty string
#
# @return [String]
def pattern
  @pattern ||= begin
    resolved =
      if for_path?
        path.respond_to?(:call) ? path.call(engine.filesystem) : path
      elsif for_table_with_partition?
        [table, partition].join('_')
      elsif for_table?
        table
      end
    resolved.to_s
  end
end
104
+
105
# @return the :primary option; true when the option was not supplied at all
def primary?
  @options.fetch(:primary) { true }
end
108
+
109
# Tells whether +input+ matches this rule's pattern completely, i.e. the
# matcher succeeds and nothing is left over in the trailing :rest capture.
#
# @param input [String]
# @return [Boolean]
def matches?(input)
  captures = match_data_hash(matcher.match(input))
  return false unless captures.present?

  captures[:rest].blank?
end
113
+
114
# Creates an element of this rule for +input_date+, after converting the date
# with the rule's time zone (tz.utc_to_local).
#
# @param input_date date/time handed to tz.utc_to_local
# @return [Masamune::DataPlan::Elem]
def bind_date(input_date)
  local_date = tz.utc_to_local(input_date)
  Masamune::DataPlan::Elem.new(self, local_date, options_for_elem)
end
118
+
119
# Turns +input+ into an element of this rule.
#
# An existing element is returned untouched; any other input is run through
# the matcher, and the captured date plus any glob capture become the new
# element's date and extra options.
#
# @param input [Masamune::DataPlan::Elem, String]
# @return [Masamune::DataPlan::Elem]
# @raise [RuntimeError] when the input does not match the pattern
def bind_input(input)
  return input if input.is_a?(Masamune::DataPlan::Elem)

  captures = match_data_hash(matcher.match(input))
  raise "Cannot bind_input #{input} to #{pattern}" unless captures

  bound_date = matched_date(captures)
  elem_options = options_for_elem.merge(matched_extra(captures))
  Masamune::DataPlan::Elem.new(self, bound_date, elem_options)
end
126
+
127
# Binds +rule+ to the start time of +elem+.
#
# @param elem element whose start_time is used
# @param rule rule that receives bind_date
# @return whatever rule.bind_date returns
def unify(elem, rule)
  anchor_time = elem.start_time
  rule.bind_date(anchor_time)
end
130
+
131
# Yields the element bound to +start_time+, then each successive #next
# element for as long as its start_time is <= +stop_time+. The first element
# is always yielded, even when it already lies past +stop_time+.
#
# @param start_time time handed to bind_date
# @param stop_time inclusive upper bound for later elements
# @yield [instance] each generated element
def generate(start_time, stop_time, &block)
  instance = bind_date(start_time)
  yield instance

  while (instance = instance.next).start_time <= stop_time
    yield instance
  end
end
139
+ method_accumulate :generate
140
+
141
# Yields the element obtained by unifying +elem+ with +rule+, then successive
# #next elements while their start_time stays strictly below the first
# element's start_time advanced by one time_step of this rule.
#
# @param elem element to unify from
# @param rule rule to unify with
# @yield [instance] each generated element
def generate_via_unify(elem, rule, &block)
  instance = unify(elem, rule)
  stop_time = instance.start_time.advance(time_step => 1)
  yield instance

  while (instance = instance.next).start_time < stop_time
    yield instance
  end
end
150
+ method_accumulate :generate_via_unify
151
+
152
# Looks up the ActiveSupport::TimeZone named by the :tz option, falling back
# to 'UTC' when the option is absent.
def tz
  zone_name = @options.fetch(:tz, 'UTC')
  ActiveSupport::TimeZone[zone_name]
end
155
+
156
# Finest time unit addressed by the pattern, cached after the first call.
#
# The checks run in the listed order and the first hit wins: epoch-style
# directives ("%s", "%H-s", "%d-s", "%m-s", "%Y-s") come first, then the plain
# directives from hour down to year. Patterns without any known directive
# default to :hours.
#
# @return [Symbol] :hours, :days, :months or :years
def time_step
  @time_step ||= begin
    steps_by_format = [
      [/%s/,    :hours],
      [/%H-s/,  :hours],
      [/%d-s/,  :days],
      [/%m-s/,  :months],
      [/%Y-s/,  :years],
      [/%-?k/,  :hours],
      [/%-?H/,  :hours],
      [/%-?d/,  :days],
      [/%-?m/,  :months],
      [/%-?Y/,  :years]
    ]
    current = pattern
    hit = steps_by_format.find { |format, _step| format === current }
    hit ? hit.last : :hours
  end
end
181
+
182
# Truncates +time+ to the rule's time_step by rebuilding it with
# DateTime.civil from only the fields down to that step. Unknown steps return
# +time+ itself.
#
# @param time object responding to year/month/day/hour
# @return [DateTime, Object]
def time_round(time)
  kept_fields =
    case time_step
    when :hours  then %i[year month day hour]
    when :days   then %i[year month day]
    when :months then %i[year month]
    when :years  then %i[year]
    end
  return time unless kept_fields

  DateTime.civil(*kept_fields.map { |field| time.public_send(field) })
end
196
+
197
# @return the :window option, or 0 when it is missing or nil/false
def window
  configured = @options[:window]
  configured || 0
end
200
+
201
# Yields the neighbours of +instance+ within the rule's window, in order:
# the earlier ones via instance.prev (farthest first), then +instance+
# itself, then the later ones via instance.next (nearest first).
#
# @param instance element responding to prev(n) and next(n)
# @yield [elem] each neighbouring element and the instance itself
def adjacent_matches(instance)
  span = window
  span.downto(1) { |distance| yield instance.prev(distance) }
  yield instance
  (1..span).each { |distance| yield instance.next(distance) }
end
210
+ method_accumulate :adjacent_matches
211
+
212
+ def inspect
213
+ {type: type, pattern: pattern, options: options}.to_s
214
+ end
215
+
216
# The pattern with this class's "%H-s", "%d-s", "%m-s" and "%Y-s" directives
# each rewritten to "%s". Works on a copy of the pattern and caches the
# result.
#
# @return [String]
def strftime_format
  @strftime_format ||= pattern.gsub(/%[HdmY]-s/, '%s')
end
225
+
226
# Builds a coarser rule of the same class by cutting the pattern after the
# first "/"-separated segment that carries the directive for +grain+.
#
# @param grain [Symbol] e.g. :hour(s), :day(s), :month(s), :year(s)
# @return a new rule whose :path option is the shortened pattern
# @raise [RuntimeError] when no segment carries a directive for +grain+
def round(grain)
  grain_format = time_step_to_format(grain)
  segments = pattern.split('/')
  cut_at = segments.index { |segment| segment =~ grain_format }
  raise "cannot round to :#{grain} for #{pattern}" unless cut_at

  shortened = segments.take(cut_at + 1).join('/')
  self.class.new(engine, name, type, options.merge(path: shortened))
end
233
+
234
+ private
235
+
236
# Maps a grain name to the regexp that recognises the corresponding strftime
# directive inside a pattern segment.
#
# The hour class is [Hk]; the earlier [H|k] also accepted a literal "|", so a
# segment containing "%|" was wrongly treated as an hour directive.
#
# @param step [Symbol] :hour(s), :day(s), :month(s) or :year(s)
# @return [Regexp, nil] nil for an unrecognised step
def time_step_to_format(step)
  case step
  when :hour, :hours
    /%-?[Hk]/
  when :day, :days
    /%-?d/
  when :month, :months
    /%-?m/
  when :year, :years
    /%Y/
  end
end
248
+
249
# Regexp derived from the pattern, compiled once and cached.
#
# Each supported strftime directive becomes a named capture (timestamp, year,
# month, day, hour), "*" becomes a lazy :glob capture, and whatever follows
# the pattern is collected in a trailing :rest capture.
#
# "%-H" is translated as well: time_step and time_step_to_format already
# accept it, but it used to stay in the regexp as literal text, so such
# patterns could never match real input. The trailing capture is appended
# directly rather than substituted at "$", which is line-based.
#
# @return [Regexp]
def matcher
  @matcher ||= begin
    regexp = pattern.dup
    # Epoch-style directives first, so "%Y-s" etc. are not split by the
    # plain "%Y"/"%m"/"%d"/"%H" rules below.
    regexp.gsub!(/%([YmdH]-)?s/, '(?<timestamp>\d{10})')
    regexp.gsub!('%Y', '(?<year>\d{4})')
    regexp.gsub!('%m', '(?<month>\d{2})')
    regexp.gsub!('%-m', '(?<month>\d{1,2})')
    regexp.gsub!('%d', '(?<day>\d{2})')
    regexp.gsub!('%-d', '(?<day>\d{1,2})')
    regexp.gsub!('%H', '(?<hour>\d{2})')
    regexp.gsub!('%-H', '(?<hour>\d{1,2})')
    regexp.gsub!('%k', '(?<hour>\d{2})')
    regexp.gsub!('%-k', '(?<hour>\d{1,2})')
    regexp.gsub!('*', '(?<glob>.*?)')
    regexp << '(?<rest>.*?)\z'
    Regexp.compile(regexp)
  end
end
266
+
267
# Converts a MatchData into a hash of its named captures keyed by symbol.
#
# @param match_data [MatchData, nil]
# @return [Hash, nil] nil when there is no match data
def match_data_hash(match_data = nil)
  return unless match_data.present?

  match_data.names.each_with_object({}) do |capture_name, captures|
    key = capture_name.to_sym
    captures[key] = match_data[key]
  end
end
275
+
276
# Builds the date described by the captures of a match.
#
# A :timestamp capture is read as epoch seconds; otherwise the date is built
# from whichever of :year, :month, :day and :hour were captured.
#
# @param matched_data [Hash] captures keyed by symbol
# @return [DateTime]
def matched_date(matched_data)
  timestamp = matched_data[:timestamp]
  return Time.at(timestamp.to_i).to_datetime if timestamp

  components = matched_data.values_at(:year, :month, :day, :hour).compact
  DateTime.new(*components.map(&:to_i))
end
283
+
284
# Extra element options taken from a match: the :glob capture, unless it is
# missing or is the literal "*".
#
# @param matched_data [Hash] captures keyed by symbol
# @return [Hash] either {} or { glob: value }
def matched_extra(matched_data)
  return {} unless matched_data.key?(:glob)

  glob = matched_data[:glob]
  glob == '*' ? {} : { glob: glob }
end
288
+
289
# Options handed on to elements: a copy of the rule options without the
# :path and :table entries.
#
# @return [Hash]
def options_for_elem
  withheld = %i[path table]
  @options.reject { |key, _value| withheld.include?(key) }
end
292
+ end
@@ -0,0 +1,176 @@
1
+ # The MIT License (MIT)
2
+ #
3
+ # Copyright (c) 2014-2015, VMware, Inc. All Rights Reserved.
4
+ #
5
+ # Permission is hereby granted, free of charge, to any person obtaining a copy
6
+ # of this software and associated documentation files (the "Software"), to deal
7
+ # in the Software without restriction, including without limitation the rights
8
+ # to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
9
+ # copies of the Software, and to permit persons to whom the Software is
10
+ # furnished to do so, subject to the following conditions:
11
+ #
12
+ # The above copyright notice and this permission notice shall be included in
13
+ # all copies or substantial portions of the Software.
14
+ #
15
+ # THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16
+ # IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17
+ # FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
18
+ # AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19
+ # LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20
+ # OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
21
+ # THE SOFTWARE.
22
+
23
+ require 'set'
24
+
25
+ class Masamune::DataPlan::Set < Set
26
+ EMPTY = self.new
27
+
28
+ include Masamune::Accumulate
29
+
30
+ attr_reader :rule
31
+
32
# Creates a set bound to +rule+, seeded with the members of +enum+ after they
# have been normalised by convert_enum.
#
# @param rule rule that this set's elements belong to
# @param enum [nil, Array, Set, String] initial members
def initialize(rule, enum = nil)
  @rule = rule
  initial_members = convert_enum(enum)
  super(initial_members)
end
36
+
37
# Union with +enum+ after normalising it through convert_enum; EMPTY is used
# in its place when convert_enum yields nil.
#
# @param enum [nil, Array, Set, String]
def union(enum = nil)
  members = convert_enum(enum)
  super(members || EMPTY)
end
40
+
41
# Adds +elem+ to the set after normalising it through convert_elem.
#
# @param elem [nil, Masamune::DataPlan::Elem, String]
def add(elem = nil)
  member = convert_elem(elem)
  super(member)
end
44
+
45
# Membership test for +elem+ after normalising it through convert_elem.
#
# @param elem [nil, Masamune::DataPlan::Elem, String]
def include?(elem = nil)
  member = convert_elem(elem)
  super(member)
end
48
+
49
# Yields every element whose #explode result is empty.
#
# @yield [elem]
def missing(&block)
  each do |elem|
    next unless elem.explode.empty?

    yield elem
  end
end
54
+ method_accumulate :missing, lambda { |set| set.class.new(set.rule) }
55
+
56
# Yields everything that each element's #explode yields, element by element.
#
# @yield [new_elem]
def existing(&block)
  each do |elem|
    elem.explode { |found| yield found }
  end
end
63
+ method_accumulate :existing, lambda { |set| set.class.new(set.rule) }
64
+
65
# Yields, for every element, whatever the set's rule yields from
# adjacent_matches for that element.
#
# @yield [adj_elem]
def adjacent(&block)
  each do |elem|
    @rule.adjacent_matches(elem) { |neighbour| yield neighbour }
  end
end
72
+ method_accumulate :adjacent, lambda { |set| set.class.new(set.rule) }
73
+
74
# Yields each target for which target_stale? holds against at least one of
# its existing sources. Returns EMPTY straight away for an empty set or a
# set of sources.
#
# @yield [target]
def stale(&block)
  return Masamune::DataPlan::Set::EMPTY if empty? || @rule.for_sources?

  each do |target|
    outdated = target.sources.existing.any? { |source| target_stale?(source, target) }
    yield target if outdated
  end
end
80
+ method_accumulate :stale, lambda { |set| set.class.new(set.rule) }
81
+
82
# Yields each target that is not complete?, at most once per distinct
# target. Returns EMPTY straight away for an empty set or a set of sources.
#
# @yield [target]
def incomplete(&block)
  return Masamune::DataPlan::Set::EMPTY if empty? || @rule.for_sources?

  seen = Set.new
  each do |target|
    next if target.complete?

    yield target if seen.add?(target)
  end
end
89
+ method_accumulate :incomplete, lambda { |set| set.class.new(set.rule) }
90
+
91
# Yields the targets that are missing, incomplete or stale, in that order
# and at most once per distinct target. Returns EMPTY straight away for an
# empty set or a set of sources.
#
# @yield [target]
def actionable(&block)
  return Masamune::DataPlan::Set::EMPTY if empty? || @rule.for_sources?

  seen = Set.new
  emit_once = ->(target) { yield target if seen.add?(target) }

  missing.each(&emit_once)
  incomplete.each(&emit_once)
  stale.each(&emit_once)
end
104
+ method_accumulate :actionable, lambda { |set| set.class.new(set.rule) }
105
+
106
# Yields each actionable target that has at least one existing source, at
# most once per distinct target. Returns EMPTY straight away for an empty
# set or a set of sources.
#
# @yield [target]
def updateable(&block)
  return Masamune::DataPlan::Set::EMPTY if empty? || @rule.for_sources?

  seen = Set.new
  actionable.each do |target|
    next unless seen.add?(target)

    yield target if target.sources.existing.any?
  end
end
113
+ method_accumulate :updateable, lambda { |set| set.class.new(set.rule) }
114
+
115
+ # TODO detect & warn or correct if coarser grain set is incomplete
116
# Yields each element rounded to +grain+ (elem.round(grain)), skipping
# rounded values that were already yielded.
#
# @param grain grain passed to each element's #round
# @yield [granular_elem]
def with_grain(grain, &block)
  seen = Set.new
  each do |elem|
    rounded = elem.round(grain)
    next unless seen.add?(rounded)

    yield rounded
  end
end
123
+ method_accumulate :with_grain, lambda { |set, grain| set.class.new(set.rule.round(grain)) }
124
+
125
# Collects the targets of every element into one new set of the same class,
# bound to the rule of the first element's targets. Returns EMPTY for an
# empty set or a set that already holds targets.
def targets
  return Masamune::DataPlan::Set::EMPTY if empty? || @rule.for_targets?

  combined = self.class.new(first.targets.rule)
  each { |elem| combined.merge(elem.targets) }
  combined
end
133
+
134
# Collects the sources of every element into one new set of the same class,
# bound to the rule of the first element's sources. Returns EMPTY for an
# empty set or a set that already holds sources.
def sources
  return Masamune::DataPlan::Set::EMPTY if empty? || @rule.for_sources?

  combined = self.class.new(first.sources.rule)
  each { |elem| combined.merge(elem.sources) }
  combined
end
142
+
143
+ private
144
+
145
# Normalises a would-be member: nil stays nil, an Elem is used as is, and a
# String is bound through the set's rule.
#
# @param elem [nil, Masamune::DataPlan::Elem, String]
# @raise [RuntimeError] for any other class
def convert_elem(elem)
  return nil if elem.nil?
  return elem if elem.is_a?(Masamune::DataPlan::Elem)
  return @rule.bind_input(elem) if elem.is_a?(String)

  raise "Unhandled elem class #{elem.class}"
end
156
+
157
# Normalises a collection of would-be members: nil stays nil, an Array is
# flattened and de-duplicated, a Set (or an instance of this class) is used
# as is, and a single String is wrapped in an array.
#
# @param enum [nil, Array, Set, String]
# @raise [RuntimeError] for any other class
def convert_enum(enum)
  return nil if enum.nil?
  return enum.flatten.uniq if enum.is_a?(Array)
  return enum if enum.is_a?(Set) || enum.is_a?(self.class)
  return [enum] if enum.is_a?(String)

  raise "Unhandled enum class #{enum.class}"
end
170
+
171
# A target is stale when both modification times are known (neither equals
# Elem::MISSING_MODIFIED_AT) and the source was modified at or after the
# target.
#
# @param source element responding to last_modified_at
# @param target element responding to last_modified_at
# @return [Boolean]
def target_stale?(source, target)
  unknown = Masamune::DataPlan::Elem::MISSING_MODIFIED_AT
  target_time = target.last_modified_at
  return false if target_time == unknown

  source_time = source.last_modified_at
  return false if source_time == unknown

  source_time >= target_time
end
176
+ end