masamune 0.11.0
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +7 -0
- data/LICENSE.txt +21 -0
- data/README.md +54 -0
- data/Rakefile +15 -0
- data/bin/masamune-elastic-mapreduce +4 -0
- data/bin/masamune-hive +4 -0
- data/bin/masamune-psql +4 -0
- data/bin/masamune-shell +4 -0
- data/lib/masamune.rb +56 -0
- data/lib/masamune/accumulate.rb +60 -0
- data/lib/masamune/actions.rb +38 -0
- data/lib/masamune/actions/data_flow.rb +131 -0
- data/lib/masamune/actions/date_parse.rb +75 -0
- data/lib/masamune/actions/elastic_mapreduce.rb +68 -0
- data/lib/masamune/actions/execute.rb +52 -0
- data/lib/masamune/actions/filesystem.rb +37 -0
- data/lib/masamune/actions/hadoop_filesystem.rb +40 -0
- data/lib/masamune/actions/hadoop_streaming.rb +41 -0
- data/lib/masamune/actions/hive.rb +74 -0
- data/lib/masamune/actions/postgres.rb +76 -0
- data/lib/masamune/actions/postgres_admin.rb +34 -0
- data/lib/masamune/actions/s3cmd.rb +44 -0
- data/lib/masamune/actions/transform.rb +89 -0
- data/lib/masamune/after_initialize_callbacks.rb +55 -0
- data/lib/masamune/cached_filesystem.rb +110 -0
- data/lib/masamune/commands.rb +37 -0
- data/lib/masamune/commands/elastic_mapreduce.rb +119 -0
- data/lib/masamune/commands/hadoop_filesystem.rb +57 -0
- data/lib/masamune/commands/hadoop_streaming.rb +116 -0
- data/lib/masamune/commands/hive.rb +178 -0
- data/lib/masamune/commands/interactive.rb +37 -0
- data/lib/masamune/commands/postgres.rb +128 -0
- data/lib/masamune/commands/postgres_admin.rb +72 -0
- data/lib/masamune/commands/postgres_common.rb +33 -0
- data/lib/masamune/commands/retry_with_backoff.rb +60 -0
- data/lib/masamune/commands/s3cmd.rb +70 -0
- data/lib/masamune/commands/shell.rb +202 -0
- data/lib/masamune/configuration.rb +195 -0
- data/lib/masamune/data_plan.rb +31 -0
- data/lib/masamune/data_plan/builder.rb +66 -0
- data/lib/masamune/data_plan/elem.rb +190 -0
- data/lib/masamune/data_plan/engine.rb +162 -0
- data/lib/masamune/data_plan/rule.rb +292 -0
- data/lib/masamune/data_plan/set.rb +176 -0
- data/lib/masamune/environment.rb +164 -0
- data/lib/masamune/filesystem.rb +567 -0
- data/lib/masamune/has_environment.rb +40 -0
- data/lib/masamune/helpers.rb +27 -0
- data/lib/masamune/helpers/postgres.rb +84 -0
- data/lib/masamune/io.rb +33 -0
- data/lib/masamune/last_element.rb +53 -0
- data/lib/masamune/method_logger.rb +41 -0
- data/lib/masamune/multi_io.rb +39 -0
- data/lib/masamune/schema.rb +36 -0
- data/lib/masamune/schema/catalog.rb +233 -0
- data/lib/masamune/schema/column.rb +527 -0
- data/lib/masamune/schema/dimension.rb +133 -0
- data/lib/masamune/schema/event.rb +121 -0
- data/lib/masamune/schema/fact.rb +133 -0
- data/lib/masamune/schema/map.rb +265 -0
- data/lib/masamune/schema/row.rb +133 -0
- data/lib/masamune/schema/store.rb +115 -0
- data/lib/masamune/schema/table.rb +308 -0
- data/lib/masamune/schema/table_reference.rb +76 -0
- data/lib/masamune/spec_helper.rb +23 -0
- data/lib/masamune/string_format.rb +34 -0
- data/lib/masamune/tasks/elastic_mapreduce_thor.rb +60 -0
- data/lib/masamune/tasks/hive_thor.rb +55 -0
- data/lib/masamune/tasks/postgres_thor.rb +47 -0
- data/lib/masamune/tasks/shell_thor.rb +63 -0
- data/lib/masamune/template.rb +77 -0
- data/lib/masamune/thor.rb +186 -0
- data/lib/masamune/thor_loader.rb +38 -0
- data/lib/masamune/topological_hash.rb +34 -0
- data/lib/masamune/transform.rb +47 -0
- data/lib/masamune/transform/bulk_upsert.psql.erb +64 -0
- data/lib/masamune/transform/bulk_upsert.rb +52 -0
- data/lib/masamune/transform/consolidate_dimension.rb +54 -0
- data/lib/masamune/transform/deduplicate_dimension.psql.erb +52 -0
- data/lib/masamune/transform/deduplicate_dimension.rb +53 -0
- data/lib/masamune/transform/define_event_view.hql.erb +51 -0
- data/lib/masamune/transform/define_event_view.rb +60 -0
- data/lib/masamune/transform/define_index.psql.erb +34 -0
- data/lib/masamune/transform/define_schema.hql.erb +23 -0
- data/lib/masamune/transform/define_schema.psql.erb +79 -0
- data/lib/masamune/transform/define_schema.rb +56 -0
- data/lib/masamune/transform/define_table.hql.erb +34 -0
- data/lib/masamune/transform/define_table.psql.erb +95 -0
- data/lib/masamune/transform/define_table.rb +40 -0
- data/lib/masamune/transform/define_unique.psql.erb +30 -0
- data/lib/masamune/transform/insert_reference_values.psql.erb +43 -0
- data/lib/masamune/transform/insert_reference_values.rb +64 -0
- data/lib/masamune/transform/load_dimension.rb +47 -0
- data/lib/masamune/transform/load_fact.rb +45 -0
- data/lib/masamune/transform/operator.rb +96 -0
- data/lib/masamune/transform/relabel_dimension.psql.erb +76 -0
- data/lib/masamune/transform/relabel_dimension.rb +39 -0
- data/lib/masamune/transform/rollup_fact.psql.erb +79 -0
- data/lib/masamune/transform/rollup_fact.rb +149 -0
- data/lib/masamune/transform/snapshot_dimension.psql.erb +75 -0
- data/lib/masamune/transform/snapshot_dimension.rb +74 -0
- data/lib/masamune/transform/stage_dimension.psql.erb +39 -0
- data/lib/masamune/transform/stage_dimension.rb +83 -0
- data/lib/masamune/transform/stage_fact.psql.erb +80 -0
- data/lib/masamune/transform/stage_fact.rb +111 -0
- data/lib/masamune/version.rb +25 -0
- data/spec/fixtures/aggregate.sql.erb +25 -0
- data/spec/fixtures/comment.sql.erb +27 -0
- data/spec/fixtures/invalid.sql.erb +23 -0
- data/spec/fixtures/relative.sql.erb +23 -0
- data/spec/fixtures/simple.sql.erb +28 -0
- data/spec/fixtures/whitespace.sql.erb +30 -0
- data/spec/masamune/actions/elastic_mapreduce_spec.rb +108 -0
- data/spec/masamune/actions/execute_spec.rb +50 -0
- data/spec/masamune/actions/hadoop_filesystem_spec.rb +44 -0
- data/spec/masamune/actions/hadoop_streaming_spec.rb +74 -0
- data/spec/masamune/actions/hive_spec.rb +117 -0
- data/spec/masamune/actions/postgres_admin_spec.rb +58 -0
- data/spec/masamune/actions/postgres_spec.rb +134 -0
- data/spec/masamune/actions/s3cmd_spec.rb +44 -0
- data/spec/masamune/actions/transform_spec.rb +144 -0
- data/spec/masamune/after_initialization_callbacks_spec.rb +61 -0
- data/spec/masamune/cached_filesystem_spec.rb +167 -0
- data/spec/masamune/commands/hadoop_filesystem_spec.rb +50 -0
- data/spec/masamune/commands/hadoop_streaming_spec.rb +106 -0
- data/spec/masamune/commands/hive_spec.rb +117 -0
- data/spec/masamune/commands/postgres_admin_spec.rb +69 -0
- data/spec/masamune/commands/postgres_spec.rb +100 -0
- data/spec/masamune/commands/retry_with_backoff_spec.rb +116 -0
- data/spec/masamune/commands/s3cmd_spec.rb +50 -0
- data/spec/masamune/commands/shell_spec.rb +101 -0
- data/spec/masamune/configuration_spec.rb +102 -0
- data/spec/masamune/data_plan/builder_spec.rb +91 -0
- data/spec/masamune/data_plan/elem_spec.rb +102 -0
- data/spec/masamune/data_plan/engine_spec.rb +356 -0
- data/spec/masamune/data_plan/rule_spec.rb +407 -0
- data/spec/masamune/data_plan/set_spec.rb +517 -0
- data/spec/masamune/environment_spec.rb +65 -0
- data/spec/masamune/filesystem_spec.rb +1421 -0
- data/spec/masamune/helpers/postgres_spec.rb +95 -0
- data/spec/masamune/schema/catalog_spec.rb +613 -0
- data/spec/masamune/schema/column_spec.rb +696 -0
- data/spec/masamune/schema/dimension_spec.rb +137 -0
- data/spec/masamune/schema/event_spec.rb +75 -0
- data/spec/masamune/schema/fact_spec.rb +117 -0
- data/spec/masamune/schema/map_spec.rb +593 -0
- data/spec/masamune/schema/row_spec.rb +28 -0
- data/spec/masamune/schema/store_spec.rb +49 -0
- data/spec/masamune/schema/table_spec.rb +395 -0
- data/spec/masamune/string_format_spec.rb +60 -0
- data/spec/masamune/tasks/elastic_mapreduce_thor_spec.rb +57 -0
- data/spec/masamune/tasks/hive_thor_spec.rb +75 -0
- data/spec/masamune/tasks/postgres_thor_spec.rb +42 -0
- data/spec/masamune/tasks/shell_thor_spec.rb +51 -0
- data/spec/masamune/template_spec.rb +77 -0
- data/spec/masamune/thor_spec.rb +238 -0
- data/spec/masamune/transform/bulk_upsert.dimension_spec.rb +200 -0
- data/spec/masamune/transform/consolidate_dimension_spec.rb +62 -0
- data/spec/masamune/transform/deduplicate_dimension_spec.rb +84 -0
- data/spec/masamune/transform/define_event_view_spec.rb +84 -0
- data/spec/masamune/transform/define_schema_spec.rb +83 -0
- data/spec/masamune/transform/define_table.dimension_spec.rb +306 -0
- data/spec/masamune/transform/define_table.fact_spec.rb +291 -0
- data/spec/masamune/transform/define_table.table_spec.rb +525 -0
- data/spec/masamune/transform/insert_reference_values.dimension_spec.rb +111 -0
- data/spec/masamune/transform/insert_reference_values.fact_spec.rb +149 -0
- data/spec/masamune/transform/load_dimension_spec.rb +76 -0
- data/spec/masamune/transform/load_fact_spec.rb +89 -0
- data/spec/masamune/transform/relabel_dimension_spec.rb +102 -0
- data/spec/masamune/transform/rollup_fact_spec.rb +333 -0
- data/spec/masamune/transform/snapshot_dimension_spec.rb +103 -0
- data/spec/masamune/transform/stage_dimension_spec.rb +115 -0
- data/spec/masamune/transform/stage_fact_spec.rb +204 -0
- data/spec/masamune_spec.rb +32 -0
- data/spec/spec_helper.rb +41 -0
- data/spec/support/masamune/example_group.rb +36 -0
- data/spec/support/masamune/mock_command.rb +99 -0
- data/spec/support/masamune/mock_delegate.rb +51 -0
- data/spec/support/masamune/mock_filesystem.rb +96 -0
- data/spec/support/masamune/thor_mute.rb +35 -0
- data/spec/support/rspec/example/action_example_group.rb +34 -0
- data/spec/support/rspec/example/task_example_group.rb +80 -0
- data/spec/support/rspec/example/transform_example_group.rb +36 -0
- data/spec/support/shared_examples/postgres_common_examples.rb +53 -0
- metadata +462 -0
@@ -0,0 +1,95 @@
|
|
1
|
+
# The MIT License (MIT)
|
2
|
+
#
|
3
|
+
# Copyright (c) 2014-2015, VMware, Inc. All Rights Reserved.
|
4
|
+
#
|
5
|
+
# Permission is hereby granted, free of charge, to any person obtaining a copy
|
6
|
+
# of this software and associated documentation files (the "Software"), to deal
|
7
|
+
# in the Software without restriction, including without limitation the rights
|
8
|
+
# to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
9
|
+
# copies of the Software, and to permit persons to whom the Software is
|
10
|
+
# furnished to do so, subject to the following conditions:
|
11
|
+
#
|
12
|
+
# The above copyright notice and this permission notice shall be included in
|
13
|
+
# all copies or substantial portions of the Software.
|
14
|
+
#
|
15
|
+
# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
16
|
+
# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
17
|
+
# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
18
|
+
# AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
19
|
+
# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
20
|
+
# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
|
21
|
+
# THE SOFTWARE.
|
22
|
+
|
23
|
+
require 'spec_helper'
|
24
|
+
|
25
|
+
describe Masamune::Helpers::Postgres do
|
26
|
+
# Shared fixtures: a bare test double as the environment, and the helper under test built from it.
let(:environment) { double }
let(:instance) { described_class.new(environment) }
|
28
|
+
|
29
|
+
# Exercises table_exists? against a stubbed `postgres` call that yields three
# table-name lines (' foo', ' bar', ' baz'); database_exists? is stubbed to true.
describe '#table_exists?' do
  before do
    expect(instance).to receive(:database_exists?).and_return(true)
    expect(instance).to receive(:postgres).with(hash_including(:exec, :tuple_output)).and_yield(' foo').and_yield(' bar').and_yield(' baz')
  end

  subject { instance.table_exists?(table) }

  context 'when table exists' do
    let(:table) { 'foo' }
    it { is_expected.to eq(true) }
  end

  context 'when other table exists' do
    let(:table) { 'baz' }
    it { is_expected.to eq(true) }
  end

  context 'when table does not exist' do
    let(:table) { 'zombo' }
    it { is_expected.to eq(false) }
  end
end
|
52
|
+
|
53
|
+
# Exercises table_last_modified_at('foo', options) with and without the
# :last_modified_at option; `postgres` output is stubbed per context.
describe '#table_last_modified_at' do
  subject { instance.table_last_modified_at('foo', options) }

  context 'with last_modified_at option' do
    before do
      expect(instance).to receive(:table_exists?).and_return(true)
      expect(instance).to receive(:postgres).with(hash_including(:exec, :tuple_output)).and_yield(output)
    end

    let(:options) { { last_modified_at: 'last_modified_at' } }

    context 'with expected output' do
      let(:output) { ' 2014-06-04 10:20:19.539656-07' }

      it { is_expected.to be_a(Time) }
      # NOTE(review): the expected value has :00 seconds while the yielded
      # timestamp has :19 -- presumably the helper truncates to the minute; confirm.
      it { is_expected.to eq(Time.parse('2014-06-04 17:20:00 +0000')) }
    end

    context 'with blank output' do
      let(:output) { ' ' }

      it { is_expected.to be_nil }
    end

    context 'with invalid output' do
      let(:output) { ' 2XXX' }

      it { is_expected.to be_nil }
    end
  end

  context 'without last_modified_at option' do
    let(:options) { {} }

    # Neither the existence check nor the query may be issued in this case.
    before do
      expect(instance).to receive(:table_exists?).never
      expect(instance).to receive(:postgres).never
    end

    it { is_expected.to be_nil }
  end
end
|
95
|
+
end
|
@@ -0,0 +1,613 @@
|
|
1
|
+
# The MIT License (MIT)
|
2
|
+
#
|
3
|
+
# Copyright (c) 2014-2015, VMware, Inc. All Rights Reserved.
|
4
|
+
#
|
5
|
+
# Permission is hereby granted, free of charge, to any person obtaining a copy
|
6
|
+
# of this software and associated documentation files (the "Software"), to deal
|
7
|
+
# in the Software without restriction, including without limitation the rights
|
8
|
+
# to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
9
|
+
# copies of the Software, and to permit persons to whom the Software is
|
10
|
+
# furnished to do so, subject to the following conditions:
|
11
|
+
#
|
12
|
+
# The above copyright notice and this permission notice shall be included in
|
13
|
+
# all copies or substantial portions of the Software.
|
14
|
+
#
|
15
|
+
# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
16
|
+
# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
17
|
+
# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
18
|
+
# AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
19
|
+
# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
20
|
+
# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
|
21
|
+
# THE SOFTWARE.
|
22
|
+
|
23
|
+
require 'spec_helper'
|
24
|
+
|
25
|
+
describe Masamune::Schema::Catalog do
|
26
|
+
# Shared fixtures: the catalog under test plus shortcuts to its three stores.
let(:environment) { double }
let(:instance) { described_class.new(environment) }
let(:postgres) { instance.postgres }
let(:hive) { instance.hive }
let(:files) { instance.files }
|
31
|
+
|
32
|
+
# Dynamic `<id>_<kind>` accessors on a store: a defined dimension is returned,
# an undefined one yields nil, and an unknown kind suffix raises ArgumentError.
describe '#method_missing' do
  before do
    instance.schema :postgres do
      dimension 'foo', type: :two
    end
  end

  it { expect(postgres.foo_dimension.id).to eq(:foo) }
  it { expect(postgres.bar_dimension).to be_nil }
  it { expect { postgres.foo_baz }.to raise_error ArgumentError, "unknown attribute type 'baz'" }
end
|
43
|
+
|
44
|
+
# Store lookup by symbol: known stores are returned, an unknown one raises.
describe '#[]' do
  context 'with :postgres' do
    subject { instance[:postgres] }
    it { is_expected.to eq(postgres) }
  end

  context 'with :hive' do
    subject { instance[:hive] }
    it { is_expected.to eq(hive) }
  end

  context 'with :mysql' do
    subject { instance[:mysql] }
    it { expect { subject }.to raise_error ArgumentError, "unknown type: 'mysql'" }
  end
end
|
58
|
+
|
59
|
+
# Loads three .psql and three .hql paths through instance.load and checks what
# each store reports via `extra`, `extra(:pre)` and `extra(:post)`.
# Declared with `describe` to match the sibling method-level groups.
describe '#load' do
  let(:postgres_extra) { %w(/tmp/schema.psql /tmp/00_schema.psql /tmp/20_schema.psql) }
  let(:hive_extra) { %w(/tmp/schema.hql /tmp/00_schema.hql /tmp/20_schema.hql) }
  let(:extra) { postgres_extra + hive_extra }

  before do
    extra.each do |e|
      instance.load(e)
    end
  end

  it 'should load postgres extra in order' do
    expect(instance.postgres.extra).to eq(postgres_extra)
    expect(instance.postgres.extra(:pre).size).to eq(2)
    expect(instance.postgres.extra(:post).size).to eq(1)
  end

  it 'should load hive extra in order' do
    expect(instance.hive.extra).to eq(hive_extra)
    expect(instance.hive.extra(:pre).size).to eq(2)
    expect(instance.hive.extra(:post).size).to eq(1)
  end
end
|
82
|
+
|
83
|
+
describe '#schema' do
|
84
|
+
# Calling schema with no store argument must raise ArgumentError.
context 'when schema does not define store' do
  subject(:schema) do
    instance.schema do
      dimension 'foo', type: :two
      dimension 'bar', type: :two
    end
  end

  it { expect { schema }.to raise_error ArgumentError, "schema store arguments required" }
end
|
94
|
+
|
95
|
+
# Calling schema with a store that is not recognised (:mysql) must raise ArgumentError.
context 'when schema defines unknown store' do
  subject(:schema) do
    instance.schema :mysql do
      dimension 'foo', type: :two
      dimension 'bar', type: :two
    end
  end

  it { expect { schema }.to raise_error ArgumentError, "unknown type: 'mysql'" }
end
|
105
|
+
|
106
|
+
# Dimensions declared in a :postgres schema are registered under their symbol
# ids and reachable through the `<id>_dimension` accessors.
context 'when schema contains dimensions' do
  before do
    instance.schema :postgres do
      dimension 'foo', type: :two
      dimension 'bar', type: :two
    end
  end

  it { expect(postgres.dimensions).to include :foo }
  it { expect(postgres.dimensions).to include :bar }
  it { expect(postgres.foo_dimension.id).to eq(:foo) }
  it { expect(postgres.bar_dimension.id).to eq(:bar) }
end
|
119
|
+
|
120
|
+
# Columns declared inside one dimension must not leak into another dimension.
context 'when schema contains columns' do
  before do
    instance.schema :postgres do
      dimension 'table_one', type: :two do
        column 'column_one'
        column 'column_two'
      end

      dimension 'table_two', type: :two do
        column 'column_three'
        column 'column_four'
      end
    end
  end

  let(:table_one_columns) { postgres.table_one_dimension.columns }
  let(:table_two_columns) { postgres.table_two_dimension.columns }

  it { expect(table_one_columns).to include :column_one }
  it { expect(table_one_columns).to include :column_two }
  it { expect(table_one_columns).to_not include :column_three }
  it { expect(table_one_columns).to_not include :column_four }
  it { expect(table_two_columns).to_not include :column_one }
  it { expect(table_two_columns).to_not include :column_two }
  it { expect(table_two_columns).to include :column_three }
  it { expect(table_two_columns).to include :column_four }
end
|
147
|
+
|
148
|
+
# Rows declared inside a dimension are kept in declaration order with their values.
context 'when schema contains columns and rows' do
  before do
    instance.schema :postgres do
      dimension 'table_one', type: :two do
        column 'column_one', type: :integer
        column 'column_two', type: :string
        row column_one: 1, column_two: 'a'
        row column_one: 2, column_two: 'b'
      end
    end
  end

  let(:table_one_rows) { postgres.table_one_dimension.rows }

  it { expect(table_one_rows[0].values).to include(column_one: 1, column_two: 'a') }
  it { expect(table_one_rows[1].values).to include(column_one: 2, column_two: 'b') }
end
|
165
|
+
|
166
|
+
# References are keyed by dimension id; a labelled reference is keyed as
# `<label>_<id>` (:quux_bar) and exposes its label.
context 'when schema contains references' do
  before do
    instance.schema :postgres do
      dimension 'foo', type: :one
      dimension 'bar', type: :one
      dimension 'baz', type: :two do
        references :foo
        references :bar, label: :quux
      end
    end
  end

  subject(:references) { postgres.baz_dimension.references }

  it { is_expected.to include :foo }
  it { is_expected.to include :quux_bar }
  it { expect(references[:foo].label).to be_nil }
  it { expect(references[:quux_bar].label).to eq(:quux) }
end
|
185
|
+
|
186
|
+
# A column flagged surrogate_key: true is present in the dimension's columns,
# and no :id column appears alongside it.
context 'when schema contains overrides' do
  before do
    instance.schema :postgres do
      dimension 'cluster', type: :mini do
        column 'uuid', type: :uuid, surrogate_key: true
        column 'name', type: :string, unique: true
        column 'description', type: :string

        row name: 'current_database()', attributes: {default: true}
      end
    end
  end

  subject { postgres.cluster_dimension.columns }

  it { is_expected.to include :uuid }
  it { is_expected.to_not include :id }
end
|
204
|
+
|
205
|
+
# Facts expose their dimension references and their measures, including the
# aggregate declared for each measure.
context 'when schema contains facts' do
  before do
    instance.schema :postgres do
      dimension 'dimension_one', type: :two do
        column 'column_one'
        column 'column_two'
      end

      fact 'fact_one' do
        references :dimension_one
        measure 'measure_one', aggregate: :sum
      end

      fact 'fact_two' do
        references :dimension_one
        measure 'measure_two', aggregate: :average
      end
    end
  end

  let(:fact_one) { postgres.fact_one_fact }
  let(:fact_two) { postgres.fact_two_fact }

  it { expect(fact_one.references).to include :dimension_one }
  it { expect(fact_one.measures).to include :measure_one }
  it { expect(fact_one.measures[:measure_one].aggregate).to eq(:sum) }
  it { expect(fact_two.references).to include :dimension_one }
  it { expect(fact_two.measures).to include :measure_two }
  it { expect(fact_two.measures[:measure_two].aggregate).to eq(:average) }
end
|
235
|
+
|
236
|
+
# A fact declared with a partition: option reports that pattern via `partition`.
context 'when schema contains fact with partition table' do
  before do
    instance.schema :hive do
      fact 'visits', partition: 'y%Ym%m' do
        measure 'count', aggregate: :sum
      end
    end
  end

  it { expect(hive.visits_fact.partition).to eq('y%Ym%m') }
  it { expect(hive.visits_fact.measures).to include :count }
  it { expect(hive.visits_fact.measures[:count].aggregate).to eq(:sum) }
end
|
249
|
+
|
250
|
+
# Partition columns declared inside a fact are listed under `partitions`.
context 'when schema contains fact with partition columns' do
  before do
    instance.schema :hive do
      fact 'visits' do
        partition 'y', type: :integer
        partition 'm', type: :integer
        partition 'd', type: :integer
        measure 'count', aggregate: :sum
      end
    end
  end

  it { expect(hive.visits_fact.partitions).to include :y }
  it { expect(hive.visits_fact.partitions).to include :m }
  it { expect(hive.visits_fact.partitions).to include :d }
  it { expect(hive.visits_fact.measures).to include :count }
  it { expect(hive.visits_fact.measures[:count].aggregate).to eq(:sum) }
end
|
268
|
+
|
269
|
+
# A degenerate reference needs no declared dimension; it shows up both in the
# fact's references and as a `<id>_type_id` column.
context 'when schema contains fact with degenerate dimension references' do
  before do
    instance.schema :hive do
      fact 'visits' do
        references :message_kind, degenerate: true
        measure 'count', aggregate: :sum
      end
    end
  end

  it { expect(hive.visits_fact.references).to include :message_kind }
  it { expect(hive.visits_fact.columns).to include :message_kind_type_id }
  it { expect(hive.visits_fact.measures).to include :count }
  it { expect(hive.visits_fact.measures[:count].aggregate).to eq(:sum) }
end
|
284
|
+
|
285
|
+
# A fact declared with a single grain is reachable as `<id>_<grain>_fact`.
context 'when schema contains fact with a single grain' do
  before do
    instance.schema :postgres do
      dimension 'user', type: :two do
        column 'user_id'
      end

      fact 'visits', grain: 'hourly' do
        references :user
        measure 'count'
      end
    end
  end

  let(:visits_hourly) { postgres.visits_hourly_fact }

  it { expect(visits_hourly.name).to eq('visits_hourly_fact') }
  it { expect(visits_hourly.references).to include :user }
  it { expect(visits_hourly.measures).to include :count }
end
|
305
|
+
|
306
|
+
# A fact declared with several grains yields one fact per grain, each carrying
# the same references and measures.
context 'when schema contains fact with multiple grain' do
  before do
    instance.schema :postgres do
      dimension 'user', type: :two do
        column 'user_id'
      end

      fact 'visits', grain: %w(hourly daily monthly) do
        references :user
        measure 'count'
      end
    end
  end

  let(:visits_hourly) { postgres.visits_hourly_fact }
  let(:visits_daily) { postgres.visits_daily_fact }
  let(:visits_monthly) { postgres.visits_monthly_fact }

  it { expect(visits_hourly.name).to eq('visits_hourly_fact') }
  it { expect(visits_hourly.references).to include :user }
  it { expect(visits_hourly.measures).to include :count }
  it { expect(visits_daily.name).to eq('visits_daily_fact') }
  it { expect(visits_daily.references).to include :user }
  it { expect(visits_daily.measures).to include :count }
  it { expect(visits_monthly.name).to eq('visits_monthly_fact') }
  it { expect(visits_monthly.references).to include :user }
  it { expect(visits_monthly.measures).to include :count }
end
|
334
|
+
|
335
|
+
# Events declared in a :hive schema expose the attributes declared inside them.
context 'when schema contains events' do
  before do
    instance.schema :hive do
      event 'event_one' do
        attribute 'attribute_one'
        attribute 'attribute_two'
      end

      event 'event_two' do
        attribute 'attribute_three'
        attribute 'attribute_four'
      end
    end
  end

  let(:event_one) { hive.event_one_event }
  let(:event_two) { hive.event_two_event }

  it { expect(event_one.attributes).to include :attribute_one }
  it { expect(event_one.attributes).to include :attribute_two }
  it { expect(event_two.attributes).to include :attribute_three }
  it { expect(event_two.attributes).to include :attribute_four }
end
|
358
|
+
|
359
|
+
# A file column named `store.dimension.column` resolves to a reference on that
# dimension; a plain column name carries no reference.
context 'when schema contains file' do
  before do
    instance.schema :postgres do
      dimension 'user_account', type: :mini do
        column 'name', type: :string
      end
    end

    instance.schema :files do
      file 'users' do
        column 'postgres.user_account.name', type: :string
        column 'admin', type: :boolean
      end
    end
  end

  subject(:file) { files.users }

  it 'should expect dot notation column names to reference dimensions' do
    expect(file.columns).to include :user_account_type_name
    expect(file.columns).to include :admin
    expect(file.columns[:user_account_type_name].reference).to eq(postgres.dimensions[:user_account])
    expect(file.columns[:admin].reference).to be_nil
  end
end
|
384
|
+
|
385
|
+
# headers:/format: given on a file apply to that file's store only; the
# enclosing store and files without overrides keep headers=true, format=:csv.
context 'when schema contains file with headers & format override' do
  before do
    instance.schema :postgres do
      file 'override', headers: false, format: :tsv do; end
      file 'default' do; end
    end
  end

  it 'should override store format' do
    expect(postgres.headers).to eq(true)
    expect(postgres.format).to eq(:csv)
    expect(postgres.override_file.store.headers).to eq(false)
    expect(postgres.override_file.store.format).to eq(:tsv)
    expect(postgres.default_file.store.headers).to eq(true)
    expect(postgres.default_file.store.format).to eq(:csv)
  end
end
|
402
|
+
|
403
|
+
# A dotted column name pointing at a dimension that was never declared must raise.
context 'when schema contains file with invalid reference' do
  subject(:schema) do
    instance.schema :postgres do
      file 'users' do
        column 'user_account.name', type: :string
        column 'admin', type: :boolean
      end
    end
  end

  it 'should raise an exception' do
    # Parenthesized so Ruby does not warn about an ambiguous regexp argument.
    expect { schema }.to raise_error(/dimension user_account not defined/)
  end
end
|
417
|
+
|
418
|
+
# A map declared from a file to a dimension with a row block can be looked up
# on the source file and carries a non-nil function.
context 'when schema contains map from: file' do
  before do
    instance.schema :postgres do
      dimension 'user_account_state', type: :mini do
        column 'name', type: :string
      end

      dimension 'user', type: :two do
        references :user_account_state
        column 'tenant_id', type: :integer, natural_key: true
        column 'user_id', type: :integer, natural_key: true
      end
    end

    instance.schema :files do
      file 'users' do
        column 'id', type: :integer
        column 'tenant_id', type: :integer
        column 'updated_at', type: :timestamp
        column 'deleted_at', type: :timestamp
      end

      map from: files.users, to: postgres.user_dimension do |row|
        {
          'tenant_id' => row[:tenant_id],
          'user_id' => row[:id],
          'user_account_state.name' => row[:deleted_at] ? 'deleted' : 'active',
          'start_at' => row[:updated_at],
          'delta' => 0
        }
      end
    end
  end

  subject(:map) { files.users.map(to: postgres.user_dimension) }

  it 'constructs map' do
    expect(map.function).to_not be_nil
  end
end
|
458
|
+
|
459
|
+
# A map declared from an event to a dimension with a row block can be looked up
# on the source event and carries a non-nil function.
context 'when schema contains map from: event' do
  before do
    instance.schema :postgres do
      dimension 'user', type: :mini do
        column 'user_id', type: :integer, natural_key: true
        column 'name', type: :string
      end

      event 'users' do
        attribute 'id', type: :integer, immutable: true
        attribute 'name', type: :string
      end

      map from: postgres.users_event, to: postgres.user_dimension do |row|
        {
          'user_id' => row[:id],
          'name' => row[:name_now]
        }
      end
    end
  end

  subject(:map) { postgres.users_event.map(to: postgres.user_dimension) }

  it 'constructs map' do
    expect(map.function).to_not be_nil
  end
end
|
487
|
+
|
488
|
+
# A map declared with no arguments at all must be rejected for lacking from:.
context 'when schema contains map missing the from: field' do
  subject(:schema) do
    instance.schema :postgres do
      map do |row|
        {
          id: row[:id]
        }
      end
    end
  end

  it 'should raise an exception' do
    # Parenthesized so Ruby does not warn about an ambiguous regexp argument.
    expect { schema }.to raise_error(/invalid map, from: is missing/)
  end
end
|
503
|
+
|
504
|
+
# A map given a positional argument (:x) instead of options is rejected with
# the same "from: is missing" error.
context 'when schema contains map with invalid options' do
  subject(:schema) do
    instance.schema :postgres do
      map :x do |row|
        {
          id: row[:id]
        }
      end
    end
  end

  it 'should raise an exception' do
    # Parenthesized so Ruby does not warn about an ambiguous regexp argument.
    expect { schema }.to raise_error(/invalid map, from: is missing/)
  end
end
|
519
|
+
|
520
|
+
# A map with from: but no to: must be rejected, naming the source in the message.
context 'when schema contains map missing the to: field' do
  subject(:schema) do
    instance.schema :postgres do
      file 'users' do; end

      map from: postgres.users_file do
        field 'tenant_id'
      end
    end
  end

  it 'should raise an exception' do
    # Parenthesized so Ruby does not warn about an ambiguous regexp argument.
    expect { schema }.to raise_error(/invalid map from: 'users', to: is missing/)
  end
end
|
535
|
+
|
536
|
+
# Files and dimensions can be addressed with symbol keys when declaring and
# looking up a map.
context 'when schema addressed with symbols' do
  before do
    instance.schema :postgres do
      dimension 'user', type: :one do; end
      file 'users' do; end

      map from: postgres.files[:users], to: postgres.dimensions[:user] do
        field 'tenant_id'
      end
    end
  end

  subject(:map) { postgres.files[:users].map(to: postgres.dimensions[:user]) }

  it 'should construct map' do
    is_expected.to_not be_nil
  end
end
|
554
|
+
|
555
|
+
# Files and dimensions can be addressed with string keys when declaring and
# looking up a map.
context 'when schema addressed with strings' do
  before do
    instance.schema :postgres do
      dimension 'user', type: :one do; end
      file 'users' do; end

      map from: postgres.files['users'], to: postgres.dimensions['user'] do
        field 'tenant_id'
      end
    end
  end

  subject(:map) { postgres.files['users'].map(to: postgres.dimensions['user']) }

  it 'should construct map' do
    is_expected.to_not be_nil
  end
end
|
573
|
+
end
|
574
|
+
|
575
|
+
# Resolves plain, `table.column` and `label_table.column` names through the
# postgres store. Labelled with `#` because the subject calls it on an instance.
describe '#dereference_column' do
  before do
    instance.schema :postgres do
      dimension 'table_one', type: :two do
        column 'column_one'
      end

      dimension 'table_two', type: :two do
        references :table_one
        references :table_one, label: :label_one

        column 'column_two'
      end
    end
  end

  subject(:result) { postgres.dereference_column(input) }

  context 'with a column name' do
    let(:input) { 'column_two' }
    it { expect(result.name).to eq(:column_two) }
  end

  context 'with a table.column name' do
    let(:input) { 'table_one.column_one' }
    it { expect(result.name).to eq(:table_one_dimension_column_one) }
  end

  context 'with a labeled table.column name' do
    let(:input) { 'label_one_table_one.column_one' }
    it { expect(result.name).to eq(:label_one_table_one_dimension_column_one) }
  end

  context 'with an undefined table.column name' do
    let(:input) { 'undef.column_one' }
    it { expect { result }.to raise_error ArgumentError, /dimension undef not defined/ }
  end
end
|
613
|
+
end
|