duckdb 0.7.2-dev1901.0 → 0.7.2-dev2144.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/binding.gyp +2 -0
- package/package.json +1 -1
- package/src/duckdb/extension/parquet/include/parquet_writer.hpp +1 -1
- package/src/duckdb/extension/parquet/parquet_metadata.cpp +4 -2
- package/src/duckdb/src/catalog/catalog_entry/duck_index_entry.cpp +1 -1
- package/src/duckdb/src/common/arrow/arrow_appender.cpp +69 -44
- package/src/duckdb/src/common/arrow/arrow_converter.cpp +1 -1
- package/src/duckdb/src/common/arrow/arrow_wrapper.cpp +20 -2
- package/src/duckdb/src/common/box_renderer.cpp +4 -2
- package/src/duckdb/src/common/constants.cpp +10 -1
- package/src/duckdb/src/common/filename_pattern.cpp +41 -0
- package/src/duckdb/src/common/hive_partitioning.cpp +144 -15
- package/src/duckdb/src/common/radix_partitioning.cpp +101 -369
- package/src/duckdb/src/common/row_operations/row_aggregate.cpp +8 -9
- package/src/duckdb/src/common/row_operations/row_external.cpp +1 -1
- package/src/duckdb/src/common/row_operations/row_gather.cpp +5 -3
- package/src/duckdb/src/common/row_operations/row_match.cpp +117 -22
- package/src/duckdb/src/common/row_operations/row_scatter.cpp +2 -2
- package/src/duckdb/src/common/sort/partition_state.cpp +1 -1
- package/src/duckdb/src/common/sort/sort_state.cpp +2 -1
- package/src/duckdb/src/common/sort/sorted_block.cpp +1 -1
- package/src/duckdb/src/common/types/{column_data_allocator.cpp → column/column_data_allocator.cpp} +2 -2
- package/src/duckdb/src/common/types/{column_data_collection.cpp → column/column_data_collection.cpp} +22 -4
- package/src/duckdb/src/common/types/{column_data_collection_segment.cpp → column/column_data_collection_segment.cpp} +2 -1
- package/src/duckdb/src/common/types/{column_data_consumer.cpp → column/column_data_consumer.cpp} +1 -1
- package/src/duckdb/src/common/types/{partitioned_column_data.cpp → column/partitioned_column_data.cpp} +11 -9
- package/src/duckdb/src/common/types/row/partitioned_tuple_data.cpp +316 -0
- package/src/duckdb/src/common/types/{row_data_collection.cpp → row/row_data_collection.cpp} +1 -1
- package/src/duckdb/src/common/types/{row_data_collection_scanner.cpp → row/row_data_collection_scanner.cpp} +2 -2
- package/src/duckdb/src/common/types/{row_layout.cpp → row/row_layout.cpp} +1 -1
- package/src/duckdb/src/common/types/row/tuple_data_allocator.cpp +465 -0
- package/src/duckdb/src/common/types/row/tuple_data_collection.cpp +511 -0
- package/src/duckdb/src/common/types/row/tuple_data_iterator.cpp +96 -0
- package/src/duckdb/src/common/types/row/tuple_data_layout.cpp +119 -0
- package/src/duckdb/src/common/types/row/tuple_data_scatter_gather.cpp +1200 -0
- package/src/duckdb/src/common/types/row/tuple_data_segment.cpp +170 -0
- package/src/duckdb/src/common/types/vector.cpp +1 -1
- package/src/duckdb/src/execution/aggregate_hashtable.cpp +252 -290
- package/src/duckdb/src/execution/join_hashtable.cpp +192 -328
- package/src/duckdb/src/execution/operator/aggregate/physical_window.cpp +4 -4
- package/src/duckdb/src/execution/operator/helper/physical_execute.cpp +3 -3
- package/src/duckdb/src/execution/operator/helper/physical_limit_percent.cpp +2 -3
- package/src/duckdb/src/execution/operator/helper/physical_result_collector.cpp +2 -3
- package/src/duckdb/src/execution/operator/join/perfect_hash_join_executor.cpp +36 -21
- package/src/duckdb/src/execution/operator/join/physical_blockwise_nl_join.cpp +2 -2
- package/src/duckdb/src/execution/operator/join/physical_cross_product.cpp +1 -1
- package/src/duckdb/src/execution/operator/join/physical_delim_join.cpp +2 -2
- package/src/duckdb/src/execution/operator/join/physical_hash_join.cpp +166 -144
- package/src/duckdb/src/execution/operator/join/physical_index_join.cpp +5 -5
- package/src/duckdb/src/execution/operator/join/physical_join.cpp +2 -10
- package/src/duckdb/src/execution/operator/join/physical_positional_join.cpp +0 -1
- package/src/duckdb/src/execution/operator/order/physical_top_n.cpp +2 -2
- package/src/duckdb/src/execution/operator/persistent/physical_copy_to_file.cpp +13 -11
- package/src/duckdb/src/execution/operator/persistent/physical_delete.cpp +3 -2
- package/src/duckdb/src/execution/operator/persistent/physical_export.cpp +25 -24
- package/src/duckdb/src/execution/operator/persistent/physical_insert.cpp +1 -1
- package/src/duckdb/src/execution/operator/persistent/physical_update.cpp +4 -3
- package/src/duckdb/src/execution/operator/schema/physical_create_type.cpp +1 -1
- package/src/duckdb/src/execution/operator/set/physical_recursive_cte.cpp +3 -3
- package/src/duckdb/src/execution/partitionable_hashtable.cpp +9 -37
- package/src/duckdb/src/execution/physical_operator.cpp +1 -1
- package/src/duckdb/src/execution/physical_plan/plan_comparison_join.cpp +19 -18
- package/src/duckdb/src/execution/physical_plan/plan_copy_to_file.cpp +2 -1
- package/src/duckdb/src/execution/physical_plan/plan_execute.cpp +2 -2
- package/src/duckdb/src/execution/physical_plan/plan_explain.cpp +5 -6
- package/src/duckdb/src/execution/physical_plan/plan_expression_get.cpp +2 -2
- package/src/duckdb/src/execution/physical_plan/plan_recursive_cte.cpp +3 -3
- package/src/duckdb/src/execution/physical_plan_generator.cpp +1 -1
- package/src/duckdb/src/execution/radix_partitioned_hashtable.cpp +39 -17
- package/src/duckdb/src/function/aggregate/sorted_aggregate_function.cpp +2 -2
- package/src/duckdb/src/function/table/pragma_detailed_profiling_output.cpp +5 -5
- package/src/duckdb/src/function/table/pragma_last_profiling_output.cpp +2 -2
- package/src/duckdb/src/function/table/version/pragma_version.cpp +2 -2
- package/src/duckdb/src/include/duckdb/catalog/catalog_entry/index_catalog_entry.hpp +1 -1
- package/src/duckdb/src/include/duckdb/common/arrow/arrow_appender.hpp +1 -1
- package/src/duckdb/src/include/duckdb/common/constants.hpp +2 -0
- package/src/duckdb/src/include/duckdb/common/exception.hpp +3 -0
- package/src/duckdb/src/include/duckdb/common/fast_mem.hpp +528 -0
- package/src/duckdb/src/include/duckdb/common/filename_pattern.hpp +34 -0
- package/src/duckdb/src/include/duckdb/common/helper.hpp +10 -0
- package/src/duckdb/src/include/duckdb/common/hive_partitioning.hpp +13 -3
- package/src/duckdb/src/include/duckdb/common/optional_ptr.hpp +8 -0
- package/src/duckdb/src/include/duckdb/common/perfect_map_set.hpp +34 -0
- package/src/duckdb/src/include/duckdb/common/radix_partitioning.hpp +80 -27
- package/src/duckdb/src/include/duckdb/common/reference_map.hpp +38 -0
- package/src/duckdb/src/include/duckdb/common/row_operations/row_operations.hpp +7 -6
- package/src/duckdb/src/include/duckdb/common/sort/comparators.hpp +1 -1
- package/src/duckdb/src/include/duckdb/common/sort/partition_state.hpp +1 -1
- package/src/duckdb/src/include/duckdb/common/sort/sort.hpp +1 -1
- package/src/duckdb/src/include/duckdb/common/sort/sorted_block.hpp +2 -2
- package/src/duckdb/src/include/duckdb/common/types/batched_data_collection.hpp +1 -1
- package/src/duckdb/src/include/duckdb/common/types/{column_data_allocator.hpp → column/column_data_allocator.hpp} +4 -4
- package/src/duckdb/src/include/duckdb/common/types/{column_data_collection.hpp → column/column_data_collection.hpp} +2 -2
- package/src/duckdb/src/include/duckdb/common/types/{column_data_collection_iterators.hpp → column/column_data_collection_iterators.hpp} +2 -2
- package/src/duckdb/src/include/duckdb/common/types/{column_data_collection_segment.hpp → column/column_data_collection_segment.hpp} +3 -3
- package/src/duckdb/src/include/duckdb/common/types/{column_data_consumer.hpp → column/column_data_consumer.hpp} +8 -4
- package/src/duckdb/src/include/duckdb/common/types/{column_data_scan_states.hpp → column/column_data_scan_states.hpp} +1 -1
- package/src/duckdb/src/include/duckdb/common/types/{partitioned_column_data.hpp → column/partitioned_column_data.hpp} +15 -7
- package/src/duckdb/src/include/duckdb/common/types/row/partitioned_tuple_data.hpp +140 -0
- package/src/duckdb/src/include/duckdb/common/types/{row_data_collection.hpp → row/row_data_collection.hpp} +1 -1
- package/src/duckdb/src/include/duckdb/common/types/{row_data_collection_scanner.hpp → row/row_data_collection_scanner.hpp} +2 -2
- package/src/duckdb/src/include/duckdb/common/types/{row_layout.hpp → row/row_layout.hpp} +3 -1
- package/src/duckdb/src/include/duckdb/common/types/row/tuple_data_allocator.hpp +116 -0
- package/src/duckdb/src/include/duckdb/common/types/row/tuple_data_collection.hpp +239 -0
- package/src/duckdb/src/include/duckdb/common/types/row/tuple_data_iterator.hpp +64 -0
- package/src/duckdb/src/include/duckdb/common/types/row/tuple_data_layout.hpp +113 -0
- package/src/duckdb/src/include/duckdb/common/types/row/tuple_data_segment.hpp +124 -0
- package/src/duckdb/src/include/duckdb/common/types/row/tuple_data_states.hpp +74 -0
- package/src/duckdb/src/include/duckdb/common/types/validity_mask.hpp +3 -0
- package/src/duckdb/src/include/duckdb/common/types/value.hpp +4 -12
- package/src/duckdb/src/include/duckdb/execution/aggregate_hashtable.hpp +34 -31
- package/src/duckdb/src/include/duckdb/execution/base_aggregate_hashtable.hpp +2 -2
- package/src/duckdb/src/include/duckdb/execution/execution_context.hpp +3 -2
- package/src/duckdb/src/include/duckdb/execution/expression_executor.hpp +1 -1
- package/src/duckdb/src/include/duckdb/execution/join_hashtable.hpp +41 -67
- package/src/duckdb/src/include/duckdb/execution/nested_loop_join.hpp +1 -1
- package/src/duckdb/src/include/duckdb/execution/operator/helper/physical_execute.hpp +2 -2
- package/src/duckdb/src/include/duckdb/execution/operator/helper/physical_result_collector.hpp +1 -1
- package/src/duckdb/src/include/duckdb/execution/operator/join/outer_join_marker.hpp +2 -2
- package/src/duckdb/src/include/duckdb/execution/operator/join/perfect_hash_join_executor.hpp +1 -1
- package/src/duckdb/src/include/duckdb/execution/operator/join/physical_cross_product.hpp +1 -1
- package/src/duckdb/src/include/duckdb/execution/operator/join/physical_hash_join.hpp +0 -2
- package/src/duckdb/src/include/duckdb/execution/operator/join/physical_index_join.hpp +2 -2
- package/src/duckdb/src/include/duckdb/execution/operator/join/physical_positional_join.hpp +1 -1
- package/src/duckdb/src/include/duckdb/execution/operator/persistent/physical_copy_to_file.hpp +4 -1
- package/src/duckdb/src/include/duckdb/execution/operator/scan/physical_column_data_scan.hpp +1 -1
- package/src/duckdb/src/include/duckdb/execution/operator/set/physical_recursive_cte.hpp +1 -1
- package/src/duckdb/src/include/duckdb/execution/partitionable_hashtable.hpp +2 -2
- package/src/duckdb/src/include/duckdb/main/materialized_query_result.hpp +1 -1
- package/src/duckdb/src/include/duckdb/main/query_result.hpp +14 -1
- package/src/duckdb/src/include/duckdb/optimizer/expression_rewriter.hpp +3 -3
- package/src/duckdb/src/include/duckdb/optimizer/join_order/cardinality_estimator.hpp +16 -16
- package/src/duckdb/src/include/duckdb/optimizer/join_order/join_node.hpp +8 -8
- package/src/duckdb/src/include/duckdb/optimizer/join_order/join_order_optimizer.hpp +23 -15
- package/src/duckdb/src/include/duckdb/optimizer/join_order/join_relation.hpp +9 -10
- package/src/duckdb/src/include/duckdb/optimizer/join_order/query_graph.hpp +18 -11
- package/src/duckdb/src/include/duckdb/parallel/meta_pipeline.hpp +1 -1
- package/src/duckdb/src/include/duckdb/parser/parsed_data/exported_table_data.hpp +5 -1
- package/src/duckdb/src/include/duckdb/parser/parsed_data/vacuum_info.hpp +3 -2
- package/src/duckdb/src/include/duckdb/parser/query_error_context.hpp +4 -2
- package/src/duckdb/src/include/duckdb/parser/transformer.hpp +9 -35
- package/src/duckdb/src/include/duckdb/planner/binder.hpp +24 -23
- package/src/duckdb/src/include/duckdb/planner/expression_binder.hpp +3 -3
- package/src/duckdb/src/include/duckdb/planner/operator/logical_column_data_get.hpp +1 -1
- package/src/duckdb/src/include/duckdb/planner/operator/logical_copy_to_file.hpp +3 -1
- package/src/duckdb/src/include/duckdb/storage/table/table_index_list.hpp +1 -1
- package/src/duckdb/src/main/appender.cpp +6 -6
- package/src/duckdb/src/main/client_context.cpp +1 -1
- package/src/duckdb/src/main/connection.cpp +2 -2
- package/src/duckdb/src/main/query_result.cpp +13 -0
- package/src/duckdb/src/optimizer/expression_rewriter.cpp +4 -4
- package/src/duckdb/src/optimizer/join_order/cardinality_estimator.cpp +91 -105
- package/src/duckdb/src/optimizer/join_order/join_node.cpp +5 -8
- package/src/duckdb/src/optimizer/join_order/join_order_optimizer.cpp +163 -160
- package/src/duckdb/src/optimizer/join_order/join_relation_set.cpp +30 -30
- package/src/duckdb/src/optimizer/join_order/query_graph.cpp +37 -38
- package/src/duckdb/src/parallel/executor.cpp +1 -1
- package/src/duckdb/src/parallel/meta_pipeline.cpp +2 -2
- package/src/duckdb/src/parser/transform/helpers/transform_cte.cpp +1 -1
- package/src/duckdb/src/parser/transform/tableref/transform_subquery.cpp +1 -1
- package/src/duckdb/src/parser/transformer.cpp +50 -9
- package/src/duckdb/src/planner/binder/statement/bind_copy.cpp +15 -5
- package/src/duckdb/src/planner/binder/statement/bind_create.cpp +19 -17
- package/src/duckdb/src/planner/binder/statement/bind_create_table.cpp +4 -4
- package/src/duckdb/src/planner/binder/statement/bind_export.cpp +20 -21
- package/src/duckdb/src/planner/binder/tableref/bind_basetableref.cpp +24 -22
- package/src/duckdb/src/planner/binder/tableref/bind_subqueryref.cpp +2 -2
- package/src/duckdb/src/planner/binder.cpp +16 -19
- package/src/duckdb/src/planner/expression_binder.cpp +8 -8
- package/src/duckdb/src/planner/operator/logical_copy_to_file.cpp +3 -3
- package/src/duckdb/src/storage/checkpoint_manager.cpp +23 -23
- package/src/duckdb/src/storage/standard_buffer_manager.cpp +1 -1
- package/src/duckdb/src/storage/table_index_list.cpp +3 -3
- package/src/duckdb/src/verification/statement_verifier.cpp +1 -1
- package/src/duckdb/third_party/libpg_query/src_backend_parser_gram.cpp +5552 -5598
- package/src/duckdb/ub_src_common.cpp +2 -0
- package/src/duckdb/ub_src_common_types.cpp +0 -16
- package/src/duckdb/ub_src_common_types_column.cpp +10 -0
- package/src/duckdb/ub_src_common_types_row.cpp +20 -0
@@ -2,11 +2,13 @@
|
|
2
2
|
|
3
3
|
#include "duckdb/common/operator/cast_operators.hpp"
|
4
4
|
#include "duckdb/common/operator/comparison_operators.hpp"
|
5
|
+
#include "duckdb/common/optional_ptr.hpp"
|
6
|
+
#include "duckdb/common/radix_partitioning.hpp"
|
5
7
|
#include "duckdb/common/row_operations/row_operations.hpp"
|
6
8
|
#include "duckdb/common/sort/partition_state.hpp"
|
7
9
|
#include "duckdb/common/types/chunk_collection.hpp"
|
8
|
-
#include "duckdb/common/types/column_data_consumer.hpp"
|
9
|
-
#include "duckdb/common/types/row_data_collection_scanner.hpp"
|
10
|
+
#include "duckdb/common/types/column/column_data_consumer.hpp"
|
11
|
+
#include "duckdb/common/types/row/row_data_collection_scanner.hpp"
|
10
12
|
#include "duckdb/common/vector_operations/vector_operations.hpp"
|
11
13
|
#include "duckdb/common/windows_undefs.hpp"
|
12
14
|
#include "duckdb/execution/expression_executor.hpp"
|
@@ -17,8 +19,6 @@
|
|
17
19
|
#include "duckdb/parallel/base_pipeline_event.hpp"
|
18
20
|
#include "duckdb/planner/expression/bound_reference_expression.hpp"
|
19
21
|
#include "duckdb/planner/expression/bound_window_expression.hpp"
|
20
|
-
#include "duckdb/common/radix_partitioning.hpp"
|
21
|
-
#include "duckdb/common/optional_ptr.hpp"
|
22
22
|
|
23
23
|
#include <algorithm>
|
24
24
|
#include <cmath>
|
@@ -4,12 +4,12 @@
|
|
4
4
|
|
5
5
|
namespace duckdb {
|
6
6
|
|
7
|
-
PhysicalExecute::PhysicalExecute(PhysicalOperator
|
8
|
-
: PhysicalOperator(PhysicalOperatorType::EXECUTE, plan
|
7
|
+
PhysicalExecute::PhysicalExecute(PhysicalOperator &plan)
|
8
|
+
: PhysicalOperator(PhysicalOperatorType::EXECUTE, plan.types, -1), plan(plan) {
|
9
9
|
}
|
10
10
|
|
11
11
|
vector<PhysicalOperator *> PhysicalExecute::GetChildren() const {
|
12
|
-
return {plan};
|
12
|
+
return {&plan};
|
13
13
|
}
|
14
14
|
|
15
15
|
void PhysicalExecute::BuildPipelines(Pipeline &current, MetaPipeline &meta_pipeline) {
|
@@ -1,10 +1,9 @@
|
|
1
1
|
#include "duckdb/execution/operator/helper/physical_limit_percent.hpp"
|
2
|
-
#include "duckdb/execution/operator/helper/physical_limit.hpp"
|
3
2
|
|
4
3
|
#include "duckdb/common/algorithm.hpp"
|
5
|
-
|
4
|
+
#include "duckdb/common/types/column/column_data_collection.hpp"
|
6
5
|
#include "duckdb/execution/expression_executor.hpp"
|
7
|
-
#include "duckdb/
|
6
|
+
#include "duckdb/execution/operator/helper/physical_limit.hpp"
|
8
7
|
|
9
8
|
namespace duckdb {
|
10
9
|
|
@@ -12,7 +12,7 @@ namespace duckdb {
|
|
12
12
|
|
13
13
|
PhysicalResultCollector::PhysicalResultCollector(PreparedStatementData &data)
|
14
14
|
: PhysicalOperator(PhysicalOperatorType::RESULT_COLLECTOR, {LogicalType::BOOLEAN}, 0),
|
15
|
-
statement_type(data.statement_type), properties(data.properties), plan(data.plan
|
15
|
+
statement_type(data.statement_type), properties(data.properties), plan(*data.plan), names(data.names) {
|
16
16
|
this->types = data.types;
|
17
17
|
}
|
18
18
|
|
@@ -32,7 +32,7 @@ unique_ptr<PhysicalResultCollector> PhysicalResultCollector::GetResultCollector(
|
|
32
32
|
}
|
33
33
|
|
34
34
|
vector<PhysicalOperator *> PhysicalResultCollector::GetChildren() const {
|
35
|
-
return {plan};
|
35
|
+
return {&plan};
|
36
36
|
}
|
37
37
|
|
38
38
|
void PhysicalResultCollector::BuildPipelines(Pipeline &current, MetaPipeline &meta_pipeline) {
|
@@ -40,7 +40,6 @@ void PhysicalResultCollector::BuildPipelines(Pipeline &current, MetaPipeline &me
|
|
40
40
|
sink_state.reset();
|
41
41
|
|
42
42
|
D_ASSERT(children.empty());
|
43
|
-
D_ASSERT(plan);
|
44
43
|
|
45
44
|
// single operator: the operator becomes the data source of the current pipeline
|
46
45
|
auto &state = meta_pipeline.GetState();
|
@@ -1,6 +1,6 @@
|
|
1
1
|
#include "duckdb/execution/operator/join/perfect_hash_join_executor.hpp"
|
2
2
|
|
3
|
-
#include "duckdb/common/types/row_layout.hpp"
|
3
|
+
#include "duckdb/common/types/row/row_layout.hpp"
|
4
4
|
#include "duckdb/execution/operator/join/physical_hash_join.hpp"
|
5
5
|
|
6
6
|
namespace duckdb {
|
@@ -23,32 +23,41 @@ bool PerfectHashJoinExecutor::BuildPerfectHashTable(LogicalType &key_type) {
|
|
23
23
|
for (const auto &type : ht.build_types) {
|
24
24
|
perfect_hash_table.emplace_back(type, build_size);
|
25
25
|
}
|
26
|
+
|
26
27
|
// and for duplicate_checking
|
27
28
|
bitmap_build_idx = unique_ptr<bool[]>(new bool[build_size]);
|
28
29
|
memset(bitmap_build_idx.get(), 0, sizeof(bool) * build_size); // set false
|
29
30
|
|
30
|
-
// pin all fixed-size blocks (variable-sized should still be pinned)
|
31
|
-
ht.PinAllBlocks();
|
32
|
-
|
33
31
|
// Now fill columns with build data
|
34
|
-
|
35
|
-
return FullScanHashTable(
|
32
|
+
|
33
|
+
return FullScanHashTable(key_type);
|
36
34
|
}
|
37
35
|
|
38
|
-
bool PerfectHashJoinExecutor::FullScanHashTable(
|
39
|
-
|
40
|
-
|
36
|
+
bool PerfectHashJoinExecutor::FullScanHashTable(LogicalType &key_type) {
|
37
|
+
auto &data_collection = ht.GetDataCollection();
|
38
|
+
|
41
39
|
// TODO: In a parallel finalize: One should exclusively lock and each thread should do one part of the code below.
|
42
|
-
|
43
|
-
|
40
|
+
Vector tuples_addresses(LogicalType::POINTER, ht.Count()); // allocate space for all the tuples
|
41
|
+
|
42
|
+
idx_t key_count = 0;
|
43
|
+
if (data_collection.ChunkCount() > 0) {
|
44
|
+
JoinHTScanState join_ht_state(data_collection, 0, data_collection.ChunkCount(),
|
45
|
+
TupleDataPinProperties::KEEP_EVERYTHING_PINNED);
|
46
|
+
|
47
|
+
// Go through all the blocks and fill the keys addresses
|
48
|
+
key_count = ht.FillWithHTOffsets(join_ht_state, tuples_addresses);
|
49
|
+
}
|
50
|
+
|
44
51
|
// Scan the build keys in the hash table
|
45
|
-
Vector build_vector(key_type,
|
46
|
-
RowOperations::FullScanColumn(ht.layout, tuples_addresses, build_vector,
|
52
|
+
Vector build_vector(key_type, key_count);
|
53
|
+
RowOperations::FullScanColumn(ht.layout, tuples_addresses, build_vector, key_count, 0);
|
54
|
+
|
47
55
|
// Now fill the selection vector using the build keys and create a sequential vector
|
48
|
-
//
|
49
|
-
SelectionVector sel_build(
|
50
|
-
SelectionVector sel_tuples(
|
51
|
-
bool success = FillSelectionVectorSwitchBuild(build_vector, sel_build, sel_tuples,
|
56
|
+
// TODO: add check for fast pass when probe is part of build domain
|
57
|
+
SelectionVector sel_build(key_count + 1);
|
58
|
+
SelectionVector sel_tuples(key_count + 1);
|
59
|
+
bool success = FillSelectionVectorSwitchBuild(build_vector, sel_build, sel_tuples, key_count);
|
60
|
+
|
52
61
|
// early out
|
53
62
|
if (!success) {
|
54
63
|
return false;
|
@@ -56,16 +65,22 @@ bool PerfectHashJoinExecutor::FullScanHashTable(JoinHTScanState &state, LogicalT
|
|
56
65
|
if (unique_keys == perfect_join_statistics.build_range + 1 && !ht.has_null) {
|
57
66
|
perfect_join_statistics.is_build_dense = true;
|
58
67
|
}
|
59
|
-
|
68
|
+
key_count = unique_keys; // do not consider keys out of the range
|
69
|
+
|
60
70
|
// Full scan the remaining build columns and fill the perfect hash table
|
71
|
+
const auto build_size = perfect_join_statistics.build_range + 1;
|
61
72
|
for (idx_t i = 0; i < ht.build_types.size(); i++) {
|
62
|
-
auto build_size = perfect_join_statistics.build_range + 1;
|
63
73
|
auto &vector = perfect_hash_table[i];
|
64
74
|
D_ASSERT(vector.GetType() == ht.build_types[i]);
|
75
|
+
if (build_size > STANDARD_VECTOR_SIZE) {
|
76
|
+
auto &col_mask = FlatVector::Validity(vector);
|
77
|
+
col_mask.Initialize(build_size);
|
78
|
+
}
|
79
|
+
|
65
80
|
const auto col_no = ht.condition_types.size() + i;
|
66
|
-
|
67
|
-
build_size);
|
81
|
+
data_collection.Gather(tuples_addresses, sel_tuples, key_count, col_no, vector, sel_build);
|
68
82
|
}
|
83
|
+
|
69
84
|
return true;
|
70
85
|
}
|
71
86
|
|
@@ -1,10 +1,10 @@
|
|
1
1
|
#include "duckdb/execution/operator/join/physical_blockwise_nl_join.hpp"
|
2
2
|
|
3
|
+
#include "duckdb/common/types/column/column_data_collection.hpp"
|
3
4
|
#include "duckdb/common/vector_operations/vector_operations.hpp"
|
4
5
|
#include "duckdb/execution/expression_executor.hpp"
|
5
|
-
#include "duckdb/execution/operator/join/physical_comparison_join.hpp"
|
6
|
-
#include "duckdb/common/types/column_data_collection.hpp"
|
7
6
|
#include "duckdb/execution/operator/join/outer_join_marker.hpp"
|
7
|
+
#include "duckdb/execution/operator/join/physical_comparison_join.hpp"
|
8
8
|
#include "duckdb/execution/operator/join/physical_cross_product.hpp"
|
9
9
|
|
10
10
|
namespace duckdb {
|
@@ -1,6 +1,6 @@
|
|
1
1
|
#include "duckdb/execution/operator/join/physical_cross_product.hpp"
|
2
2
|
|
3
|
-
#include "duckdb/common/types/column_data_collection.hpp"
|
3
|
+
#include "duckdb/common/types/column/column_data_collection.hpp"
|
4
4
|
#include "duckdb/common/vector_operations/vector_operations.hpp"
|
5
5
|
#include "duckdb/execution/operator/join/physical_join.hpp"
|
6
6
|
|
@@ -1,6 +1,6 @@
|
|
1
1
|
#include "duckdb/execution/operator/join/physical_delim_join.hpp"
|
2
2
|
|
3
|
-
#include "duckdb/common/types/column_data_collection.hpp"
|
3
|
+
#include "duckdb/common/types/column/column_data_collection.hpp"
|
4
4
|
#include "duckdb/common/vector_operations/vector_operations.hpp"
|
5
5
|
#include "duckdb/execution/operator/aggregate/physical_hash_aggregate.hpp"
|
6
6
|
#include "duckdb/execution/operator/scan/physical_column_data_scan.hpp"
|
@@ -125,7 +125,7 @@ void PhysicalDelimJoin::BuildPipelines(Pipeline &current, MetaPipeline &meta_pip
|
|
125
125
|
sink_state.reset();
|
126
126
|
|
127
127
|
auto child_meta_pipeline = meta_pipeline.CreateChildMetaPipeline(current, this);
|
128
|
-
child_meta_pipeline->Build(children[0]
|
128
|
+
child_meta_pipeline->Build(*children[0]);
|
129
129
|
|
130
130
|
if (type == PhysicalOperatorType::DELIM_JOIN) {
|
131
131
|
// recurse into the actual join
|