duckdb 0.7.2-dev1901.0 → 0.7.2-dev2144.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (179)
  1. package/binding.gyp +2 -0
  2. package/package.json +1 -1
  3. package/src/duckdb/extension/parquet/include/parquet_writer.hpp +1 -1
  4. package/src/duckdb/extension/parquet/parquet_metadata.cpp +4 -2
  5. package/src/duckdb/src/catalog/catalog_entry/duck_index_entry.cpp +1 -1
  6. package/src/duckdb/src/common/arrow/arrow_appender.cpp +69 -44
  7. package/src/duckdb/src/common/arrow/arrow_converter.cpp +1 -1
  8. package/src/duckdb/src/common/arrow/arrow_wrapper.cpp +20 -2
  9. package/src/duckdb/src/common/box_renderer.cpp +4 -2
  10. package/src/duckdb/src/common/constants.cpp +10 -1
  11. package/src/duckdb/src/common/filename_pattern.cpp +41 -0
  12. package/src/duckdb/src/common/hive_partitioning.cpp +144 -15
  13. package/src/duckdb/src/common/radix_partitioning.cpp +101 -369
  14. package/src/duckdb/src/common/row_operations/row_aggregate.cpp +8 -9
  15. package/src/duckdb/src/common/row_operations/row_external.cpp +1 -1
  16. package/src/duckdb/src/common/row_operations/row_gather.cpp +5 -3
  17. package/src/duckdb/src/common/row_operations/row_match.cpp +117 -22
  18. package/src/duckdb/src/common/row_operations/row_scatter.cpp +2 -2
  19. package/src/duckdb/src/common/sort/partition_state.cpp +1 -1
  20. package/src/duckdb/src/common/sort/sort_state.cpp +2 -1
  21. package/src/duckdb/src/common/sort/sorted_block.cpp +1 -1
  22. package/src/duckdb/src/common/types/{column_data_allocator.cpp → column/column_data_allocator.cpp} +2 -2
  23. package/src/duckdb/src/common/types/{column_data_collection.cpp → column/column_data_collection.cpp} +22 -4
  24. package/src/duckdb/src/common/types/{column_data_collection_segment.cpp → column/column_data_collection_segment.cpp} +2 -1
  25. package/src/duckdb/src/common/types/{column_data_consumer.cpp → column/column_data_consumer.cpp} +1 -1
  26. package/src/duckdb/src/common/types/{partitioned_column_data.cpp → column/partitioned_column_data.cpp} +11 -9
  27. package/src/duckdb/src/common/types/row/partitioned_tuple_data.cpp +316 -0
  28. package/src/duckdb/src/common/types/{row_data_collection.cpp → row/row_data_collection.cpp} +1 -1
  29. package/src/duckdb/src/common/types/{row_data_collection_scanner.cpp → row/row_data_collection_scanner.cpp} +2 -2
  30. package/src/duckdb/src/common/types/{row_layout.cpp → row/row_layout.cpp} +1 -1
  31. package/src/duckdb/src/common/types/row/tuple_data_allocator.cpp +465 -0
  32. package/src/duckdb/src/common/types/row/tuple_data_collection.cpp +511 -0
  33. package/src/duckdb/src/common/types/row/tuple_data_iterator.cpp +96 -0
  34. package/src/duckdb/src/common/types/row/tuple_data_layout.cpp +119 -0
  35. package/src/duckdb/src/common/types/row/tuple_data_scatter_gather.cpp +1200 -0
  36. package/src/duckdb/src/common/types/row/tuple_data_segment.cpp +170 -0
  37. package/src/duckdb/src/common/types/vector.cpp +1 -1
  38. package/src/duckdb/src/execution/aggregate_hashtable.cpp +252 -290
  39. package/src/duckdb/src/execution/join_hashtable.cpp +192 -328
  40. package/src/duckdb/src/execution/operator/aggregate/physical_window.cpp +4 -4
  41. package/src/duckdb/src/execution/operator/helper/physical_execute.cpp +3 -3
  42. package/src/duckdb/src/execution/operator/helper/physical_limit_percent.cpp +2 -3
  43. package/src/duckdb/src/execution/operator/helper/physical_result_collector.cpp +2 -3
  44. package/src/duckdb/src/execution/operator/join/perfect_hash_join_executor.cpp +36 -21
  45. package/src/duckdb/src/execution/operator/join/physical_blockwise_nl_join.cpp +2 -2
  46. package/src/duckdb/src/execution/operator/join/physical_cross_product.cpp +1 -1
  47. package/src/duckdb/src/execution/operator/join/physical_delim_join.cpp +2 -2
  48. package/src/duckdb/src/execution/operator/join/physical_hash_join.cpp +166 -144
  49. package/src/duckdb/src/execution/operator/join/physical_index_join.cpp +5 -5
  50. package/src/duckdb/src/execution/operator/join/physical_join.cpp +2 -10
  51. package/src/duckdb/src/execution/operator/join/physical_positional_join.cpp +0 -1
  52. package/src/duckdb/src/execution/operator/order/physical_top_n.cpp +2 -2
  53. package/src/duckdb/src/execution/operator/persistent/physical_copy_to_file.cpp +13 -11
  54. package/src/duckdb/src/execution/operator/persistent/physical_delete.cpp +3 -2
  55. package/src/duckdb/src/execution/operator/persistent/physical_export.cpp +25 -24
  56. package/src/duckdb/src/execution/operator/persistent/physical_insert.cpp +1 -1
  57. package/src/duckdb/src/execution/operator/persistent/physical_update.cpp +4 -3
  58. package/src/duckdb/src/execution/operator/schema/physical_create_type.cpp +1 -1
  59. package/src/duckdb/src/execution/operator/set/physical_recursive_cte.cpp +3 -3
  60. package/src/duckdb/src/execution/partitionable_hashtable.cpp +9 -37
  61. package/src/duckdb/src/execution/physical_operator.cpp +1 -1
  62. package/src/duckdb/src/execution/physical_plan/plan_comparison_join.cpp +19 -18
  63. package/src/duckdb/src/execution/physical_plan/plan_copy_to_file.cpp +2 -1
  64. package/src/duckdb/src/execution/physical_plan/plan_execute.cpp +2 -2
  65. package/src/duckdb/src/execution/physical_plan/plan_explain.cpp +5 -6
  66. package/src/duckdb/src/execution/physical_plan/plan_expression_get.cpp +2 -2
  67. package/src/duckdb/src/execution/physical_plan/plan_recursive_cte.cpp +3 -3
  68. package/src/duckdb/src/execution/physical_plan_generator.cpp +1 -1
  69. package/src/duckdb/src/execution/radix_partitioned_hashtable.cpp +39 -17
  70. package/src/duckdb/src/function/aggregate/sorted_aggregate_function.cpp +2 -2
  71. package/src/duckdb/src/function/table/pragma_detailed_profiling_output.cpp +5 -5
  72. package/src/duckdb/src/function/table/pragma_last_profiling_output.cpp +2 -2
  73. package/src/duckdb/src/function/table/version/pragma_version.cpp +2 -2
  74. package/src/duckdb/src/include/duckdb/catalog/catalog_entry/index_catalog_entry.hpp +1 -1
  75. package/src/duckdb/src/include/duckdb/common/arrow/arrow_appender.hpp +1 -1
  76. package/src/duckdb/src/include/duckdb/common/constants.hpp +2 -0
  77. package/src/duckdb/src/include/duckdb/common/exception.hpp +3 -0
  78. package/src/duckdb/src/include/duckdb/common/fast_mem.hpp +528 -0
  79. package/src/duckdb/src/include/duckdb/common/filename_pattern.hpp +34 -0
  80. package/src/duckdb/src/include/duckdb/common/helper.hpp +10 -0
  81. package/src/duckdb/src/include/duckdb/common/hive_partitioning.hpp +13 -3
  82. package/src/duckdb/src/include/duckdb/common/optional_ptr.hpp +8 -0
  83. package/src/duckdb/src/include/duckdb/common/perfect_map_set.hpp +34 -0
  84. package/src/duckdb/src/include/duckdb/common/radix_partitioning.hpp +80 -27
  85. package/src/duckdb/src/include/duckdb/common/reference_map.hpp +38 -0
  86. package/src/duckdb/src/include/duckdb/common/row_operations/row_operations.hpp +7 -6
  87. package/src/duckdb/src/include/duckdb/common/sort/comparators.hpp +1 -1
  88. package/src/duckdb/src/include/duckdb/common/sort/partition_state.hpp +1 -1
  89. package/src/duckdb/src/include/duckdb/common/sort/sort.hpp +1 -1
  90. package/src/duckdb/src/include/duckdb/common/sort/sorted_block.hpp +2 -2
  91. package/src/duckdb/src/include/duckdb/common/types/batched_data_collection.hpp +1 -1
  92. package/src/duckdb/src/include/duckdb/common/types/{column_data_allocator.hpp → column/column_data_allocator.hpp} +4 -4
  93. package/src/duckdb/src/include/duckdb/common/types/{column_data_collection.hpp → column/column_data_collection.hpp} +2 -2
  94. package/src/duckdb/src/include/duckdb/common/types/{column_data_collection_iterators.hpp → column/column_data_collection_iterators.hpp} +2 -2
  95. package/src/duckdb/src/include/duckdb/common/types/{column_data_collection_segment.hpp → column/column_data_collection_segment.hpp} +3 -3
  96. package/src/duckdb/src/include/duckdb/common/types/{column_data_consumer.hpp → column/column_data_consumer.hpp} +8 -4
  97. package/src/duckdb/src/include/duckdb/common/types/{column_data_scan_states.hpp → column/column_data_scan_states.hpp} +1 -1
  98. package/src/duckdb/src/include/duckdb/common/types/{partitioned_column_data.hpp → column/partitioned_column_data.hpp} +15 -7
  99. package/src/duckdb/src/include/duckdb/common/types/row/partitioned_tuple_data.hpp +140 -0
  100. package/src/duckdb/src/include/duckdb/common/types/{row_data_collection.hpp → row/row_data_collection.hpp} +1 -1
  101. package/src/duckdb/src/include/duckdb/common/types/{row_data_collection_scanner.hpp → row/row_data_collection_scanner.hpp} +2 -2
  102. package/src/duckdb/src/include/duckdb/common/types/{row_layout.hpp → row/row_layout.hpp} +3 -1
  103. package/src/duckdb/src/include/duckdb/common/types/row/tuple_data_allocator.hpp +116 -0
  104. package/src/duckdb/src/include/duckdb/common/types/row/tuple_data_collection.hpp +239 -0
  105. package/src/duckdb/src/include/duckdb/common/types/row/tuple_data_iterator.hpp +64 -0
  106. package/src/duckdb/src/include/duckdb/common/types/row/tuple_data_layout.hpp +113 -0
  107. package/src/duckdb/src/include/duckdb/common/types/row/tuple_data_segment.hpp +124 -0
  108. package/src/duckdb/src/include/duckdb/common/types/row/tuple_data_states.hpp +74 -0
  109. package/src/duckdb/src/include/duckdb/common/types/validity_mask.hpp +3 -0
  110. package/src/duckdb/src/include/duckdb/common/types/value.hpp +4 -12
  111. package/src/duckdb/src/include/duckdb/execution/aggregate_hashtable.hpp +34 -31
  112. package/src/duckdb/src/include/duckdb/execution/base_aggregate_hashtable.hpp +2 -2
  113. package/src/duckdb/src/include/duckdb/execution/execution_context.hpp +3 -2
  114. package/src/duckdb/src/include/duckdb/execution/expression_executor.hpp +1 -1
  115. package/src/duckdb/src/include/duckdb/execution/join_hashtable.hpp +41 -67
  116. package/src/duckdb/src/include/duckdb/execution/nested_loop_join.hpp +1 -1
  117. package/src/duckdb/src/include/duckdb/execution/operator/helper/physical_execute.hpp +2 -2
  118. package/src/duckdb/src/include/duckdb/execution/operator/helper/physical_result_collector.hpp +1 -1
  119. package/src/duckdb/src/include/duckdb/execution/operator/join/outer_join_marker.hpp +2 -2
  120. package/src/duckdb/src/include/duckdb/execution/operator/join/perfect_hash_join_executor.hpp +1 -1
  121. package/src/duckdb/src/include/duckdb/execution/operator/join/physical_cross_product.hpp +1 -1
  122. package/src/duckdb/src/include/duckdb/execution/operator/join/physical_hash_join.hpp +0 -2
  123. package/src/duckdb/src/include/duckdb/execution/operator/join/physical_index_join.hpp +2 -2
  124. package/src/duckdb/src/include/duckdb/execution/operator/join/physical_positional_join.hpp +1 -1
  125. package/src/duckdb/src/include/duckdb/execution/operator/persistent/physical_copy_to_file.hpp +4 -1
  126. package/src/duckdb/src/include/duckdb/execution/operator/scan/physical_column_data_scan.hpp +1 -1
  127. package/src/duckdb/src/include/duckdb/execution/operator/set/physical_recursive_cte.hpp +1 -1
  128. package/src/duckdb/src/include/duckdb/execution/partitionable_hashtable.hpp +2 -2
  129. package/src/duckdb/src/include/duckdb/main/materialized_query_result.hpp +1 -1
  130. package/src/duckdb/src/include/duckdb/main/query_result.hpp +14 -1
  131. package/src/duckdb/src/include/duckdb/optimizer/expression_rewriter.hpp +3 -3
  132. package/src/duckdb/src/include/duckdb/optimizer/join_order/cardinality_estimator.hpp +16 -16
  133. package/src/duckdb/src/include/duckdb/optimizer/join_order/join_node.hpp +8 -8
  134. package/src/duckdb/src/include/duckdb/optimizer/join_order/join_order_optimizer.hpp +23 -15
  135. package/src/duckdb/src/include/duckdb/optimizer/join_order/join_relation.hpp +9 -10
  136. package/src/duckdb/src/include/duckdb/optimizer/join_order/query_graph.hpp +18 -11
  137. package/src/duckdb/src/include/duckdb/parallel/meta_pipeline.hpp +1 -1
  138. package/src/duckdb/src/include/duckdb/parser/parsed_data/exported_table_data.hpp +5 -1
  139. package/src/duckdb/src/include/duckdb/parser/parsed_data/vacuum_info.hpp +3 -2
  140. package/src/duckdb/src/include/duckdb/parser/query_error_context.hpp +4 -2
  141. package/src/duckdb/src/include/duckdb/parser/transformer.hpp +9 -35
  142. package/src/duckdb/src/include/duckdb/planner/binder.hpp +24 -23
  143. package/src/duckdb/src/include/duckdb/planner/expression_binder.hpp +3 -3
  144. package/src/duckdb/src/include/duckdb/planner/operator/logical_column_data_get.hpp +1 -1
  145. package/src/duckdb/src/include/duckdb/planner/operator/logical_copy_to_file.hpp +3 -1
  146. package/src/duckdb/src/include/duckdb/storage/table/table_index_list.hpp +1 -1
  147. package/src/duckdb/src/main/appender.cpp +6 -6
  148. package/src/duckdb/src/main/client_context.cpp +1 -1
  149. package/src/duckdb/src/main/connection.cpp +2 -2
  150. package/src/duckdb/src/main/query_result.cpp +13 -0
  151. package/src/duckdb/src/optimizer/expression_rewriter.cpp +4 -4
  152. package/src/duckdb/src/optimizer/join_order/cardinality_estimator.cpp +91 -105
  153. package/src/duckdb/src/optimizer/join_order/join_node.cpp +5 -8
  154. package/src/duckdb/src/optimizer/join_order/join_order_optimizer.cpp +163 -160
  155. package/src/duckdb/src/optimizer/join_order/join_relation_set.cpp +30 -30
  156. package/src/duckdb/src/optimizer/join_order/query_graph.cpp +37 -38
  157. package/src/duckdb/src/parallel/executor.cpp +1 -1
  158. package/src/duckdb/src/parallel/meta_pipeline.cpp +2 -2
  159. package/src/duckdb/src/parser/transform/helpers/transform_cte.cpp +1 -1
  160. package/src/duckdb/src/parser/transform/tableref/transform_subquery.cpp +1 -1
  161. package/src/duckdb/src/parser/transformer.cpp +50 -9
  162. package/src/duckdb/src/planner/binder/statement/bind_copy.cpp +15 -5
  163. package/src/duckdb/src/planner/binder/statement/bind_create.cpp +19 -17
  164. package/src/duckdb/src/planner/binder/statement/bind_create_table.cpp +4 -4
  165. package/src/duckdb/src/planner/binder/statement/bind_export.cpp +20 -21
  166. package/src/duckdb/src/planner/binder/tableref/bind_basetableref.cpp +24 -22
  167. package/src/duckdb/src/planner/binder/tableref/bind_subqueryref.cpp +2 -2
  168. package/src/duckdb/src/planner/binder.cpp +16 -19
  169. package/src/duckdb/src/planner/expression_binder.cpp +8 -8
  170. package/src/duckdb/src/planner/operator/logical_copy_to_file.cpp +3 -3
  171. package/src/duckdb/src/storage/checkpoint_manager.cpp +23 -23
  172. package/src/duckdb/src/storage/standard_buffer_manager.cpp +1 -1
  173. package/src/duckdb/src/storage/table_index_list.cpp +3 -3
  174. package/src/duckdb/src/verification/statement_verifier.cpp +1 -1
  175. package/src/duckdb/third_party/libpg_query/src_backend_parser_gram.cpp +5552 -5598
  176. package/src/duckdb/ub_src_common.cpp +2 -0
  177. package/src/duckdb/ub_src_common_types.cpp +0 -16
  178. package/src/duckdb/ub_src_common_types_column.cpp +10 -0
  179. package/src/duckdb/ub_src_common_types_row.cpp +20 -0
@@ -2,11 +2,13 @@
2
2
 
3
3
  #include "duckdb/common/operator/cast_operators.hpp"
4
4
  #include "duckdb/common/operator/comparison_operators.hpp"
5
+ #include "duckdb/common/optional_ptr.hpp"
6
+ #include "duckdb/common/radix_partitioning.hpp"
5
7
  #include "duckdb/common/row_operations/row_operations.hpp"
6
8
  #include "duckdb/common/sort/partition_state.hpp"
7
9
  #include "duckdb/common/types/chunk_collection.hpp"
8
- #include "duckdb/common/types/column_data_consumer.hpp"
9
- #include "duckdb/common/types/row_data_collection_scanner.hpp"
10
+ #include "duckdb/common/types/column/column_data_consumer.hpp"
11
+ #include "duckdb/common/types/row/row_data_collection_scanner.hpp"
10
12
  #include "duckdb/common/vector_operations/vector_operations.hpp"
11
13
  #include "duckdb/common/windows_undefs.hpp"
12
14
  #include "duckdb/execution/expression_executor.hpp"
@@ -17,8 +19,6 @@
17
19
  #include "duckdb/parallel/base_pipeline_event.hpp"
18
20
  #include "duckdb/planner/expression/bound_reference_expression.hpp"
19
21
  #include "duckdb/planner/expression/bound_window_expression.hpp"
20
- #include "duckdb/common/radix_partitioning.hpp"
21
- #include "duckdb/common/optional_ptr.hpp"
22
22
 
23
23
  #include <algorithm>
24
24
  #include <cmath>
@@ -4,12 +4,12 @@
4
4
 
5
5
  namespace duckdb {
6
6
 
7
- PhysicalExecute::PhysicalExecute(PhysicalOperator *plan)
8
- : PhysicalOperator(PhysicalOperatorType::EXECUTE, plan->types, -1), plan(plan) {
7
+ PhysicalExecute::PhysicalExecute(PhysicalOperator &plan)
8
+ : PhysicalOperator(PhysicalOperatorType::EXECUTE, plan.types, -1), plan(plan) {
9
9
  }
10
10
 
11
11
  vector<PhysicalOperator *> PhysicalExecute::GetChildren() const {
12
- return {plan};
12
+ return {&plan};
13
13
  }
14
14
 
15
15
  void PhysicalExecute::BuildPipelines(Pipeline &current, MetaPipeline &meta_pipeline) {
@@ -1,10 +1,9 @@
1
1
  #include "duckdb/execution/operator/helper/physical_limit_percent.hpp"
2
- #include "duckdb/execution/operator/helper/physical_limit.hpp"
3
2
 
4
3
  #include "duckdb/common/algorithm.hpp"
5
-
4
+ #include "duckdb/common/types/column/column_data_collection.hpp"
6
5
  #include "duckdb/execution/expression_executor.hpp"
7
- #include "duckdb/common/types/column_data_collection.hpp"
6
+ #include "duckdb/execution/operator/helper/physical_limit.hpp"
8
7
 
9
8
  namespace duckdb {
10
9
 
@@ -12,7 +12,7 @@ namespace duckdb {
12
12
 
13
13
  PhysicalResultCollector::PhysicalResultCollector(PreparedStatementData &data)
14
14
  : PhysicalOperator(PhysicalOperatorType::RESULT_COLLECTOR, {LogicalType::BOOLEAN}, 0),
15
- statement_type(data.statement_type), properties(data.properties), plan(data.plan.get()), names(data.names) {
15
+ statement_type(data.statement_type), properties(data.properties), plan(*data.plan), names(data.names) {
16
16
  this->types = data.types;
17
17
  }
18
18
 
@@ -32,7 +32,7 @@ unique_ptr<PhysicalResultCollector> PhysicalResultCollector::GetResultCollector(
32
32
  }
33
33
 
34
34
  vector<PhysicalOperator *> PhysicalResultCollector::GetChildren() const {
35
- return {plan};
35
+ return {&plan};
36
36
  }
37
37
 
38
38
  void PhysicalResultCollector::BuildPipelines(Pipeline &current, MetaPipeline &meta_pipeline) {
@@ -40,7 +40,6 @@ void PhysicalResultCollector::BuildPipelines(Pipeline &current, MetaPipeline &me
40
40
  sink_state.reset();
41
41
 
42
42
  D_ASSERT(children.empty());
43
- D_ASSERT(plan);
44
43
 
45
44
  // single operator: the operator becomes the data source of the current pipeline
46
45
  auto &state = meta_pipeline.GetState();
@@ -1,6 +1,6 @@
1
1
  #include "duckdb/execution/operator/join/perfect_hash_join_executor.hpp"
2
2
 
3
- #include "duckdb/common/types/row_layout.hpp"
3
+ #include "duckdb/common/types/row/row_layout.hpp"
4
4
  #include "duckdb/execution/operator/join/physical_hash_join.hpp"
5
5
 
6
6
  namespace duckdb {
@@ -23,32 +23,41 @@ bool PerfectHashJoinExecutor::BuildPerfectHashTable(LogicalType &key_type) {
23
23
  for (const auto &type : ht.build_types) {
24
24
  perfect_hash_table.emplace_back(type, build_size);
25
25
  }
26
+
26
27
  // and for duplicate_checking
27
28
  bitmap_build_idx = unique_ptr<bool[]>(new bool[build_size]);
28
29
  memset(bitmap_build_idx.get(), 0, sizeof(bool) * build_size); // set false
29
30
 
30
- // pin all fixed-size blocks (variable-sized should still be pinned)
31
- ht.PinAllBlocks();
32
-
33
31
  // Now fill columns with build data
34
- JoinHTScanState join_ht_state;
35
- return FullScanHashTable(join_ht_state, key_type);
32
+
33
+ return FullScanHashTable(key_type);
36
34
  }
37
35
 
38
- bool PerfectHashJoinExecutor::FullScanHashTable(JoinHTScanState &state, LogicalType &key_type) {
39
- Vector tuples_addresses(LogicalType::POINTER, ht.Count()); // allocate space for all the tuples
40
- auto key_locations = FlatVector::GetData<data_ptr_t>(tuples_addresses); // get a pointer to vector data
36
+ bool PerfectHashJoinExecutor::FullScanHashTable(LogicalType &key_type) {
37
+ auto &data_collection = ht.GetDataCollection();
38
+
41
39
  // TODO: In a parallel finalize: One should exclusively lock and each thread should do one part of the code below.
42
- // Go through all the blocks and fill the keys addresses
43
- auto keys_count = ht.FillWithHTOffsets(key_locations, state);
40
+ Vector tuples_addresses(LogicalType::POINTER, ht.Count()); // allocate space for all the tuples
41
+
42
+ idx_t key_count = 0;
43
+ if (data_collection.ChunkCount() > 0) {
44
+ JoinHTScanState join_ht_state(data_collection, 0, data_collection.ChunkCount(),
45
+ TupleDataPinProperties::KEEP_EVERYTHING_PINNED);
46
+
47
+ // Go through all the blocks and fill the keys addresses
48
+ key_count = ht.FillWithHTOffsets(join_ht_state, tuples_addresses);
49
+ }
50
+
44
51
  // Scan the build keys in the hash table
45
- Vector build_vector(key_type, keys_count);
46
- RowOperations::FullScanColumn(ht.layout, tuples_addresses, build_vector, keys_count, 0);
52
+ Vector build_vector(key_type, key_count);
53
+ RowOperations::FullScanColumn(ht.layout, tuples_addresses, build_vector, key_count, 0);
54
+
47
55
  // Now fill the selection vector using the build keys and create a sequential vector
48
- // todo: add check for fast pass when probe is part of build domain
49
- SelectionVector sel_build(keys_count + 1);
50
- SelectionVector sel_tuples(keys_count + 1);
51
- bool success = FillSelectionVectorSwitchBuild(build_vector, sel_build, sel_tuples, keys_count);
56
+ // TODO: add check for fast pass when probe is part of build domain
57
+ SelectionVector sel_build(key_count + 1);
58
+ SelectionVector sel_tuples(key_count + 1);
59
+ bool success = FillSelectionVectorSwitchBuild(build_vector, sel_build, sel_tuples, key_count);
60
+
52
61
  // early out
53
62
  if (!success) {
54
63
  return false;
@@ -56,16 +65,22 @@ bool PerfectHashJoinExecutor::FullScanHashTable(JoinHTScanState &state, LogicalT
56
65
  if (unique_keys == perfect_join_statistics.build_range + 1 && !ht.has_null) {
57
66
  perfect_join_statistics.is_build_dense = true;
58
67
  }
59
- keys_count = unique_keys; // do not consider keys out of the range
68
+ key_count = unique_keys; // do not consider keys out of the range
69
+
60
70
  // Full scan the remaining build columns and fill the perfect hash table
71
+ const auto build_size = perfect_join_statistics.build_range + 1;
61
72
  for (idx_t i = 0; i < ht.build_types.size(); i++) {
62
- auto build_size = perfect_join_statistics.build_range + 1;
63
73
  auto &vector = perfect_hash_table[i];
64
74
  D_ASSERT(vector.GetType() == ht.build_types[i]);
75
+ if (build_size > STANDARD_VECTOR_SIZE) {
76
+ auto &col_mask = FlatVector::Validity(vector);
77
+ col_mask.Initialize(build_size);
78
+ }
79
+
65
80
  const auto col_no = ht.condition_types.size() + i;
66
- RowOperations::Gather(tuples_addresses, sel_tuples, vector, sel_build, keys_count, ht.layout, col_no,
67
- build_size);
81
+ data_collection.Gather(tuples_addresses, sel_tuples, key_count, col_no, vector, sel_build);
68
82
  }
83
+
69
84
  return true;
70
85
  }
71
86
 
@@ -1,10 +1,10 @@
1
1
  #include "duckdb/execution/operator/join/physical_blockwise_nl_join.hpp"
2
2
 
3
+ #include "duckdb/common/types/column/column_data_collection.hpp"
3
4
  #include "duckdb/common/vector_operations/vector_operations.hpp"
4
5
  #include "duckdb/execution/expression_executor.hpp"
5
- #include "duckdb/execution/operator/join/physical_comparison_join.hpp"
6
- #include "duckdb/common/types/column_data_collection.hpp"
7
6
  #include "duckdb/execution/operator/join/outer_join_marker.hpp"
7
+ #include "duckdb/execution/operator/join/physical_comparison_join.hpp"
8
8
  #include "duckdb/execution/operator/join/physical_cross_product.hpp"
9
9
 
10
10
  namespace duckdb {
@@ -1,6 +1,6 @@
1
1
  #include "duckdb/execution/operator/join/physical_cross_product.hpp"
2
2
 
3
- #include "duckdb/common/types/column_data_collection.hpp"
3
+ #include "duckdb/common/types/column/column_data_collection.hpp"
4
4
  #include "duckdb/common/vector_operations/vector_operations.hpp"
5
5
  #include "duckdb/execution/operator/join/physical_join.hpp"
6
6
 
@@ -1,6 +1,6 @@
1
1
  #include "duckdb/execution/operator/join/physical_delim_join.hpp"
2
2
 
3
- #include "duckdb/common/types/column_data_collection.hpp"
3
+ #include "duckdb/common/types/column/column_data_collection.hpp"
4
4
  #include "duckdb/common/vector_operations/vector_operations.hpp"
5
5
  #include "duckdb/execution/operator/aggregate/physical_hash_aggregate.hpp"
6
6
  #include "duckdb/execution/operator/scan/physical_column_data_scan.hpp"
@@ -125,7 +125,7 @@ void PhysicalDelimJoin::BuildPipelines(Pipeline &current, MetaPipeline &meta_pip
125
125
  sink_state.reset();
126
126
 
127
127
  auto child_meta_pipeline = meta_pipeline.CreateChildMetaPipeline(current, this);
128
- child_meta_pipeline->Build(children[0].get());
128
+ child_meta_pipeline->Build(*children[0]);
129
129
 
130
130
  if (type == PhysicalOperatorType::DELIM_JOIN) {
131
131
  // recurse into the actual join