duckdb 1.0.1-dev22.0 → 1.0.1-dev27.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (1389) hide show
  1. package/.github/workflows/NodeJS.yml +1 -1
  2. package/binding.gyp +41 -0
  3. package/package.json +1 -1
  4. package/src/duckdb/extension/icu/icu-dateadd.cpp +4 -2
  5. package/src/duckdb/extension/icu/icu-datefunc.cpp +6 -2
  6. package/src/duckdb/extension/icu/icu-datesub.cpp +13 -2
  7. package/src/duckdb/extension/icu/icu-strptime.cpp +6 -6
  8. package/src/duckdb/extension/icu/icu-table-range.cpp +92 -73
  9. package/src/duckdb/extension/icu/icu-timebucket.cpp +12 -2
  10. package/src/duckdb/extension/icu/icu-timezone.cpp +3 -3
  11. package/src/duckdb/extension/icu/icu_extension.cpp +61 -9
  12. package/src/duckdb/extension/json/include/json_executors.hpp +20 -23
  13. package/src/duckdb/extension/json/include/json_functions.hpp +4 -0
  14. package/src/duckdb/extension/json/include/json_scan.hpp +6 -2
  15. package/src/duckdb/extension/json/include/json_structure.hpp +12 -9
  16. package/src/duckdb/extension/json/json_common.cpp +66 -10
  17. package/src/duckdb/extension/json/json_extension.cpp +13 -5
  18. package/src/duckdb/extension/json/json_functions/json_array_length.cpp +1 -1
  19. package/src/duckdb/extension/json/json_functions/json_create.cpp +21 -4
  20. package/src/duckdb/extension/json/json_functions/json_exists.cpp +32 -0
  21. package/src/duckdb/extension/json/json_functions/json_extract.cpp +2 -2
  22. package/src/duckdb/extension/json/json_functions/json_keys.cpp +1 -1
  23. package/src/duckdb/extension/json/json_functions/json_pretty.cpp +32 -0
  24. package/src/duckdb/extension/json/json_functions/json_serialize_sql.cpp +5 -1
  25. package/src/duckdb/extension/json/json_functions/json_structure.cpp +305 -94
  26. package/src/duckdb/extension/json/json_functions/json_transform.cpp +1 -1
  27. package/src/duckdb/extension/json/json_functions/json_type.cpp +3 -3
  28. package/src/duckdb/extension/json/json_functions/json_value.cpp +42 -0
  29. package/src/duckdb/extension/json/json_functions/read_json.cpp +16 -2
  30. package/src/duckdb/extension/json/json_functions/read_json_objects.cpp +3 -2
  31. package/src/duckdb/extension/json/json_functions.cpp +5 -1
  32. package/src/duckdb/extension/json/json_scan.cpp +13 -12
  33. package/src/duckdb/extension/json/serialize_json.cpp +5 -3
  34. package/src/duckdb/extension/parquet/column_reader.cpp +206 -43
  35. package/src/duckdb/extension/parquet/column_writer.cpp +133 -62
  36. package/src/duckdb/extension/parquet/geo_parquet.cpp +391 -0
  37. package/src/duckdb/extension/parquet/include/boolean_column_reader.hpp +16 -5
  38. package/src/duckdb/extension/parquet/include/column_reader.hpp +37 -12
  39. package/src/duckdb/extension/parquet/include/column_writer.hpp +10 -11
  40. package/src/duckdb/extension/parquet/include/expression_column_reader.hpp +52 -0
  41. package/src/duckdb/extension/parquet/include/geo_parquet.hpp +139 -0
  42. package/src/duckdb/extension/parquet/include/parquet_crypto.hpp +13 -8
  43. package/src/duckdb/extension/parquet/include/parquet_decimal_utils.hpp +3 -0
  44. package/src/duckdb/extension/parquet/include/parquet_file_metadata_cache.hpp +7 -3
  45. package/src/duckdb/extension/parquet/include/parquet_reader.hpp +55 -8
  46. package/src/duckdb/extension/parquet/include/parquet_rle_bp_decoder.hpp +3 -3
  47. package/src/duckdb/extension/parquet/include/parquet_rle_bp_encoder.hpp +1 -1
  48. package/src/duckdb/extension/parquet/include/parquet_timestamp.hpp +8 -0
  49. package/src/duckdb/extension/parquet/include/parquet_writer.hpp +21 -7
  50. package/src/duckdb/extension/parquet/include/resizable_buffer.hpp +33 -11
  51. package/src/duckdb/extension/parquet/include/string_column_reader.hpp +5 -2
  52. package/src/duckdb/extension/parquet/include/templated_column_reader.hpp +48 -14
  53. package/src/duckdb/extension/parquet/parquet_crypto.cpp +109 -61
  54. package/src/duckdb/extension/parquet/parquet_extension.cpp +305 -72
  55. package/src/duckdb/extension/parquet/parquet_metadata.cpp +4 -4
  56. package/src/duckdb/extension/parquet/parquet_reader.cpp +151 -40
  57. package/src/duckdb/extension/parquet/parquet_statistics.cpp +50 -16
  58. package/src/duckdb/extension/parquet/parquet_timestamp.cpp +42 -1
  59. package/src/duckdb/extension/parquet/parquet_writer.cpp +67 -75
  60. package/src/duckdb/extension/parquet/serialize_parquet.cpp +3 -1
  61. package/src/duckdb/extension/parquet/zstd_file_system.cpp +5 -1
  62. package/src/duckdb/src/catalog/catalog.cpp +14 -16
  63. package/src/duckdb/src/catalog/catalog_entry/duck_index_entry.cpp +14 -11
  64. package/src/duckdb/src/catalog/catalog_entry/duck_schema_entry.cpp +39 -19
  65. package/src/duckdb/src/catalog/catalog_entry/duck_table_entry.cpp +92 -78
  66. package/src/duckdb/src/catalog/catalog_entry/index_catalog_entry.cpp +10 -2
  67. package/src/duckdb/src/catalog/catalog_entry/macro_catalog_entry.cpp +10 -3
  68. package/src/duckdb/src/catalog/catalog_entry/schema_catalog_entry.cpp +3 -3
  69. package/src/duckdb/src/catalog/catalog_entry/table_catalog_entry.cpp +7 -7
  70. package/src/duckdb/src/catalog/catalog_entry.cpp +6 -3
  71. package/src/duckdb/src/catalog/catalog_set.cpp +14 -19
  72. package/src/duckdb/src/catalog/default/default_functions.cpp +179 -166
  73. package/src/duckdb/src/catalog/default/default_generator.cpp +24 -0
  74. package/src/duckdb/src/catalog/default/default_schemas.cpp +4 -3
  75. package/src/duckdb/src/catalog/default/default_table_functions.cpp +148 -0
  76. package/src/duckdb/src/catalog/default/default_views.cpp +7 -3
  77. package/src/duckdb/src/catalog/duck_catalog.cpp +7 -1
  78. package/src/duckdb/src/common/adbc/adbc.cpp +120 -58
  79. package/src/duckdb/src/common/allocator.cpp +71 -6
  80. package/src/duckdb/src/common/arrow/appender/bool_data.cpp +8 -7
  81. package/src/duckdb/src/common/arrow/appender/fixed_size_list_data.cpp +1 -1
  82. package/src/duckdb/src/common/arrow/appender/union_data.cpp +4 -5
  83. package/src/duckdb/src/common/arrow/arrow_appender.cpp +55 -21
  84. package/src/duckdb/src/common/arrow/arrow_converter.cpp +85 -10
  85. package/src/duckdb/src/common/arrow/arrow_merge_event.cpp +142 -0
  86. package/src/duckdb/src/common/arrow/arrow_query_result.cpp +56 -0
  87. package/src/duckdb/src/common/arrow/physical_arrow_batch_collector.cpp +37 -0
  88. package/src/duckdb/src/common/arrow/physical_arrow_collector.cpp +128 -0
  89. package/src/duckdb/src/common/arrow/schema_metadata.cpp +101 -0
  90. package/src/duckdb/src/common/cgroups.cpp +189 -0
  91. package/src/duckdb/src/common/compressed_file_system.cpp +6 -3
  92. package/src/duckdb/src/common/encryption_state.cpp +38 -0
  93. package/src/duckdb/src/common/enum_util.cpp +682 -14
  94. package/src/duckdb/src/common/enums/file_compression_type.cpp +24 -0
  95. package/src/duckdb/src/common/enums/metric_type.cpp +208 -0
  96. package/src/duckdb/src/common/enums/optimizer_type.cpp +8 -2
  97. package/src/duckdb/src/common/enums/physical_operator_type.cpp +2 -0
  98. package/src/duckdb/src/common/enums/relation_type.cpp +4 -0
  99. package/src/duckdb/src/common/enums/statement_type.cpp +15 -0
  100. package/src/duckdb/src/common/error_data.cpp +22 -20
  101. package/src/duckdb/src/common/exception/binder_exception.cpp +5 -0
  102. package/src/duckdb/src/common/exception.cpp +11 -1
  103. package/src/duckdb/src/common/extra_type_info.cpp +3 -0
  104. package/src/duckdb/src/common/file_buffer.cpp +1 -1
  105. package/src/duckdb/src/common/file_system.cpp +25 -3
  106. package/src/duckdb/src/common/filename_pattern.cpp +1 -0
  107. package/src/duckdb/src/common/fsst.cpp +15 -14
  108. package/src/duckdb/src/common/gzip_file_system.cpp +3 -1
  109. package/src/duckdb/src/common/hive_partitioning.cpp +103 -43
  110. package/src/duckdb/src/common/http_util.cpp +25 -0
  111. package/src/duckdb/src/common/local_file_system.cpp +48 -27
  112. package/src/duckdb/src/common/multi_file_list.cpp +113 -22
  113. package/src/duckdb/src/common/multi_file_reader.cpp +59 -58
  114. package/src/duckdb/src/common/operator/cast_operators.cpp +133 -34
  115. package/src/duckdb/src/common/operator/string_cast.cpp +42 -11
  116. package/src/duckdb/src/common/progress_bar/progress_bar.cpp +2 -2
  117. package/src/duckdb/src/common/progress_bar/terminal_progress_bar_display.cpp +1 -1
  118. package/src/duckdb/src/common/radix_partitioning.cpp +31 -21
  119. package/src/duckdb/src/common/random_engine.cpp +4 -0
  120. package/src/duckdb/src/common/re2_regex.cpp +47 -12
  121. package/src/duckdb/src/common/render_tree.cpp +243 -0
  122. package/src/duckdb/src/common/row_operations/row_aggregate.cpp +1 -1
  123. package/src/duckdb/src/common/row_operations/row_gather.cpp +2 -2
  124. package/src/duckdb/src/common/row_operations/row_matcher.cpp +58 -5
  125. package/src/duckdb/src/common/row_operations/row_radix_scatter.cpp +79 -43
  126. package/src/duckdb/src/common/serializer/binary_deserializer.cpp +1 -1
  127. package/src/duckdb/src/common/serializer/buffered_file_reader.cpp +6 -4
  128. package/src/duckdb/src/common/serializer/buffered_file_writer.cpp +18 -9
  129. package/src/duckdb/src/common/serializer/memory_stream.cpp +1 -0
  130. package/src/duckdb/src/common/sort/partition_state.cpp +33 -18
  131. package/src/duckdb/src/common/sort/radix_sort.cpp +22 -15
  132. package/src/duckdb/src/common/sort/sort_state.cpp +19 -16
  133. package/src/duckdb/src/common/sort/sorted_block.cpp +11 -10
  134. package/src/duckdb/src/common/string_util.cpp +167 -10
  135. package/src/duckdb/src/common/tree_renderer/graphviz_tree_renderer.cpp +108 -0
  136. package/src/duckdb/src/common/tree_renderer/html_tree_renderer.cpp +267 -0
  137. package/src/duckdb/src/common/tree_renderer/json_tree_renderer.cpp +116 -0
  138. package/src/duckdb/src/common/tree_renderer/text_tree_renderer.cpp +482 -0
  139. package/src/duckdb/src/common/tree_renderer/tree_renderer.cpp +12 -0
  140. package/src/duckdb/src/common/tree_renderer.cpp +16 -508
  141. package/src/duckdb/src/common/types/batched_data_collection.cpp +78 -9
  142. package/src/duckdb/src/common/types/bit.cpp +24 -22
  143. package/src/duckdb/src/common/types/blob.cpp +15 -11
  144. package/src/duckdb/src/common/types/column/column_data_allocator.cpp +18 -9
  145. package/src/duckdb/src/common/types/column/column_data_collection.cpp +4 -4
  146. package/src/duckdb/src/common/types/column/column_data_collection_segment.cpp +3 -4
  147. package/src/duckdb/src/common/types/column/column_data_consumer.cpp +2 -2
  148. package/src/duckdb/src/common/types/column/partitioned_column_data.cpp +70 -21
  149. package/src/duckdb/src/common/types/data_chunk.cpp +10 -1
  150. package/src/duckdb/src/common/types/date.cpp +8 -19
  151. package/src/duckdb/src/common/types/decimal.cpp +3 -2
  152. package/src/duckdb/src/common/types/hugeint.cpp +11 -3
  153. package/src/duckdb/src/common/types/hyperloglog.cpp +212 -227
  154. package/src/duckdb/src/common/types/interval.cpp +1 -1
  155. package/src/duckdb/src/common/types/list_segment.cpp +83 -49
  156. package/src/duckdb/src/common/types/row/partitioned_tuple_data.cpp +22 -83
  157. package/src/duckdb/src/common/types/row/row_data_collection.cpp +2 -2
  158. package/src/duckdb/src/common/types/row/row_data_collection_scanner.cpp +20 -4
  159. package/src/duckdb/src/common/types/row/tuple_data_allocator.cpp +28 -7
  160. package/src/duckdb/src/common/types/row/tuple_data_collection.cpp +29 -14
  161. package/src/duckdb/src/common/types/row/tuple_data_scatter_gather.cpp +152 -102
  162. package/src/duckdb/src/common/types/row/tuple_data_segment.cpp +4 -1
  163. package/src/duckdb/src/common/types/selection_vector.cpp +17 -1
  164. package/src/duckdb/src/common/types/time.cpp +62 -31
  165. package/src/duckdb/src/common/types/timestamp.cpp +70 -12
  166. package/src/duckdb/src/common/types/uuid.cpp +1 -1
  167. package/src/duckdb/src/common/types/validity_mask.cpp +40 -5
  168. package/src/duckdb/src/common/types/value.cpp +50 -8
  169. package/src/duckdb/src/common/types/varint.cpp +295 -0
  170. package/src/duckdb/src/common/types/vector.cpp +165 -54
  171. package/src/duckdb/src/common/types/vector_buffer.cpp +5 -4
  172. package/src/duckdb/src/common/types.cpp +106 -26
  173. package/src/duckdb/src/common/vector_operations/vector_copy.cpp +13 -25
  174. package/src/duckdb/src/common/vector_operations/vector_hash.cpp +6 -0
  175. package/src/duckdb/src/common/virtual_file_system.cpp +3 -3
  176. package/src/duckdb/src/core_functions/aggregate/distributive/approx_count.cpp +35 -82
  177. package/src/duckdb/src/core_functions/aggregate/distributive/arg_min_max.cpp +283 -46
  178. package/src/duckdb/src/core_functions/aggregate/distributive/bitagg.cpp +4 -4
  179. package/src/duckdb/src/core_functions/aggregate/distributive/entropy.cpp +3 -2
  180. package/src/duckdb/src/core_functions/aggregate/distributive/minmax.cpp +226 -338
  181. package/src/duckdb/src/core_functions/aggregate/distributive/sum.cpp +2 -0
  182. package/src/duckdb/src/core_functions/aggregate/holistic/approx_top_k.cpp +388 -0
  183. package/src/duckdb/src/core_functions/aggregate/holistic/approximate_quantile.cpp +63 -21
  184. package/src/duckdb/src/core_functions/aggregate/holistic/mad.cpp +330 -0
  185. package/src/duckdb/src/core_functions/aggregate/holistic/mode.cpp +136 -97
  186. package/src/duckdb/src/core_functions/aggregate/holistic/quantile.cpp +601 -1485
  187. package/src/duckdb/src/core_functions/aggregate/nested/binned_histogram.cpp +405 -0
  188. package/src/duckdb/src/core_functions/aggregate/nested/histogram.cpp +136 -165
  189. package/src/duckdb/src/core_functions/function_list.cpp +35 -8
  190. package/src/duckdb/src/core_functions/lambda_functions.cpp +5 -7
  191. package/src/duckdb/src/core_functions/scalar/array/array_functions.cpp +172 -198
  192. package/src/duckdb/src/core_functions/scalar/blob/create_sort_key.cpp +341 -54
  193. package/src/duckdb/src/core_functions/scalar/date/date_diff.cpp +2 -2
  194. package/src/duckdb/src/core_functions/scalar/date/date_part.cpp +89 -29
  195. package/src/duckdb/src/core_functions/scalar/date/date_trunc.cpp +1 -1
  196. package/src/duckdb/src/core_functions/scalar/date/make_date.cpp +2 -2
  197. package/src/duckdb/src/core_functions/scalar/date/strftime.cpp +133 -71
  198. package/src/duckdb/src/core_functions/scalar/date/to_interval.cpp +1 -1
  199. package/src/duckdb/src/core_functions/scalar/enum/enum_functions.cpp +1 -1
  200. package/src/duckdb/src/core_functions/scalar/generic/can_implicitly_cast.cpp +40 -0
  201. package/src/duckdb/src/core_functions/scalar/generic/error.cpp +1 -1
  202. package/src/duckdb/src/core_functions/scalar/generic/least.cpp +161 -58
  203. package/src/duckdb/src/core_functions/scalar/generic/typeof.cpp +13 -0
  204. package/src/duckdb/src/core_functions/scalar/list/array_slice.cpp +1 -1
  205. package/src/duckdb/src/core_functions/scalar/list/list_aggregates.cpp +59 -75
  206. package/src/duckdb/src/core_functions/scalar/list/list_distance.cpp +93 -40
  207. package/src/duckdb/src/core_functions/scalar/list/list_has_any_or_all.cpp +227 -0
  208. package/src/duckdb/src/core_functions/scalar/list/list_reduce.cpp +20 -19
  209. package/src/duckdb/src/core_functions/scalar/list/list_sort.cpp +0 -2
  210. package/src/duckdb/src/core_functions/scalar/list/list_value.cpp +106 -8
  211. package/src/duckdb/src/core_functions/scalar/map/map_contains.cpp +56 -0
  212. package/src/duckdb/src/core_functions/scalar/map/map_extract.cpp +73 -118
  213. package/src/duckdb/src/core_functions/scalar/math/numeric.cpp +98 -2
  214. package/src/duckdb/src/core_functions/scalar/operators/bitwise.cpp +1 -2
  215. package/src/duckdb/src/core_functions/scalar/random/setseed.cpp +1 -1
  216. package/src/duckdb/src/core_functions/scalar/string/bar.cpp +1 -1
  217. package/src/duckdb/src/core_functions/scalar/string/hex.cpp +5 -1
  218. package/src/duckdb/src/core_functions/scalar/string/md5.cpp +10 -37
  219. package/src/duckdb/src/core_functions/scalar/string/printf.cpp +18 -2
  220. package/src/duckdb/src/core_functions/scalar/string/repeat.cpp +45 -0
  221. package/src/duckdb/src/core_functions/scalar/string/reverse.cpp +4 -5
  222. package/src/duckdb/src/core_functions/scalar/string/sha1.cpp +35 -0
  223. package/src/duckdb/src/core_functions/scalar/string/sha256.cpp +5 -2
  224. package/src/duckdb/src/core_functions/scalar/string/url_encode.cpp +49 -0
  225. package/src/duckdb/src/core_functions/scalar/struct/struct_pack.cpp +1 -2
  226. package/src/duckdb/src/core_functions/scalar/union/union_extract.cpp +4 -2
  227. package/src/duckdb/src/execution/adaptive_filter.cpp +30 -11
  228. package/src/duckdb/src/execution/aggregate_hashtable.cpp +13 -18
  229. package/src/duckdb/src/execution/expression_executor/execute_conjunction.cpp +4 -9
  230. package/src/duckdb/src/execution/expression_executor.cpp +1 -1
  231. package/src/duckdb/src/execution/index/art/art.cpp +683 -670
  232. package/src/duckdb/src/execution/index/art/art_key.cpp +121 -38
  233. package/src/duckdb/src/execution/index/art/base_leaf.cpp +168 -0
  234. package/src/duckdb/src/execution/index/art/base_node.cpp +163 -0
  235. package/src/duckdb/src/execution/index/art/iterator.cpp +148 -77
  236. package/src/duckdb/src/execution/index/art/leaf.cpp +159 -263
  237. package/src/duckdb/src/execution/index/art/node.cpp +493 -247
  238. package/src/duckdb/src/execution/index/art/node256.cpp +31 -91
  239. package/src/duckdb/src/execution/index/art/node256_leaf.cpp +71 -0
  240. package/src/duckdb/src/execution/index/art/node48.cpp +75 -143
  241. package/src/duckdb/src/execution/index/art/prefix.cpp +424 -244
  242. package/src/duckdb/src/execution/index/bound_index.cpp +7 -1
  243. package/src/duckdb/src/execution/index/fixed_size_allocator.cpp +22 -18
  244. package/src/duckdb/src/execution/index/fixed_size_buffer.cpp +22 -73
  245. package/src/duckdb/src/execution/join_hashtable.cpp +637 -179
  246. package/src/duckdb/src/execution/operator/aggregate/aggregate_object.cpp +4 -4
  247. package/src/duckdb/src/execution/operator/aggregate/physical_hash_aggregate.cpp +15 -10
  248. package/src/duckdb/src/execution/operator/aggregate/physical_perfecthash_aggregate.cpp +13 -8
  249. package/src/duckdb/src/execution/operator/aggregate/physical_streaming_window.cpp +525 -132
  250. package/src/duckdb/src/execution/operator/aggregate/physical_ungrouped_aggregate.cpp +147 -138
  251. package/src/duckdb/src/execution/operator/aggregate/physical_window.cpp +531 -312
  252. package/src/duckdb/src/execution/operator/csv_scanner/buffer_manager/csv_buffer.cpp +1 -1
  253. package/src/duckdb/src/execution/operator/csv_scanner/buffer_manager/csv_buffer_manager.cpp +4 -3
  254. package/src/duckdb/src/execution/operator/csv_scanner/buffer_manager/csv_file_handle.cpp +9 -2
  255. package/src/duckdb/src/execution/operator/csv_scanner/scanner/base_scanner.cpp +13 -17
  256. package/src/duckdb/src/execution/operator/csv_scanner/scanner/column_count_scanner.cpp +60 -16
  257. package/src/duckdb/src/execution/operator/csv_scanner/scanner/csv_schema.cpp +105 -0
  258. package/src/duckdb/src/execution/operator/csv_scanner/scanner/scanner_boundary.cpp +24 -24
  259. package/src/duckdb/src/execution/operator/csv_scanner/scanner/skip_scanner.cpp +25 -2
  260. package/src/duckdb/src/execution/operator/csv_scanner/scanner/string_value_scanner.cpp +275 -112
  261. package/src/duckdb/src/execution/operator/csv_scanner/sniffer/csv_sniffer.cpp +106 -11
  262. package/src/duckdb/src/execution/operator/csv_scanner/sniffer/dialect_detection.cpp +253 -115
  263. package/src/duckdb/src/execution/operator/csv_scanner/sniffer/header_detection.cpp +93 -52
  264. package/src/duckdb/src/execution/operator/csv_scanner/sniffer/type_detection.cpp +116 -76
  265. package/src/duckdb/src/execution/operator/csv_scanner/sniffer/type_refinement.cpp +29 -14
  266. package/src/duckdb/src/execution/operator/csv_scanner/sniffer/type_replacement.cpp +1 -1
  267. package/src/duckdb/src/execution/operator/csv_scanner/state_machine/csv_state_machine_cache.cpp +70 -26
  268. package/src/duckdb/src/execution/operator/csv_scanner/table_function/csv_file_scanner.cpp +81 -60
  269. package/src/duckdb/src/execution/operator/csv_scanner/table_function/global_csv_state.cpp +88 -50
  270. package/src/duckdb/src/execution/operator/csv_scanner/util/csv_error.cpp +161 -51
  271. package/src/duckdb/src/execution/operator/csv_scanner/util/csv_reader_options.cpp +59 -17
  272. package/src/duckdb/src/execution/operator/filter/physical_filter.cpp +5 -5
  273. package/src/duckdb/src/execution/operator/helper/physical_batch_collector.cpp +0 -21
  274. package/src/duckdb/src/execution/operator/helper/physical_buffered_batch_collector.cpp +109 -0
  275. package/src/duckdb/src/execution/operator/helper/physical_buffered_collector.cpp +5 -13
  276. package/src/duckdb/src/execution/operator/helper/physical_explain_analyze.cpp +1 -1
  277. package/src/duckdb/src/execution/operator/helper/physical_load.cpp +12 -4
  278. package/src/duckdb/src/execution/operator/helper/physical_materialized_collector.cpp +0 -16
  279. package/src/duckdb/src/execution/operator/helper/physical_reservoir_sample.cpp +4 -2
  280. package/src/duckdb/src/execution/operator/helper/physical_reset.cpp +5 -0
  281. package/src/duckdb/src/execution/operator/helper/physical_result_collector.cpp +3 -1
  282. package/src/duckdb/src/execution/operator/helper/physical_set_variable.cpp +39 -0
  283. package/src/duckdb/src/execution/operator/helper/physical_streaming_sample.cpp +4 -2
  284. package/src/duckdb/src/execution/operator/helper/physical_transaction.cpp +16 -5
  285. package/src/duckdb/src/execution/operator/join/outer_join_marker.cpp +1 -1
  286. package/src/duckdb/src/execution/operator/join/perfect_hash_join_executor.cpp +1 -1
  287. package/src/duckdb/src/execution/operator/join/physical_asof_join.cpp +1 -1
  288. package/src/duckdb/src/execution/operator/join/physical_blockwise_nl_join.cpp +5 -4
  289. package/src/duckdb/src/execution/operator/join/physical_comparison_join.cpp +59 -21
  290. package/src/duckdb/src/execution/operator/join/physical_delim_join.cpp +7 -4
  291. package/src/duckdb/src/execution/operator/join/physical_hash_join.cpp +333 -176
  292. package/src/duckdb/src/execution/operator/join/physical_iejoin.cpp +57 -34
  293. package/src/duckdb/src/execution/operator/join/physical_join.cpp +16 -8
  294. package/src/duckdb/src/execution/operator/join/physical_left_delim_join.cpp +10 -4
  295. package/src/duckdb/src/execution/operator/join/physical_nested_loop_join.cpp +2 -5
  296. package/src/duckdb/src/execution/operator/join/physical_piecewise_merge_join.cpp +3 -3
  297. package/src/duckdb/src/execution/operator/join/physical_range_join.cpp +5 -5
  298. package/src/duckdb/src/execution/operator/join/physical_right_delim_join.cpp +7 -2
  299. package/src/duckdb/src/execution/operator/order/physical_order.cpp +17 -12
  300. package/src/duckdb/src/execution/operator/order/physical_top_n.cpp +12 -9
  301. package/src/duckdb/src/execution/operator/persistent/physical_batch_copy_to_file.cpp +35 -17
  302. package/src/duckdb/src/execution/operator/persistent/physical_batch_insert.cpp +17 -11
  303. package/src/duckdb/src/execution/operator/persistent/physical_copy_database.cpp +5 -1
  304. package/src/duckdb/src/execution/operator/persistent/physical_copy_to_file.cpp +156 -47
  305. package/src/duckdb/src/execution/operator/persistent/physical_insert.cpp +10 -2
  306. package/src/duckdb/src/execution/operator/persistent/physical_update.cpp +1 -3
  307. package/src/duckdb/src/execution/operator/projection/physical_pivot.cpp +2 -2
  308. package/src/duckdb/src/execution/operator/projection/physical_projection.cpp +13 -6
  309. package/src/duckdb/src/execution/operator/projection/physical_tableinout_function.cpp +22 -3
  310. package/src/duckdb/src/execution/operator/projection/physical_unnest.cpp +19 -3
  311. package/src/duckdb/src/execution/operator/scan/physical_column_data_scan.cpp +37 -22
  312. package/src/duckdb/src/execution/operator/scan/physical_table_scan.cpp +77 -21
  313. package/src/duckdb/src/execution/operator/schema/physical_attach.cpp +27 -55
  314. package/src/duckdb/src/execution/operator/schema/physical_create_art_index.cpp +41 -44
  315. package/src/duckdb/src/execution/operator/set/physical_cte.cpp +4 -6
  316. package/src/duckdb/src/execution/operator/set/physical_recursive_cte.cpp +4 -6
  317. package/src/duckdb/src/execution/operator/set/physical_union.cpp +18 -4
  318. package/src/duckdb/src/execution/perfect_aggregate_hashtable.cpp +3 -2
  319. package/src/duckdb/src/execution/physical_operator.cpp +45 -4
  320. package/src/duckdb/src/execution/physical_plan/plan_comparison_join.cpp +18 -7
  321. package/src/duckdb/src/execution/physical_plan/plan_copy_to_file.cpp +8 -3
  322. package/src/duckdb/src/execution/physical_plan/plan_delim_join.cpp +13 -6
  323. package/src/duckdb/src/execution/physical_plan/plan_explain.cpp +3 -3
  324. package/src/duckdb/src/execution/physical_plan/plan_get.cpp +111 -19
  325. package/src/duckdb/src/execution/physical_plan/plan_limit.cpp +19 -2
  326. package/src/duckdb/src/execution/physical_plan/plan_set.cpp +9 -0
  327. package/src/duckdb/src/execution/physical_plan/plan_window.cpp +3 -1
  328. package/src/duckdb/src/execution/physical_plan_generator.cpp +3 -3
  329. package/src/duckdb/src/execution/radix_partitioned_hashtable.cpp +49 -49
  330. package/src/duckdb/src/execution/reservoir_sample.cpp +2 -2
  331. package/src/duckdb/src/execution/window_executor.cpp +556 -318
  332. package/src/duckdb/src/execution/window_segment_tree.cpp +1058 -485
  333. package/src/duckdb/src/function/aggregate/distributive/count.cpp +5 -5
  334. package/src/duckdb/src/function/aggregate/distributive/first.cpp +92 -95
  335. package/src/duckdb/src/function/aggregate/sorted_aggregate_function.cpp +10 -9
  336. package/src/duckdb/src/function/aggregate_function.cpp +8 -0
  337. package/src/duckdb/src/function/cast/cast_function_set.cpp +10 -1
  338. package/src/duckdb/src/function/cast/decimal_cast.cpp +10 -1
  339. package/src/duckdb/src/function/cast/default_casts.cpp +2 -0
  340. package/src/duckdb/src/function/cast/numeric_casts.cpp +3 -0
  341. package/src/duckdb/src/function/cast/string_cast.cpp +8 -5
  342. package/src/duckdb/src/function/cast/time_casts.cpp +2 -2
  343. package/src/duckdb/src/function/cast/union_casts.cpp +1 -1
  344. package/src/duckdb/src/function/cast/varint_casts.cpp +283 -0
  345. package/src/duckdb/src/function/cast/vector_cast_helpers.cpp +3 -1
  346. package/src/duckdb/src/function/cast_rules.cpp +104 -15
  347. package/src/duckdb/src/function/compression_config.cpp +35 -33
  348. package/src/duckdb/src/function/copy_function.cpp +27 -0
  349. package/src/duckdb/src/function/function_binder.cpp +39 -11
  350. package/src/duckdb/src/function/macro_function.cpp +75 -32
  351. package/src/duckdb/src/function/pragma/pragma_queries.cpp +10 -0
  352. package/src/duckdb/src/function/scalar/compressed_materialization/compress_string.cpp +1 -0
  353. package/src/duckdb/src/function/scalar/generic/binning.cpp +507 -0
  354. package/src/duckdb/src/function/scalar/generic/getvariable.cpp +58 -0
  355. package/src/duckdb/src/function/scalar/generic_functions.cpp +1 -0
  356. package/src/duckdb/src/function/scalar/list/contains_or_position.cpp +33 -47
  357. package/src/duckdb/src/function/scalar/list/list_extract.cpp +70 -143
  358. package/src/duckdb/src/function/scalar/list/list_resize.cpp +93 -84
  359. package/src/duckdb/src/function/scalar/list/list_zip.cpp +3 -0
  360. package/src/duckdb/src/function/scalar/operators/arithmetic.cpp +24 -11
  361. package/src/duckdb/src/function/scalar/sequence/nextval.cpp +4 -4
  362. package/src/duckdb/src/function/scalar/strftime_format.cpp +196 -57
  363. package/src/duckdb/src/function/scalar/string/caseconvert.cpp +9 -7
  364. package/src/duckdb/src/function/scalar/string/concat.cpp +239 -123
  365. package/src/duckdb/src/function/scalar/string/concat_ws.cpp +149 -0
  366. package/src/duckdb/src/function/scalar/string/contains.cpp +18 -7
  367. package/src/duckdb/src/function/scalar/string/like.cpp +2 -2
  368. package/src/duckdb/src/function/scalar/string/substring.cpp +6 -11
  369. package/src/duckdb/src/function/scalar/string_functions.cpp +1 -0
  370. package/src/duckdb/src/function/scalar/struct/struct_extract.cpp +7 -3
  371. package/src/duckdb/src/function/scalar/system/aggregate_export.cpp +5 -5
  372. package/src/duckdb/src/function/scalar_function.cpp +5 -2
  373. package/src/duckdb/src/function/scalar_macro_function.cpp +2 -2
  374. package/src/duckdb/src/function/table/arrow/arrow_duck_schema.cpp +20 -39
  375. package/src/duckdb/src/function/table/arrow/arrow_type_info.cpp +135 -0
  376. package/src/duckdb/src/function/table/arrow.cpp +194 -52
  377. package/src/duckdb/src/function/table/arrow_conversion.cpp +212 -69
  378. package/src/duckdb/src/function/table/copy_csv.cpp +43 -14
  379. package/src/duckdb/src/function/table/query_function.cpp +80 -0
  380. package/src/duckdb/src/function/table/range.cpp +222 -142
  381. package/src/duckdb/src/function/table/read_csv.cpp +25 -13
  382. package/src/duckdb/src/function/table/sniff_csv.cpp +55 -35
  383. package/src/duckdb/src/function/table/system/duckdb_constraints.cpp +141 -129
  384. package/src/duckdb/src/function/table/system/duckdb_extensions.cpp +25 -14
  385. package/src/duckdb/src/function/table/system/duckdb_functions.cpp +20 -14
  386. package/src/duckdb/src/function/table/system/duckdb_indexes.cpp +15 -1
  387. package/src/duckdb/src/function/table/system/duckdb_variables.cpp +84 -0
  388. package/src/duckdb/src/function/table/system/test_all_types.cpp +1 -0
  389. package/src/duckdb/src/function/table/system/test_vector_types.cpp +33 -3
  390. package/src/duckdb/src/function/table/system_functions.cpp +1 -0
  391. package/src/duckdb/src/function/table/table_scan.cpp +45 -22
  392. package/src/duckdb/src/function/table/unnest.cpp +2 -2
  393. package/src/duckdb/src/function/table/version/pragma_version.cpp +4 -4
  394. package/src/duckdb/src/function/table_function.cpp +5 -4
  395. package/src/duckdb/src/function/table_macro_function.cpp +2 -2
  396. package/src/duckdb/src/include/duckdb/catalog/catalog.hpp +8 -4
  397. package/src/duckdb/src/include/duckdb/catalog/catalog_entry/duck_index_entry.hpp +5 -2
  398. package/src/duckdb/src/include/duckdb/catalog/catalog_entry/duck_schema_entry.hpp +3 -0
  399. package/src/duckdb/src/include/duckdb/catalog/catalog_entry/index_catalog_entry.hpp +2 -2
  400. package/src/duckdb/src/include/duckdb/catalog/catalog_entry/macro_catalog_entry.hpp +3 -4
  401. package/src/duckdb/src/include/duckdb/catalog/catalog_entry/table_catalog_entry.hpp +5 -5
  402. package/src/duckdb/src/include/duckdb/catalog/default/builtin_types/types.hpp +2 -1
  403. package/src/duckdb/src/include/duckdb/catalog/default/default_functions.hpp +4 -5
  404. package/src/duckdb/src/include/duckdb/catalog/default/default_generator.hpp +4 -5
  405. package/src/duckdb/src/include/duckdb/catalog/default/default_schemas.hpp +2 -1
  406. package/src/duckdb/src/include/duckdb/catalog/default/default_table_functions.hpp +47 -0
  407. package/src/duckdb/src/include/duckdb/catalog/duck_catalog.hpp +2 -0
  408. package/src/duckdb/src/include/duckdb/catalog/similar_catalog_entry.hpp +2 -2
  409. package/src/duckdb/src/include/duckdb/common/allocator.hpp +9 -1
  410. package/src/duckdb/src/include/duckdb/common/array_ptr.hpp +120 -0
  411. package/src/duckdb/src/include/duckdb/common/arrow/appender/append_data.hpp +37 -11
  412. package/src/duckdb/src/include/duckdb/common/arrow/appender/enum_data.hpp +9 -8
  413. package/src/duckdb/src/include/duckdb/common/arrow/appender/list.hpp +1 -0
  414. package/src/duckdb/src/include/duckdb/common/arrow/appender/list_data.hpp +6 -4
  415. package/src/duckdb/src/include/duckdb/common/arrow/appender/list_view_data.hpp +92 -0
  416. package/src/duckdb/src/include/duckdb/common/arrow/appender/map_data.hpp +2 -2
  417. package/src/duckdb/src/include/duckdb/common/arrow/appender/scalar_data.hpp +26 -4
  418. package/src/duckdb/src/include/duckdb/common/arrow/appender/varchar_data.hpp +90 -11
  419. package/src/duckdb/src/include/duckdb/common/arrow/arrow_appender.hpp +6 -6
  420. package/src/duckdb/src/include/duckdb/common/arrow/arrow_buffer.hpp +8 -1
  421. package/src/duckdb/src/include/duckdb/common/arrow/arrow_merge_event.hpp +62 -0
  422. package/src/duckdb/src/include/duckdb/common/arrow/arrow_query_result.hpp +52 -0
  423. package/src/duckdb/src/include/duckdb/common/arrow/arrow_types_extension.hpp +42 -0
  424. package/src/duckdb/src/include/duckdb/common/arrow/physical_arrow_batch_collector.hpp +30 -0
  425. package/src/duckdb/src/include/duckdb/common/arrow/physical_arrow_collector.hpp +65 -0
  426. package/src/duckdb/src/include/duckdb/common/arrow/schema_metadata.hpp +43 -0
  427. package/src/duckdb/src/include/duckdb/common/bswap.hpp +18 -16
  428. package/src/duckdb/src/include/duckdb/common/cgroups.hpp +30 -0
  429. package/src/duckdb/src/include/duckdb/common/compressed_file_system.hpp +3 -0
  430. package/src/duckdb/src/include/duckdb/common/dl.hpp +8 -1
  431. package/src/duckdb/src/include/duckdb/common/encryption_state.hpp +48 -0
  432. package/src/duckdb/src/include/duckdb/common/enum_util.hpp +88 -0
  433. package/src/duckdb/src/include/duckdb/common/enums/checkpoint_type.hpp +2 -2
  434. package/src/duckdb/src/include/duckdb/common/enums/copy_overwrite_mode.hpp +6 -1
  435. package/src/duckdb/src/include/duckdb/common/enums/destroy_buffer_upon.hpp +21 -0
  436. package/src/duckdb/src/include/duckdb/common/enums/explain_format.hpp +17 -0
  437. package/src/duckdb/src/include/duckdb/common/enums/file_compression_type.hpp +4 -0
  438. package/src/duckdb/src/include/duckdb/common/enums/join_type.hpp +2 -2
  439. package/src/duckdb/src/include/duckdb/common/enums/metric_type.hpp +88 -0
  440. package/src/duckdb/src/include/duckdb/common/enums/optimizer_type.hpp +6 -1
  441. package/src/duckdb/src/include/duckdb/common/enums/pending_execution_result.hpp +2 -1
  442. package/src/duckdb/src/include/duckdb/common/enums/physical_operator_type.hpp +1 -0
  443. package/src/duckdb/src/include/duckdb/common/enums/profiler_format.hpp +1 -1
  444. package/src/duckdb/src/include/duckdb/common/enums/relation_type.hpp +3 -1
  445. package/src/duckdb/src/include/duckdb/common/enums/set_scope.hpp +2 -1
  446. package/src/duckdb/src/include/duckdb/common/enums/statement_type.hpp +23 -2
  447. package/src/duckdb/src/include/duckdb/common/enums/stream_execution_result.hpp +25 -0
  448. package/src/duckdb/src/include/duckdb/common/enums/tableref_type.hpp +2 -1
  449. package/src/duckdb/src/include/duckdb/common/enums/wal_type.hpp +1 -0
  450. package/src/duckdb/src/include/duckdb/common/error_data.hpp +5 -2
  451. package/src/duckdb/src/include/duckdb/common/exception/binder_exception.hpp +1 -0
  452. package/src/duckdb/src/include/duckdb/common/exception.hpp +20 -2
  453. package/src/duckdb/src/include/duckdb/common/extra_operator_info.hpp +12 -0
  454. package/src/duckdb/src/include/duckdb/common/file_buffer.hpp +2 -0
  455. package/src/duckdb/src/include/duckdb/common/file_open_flags.hpp +16 -0
  456. package/src/duckdb/src/include/duckdb/common/file_opener.hpp +18 -0
  457. package/src/duckdb/src/include/duckdb/common/file_system.hpp +3 -0
  458. package/src/duckdb/src/include/duckdb/common/filename_pattern.hpp +4 -0
  459. package/src/duckdb/src/include/duckdb/common/fixed_size_map.hpp +160 -96
  460. package/src/duckdb/src/include/duckdb/common/fsst.hpp +9 -2
  461. package/src/duckdb/src/include/duckdb/common/helper.hpp +22 -8
  462. package/src/duckdb/src/include/duckdb/common/hive_partitioning.hpp +16 -7
  463. package/src/duckdb/src/include/duckdb/common/http_util.hpp +19 -0
  464. package/src/duckdb/src/include/duckdb/common/insertion_order_preserving_map.hpp +19 -6
  465. package/src/duckdb/src/include/duckdb/common/limits.hpp +9 -2
  466. package/src/duckdb/src/include/duckdb/common/multi_file_list.hpp +38 -6
  467. package/src/duckdb/src/include/duckdb/common/multi_file_reader.hpp +9 -2
  468. package/src/duckdb/src/include/duckdb/common/multi_file_reader_options.hpp +5 -1
  469. package/src/duckdb/src/include/duckdb/common/numeric_utils.hpp +82 -50
  470. package/src/duckdb/src/include/duckdb/common/operator/abs.hpp +11 -0
  471. package/src/duckdb/src/include/duckdb/common/operator/cast_operators.hpp +7 -3
  472. package/src/duckdb/src/include/duckdb/common/operator/decimal_cast_operators.hpp +23 -1
  473. package/src/duckdb/src/include/duckdb/common/operator/double_cast_operator.hpp +2 -1
  474. package/src/duckdb/src/include/duckdb/common/operator/integer_cast_operator.hpp +1 -1
  475. package/src/duckdb/src/include/duckdb/common/operator/numeric_cast.hpp +4 -0
  476. package/src/duckdb/src/include/duckdb/common/operator/string_cast.hpp +2 -0
  477. package/src/duckdb/src/include/duckdb/common/optional_ptr.hpp +10 -5
  478. package/src/duckdb/src/include/duckdb/common/optionally_owned_ptr.hpp +1 -0
  479. package/src/duckdb/src/include/duckdb/common/owning_string_map.hpp +155 -0
  480. package/src/duckdb/src/include/duckdb/common/perfect_map_set.hpp +2 -3
  481. package/src/duckdb/src/include/duckdb/common/platform.hpp +58 -0
  482. package/src/duckdb/src/include/duckdb/common/radix.hpp +172 -27
  483. package/src/duckdb/src/include/duckdb/common/radix_partitioning.hpp +5 -1
  484. package/src/duckdb/src/include/duckdb/common/random_engine.hpp +1 -0
  485. package/src/duckdb/src/include/duckdb/common/re2_regex.hpp +1 -1
  486. package/src/duckdb/src/include/duckdb/common/render_tree.hpp +77 -0
  487. package/src/duckdb/src/include/duckdb/common/row_operations/row_matcher.hpp +12 -0
  488. package/src/duckdb/src/include/duckdb/common/serializer/binary_serializer.hpp +6 -2
  489. package/src/duckdb/src/include/duckdb/common/serializer/buffered_file_writer.hpp +5 -3
  490. package/src/duckdb/src/include/duckdb/common/serializer/deserializer.hpp +15 -7
  491. package/src/duckdb/src/include/duckdb/common/serializer/memory_stream.hpp +3 -1
  492. package/src/duckdb/src/include/duckdb/common/serializer/serialization_data.hpp +245 -0
  493. package/src/duckdb/src/include/duckdb/common/serializer/serializer.hpp +10 -0
  494. package/src/duckdb/src/include/duckdb/common/sort/duckdb_pdqsort.hpp +10 -11
  495. package/src/duckdb/src/include/duckdb/common/sort/partition_state.hpp +12 -6
  496. package/src/duckdb/src/include/duckdb/common/string_util.hpp +37 -7
  497. package/src/duckdb/src/include/duckdb/common/tree_renderer/graphviz_tree_renderer.hpp +44 -0
  498. package/src/duckdb/src/include/duckdb/common/tree_renderer/html_tree_renderer.hpp +44 -0
  499. package/src/duckdb/src/include/duckdb/common/tree_renderer/json_tree_renderer.hpp +44 -0
  500. package/src/duckdb/src/include/duckdb/common/tree_renderer/text_tree_renderer.hpp +119 -0
  501. package/src/duckdb/src/include/duckdb/common/tree_renderer.hpp +9 -123
  502. package/src/duckdb/src/include/duckdb/common/type_visitor.hpp +96 -0
  503. package/src/duckdb/src/include/duckdb/common/typedefs.hpp +11 -1
  504. package/src/duckdb/src/include/duckdb/common/types/arrow_string_view_type.hpp +84 -0
  505. package/src/duckdb/src/include/duckdb/common/types/batched_data_collection.hpp +36 -1
  506. package/src/duckdb/src/include/duckdb/common/types/bit.hpp +1 -1
  507. package/src/duckdb/src/include/duckdb/common/types/cast_helpers.hpp +2 -2
  508. package/src/duckdb/src/include/duckdb/common/types/column/column_data_allocator.hpp +4 -2
  509. package/src/duckdb/src/include/duckdb/common/types/column/partitioned_column_data.hpp +52 -0
  510. package/src/duckdb/src/include/duckdb/common/types/data_chunk.hpp +2 -0
  511. package/src/duckdb/src/include/duckdb/common/types/date.hpp +0 -3
  512. package/src/duckdb/src/include/duckdb/common/types/date_lookup_cache.hpp +65 -0
  513. package/src/duckdb/src/include/duckdb/common/types/datetime.hpp +5 -2
  514. package/src/duckdb/src/include/duckdb/common/types/hyperloglog.hpp +49 -40
  515. package/src/duckdb/src/include/duckdb/common/types/interval.hpp +5 -1
  516. package/src/duckdb/src/include/duckdb/common/types/list_segment.hpp +2 -1
  517. package/src/duckdb/src/include/duckdb/common/types/row/partitioned_tuple_data.hpp +41 -9
  518. package/src/duckdb/src/include/duckdb/common/types/row/row_data_collection.hpp +4 -3
  519. package/src/duckdb/src/include/duckdb/common/types/row/row_data_collection_scanner.hpp +3 -1
  520. package/src/duckdb/src/include/duckdb/common/types/row/tuple_data_allocator.hpp +4 -0
  521. package/src/duckdb/src/include/duckdb/common/types/row/tuple_data_collection.hpp +4 -0
  522. package/src/duckdb/src/include/duckdb/common/types/row/tuple_data_states.hpp +1 -1
  523. package/src/duckdb/src/include/duckdb/common/types/selection_vector.hpp +4 -0
  524. package/src/duckdb/src/include/duckdb/common/types/string_type.hpp +4 -1
  525. package/src/duckdb/src/include/duckdb/common/types/time.hpp +11 -6
  526. package/src/duckdb/src/include/duckdb/common/types/timestamp.hpp +13 -3
  527. package/src/duckdb/src/include/duckdb/common/types/validity_mask.hpp +103 -12
  528. package/src/duckdb/src/include/duckdb/common/types/value.hpp +12 -3
  529. package/src/duckdb/src/include/duckdb/common/types/varint.hpp +107 -0
  530. package/src/duckdb/src/include/duckdb/common/types/vector.hpp +5 -1
  531. package/src/duckdb/src/include/duckdb/common/types/vector_buffer.hpp +7 -2
  532. package/src/duckdb/src/include/duckdb/common/types.hpp +6 -39
  533. package/src/duckdb/src/include/duckdb/common/union_by_name.hpp +42 -10
  534. package/src/duckdb/src/include/duckdb/common/vector_operations/generic_executor.hpp +29 -0
  535. package/src/duckdb/src/include/duckdb/common/vector_operations/unary_executor.hpp +0 -7
  536. package/src/duckdb/src/include/duckdb/common/vector_operations/vector_operations.hpp +2 -0
  537. package/src/duckdb/src/include/duckdb/common/winapi.hpp +8 -0
  538. package/src/duckdb/src/include/duckdb/core_functions/aggregate/algebraic/covar.hpp +8 -4
  539. package/src/duckdb/src/include/duckdb/core_functions/aggregate/algebraic/stddev.hpp +8 -4
  540. package/src/duckdb/src/include/duckdb/core_functions/aggregate/distributive_functions.hpp +4 -2
  541. package/src/duckdb/src/include/duckdb/core_functions/aggregate/histogram_helpers.hpp +99 -0
  542. package/src/duckdb/src/include/duckdb/core_functions/aggregate/holistic_functions.hpp +16 -7
  543. package/src/duckdb/src/include/duckdb/core_functions/aggregate/minmax_n_helpers.hpp +396 -0
  544. package/src/duckdb/src/include/duckdb/core_functions/aggregate/nested_functions.hpp +10 -0
  545. package/src/duckdb/src/include/duckdb/core_functions/aggregate/quantile_helpers.hpp +65 -0
  546. package/src/duckdb/src/include/duckdb/core_functions/aggregate/quantile_sort_tree.hpp +349 -0
  547. package/src/duckdb/src/include/duckdb/core_functions/aggregate/quantile_state.hpp +300 -0
  548. package/src/duckdb/src/include/duckdb/core_functions/aggregate/regression/regr_slope.hpp +1 -1
  549. package/src/duckdb/src/include/duckdb/core_functions/aggregate/sort_key_helpers.hpp +55 -0
  550. package/src/duckdb/src/include/duckdb/core_functions/array_kernels.hpp +107 -0
  551. package/src/duckdb/src/include/duckdb/core_functions/create_sort_key.hpp +55 -0
  552. package/src/duckdb/src/include/duckdb/core_functions/lambda_functions.hpp +1 -2
  553. package/src/duckdb/src/include/duckdb/core_functions/scalar/array_functions.hpp +24 -0
  554. package/src/duckdb/src/include/duckdb/core_functions/scalar/date_functions.hpp +9 -0
  555. package/src/duckdb/src/include/duckdb/core_functions/scalar/generic_functions.hpp +27 -0
  556. package/src/duckdb/src/include/duckdb/core_functions/scalar/list_functions.hpp +80 -8
  557. package/src/duckdb/src/include/duckdb/core_functions/scalar/map_functions.hpp +9 -0
  558. package/src/duckdb/src/include/duckdb/core_functions/scalar/math_functions.hpp +54 -0
  559. package/src/duckdb/src/include/duckdb/core_functions/scalar/string_functions.hpp +30 -21
  560. package/src/duckdb/src/include/duckdb/execution/adaptive_filter.hpp +25 -14
  561. package/src/duckdb/src/include/duckdb/execution/aggregate_hashtable.hpp +2 -48
  562. package/src/duckdb/src/include/duckdb/execution/executor.hpp +25 -2
  563. package/src/duckdb/src/include/duckdb/execution/ht_entry.hpp +102 -0
  564. package/src/duckdb/src/include/duckdb/execution/index/art/art.hpp +94 -101
  565. package/src/duckdb/src/include/duckdb/execution/index/art/art_key.hpp +43 -25
  566. package/src/duckdb/src/include/duckdb/execution/index/art/base_leaf.hpp +109 -0
  567. package/src/duckdb/src/include/duckdb/execution/index/art/base_node.hpp +140 -0
  568. package/src/duckdb/src/include/duckdb/execution/index/art/iterator.hpp +43 -24
  569. package/src/duckdb/src/include/duckdb/execution/index/art/leaf.hpp +41 -52
  570. package/src/duckdb/src/include/duckdb/execution/index/art/node.hpp +133 -74
  571. package/src/duckdb/src/include/duckdb/execution/index/art/node256.hpp +46 -29
  572. package/src/duckdb/src/include/duckdb/execution/index/art/node256_leaf.hpp +53 -0
  573. package/src/duckdb/src/include/duckdb/execution/index/art/node48.hpp +52 -35
  574. package/src/duckdb/src/include/duckdb/execution/index/art/prefix.hpp +96 -57
  575. package/src/duckdb/src/include/duckdb/execution/index/bound_index.hpp +9 -4
  576. package/src/duckdb/src/include/duckdb/execution/index/fixed_size_allocator.hpp +48 -10
  577. package/src/duckdb/src/include/duckdb/execution/index/fixed_size_buffer.hpp +0 -2
  578. package/src/duckdb/src/include/duckdb/execution/index/index_pointer.hpp +4 -2
  579. package/src/duckdb/src/include/duckdb/execution/join_hashtable.hpp +114 -36
  580. package/src/duckdb/src/include/duckdb/execution/merge_sort_tree.hpp +158 -67
  581. package/src/duckdb/src/include/duckdb/execution/operator/aggregate/aggregate_object.hpp +1 -1
  582. package/src/duckdb/src/include/duckdb/execution/operator/aggregate/physical_hash_aggregate.hpp +1 -1
  583. package/src/duckdb/src/include/duckdb/execution/operator/aggregate/physical_perfecthash_aggregate.hpp +1 -1
  584. package/src/duckdb/src/include/duckdb/execution/operator/aggregate/physical_streaming_window.hpp +19 -2
  585. package/src/duckdb/src/include/duckdb/execution/operator/aggregate/physical_ungrouped_aggregate.hpp +1 -1
  586. package/src/duckdb/src/include/duckdb/execution/operator/aggregate/physical_window.hpp +1 -1
  587. package/src/duckdb/src/include/duckdb/execution/operator/aggregate/ungrouped_aggregate_state.hpp +75 -0
  588. package/src/duckdb/src/include/duckdb/execution/operator/csv_scanner/base_scanner.hpp +81 -23
  589. package/src/duckdb/src/include/duckdb/execution/operator/csv_scanner/column_count_scanner.hpp +27 -8
  590. package/src/duckdb/src/include/duckdb/execution/operator/csv_scanner/csv_buffer_manager.hpp +2 -1
  591. package/src/duckdb/src/include/duckdb/execution/operator/csv_scanner/csv_error.hpp +31 -22
  592. package/src/duckdb/src/include/duckdb/execution/operator/csv_scanner/csv_file_handle.hpp +4 -2
  593. package/src/duckdb/src/include/duckdb/execution/operator/csv_scanner/csv_file_scanner.hpp +48 -5
  594. package/src/duckdb/src/include/duckdb/execution/operator/csv_scanner/csv_option.hpp +7 -3
  595. package/src/duckdb/src/include/duckdb/execution/operator/csv_scanner/csv_reader_options.hpp +22 -12
  596. package/src/duckdb/src/include/duckdb/execution/operator/csv_scanner/csv_schema.hpp +35 -0
  597. package/src/duckdb/src/include/duckdb/execution/operator/csv_scanner/csv_sniffer.hpp +81 -39
  598. package/src/duckdb/src/include/duckdb/execution/operator/csv_scanner/csv_state.hpp +2 -1
  599. package/src/duckdb/src/include/duckdb/execution/operator/csv_scanner/csv_state_machine.hpp +18 -1
  600. package/src/duckdb/src/include/duckdb/execution/operator/csv_scanner/csv_state_machine_cache.hpp +9 -7
  601. package/src/duckdb/src/include/duckdb/execution/operator/csv_scanner/global_csv_state.hpp +5 -4
  602. package/src/duckdb/src/include/duckdb/execution/operator/csv_scanner/header_value.hpp +26 -0
  603. package/src/duckdb/src/include/duckdb/execution/operator/csv_scanner/scanner_boundary.hpp +6 -9
  604. package/src/duckdb/src/include/duckdb/execution/operator/csv_scanner/skip_scanner.hpp +3 -0
  605. package/src/duckdb/src/include/duckdb/execution/operator/csv_scanner/state_machine_options.hpp +5 -3
  606. package/src/duckdb/src/include/duckdb/execution/operator/csv_scanner/string_value_scanner.hpp +36 -19
  607. package/src/duckdb/src/include/duckdb/execution/operator/filter/physical_filter.hpp +1 -1
  608. package/src/duckdb/src/include/duckdb/execution/operator/helper/physical_batch_collector.hpp +21 -0
  609. package/src/duckdb/src/include/duckdb/execution/operator/helper/physical_buffered_batch_collector.hpp +53 -0
  610. package/src/duckdb/src/include/duckdb/execution/operator/helper/physical_buffered_collector.hpp +3 -0
  611. package/src/duckdb/src/include/duckdb/execution/operator/helper/physical_explain_analyze.hpp +6 -2
  612. package/src/duckdb/src/include/duckdb/execution/operator/helper/physical_materialized_collector.hpp +18 -0
  613. package/src/duckdb/src/include/duckdb/execution/operator/helper/physical_reservoir_sample.hpp +1 -1
  614. package/src/duckdb/src/include/duckdb/execution/operator/helper/physical_result_collector.hpp +6 -0
  615. package/src/duckdb/src/include/duckdb/execution/operator/helper/physical_set.hpp +2 -2
  616. package/src/duckdb/src/include/duckdb/execution/operator/helper/physical_set_variable.hpp +43 -0
  617. package/src/duckdb/src/include/duckdb/execution/operator/helper/physical_streaming_sample.hpp +1 -1
  618. package/src/duckdb/src/include/duckdb/execution/operator/join/join_filter_pushdown.hpp +59 -0
  619. package/src/duckdb/src/include/duckdb/execution/operator/join/physical_blockwise_nl_join.hpp +1 -1
  620. package/src/duckdb/src/include/duckdb/execution/operator/join/physical_comparison_join.hpp +8 -1
  621. package/src/duckdb/src/include/duckdb/execution/operator/join/physical_delim_join.hpp +5 -2
  622. package/src/duckdb/src/include/duckdb/execution/operator/join/physical_hash_join.hpp +4 -2
  623. package/src/duckdb/src/include/duckdb/execution/operator/join/physical_iejoin.hpp +2 -0
  624. package/src/duckdb/src/include/duckdb/execution/operator/join/physical_join.hpp +1 -1
  625. package/src/duckdb/src/include/duckdb/execution/operator/join/physical_left_delim_join.hpp +3 -1
  626. package/src/duckdb/src/include/duckdb/execution/operator/join/physical_range_join.hpp +4 -1
  627. package/src/duckdb/src/include/duckdb/execution/operator/join/physical_right_delim_join.hpp +3 -1
  628. package/src/duckdb/src/include/duckdb/execution/operator/order/physical_order.hpp +1 -1
  629. package/src/duckdb/src/include/duckdb/execution/operator/order/physical_top_n.hpp +1 -1
  630. package/src/duckdb/src/include/duckdb/execution/operator/persistent/batch_memory_manager.hpp +5 -37
  631. package/src/duckdb/src/include/duckdb/execution/operator/persistent/physical_batch_copy_to_file.hpp +5 -4
  632. package/src/duckdb/src/include/duckdb/execution/operator/persistent/physical_copy_to_file.hpp +8 -2
  633. package/src/duckdb/src/include/duckdb/execution/operator/projection/physical_projection.hpp +1 -1
  634. package/src/duckdb/src/include/duckdb/execution/operator/projection/physical_tableinout_function.hpp +2 -0
  635. package/src/duckdb/src/include/duckdb/execution/operator/scan/physical_column_data_scan.hpp +9 -3
  636. package/src/duckdb/src/include/duckdb/execution/operator/scan/physical_table_scan.hpp +8 -6
  637. package/src/duckdb/src/include/duckdb/execution/operator/schema/physical_create_art_index.hpp +2 -2
  638. package/src/duckdb/src/include/duckdb/execution/operator/set/physical_cte.hpp +1 -1
  639. package/src/duckdb/src/include/duckdb/execution/operator/set/physical_recursive_cte.hpp +1 -1
  640. package/src/duckdb/src/include/duckdb/execution/physical_operator.hpp +21 -6
  641. package/src/duckdb/src/include/duckdb/execution/physical_operator_states.hpp +3 -2
  642. package/src/duckdb/src/include/duckdb/execution/physical_plan_generator.hpp +3 -0
  643. package/src/duckdb/src/include/duckdb/execution/window_executor.hpp +137 -110
  644. package/src/duckdb/src/include/duckdb/execution/window_segment_tree.hpp +57 -126
  645. package/src/duckdb/src/include/duckdb/function/aggregate_function.hpp +21 -4
  646. package/src/duckdb/src/include/duckdb/function/cast/default_casts.hpp +1 -1
  647. package/src/duckdb/src/include/duckdb/function/compression/compression.hpp +10 -10
  648. package/src/duckdb/src/include/duckdb/function/compression_function.hpp +37 -7
  649. package/src/duckdb/src/include/duckdb/function/copy_function.hpp +24 -11
  650. package/src/duckdb/src/include/duckdb/function/function_binder.hpp +4 -4
  651. package/src/duckdb/src/include/duckdb/function/function_serialization.hpp +41 -1
  652. package/src/duckdb/src/include/duckdb/function/macro_function.hpp +15 -5
  653. package/src/duckdb/src/include/duckdb/function/pragma/pragma_functions.hpp +1 -0
  654. package/src/duckdb/src/include/duckdb/function/replacement_scan.hpp +20 -4
  655. package/src/duckdb/src/include/duckdb/function/scalar/generic_functions.hpp +6 -0
  656. package/src/duckdb/src/include/duckdb/function/scalar/list/contains_or_position.hpp +77 -109
  657. package/src/duckdb/src/include/duckdb/function/scalar/nested_functions.hpp +1 -1
  658. package/src/duckdb/src/include/duckdb/function/scalar/regexp.hpp +6 -3
  659. package/src/duckdb/src/include/duckdb/function/scalar/strftime_format.hpp +25 -12
  660. package/src/duckdb/src/include/duckdb/function/scalar/string_functions.hpp +9 -8
  661. package/src/duckdb/src/include/duckdb/function/scalar_function.hpp +38 -4
  662. package/src/duckdb/src/include/duckdb/function/scalar_macro_function.hpp +1 -1
  663. package/src/duckdb/src/include/duckdb/function/table/arrow/arrow_duck_schema.hpp +11 -57
  664. package/src/duckdb/src/include/duckdb/function/table/arrow/arrow_type_info.hpp +142 -0
  665. package/src/duckdb/src/include/duckdb/function/table/arrow/enum/arrow_datetime_type.hpp +18 -0
  666. package/src/duckdb/src/include/duckdb/function/table/arrow/enum/arrow_type_info_type.hpp +7 -0
  667. package/src/duckdb/src/include/duckdb/function/table/arrow/enum/arrow_variable_size_type.hpp +10 -0
  668. package/src/duckdb/src/include/duckdb/function/table/arrow.hpp +2 -0
  669. package/src/duckdb/src/include/duckdb/function/table/range.hpp +4 -0
  670. package/src/duckdb/src/include/duckdb/function/table/read_csv.hpp +4 -1
  671. package/src/duckdb/src/include/duckdb/function/table/system_functions.hpp +4 -0
  672. package/src/duckdb/src/include/duckdb/function/table/table_scan.hpp +5 -5
  673. package/src/duckdb/src/include/duckdb/function/table_function.hpp +14 -2
  674. package/src/duckdb/src/include/duckdb/function/table_macro_function.hpp +1 -1
  675. package/src/duckdb/src/include/duckdb/main/appender.hpp +14 -4
  676. package/src/duckdb/src/include/duckdb/main/attached_database.hpp +25 -7
  677. package/src/duckdb/src/include/duckdb/main/buffered_data/batched_buffered_data.hpp +79 -0
  678. package/src/duckdb/src/include/duckdb/main/buffered_data/buffered_data.hpp +10 -20
  679. package/src/duckdb/src/include/duckdb/main/buffered_data/simple_buffered_data.hpp +11 -12
  680. package/src/duckdb/src/include/duckdb/main/capi/capi_internal.hpp +7 -2
  681. package/src/duckdb/src/include/duckdb/main/capi/cast/generic.hpp +1 -1
  682. package/src/duckdb/src/include/duckdb/main/capi/cast/utils.hpp +2 -2
  683. package/src/duckdb/src/include/duckdb/main/capi/extension_api.hpp +809 -0
  684. package/src/duckdb/src/include/duckdb/main/chunk_scan_state/batched_data_collection.hpp +35 -0
  685. package/src/duckdb/src/include/duckdb/main/client_config.hpp +68 -2
  686. package/src/duckdb/src/include/duckdb/main/client_context.hpp +30 -22
  687. package/src/duckdb/src/include/duckdb/main/client_context_state.hpp +79 -1
  688. package/src/duckdb/src/include/duckdb/main/client_properties.hpp +9 -3
  689. package/src/duckdb/src/include/duckdb/main/config.hpp +55 -7
  690. package/src/duckdb/src/include/duckdb/main/connection.hpp +5 -1
  691. package/src/duckdb/src/include/duckdb/main/database.hpp +16 -5
  692. package/src/duckdb/src/include/duckdb/main/database_manager.hpp +9 -8
  693. package/src/duckdb/src/include/duckdb/main/db_instance_cache.hpp +21 -6
  694. package/src/duckdb/src/include/duckdb/main/extension.hpp +20 -0
  695. package/src/duckdb/src/include/duckdb/main/extension_entries.hpp +25 -0
  696. package/src/duckdb/src/include/duckdb/main/extension_helper.hpp +29 -23
  697. package/src/duckdb/src/include/duckdb/main/extension_install_info.hpp +6 -0
  698. package/src/duckdb/src/include/duckdb/main/extension_util.hpp +3 -0
  699. package/src/duckdb/src/include/duckdb/main/pending_query_result.hpp +4 -2
  700. package/src/duckdb/src/include/duckdb/main/prepared_statement.hpp +5 -6
  701. package/src/duckdb/src/include/duckdb/main/prepared_statement_data.hpp +2 -5
  702. package/src/duckdb/src/include/duckdb/main/profiling_info.hpp +87 -0
  703. package/src/duckdb/src/include/duckdb/main/profiling_node.hpp +60 -0
  704. package/src/duckdb/src/include/duckdb/main/query_profiler.hpp +72 -34
  705. package/src/duckdb/src/include/duckdb/main/query_result.hpp +1 -1
  706. package/src/duckdb/src/include/duckdb/main/relation/create_table_relation.hpp +2 -1
  707. package/src/duckdb/src/include/duckdb/main/relation/delim_get_relation.hpp +30 -0
  708. package/src/duckdb/src/include/duckdb/main/relation/explain_relation.hpp +3 -1
  709. package/src/duckdb/src/include/duckdb/main/relation/join_relation.hpp +3 -0
  710. package/src/duckdb/src/include/duckdb/main/relation/materialized_relation.hpp +1 -4
  711. package/src/duckdb/src/include/duckdb/main/relation/query_relation.hpp +4 -1
  712. package/src/duckdb/src/include/duckdb/main/relation/read_json_relation.hpp +6 -0
  713. package/src/duckdb/src/include/duckdb/main/relation/table_function_relation.hpp +1 -0
  714. package/src/duckdb/src/include/duckdb/main/relation/view_relation.hpp +2 -0
  715. package/src/duckdb/src/include/duckdb/main/relation.hpp +7 -4
  716. package/src/duckdb/src/include/duckdb/main/secret/default_secrets.hpp +36 -0
  717. package/src/duckdb/src/include/duckdb/main/secret/secret.hpp +108 -0
  718. package/src/duckdb/src/include/duckdb/main/secret/secret_manager.hpp +14 -4
  719. package/src/duckdb/src/include/duckdb/main/settings.hpp +227 -3
  720. package/src/duckdb/src/include/duckdb/main/stream_query_result.hpp +8 -0
  721. package/src/duckdb/src/include/duckdb/optimizer/build_probe_side_optimizer.hpp +51 -0
  722. package/src/duckdb/src/include/duckdb/optimizer/compressed_materialization.hpp +7 -0
  723. package/src/duckdb/src/include/duckdb/optimizer/cte_filter_pusher.hpp +46 -0
  724. package/src/duckdb/src/include/duckdb/optimizer/filter_combiner.hpp +1 -1
  725. package/src/duckdb/src/include/duckdb/optimizer/filter_pushdown.hpp +7 -0
  726. package/src/duckdb/src/include/duckdb/optimizer/join_filter_pushdown_optimizer.hpp +31 -0
  727. package/src/duckdb/src/include/duckdb/optimizer/join_order/cardinality_estimator.hpp +51 -10
  728. package/src/duckdb/src/include/duckdb/optimizer/join_order/cost_model.hpp +1 -0
  729. package/src/duckdb/src/include/duckdb/optimizer/join_order/join_order_optimizer.hpp +17 -5
  730. package/src/duckdb/src/include/duckdb/optimizer/join_order/query_graph.hpp +1 -1
  731. package/src/duckdb/src/include/duckdb/optimizer/join_order/query_graph_manager.hpp +15 -13
  732. package/src/duckdb/src/include/duckdb/optimizer/join_order/relation_manager.hpp +9 -4
  733. package/src/duckdb/src/include/duckdb/optimizer/limit_pushdown.hpp +25 -0
  734. package/src/duckdb/src/include/duckdb/optimizer/optimizer.hpp +1 -0
  735. package/src/duckdb/src/include/duckdb/optimizer/rule/join_dependent_filter.hpp +37 -0
  736. package/src/duckdb/src/include/duckdb/parallel/executor_task.hpp +6 -1
  737. package/src/duckdb/src/include/duckdb/parallel/interrupt.hpp +54 -2
  738. package/src/duckdb/src/include/duckdb/parallel/meta_pipeline.hpp +27 -8
  739. package/src/duckdb/src/include/duckdb/parallel/pipeline.hpp +1 -0
  740. package/src/duckdb/src/include/duckdb/parallel/pipeline_prepare_finish_event.hpp +25 -0
  741. package/src/duckdb/src/include/duckdb/parallel/task_executor.hpp +63 -0
  742. package/src/duckdb/src/include/duckdb/parallel/task_scheduler.hpp +10 -1
  743. package/src/duckdb/src/include/duckdb/parser/expression/function_expression.hpp +4 -1
  744. package/src/duckdb/src/include/duckdb/parser/expression/star_expression.hpp +5 -0
  745. package/src/duckdb/src/include/duckdb/parser/parsed_data/alter_table_info.hpp +5 -0
  746. package/src/duckdb/src/include/duckdb/parser/parsed_data/attach_info.hpp +5 -0
  747. package/src/duckdb/src/include/duckdb/parser/parsed_data/create_index_info.hpp +2 -0
  748. package/src/duckdb/src/include/duckdb/parser/parsed_data/create_macro_info.hpp +11 -1
  749. package/src/duckdb/src/include/duckdb/parser/parsed_data/transaction_info.hpp +9 -0
  750. package/src/duckdb/src/include/duckdb/parser/parsed_expression_iterator.hpp +13 -6
  751. package/src/duckdb/src/include/duckdb/parser/parser_extension.hpp +1 -1
  752. package/src/duckdb/src/include/duckdb/parser/sql_statement.hpp +1 -3
  753. package/src/duckdb/src/include/duckdb/parser/statement/copy_statement.hpp +2 -0
  754. package/src/duckdb/src/include/duckdb/parser/statement/explain_statement.hpp +5 -1
  755. package/src/duckdb/src/include/duckdb/parser/statement/set_statement.hpp +2 -2
  756. package/src/duckdb/src/include/duckdb/parser/statement/transaction_statement.hpp +1 -1
  757. package/src/duckdb/src/include/duckdb/parser/tableref/basetableref.hpp +0 -2
  758. package/src/duckdb/src/include/duckdb/parser/tableref/column_data_ref.hpp +9 -7
  759. package/src/duckdb/src/include/duckdb/parser/tableref/delimgetref.hpp +37 -0
  760. package/src/duckdb/src/include/duckdb/parser/tableref/joinref.hpp +4 -0
  761. package/src/duckdb/src/include/duckdb/parser/tableref/pivotref.hpp +0 -2
  762. package/src/duckdb/src/include/duckdb/parser/tableref/subqueryref.hpp +0 -2
  763. package/src/duckdb/src/include/duckdb/parser/tableref/table_function_ref.hpp +0 -1
  764. package/src/duckdb/src/include/duckdb/parser/tableref.hpp +3 -1
  765. package/src/duckdb/src/include/duckdb/parser/transformer.hpp +17 -9
  766. package/src/duckdb/src/include/duckdb/planner/binder.hpp +24 -14
  767. package/src/duckdb/src/include/duckdb/planner/collation_binding.hpp +44 -0
  768. package/src/duckdb/src/include/duckdb/planner/expression/bound_aggregate_expression.hpp +1 -1
  769. package/src/duckdb/src/include/duckdb/planner/expression/bound_between_expression.hpp +1 -1
  770. package/src/duckdb/src/include/duckdb/planner/expression/bound_case_expression.hpp +1 -1
  771. package/src/duckdb/src/include/duckdb/planner/expression/bound_cast_expression.hpp +1 -1
  772. package/src/duckdb/src/include/duckdb/planner/expression/bound_columnref_expression.hpp +1 -1
  773. package/src/duckdb/src/include/duckdb/planner/expression/bound_comparison_expression.hpp +1 -1
  774. package/src/duckdb/src/include/duckdb/planner/expression/bound_conjunction_expression.hpp +1 -1
  775. package/src/duckdb/src/include/duckdb/planner/expression/bound_constant_expression.hpp +1 -1
  776. package/src/duckdb/src/include/duckdb/planner/expression/bound_default_expression.hpp +1 -1
  777. package/src/duckdb/src/include/duckdb/planner/expression/bound_expanded_expression.hpp +1 -1
  778. package/src/duckdb/src/include/duckdb/planner/expression/bound_function_expression.hpp +1 -1
  779. package/src/duckdb/src/include/duckdb/planner/expression/bound_lambda_expression.hpp +1 -1
  780. package/src/duckdb/src/include/duckdb/planner/expression/bound_lambdaref_expression.hpp +1 -1
  781. package/src/duckdb/src/include/duckdb/planner/expression/bound_operator_expression.hpp +1 -1
  782. package/src/duckdb/src/include/duckdb/planner/expression/bound_parameter_data.hpp +2 -0
  783. package/src/duckdb/src/include/duckdb/planner/expression/bound_parameter_expression.hpp +1 -1
  784. package/src/duckdb/src/include/duckdb/planner/expression/bound_reference_expression.hpp +1 -1
  785. package/src/duckdb/src/include/duckdb/planner/expression/bound_subquery_expression.hpp +2 -2
  786. package/src/duckdb/src/include/duckdb/planner/expression/bound_unnest_expression.hpp +1 -1
  787. package/src/duckdb/src/include/duckdb/planner/expression/bound_window_expression.hpp +1 -1
  788. package/src/duckdb/src/include/duckdb/planner/expression.hpp +2 -2
  789. package/src/duckdb/src/include/duckdb/planner/expression_binder/column_alias_binder.hpp +2 -0
  790. package/src/duckdb/src/include/duckdb/planner/expression_binder/group_binder.hpp +1 -0
  791. package/src/duckdb/src/include/duckdb/planner/expression_binder/order_binder.hpp +6 -5
  792. package/src/duckdb/src/include/duckdb/planner/expression_binder/where_binder.hpp +1 -0
  793. package/src/duckdb/src/include/duckdb/planner/expression_binder.hpp +19 -11
  794. package/src/duckdb/src/include/duckdb/planner/filter/conjunction_filter.hpp +4 -0
  795. package/src/duckdb/src/include/duckdb/planner/filter/constant_filter.hpp +2 -0
  796. package/src/duckdb/src/include/duckdb/planner/filter/null_filter.hpp +4 -0
  797. package/src/duckdb/src/include/duckdb/planner/filter/struct_filter.hpp +2 -0
  798. package/src/duckdb/src/include/duckdb/planner/logical_operator.hpp +7 -2
  799. package/src/duckdb/src/include/duckdb/planner/logical_operator_visitor.hpp +2 -1
  800. package/src/duckdb/src/include/duckdb/planner/operator/logical_aggregate.hpp +1 -1
  801. package/src/duckdb/src/include/duckdb/planner/operator/logical_any_join.hpp +1 -1
  802. package/src/duckdb/src/include/duckdb/planner/operator/logical_comparison_join.hpp +6 -1
  803. package/src/duckdb/src/include/duckdb/planner/operator/logical_copy_to_file.hpp +10 -2
  804. package/src/duckdb/src/include/duckdb/planner/operator/logical_cteref.hpp +1 -0
  805. package/src/duckdb/src/include/duckdb/planner/operator/logical_delim_get.hpp +1 -1
  806. package/src/duckdb/src/include/duckdb/planner/operator/logical_distinct.hpp +1 -1
  807. package/src/duckdb/src/include/duckdb/planner/operator/logical_execute.hpp +1 -1
  808. package/src/duckdb/src/include/duckdb/planner/operator/logical_explain.hpp +4 -2
  809. package/src/duckdb/src/include/duckdb/planner/operator/logical_get.hpp +15 -5
  810. package/src/duckdb/src/include/duckdb/planner/operator/logical_materialized_cte.hpp +1 -0
  811. package/src/duckdb/src/include/duckdb/planner/operator/logical_order.hpp +1 -1
  812. package/src/duckdb/src/include/duckdb/planner/subquery/flatten_dependent_join.hpp +2 -1
  813. package/src/duckdb/src/include/duckdb/planner/table_filter.hpp +24 -2
  814. package/src/duckdb/src/include/duckdb/planner/tableref/bound_delimgetref.hpp +26 -0
  815. package/src/duckdb/src/include/duckdb/planner/tableref/bound_joinref.hpp +6 -0
  816. package/src/duckdb/src/include/duckdb/planner/tableref/bound_subqueryref.hpp +1 -1
  817. package/src/duckdb/src/include/duckdb/planner/tableref/bound_table_function.hpp +2 -0
  818. package/src/duckdb/src/include/duckdb/planner/tableref/list.hpp +2 -0
  819. package/src/duckdb/src/include/duckdb/storage/arena_allocator.hpp +2 -1
  820. package/src/duckdb/src/include/duckdb/storage/block.hpp +4 -2
  821. package/src/duckdb/src/include/duckdb/storage/block_manager.hpp +48 -3
  822. package/src/duckdb/src/include/duckdb/storage/buffer/block_handle.hpp +21 -7
  823. package/src/duckdb/src/include/duckdb/storage/buffer/buffer_pool.hpp +65 -51
  824. package/src/duckdb/src/include/duckdb/storage/buffer_manager.hpp +14 -5
  825. package/src/duckdb/src/include/duckdb/storage/checkpoint/row_group_writer.hpp +0 -4
  826. package/src/duckdb/src/include/duckdb/storage/checkpoint/string_checkpoint_state.hpp +3 -2
  827. package/src/duckdb/src/include/duckdb/storage/checkpoint/table_data_writer.hpp +1 -0
  828. package/src/duckdb/src/include/duckdb/storage/checkpoint/write_overflow_strings_to_disk.hpp +3 -4
  829. package/src/duckdb/src/include/duckdb/storage/checkpoint_manager.hpp +2 -0
  830. package/src/duckdb/src/include/duckdb/storage/compression/alp/algorithm/alp.hpp +4 -4
  831. package/src/duckdb/src/include/duckdb/storage/compression/alp/alp_analyze.hpp +6 -4
  832. package/src/duckdb/src/include/duckdb/storage/compression/alp/alp_compress.hpp +19 -17
  833. package/src/duckdb/src/include/duckdb/storage/compression/alp/alp_constants.hpp +2 -2
  834. package/src/duckdb/src/include/duckdb/storage/compression/alp/alp_scan.hpp +3 -4
  835. package/src/duckdb/src/include/duckdb/storage/compression/alp/alp_utils.hpp +3 -2
  836. package/src/duckdb/src/include/duckdb/storage/compression/alprd/algorithm/alprd.hpp +3 -2
  837. package/src/duckdb/src/include/duckdb/storage/compression/alprd/alprd_analyze.hpp +13 -11
  838. package/src/duckdb/src/include/duckdb/storage/compression/alprd/alprd_compress.hpp +19 -19
  839. package/src/duckdb/src/include/duckdb/storage/compression/alprd/alprd_scan.hpp +3 -4
  840. package/src/duckdb/src/include/duckdb/storage/compression/chimp/chimp_scan.hpp +1 -1
  841. package/src/duckdb/src/include/duckdb/storage/compression/patas/patas_scan.hpp +1 -1
  842. package/src/duckdb/src/include/duckdb/storage/data_pointer.hpp +10 -2
  843. package/src/duckdb/src/include/duckdb/storage/data_table.hpp +3 -2
  844. package/src/duckdb/src/include/duckdb/storage/in_memory_block_manager.hpp +15 -0
  845. package/src/duckdb/src/include/duckdb/storage/index_storage_info.hpp +14 -10
  846. package/src/duckdb/src/include/duckdb/storage/metadata/metadata_manager.hpp +6 -8
  847. package/src/duckdb/src/include/duckdb/storage/partial_block_manager.hpp +7 -4
  848. package/src/duckdb/src/include/duckdb/storage/segment/uncompressed.hpp +4 -7
  849. package/src/duckdb/src/include/duckdb/storage/single_file_block_manager.hpp +29 -4
  850. package/src/duckdb/src/include/duckdb/storage/standard_buffer_manager.hpp +22 -7
  851. package/src/duckdb/src/include/duckdb/storage/statistics/base_statistics.hpp +15 -2
  852. package/src/duckdb/src/include/duckdb/storage/statistics/distinct_statistics.hpp +8 -2
  853. package/src/duckdb/src/include/duckdb/storage/statistics/numeric_stats.hpp +5 -16
  854. package/src/duckdb/src/include/duckdb/storage/statistics/numeric_stats_union.hpp +51 -13
  855. package/src/duckdb/src/include/duckdb/storage/statistics/string_stats.hpp +6 -3
  856. package/src/duckdb/src/include/duckdb/storage/storage_info.hpp +29 -19
  857. package/src/duckdb/src/include/duckdb/storage/storage_manager.hpp +23 -7
  858. package/src/duckdb/src/include/duckdb/storage/string_uncompressed.hpp +27 -18
  859. package/src/duckdb/src/include/duckdb/storage/table/append_state.hpp +6 -3
  860. package/src/duckdb/src/include/duckdb/storage/table/array_column_data.hpp +5 -2
  861. package/src/duckdb/src/include/duckdb/storage/table/chunk_info.hpp +3 -0
  862. package/src/duckdb/src/include/duckdb/storage/table/column_checkpoint_state.hpp +5 -1
  863. package/src/duckdb/src/include/duckdb/storage/table/column_data.hpp +77 -6
  864. package/src/duckdb/src/include/duckdb/storage/table/column_segment.hpp +23 -11
  865. package/src/duckdb/src/include/duckdb/storage/table/data_table_info.hpp +3 -0
  866. package/src/duckdb/src/include/duckdb/storage/table/list_column_data.hpp +5 -2
  867. package/src/duckdb/src/include/duckdb/storage/table/row_group.hpp +18 -4
  868. package/src/duckdb/src/include/duckdb/storage/table/row_group_collection.hpp +7 -1
  869. package/src/duckdb/src/include/duckdb/storage/table/row_version_manager.hpp +2 -1
  870. package/src/duckdb/src/include/duckdb/storage/table/scan_state.hpp +89 -14
  871. package/src/duckdb/src/include/duckdb/storage/table/standard_column_data.hpp +4 -2
  872. package/src/duckdb/src/include/duckdb/storage/table/struct_column_data.hpp +4 -2
  873. package/src/duckdb/src/include/duckdb/storage/table/table_index_list.hpp +2 -2
  874. package/src/duckdb/src/include/duckdb/storage/table/validity_column_data.hpp +1 -1
  875. package/src/duckdb/src/include/duckdb/storage/temporary_memory_manager.hpp +33 -15
  876. package/src/duckdb/src/include/duckdb/storage/write_ahead_log.hpp +9 -9
  877. package/src/duckdb/src/include/duckdb/transaction/cleanup_state.hpp +3 -1
  878. package/src/duckdb/src/include/duckdb/transaction/commit_state.hpp +4 -16
  879. package/src/duckdb/src/include/duckdb/transaction/duck_transaction.hpp +27 -4
  880. package/src/duckdb/src/include/duckdb/transaction/duck_transaction_manager.hpp +11 -0
  881. package/src/duckdb/src/include/duckdb/transaction/local_storage.hpp +6 -2
  882. package/src/duckdb/src/include/duckdb/transaction/meta_transaction.hpp +5 -5
  883. package/src/duckdb/src/include/duckdb/transaction/transaction_context.hpp +6 -2
  884. package/src/duckdb/src/include/duckdb/transaction/undo_buffer.hpp +5 -3
  885. package/src/duckdb/src/include/duckdb/transaction/wal_write_state.hpp +48 -0
  886. package/src/duckdb/src/include/duckdb.h +1779 -739
  887. package/src/duckdb/src/include/duckdb_extension.h +921 -0
  888. package/src/duckdb/src/main/appender.cpp +53 -7
  889. package/src/duckdb/src/main/attached_database.cpp +87 -17
  890. package/src/duckdb/src/main/buffered_data/batched_buffered_data.cpp +226 -0
  891. package/src/duckdb/src/main/buffered_data/buffered_data.cpp +35 -0
  892. package/src/duckdb/src/main/buffered_data/simple_buffered_data.cpp +48 -23
  893. package/src/duckdb/src/main/capi/aggregate_function-c.cpp +327 -0
  894. package/src/duckdb/src/main/capi/appender-c.cpp +18 -0
  895. package/src/duckdb/src/main/capi/cast/utils-c.cpp +2 -2
  896. package/src/duckdb/src/main/capi/cast_function-c.cpp +210 -0
  897. package/src/duckdb/src/main/capi/config-c.cpp +3 -3
  898. package/src/duckdb/src/main/capi/data_chunk-c.cpp +18 -7
  899. package/src/duckdb/src/main/capi/duckdb_value-c.cpp +223 -24
  900. package/src/duckdb/src/main/capi/helper-c.cpp +51 -11
  901. package/src/duckdb/src/main/capi/logical_types-c.cpp +105 -46
  902. package/src/duckdb/src/main/capi/pending-c.cpp +7 -6
  903. package/src/duckdb/src/main/capi/prepared-c.cpp +18 -7
  904. package/src/duckdb/src/main/capi/profiling_info-c.cpp +84 -0
  905. package/src/duckdb/src/main/capi/result-c.cpp +139 -37
  906. package/src/duckdb/src/main/capi/scalar_function-c.cpp +269 -0
  907. package/src/duckdb/src/main/capi/table_description-c.cpp +82 -0
  908. package/src/duckdb/src/main/capi/table_function-c.cpp +161 -95
  909. package/src/duckdb/src/main/capi/value-c.cpp +2 -2
  910. package/src/duckdb/src/main/chunk_scan_state/batched_data_collection.cpp +57 -0
  911. package/src/duckdb/src/main/client_config.cpp +17 -0
  912. package/src/duckdb/src/main/client_context.cpp +67 -52
  913. package/src/duckdb/src/main/client_data.cpp +3 -3
  914. package/src/duckdb/src/main/config.cpp +120 -62
  915. package/src/duckdb/src/main/connection.cpp +14 -2
  916. package/src/duckdb/src/main/database.cpp +96 -35
  917. package/src/duckdb/src/main/database_manager.cpp +25 -23
  918. package/src/duckdb/src/main/database_path_and_type.cpp +2 -2
  919. package/src/duckdb/src/main/db_instance_cache.cpp +54 -19
  920. package/src/duckdb/src/main/extension/extension_helper.cpp +47 -42
  921. package/src/duckdb/src/main/extension/extension_install.cpp +155 -87
  922. package/src/duckdb/src/main/extension/extension_load.cpp +180 -26
  923. package/src/duckdb/src/main/extension/extension_util.cpp +8 -0
  924. package/src/duckdb/src/main/extension.cpp +72 -5
  925. package/src/duckdb/src/main/pending_query_result.cpp +20 -12
  926. package/src/duckdb/src/main/prepared_statement.cpp +6 -6
  927. package/src/duckdb/src/main/prepared_statement_data.cpp +28 -17
  928. package/src/duckdb/src/main/profiling_info.cpp +196 -0
  929. package/src/duckdb/src/main/query_profiler.cpp +413 -224
  930. package/src/duckdb/src/main/query_result.cpp +1 -1
  931. package/src/duckdb/src/main/relation/create_table_relation.cpp +4 -2
  932. package/src/duckdb/src/main/relation/create_view_relation.cpp +0 -6
  933. package/src/duckdb/src/main/relation/delim_get_relation.cpp +44 -0
  934. package/src/duckdb/src/main/relation/explain_relation.cpp +4 -3
  935. package/src/duckdb/src/main/relation/join_relation.cpp +5 -0
  936. package/src/duckdb/src/main/relation/limit_relation.cpp +1 -1
  937. package/src/duckdb/src/main/relation/materialized_relation.cpp +3 -3
  938. package/src/duckdb/src/main/relation/query_relation.cpp +42 -15
  939. package/src/duckdb/src/main/relation/read_csv_relation.cpp +7 -14
  940. package/src/duckdb/src/main/relation/read_json_relation.cpp +20 -0
  941. package/src/duckdb/src/main/relation/setop_relation.cpp +1 -1
  942. package/src/duckdb/src/main/relation/table_function_relation.cpp +6 -0
  943. package/src/duckdb/src/main/relation/view_relation.cpp +10 -0
  944. package/src/duckdb/src/main/relation.cpp +12 -8
  945. package/src/duckdb/src/main/secret/default_secrets.cpp +108 -0
  946. package/src/duckdb/src/main/secret/secret.cpp +145 -2
  947. package/src/duckdb/src/main/secret/secret_manager.cpp +85 -35
  948. package/src/duckdb/src/main/secret/secret_storage.cpp +29 -17
  949. package/src/duckdb/src/main/settings/settings.cpp +503 -11
  950. package/src/duckdb/src/main/stream_query_result.cpp +75 -2
  951. package/src/duckdb/src/optimizer/build_probe_side_optimizer.cpp +248 -0
  952. package/src/duckdb/src/optimizer/column_lifetime_analyzer.cpp +28 -6
  953. package/src/duckdb/src/optimizer/compressed_materialization/compress_comparison_join.cpp +152 -0
  954. package/src/duckdb/src/optimizer/compressed_materialization.cpp +11 -1
  955. package/src/duckdb/src/optimizer/cse_optimizer.cpp +3 -0
  956. package/src/duckdb/src/optimizer/cte_filter_pusher.cpp +117 -0
  957. package/src/duckdb/src/optimizer/filter_combiner.cpp +30 -9
  958. package/src/duckdb/src/optimizer/filter_pullup.cpp +54 -2
  959. package/src/duckdb/src/optimizer/filter_pushdown.cpp +71 -3
  960. package/src/duckdb/src/optimizer/join_filter_pushdown_optimizer.cpp +154 -0
  961. package/src/duckdb/src/optimizer/join_order/cardinality_estimator.cpp +245 -114
  962. package/src/duckdb/src/optimizer/join_order/join_order_optimizer.cpp +42 -20
  963. package/src/duckdb/src/optimizer/join_order/join_relation_set.cpp +6 -2
  964. package/src/duckdb/src/optimizer/join_order/plan_enumerator.cpp +32 -10
  965. package/src/duckdb/src/optimizer/join_order/query_graph_manager.cpp +97 -131
  966. package/src/duckdb/src/optimizer/join_order/relation_manager.cpp +265 -51
  967. package/src/duckdb/src/optimizer/join_order/relation_statistics_helper.cpp +21 -17
  968. package/src/duckdb/src/optimizer/limit_pushdown.cpp +42 -0
  969. package/src/duckdb/src/optimizer/optimizer.cpp +51 -8
  970. package/src/duckdb/src/optimizer/pushdown/pushdown_aggregate.cpp +17 -17
  971. package/src/duckdb/src/optimizer/pushdown/pushdown_cross_product.cpp +22 -4
  972. package/src/duckdb/src/optimizer/pushdown/pushdown_get.cpp +1 -18
  973. package/src/duckdb/src/optimizer/pushdown/pushdown_inner_join.cpp +6 -0
  974. package/src/duckdb/src/optimizer/pushdown/pushdown_mark_join.cpp +4 -2
  975. package/src/duckdb/src/optimizer/pushdown/pushdown_window.cpp +91 -0
  976. package/src/duckdb/src/optimizer/remove_unused_columns.cpp +21 -25
  977. package/src/duckdb/src/optimizer/rule/comparison_simplification.cpp +1 -0
  978. package/src/duckdb/src/optimizer/rule/empty_needle_removal.cpp +3 -0
  979. package/src/duckdb/src/optimizer/rule/equal_or_null_simplification.cpp +2 -2
  980. package/src/duckdb/src/optimizer/rule/in_clause_simplification_rule.cpp +8 -2
  981. package/src/duckdb/src/optimizer/rule/join_dependent_filter.cpp +135 -0
  982. package/src/duckdb/src/optimizer/rule/like_optimizations.cpp +1 -1
  983. package/src/duckdb/src/optimizer/rule/regex_optimizations.cpp +1 -1
  984. package/src/duckdb/src/optimizer/statistics/operator/propagate_filter.cpp +6 -1
  985. package/src/duckdb/src/optimizer/statistics/operator/propagate_get.cpp +7 -6
  986. package/src/duckdb/src/optimizer/statistics/operator/propagate_join.cpp +1 -1
  987. package/src/duckdb/src/optimizer/topn_optimizer.cpp +46 -7
  988. package/src/duckdb/src/parallel/executor.cpp +129 -51
  989. package/src/duckdb/src/parallel/executor_task.cpp +16 -3
  990. package/src/duckdb/src/parallel/meta_pipeline.cpp +98 -29
  991. package/src/duckdb/src/parallel/pipeline.cpp +17 -3
  992. package/src/duckdb/src/parallel/pipeline_executor.cpp +14 -2
  993. package/src/duckdb/src/parallel/pipeline_prepare_finish_event.cpp +34 -0
  994. package/src/duckdb/src/parallel/task_executor.cpp +84 -0
  995. package/src/duckdb/src/parallel/task_scheduler.cpp +94 -16
  996. package/src/duckdb/src/parallel/thread_context.cpp +1 -1
  997. package/src/duckdb/src/parser/expression/function_expression.cpp +14 -0
  998. package/src/duckdb/src/parser/expression/star_expression.cpp +35 -2
  999. package/src/duckdb/src/parser/parsed_data/alter_table_info.cpp +5 -1
  1000. package/src/duckdb/src/parser/parsed_data/attach_info.cpp +17 -0
  1001. package/src/duckdb/src/parser/parsed_data/create_index_info.cpp +37 -28
  1002. package/src/duckdb/src/parser/parsed_data/create_macro_info.cpp +44 -2
  1003. package/src/duckdb/src/parser/parsed_data/transaction_info.cpp +21 -1
  1004. package/src/duckdb/src/parser/parsed_expression_iterator.cpp +29 -25
  1005. package/src/duckdb/src/parser/parser.cpp +41 -1
  1006. package/src/duckdb/src/parser/query_node/recursive_cte_node.cpp +1 -0
  1007. package/src/duckdb/src/parser/statement/explain_statement.cpp +28 -13
  1008. package/src/duckdb/src/parser/statement/relation_statement.cpp +5 -0
  1009. package/src/duckdb/src/parser/statement/set_statement.cpp +4 -2
  1010. package/src/duckdb/src/parser/statement/transaction_statement.cpp +3 -3
  1011. package/src/duckdb/src/parser/tableref/column_data_ref.cpp +1 -27
  1012. package/src/duckdb/src/parser/tableref/delimgetref.cpp +30 -0
  1013. package/src/duckdb/src/parser/tableref/joinref.cpp +4 -0
  1014. package/src/duckdb/src/parser/transform/constraint/transform_constraint.cpp +35 -29
  1015. package/src/duckdb/src/parser/transform/expression/transform_array_access.cpp +32 -32
  1016. package/src/duckdb/src/parser/transform/expression/transform_columnref.cpp +2 -1
  1017. package/src/duckdb/src/parser/transform/expression/transform_constant.cpp +17 -0
  1018. package/src/duckdb/src/parser/transform/expression/transform_function.cpp +5 -0
  1019. package/src/duckdb/src/parser/transform/expression/transform_multi_assign_reference.cpp +36 -34
  1020. package/src/duckdb/src/parser/transform/expression/transform_operator.cpp +30 -14
  1021. package/src/duckdb/src/parser/transform/expression/transform_subquery.cpp +1 -1
  1022. package/src/duckdb/src/parser/transform/helpers/transform_alias.cpp +2 -1
  1023. package/src/duckdb/src/parser/transform/helpers/transform_cte.cpp +27 -19
  1024. package/src/duckdb/src/parser/transform/helpers/transform_orderby.cpp +31 -28
  1025. package/src/duckdb/src/parser/transform/statement/transform_alter_table.cpp +25 -27
  1026. package/src/duckdb/src/parser/transform/statement/transform_copy.cpp +1 -1
  1027. package/src/duckdb/src/parser/transform/statement/transform_create_function.cpp +53 -42
  1028. package/src/duckdb/src/parser/transform/statement/transform_create_table.cpp +6 -6
  1029. package/src/duckdb/src/parser/transform/statement/transform_create_table_as.cpp +1 -1
  1030. package/src/duckdb/src/parser/transform/statement/transform_create_type.cpp +1 -1
  1031. package/src/duckdb/src/parser/transform/statement/transform_create_view.cpp +1 -1
  1032. package/src/duckdb/src/parser/transform/statement/transform_explain.cpp +38 -3
  1033. package/src/duckdb/src/parser/transform/statement/transform_insert.cpp +1 -2
  1034. package/src/duckdb/src/parser/transform/statement/transform_pivot_stmt.cpp +1 -1
  1035. package/src/duckdb/src/parser/transform/statement/transform_prepare.cpp +1 -1
  1036. package/src/duckdb/src/parser/transform/statement/transform_select.cpp +26 -21
  1037. package/src/duckdb/src/parser/transform/statement/transform_set.cpp +8 -8
  1038. package/src/duckdb/src/parser/transform/statement/transform_show.cpp +5 -2
  1039. package/src/duckdb/src/parser/transform/statement/transform_show_select.cpp +6 -4
  1040. package/src/duckdb/src/parser/transform/statement/transform_transaction.cpp +27 -6
  1041. package/src/duckdb/src/parser/transform/statement/transform_update.cpp +8 -9
  1042. package/src/duckdb/src/parser/transform/statement/transform_upsert.cpp +11 -12
  1043. package/src/duckdb/src/parser/transform/statement/transform_vacuum.cpp +3 -3
  1044. package/src/duckdb/src/parser/transform/tableref/transform_join.cpp +16 -10
  1045. package/src/duckdb/src/parser/transform/tableref/transform_pivot.cpp +1 -1
  1046. package/src/duckdb/src/parser/transform/tableref/transform_subquery.cpp +1 -1
  1047. package/src/duckdb/src/parser/transformer.cpp +11 -7
  1048. package/src/duckdb/src/planner/bind_context.cpp +3 -3
  1049. package/src/duckdb/src/planner/binder/expression/bind_aggregate_expression.cpp +22 -7
  1050. package/src/duckdb/src/planner/binder/expression/bind_between_expression.cpp +3 -3
  1051. package/src/duckdb/src/planner/binder/expression/bind_collate_expression.cpp +3 -2
  1052. package/src/duckdb/src/planner/binder/expression/bind_columnref_expression.cpp +11 -4
  1053. package/src/duckdb/src/planner/binder/expression/bind_comparison_expression.cpp +9 -54
  1054. package/src/duckdb/src/planner/binder/expression/bind_function_expression.cpp +3 -5
  1055. package/src/duckdb/src/planner/binder/expression/bind_macro_expression.cpp +24 -27
  1056. package/src/duckdb/src/planner/binder/expression/bind_operator_expression.cpp +7 -7
  1057. package/src/duckdb/src/planner/binder/expression/bind_parameter_expression.cpp +9 -2
  1058. package/src/duckdb/src/planner/binder/expression/bind_star_expression.cpp +26 -7
  1059. package/src/duckdb/src/planner/binder/expression/bind_unnest_expression.cpp +5 -0
  1060. package/src/duckdb/src/planner/binder/expression/bind_unpacked_star_expression.cpp +91 -0
  1061. package/src/duckdb/src/planner/binder/expression/bind_window_expression.cpp +2 -2
  1062. package/src/duckdb/src/planner/binder/query_node/bind_select_node.cpp +11 -8
  1063. package/src/duckdb/src/planner/binder/query_node/bind_setop_node.cpp +1 -1
  1064. package/src/duckdb/src/planner/binder/query_node/bind_table_macro_node.cpp +6 -10
  1065. package/src/duckdb/src/planner/binder/query_node/plan_cte_node.cpp +14 -10
  1066. package/src/duckdb/src/planner/binder/query_node/plan_setop.cpp +3 -3
  1067. package/src/duckdb/src/planner/binder/query_node/plan_subquery.cpp +46 -7
  1068. package/src/duckdb/src/planner/binder/statement/bind_call.cpp +13 -20
  1069. package/src/duckdb/src/planner/binder/statement/bind_copy.cpp +105 -13
  1070. package/src/duckdb/src/planner/binder/statement/bind_copy_database.cpp +7 -3
  1071. package/src/duckdb/src/planner/binder/statement/bind_create.cpp +75 -55
  1072. package/src/duckdb/src/planner/binder/statement/bind_create_table.cpp +1 -1
  1073. package/src/duckdb/src/planner/binder/statement/bind_delete.cpp +5 -4
  1074. package/src/duckdb/src/planner/binder/statement/bind_drop.cpp +2 -2
  1075. package/src/duckdb/src/planner/binder/statement/bind_execute.cpp +24 -8
  1076. package/src/duckdb/src/planner/binder/statement/bind_explain.cpp +2 -2
  1077. package/src/duckdb/src/planner/binder/statement/bind_export.cpp +5 -105
  1078. package/src/duckdb/src/planner/binder/statement/bind_extension.cpp +2 -2
  1079. package/src/duckdb/src/planner/binder/statement/bind_insert.cpp +109 -41
  1080. package/src/duckdb/src/planner/binder/statement/bind_set.cpp +23 -7
  1081. package/src/duckdb/src/planner/binder/statement/bind_simple.cpp +4 -1
  1082. package/src/duckdb/src/planner/binder/statement/bind_summarize.cpp +17 -3
  1083. package/src/duckdb/src/planner/binder/statement/bind_update.cpp +5 -4
  1084. package/src/duckdb/src/planner/binder/statement/bind_vacuum.cpp +8 -6
  1085. package/src/duckdb/src/planner/binder/tableref/bind_basetableref.cpp +55 -42
  1086. package/src/duckdb/src/planner/binder/tableref/bind_column_data_ref.cpp +3 -2
  1087. package/src/duckdb/src/planner/binder/tableref/bind_delimgetref.cpp +16 -0
  1088. package/src/duckdb/src/planner/binder/tableref/bind_joinref.cpp +31 -1
  1089. package/src/duckdb/src/planner/binder/tableref/bind_pivot.cpp +6 -0
  1090. package/src/duckdb/src/planner/binder/tableref/bind_showref.cpp +2 -0
  1091. package/src/duckdb/src/planner/binder/tableref/bind_table_function.cpp +106 -46
  1092. package/src/duckdb/src/planner/binder/tableref/plan_delimgetref.cpp +11 -0
  1093. package/src/duckdb/src/planner/binder/tableref/plan_joinref.cpp +15 -2
  1094. package/src/duckdb/src/planner/binder/tableref/plan_table_function.cpp +4 -0
  1095. package/src/duckdb/src/planner/binder.cpp +172 -15
  1096. package/src/duckdb/src/planner/collation_binding.cpp +99 -0
  1097. package/src/duckdb/src/planner/expression/bound_aggregate_expression.cpp +10 -4
  1098. package/src/duckdb/src/planner/expression/bound_between_expression.cpp +1 -1
  1099. package/src/duckdb/src/planner/expression/bound_case_expression.cpp +1 -1
  1100. package/src/duckdb/src/planner/expression/bound_cast_expression.cpp +14 -12
  1101. package/src/duckdb/src/planner/expression/bound_columnref_expression.cpp +1 -1
  1102. package/src/duckdb/src/planner/expression/bound_comparison_expression.cpp +1 -1
  1103. package/src/duckdb/src/planner/expression/bound_conjunction_expression.cpp +1 -1
  1104. package/src/duckdb/src/planner/expression/bound_constant_expression.cpp +1 -1
  1105. package/src/duckdb/src/planner/expression/bound_expanded_expression.cpp +1 -1
  1106. package/src/duckdb/src/planner/expression/bound_function_expression.cpp +8 -2
  1107. package/src/duckdb/src/planner/expression/bound_lambda_expression.cpp +1 -1
  1108. package/src/duckdb/src/planner/expression/bound_lambdaref_expression.cpp +1 -1
  1109. package/src/duckdb/src/planner/expression/bound_operator_expression.cpp +1 -1
  1110. package/src/duckdb/src/planner/expression/bound_parameter_expression.cpp +1 -1
  1111. package/src/duckdb/src/planner/expression/bound_reference_expression.cpp +1 -1
  1112. package/src/duckdb/src/planner/expression/bound_subquery_expression.cpp +1 -1
  1113. package/src/duckdb/src/planner/expression/bound_unnest_expression.cpp +1 -1
  1114. package/src/duckdb/src/planner/expression/bound_window_expression.cpp +6 -6
  1115. package/src/duckdb/src/planner/expression_binder/aggregate_binder.cpp +1 -1
  1116. package/src/duckdb/src/planner/expression_binder/alter_binder.cpp +2 -2
  1117. package/src/duckdb/src/planner/expression_binder/base_select_binder.cpp +1 -1
  1118. package/src/duckdb/src/planner/expression_binder/column_alias_binder.cpp +7 -0
  1119. package/src/duckdb/src/planner/expression_binder/constant_binder.cpp +3 -3
  1120. package/src/duckdb/src/planner/expression_binder/group_binder.cpp +26 -22
  1121. package/src/duckdb/src/planner/expression_binder/having_binder.cpp +7 -1
  1122. package/src/duckdb/src/planner/expression_binder/index_binder.cpp +2 -2
  1123. package/src/duckdb/src/planner/expression_binder/insert_binder.cpp +2 -2
  1124. package/src/duckdb/src/planner/expression_binder/lateral_binder.cpp +2 -2
  1125. package/src/duckdb/src/planner/expression_binder/order_binder.cpp +61 -43
  1126. package/src/duckdb/src/planner/expression_binder/qualify_binder.cpp +2 -2
  1127. package/src/duckdb/src/planner/expression_binder/relation_binder.cpp +4 -4
  1128. package/src/duckdb/src/planner/expression_binder/returning_binder.cpp +3 -2
  1129. package/src/duckdb/src/planner/expression_binder/table_function_binder.cpp +10 -3
  1130. package/src/duckdb/src/planner/expression_binder/update_binder.cpp +1 -1
  1131. package/src/duckdb/src/planner/expression_binder/where_binder.cpp +9 -2
  1132. package/src/duckdb/src/planner/expression_binder.cpp +121 -21
  1133. package/src/duckdb/src/planner/expression_iterator.cpp +26 -1
  1134. package/src/duckdb/src/planner/filter/conjunction_filter.cpp +33 -0
  1135. package/src/duckdb/src/planner/filter/constant_filter.cpp +15 -0
  1136. package/src/duckdb/src/planner/filter/null_filter.cpp +22 -0
  1137. package/src/duckdb/src/planner/filter/struct_filter.cpp +16 -0
  1138. package/src/duckdb/src/planner/logical_operator.cpp +24 -7
  1139. package/src/duckdb/src/planner/operator/logical_aggregate.cpp +13 -7
  1140. package/src/duckdb/src/planner/operator/logical_any_join.cpp +5 -2
  1141. package/src/duckdb/src/planner/operator/logical_comparison_join.cpp +13 -5
  1142. package/src/duckdb/src/planner/operator/logical_copy_to_file.cpp +64 -8
  1143. package/src/duckdb/src/planner/operator/logical_cteref.cpp +7 -0
  1144. package/src/duckdb/src/planner/operator/logical_distinct.cpp +6 -5
  1145. package/src/duckdb/src/planner/operator/logical_get.cpp +60 -18
  1146. package/src/duckdb/src/planner/operator/logical_materialized_cte.cpp +7 -0
  1147. package/src/duckdb/src/planner/operator/logical_order.cpp +7 -4
  1148. package/src/duckdb/src/planner/operator/logical_top_n.cpp +2 -2
  1149. package/src/duckdb/src/planner/operator/logical_vacuum.cpp +1 -1
  1150. package/src/duckdb/src/planner/planner.cpp +2 -3
  1151. package/src/duckdb/src/planner/subquery/flatten_dependent_join.cpp +27 -10
  1152. package/src/duckdb/src/planner/table_filter.cpp +51 -0
  1153. package/src/duckdb/src/storage/arena_allocator.cpp +28 -10
  1154. package/src/duckdb/src/storage/block.cpp +3 -2
  1155. package/src/duckdb/src/storage/buffer/block_handle.cpp +29 -14
  1156. package/src/duckdb/src/storage/buffer/block_manager.cpp +6 -5
  1157. package/src/duckdb/src/storage/buffer/buffer_handle.cpp +1 -1
  1158. package/src/duckdb/src/storage/buffer/buffer_pool.cpp +264 -125
  1159. package/src/duckdb/src/storage/buffer_manager.cpp +5 -1
  1160. package/src/duckdb/src/storage/checkpoint/row_group_writer.cpp +0 -6
  1161. package/src/duckdb/src/storage/checkpoint/table_data_writer.cpp +26 -3
  1162. package/src/duckdb/src/storage/checkpoint/write_overflow_strings_to_disk.cpp +21 -9
  1163. package/src/duckdb/src/storage/checkpoint_manager.cpp +49 -24
  1164. package/src/duckdb/src/storage/compression/alp/alp.cpp +6 -11
  1165. package/src/duckdb/src/storage/compression/alprd.cpp +5 -9
  1166. package/src/duckdb/src/storage/compression/bitpacking.cpp +35 -31
  1167. package/src/duckdb/src/storage/compression/chimp/chimp.cpp +6 -8
  1168. package/src/duckdb/src/storage/compression/dictionary_compression.cpp +71 -58
  1169. package/src/duckdb/src/storage/compression/fixed_size_uncompressed.cpp +15 -13
  1170. package/src/duckdb/src/storage/compression/fsst.cpp +66 -53
  1171. package/src/duckdb/src/storage/compression/numeric_constant.cpp +4 -5
  1172. package/src/duckdb/src/storage/compression/patas.cpp +6 -17
  1173. package/src/duckdb/src/storage/compression/rle.cpp +20 -18
  1174. package/src/duckdb/src/storage/compression/string_uncompressed.cpp +71 -52
  1175. package/src/duckdb/src/storage/compression/uncompressed.cpp +2 -2
  1176. package/src/duckdb/src/storage/compression/validity_uncompressed.cpp +8 -7
  1177. package/src/duckdb/src/storage/data_pointer.cpp +22 -0
  1178. package/src/duckdb/src/storage/data_table.cpp +41 -12
  1179. package/src/duckdb/src/storage/local_storage.cpp +22 -8
  1180. package/src/duckdb/src/storage/metadata/metadata_manager.cpp +33 -17
  1181. package/src/duckdb/src/storage/metadata/metadata_reader.cpp +4 -4
  1182. package/src/duckdb/src/storage/metadata/metadata_writer.cpp +3 -3
  1183. package/src/duckdb/src/storage/partial_block_manager.cpp +19 -8
  1184. package/src/duckdb/src/storage/serialization/serialize_create_info.cpp +11 -8
  1185. package/src/duckdb/src/storage/serialization/serialize_expression.cpp +1 -1
  1186. package/src/duckdb/src/storage/serialization/serialize_extension_install_info.cpp +2 -0
  1187. package/src/duckdb/src/storage/serialization/serialize_logical_operator.cpp +3 -3
  1188. package/src/duckdb/src/storage/serialization/serialize_nodes.cpp +19 -5
  1189. package/src/duckdb/src/storage/serialization/serialize_parse_info.cpp +21 -1
  1190. package/src/duckdb/src/storage/serialization/serialize_parsed_expression.cpp +4 -2
  1191. package/src/duckdb/src/storage/serialization/serialize_query_node.cpp +2 -2
  1192. package/src/duckdb/src/storage/serialization/serialize_storage.cpp +2 -0
  1193. package/src/duckdb/src/storage/serialization/serialize_tableref.cpp +8 -4
  1194. package/src/duckdb/src/storage/serialization/serialize_types.cpp +4 -4
  1195. package/src/duckdb/src/storage/single_file_block_manager.cpp +170 -34
  1196. package/src/duckdb/src/storage/standard_buffer_manager.cpp +221 -64
  1197. package/src/duckdb/src/storage/statistics/column_statistics.cpp +4 -3
  1198. package/src/duckdb/src/storage/statistics/distinct_statistics.cpp +36 -26
  1199. package/src/duckdb/src/storage/statistics/numeric_stats.cpp +4 -15
  1200. package/src/duckdb/src/storage/statistics/string_stats.cpp +14 -8
  1201. package/src/duckdb/src/storage/statistics/struct_stats.cpp +2 -1
  1202. package/src/duckdb/src/storage/storage_info.cpp +34 -9
  1203. package/src/duckdb/src/storage/storage_manager.cpp +147 -74
  1204. package/src/duckdb/src/storage/table/array_column_data.cpp +37 -17
  1205. package/src/duckdb/src/storage/table/chunk_info.cpp +38 -0
  1206. package/src/duckdb/src/storage/table/column_checkpoint_state.cpp +10 -6
  1207. package/src/duckdb/src/storage/table/column_data.cpp +252 -31
  1208. package/src/duckdb/src/storage/table/column_data_checkpointer.cpp +2 -12
  1209. package/src/duckdb/src/storage/table/column_segment.cpp +63 -34
  1210. package/src/duckdb/src/storage/table/list_column_data.cpp +34 -15
  1211. package/src/duckdb/src/storage/table/row_group.cpp +228 -120
  1212. package/src/duckdb/src/storage/table/row_group_collection.cpp +122 -120
  1213. package/src/duckdb/src/storage/table/row_version_manager.cpp +27 -1
  1214. package/src/duckdb/src/storage/table/scan_state.cpp +101 -18
  1215. package/src/duckdb/src/storage/table/standard_column_data.cpp +20 -34
  1216. package/src/duckdb/src/storage/table/struct_column_data.cpp +39 -42
  1217. package/src/duckdb/src/storage/table/table_statistics.cpp +2 -1
  1218. package/src/duckdb/src/storage/table/update_segment.cpp +9 -8
  1219. package/src/duckdb/src/storage/table/validity_column_data.cpp +2 -2
  1220. package/src/duckdb/src/storage/table_index_list.cpp +8 -7
  1221. package/src/duckdb/src/storage/temporary_file_manager.cpp +11 -9
  1222. package/src/duckdb/src/storage/temporary_memory_manager.cpp +227 -39
  1223. package/src/duckdb/src/storage/wal_replay.cpp +68 -28
  1224. package/src/duckdb/src/storage/write_ahead_log.cpp +56 -47
  1225. package/src/duckdb/src/transaction/cleanup_state.cpp +9 -1
  1226. package/src/duckdb/src/transaction/commit_state.cpp +7 -170
  1227. package/src/duckdb/src/transaction/duck_transaction.cpp +87 -19
  1228. package/src/duckdb/src/transaction/duck_transaction_manager.cpp +65 -10
  1229. package/src/duckdb/src/transaction/meta_transaction.cpp +18 -3
  1230. package/src/duckdb/src/transaction/transaction_context.cpp +21 -17
  1231. package/src/duckdb/src/transaction/undo_buffer.cpp +20 -14
  1232. package/src/duckdb/src/transaction/wal_write_state.cpp +292 -0
  1233. package/src/duckdb/src/verification/prepared_statement_verifier.cpp +0 -1
  1234. package/src/duckdb/third_party/brotli/common/brotli_constants.h +204 -0
  1235. package/src/duckdb/third_party/brotli/common/brotli_platform.h +543 -0
  1236. package/src/duckdb/third_party/brotli/common/constants.cpp +17 -0
  1237. package/src/duckdb/third_party/brotli/common/context.cpp +156 -0
  1238. package/src/duckdb/third_party/brotli/common/context.h +110 -0
  1239. package/src/duckdb/third_party/brotli/common/dictionary.cpp +5912 -0
  1240. package/src/duckdb/third_party/brotli/common/dictionary.h +60 -0
  1241. package/src/duckdb/third_party/brotli/common/platform.cpp +24 -0
  1242. package/src/duckdb/third_party/brotli/common/shared_dictionary.cpp +517 -0
  1243. package/src/duckdb/third_party/brotli/common/shared_dictionary_internal.h +71 -0
  1244. package/src/duckdb/third_party/brotli/common/transform.cpp +287 -0
  1245. package/src/duckdb/third_party/brotli/common/transform.h +77 -0
  1246. package/src/duckdb/third_party/brotli/common/version.h +51 -0
  1247. package/src/duckdb/third_party/brotli/dec/bit_reader.cpp +74 -0
  1248. package/src/duckdb/third_party/brotli/dec/bit_reader.h +419 -0
  1249. package/src/duckdb/third_party/brotli/dec/decode.cpp +2758 -0
  1250. package/src/duckdb/third_party/brotli/dec/huffman.cpp +338 -0
  1251. package/src/duckdb/third_party/brotli/dec/huffman.h +118 -0
  1252. package/src/duckdb/third_party/brotli/dec/prefix.h +733 -0
  1253. package/src/duckdb/third_party/brotli/dec/state.cpp +178 -0
  1254. package/src/duckdb/third_party/brotli/dec/state.h +386 -0
  1255. package/src/duckdb/third_party/brotli/enc/backward_references.cpp +3775 -0
  1256. package/src/duckdb/third_party/brotli/enc/backward_references.h +36 -0
  1257. package/src/duckdb/third_party/brotli/enc/backward_references_hq.cpp +935 -0
  1258. package/src/duckdb/third_party/brotli/enc/backward_references_hq.h +92 -0
  1259. package/src/duckdb/third_party/brotli/enc/bit_cost.cpp +410 -0
  1260. package/src/duckdb/third_party/brotli/enc/bit_cost.h +60 -0
  1261. package/src/duckdb/third_party/brotli/enc/block_splitter.cpp +1653 -0
  1262. package/src/duckdb/third_party/brotli/enc/block_splitter.h +48 -0
  1263. package/src/duckdb/third_party/brotli/enc/brotli_bit_stream.cpp +1431 -0
  1264. package/src/duckdb/third_party/brotli/enc/brotli_bit_stream.h +85 -0
  1265. package/src/duckdb/third_party/brotli/enc/brotli_hash.h +4352 -0
  1266. package/src/duckdb/third_party/brotli/enc/brotli_params.h +47 -0
  1267. package/src/duckdb/third_party/brotli/enc/cluster.cpp +1025 -0
  1268. package/src/duckdb/third_party/brotli/enc/cluster.h +1017 -0
  1269. package/src/duckdb/third_party/brotli/enc/command.cpp +24 -0
  1270. package/src/duckdb/third_party/brotli/enc/command.h +187 -0
  1271. package/src/duckdb/third_party/brotli/enc/compound_dictionary.cpp +209 -0
  1272. package/src/duckdb/third_party/brotli/enc/compound_dictionary.h +75 -0
  1273. package/src/duckdb/third_party/brotli/enc/compress_fragment.cpp +796 -0
  1274. package/src/duckdb/third_party/brotli/enc/compress_fragment.h +82 -0
  1275. package/src/duckdb/third_party/brotli/enc/compress_fragment_two_pass.cpp +653 -0
  1276. package/src/duckdb/third_party/brotli/enc/compress_fragment_two_pass.h +68 -0
  1277. package/src/duckdb/third_party/brotli/enc/dictionary_hash.cpp +1844 -0
  1278. package/src/duckdb/third_party/brotli/enc/dictionary_hash.h +21 -0
  1279. package/src/duckdb/third_party/brotli/enc/encode.cpp +1990 -0
  1280. package/src/duckdb/third_party/brotli/enc/encoder_dict.cpp +636 -0
  1281. package/src/duckdb/third_party/brotli/enc/encoder_dict.h +153 -0
  1282. package/src/duckdb/third_party/brotli/enc/entropy_encode.cpp +500 -0
  1283. package/src/duckdb/third_party/brotli/enc/entropy_encode.h +119 -0
  1284. package/src/duckdb/third_party/brotli/enc/entropy_encode_static.h +538 -0
  1285. package/src/duckdb/third_party/brotli/enc/fast_log.cpp +101 -0
  1286. package/src/duckdb/third_party/brotli/enc/fast_log.h +63 -0
  1287. package/src/duckdb/third_party/brotli/enc/find_match_length.h +68 -0
  1288. package/src/duckdb/third_party/brotli/enc/histogram.cpp +96 -0
  1289. package/src/duckdb/third_party/brotli/enc/histogram.h +210 -0
  1290. package/src/duckdb/third_party/brotli/enc/literal_cost.cpp +176 -0
  1291. package/src/duckdb/third_party/brotli/enc/literal_cost.h +28 -0
  1292. package/src/duckdb/third_party/brotli/enc/memory.cpp +190 -0
  1293. package/src/duckdb/third_party/brotli/enc/memory.h +127 -0
  1294. package/src/duckdb/third_party/brotli/enc/metablock.cpp +1225 -0
  1295. package/src/duckdb/third_party/brotli/enc/metablock.h +102 -0
  1296. package/src/duckdb/third_party/brotli/enc/prefix.h +50 -0
  1297. package/src/duckdb/third_party/brotli/enc/quality.h +202 -0
  1298. package/src/duckdb/third_party/brotli/enc/ringbuffer.h +164 -0
  1299. package/src/duckdb/third_party/brotli/enc/state.h +106 -0
  1300. package/src/duckdb/third_party/brotli/enc/static_dict.cpp +538 -0
  1301. package/src/duckdb/third_party/brotli/enc/static_dict.h +37 -0
  1302. package/src/duckdb/third_party/brotli/enc/static_dict_lut.h +5862 -0
  1303. package/src/duckdb/third_party/brotli/enc/utf8_util.cpp +81 -0
  1304. package/src/duckdb/third_party/brotli/enc/utf8_util.h +29 -0
  1305. package/src/duckdb/third_party/brotli/enc/write_bits.h +84 -0
  1306. package/src/duckdb/third_party/brotli/include/brotli/decode.h +405 -0
  1307. package/src/duckdb/third_party/brotli/include/brotli/encode.h +489 -0
  1308. package/src/duckdb/third_party/brotli/include/brotli/port.h +238 -0
  1309. package/src/duckdb/third_party/brotli/include/brotli/shared_dictionary.h +96 -0
  1310. package/src/duckdb/third_party/brotli/include/brotli/types.h +83 -0
  1311. package/src/duckdb/third_party/fast_float/fast_float/fast_float.h +20 -4
  1312. package/src/duckdb/third_party/fmt/include/fmt/format.h +54 -10
  1313. package/src/duckdb/third_party/fsst/fsst.h +2 -2
  1314. package/src/duckdb/third_party/fsst/libfsst.hpp +2 -2
  1315. package/src/duckdb/third_party/httplib/httplib.hpp +6763 -5580
  1316. package/src/duckdb/third_party/hyperloglog/hyperloglog.cpp +13 -30
  1317. package/src/duckdb/third_party/hyperloglog/hyperloglog.hpp +8 -2
  1318. package/src/duckdb/third_party/libpg_query/include/nodes/nodes.hpp +1 -0
  1319. package/src/duckdb/third_party/libpg_query/include/nodes/parsenodes.hpp +22 -9
  1320. package/src/duckdb/third_party/libpg_query/include/parser/gram.hpp +1041 -554
  1321. package/src/duckdb/third_party/libpg_query/include/parser/kwlist.hpp +1 -0
  1322. package/src/duckdb/third_party/libpg_query/postgres_parser.cpp +2 -1
  1323. package/src/duckdb/third_party/libpg_query/src_backend_parser_gram.cpp +21605 -21752
  1324. package/src/duckdb/third_party/libpg_query/src_backend_parser_scan.cpp +538 -299
  1325. package/src/duckdb/third_party/mbedtls/include/mbedtls/mbedtls_config.h +1 -0
  1326. package/src/duckdb/third_party/mbedtls/include/mbedtls_wrapper.hpp +36 -12
  1327. package/src/duckdb/third_party/mbedtls/library/md.cpp +6 -6
  1328. package/src/duckdb/third_party/mbedtls/library/sha1.cpp +2 -0
  1329. package/src/duckdb/third_party/mbedtls/library/sha256.cpp +3 -0
  1330. package/src/duckdb/third_party/mbedtls/mbedtls_wrapper.cpp +99 -47
  1331. package/src/duckdb/third_party/pcg/pcg_extras.hpp +1 -1
  1332. package/src/duckdb/third_party/re2/re2/prog.cc +2 -2
  1333. package/src/duckdb/third_party/snappy/snappy-internal.h +398 -0
  1334. package/src/duckdb/third_party/snappy/snappy-sinksource.cc +111 -9
  1335. package/src/duckdb/third_party/snappy/snappy-sinksource.h +158 -0
  1336. package/src/duckdb/third_party/snappy/snappy-stubs-internal.h +523 -3
  1337. package/src/duckdb/third_party/snappy/snappy-stubs-public.h +34 -1
  1338. package/src/duckdb/third_party/snappy/snappy.cc +2626 -0
  1339. package/src/duckdb/third_party/snappy/snappy.h +223 -0
  1340. package/src/duckdb/third_party/snappy/snappy_version.hpp +11 -0
  1341. package/src/duckdb/third_party/utf8proc/include/utf8proc.hpp +69 -101
  1342. package/src/duckdb/third_party/utf8proc/include/utf8proc_wrapper.hpp +53 -0
  1343. package/src/duckdb/third_party/utf8proc/utf8proc.cpp +627 -678
  1344. package/src/duckdb/third_party/utf8proc/utf8proc_data.cpp +15008 -12868
  1345. package/src/duckdb/third_party/utf8proc/utf8proc_wrapper.cpp +185 -29
  1346. package/src/duckdb/ub_extension_json_json_functions.cpp +6 -0
  1347. package/src/duckdb/ub_src_catalog_default.cpp +4 -0
  1348. package/src/duckdb/ub_src_common.cpp +7 -1
  1349. package/src/duckdb/ub_src_common_arrow.cpp +10 -0
  1350. package/src/duckdb/ub_src_common_enums.cpp +2 -0
  1351. package/src/duckdb/ub_src_common_tree_renderer.cpp +10 -0
  1352. package/src/duckdb/ub_src_common_types.cpp +2 -0
  1353. package/src/duckdb/ub_src_core_functions_aggregate_holistic.cpp +4 -0
  1354. package/src/duckdb/ub_src_core_functions_aggregate_nested.cpp +2 -0
  1355. package/src/duckdb/ub_src_core_functions_scalar_generic.cpp +2 -0
  1356. package/src/duckdb/ub_src_core_functions_scalar_list.cpp +2 -4
  1357. package/src/duckdb/ub_src_core_functions_scalar_map.cpp +2 -0
  1358. package/src/duckdb/ub_src_core_functions_scalar_string.cpp +4 -0
  1359. package/src/duckdb/ub_src_execution_index_art.cpp +5 -3
  1360. package/src/duckdb/ub_src_execution_operator_csv_scanner_scanner.cpp +2 -0
  1361. package/src/duckdb/ub_src_execution_operator_helper.cpp +4 -0
  1362. package/src/duckdb/ub_src_function.cpp +4 -0
  1363. package/src/duckdb/ub_src_function_cast.cpp +2 -0
  1364. package/src/duckdb/ub_src_function_scalar_generic.cpp +4 -0
  1365. package/src/duckdb/ub_src_function_scalar_list.cpp +0 -2
  1366. package/src/duckdb/ub_src_function_scalar_string.cpp +2 -0
  1367. package/src/duckdb/ub_src_function_table.cpp +2 -0
  1368. package/src/duckdb/ub_src_function_table_arrow.cpp +2 -0
  1369. package/src/duckdb/ub_src_function_table_system.cpp +2 -0
  1370. package/src/duckdb/ub_src_main.cpp +4 -0
  1371. package/src/duckdb/ub_src_main_buffered_data.cpp +4 -0
  1372. package/src/duckdb/ub_src_main_capi.cpp +10 -0
  1373. package/src/duckdb/ub_src_main_chunk_scan_state.cpp +2 -0
  1374. package/src/duckdb/ub_src_main_relation.cpp +2 -0
  1375. package/src/duckdb/ub_src_main_secret.cpp +2 -0
  1376. package/src/duckdb/ub_src_optimizer.cpp +8 -0
  1377. package/src/duckdb/ub_src_optimizer_compressed_materialization.cpp +2 -0
  1378. package/src/duckdb/ub_src_optimizer_pushdown.cpp +2 -0
  1379. package/src/duckdb/ub_src_optimizer_rule.cpp +2 -0
  1380. package/src/duckdb/ub_src_parallel.cpp +4 -0
  1381. package/src/duckdb/ub_src_parser_tableref.cpp +2 -0
  1382. package/src/duckdb/ub_src_planner.cpp +2 -0
  1383. package/src/duckdb/ub_src_planner_binder_expression.cpp +2 -0
  1384. package/src/duckdb/ub_src_planner_binder_tableref.cpp +4 -0
  1385. package/src/duckdb/ub_src_storage_statistics.cpp +0 -2
  1386. package/src/duckdb/ub_src_transaction.cpp +2 -0
  1387. package/test/columns.test.ts +1 -1
  1388. package/test/prepare.test.ts +1 -1
  1389. package/test/test_all_types.test.ts +1 -1
@@ -0,0 +1,1225 @@
1
+ /* Copyright 2015 Google Inc. All Rights Reserved.
2
+
3
+ Distributed under MIT license.
4
+ See file LICENSE for detail or copy at https://opensource.org/licenses/MIT
5
+ */
6
+
7
+ /* Algorithms for distributing the literals and commands of a metablock between
8
+ block types and contexts. */
9
+
10
+ #include "metablock.h"
11
+
12
+ #include <brotli/types.h>
13
+
14
+ #include "../common/brotli_constants.h"
15
+ #include "../common/context.h"
16
+ #include "../common/brotli_platform.h"
17
+ #include "bit_cost.h"
18
+ #include "block_splitter.h"
19
+ #include "cluster.h"
20
+ #include "entropy_encode.h"
21
+ #include "histogram.h"
22
+ #include "memory.h"
23
+ #include "quality.h"
24
+
25
+ using namespace duckdb_brotli;
26
+
27
+ void duckdb_brotli::BrotliInitDistanceParams(BrotliDistanceParams* dist_params,
28
+ uint32_t npostfix, uint32_t ndirect, BROTLI_BOOL large_window) {
29
+ uint32_t alphabet_size_max;
30
+ uint32_t alphabet_size_limit;
31
+ uint32_t max_distance;
32
+
33
+ dist_params->distance_postfix_bits = npostfix;
34
+ dist_params->num_direct_distance_codes = ndirect;
35
+
36
+ alphabet_size_max = BROTLI_DISTANCE_ALPHABET_SIZE(
37
+ npostfix, ndirect, BROTLI_MAX_DISTANCE_BITS);
38
+ alphabet_size_limit = alphabet_size_max;
39
+ max_distance = ndirect + (1U << (BROTLI_MAX_DISTANCE_BITS + npostfix + 2)) -
40
+ (1U << (npostfix + 2));
41
+
42
+ if (large_window) {
43
+ BrotliDistanceCodeLimit limit = BrotliCalculateDistanceCodeLimit(
44
+ BROTLI_MAX_ALLOWED_DISTANCE, npostfix, ndirect);
45
+ alphabet_size_max = BROTLI_DISTANCE_ALPHABET_SIZE(
46
+ npostfix, ndirect, BROTLI_LARGE_MAX_DISTANCE_BITS);
47
+ alphabet_size_limit = limit.max_alphabet_size;
48
+ max_distance = limit.max_distance;
49
+ }
50
+
51
+ dist_params->alphabet_size_max = alphabet_size_max;
52
+ dist_params->alphabet_size_limit = alphabet_size_limit;
53
+ dist_params->max_distance = max_distance;
54
+ }
55
+
56
+ static void RecomputeDistancePrefixes(Command* cmds,
57
+ size_t num_commands,
58
+ const BrotliDistanceParams* orig_params,
59
+ const BrotliDistanceParams* new_params) {
60
+ size_t i;
61
+
62
+ if (orig_params->distance_postfix_bits == new_params->distance_postfix_bits &&
63
+ orig_params->num_direct_distance_codes ==
64
+ new_params->num_direct_distance_codes) {
65
+ return;
66
+ }
67
+
68
+ for (i = 0; i < num_commands; ++i) {
69
+ Command* cmd = &cmds[i];
70
+ if (CommandCopyLen(cmd) && cmd->cmd_prefix_ >= 128) {
71
+ PrefixEncodeCopyDistance(CommandRestoreDistanceCode(cmd, orig_params),
72
+ new_params->num_direct_distance_codes,
73
+ new_params->distance_postfix_bits,
74
+ &cmd->dist_prefix_,
75
+ &cmd->dist_extra_);
76
+ }
77
+ }
78
+ }
79
+
80
+ static BROTLI_BOOL ComputeDistanceCost(const Command* cmds,
81
+ size_t num_commands,
82
+ const BrotliDistanceParams* orig_params,
83
+ const BrotliDistanceParams* new_params,
84
+ double* cost,
85
+ HistogramDistance* tmp) {
86
+ size_t i;
87
+ BROTLI_BOOL equal_params = BROTLI_FALSE;
88
+ uint16_t dist_prefix;
89
+ uint32_t dist_extra;
90
+ double extra_bits = 0.0;
91
+ HistogramClearDistance(tmp);
92
+
93
+ if (orig_params->distance_postfix_bits == new_params->distance_postfix_bits &&
94
+ orig_params->num_direct_distance_codes ==
95
+ new_params->num_direct_distance_codes) {
96
+ equal_params = BROTLI_TRUE;
97
+ }
98
+
99
+ for (i = 0; i < num_commands; i++) {
100
+ const Command* cmd = &cmds[i];
101
+ if (CommandCopyLen(cmd) && cmd->cmd_prefix_ >= 128) {
102
+ if (equal_params) {
103
+ dist_prefix = cmd->dist_prefix_;
104
+ } else {
105
+ uint32_t distance = CommandRestoreDistanceCode(cmd, orig_params);
106
+ if (distance > new_params->max_distance) {
107
+ return BROTLI_FALSE;
108
+ }
109
+ PrefixEncodeCopyDistance(distance,
110
+ new_params->num_direct_distance_codes,
111
+ new_params->distance_postfix_bits,
112
+ &dist_prefix,
113
+ &dist_extra);
114
+ }
115
+ HistogramAddDistance(tmp, dist_prefix & 0x3FF);
116
+ extra_bits += dist_prefix >> 10;
117
+ }
118
+ }
119
+
120
+ *cost = BrotliPopulationCostDistance(tmp) + extra_bits;
121
+ return BROTLI_TRUE;
122
+ }
123
+
124
+ void duckdb_brotli::BrotliBuildMetaBlock(MemoryManager* m,
125
+ const uint8_t* ringbuffer,
126
+ const size_t pos,
127
+ const size_t mask,
128
+ BrotliEncoderParams* params,
129
+ uint8_t prev_byte,
130
+ uint8_t prev_byte2,
131
+ Command* cmds,
132
+ size_t num_commands,
133
+ ContextType literal_context_mode,
134
+ MetaBlockSplit* mb) {
135
+ /* Histogram ids need to fit in one byte. */
136
+ static const size_t kMaxNumberOfHistograms = 256;
137
+ HistogramDistance* distance_histograms;
138
+ HistogramLiteral* literal_histograms;
139
+ ContextType* literal_context_modes = NULL;
140
+ size_t literal_histograms_size;
141
+ size_t distance_histograms_size;
142
+ size_t i;
143
+ size_t literal_context_multiplier = 1;
144
+ uint32_t npostfix;
145
+ uint32_t ndirect_msb = 0;
146
+ BROTLI_BOOL check_orig = BROTLI_TRUE;
147
+ double best_dist_cost = 1e99;
148
+ BrotliDistanceParams orig_params = params->dist;
149
+ BrotliDistanceParams new_params = params->dist;
150
+ HistogramDistance* tmp = BROTLI_ALLOC(m, HistogramDistance, 1);
151
+
152
+ if (BROTLI_IS_OOM(m) || BROTLI_IS_NULL(tmp)) return;
153
+
154
+ for (npostfix = 0; npostfix <= BROTLI_MAX_NPOSTFIX; npostfix++) {
155
+ for (; ndirect_msb < 16; ndirect_msb++) {
156
+ uint32_t ndirect = ndirect_msb << npostfix;
157
+ BROTLI_BOOL skip;
158
+ double dist_cost;
159
+ BrotliInitDistanceParams(&new_params, npostfix, ndirect,
160
+ params->large_window);
161
+ if (npostfix == orig_params.distance_postfix_bits &&
162
+ ndirect == orig_params.num_direct_distance_codes) {
163
+ check_orig = BROTLI_FALSE;
164
+ }
165
+ skip = !ComputeDistanceCost(
166
+ cmds, num_commands, &orig_params, &new_params, &dist_cost, tmp);
167
+ if (skip || (dist_cost > best_dist_cost)) {
168
+ break;
169
+ }
170
+ best_dist_cost = dist_cost;
171
+ params->dist = new_params;
172
+ }
173
+ if (ndirect_msb > 0) ndirect_msb--;
174
+ ndirect_msb /= 2;
175
+ }
176
+ if (check_orig) {
177
+ double dist_cost;
178
+ ComputeDistanceCost(cmds, num_commands, &orig_params, &orig_params,
179
+ &dist_cost, tmp);
180
+ if (dist_cost < best_dist_cost) {
181
+ /* NB: currently unused; uncomment when more param tuning is added. */
182
+ /* best_dist_cost = dist_cost; */
183
+ params->dist = orig_params;
184
+ }
185
+ }
186
+ BROTLI_FREE(m, tmp);
187
+ RecomputeDistancePrefixes(cmds, num_commands, &orig_params, &params->dist);
188
+
189
+ BrotliSplitBlock(m, cmds, num_commands,
190
+ ringbuffer, pos, mask, params,
191
+ &mb->literal_split,
192
+ &mb->command_split,
193
+ &mb->distance_split);
194
+ if (BROTLI_IS_OOM(m)) return;
195
+
196
+ if (!params->disable_literal_context_modeling) {
197
+ literal_context_multiplier = 1 << BROTLI_LITERAL_CONTEXT_BITS;
198
+ literal_context_modes =
199
+ BROTLI_ALLOC(m, ContextType, mb->literal_split.num_types);
200
+ if (BROTLI_IS_OOM(m) || BROTLI_IS_NULL(literal_context_modes)) return;
201
+ for (i = 0; i < mb->literal_split.num_types; ++i) {
202
+ literal_context_modes[i] = literal_context_mode;
203
+ }
204
+ }
205
+
206
+ literal_histograms_size =
207
+ mb->literal_split.num_types * literal_context_multiplier;
208
+ literal_histograms =
209
+ BROTLI_ALLOC(m, HistogramLiteral, literal_histograms_size);
210
+ if (BROTLI_IS_OOM(m) || BROTLI_IS_NULL(literal_histograms)) return;
211
+ ClearHistogramsLiteral(literal_histograms, literal_histograms_size);
212
+
213
+ distance_histograms_size =
214
+ mb->distance_split.num_types << BROTLI_DISTANCE_CONTEXT_BITS;
215
+ distance_histograms =
216
+ BROTLI_ALLOC(m, HistogramDistance, distance_histograms_size);
217
+ if (BROTLI_IS_OOM(m) || BROTLI_IS_NULL(distance_histograms)) return;
218
+ ClearHistogramsDistance(distance_histograms, distance_histograms_size);
219
+
220
+ BROTLI_DCHECK(mb->command_histograms == 0);
221
+ mb->command_histograms_size = mb->command_split.num_types;
222
+ mb->command_histograms =
223
+ BROTLI_ALLOC(m, HistogramCommand, mb->command_histograms_size);
224
+ if (BROTLI_IS_OOM(m) || BROTLI_IS_NULL(mb->command_histograms)) return;
225
+ ClearHistogramsCommand(mb->command_histograms, mb->command_histograms_size);
226
+
227
+ BrotliBuildHistogramsWithContext(cmds, num_commands,
228
+ &mb->literal_split, &mb->command_split, &mb->distance_split,
229
+ ringbuffer, pos, mask, prev_byte, prev_byte2, literal_context_modes,
230
+ literal_histograms, mb->command_histograms, distance_histograms);
231
+ BROTLI_FREE(m, literal_context_modes);
232
+
233
+ BROTLI_DCHECK(mb->literal_context_map == 0);
234
+ mb->literal_context_map_size =
235
+ mb->literal_split.num_types << BROTLI_LITERAL_CONTEXT_BITS;
236
+ mb->literal_context_map =
237
+ BROTLI_ALLOC(m, uint32_t, mb->literal_context_map_size);
238
+ if (BROTLI_IS_OOM(m) || BROTLI_IS_NULL(mb->literal_context_map)) return;
239
+
240
+ BROTLI_DCHECK(mb->literal_histograms == 0);
241
+ mb->literal_histograms_size = mb->literal_context_map_size;
242
+ mb->literal_histograms =
243
+ BROTLI_ALLOC(m, HistogramLiteral, mb->literal_histograms_size);
244
+ if (BROTLI_IS_OOM(m) || BROTLI_IS_NULL(mb->literal_histograms)) return;
245
+
246
+ BrotliClusterHistogramsLiteral(m, literal_histograms, literal_histograms_size,
247
+ kMaxNumberOfHistograms, mb->literal_histograms,
248
+ &mb->literal_histograms_size, mb->literal_context_map);
249
+ if (BROTLI_IS_OOM(m)) return;
250
+ BROTLI_FREE(m, literal_histograms);
251
+
252
+ if (params->disable_literal_context_modeling) {
253
+ /* Distribute assignment to all contexts. */
254
+ for (i = mb->literal_split.num_types; i != 0;) {
255
+ size_t j = 0;
256
+ i--;
257
+ for (; j < (1 << BROTLI_LITERAL_CONTEXT_BITS); j++) {
258
+ mb->literal_context_map[(i << BROTLI_LITERAL_CONTEXT_BITS) + j] =
259
+ mb->literal_context_map[i];
260
+ }
261
+ }
262
+ }
263
+
264
+ BROTLI_DCHECK(mb->distance_context_map == 0);
265
+ mb->distance_context_map_size =
266
+ mb->distance_split.num_types << BROTLI_DISTANCE_CONTEXT_BITS;
267
+ mb->distance_context_map =
268
+ BROTLI_ALLOC(m, uint32_t, mb->distance_context_map_size);
269
+ if (BROTLI_IS_OOM(m) || BROTLI_IS_NULL(mb->distance_context_map)) return;
270
+
271
+ BROTLI_DCHECK(mb->distance_histograms == 0);
272
+ mb->distance_histograms_size = mb->distance_context_map_size;
273
+ mb->distance_histograms =
274
+ BROTLI_ALLOC(m, HistogramDistance, mb->distance_histograms_size);
275
+ if (BROTLI_IS_OOM(m) || BROTLI_IS_NULL(mb->distance_histograms)) return;
276
+
277
+ BrotliClusterHistogramsDistance(m, distance_histograms,
278
+ mb->distance_context_map_size,
279
+ kMaxNumberOfHistograms,
280
+ mb->distance_histograms,
281
+ &mb->distance_histograms_size,
282
+ mb->distance_context_map);
283
+ if (BROTLI_IS_OOM(m)) return;
284
+ BROTLI_FREE(m, distance_histograms);
285
+ }
286
+
287
+ #define FN(X) X ## Literal
288
+ /* NOLINT(build/header_guard) */
289
+ /* Copyright 2015 Google Inc. All Rights Reserved.
290
+
291
+ Distributed under MIT license.
292
+ See file LICENSE for detail or copy at https://opensource.org/licenses/MIT
293
+ */
294
+
295
+ /* template parameters: FN (a macro that suffixes an identifier with the block category; defined above as X ## Literal, so FN(Foo) names FooLiteral) */
296
+ /* HistogramType below therefore expands to HistogramLiteral for this instantiation. */
297
+ #define HistogramType FN(Histogram)
298
+
299
+ /* Greedy block splitter for one block category (literal, command or distance).
300
+ */
301
+ typedef struct FN(BlockSplitter) {
302
+ /* Alphabet size of particular block category. */
303
+ size_t alphabet_size_;
304
+ /* We collect at least this many symbols for each block. */
305
+ size_t min_block_size_;
306
+ /* We merge histograms A and B if
307
+ entropy(A+B) < entropy(A) + entropy(B) + split_threshold_,
308
+ where A is the current histogram and B is the histogram of the last or the
309
+ second last block type. */
310
+ double split_threshold_;
311
+
312
+ size_t num_blocks_;
313
+ BlockSplit* split_; /* not owned */
314
+ HistogramType* histograms_; /* not owned */
315
+ size_t* histograms_size_; /* not owned */
316
+
317
+ /* Temporary storage for BlockSplitterFinishBlock. */
318
+ HistogramType combined_histo[2];
319
+
320
+ /* The number of symbols that we want to collect before deciding on whether
321
+ or not to merge the block with a previous one or emit a new block. */
322
+ size_t target_block_size_;
323
+ /* The number of symbols in the current histogram. */
324
+ size_t block_size_;
325
+ /* Offset of the current histogram. */
326
+ size_t curr_histogram_ix_;
327
+ /* Offset of the histograms of the previous two block types. */
328
+ size_t last_histogram_ix_[2];
329
+ /* Entropy of the previous two block types. */
330
+ double last_entropy_[2];
331
+ /* The number of times we merged the current block with the last one. */
332
+ size_t merge_last_count_;
333
+ } FN(BlockSplitter);
334
+
335
+ static void FN(InitBlockSplitter)(
336
+ MemoryManager* m, FN(BlockSplitter)* self, size_t alphabet_size,
337
+ size_t min_block_size, double split_threshold, size_t num_symbols,
338
+ BlockSplit* split, HistogramType** histograms, size_t* histograms_size) {
339
+ size_t max_num_blocks = num_symbols / min_block_size + 1;
340
+ /* We have to allocate one more histogram than the maximum number of block
341
+ types for the current histogram when the meta-block is too big. */
342
+ size_t max_num_types =
343
+ BROTLI_MIN(size_t, max_num_blocks, BROTLI_MAX_NUMBER_OF_BLOCK_TYPES + 1);
344
+ self->alphabet_size_ = alphabet_size;
345
+ self->min_block_size_ = min_block_size;
346
+ self->split_threshold_ = split_threshold;
347
+ self->num_blocks_ = 0;
348
+ self->split_ = split;
349
+ self->histograms_size_ = histograms_size;
350
+ self->target_block_size_ = min_block_size;
351
+ self->block_size_ = 0;
352
+ self->curr_histogram_ix_ = 0;
353
+ self->merge_last_count_ = 0;
354
+ BROTLI_ENSURE_CAPACITY(m, uint8_t,
355
+ split->types, split->types_alloc_size, max_num_blocks);
356
+ BROTLI_ENSURE_CAPACITY(m, uint32_t,
357
+ split->lengths, split->lengths_alloc_size, max_num_blocks);
358
+ if (BROTLI_IS_OOM(m)) return;
359
+ self->split_->num_blocks = max_num_blocks;
360
+ BROTLI_DCHECK(*histograms == 0);
361
+ *histograms_size = max_num_types;
362
+ *histograms = BROTLI_ALLOC(m, HistogramType, *histograms_size);
363
+ self->histograms_ = *histograms;
364
+ if (BROTLI_IS_OOM(m) || BROTLI_IS_NULL(*histograms)) return;
365
+ /* Clear only current histogram. */
366
+ FN(HistogramClear)(&self->histograms_[0]);
367
+ self->last_histogram_ix_[0] = self->last_histogram_ix_[1] = 0;
368
+ }
369
+
370
+ /* Does either of three things:
371
+ (1) emits the current block with a new block type;
372
+ (2) emits the current block with the type of the second last block;
373
+ (3) merges the current block with the last block. */
374
+ static void FN(BlockSplitterFinishBlock)(
375
+ FN(BlockSplitter)* self, BROTLI_BOOL is_final) { /* is_final: also publish the final block and histogram counts (see the end of this function). */
376
+ BlockSplit* split = self->split_;
377
+ double* last_entropy = self->last_entropy_;
378
+ HistogramType* histograms = self->histograms_;
379
+ self->block_size_ = /* Raise block_size_ to at least min_block_size_ before it is recorded. */
380
+ BROTLI_MAX(size_t, self->block_size_, self->min_block_size_);
381
+ if (self->num_blocks_ == 0) {
382
+ /* Create first block: it gets type 0 and its entropy seeds both last_entropy slots. */
383
+ split->lengths[0] = (uint32_t)self->block_size_;
384
+ split->types[0] = 0;
385
+ last_entropy[0] =
386
+ BitsEntropy(histograms[0].data_, self->alphabet_size_);
387
+ last_entropy[1] = last_entropy[0];
388
+ ++self->num_blocks_;
389
+ ++split->num_types;
390
+ ++self->curr_histogram_ix_;
391
+ if (self->curr_histogram_ix_ < *self->histograms_size_) /* Clear the next histogram only if its index is within *histograms_size_. */
392
+ FN(HistogramClear)(&histograms[self->curr_histogram_ix_]);
393
+ self->block_size_ = 0;
394
+ } else if (self->block_size_ > 0) { /* Always true when min_block_size_ > 0, because of the clamp above. */
395
+ double entropy = BitsEntropy(histograms[self->curr_histogram_ix_].data_,
396
+ self->alphabet_size_);
397
+ double combined_entropy[2];
398
+ double diff[2];
399
+ size_t j;
400
+ for (j = 0; j < 2; ++j) { /* j = 0: last block type; j = 1: second last block type. */
401
+ size_t last_histogram_ix = self->last_histogram_ix_[j];
402
+ self->combined_histo[j] = histograms[self->curr_histogram_ix_];
403
+ FN(HistogramAddHistogram)(&self->combined_histo[j],
404
+ &histograms[last_histogram_ix]);
405
+ combined_entropy[j] = BitsEntropy(
406
+ &self->combined_histo[j].data_[0], self->alphabet_size_);
407
+ diff[j] = combined_entropy[j] - entropy - last_entropy[j]; /* Merged entropy minus the entropies of the two histograms kept separate. */
408
+ }
409
+ /* A new block type is started only if both diffs exceed split_threshold_ and the block type limit has not been reached. */
410
+ if (split->num_types < BROTLI_MAX_NUMBER_OF_BLOCK_TYPES &&
411
+ diff[0] > self->split_threshold_ &&
412
+ diff[1] > self->split_threshold_) {
413
+ /* Create new block with a new block type, numbered split->num_types. */
414
+ split->lengths[self->num_blocks_] = (uint32_t)self->block_size_;
415
+ split->types[self->num_blocks_] = (uint8_t)split->num_types;
416
+ self->last_histogram_ix_[1] = self->last_histogram_ix_[0];
417
+ self->last_histogram_ix_[0] = (uint8_t)split->num_types;
418
+ last_entropy[1] = last_entropy[0];
419
+ last_entropy[0] = entropy;
420
+ ++self->num_blocks_;
421
+ ++split->num_types;
422
+ ++self->curr_histogram_ix_;
423
+ if (self->curr_histogram_ix_ < *self->histograms_size_)
424
+ FN(HistogramClear)(&histograms[self->curr_histogram_ix_]);
425
+ self->block_size_ = 0;
426
+ self->merge_last_count_ = 0;
427
+ self->target_block_size_ = self->min_block_size_;
428
+ } else if (diff[1] < diff[0] - 20.0) {
429
+ /* Combine this block with second last block: emit a block reusing that type, make it the most recent type and store the merged histogram for it. */
430
+ split->lengths[self->num_blocks_] = (uint32_t)self->block_size_;
431
+ split->types[self->num_blocks_] = split->types[self->num_blocks_ - 2];
432
+ BROTLI_SWAP(size_t, self->last_histogram_ix_, 0, 1);
433
+ histograms[self->last_histogram_ix_[0]] = self->combined_histo[1];
434
+ last_entropy[1] = last_entropy[0];
435
+ last_entropy[0] = combined_entropy[1];
436
+ ++self->num_blocks_;
437
+ self->block_size_ = 0;
438
+ FN(HistogramClear)(&histograms[self->curr_histogram_ix_]);
439
+ self->merge_last_count_ = 0;
440
+ self->target_block_size_ = self->min_block_size_;
441
+ } else {
442
+ /* Combine this block with last block: extend that block's length and replace its histogram with the merged one; no new block is emitted. */
443
+ split->lengths[self->num_blocks_ - 1] += (uint32_t)self->block_size_;
444
+ histograms[self->last_histogram_ix_[0]] = self->combined_histo[0];
445
+ last_entropy[0] = combined_entropy[0];
446
+ if (split->num_types == 1) { /* Only one type so far: keep both entropy slots equal. */
447
+ last_entropy[1] = last_entropy[0];
448
+ }
449
+ self->block_size_ = 0;
450
+ FN(HistogramClear)(&histograms[self->curr_histogram_ix_]);
451
+ if (++self->merge_last_count_ > 1) { /* From the second consecutive merge on, grow the target block size. */
452
+ self->target_block_size_ += self->min_block_size_;
453
+ }
454
+ }
455
+ }
456
+ if (is_final) { /* Publish the number of block types and blocks actually produced. */
457
+ *self->histograms_size_ = split->num_types;
458
+ split->num_blocks = self->num_blocks_;
459
+ }
460
+ }
461
+
462
+ /* Adds the next symbol to the current histogram and counts it in block_size_. When block_size_
463
+ reaches target_block_size_, calls BlockSplitterFinishBlock (non-final) to decide on merging the block. */
464
+ static void FN(BlockSplitterAddSymbol)(FN(BlockSplitter)* self, size_t symbol) {
465
+ FN(HistogramAdd)(&self->histograms_[self->curr_histogram_ix_], symbol);
466
+ ++self->block_size_;
467
+ if (self->block_size_ == self->target_block_size_) {
468
+ FN(BlockSplitterFinishBlock)(self, /* is_final = */ BROTLI_FALSE);
469
+ }
470
+ }
471
+
472
+ #undef HistogramType
473
+ #undef FN
474
+ /* The macros are redefined here so that every FN(X) name in the code that follows gets the suffix Command. */
475
+ #define FN(X) X ## Command
476
+ /* NOLINT(build/header_guard) */
477
+ /* Copyright 2015 Google Inc. All Rights Reserved.
478
+
479
+ Distributed under MIT license.
480
+ See file LICENSE for detail or copy at https://opensource.org/licenses/MIT
481
+ */
482
+
483
+ /* template parameters: FN */
484
+ /* HistogramType is the histogram type whose name FN(Histogram) expands to. */
485
+ #define HistogramType FN(Histogram)
486
+
487
+ /* Greedy block splitter for one block category (literal, command or distance).
488
+ */
489
+ typedef struct FN(BlockSplitter) {
490
+ /* Alphabet size of particular block category. */
491
+ size_t alphabet_size_;
492
+ /* We collect at least this many symbols for each block. */
493
+ size_t min_block_size_;
494
+ /* We merge histograms A and B if
495
+ entropy(A+B) < entropy(A) + entropy(B) + split_threshold_,
496
+ where A is the current histogram and B is the histogram of the last or the
497
+ second last block type. */
498
+ double split_threshold_;
499
+ /* Number of blocks written to split_ so far. */
500
+ size_t num_blocks_;
501
+ BlockSplit* split_; /* block split being filled in (types, lengths, counts); not owned */
502
+ HistogramType* histograms_; /* histogram array allocated by InitBlockSplitter; not owned */
503
+ size_t* histograms_size_; /* number of entries in histograms_; not owned */
504
+
505
+ /* Temporary storage for BlockSplitterFinishBlock. */
506
+ HistogramType combined_histo[2];
507
+
508
+ /* The number of symbols that we want to collect before deciding on whether
509
+ or not to merge the block with a previous one or emit a new block. */
510
+ size_t target_block_size_;
511
+ /* The number of symbols in the current histogram. */
512
+ size_t block_size_;
513
+ /* Offset of the current histogram. */
514
+ size_t curr_histogram_ix_;
515
+ /* Offset of the histograms of the previous two block types. */
516
+ size_t last_histogram_ix_[2];
517
+ /* Entropy of the previous two block types. */
518
+ double last_entropy_[2];
519
+ /* The number of times we merged the current block with the last one. */
520
+ size_t merge_last_count_;
521
+ } FN(BlockSplitter);
522
+
523
+ static void FN(InitBlockSplitter)( /* Resets the splitter state, reserves split->types/lengths and allocates the histogram array. */
524
+ MemoryManager* m, FN(BlockSplitter)* self, size_t alphabet_size,
525
+ size_t min_block_size, double split_threshold, size_t num_symbols,
526
+ BlockSplit* split, HistogramType** histograms, size_t* histograms_size) {
527
+ size_t max_num_blocks = num_symbols / min_block_size + 1; /* min_block_size is a divisor and must be non-zero; the result sizes split->types and split->lengths. */
528
+ /* We have to allocate one more histogram than the maximum number of block
529
+ types for the current histogram when the meta-block is too big. */
530
+ size_t max_num_types =
531
+ BROTLI_MIN(size_t, max_num_blocks, BROTLI_MAX_NUMBER_OF_BLOCK_TYPES + 1);
532
+ self->alphabet_size_ = alphabet_size;
533
+ self->min_block_size_ = min_block_size;
534
+ self->split_threshold_ = split_threshold;
535
+ self->num_blocks_ = 0;
536
+ self->split_ = split;
537
+ self->histograms_size_ = histograms_size;
538
+ self->target_block_size_ = min_block_size;
539
+ self->block_size_ = 0;
540
+ self->curr_histogram_ix_ = 0;
541
+ self->merge_last_count_ = 0;
542
+ BROTLI_ENSURE_CAPACITY(m, uint8_t,
543
+ split->types, split->types_alloc_size, max_num_blocks);
544
+ BROTLI_ENSURE_CAPACITY(m, uint32_t,
545
+ split->lengths, split->lengths_alloc_size, max_num_blocks);
546
+ if (BROTLI_IS_OOM(m)) return;
547
+ self->split_->num_blocks = max_num_blocks; /* Provisional value; BlockSplitterFinishBlock overwrites it when called with is_final. */
548
+ BROTLI_DCHECK(*histograms == 0);
549
+ *histograms_size = max_num_types;
550
+ *histograms = BROTLI_ALLOC(m, HistogramType, *histograms_size);
551
+ self->histograms_ = *histograms;
552
+ if (BROTLI_IS_OOM(m) || BROTLI_IS_NULL(*histograms)) return;
553
+ /* Clear only current histogram (index 0); BlockSplitterFinishBlock clears later ones when they become current. */
554
+ FN(HistogramClear)(&self->histograms_[0]);
555
+ self->last_histogram_ix_[0] = self->last_histogram_ix_[1] = 0;
556
+ }
557
+
558
+ /* Does either of three things:
559
+ (1) emits the current block with a new block type;
560
+ (2) emits the current block with the type of the second last block;
561
+ (3) merges the current block with the last block. */
562
+ static void FN(BlockSplitterFinishBlock)(
563
+ FN(BlockSplitter)* self, BROTLI_BOOL is_final) { /* is_final: also publish the final block and histogram counts (see the end of this function). */
564
+ BlockSplit* split = self->split_;
565
+ double* last_entropy = self->last_entropy_;
566
+ HistogramType* histograms = self->histograms_;
567
+ self->block_size_ = /* Raise block_size_ to at least min_block_size_ before it is recorded. */
568
+ BROTLI_MAX(size_t, self->block_size_, self->min_block_size_);
569
+ if (self->num_blocks_ == 0) {
570
+ /* Create first block: it gets type 0 and its entropy seeds both last_entropy slots. */
571
+ split->lengths[0] = (uint32_t)self->block_size_;
572
+ split->types[0] = 0;
573
+ last_entropy[0] =
574
+ BitsEntropy(histograms[0].data_, self->alphabet_size_);
575
+ last_entropy[1] = last_entropy[0];
576
+ ++self->num_blocks_;
577
+ ++split->num_types;
578
+ ++self->curr_histogram_ix_;
579
+ if (self->curr_histogram_ix_ < *self->histograms_size_) /* Clear the next histogram only if its index is within *histograms_size_. */
580
+ FN(HistogramClear)(&histograms[self->curr_histogram_ix_]);
581
+ self->block_size_ = 0;
582
+ } else if (self->block_size_ > 0) { /* Always true when min_block_size_ > 0, because of the clamp above. */
583
+ double entropy = BitsEntropy(histograms[self->curr_histogram_ix_].data_,
584
+ self->alphabet_size_);
585
+ double combined_entropy[2];
586
+ double diff[2];
587
+ size_t j;
588
+ for (j = 0; j < 2; ++j) { /* j = 0: last block type; j = 1: second last block type. */
589
+ size_t last_histogram_ix = self->last_histogram_ix_[j];
590
+ self->combined_histo[j] = histograms[self->curr_histogram_ix_];
591
+ FN(HistogramAddHistogram)(&self->combined_histo[j],
592
+ &histograms[last_histogram_ix]);
593
+ combined_entropy[j] = BitsEntropy(
594
+ &self->combined_histo[j].data_[0], self->alphabet_size_);
595
+ diff[j] = combined_entropy[j] - entropy - last_entropy[j]; /* Merged entropy minus the entropies of the two histograms kept separate. */
596
+ }
597
+ /* A new block type is started only if both diffs exceed split_threshold_ and the block type limit has not been reached. */
598
+ if (split->num_types < BROTLI_MAX_NUMBER_OF_BLOCK_TYPES &&
599
+ diff[0] > self->split_threshold_ &&
600
+ diff[1] > self->split_threshold_) {
601
+ /* Create new block with a new block type, numbered split->num_types. */
602
+ split->lengths[self->num_blocks_] = (uint32_t)self->block_size_;
603
+ split->types[self->num_blocks_] = (uint8_t)split->num_types;
604
+ self->last_histogram_ix_[1] = self->last_histogram_ix_[0];
605
+ self->last_histogram_ix_[0] = (uint8_t)split->num_types;
606
+ last_entropy[1] = last_entropy[0];
607
+ last_entropy[0] = entropy;
608
+ ++self->num_blocks_;
609
+ ++split->num_types;
610
+ ++self->curr_histogram_ix_;
611
+ if (self->curr_histogram_ix_ < *self->histograms_size_)
612
+ FN(HistogramClear)(&histograms[self->curr_histogram_ix_]);
613
+ self->block_size_ = 0;
614
+ self->merge_last_count_ = 0;
615
+ self->target_block_size_ = self->min_block_size_;
616
+ } else if (diff[1] < diff[0] - 20.0) {
617
+ /* Combine this block with second last block: emit a block reusing that type, make it the most recent type and store the merged histogram for it. */
618
+ split->lengths[self->num_blocks_] = (uint32_t)self->block_size_;
619
+ split->types[self->num_blocks_] = split->types[self->num_blocks_ - 2];
620
+ BROTLI_SWAP(size_t, self->last_histogram_ix_, 0, 1);
621
+ histograms[self->last_histogram_ix_[0]] = self->combined_histo[1];
622
+ last_entropy[1] = last_entropy[0];
623
+ last_entropy[0] = combined_entropy[1];
624
+ ++self->num_blocks_;
625
+ self->block_size_ = 0;
626
+ FN(HistogramClear)(&histograms[self->curr_histogram_ix_]);
627
+ self->merge_last_count_ = 0;
628
+ self->target_block_size_ = self->min_block_size_;
629
+ } else {
630
+ /* Combine this block with last block: extend that block's length and replace its histogram with the merged one; no new block is emitted. */
631
+ split->lengths[self->num_blocks_ - 1] += (uint32_t)self->block_size_;
632
+ histograms[self->last_histogram_ix_[0]] = self->combined_histo[0];
633
+ last_entropy[0] = combined_entropy[0];
634
+ if (split->num_types == 1) { /* Only one type so far: keep both entropy slots equal. */
635
+ last_entropy[1] = last_entropy[0];
636
+ }
637
+ self->block_size_ = 0;
638
+ FN(HistogramClear)(&histograms[self->curr_histogram_ix_]);
639
+ if (++self->merge_last_count_ > 1) { /* From the second consecutive merge on, grow the target block size. */
640
+ self->target_block_size_ += self->min_block_size_;
641
+ }
642
+ }
643
+ }
644
+ if (is_final) { /* Publish the number of block types and blocks actually produced. */
645
+ *self->histograms_size_ = split->num_types;
646
+ split->num_blocks = self->num_blocks_;
647
+ }
648
+ }
649
+
650
+ /* Adds the next symbol to the current histogram and counts it in block_size_. When block_size_
651
+ reaches target_block_size_, calls BlockSplitterFinishBlock (non-final) to decide on merging the block. */
652
+ static void FN(BlockSplitterAddSymbol)(FN(BlockSplitter)* self, size_t symbol) {
653
+ FN(HistogramAdd)(&self->histograms_[self->curr_histogram_ix_], symbol);
654
+ ++self->block_size_;
655
+ if (self->block_size_ == self->target_block_size_) {
656
+ FN(BlockSplitterFinishBlock)(self, /* is_final = */ BROTLI_FALSE);
657
+ }
658
+ }
659
+
660
+ #undef HistogramType
661
+ #undef FN
662
+ /* The macros are redefined here so that every FN(X) name in the code that follows gets the suffix Distance. */
663
+ #define FN(X) X ## Distance
664
+ /* NOLINT(build/header_guard) */
665
+ /* Copyright 2015 Google Inc. All Rights Reserved.
666
+
667
+ Distributed under MIT license.
668
+ See file LICENSE for detail or copy at https://opensource.org/licenses/MIT
669
+ */
670
+
671
+ /* template parameters: FN */
672
+ /* HistogramType is the histogram type whose name FN(Histogram) expands to. */
673
+ #define HistogramType FN(Histogram)
674
+
675
+ /* Greedy block splitter for one block category (literal, command or distance).
676
+ */
677
+ typedef struct FN(BlockSplitter) {
678
+ /* Alphabet size of particular block category. */
679
+ size_t alphabet_size_;
680
+ /* We collect at least this many symbols for each block. */
681
+ size_t min_block_size_;
682
+ /* We merge histograms A and B if
683
+ entropy(A+B) < entropy(A) + entropy(B) + split_threshold_,
684
+ where A is the current histogram and B is the histogram of the last or the
685
+ second last block type. */
686
+ double split_threshold_;
687
+ /* Number of blocks written to split_ so far. */
688
+ size_t num_blocks_;
689
+ BlockSplit* split_; /* block split being filled in (types, lengths, counts); not owned */
690
+ HistogramType* histograms_; /* histogram array allocated by InitBlockSplitter; not owned */
691
+ size_t* histograms_size_; /* number of entries in histograms_; not owned */
692
+
693
+ /* Temporary storage for BlockSplitterFinishBlock. */
694
+ HistogramType combined_histo[2];
695
+
696
+ /* The number of symbols that we want to collect before deciding on whether
697
+ or not to merge the block with a previous one or emit a new block. */
698
+ size_t target_block_size_;
699
+ /* The number of symbols in the current histogram. */
700
+ size_t block_size_;
701
+ /* Offset of the current histogram. */
702
+ size_t curr_histogram_ix_;
703
+ /* Offset of the histograms of the previous two block types. */
704
+ size_t last_histogram_ix_[2];
705
+ /* Entropy of the previous two block types. */
706
+ double last_entropy_[2];
707
+ /* The number of times we merged the current block with the last one. */
708
+ size_t merge_last_count_;
709
+ } FN(BlockSplitter);
710
+
711
+ static void FN(InitBlockSplitter)( /* Resets the splitter state, reserves split->types/lengths and allocates the histogram array. */
712
+ MemoryManager* m, FN(BlockSplitter)* self, size_t alphabet_size,
713
+ size_t min_block_size, double split_threshold, size_t num_symbols,
714
+ BlockSplit* split, HistogramType** histograms, size_t* histograms_size) {
715
+ size_t max_num_blocks = num_symbols / min_block_size + 1; /* min_block_size is a divisor and must be non-zero; the result sizes split->types and split->lengths. */
716
+ /* We have to allocate one more histogram than the maximum number of block
717
+ types for the current histogram when the meta-block is too big. */
718
+ size_t max_num_types =
719
+ BROTLI_MIN(size_t, max_num_blocks, BROTLI_MAX_NUMBER_OF_BLOCK_TYPES + 1);
720
+ self->alphabet_size_ = alphabet_size;
721
+ self->min_block_size_ = min_block_size;
722
+ self->split_threshold_ = split_threshold;
723
+ self->num_blocks_ = 0;
724
+ self->split_ = split;
725
+ self->histograms_size_ = histograms_size;
726
+ self->target_block_size_ = min_block_size;
727
+ self->block_size_ = 0;
728
+ self->curr_histogram_ix_ = 0;
729
+ self->merge_last_count_ = 0;
730
+ BROTLI_ENSURE_CAPACITY(m, uint8_t,
731
+ split->types, split->types_alloc_size, max_num_blocks);
732
+ BROTLI_ENSURE_CAPACITY(m, uint32_t,
733
+ split->lengths, split->lengths_alloc_size, max_num_blocks);
734
+ if (BROTLI_IS_OOM(m)) return;
735
+ self->split_->num_blocks = max_num_blocks; /* Provisional value; BlockSplitterFinishBlock overwrites it when called with is_final. */
736
+ BROTLI_DCHECK(*histograms == 0);
737
+ *histograms_size = max_num_types;
738
+ *histograms = BROTLI_ALLOC(m, HistogramType, *histograms_size);
739
+ self->histograms_ = *histograms;
740
+ if (BROTLI_IS_OOM(m) || BROTLI_IS_NULL(*histograms)) return;
741
+ /* Clear only current histogram (index 0); BlockSplitterFinishBlock clears later ones when they become current. */
742
+ FN(HistogramClear)(&self->histograms_[0]);
743
+ self->last_histogram_ix_[0] = self->last_histogram_ix_[1] = 0;
744
+ }
745
+
746
+ /* Does either of three things:
747
+ (1) emits the current block with a new block type;
748
+ (2) emits the current block with the type of the second last block;
749
+ (3) merges the current block with the last block. */
750
+ static void FN(BlockSplitterFinishBlock)(
751
+ FN(BlockSplitter)* self, BROTLI_BOOL is_final) { /* is_final: also publish the final block and histogram counts (see the end of this function). */
752
+ BlockSplit* split = self->split_;
753
+ double* last_entropy = self->last_entropy_;
754
+ HistogramType* histograms = self->histograms_;
755
+ self->block_size_ = /* Raise block_size_ to at least min_block_size_ before it is recorded. */
756
+ BROTLI_MAX(size_t, self->block_size_, self->min_block_size_);
757
+ if (self->num_blocks_ == 0) {
758
+ /* Create first block: it gets type 0 and its entropy seeds both last_entropy slots. */
759
+ split->lengths[0] = (uint32_t)self->block_size_;
760
+ split->types[0] = 0;
761
+ last_entropy[0] =
762
+ BitsEntropy(histograms[0].data_, self->alphabet_size_);
763
+ last_entropy[1] = last_entropy[0];
764
+ ++self->num_blocks_;
765
+ ++split->num_types;
766
+ ++self->curr_histogram_ix_;
767
+ if (self->curr_histogram_ix_ < *self->histograms_size_) /* Clear the next histogram only if its index is within *histograms_size_. */
768
+ FN(HistogramClear)(&histograms[self->curr_histogram_ix_]);
769
+ self->block_size_ = 0;
770
+ } else if (self->block_size_ > 0) { /* Always true when min_block_size_ > 0, because of the clamp above. */
771
+ double entropy = BitsEntropy(histograms[self->curr_histogram_ix_].data_,
772
+ self->alphabet_size_);
773
+ double combined_entropy[2];
774
+ double diff[2];
775
+ size_t j;
776
+ for (j = 0; j < 2; ++j) { /* j = 0: last block type; j = 1: second last block type. */
777
+ size_t last_histogram_ix = self->last_histogram_ix_[j];
778
+ self->combined_histo[j] = histograms[self->curr_histogram_ix_];
779
+ FN(HistogramAddHistogram)(&self->combined_histo[j],
780
+ &histograms[last_histogram_ix]);
781
+ combined_entropy[j] = BitsEntropy(
782
+ &self->combined_histo[j].data_[0], self->alphabet_size_);
783
+ diff[j] = combined_entropy[j] - entropy - last_entropy[j]; /* Merged entropy minus the entropies of the two histograms kept separate. */
784
+ }
785
+ /* A new block type is started only if both diffs exceed split_threshold_ and the block type limit has not been reached. */
786
+ if (split->num_types < BROTLI_MAX_NUMBER_OF_BLOCK_TYPES &&
787
+ diff[0] > self->split_threshold_ &&
788
+ diff[1] > self->split_threshold_) {
789
+ /* Create new block with a new block type, numbered split->num_types. */
790
+ split->lengths[self->num_blocks_] = (uint32_t)self->block_size_;
791
+ split->types[self->num_blocks_] = (uint8_t)split->num_types;
792
+ self->last_histogram_ix_[1] = self->last_histogram_ix_[0];
793
+ self->last_histogram_ix_[0] = (uint8_t)split->num_types;
794
+ last_entropy[1] = last_entropy[0];
795
+ last_entropy[0] = entropy;
796
+ ++self->num_blocks_;
797
+ ++split->num_types;
798
+ ++self->curr_histogram_ix_;
799
+ if (self->curr_histogram_ix_ < *self->histograms_size_)
800
+ FN(HistogramClear)(&histograms[self->curr_histogram_ix_]);
801
+ self->block_size_ = 0;
802
+ self->merge_last_count_ = 0;
803
+ self->target_block_size_ = self->min_block_size_;
804
+ } else if (diff[1] < diff[0] - 20.0) {
805
+ /* Combine this block with second last block: emit a block reusing that type, make it the most recent type and store the merged histogram for it. */
806
+ split->lengths[self->num_blocks_] = (uint32_t)self->block_size_;
807
+ split->types[self->num_blocks_] = split->types[self->num_blocks_ - 2];
808
+ BROTLI_SWAP(size_t, self->last_histogram_ix_, 0, 1);
809
+ histograms[self->last_histogram_ix_[0]] = self->combined_histo[1];
810
+ last_entropy[1] = last_entropy[0];
811
+ last_entropy[0] = combined_entropy[1];
812
+ ++self->num_blocks_;
813
+ self->block_size_ = 0;
814
+ FN(HistogramClear)(&histograms[self->curr_histogram_ix_]);
815
+ self->merge_last_count_ = 0;
816
+ self->target_block_size_ = self->min_block_size_;
817
+ } else {
818
+ /* Combine this block with last block: extend that block's length and replace its histogram with the merged one; no new block is emitted. */
819
+ split->lengths[self->num_blocks_ - 1] += (uint32_t)self->block_size_;
820
+ histograms[self->last_histogram_ix_[0]] = self->combined_histo[0];
821
+ last_entropy[0] = combined_entropy[0];
822
+ if (split->num_types == 1) { /* Only one type so far: keep both entropy slots equal. */
823
+ last_entropy[1] = last_entropy[0];
824
+ }
825
+ self->block_size_ = 0;
826
+ FN(HistogramClear)(&histograms[self->curr_histogram_ix_]);
827
+ if (++self->merge_last_count_ > 1) { /* From the second consecutive merge on, grow the target block size. */
828
+ self->target_block_size_ += self->min_block_size_;
829
+ }
830
+ }
831
+ }
832
+ if (is_final) { /* Publish the number of block types and blocks actually produced. */
833
+ *self->histograms_size_ = split->num_types;
834
+ split->num_blocks = self->num_blocks_;
835
+ }
836
+ }
837
+
838
+ /* Adds the next symbol to the current histogram and counts it in block_size_. When block_size_
839
+ reaches target_block_size_, calls BlockSplitterFinishBlock (non-final) to decide on merging the block. */
840
+ static void FN(BlockSplitterAddSymbol)(FN(BlockSplitter)* self, size_t symbol) {
841
+ FN(HistogramAdd)(&self->histograms_[self->curr_histogram_ix_], symbol);
842
+ ++self->block_size_;
843
+ if (self->block_size_ == self->target_block_size_) {
844
+ FN(BlockSplitterFinishBlock)(self, /* is_final = */ BROTLI_FALSE);
845
+ }
846
+ }
847
+
848
+ #undef HistogramType
849
+ #undef FN
850
+ /* Upper bound on num_contexts for ContextBlockSplitter; it sizes the per-context entropy arrays used there. */
851
+ #define BROTLI_MAX_STATIC_CONTEXTS 13
852
+
853
+ /* Greedy block splitter for one block category (literal, command or distance).
854
+ Gathers histograms for all context buckets. */
855
+ typedef struct ContextBlockSplitter {
856
+ /* Alphabet size of particular block category. */
857
+ size_t alphabet_size_;
858
+ size_t num_contexts_; /* Number of context buckets; each block type uses num_contexts_ consecutive histograms. */
859
+ size_t max_block_types_; /* Set by InitContextBlockSplitter to BROTLI_MAX_NUMBER_OF_BLOCK_TYPES / num_contexts. */
860
+ /* We collect at least this many symbols for each block. */
861
+ size_t min_block_size_;
862
+ /* We merge histograms A and B if
863
+ entropy(A+B) < entropy(A) + entropy(B) + split_threshold_,
864
+ where A is the current histogram and B is the histogram of the last or the
865
+ second last block type. */
866
+ double split_threshold_;
867
+ /* Number of blocks written to split_ so far. */
868
+ size_t num_blocks_;
869
+ BlockSplit* split_; /* block split being filled in (types, lengths, counts); not owned */
870
+ HistogramLiteral* histograms_; /* histogram array allocated by InitContextBlockSplitter; not owned */
871
+ size_t* histograms_size_; /* number of entries in histograms_; not owned */
872
+
873
+ /* The number of symbols that we want to collect before deciding on whether
874
+ or not to merge the block with a previous one or emit a new block. */
875
+ size_t target_block_size_;
876
+ /* The number of symbols in the current histogram. */
877
+ size_t block_size_;
878
+ /* Offset of the current histogram. */
879
+ size_t curr_histogram_ix_;
880
+ /* Offset of the histograms of the previous two block types. */
881
+ size_t last_histogram_ix_[2];
882
+ /* Entropy of the previous two block types, per context: entries [0, num_contexts_) belong to the last type, [num_contexts_, 2 * num_contexts_) to the second last. */
883
+ double last_entropy_[2 * BROTLI_MAX_STATIC_CONTEXTS];
884
+ /* The number of times we merged the current block with the last one. */
885
+ size_t merge_last_count_;
886
+ } ContextBlockSplitter;
887
+
888
+ static void InitContextBlockSplitter( /* Resets the splitter state, reserves split->types/lengths and allocates num_contexts histograms per possible block type. */
889
+ MemoryManager* m, ContextBlockSplitter* self, size_t alphabet_size,
890
+ size_t num_contexts, size_t min_block_size, double split_threshold,
891
+ size_t num_symbols, BlockSplit* split, HistogramLiteral** histograms,
892
+ size_t* histograms_size) {
893
+ size_t max_num_blocks = num_symbols / min_block_size + 1; /* min_block_size is a divisor and must be non-zero. */
894
+ size_t max_num_types;
895
+ BROTLI_DCHECK(num_contexts <= BROTLI_MAX_STATIC_CONTEXTS);
896
+
897
+ self->alphabet_size_ = alphabet_size;
898
+ self->num_contexts_ = num_contexts;
899
+ self->max_block_types_ = BROTLI_MAX_NUMBER_OF_BLOCK_TYPES / num_contexts; /* num_contexts is a divisor and must be non-zero. */
900
+ self->min_block_size_ = min_block_size;
901
+ self->split_threshold_ = split_threshold;
902
+ self->num_blocks_ = 0;
903
+ self->split_ = split;
904
+ self->histograms_size_ = histograms_size;
905
+ self->target_block_size_ = min_block_size;
906
+ self->block_size_ = 0;
907
+ self->curr_histogram_ix_ = 0;
908
+ self->merge_last_count_ = 0;
909
+
910
+ /* We have to allocate one more histogram than the maximum number of block
911
+ types for the current histogram when the meta-block is too big. */
912
+ max_num_types =
913
+ BROTLI_MIN(size_t, max_num_blocks, self->max_block_types_ + 1);
914
+ BROTLI_ENSURE_CAPACITY(m, uint8_t,
915
+ split->types, split->types_alloc_size, max_num_blocks);
916
+ BROTLI_ENSURE_CAPACITY(m, uint32_t,
917
+ split->lengths, split->lengths_alloc_size, max_num_blocks);
918
+ if (BROTLI_IS_OOM(m)) return;
919
+ split->num_blocks = max_num_blocks; /* Provisional value; ContextBlockSplitterFinishBlock overwrites it when called with is_final. */
920
+ if (BROTLI_IS_OOM(m)) return; /* NOTE(review): appears redundant, only a plain assignment separates it from the previous OOM check - confirm. */
921
+ BROTLI_DCHECK(*histograms == 0);
922
+ *histograms_size = max_num_types * num_contexts;
923
+ *histograms = BROTLI_ALLOC(m, HistogramLiteral, *histograms_size);
924
+ self->histograms_ = *histograms;
925
+ if (BROTLI_IS_OOM(m) || BROTLI_IS_NULL(*histograms)) return;
926
+ /* Clear only current histogram set (the first num_contexts entries). */
927
+ ClearHistogramsLiteral(&self->histograms_[0], num_contexts);
928
+ self->last_histogram_ix_[0] = self->last_histogram_ix_[1] = 0;
929
+ }
930
+
931
+ /* Does either of three things:
932
+ (1) emits the current block with a new block type;
933
+ (2) emits the current block with the type of the second last block;
934
+ (3) merges the current block with the last block. */
935
+ static void ContextBlockSplitterFinishBlock(
936
+ ContextBlockSplitter* self, MemoryManager* m, BROTLI_BOOL is_final) { /* m: used for the scratch histogram allocation; is_final: also publish the final counts. */
937
+ BlockSplit* split = self->split_;
938
+ const size_t num_contexts = self->num_contexts_;
939
+ double* last_entropy = self->last_entropy_;
940
+ HistogramLiteral* histograms = self->histograms_;
941
+ /* Raise block_size_ to at least min_block_size_ before it is recorded. */
942
+ if (self->block_size_ < self->min_block_size_) {
943
+ self->block_size_ = self->min_block_size_;
944
+ }
945
+ if (self->num_blocks_ == 0) {
946
+ size_t i;
947
+ /* Create first block: it gets type 0. */
948
+ split->lengths[0] = (uint32_t)self->block_size_;
949
+ split->types[0] = 0;
950
+ /* Seed both entropy slots of every context from the first histogram set. */
951
+ for (i = 0; i < num_contexts; ++i) {
952
+ last_entropy[i] =
953
+ BitsEntropy(histograms[i].data_, self->alphabet_size_);
954
+ last_entropy[num_contexts + i] = last_entropy[i];
955
+ }
956
+ ++self->num_blocks_;
957
+ ++split->num_types;
958
+ self->curr_histogram_ix_ += num_contexts;
959
+ if (self->curr_histogram_ix_ < *self->histograms_size_) { /* Clear the next histogram set only if its index is within *histograms_size_. */
960
+ ClearHistogramsLiteral(
961
+ &self->histograms_[self->curr_histogram_ix_], self->num_contexts_);
962
+ }
963
+ self->block_size_ = 0;
964
+ } else if (self->block_size_ > 0) { /* Always true when min_block_size_ > 0, because of the clamp above. */
965
+ /* Try merging the set of histograms for the current block type with the
966
+ respective set of histograms for the last and second last block types.
967
+ Decide over the split based on the total reduction of entropy across
968
+ all contexts. */
969
+ double entropy[BROTLI_MAX_STATIC_CONTEXTS];
970
+ HistogramLiteral* combined_histo =
971
+ BROTLI_ALLOC(m, HistogramLiteral, 2 * num_contexts);
972
+ double combined_entropy[2 * BROTLI_MAX_STATIC_CONTEXTS];
973
+ double diff[2] = { 0.0 };
974
+ size_t i;
975
+ if (BROTLI_IS_OOM(m) || BROTLI_IS_NULL(combined_histo)) return; /* This early return also skips the is_final bookkeeping at the end. */
976
+ for (i = 0; i < num_contexts; ++i) {
977
+ size_t curr_histo_ix = self->curr_histogram_ix_ + i;
978
+ size_t j;
979
+ entropy[i] = BitsEntropy(histograms[curr_histo_ix].data_,
980
+ self->alphabet_size_);
981
+ for (j = 0; j < 2; ++j) { /* j = 0: last block type; j = 1: second last block type. */
982
+ size_t jx = j * num_contexts + i;
983
+ size_t last_histogram_ix = self->last_histogram_ix_[j] + i;
984
+ combined_histo[jx] = histograms[curr_histo_ix];
985
+ HistogramAddHistogramLiteral(&combined_histo[jx],
986
+ &histograms[last_histogram_ix]);
987
+ combined_entropy[jx] = BitsEntropy(
988
+ &combined_histo[jx].data_[0], self->alphabet_size_);
989
+ diff[j] += combined_entropy[jx] - entropy[i] - last_entropy[jx]; /* Summed over all contexts. */
990
+ }
991
+ }
992
+ /* A new block type is started only if both summed diffs exceed split_threshold_ and max_block_types_ has not been reached. */
993
+ if (split->num_types < self->max_block_types_ &&
994
+ diff[0] > self->split_threshold_ &&
995
+ diff[1] > self->split_threshold_) {
996
+ /* Create new block with a new block type, numbered split->num_types. */
997
+ split->lengths[self->num_blocks_] = (uint32_t)self->block_size_;
998
+ split->types[self->num_blocks_] = (uint8_t)split->num_types;
999
+ self->last_histogram_ix_[1] = self->last_histogram_ix_[0];
1000
+ self->last_histogram_ix_[0] = split->num_types * num_contexts;
1001
+ for (i = 0; i < num_contexts; ++i) {
1002
+ last_entropy[num_contexts + i] = last_entropy[i];
1003
+ last_entropy[i] = entropy[i];
1004
+ }
1005
+ ++self->num_blocks_;
1006
+ ++split->num_types;
1007
+ self->curr_histogram_ix_ += num_contexts;
1008
+ if (self->curr_histogram_ix_ < *self->histograms_size_) {
1009
+ ClearHistogramsLiteral(
1010
+ &self->histograms_[self->curr_histogram_ix_], self->num_contexts_);
1011
+ }
1012
+ self->block_size_ = 0;
1013
+ self->merge_last_count_ = 0;
1014
+ self->target_block_size_ = self->min_block_size_;
1015
+ } else if (diff[1] < diff[0] - 20.0) {
1016
+ /* Combine this block with second last block: emit a block reusing that type, make it the most recent type and store the merged histograms for it. */
1017
+ split->lengths[self->num_blocks_] = (uint32_t)self->block_size_;
1018
+ split->types[self->num_blocks_] = split->types[self->num_blocks_ - 2];
1019
+ BROTLI_SWAP(size_t, self->last_histogram_ix_, 0, 1);
1020
+ for (i = 0; i < num_contexts; ++i) {
1021
+ histograms[self->last_histogram_ix_[0] + i] =
1022
+ combined_histo[num_contexts + i];
1023
+ last_entropy[num_contexts + i] = last_entropy[i];
1024
+ last_entropy[i] = combined_entropy[num_contexts + i];
1025
+ HistogramClearLiteral(&histograms[self->curr_histogram_ix_ + i]);
1026
+ }
1027
+ ++self->num_blocks_;
1028
+ self->block_size_ = 0;
1029
+ self->merge_last_count_ = 0;
1030
+ self->target_block_size_ = self->min_block_size_;
1031
+ } else {
1032
+ /* Combine this block with last block: extend that block's length and replace its histograms with the merged ones; no new block is emitted. */
1033
+ split->lengths[self->num_blocks_ - 1] += (uint32_t)self->block_size_;
1034
+ for (i = 0; i < num_contexts; ++i) {
1035
+ histograms[self->last_histogram_ix_[0] + i] = combined_histo[i];
1036
+ last_entropy[i] = combined_entropy[i];
1037
+ if (split->num_types == 1) { /* Only one type so far: keep both entropy slots equal. */
1038
+ last_entropy[num_contexts + i] = last_entropy[i];
1039
+ }
1040
+ HistogramClearLiteral(&histograms[self->curr_histogram_ix_ + i]);
1041
+ }
1042
+ self->block_size_ = 0;
1043
+ if (++self->merge_last_count_ > 1) { /* From the second consecutive merge on, grow the target block size. */
1044
+ self->target_block_size_ += self->min_block_size_;
1045
+ }
1046
+ }
1047
+ BROTLI_FREE(m, combined_histo); /* The scratch histograms are only used within this call. */
1048
+ }
1049
+ if (is_final) { /* Publish the number of histograms and blocks actually produced. */
1050
+ *self->histograms_size_ = split->num_types * num_contexts;
1051
+ split->num_blocks = self->num_blocks_;
1052
+ }
1053
+ }
1054
+
1055
+ /* Adds the next symbol to the histogram at curr_histogram_ix_ + context and counts it in block_size_. When
1056
+ block_size_ reaches target_block_size_, calls ContextBlockSplitterFinishBlock (non-final) to decide on merging the block. */
1057
+ static void ContextBlockSplitterAddSymbol(
1058
+ ContextBlockSplitter* self, MemoryManager* m,
1059
+ size_t symbol, size_t context) {
1060
+ HistogramAddLiteral(&self->histograms_[self->curr_histogram_ix_ + context],
1061
+ symbol);
1062
+ ++self->block_size_;
1063
+ if (self->block_size_ == self->target_block_size_) {
1064
+ ContextBlockSplitterFinishBlock(self, m, /* is_final = */ BROTLI_FALSE);
1065
+ if (BROTLI_IS_OOM(m)) return;
1066
+ }
1067
+ }
1068
+
1069
+ static void MapStaticContexts(MemoryManager* m, /* Allocates and fills mb->literal_context_map from static_context_map. */
1070
+ size_t num_contexts,
1071
+ const uint32_t* static_context_map,
1072
+ MetaBlockSplit* mb) {
1073
+ size_t i;
1074
+ BROTLI_DCHECK(mb->literal_context_map == 0);
1075
+ mb->literal_context_map_size = /* (1 << BROTLI_LITERAL_CONTEXT_BITS) entries per literal block type. */
1076
+ mb->literal_split.num_types << BROTLI_LITERAL_CONTEXT_BITS;
1077
+ mb->literal_context_map =
1078
+ BROTLI_ALLOC(m, uint32_t, mb->literal_context_map_size);
1079
+ if (BROTLI_IS_OOM(m) || BROTLI_IS_NULL(mb->literal_context_map)) return;
1080
+ /* Entry for (block type i, context j) is i * num_contexts + static_context_map[j]. */
1081
+ for (i = 0; i < mb->literal_split.num_types; ++i) {
1082
+ uint32_t offset = (uint32_t)(i * num_contexts);
1083
+ size_t j;
1084
+ for (j = 0; j < (1u << BROTLI_LITERAL_CONTEXT_BITS); ++j) {
1085
+ mb->literal_context_map[(i << BROTLI_LITERAL_CONTEXT_BITS) + j] =
1086
+ offset + static_context_map[j];
1087
+ }
1088
+ }
1089
+ }
1090
+
1091
+ typedef struct GreedyMetablockArena { /* Working state for one greedy meta-block build: one splitter per block category. */
1092
+ union { /* Only one literal splitter is used per build: plain when num_contexts == 1, ctx otherwise. */
1093
+ BlockSplitterLiteral plain;
1094
+ ContextBlockSplitter ctx;
1095
+ } lit_blocks;
1096
+ BlockSplitterCommand cmd_blocks;
1097
+ BlockSplitterDistance dist_blocks;
1098
+ } GreedyMetablockArena;
1099
+
1100
+ static BROTLI_INLINE void BrotliBuildMetaBlockGreedyInternal( /* Runs the literal, command and distance splitters over the commands and fills mb. */
1101
+ MemoryManager* m, GreedyMetablockArena* arena, const uint8_t* ringbuffer,
1102
+ size_t pos, size_t mask, uint8_t prev_byte, uint8_t prev_byte2,
1103
+ ContextLut literal_context_lut, const size_t num_contexts,
1104
+ const uint32_t* static_context_map, const Command* commands,
1105
+ size_t n_commands, MetaBlockSplit* mb) {
1106
+ size_t num_literals = 0;
1107
+ size_t i;
1108
+ for (i = 0; i < n_commands; ++i) { /* Total literal count is the sum of all insert lengths. */
1109
+ num_literals += commands[i].insert_len_;
1110
+ }
1111
+ /* Literal splitter: plain for a single context, context-aware otherwise. */
1112
+ if (num_contexts == 1) {
1113
+ InitBlockSplitterLiteral(m, &arena->lit_blocks.plain, 256, 512, 400.0,
1114
+ num_literals, &mb->literal_split, &mb->literal_histograms,
1115
+ &mb->literal_histograms_size);
1116
+ } else {
1117
+ InitContextBlockSplitter(m, &arena->lit_blocks.ctx, 256, num_contexts, 512,
1118
+ 400.0, num_literals, &mb->literal_split, &mb->literal_histograms,
1119
+ &mb->literal_histograms_size);
1120
+ }
1121
+ if (BROTLI_IS_OOM(m)) return;
1122
+ InitBlockSplitterCommand(m, &arena->cmd_blocks, BROTLI_NUM_COMMAND_SYMBOLS,
1123
+ 1024, 500.0, n_commands, &mb->command_split, &mb->command_histograms,
1124
+ &mb->command_histograms_size);
1125
+ if (BROTLI_IS_OOM(m)) return;
1126
+ InitBlockSplitterDistance(m, &arena->dist_blocks, 64, 512, 100.0, n_commands,
1127
+ &mb->distance_split, &mb->distance_histograms,
1128
+ &mb->distance_histograms_size);
1129
+ if (BROTLI_IS_OOM(m)) return;
1130
+ /* Feed each command prefix, its inserted literals and, where applicable, its distance symbol to the splitters. */
1131
+ for (i = 0; i < n_commands; ++i) {
1132
+ const Command cmd = commands[i];
1133
+ size_t j;
1134
+ BlockSplitterAddSymbolCommand(&arena->cmd_blocks, cmd.cmd_prefix_);
1135
+ for (j = cmd.insert_len_; j != 0; --j) {
1136
+ uint8_t literal = ringbuffer[pos & mask];
1137
+ if (num_contexts == 1) {
1138
+ BlockSplitterAddSymbolLiteral(&arena->lit_blocks.plain, literal);
1139
+ } else {
1140
+ size_t context =
1141
+ BROTLI_CONTEXT(prev_byte, prev_byte2, literal_context_lut);
1142
+ ContextBlockSplitterAddSymbol(&arena->lit_blocks.ctx, m, literal,
1143
+ static_context_map[context]);
1144
+ if (BROTLI_IS_OOM(m)) return;
1145
+ }
1146
+ prev_byte2 = prev_byte;
1147
+ prev_byte = literal;
1148
+ ++pos;
1149
+ }
1150
+ pos += CommandCopyLen(&cmd);
1151
+ if (CommandCopyLen(&cmd)) { /* After a copy, the context bytes are reloaded from the two bytes preceding the new pos. */
1152
+ prev_byte2 = ringbuffer[(pos - 2) & mask];
1153
+ prev_byte = ringbuffer[(pos - 1) & mask];
1154
+ if (cmd.cmd_prefix_ >= 128) { /* NOTE(review): presumably prefixes >= 128 are the ones with an explicit distance code - confirm against the command encoding. */
1155
+ BlockSplitterAddSymbolDistance(
1156
+ &arena->dist_blocks, cmd.dist_prefix_ & 0x3FF);
1157
+ }
1158
+ }
1159
+ }
1160
+ /* Finish the last pending block of every splitter and publish the final counts. */
1161
+ if (num_contexts == 1) {
1162
+ BlockSplitterFinishBlockLiteral(
1163
+ &arena->lit_blocks.plain, /* is_final = */ BROTLI_TRUE);
1164
+ } else {
1165
+ ContextBlockSplitterFinishBlock(
1166
+ &arena->lit_blocks.ctx, m, /* is_final = */ BROTLI_TRUE);
1167
+ if (BROTLI_IS_OOM(m)) return;
1168
+ }
1169
+ BlockSplitterFinishBlockCommand(
1170
+ &arena->cmd_blocks, /* is_final = */ BROTLI_TRUE);
1171
+ BlockSplitterFinishBlockDistance(
1172
+ &arena->dist_blocks, /* is_final = */ BROTLI_TRUE);
1173
+ /* With several contexts, the literal context map is built from the static map. */
1174
+ if (num_contexts > 1) {
1175
+ MapStaticContexts(m, num_contexts, static_context_map, mb);
1176
+ }
1177
+ }
1178
+
1179
+ void duckdb_brotli::BrotliBuildMetaBlockGreedy(MemoryManager* m, /* Entry point: allocates a GreedyMetablockArena, runs BrotliBuildMetaBlockGreedyInternal with it to fill *mb, then frees the arena. Returns nothing; allocation failure is detected via BROTLI_IS_OOM(m) / BROTLI_IS_NULL(arena). */
1180
+ const uint8_t* ringbuffer,
1181
+ size_t pos,
1182
+ size_t mask,
1183
+ uint8_t prev_byte,
1184
+ uint8_t prev_byte2,
1185
+ ContextLut literal_context_lut,
1186
+ size_t num_contexts, /* selects which of the two call forms below is used (== 1 or not) */
1187
+ const uint32_t* static_context_map, /* only forwarded when num_contexts != 1 */
1188
+ const Command* commands,
1189
+ size_t n_commands,
1190
+ MetaBlockSplit* mb) { /* mb is passed through to the internal builder unchanged */
1191
+ GreedyMetablockArena* arena = BROTLI_ALLOC(m, GreedyMetablockArena, 1); /* one arena object, obtained through the memory manager m */
1192
+ if (BROTLI_IS_OOM(m) || BROTLI_IS_NULL(arena)) return; /* allocation failed: leave before the builder is invoked */
1193
+ if (num_contexts == 1) { /* single-context case: the literal 1 and NULL replace num_contexts / static_context_map */
1194
+ BrotliBuildMetaBlockGreedyInternal(m, arena, ringbuffer, pos, mask,
1195
+ prev_byte, prev_byte2, literal_context_lut, 1, NULL, commands, /* NOTE(review): constant arguments presumably let the callee be specialized for this case - confirm */
1196
+ n_commands, mb);
1197
+ } else { /* otherwise the caller's context count and static context map are forwarded as given */
1198
+ BrotliBuildMetaBlockGreedyInternal(m, arena, ringbuffer, pos, mask,
1199
+ prev_byte, prev_byte2, literal_context_lut, num_contexts,
1200
+ static_context_map, commands, n_commands, mb);
1201
+ }
1202
+ BROTLI_FREE(m, arena); /* released on every path that reached the builder; the builder's result is not inspected here */
1203
+ }
1204
+
1205
+ void duckdb_brotli::BrotliOptimizeHistograms(uint32_t num_distance_codes, /* Calls BrotliOptimizeHuffmanCountsForRle on the data_ of every literal, command and distance histogram held by *mb. */
1206
+ MetaBlockSplit* mb) { /* histograms are modified in place through mb; nothing is returned */
1207
+ uint8_t good_for_rle[BROTLI_NUM_COMMAND_SYMBOLS]; /* scratch buffer handed to every call below. NOTE(review): assumes 256 and num_distance_codes do not exceed BROTLI_NUM_COMMAND_SYMBOLS - confirm against the callee */
1208
+ size_t i;
1209
+ for (i = 0; i < mb->literal_histograms_size; ++i) { /* literal histograms: alphabet length 256 */
1210
+ BrotliOptimizeHuffmanCountsForRle(256, mb->literal_histograms[i].data_,
1211
+ good_for_rle);
1212
+ }
1213
+ for (i = 0; i < mb->command_histograms_size; ++i) { /* command histograms: alphabet length BROTLI_NUM_COMMAND_SYMBOLS */
1214
+ BrotliOptimizeHuffmanCountsForRle(BROTLI_NUM_COMMAND_SYMBOLS,
1215
+ mb->command_histograms[i].data_,
1216
+ good_for_rle);
1217
+ }
1218
+ for (i = 0; i < mb->distance_histograms_size; ++i) { /* distance histograms: alphabet length supplied by the caller */
1219
+ BrotliOptimizeHuffmanCountsForRle(num_distance_codes,
1220
+ mb->distance_histograms[i].data_,
1221
+ good_for_rle);
1222
+ }
1223
+ }
1224
+
1225
+