duckdb 1.0.1-dev21.0 → 1.0.1-dev27.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (1390)
  1. package/.github/workflows/HighPriorityIssues.yml +2 -2
  2. package/.github/workflows/NodeJS.yml +1 -1
  3. package/binding.gyp +41 -0
  4. package/package.json +1 -1
  5. package/src/duckdb/extension/icu/icu-dateadd.cpp +4 -2
  6. package/src/duckdb/extension/icu/icu-datefunc.cpp +6 -2
  7. package/src/duckdb/extension/icu/icu-datesub.cpp +13 -2
  8. package/src/duckdb/extension/icu/icu-strptime.cpp +6 -6
  9. package/src/duckdb/extension/icu/icu-table-range.cpp +92 -73
  10. package/src/duckdb/extension/icu/icu-timebucket.cpp +12 -2
  11. package/src/duckdb/extension/icu/icu-timezone.cpp +3 -3
  12. package/src/duckdb/extension/icu/icu_extension.cpp +61 -9
  13. package/src/duckdb/extension/json/include/json_executors.hpp +20 -23
  14. package/src/duckdb/extension/json/include/json_functions.hpp +4 -0
  15. package/src/duckdb/extension/json/include/json_scan.hpp +6 -2
  16. package/src/duckdb/extension/json/include/json_structure.hpp +12 -9
  17. package/src/duckdb/extension/json/json_common.cpp +66 -10
  18. package/src/duckdb/extension/json/json_extension.cpp +13 -5
  19. package/src/duckdb/extension/json/json_functions/json_array_length.cpp +1 -1
  20. package/src/duckdb/extension/json/json_functions/json_create.cpp +21 -4
  21. package/src/duckdb/extension/json/json_functions/json_exists.cpp +32 -0
  22. package/src/duckdb/extension/json/json_functions/json_extract.cpp +2 -2
  23. package/src/duckdb/extension/json/json_functions/json_keys.cpp +1 -1
  24. package/src/duckdb/extension/json/json_functions/json_pretty.cpp +32 -0
  25. package/src/duckdb/extension/json/json_functions/json_serialize_sql.cpp +5 -1
  26. package/src/duckdb/extension/json/json_functions/json_structure.cpp +305 -94
  27. package/src/duckdb/extension/json/json_functions/json_transform.cpp +1 -1
  28. package/src/duckdb/extension/json/json_functions/json_type.cpp +3 -3
  29. package/src/duckdb/extension/json/json_functions/json_value.cpp +42 -0
  30. package/src/duckdb/extension/json/json_functions/read_json.cpp +16 -2
  31. package/src/duckdb/extension/json/json_functions/read_json_objects.cpp +3 -2
  32. package/src/duckdb/extension/json/json_functions.cpp +5 -1
  33. package/src/duckdb/extension/json/json_scan.cpp +13 -12
  34. package/src/duckdb/extension/json/serialize_json.cpp +5 -3
  35. package/src/duckdb/extension/parquet/column_reader.cpp +206 -43
  36. package/src/duckdb/extension/parquet/column_writer.cpp +133 -62
  37. package/src/duckdb/extension/parquet/geo_parquet.cpp +391 -0
  38. package/src/duckdb/extension/parquet/include/boolean_column_reader.hpp +16 -5
  39. package/src/duckdb/extension/parquet/include/column_reader.hpp +37 -12
  40. package/src/duckdb/extension/parquet/include/column_writer.hpp +10 -11
  41. package/src/duckdb/extension/parquet/include/expression_column_reader.hpp +52 -0
  42. package/src/duckdb/extension/parquet/include/geo_parquet.hpp +139 -0
  43. package/src/duckdb/extension/parquet/include/parquet_crypto.hpp +13 -8
  44. package/src/duckdb/extension/parquet/include/parquet_decimal_utils.hpp +3 -0
  45. package/src/duckdb/extension/parquet/include/parquet_file_metadata_cache.hpp +7 -3
  46. package/src/duckdb/extension/parquet/include/parquet_reader.hpp +55 -8
  47. package/src/duckdb/extension/parquet/include/parquet_rle_bp_decoder.hpp +3 -3
  48. package/src/duckdb/extension/parquet/include/parquet_rle_bp_encoder.hpp +1 -1
  49. package/src/duckdb/extension/parquet/include/parquet_timestamp.hpp +8 -0
  50. package/src/duckdb/extension/parquet/include/parquet_writer.hpp +21 -7
  51. package/src/duckdb/extension/parquet/include/resizable_buffer.hpp +33 -11
  52. package/src/duckdb/extension/parquet/include/string_column_reader.hpp +5 -2
  53. package/src/duckdb/extension/parquet/include/templated_column_reader.hpp +48 -14
  54. package/src/duckdb/extension/parquet/parquet_crypto.cpp +109 -61
  55. package/src/duckdb/extension/parquet/parquet_extension.cpp +305 -72
  56. package/src/duckdb/extension/parquet/parquet_metadata.cpp +4 -4
  57. package/src/duckdb/extension/parquet/parquet_reader.cpp +151 -40
  58. package/src/duckdb/extension/parquet/parquet_statistics.cpp +50 -16
  59. package/src/duckdb/extension/parquet/parquet_timestamp.cpp +42 -1
  60. package/src/duckdb/extension/parquet/parquet_writer.cpp +67 -75
  61. package/src/duckdb/extension/parquet/serialize_parquet.cpp +3 -1
  62. package/src/duckdb/extension/parquet/zstd_file_system.cpp +5 -1
  63. package/src/duckdb/src/catalog/catalog.cpp +14 -16
  64. package/src/duckdb/src/catalog/catalog_entry/duck_index_entry.cpp +14 -11
  65. package/src/duckdb/src/catalog/catalog_entry/duck_schema_entry.cpp +39 -19
  66. package/src/duckdb/src/catalog/catalog_entry/duck_table_entry.cpp +92 -78
  67. package/src/duckdb/src/catalog/catalog_entry/index_catalog_entry.cpp +10 -2
  68. package/src/duckdb/src/catalog/catalog_entry/macro_catalog_entry.cpp +10 -3
  69. package/src/duckdb/src/catalog/catalog_entry/schema_catalog_entry.cpp +3 -3
  70. package/src/duckdb/src/catalog/catalog_entry/table_catalog_entry.cpp +7 -7
  71. package/src/duckdb/src/catalog/catalog_entry.cpp +6 -3
  72. package/src/duckdb/src/catalog/catalog_set.cpp +14 -19
  73. package/src/duckdb/src/catalog/default/default_functions.cpp +179 -166
  74. package/src/duckdb/src/catalog/default/default_generator.cpp +24 -0
  75. package/src/duckdb/src/catalog/default/default_schemas.cpp +4 -3
  76. package/src/duckdb/src/catalog/default/default_table_functions.cpp +148 -0
  77. package/src/duckdb/src/catalog/default/default_views.cpp +7 -3
  78. package/src/duckdb/src/catalog/duck_catalog.cpp +7 -1
  79. package/src/duckdb/src/common/adbc/adbc.cpp +120 -58
  80. package/src/duckdb/src/common/allocator.cpp +71 -6
  81. package/src/duckdb/src/common/arrow/appender/bool_data.cpp +8 -7
  82. package/src/duckdb/src/common/arrow/appender/fixed_size_list_data.cpp +1 -1
  83. package/src/duckdb/src/common/arrow/appender/union_data.cpp +4 -5
  84. package/src/duckdb/src/common/arrow/arrow_appender.cpp +55 -21
  85. package/src/duckdb/src/common/arrow/arrow_converter.cpp +85 -10
  86. package/src/duckdb/src/common/arrow/arrow_merge_event.cpp +142 -0
  87. package/src/duckdb/src/common/arrow/arrow_query_result.cpp +56 -0
  88. package/src/duckdb/src/common/arrow/physical_arrow_batch_collector.cpp +37 -0
  89. package/src/duckdb/src/common/arrow/physical_arrow_collector.cpp +128 -0
  90. package/src/duckdb/src/common/arrow/schema_metadata.cpp +101 -0
  91. package/src/duckdb/src/common/cgroups.cpp +189 -0
  92. package/src/duckdb/src/common/compressed_file_system.cpp +6 -3
  93. package/src/duckdb/src/common/encryption_state.cpp +38 -0
  94. package/src/duckdb/src/common/enum_util.cpp +682 -14
  95. package/src/duckdb/src/common/enums/file_compression_type.cpp +24 -0
  96. package/src/duckdb/src/common/enums/metric_type.cpp +208 -0
  97. package/src/duckdb/src/common/enums/optimizer_type.cpp +8 -2
  98. package/src/duckdb/src/common/enums/physical_operator_type.cpp +2 -0
  99. package/src/duckdb/src/common/enums/relation_type.cpp +4 -0
  100. package/src/duckdb/src/common/enums/statement_type.cpp +15 -0
  101. package/src/duckdb/src/common/error_data.cpp +22 -20
  102. package/src/duckdb/src/common/exception/binder_exception.cpp +5 -0
  103. package/src/duckdb/src/common/exception.cpp +11 -1
  104. package/src/duckdb/src/common/extra_type_info.cpp +3 -0
  105. package/src/duckdb/src/common/file_buffer.cpp +1 -1
  106. package/src/duckdb/src/common/file_system.cpp +25 -3
  107. package/src/duckdb/src/common/filename_pattern.cpp +1 -0
  108. package/src/duckdb/src/common/fsst.cpp +15 -14
  109. package/src/duckdb/src/common/gzip_file_system.cpp +3 -1
  110. package/src/duckdb/src/common/hive_partitioning.cpp +103 -43
  111. package/src/duckdb/src/common/http_util.cpp +25 -0
  112. package/src/duckdb/src/common/local_file_system.cpp +48 -27
  113. package/src/duckdb/src/common/multi_file_list.cpp +113 -22
  114. package/src/duckdb/src/common/multi_file_reader.cpp +59 -58
  115. package/src/duckdb/src/common/operator/cast_operators.cpp +133 -34
  116. package/src/duckdb/src/common/operator/string_cast.cpp +42 -11
  117. package/src/duckdb/src/common/progress_bar/progress_bar.cpp +2 -2
  118. package/src/duckdb/src/common/progress_bar/terminal_progress_bar_display.cpp +1 -1
  119. package/src/duckdb/src/common/radix_partitioning.cpp +31 -21
  120. package/src/duckdb/src/common/random_engine.cpp +4 -0
  121. package/src/duckdb/src/common/re2_regex.cpp +47 -12
  122. package/src/duckdb/src/common/render_tree.cpp +243 -0
  123. package/src/duckdb/src/common/row_operations/row_aggregate.cpp +1 -1
  124. package/src/duckdb/src/common/row_operations/row_gather.cpp +2 -2
  125. package/src/duckdb/src/common/row_operations/row_matcher.cpp +58 -5
  126. package/src/duckdb/src/common/row_operations/row_radix_scatter.cpp +79 -43
  127. package/src/duckdb/src/common/serializer/binary_deserializer.cpp +1 -1
  128. package/src/duckdb/src/common/serializer/buffered_file_reader.cpp +6 -4
  129. package/src/duckdb/src/common/serializer/buffered_file_writer.cpp +18 -9
  130. package/src/duckdb/src/common/serializer/memory_stream.cpp +1 -0
  131. package/src/duckdb/src/common/sort/partition_state.cpp +33 -18
  132. package/src/duckdb/src/common/sort/radix_sort.cpp +22 -15
  133. package/src/duckdb/src/common/sort/sort_state.cpp +19 -16
  134. package/src/duckdb/src/common/sort/sorted_block.cpp +11 -10
  135. package/src/duckdb/src/common/string_util.cpp +167 -10
  136. package/src/duckdb/src/common/tree_renderer/graphviz_tree_renderer.cpp +108 -0
  137. package/src/duckdb/src/common/tree_renderer/html_tree_renderer.cpp +267 -0
  138. package/src/duckdb/src/common/tree_renderer/json_tree_renderer.cpp +116 -0
  139. package/src/duckdb/src/common/tree_renderer/text_tree_renderer.cpp +482 -0
  140. package/src/duckdb/src/common/tree_renderer/tree_renderer.cpp +12 -0
  141. package/src/duckdb/src/common/tree_renderer.cpp +16 -508
  142. package/src/duckdb/src/common/types/batched_data_collection.cpp +78 -9
  143. package/src/duckdb/src/common/types/bit.cpp +24 -22
  144. package/src/duckdb/src/common/types/blob.cpp +15 -11
  145. package/src/duckdb/src/common/types/column/column_data_allocator.cpp +18 -9
  146. package/src/duckdb/src/common/types/column/column_data_collection.cpp +4 -4
  147. package/src/duckdb/src/common/types/column/column_data_collection_segment.cpp +3 -4
  148. package/src/duckdb/src/common/types/column/column_data_consumer.cpp +2 -2
  149. package/src/duckdb/src/common/types/column/partitioned_column_data.cpp +70 -21
  150. package/src/duckdb/src/common/types/data_chunk.cpp +10 -1
  151. package/src/duckdb/src/common/types/date.cpp +8 -19
  152. package/src/duckdb/src/common/types/decimal.cpp +3 -2
  153. package/src/duckdb/src/common/types/hugeint.cpp +11 -3
  154. package/src/duckdb/src/common/types/hyperloglog.cpp +212 -227
  155. package/src/duckdb/src/common/types/interval.cpp +1 -1
  156. package/src/duckdb/src/common/types/list_segment.cpp +83 -49
  157. package/src/duckdb/src/common/types/row/partitioned_tuple_data.cpp +22 -83
  158. package/src/duckdb/src/common/types/row/row_data_collection.cpp +2 -2
  159. package/src/duckdb/src/common/types/row/row_data_collection_scanner.cpp +20 -4
  160. package/src/duckdb/src/common/types/row/tuple_data_allocator.cpp +28 -7
  161. package/src/duckdb/src/common/types/row/tuple_data_collection.cpp +29 -14
  162. package/src/duckdb/src/common/types/row/tuple_data_scatter_gather.cpp +152 -102
  163. package/src/duckdb/src/common/types/row/tuple_data_segment.cpp +4 -1
  164. package/src/duckdb/src/common/types/selection_vector.cpp +17 -1
  165. package/src/duckdb/src/common/types/time.cpp +62 -31
  166. package/src/duckdb/src/common/types/timestamp.cpp +70 -12
  167. package/src/duckdb/src/common/types/uuid.cpp +1 -1
  168. package/src/duckdb/src/common/types/validity_mask.cpp +40 -5
  169. package/src/duckdb/src/common/types/value.cpp +50 -8
  170. package/src/duckdb/src/common/types/varint.cpp +295 -0
  171. package/src/duckdb/src/common/types/vector.cpp +165 -54
  172. package/src/duckdb/src/common/types/vector_buffer.cpp +5 -4
  173. package/src/duckdb/src/common/types.cpp +106 -26
  174. package/src/duckdb/src/common/vector_operations/vector_copy.cpp +13 -25
  175. package/src/duckdb/src/common/vector_operations/vector_hash.cpp +6 -0
  176. package/src/duckdb/src/common/virtual_file_system.cpp +3 -3
  177. package/src/duckdb/src/core_functions/aggregate/distributive/approx_count.cpp +35 -82
  178. package/src/duckdb/src/core_functions/aggregate/distributive/arg_min_max.cpp +283 -46
  179. package/src/duckdb/src/core_functions/aggregate/distributive/bitagg.cpp +4 -4
  180. package/src/duckdb/src/core_functions/aggregate/distributive/entropy.cpp +3 -2
  181. package/src/duckdb/src/core_functions/aggregate/distributive/minmax.cpp +226 -338
  182. package/src/duckdb/src/core_functions/aggregate/distributive/sum.cpp +2 -0
  183. package/src/duckdb/src/core_functions/aggregate/holistic/approx_top_k.cpp +388 -0
  184. package/src/duckdb/src/core_functions/aggregate/holistic/approximate_quantile.cpp +63 -21
  185. package/src/duckdb/src/core_functions/aggregate/holistic/mad.cpp +330 -0
  186. package/src/duckdb/src/core_functions/aggregate/holistic/mode.cpp +136 -97
  187. package/src/duckdb/src/core_functions/aggregate/holistic/quantile.cpp +601 -1485
  188. package/src/duckdb/src/core_functions/aggregate/nested/binned_histogram.cpp +405 -0
  189. package/src/duckdb/src/core_functions/aggregate/nested/histogram.cpp +136 -165
  190. package/src/duckdb/src/core_functions/function_list.cpp +35 -8
  191. package/src/duckdb/src/core_functions/lambda_functions.cpp +5 -7
  192. package/src/duckdb/src/core_functions/scalar/array/array_functions.cpp +172 -198
  193. package/src/duckdb/src/core_functions/scalar/blob/create_sort_key.cpp +341 -54
  194. package/src/duckdb/src/core_functions/scalar/date/date_diff.cpp +2 -2
  195. package/src/duckdb/src/core_functions/scalar/date/date_part.cpp +89 -29
  196. package/src/duckdb/src/core_functions/scalar/date/date_trunc.cpp +1 -1
  197. package/src/duckdb/src/core_functions/scalar/date/make_date.cpp +2 -2
  198. package/src/duckdb/src/core_functions/scalar/date/strftime.cpp +133 -71
  199. package/src/duckdb/src/core_functions/scalar/date/to_interval.cpp +1 -1
  200. package/src/duckdb/src/core_functions/scalar/enum/enum_functions.cpp +1 -1
  201. package/src/duckdb/src/core_functions/scalar/generic/can_implicitly_cast.cpp +40 -0
  202. package/src/duckdb/src/core_functions/scalar/generic/error.cpp +1 -1
  203. package/src/duckdb/src/core_functions/scalar/generic/least.cpp +161 -58
  204. package/src/duckdb/src/core_functions/scalar/generic/typeof.cpp +13 -0
  205. package/src/duckdb/src/core_functions/scalar/list/array_slice.cpp +1 -1
  206. package/src/duckdb/src/core_functions/scalar/list/list_aggregates.cpp +59 -75
  207. package/src/duckdb/src/core_functions/scalar/list/list_distance.cpp +93 -40
  208. package/src/duckdb/src/core_functions/scalar/list/list_has_any_or_all.cpp +227 -0
  209. package/src/duckdb/src/core_functions/scalar/list/list_reduce.cpp +20 -19
  210. package/src/duckdb/src/core_functions/scalar/list/list_sort.cpp +0 -2
  211. package/src/duckdb/src/core_functions/scalar/list/list_value.cpp +106 -8
  212. package/src/duckdb/src/core_functions/scalar/map/map_contains.cpp +56 -0
  213. package/src/duckdb/src/core_functions/scalar/map/map_extract.cpp +73 -118
  214. package/src/duckdb/src/core_functions/scalar/math/numeric.cpp +98 -2
  215. package/src/duckdb/src/core_functions/scalar/operators/bitwise.cpp +1 -2
  216. package/src/duckdb/src/core_functions/scalar/random/setseed.cpp +1 -1
  217. package/src/duckdb/src/core_functions/scalar/string/bar.cpp +1 -1
  218. package/src/duckdb/src/core_functions/scalar/string/hex.cpp +5 -1
  219. package/src/duckdb/src/core_functions/scalar/string/md5.cpp +10 -37
  220. package/src/duckdb/src/core_functions/scalar/string/printf.cpp +18 -2
  221. package/src/duckdb/src/core_functions/scalar/string/repeat.cpp +45 -0
  222. package/src/duckdb/src/core_functions/scalar/string/reverse.cpp +4 -5
  223. package/src/duckdb/src/core_functions/scalar/string/sha1.cpp +35 -0
  224. package/src/duckdb/src/core_functions/scalar/string/sha256.cpp +5 -2
  225. package/src/duckdb/src/core_functions/scalar/string/url_encode.cpp +49 -0
  226. package/src/duckdb/src/core_functions/scalar/struct/struct_pack.cpp +1 -2
  227. package/src/duckdb/src/core_functions/scalar/union/union_extract.cpp +4 -2
  228. package/src/duckdb/src/execution/adaptive_filter.cpp +30 -11
  229. package/src/duckdb/src/execution/aggregate_hashtable.cpp +13 -18
  230. package/src/duckdb/src/execution/expression_executor/execute_conjunction.cpp +4 -9
  231. package/src/duckdb/src/execution/expression_executor.cpp +1 -1
  232. package/src/duckdb/src/execution/index/art/art.cpp +683 -670
  233. package/src/duckdb/src/execution/index/art/art_key.cpp +121 -38
  234. package/src/duckdb/src/execution/index/art/base_leaf.cpp +168 -0
  235. package/src/duckdb/src/execution/index/art/base_node.cpp +163 -0
  236. package/src/duckdb/src/execution/index/art/iterator.cpp +148 -77
  237. package/src/duckdb/src/execution/index/art/leaf.cpp +159 -263
  238. package/src/duckdb/src/execution/index/art/node.cpp +493 -247
  239. package/src/duckdb/src/execution/index/art/node256.cpp +31 -91
  240. package/src/duckdb/src/execution/index/art/node256_leaf.cpp +71 -0
  241. package/src/duckdb/src/execution/index/art/node48.cpp +75 -143
  242. package/src/duckdb/src/execution/index/art/prefix.cpp +424 -244
  243. package/src/duckdb/src/execution/index/bound_index.cpp +7 -1
  244. package/src/duckdb/src/execution/index/fixed_size_allocator.cpp +22 -18
  245. package/src/duckdb/src/execution/index/fixed_size_buffer.cpp +22 -73
  246. package/src/duckdb/src/execution/join_hashtable.cpp +637 -179
  247. package/src/duckdb/src/execution/operator/aggregate/aggregate_object.cpp +4 -4
  248. package/src/duckdb/src/execution/operator/aggregate/physical_hash_aggregate.cpp +15 -10
  249. package/src/duckdb/src/execution/operator/aggregate/physical_perfecthash_aggregate.cpp +13 -8
  250. package/src/duckdb/src/execution/operator/aggregate/physical_streaming_window.cpp +525 -132
  251. package/src/duckdb/src/execution/operator/aggregate/physical_ungrouped_aggregate.cpp +147 -138
  252. package/src/duckdb/src/execution/operator/aggregate/physical_window.cpp +531 -312
  253. package/src/duckdb/src/execution/operator/csv_scanner/buffer_manager/csv_buffer.cpp +1 -1
  254. package/src/duckdb/src/execution/operator/csv_scanner/buffer_manager/csv_buffer_manager.cpp +4 -3
  255. package/src/duckdb/src/execution/operator/csv_scanner/buffer_manager/csv_file_handle.cpp +9 -2
  256. package/src/duckdb/src/execution/operator/csv_scanner/scanner/base_scanner.cpp +13 -17
  257. package/src/duckdb/src/execution/operator/csv_scanner/scanner/column_count_scanner.cpp +60 -16
  258. package/src/duckdb/src/execution/operator/csv_scanner/scanner/csv_schema.cpp +105 -0
  259. package/src/duckdb/src/execution/operator/csv_scanner/scanner/scanner_boundary.cpp +24 -24
  260. package/src/duckdb/src/execution/operator/csv_scanner/scanner/skip_scanner.cpp +25 -2
  261. package/src/duckdb/src/execution/operator/csv_scanner/scanner/string_value_scanner.cpp +275 -112
  262. package/src/duckdb/src/execution/operator/csv_scanner/sniffer/csv_sniffer.cpp +106 -11
  263. package/src/duckdb/src/execution/operator/csv_scanner/sniffer/dialect_detection.cpp +253 -115
  264. package/src/duckdb/src/execution/operator/csv_scanner/sniffer/header_detection.cpp +93 -52
  265. package/src/duckdb/src/execution/operator/csv_scanner/sniffer/type_detection.cpp +116 -76
  266. package/src/duckdb/src/execution/operator/csv_scanner/sniffer/type_refinement.cpp +29 -14
  267. package/src/duckdb/src/execution/operator/csv_scanner/sniffer/type_replacement.cpp +1 -1
  268. package/src/duckdb/src/execution/operator/csv_scanner/state_machine/csv_state_machine_cache.cpp +70 -26
  269. package/src/duckdb/src/execution/operator/csv_scanner/table_function/csv_file_scanner.cpp +81 -60
  270. package/src/duckdb/src/execution/operator/csv_scanner/table_function/global_csv_state.cpp +88 -50
  271. package/src/duckdb/src/execution/operator/csv_scanner/util/csv_error.cpp +161 -51
  272. package/src/duckdb/src/execution/operator/csv_scanner/util/csv_reader_options.cpp +59 -17
  273. package/src/duckdb/src/execution/operator/filter/physical_filter.cpp +5 -5
  274. package/src/duckdb/src/execution/operator/helper/physical_batch_collector.cpp +0 -21
  275. package/src/duckdb/src/execution/operator/helper/physical_buffered_batch_collector.cpp +109 -0
  276. package/src/duckdb/src/execution/operator/helper/physical_buffered_collector.cpp +5 -13
  277. package/src/duckdb/src/execution/operator/helper/physical_explain_analyze.cpp +1 -1
  278. package/src/duckdb/src/execution/operator/helper/physical_load.cpp +12 -4
  279. package/src/duckdb/src/execution/operator/helper/physical_materialized_collector.cpp +0 -16
  280. package/src/duckdb/src/execution/operator/helper/physical_reservoir_sample.cpp +4 -2
  281. package/src/duckdb/src/execution/operator/helper/physical_reset.cpp +5 -0
  282. package/src/duckdb/src/execution/operator/helper/physical_result_collector.cpp +3 -1
  283. package/src/duckdb/src/execution/operator/helper/physical_set_variable.cpp +39 -0
  284. package/src/duckdb/src/execution/operator/helper/physical_streaming_sample.cpp +4 -2
  285. package/src/duckdb/src/execution/operator/helper/physical_transaction.cpp +16 -5
  286. package/src/duckdb/src/execution/operator/join/outer_join_marker.cpp +1 -1
  287. package/src/duckdb/src/execution/operator/join/perfect_hash_join_executor.cpp +1 -1
  288. package/src/duckdb/src/execution/operator/join/physical_asof_join.cpp +1 -1
  289. package/src/duckdb/src/execution/operator/join/physical_blockwise_nl_join.cpp +5 -4
  290. package/src/duckdb/src/execution/operator/join/physical_comparison_join.cpp +59 -21
  291. package/src/duckdb/src/execution/operator/join/physical_delim_join.cpp +7 -4
  292. package/src/duckdb/src/execution/operator/join/physical_hash_join.cpp +333 -176
  293. package/src/duckdb/src/execution/operator/join/physical_iejoin.cpp +57 -34
  294. package/src/duckdb/src/execution/operator/join/physical_join.cpp +16 -8
  295. package/src/duckdb/src/execution/operator/join/physical_left_delim_join.cpp +10 -4
  296. package/src/duckdb/src/execution/operator/join/physical_nested_loop_join.cpp +2 -5
  297. package/src/duckdb/src/execution/operator/join/physical_piecewise_merge_join.cpp +3 -3
  298. package/src/duckdb/src/execution/operator/join/physical_range_join.cpp +5 -5
  299. package/src/duckdb/src/execution/operator/join/physical_right_delim_join.cpp +7 -2
  300. package/src/duckdb/src/execution/operator/order/physical_order.cpp +17 -12
  301. package/src/duckdb/src/execution/operator/order/physical_top_n.cpp +12 -9
  302. package/src/duckdb/src/execution/operator/persistent/physical_batch_copy_to_file.cpp +35 -17
  303. package/src/duckdb/src/execution/operator/persistent/physical_batch_insert.cpp +17 -11
  304. package/src/duckdb/src/execution/operator/persistent/physical_copy_database.cpp +5 -1
  305. package/src/duckdb/src/execution/operator/persistent/physical_copy_to_file.cpp +156 -47
  306. package/src/duckdb/src/execution/operator/persistent/physical_insert.cpp +10 -2
  307. package/src/duckdb/src/execution/operator/persistent/physical_update.cpp +1 -3
  308. package/src/duckdb/src/execution/operator/projection/physical_pivot.cpp +2 -2
  309. package/src/duckdb/src/execution/operator/projection/physical_projection.cpp +13 -6
  310. package/src/duckdb/src/execution/operator/projection/physical_tableinout_function.cpp +22 -3
  311. package/src/duckdb/src/execution/operator/projection/physical_unnest.cpp +19 -3
  312. package/src/duckdb/src/execution/operator/scan/physical_column_data_scan.cpp +37 -22
  313. package/src/duckdb/src/execution/operator/scan/physical_table_scan.cpp +77 -21
  314. package/src/duckdb/src/execution/operator/schema/physical_attach.cpp +27 -55
  315. package/src/duckdb/src/execution/operator/schema/physical_create_art_index.cpp +41 -44
  316. package/src/duckdb/src/execution/operator/set/physical_cte.cpp +4 -6
  317. package/src/duckdb/src/execution/operator/set/physical_recursive_cte.cpp +4 -6
  318. package/src/duckdb/src/execution/operator/set/physical_union.cpp +18 -4
  319. package/src/duckdb/src/execution/perfect_aggregate_hashtable.cpp +3 -2
  320. package/src/duckdb/src/execution/physical_operator.cpp +45 -4
  321. package/src/duckdb/src/execution/physical_plan/plan_comparison_join.cpp +18 -7
  322. package/src/duckdb/src/execution/physical_plan/plan_copy_to_file.cpp +8 -3
  323. package/src/duckdb/src/execution/physical_plan/plan_delim_join.cpp +13 -6
  324. package/src/duckdb/src/execution/physical_plan/plan_explain.cpp +3 -3
  325. package/src/duckdb/src/execution/physical_plan/plan_get.cpp +111 -19
  326. package/src/duckdb/src/execution/physical_plan/plan_limit.cpp +19 -2
  327. package/src/duckdb/src/execution/physical_plan/plan_set.cpp +9 -0
  328. package/src/duckdb/src/execution/physical_plan/plan_window.cpp +3 -1
  329. package/src/duckdb/src/execution/physical_plan_generator.cpp +3 -3
  330. package/src/duckdb/src/execution/radix_partitioned_hashtable.cpp +49 -49
  331. package/src/duckdb/src/execution/reservoir_sample.cpp +2 -2
  332. package/src/duckdb/src/execution/window_executor.cpp +556 -318
  333. package/src/duckdb/src/execution/window_segment_tree.cpp +1058 -485
  334. package/src/duckdb/src/function/aggregate/distributive/count.cpp +5 -5
  335. package/src/duckdb/src/function/aggregate/distributive/first.cpp +92 -95
  336. package/src/duckdb/src/function/aggregate/sorted_aggregate_function.cpp +10 -9
  337. package/src/duckdb/src/function/aggregate_function.cpp +8 -0
  338. package/src/duckdb/src/function/cast/cast_function_set.cpp +10 -1
  339. package/src/duckdb/src/function/cast/decimal_cast.cpp +10 -1
  340. package/src/duckdb/src/function/cast/default_casts.cpp +2 -0
  341. package/src/duckdb/src/function/cast/numeric_casts.cpp +3 -0
  342. package/src/duckdb/src/function/cast/string_cast.cpp +8 -5
  343. package/src/duckdb/src/function/cast/time_casts.cpp +2 -2
  344. package/src/duckdb/src/function/cast/union_casts.cpp +1 -1
  345. package/src/duckdb/src/function/cast/varint_casts.cpp +283 -0
  346. package/src/duckdb/src/function/cast/vector_cast_helpers.cpp +3 -1
  347. package/src/duckdb/src/function/cast_rules.cpp +104 -15
  348. package/src/duckdb/src/function/compression_config.cpp +35 -33
  349. package/src/duckdb/src/function/copy_function.cpp +27 -0
  350. package/src/duckdb/src/function/function_binder.cpp +39 -11
  351. package/src/duckdb/src/function/macro_function.cpp +75 -32
  352. package/src/duckdb/src/function/pragma/pragma_queries.cpp +10 -0
  353. package/src/duckdb/src/function/scalar/compressed_materialization/compress_string.cpp +1 -0
  354. package/src/duckdb/src/function/scalar/generic/binning.cpp +507 -0
  355. package/src/duckdb/src/function/scalar/generic/getvariable.cpp +58 -0
  356. package/src/duckdb/src/function/scalar/generic_functions.cpp +1 -0
  357. package/src/duckdb/src/function/scalar/list/contains_or_position.cpp +33 -47
  358. package/src/duckdb/src/function/scalar/list/list_extract.cpp +70 -143
  359. package/src/duckdb/src/function/scalar/list/list_resize.cpp +93 -84
  360. package/src/duckdb/src/function/scalar/list/list_zip.cpp +3 -0
  361. package/src/duckdb/src/function/scalar/operators/arithmetic.cpp +24 -11
  362. package/src/duckdb/src/function/scalar/sequence/nextval.cpp +4 -4
  363. package/src/duckdb/src/function/scalar/strftime_format.cpp +196 -57
  364. package/src/duckdb/src/function/scalar/string/caseconvert.cpp +9 -7
  365. package/src/duckdb/src/function/scalar/string/concat.cpp +239 -123
  366. package/src/duckdb/src/function/scalar/string/concat_ws.cpp +149 -0
  367. package/src/duckdb/src/function/scalar/string/contains.cpp +18 -7
  368. package/src/duckdb/src/function/scalar/string/like.cpp +2 -2
  369. package/src/duckdb/src/function/scalar/string/substring.cpp +6 -11
  370. package/src/duckdb/src/function/scalar/string_functions.cpp +1 -0
  371. package/src/duckdb/src/function/scalar/struct/struct_extract.cpp +7 -3
  372. package/src/duckdb/src/function/scalar/system/aggregate_export.cpp +5 -5
  373. package/src/duckdb/src/function/scalar_function.cpp +5 -2
  374. package/src/duckdb/src/function/scalar_macro_function.cpp +2 -2
  375. package/src/duckdb/src/function/table/arrow/arrow_duck_schema.cpp +20 -39
  376. package/src/duckdb/src/function/table/arrow/arrow_type_info.cpp +135 -0
  377. package/src/duckdb/src/function/table/arrow.cpp +194 -52
  378. package/src/duckdb/src/function/table/arrow_conversion.cpp +212 -69
  379. package/src/duckdb/src/function/table/copy_csv.cpp +43 -14
  380. package/src/duckdb/src/function/table/query_function.cpp +80 -0
  381. package/src/duckdb/src/function/table/range.cpp +222 -142
  382. package/src/duckdb/src/function/table/read_csv.cpp +25 -13
  383. package/src/duckdb/src/function/table/sniff_csv.cpp +55 -35
  384. package/src/duckdb/src/function/table/system/duckdb_constraints.cpp +141 -129
  385. package/src/duckdb/src/function/table/system/duckdb_extensions.cpp +25 -14
  386. package/src/duckdb/src/function/table/system/duckdb_functions.cpp +20 -14
  387. package/src/duckdb/src/function/table/system/duckdb_indexes.cpp +15 -1
  388. package/src/duckdb/src/function/table/system/duckdb_variables.cpp +84 -0
  389. package/src/duckdb/src/function/table/system/test_all_types.cpp +1 -0
  390. package/src/duckdb/src/function/table/system/test_vector_types.cpp +33 -3
  391. package/src/duckdb/src/function/table/system_functions.cpp +1 -0
  392. package/src/duckdb/src/function/table/table_scan.cpp +45 -22
  393. package/src/duckdb/src/function/table/unnest.cpp +2 -2
  394. package/src/duckdb/src/function/table/version/pragma_version.cpp +4 -4
  395. package/src/duckdb/src/function/table_function.cpp +5 -4
  396. package/src/duckdb/src/function/table_macro_function.cpp +2 -2
  397. package/src/duckdb/src/include/duckdb/catalog/catalog.hpp +8 -4
  398. package/src/duckdb/src/include/duckdb/catalog/catalog_entry/duck_index_entry.hpp +5 -2
  399. package/src/duckdb/src/include/duckdb/catalog/catalog_entry/duck_schema_entry.hpp +3 -0
  400. package/src/duckdb/src/include/duckdb/catalog/catalog_entry/index_catalog_entry.hpp +2 -2
  401. package/src/duckdb/src/include/duckdb/catalog/catalog_entry/macro_catalog_entry.hpp +3 -4
  402. package/src/duckdb/src/include/duckdb/catalog/catalog_entry/table_catalog_entry.hpp +5 -5
  403. package/src/duckdb/src/include/duckdb/catalog/default/builtin_types/types.hpp +2 -1
  404. package/src/duckdb/src/include/duckdb/catalog/default/default_functions.hpp +4 -5
  405. package/src/duckdb/src/include/duckdb/catalog/default/default_generator.hpp +4 -5
  406. package/src/duckdb/src/include/duckdb/catalog/default/default_schemas.hpp +2 -1
  407. package/src/duckdb/src/include/duckdb/catalog/default/default_table_functions.hpp +47 -0
  408. package/src/duckdb/src/include/duckdb/catalog/duck_catalog.hpp +2 -0
  409. package/src/duckdb/src/include/duckdb/catalog/similar_catalog_entry.hpp +2 -2
  410. package/src/duckdb/src/include/duckdb/common/allocator.hpp +9 -1
  411. package/src/duckdb/src/include/duckdb/common/array_ptr.hpp +120 -0
  412. package/src/duckdb/src/include/duckdb/common/arrow/appender/append_data.hpp +37 -11
  413. package/src/duckdb/src/include/duckdb/common/arrow/appender/enum_data.hpp +9 -8
  414. package/src/duckdb/src/include/duckdb/common/arrow/appender/list.hpp +1 -0
  415. package/src/duckdb/src/include/duckdb/common/arrow/appender/list_data.hpp +6 -4
  416. package/src/duckdb/src/include/duckdb/common/arrow/appender/list_view_data.hpp +92 -0
  417. package/src/duckdb/src/include/duckdb/common/arrow/appender/map_data.hpp +2 -2
  418. package/src/duckdb/src/include/duckdb/common/arrow/appender/scalar_data.hpp +26 -4
  419. package/src/duckdb/src/include/duckdb/common/arrow/appender/varchar_data.hpp +90 -11
  420. package/src/duckdb/src/include/duckdb/common/arrow/arrow_appender.hpp +6 -6
  421. package/src/duckdb/src/include/duckdb/common/arrow/arrow_buffer.hpp +8 -1
  422. package/src/duckdb/src/include/duckdb/common/arrow/arrow_merge_event.hpp +62 -0
  423. package/src/duckdb/src/include/duckdb/common/arrow/arrow_query_result.hpp +52 -0
  424. package/src/duckdb/src/include/duckdb/common/arrow/arrow_types_extension.hpp +42 -0
  425. package/src/duckdb/src/include/duckdb/common/arrow/physical_arrow_batch_collector.hpp +30 -0
  426. package/src/duckdb/src/include/duckdb/common/arrow/physical_arrow_collector.hpp +65 -0
  427. package/src/duckdb/src/include/duckdb/common/arrow/schema_metadata.hpp +43 -0
  428. package/src/duckdb/src/include/duckdb/common/bswap.hpp +18 -16
  429. package/src/duckdb/src/include/duckdb/common/cgroups.hpp +30 -0
  430. package/src/duckdb/src/include/duckdb/common/compressed_file_system.hpp +3 -0
  431. package/src/duckdb/src/include/duckdb/common/dl.hpp +8 -1
  432. package/src/duckdb/src/include/duckdb/common/encryption_state.hpp +48 -0
  433. package/src/duckdb/src/include/duckdb/common/enum_util.hpp +88 -0
  434. package/src/duckdb/src/include/duckdb/common/enums/checkpoint_type.hpp +2 -2
  435. package/src/duckdb/src/include/duckdb/common/enums/copy_overwrite_mode.hpp +6 -1
  436. package/src/duckdb/src/include/duckdb/common/enums/destroy_buffer_upon.hpp +21 -0
  437. package/src/duckdb/src/include/duckdb/common/enums/explain_format.hpp +17 -0
  438. package/src/duckdb/src/include/duckdb/common/enums/file_compression_type.hpp +4 -0
  439. package/src/duckdb/src/include/duckdb/common/enums/join_type.hpp +2 -2
  440. package/src/duckdb/src/include/duckdb/common/enums/metric_type.hpp +88 -0
  441. package/src/duckdb/src/include/duckdb/common/enums/optimizer_type.hpp +6 -1
  442. package/src/duckdb/src/include/duckdb/common/enums/pending_execution_result.hpp +2 -1
  443. package/src/duckdb/src/include/duckdb/common/enums/physical_operator_type.hpp +1 -0
  444. package/src/duckdb/src/include/duckdb/common/enums/profiler_format.hpp +1 -1
  445. package/src/duckdb/src/include/duckdb/common/enums/relation_type.hpp +3 -1
  446. package/src/duckdb/src/include/duckdb/common/enums/set_scope.hpp +2 -1
  447. package/src/duckdb/src/include/duckdb/common/enums/statement_type.hpp +23 -2
  448. package/src/duckdb/src/include/duckdb/common/enums/stream_execution_result.hpp +25 -0
  449. package/src/duckdb/src/include/duckdb/common/enums/tableref_type.hpp +2 -1
  450. package/src/duckdb/src/include/duckdb/common/enums/wal_type.hpp +1 -0
  451. package/src/duckdb/src/include/duckdb/common/error_data.hpp +5 -2
  452. package/src/duckdb/src/include/duckdb/common/exception/binder_exception.hpp +1 -0
  453. package/src/duckdb/src/include/duckdb/common/exception.hpp +20 -2
  454. package/src/duckdb/src/include/duckdb/common/extra_operator_info.hpp +12 -0
  455. package/src/duckdb/src/include/duckdb/common/file_buffer.hpp +2 -0
  456. package/src/duckdb/src/include/duckdb/common/file_open_flags.hpp +16 -0
  457. package/src/duckdb/src/include/duckdb/common/file_opener.hpp +18 -0
  458. package/src/duckdb/src/include/duckdb/common/file_system.hpp +3 -0
  459. package/src/duckdb/src/include/duckdb/common/filename_pattern.hpp +4 -0
  460. package/src/duckdb/src/include/duckdb/common/fixed_size_map.hpp +160 -96
  461. package/src/duckdb/src/include/duckdb/common/fsst.hpp +9 -2
  462. package/src/duckdb/src/include/duckdb/common/helper.hpp +22 -8
  463. package/src/duckdb/src/include/duckdb/common/hive_partitioning.hpp +16 -7
  464. package/src/duckdb/src/include/duckdb/common/http_util.hpp +19 -0
  465. package/src/duckdb/src/include/duckdb/common/insertion_order_preserving_map.hpp +19 -6
  466. package/src/duckdb/src/include/duckdb/common/limits.hpp +9 -2
  467. package/src/duckdb/src/include/duckdb/common/multi_file_list.hpp +38 -6
  468. package/src/duckdb/src/include/duckdb/common/multi_file_reader.hpp +9 -2
  469. package/src/duckdb/src/include/duckdb/common/multi_file_reader_options.hpp +5 -1
  470. package/src/duckdb/src/include/duckdb/common/numeric_utils.hpp +82 -50
  471. package/src/duckdb/src/include/duckdb/common/operator/abs.hpp +11 -0
  472. package/src/duckdb/src/include/duckdb/common/operator/cast_operators.hpp +7 -3
  473. package/src/duckdb/src/include/duckdb/common/operator/decimal_cast_operators.hpp +23 -1
  474. package/src/duckdb/src/include/duckdb/common/operator/double_cast_operator.hpp +2 -1
  475. package/src/duckdb/src/include/duckdb/common/operator/integer_cast_operator.hpp +1 -1
  476. package/src/duckdb/src/include/duckdb/common/operator/numeric_cast.hpp +4 -0
  477. package/src/duckdb/src/include/duckdb/common/operator/string_cast.hpp +2 -0
  478. package/src/duckdb/src/include/duckdb/common/optional_ptr.hpp +10 -5
  479. package/src/duckdb/src/include/duckdb/common/optionally_owned_ptr.hpp +1 -0
  480. package/src/duckdb/src/include/duckdb/common/owning_string_map.hpp +155 -0
  481. package/src/duckdb/src/include/duckdb/common/perfect_map_set.hpp +2 -3
  482. package/src/duckdb/src/include/duckdb/common/platform.hpp +58 -0
  483. package/src/duckdb/src/include/duckdb/common/radix.hpp +172 -27
  484. package/src/duckdb/src/include/duckdb/common/radix_partitioning.hpp +5 -1
  485. package/src/duckdb/src/include/duckdb/common/random_engine.hpp +1 -0
  486. package/src/duckdb/src/include/duckdb/common/re2_regex.hpp +1 -1
  487. package/src/duckdb/src/include/duckdb/common/render_tree.hpp +77 -0
  488. package/src/duckdb/src/include/duckdb/common/row_operations/row_matcher.hpp +12 -0
  489. package/src/duckdb/src/include/duckdb/common/serializer/binary_serializer.hpp +6 -2
  490. package/src/duckdb/src/include/duckdb/common/serializer/buffered_file_writer.hpp +5 -3
  491. package/src/duckdb/src/include/duckdb/common/serializer/deserializer.hpp +15 -7
  492. package/src/duckdb/src/include/duckdb/common/serializer/memory_stream.hpp +3 -1
  493. package/src/duckdb/src/include/duckdb/common/serializer/serialization_data.hpp +245 -0
  494. package/src/duckdb/src/include/duckdb/common/serializer/serializer.hpp +10 -0
  495. package/src/duckdb/src/include/duckdb/common/sort/duckdb_pdqsort.hpp +10 -11
  496. package/src/duckdb/src/include/duckdb/common/sort/partition_state.hpp +12 -6
  497. package/src/duckdb/src/include/duckdb/common/string_util.hpp +37 -7
  498. package/src/duckdb/src/include/duckdb/common/tree_renderer/graphviz_tree_renderer.hpp +44 -0
  499. package/src/duckdb/src/include/duckdb/common/tree_renderer/html_tree_renderer.hpp +44 -0
  500. package/src/duckdb/src/include/duckdb/common/tree_renderer/json_tree_renderer.hpp +44 -0
  501. package/src/duckdb/src/include/duckdb/common/tree_renderer/text_tree_renderer.hpp +119 -0
  502. package/src/duckdb/src/include/duckdb/common/tree_renderer.hpp +9 -123
  503. package/src/duckdb/src/include/duckdb/common/type_visitor.hpp +96 -0
  504. package/src/duckdb/src/include/duckdb/common/typedefs.hpp +11 -1
  505. package/src/duckdb/src/include/duckdb/common/types/arrow_string_view_type.hpp +84 -0
  506. package/src/duckdb/src/include/duckdb/common/types/batched_data_collection.hpp +36 -1
  507. package/src/duckdb/src/include/duckdb/common/types/bit.hpp +1 -1
  508. package/src/duckdb/src/include/duckdb/common/types/cast_helpers.hpp +2 -2
  509. package/src/duckdb/src/include/duckdb/common/types/column/column_data_allocator.hpp +4 -2
  510. package/src/duckdb/src/include/duckdb/common/types/column/partitioned_column_data.hpp +52 -0
  511. package/src/duckdb/src/include/duckdb/common/types/data_chunk.hpp +2 -0
  512. package/src/duckdb/src/include/duckdb/common/types/date.hpp +0 -3
  513. package/src/duckdb/src/include/duckdb/common/types/date_lookup_cache.hpp +65 -0
  514. package/src/duckdb/src/include/duckdb/common/types/datetime.hpp +5 -2
  515. package/src/duckdb/src/include/duckdb/common/types/hyperloglog.hpp +49 -40
  516. package/src/duckdb/src/include/duckdb/common/types/interval.hpp +5 -1
  517. package/src/duckdb/src/include/duckdb/common/types/list_segment.hpp +2 -1
  518. package/src/duckdb/src/include/duckdb/common/types/row/partitioned_tuple_data.hpp +41 -9
  519. package/src/duckdb/src/include/duckdb/common/types/row/row_data_collection.hpp +4 -3
  520. package/src/duckdb/src/include/duckdb/common/types/row/row_data_collection_scanner.hpp +3 -1
  521. package/src/duckdb/src/include/duckdb/common/types/row/tuple_data_allocator.hpp +4 -0
  522. package/src/duckdb/src/include/duckdb/common/types/row/tuple_data_collection.hpp +4 -0
  523. package/src/duckdb/src/include/duckdb/common/types/row/tuple_data_states.hpp +1 -1
  524. package/src/duckdb/src/include/duckdb/common/types/selection_vector.hpp +4 -0
  525. package/src/duckdb/src/include/duckdb/common/types/string_type.hpp +4 -1
  526. package/src/duckdb/src/include/duckdb/common/types/time.hpp +11 -6
  527. package/src/duckdb/src/include/duckdb/common/types/timestamp.hpp +13 -3
  528. package/src/duckdb/src/include/duckdb/common/types/validity_mask.hpp +103 -12
  529. package/src/duckdb/src/include/duckdb/common/types/value.hpp +12 -3
  530. package/src/duckdb/src/include/duckdb/common/types/varint.hpp +107 -0
  531. package/src/duckdb/src/include/duckdb/common/types/vector.hpp +5 -1
  532. package/src/duckdb/src/include/duckdb/common/types/vector_buffer.hpp +7 -2
  533. package/src/duckdb/src/include/duckdb/common/types.hpp +6 -39
  534. package/src/duckdb/src/include/duckdb/common/union_by_name.hpp +42 -10
  535. package/src/duckdb/src/include/duckdb/common/vector_operations/generic_executor.hpp +29 -0
  536. package/src/duckdb/src/include/duckdb/common/vector_operations/unary_executor.hpp +0 -7
  537. package/src/duckdb/src/include/duckdb/common/vector_operations/vector_operations.hpp +2 -0
  538. package/src/duckdb/src/include/duckdb/common/winapi.hpp +8 -0
  539. package/src/duckdb/src/include/duckdb/core_functions/aggregate/algebraic/covar.hpp +8 -4
  540. package/src/duckdb/src/include/duckdb/core_functions/aggregate/algebraic/stddev.hpp +8 -4
  541. package/src/duckdb/src/include/duckdb/core_functions/aggregate/distributive_functions.hpp +4 -2
  542. package/src/duckdb/src/include/duckdb/core_functions/aggregate/histogram_helpers.hpp +99 -0
  543. package/src/duckdb/src/include/duckdb/core_functions/aggregate/holistic_functions.hpp +16 -7
  544. package/src/duckdb/src/include/duckdb/core_functions/aggregate/minmax_n_helpers.hpp +396 -0
  545. package/src/duckdb/src/include/duckdb/core_functions/aggregate/nested_functions.hpp +10 -0
  546. package/src/duckdb/src/include/duckdb/core_functions/aggregate/quantile_helpers.hpp +65 -0
  547. package/src/duckdb/src/include/duckdb/core_functions/aggregate/quantile_sort_tree.hpp +349 -0
  548. package/src/duckdb/src/include/duckdb/core_functions/aggregate/quantile_state.hpp +300 -0
  549. package/src/duckdb/src/include/duckdb/core_functions/aggregate/regression/regr_slope.hpp +1 -1
  550. package/src/duckdb/src/include/duckdb/core_functions/aggregate/sort_key_helpers.hpp +55 -0
  551. package/src/duckdb/src/include/duckdb/core_functions/array_kernels.hpp +107 -0
  552. package/src/duckdb/src/include/duckdb/core_functions/create_sort_key.hpp +55 -0
  553. package/src/duckdb/src/include/duckdb/core_functions/lambda_functions.hpp +1 -2
  554. package/src/duckdb/src/include/duckdb/core_functions/scalar/array_functions.hpp +24 -0
  555. package/src/duckdb/src/include/duckdb/core_functions/scalar/date_functions.hpp +9 -0
  556. package/src/duckdb/src/include/duckdb/core_functions/scalar/generic_functions.hpp +27 -0
  557. package/src/duckdb/src/include/duckdb/core_functions/scalar/list_functions.hpp +80 -8
  558. package/src/duckdb/src/include/duckdb/core_functions/scalar/map_functions.hpp +9 -0
  559. package/src/duckdb/src/include/duckdb/core_functions/scalar/math_functions.hpp +54 -0
  560. package/src/duckdb/src/include/duckdb/core_functions/scalar/string_functions.hpp +30 -21
  561. package/src/duckdb/src/include/duckdb/execution/adaptive_filter.hpp +25 -14
  562. package/src/duckdb/src/include/duckdb/execution/aggregate_hashtable.hpp +2 -48
  563. package/src/duckdb/src/include/duckdb/execution/executor.hpp +25 -2
  564. package/src/duckdb/src/include/duckdb/execution/ht_entry.hpp +102 -0
  565. package/src/duckdb/src/include/duckdb/execution/index/art/art.hpp +94 -101
  566. package/src/duckdb/src/include/duckdb/execution/index/art/art_key.hpp +43 -25
  567. package/src/duckdb/src/include/duckdb/execution/index/art/base_leaf.hpp +109 -0
  568. package/src/duckdb/src/include/duckdb/execution/index/art/base_node.hpp +140 -0
  569. package/src/duckdb/src/include/duckdb/execution/index/art/iterator.hpp +43 -24
  570. package/src/duckdb/src/include/duckdb/execution/index/art/leaf.hpp +41 -52
  571. package/src/duckdb/src/include/duckdb/execution/index/art/node.hpp +133 -74
  572. package/src/duckdb/src/include/duckdb/execution/index/art/node256.hpp +46 -29
  573. package/src/duckdb/src/include/duckdb/execution/index/art/node256_leaf.hpp +53 -0
  574. package/src/duckdb/src/include/duckdb/execution/index/art/node48.hpp +52 -35
  575. package/src/duckdb/src/include/duckdb/execution/index/art/prefix.hpp +96 -57
  576. package/src/duckdb/src/include/duckdb/execution/index/bound_index.hpp +9 -4
  577. package/src/duckdb/src/include/duckdb/execution/index/fixed_size_allocator.hpp +48 -10
  578. package/src/duckdb/src/include/duckdb/execution/index/fixed_size_buffer.hpp +0 -2
  579. package/src/duckdb/src/include/duckdb/execution/index/index_pointer.hpp +4 -2
  580. package/src/duckdb/src/include/duckdb/execution/join_hashtable.hpp +114 -36
  581. package/src/duckdb/src/include/duckdb/execution/merge_sort_tree.hpp +158 -67
  582. package/src/duckdb/src/include/duckdb/execution/operator/aggregate/aggregate_object.hpp +1 -1
  583. package/src/duckdb/src/include/duckdb/execution/operator/aggregate/physical_hash_aggregate.hpp +1 -1
  584. package/src/duckdb/src/include/duckdb/execution/operator/aggregate/physical_perfecthash_aggregate.hpp +1 -1
  585. package/src/duckdb/src/include/duckdb/execution/operator/aggregate/physical_streaming_window.hpp +19 -2
  586. package/src/duckdb/src/include/duckdb/execution/operator/aggregate/physical_ungrouped_aggregate.hpp +1 -1
  587. package/src/duckdb/src/include/duckdb/execution/operator/aggregate/physical_window.hpp +1 -1
  588. package/src/duckdb/src/include/duckdb/execution/operator/aggregate/ungrouped_aggregate_state.hpp +75 -0
  589. package/src/duckdb/src/include/duckdb/execution/operator/csv_scanner/base_scanner.hpp +81 -23
  590. package/src/duckdb/src/include/duckdb/execution/operator/csv_scanner/column_count_scanner.hpp +27 -8
  591. package/src/duckdb/src/include/duckdb/execution/operator/csv_scanner/csv_buffer_manager.hpp +2 -1
  592. package/src/duckdb/src/include/duckdb/execution/operator/csv_scanner/csv_error.hpp +31 -22
  593. package/src/duckdb/src/include/duckdb/execution/operator/csv_scanner/csv_file_handle.hpp +4 -2
  594. package/src/duckdb/src/include/duckdb/execution/operator/csv_scanner/csv_file_scanner.hpp +48 -5
  595. package/src/duckdb/src/include/duckdb/execution/operator/csv_scanner/csv_option.hpp +7 -3
  596. package/src/duckdb/src/include/duckdb/execution/operator/csv_scanner/csv_reader_options.hpp +22 -12
  597. package/src/duckdb/src/include/duckdb/execution/operator/csv_scanner/csv_schema.hpp +35 -0
  598. package/src/duckdb/src/include/duckdb/execution/operator/csv_scanner/csv_sniffer.hpp +81 -39
  599. package/src/duckdb/src/include/duckdb/execution/operator/csv_scanner/csv_state.hpp +2 -1
  600. package/src/duckdb/src/include/duckdb/execution/operator/csv_scanner/csv_state_machine.hpp +18 -1
  601. package/src/duckdb/src/include/duckdb/execution/operator/csv_scanner/csv_state_machine_cache.hpp +9 -7
  602. package/src/duckdb/src/include/duckdb/execution/operator/csv_scanner/global_csv_state.hpp +5 -4
  603. package/src/duckdb/src/include/duckdb/execution/operator/csv_scanner/header_value.hpp +26 -0
  604. package/src/duckdb/src/include/duckdb/execution/operator/csv_scanner/scanner_boundary.hpp +6 -9
  605. package/src/duckdb/src/include/duckdb/execution/operator/csv_scanner/skip_scanner.hpp +3 -0
  606. package/src/duckdb/src/include/duckdb/execution/operator/csv_scanner/state_machine_options.hpp +5 -3
  607. package/src/duckdb/src/include/duckdb/execution/operator/csv_scanner/string_value_scanner.hpp +36 -19
  608. package/src/duckdb/src/include/duckdb/execution/operator/filter/physical_filter.hpp +1 -1
  609. package/src/duckdb/src/include/duckdb/execution/operator/helper/physical_batch_collector.hpp +21 -0
  610. package/src/duckdb/src/include/duckdb/execution/operator/helper/physical_buffered_batch_collector.hpp +53 -0
  611. package/src/duckdb/src/include/duckdb/execution/operator/helper/physical_buffered_collector.hpp +3 -0
  612. package/src/duckdb/src/include/duckdb/execution/operator/helper/physical_explain_analyze.hpp +6 -2
  613. package/src/duckdb/src/include/duckdb/execution/operator/helper/physical_materialized_collector.hpp +18 -0
  614. package/src/duckdb/src/include/duckdb/execution/operator/helper/physical_reservoir_sample.hpp +1 -1
  615. package/src/duckdb/src/include/duckdb/execution/operator/helper/physical_result_collector.hpp +6 -0
  616. package/src/duckdb/src/include/duckdb/execution/operator/helper/physical_set.hpp +2 -2
  617. package/src/duckdb/src/include/duckdb/execution/operator/helper/physical_set_variable.hpp +43 -0
  618. package/src/duckdb/src/include/duckdb/execution/operator/helper/physical_streaming_sample.hpp +1 -1
  619. package/src/duckdb/src/include/duckdb/execution/operator/join/join_filter_pushdown.hpp +59 -0
  620. package/src/duckdb/src/include/duckdb/execution/operator/join/physical_blockwise_nl_join.hpp +1 -1
  621. package/src/duckdb/src/include/duckdb/execution/operator/join/physical_comparison_join.hpp +8 -1
  622. package/src/duckdb/src/include/duckdb/execution/operator/join/physical_delim_join.hpp +5 -2
  623. package/src/duckdb/src/include/duckdb/execution/operator/join/physical_hash_join.hpp +4 -2
  624. package/src/duckdb/src/include/duckdb/execution/operator/join/physical_iejoin.hpp +2 -0
  625. package/src/duckdb/src/include/duckdb/execution/operator/join/physical_join.hpp +1 -1
  626. package/src/duckdb/src/include/duckdb/execution/operator/join/physical_left_delim_join.hpp +3 -1
  627. package/src/duckdb/src/include/duckdb/execution/operator/join/physical_range_join.hpp +4 -1
  628. package/src/duckdb/src/include/duckdb/execution/operator/join/physical_right_delim_join.hpp +3 -1
  629. package/src/duckdb/src/include/duckdb/execution/operator/order/physical_order.hpp +1 -1
  630. package/src/duckdb/src/include/duckdb/execution/operator/order/physical_top_n.hpp +1 -1
  631. package/src/duckdb/src/include/duckdb/execution/operator/persistent/batch_memory_manager.hpp +5 -37
  632. package/src/duckdb/src/include/duckdb/execution/operator/persistent/physical_batch_copy_to_file.hpp +5 -4
  633. package/src/duckdb/src/include/duckdb/execution/operator/persistent/physical_copy_to_file.hpp +8 -2
  634. package/src/duckdb/src/include/duckdb/execution/operator/projection/physical_projection.hpp +1 -1
  635. package/src/duckdb/src/include/duckdb/execution/operator/projection/physical_tableinout_function.hpp +2 -0
  636. package/src/duckdb/src/include/duckdb/execution/operator/scan/physical_column_data_scan.hpp +9 -3
  637. package/src/duckdb/src/include/duckdb/execution/operator/scan/physical_table_scan.hpp +8 -6
  638. package/src/duckdb/src/include/duckdb/execution/operator/schema/physical_create_art_index.hpp +2 -2
  639. package/src/duckdb/src/include/duckdb/execution/operator/set/physical_cte.hpp +1 -1
  640. package/src/duckdb/src/include/duckdb/execution/operator/set/physical_recursive_cte.hpp +1 -1
  641. package/src/duckdb/src/include/duckdb/execution/physical_operator.hpp +21 -6
  642. package/src/duckdb/src/include/duckdb/execution/physical_operator_states.hpp +3 -2
  643. package/src/duckdb/src/include/duckdb/execution/physical_plan_generator.hpp +3 -0
  644. package/src/duckdb/src/include/duckdb/execution/window_executor.hpp +137 -110
  645. package/src/duckdb/src/include/duckdb/execution/window_segment_tree.hpp +57 -126
  646. package/src/duckdb/src/include/duckdb/function/aggregate_function.hpp +21 -4
  647. package/src/duckdb/src/include/duckdb/function/cast/default_casts.hpp +1 -1
  648. package/src/duckdb/src/include/duckdb/function/compression/compression.hpp +10 -10
  649. package/src/duckdb/src/include/duckdb/function/compression_function.hpp +37 -7
  650. package/src/duckdb/src/include/duckdb/function/copy_function.hpp +24 -11
  651. package/src/duckdb/src/include/duckdb/function/function_binder.hpp +4 -4
  652. package/src/duckdb/src/include/duckdb/function/function_serialization.hpp +41 -1
  653. package/src/duckdb/src/include/duckdb/function/macro_function.hpp +15 -5
  654. package/src/duckdb/src/include/duckdb/function/pragma/pragma_functions.hpp +1 -0
  655. package/src/duckdb/src/include/duckdb/function/replacement_scan.hpp +20 -4
  656. package/src/duckdb/src/include/duckdb/function/scalar/generic_functions.hpp +6 -0
  657. package/src/duckdb/src/include/duckdb/function/scalar/list/contains_or_position.hpp +77 -109
  658. package/src/duckdb/src/include/duckdb/function/scalar/nested_functions.hpp +1 -1
  659. package/src/duckdb/src/include/duckdb/function/scalar/regexp.hpp +6 -3
  660. package/src/duckdb/src/include/duckdb/function/scalar/strftime_format.hpp +25 -12
  661. package/src/duckdb/src/include/duckdb/function/scalar/string_functions.hpp +9 -8
  662. package/src/duckdb/src/include/duckdb/function/scalar_function.hpp +38 -4
  663. package/src/duckdb/src/include/duckdb/function/scalar_macro_function.hpp +1 -1
  664. package/src/duckdb/src/include/duckdb/function/table/arrow/arrow_duck_schema.hpp +11 -57
  665. package/src/duckdb/src/include/duckdb/function/table/arrow/arrow_type_info.hpp +142 -0
  666. package/src/duckdb/src/include/duckdb/function/table/arrow/enum/arrow_datetime_type.hpp +18 -0
  667. package/src/duckdb/src/include/duckdb/function/table/arrow/enum/arrow_type_info_type.hpp +7 -0
  668. package/src/duckdb/src/include/duckdb/function/table/arrow/enum/arrow_variable_size_type.hpp +10 -0
  669. package/src/duckdb/src/include/duckdb/function/table/arrow.hpp +2 -0
  670. package/src/duckdb/src/include/duckdb/function/table/range.hpp +4 -0
  671. package/src/duckdb/src/include/duckdb/function/table/read_csv.hpp +4 -1
  672. package/src/duckdb/src/include/duckdb/function/table/system_functions.hpp +4 -0
  673. package/src/duckdb/src/include/duckdb/function/table/table_scan.hpp +5 -5
  674. package/src/duckdb/src/include/duckdb/function/table_function.hpp +14 -2
  675. package/src/duckdb/src/include/duckdb/function/table_macro_function.hpp +1 -1
  676. package/src/duckdb/src/include/duckdb/main/appender.hpp +14 -4
  677. package/src/duckdb/src/include/duckdb/main/attached_database.hpp +25 -7
  678. package/src/duckdb/src/include/duckdb/main/buffered_data/batched_buffered_data.hpp +79 -0
  679. package/src/duckdb/src/include/duckdb/main/buffered_data/buffered_data.hpp +10 -20
  680. package/src/duckdb/src/include/duckdb/main/buffered_data/simple_buffered_data.hpp +11 -12
  681. package/src/duckdb/src/include/duckdb/main/capi/capi_internal.hpp +7 -2
  682. package/src/duckdb/src/include/duckdb/main/capi/cast/generic.hpp +1 -1
  683. package/src/duckdb/src/include/duckdb/main/capi/cast/utils.hpp +2 -2
  684. package/src/duckdb/src/include/duckdb/main/capi/extension_api.hpp +809 -0
  685. package/src/duckdb/src/include/duckdb/main/chunk_scan_state/batched_data_collection.hpp +35 -0
  686. package/src/duckdb/src/include/duckdb/main/client_config.hpp +68 -2
  687. package/src/duckdb/src/include/duckdb/main/client_context.hpp +30 -22
  688. package/src/duckdb/src/include/duckdb/main/client_context_state.hpp +79 -1
  689. package/src/duckdb/src/include/duckdb/main/client_properties.hpp +9 -3
  690. package/src/duckdb/src/include/duckdb/main/config.hpp +55 -7
  691. package/src/duckdb/src/include/duckdb/main/connection.hpp +5 -1
  692. package/src/duckdb/src/include/duckdb/main/database.hpp +16 -5
  693. package/src/duckdb/src/include/duckdb/main/database_manager.hpp +9 -8
  694. package/src/duckdb/src/include/duckdb/main/db_instance_cache.hpp +21 -6
  695. package/src/duckdb/src/include/duckdb/main/extension.hpp +20 -0
  696. package/src/duckdb/src/include/duckdb/main/extension_entries.hpp +25 -0
  697. package/src/duckdb/src/include/duckdb/main/extension_helper.hpp +29 -23
  698. package/src/duckdb/src/include/duckdb/main/extension_install_info.hpp +6 -0
  699. package/src/duckdb/src/include/duckdb/main/extension_util.hpp +3 -0
  700. package/src/duckdb/src/include/duckdb/main/pending_query_result.hpp +4 -2
  701. package/src/duckdb/src/include/duckdb/main/prepared_statement.hpp +5 -6
  702. package/src/duckdb/src/include/duckdb/main/prepared_statement_data.hpp +2 -5
  703. package/src/duckdb/src/include/duckdb/main/profiling_info.hpp +87 -0
  704. package/src/duckdb/src/include/duckdb/main/profiling_node.hpp +60 -0
  705. package/src/duckdb/src/include/duckdb/main/query_profiler.hpp +72 -34
  706. package/src/duckdb/src/include/duckdb/main/query_result.hpp +1 -1
  707. package/src/duckdb/src/include/duckdb/main/relation/create_table_relation.hpp +2 -1
  708. package/src/duckdb/src/include/duckdb/main/relation/delim_get_relation.hpp +30 -0
  709. package/src/duckdb/src/include/duckdb/main/relation/explain_relation.hpp +3 -1
  710. package/src/duckdb/src/include/duckdb/main/relation/join_relation.hpp +3 -0
  711. package/src/duckdb/src/include/duckdb/main/relation/materialized_relation.hpp +1 -4
  712. package/src/duckdb/src/include/duckdb/main/relation/query_relation.hpp +4 -1
  713. package/src/duckdb/src/include/duckdb/main/relation/read_json_relation.hpp +6 -0
  714. package/src/duckdb/src/include/duckdb/main/relation/table_function_relation.hpp +1 -0
  715. package/src/duckdb/src/include/duckdb/main/relation/view_relation.hpp +2 -0
  716. package/src/duckdb/src/include/duckdb/main/relation.hpp +7 -4
  717. package/src/duckdb/src/include/duckdb/main/secret/default_secrets.hpp +36 -0
  718. package/src/duckdb/src/include/duckdb/main/secret/secret.hpp +108 -0
  719. package/src/duckdb/src/include/duckdb/main/secret/secret_manager.hpp +14 -4
  720. package/src/duckdb/src/include/duckdb/main/settings.hpp +227 -3
  721. package/src/duckdb/src/include/duckdb/main/stream_query_result.hpp +8 -0
  722. package/src/duckdb/src/include/duckdb/optimizer/build_probe_side_optimizer.hpp +51 -0
  723. package/src/duckdb/src/include/duckdb/optimizer/compressed_materialization.hpp +7 -0
  724. package/src/duckdb/src/include/duckdb/optimizer/cte_filter_pusher.hpp +46 -0
  725. package/src/duckdb/src/include/duckdb/optimizer/filter_combiner.hpp +1 -1
  726. package/src/duckdb/src/include/duckdb/optimizer/filter_pushdown.hpp +7 -0
  727. package/src/duckdb/src/include/duckdb/optimizer/join_filter_pushdown_optimizer.hpp +31 -0
  728. package/src/duckdb/src/include/duckdb/optimizer/join_order/cardinality_estimator.hpp +51 -10
  729. package/src/duckdb/src/include/duckdb/optimizer/join_order/cost_model.hpp +1 -0
  730. package/src/duckdb/src/include/duckdb/optimizer/join_order/join_order_optimizer.hpp +17 -5
  731. package/src/duckdb/src/include/duckdb/optimizer/join_order/query_graph.hpp +1 -1
  732. package/src/duckdb/src/include/duckdb/optimizer/join_order/query_graph_manager.hpp +15 -13
  733. package/src/duckdb/src/include/duckdb/optimizer/join_order/relation_manager.hpp +9 -4
  734. package/src/duckdb/src/include/duckdb/optimizer/limit_pushdown.hpp +25 -0
  735. package/src/duckdb/src/include/duckdb/optimizer/optimizer.hpp +1 -0
  736. package/src/duckdb/src/include/duckdb/optimizer/rule/join_dependent_filter.hpp +37 -0
  737. package/src/duckdb/src/include/duckdb/parallel/executor_task.hpp +6 -1
  738. package/src/duckdb/src/include/duckdb/parallel/interrupt.hpp +54 -2
  739. package/src/duckdb/src/include/duckdb/parallel/meta_pipeline.hpp +27 -8
  740. package/src/duckdb/src/include/duckdb/parallel/pipeline.hpp +1 -0
  741. package/src/duckdb/src/include/duckdb/parallel/pipeline_prepare_finish_event.hpp +25 -0
  742. package/src/duckdb/src/include/duckdb/parallel/task_executor.hpp +63 -0
  743. package/src/duckdb/src/include/duckdb/parallel/task_scheduler.hpp +10 -1
  744. package/src/duckdb/src/include/duckdb/parser/expression/function_expression.hpp +4 -1
  745. package/src/duckdb/src/include/duckdb/parser/expression/star_expression.hpp +5 -0
  746. package/src/duckdb/src/include/duckdb/parser/parsed_data/alter_table_info.hpp +5 -0
  747. package/src/duckdb/src/include/duckdb/parser/parsed_data/attach_info.hpp +5 -0
  748. package/src/duckdb/src/include/duckdb/parser/parsed_data/create_index_info.hpp +2 -0
  749. package/src/duckdb/src/include/duckdb/parser/parsed_data/create_macro_info.hpp +11 -1
  750. package/src/duckdb/src/include/duckdb/parser/parsed_data/transaction_info.hpp +9 -0
  751. package/src/duckdb/src/include/duckdb/parser/parsed_expression_iterator.hpp +13 -6
  752. package/src/duckdb/src/include/duckdb/parser/parser_extension.hpp +1 -1
  753. package/src/duckdb/src/include/duckdb/parser/sql_statement.hpp +1 -3
  754. package/src/duckdb/src/include/duckdb/parser/statement/copy_statement.hpp +2 -0
  755. package/src/duckdb/src/include/duckdb/parser/statement/explain_statement.hpp +5 -1
  756. package/src/duckdb/src/include/duckdb/parser/statement/set_statement.hpp +2 -2
  757. package/src/duckdb/src/include/duckdb/parser/statement/transaction_statement.hpp +1 -1
  758. package/src/duckdb/src/include/duckdb/parser/tableref/basetableref.hpp +0 -2
  759. package/src/duckdb/src/include/duckdb/parser/tableref/column_data_ref.hpp +9 -7
  760. package/src/duckdb/src/include/duckdb/parser/tableref/delimgetref.hpp +37 -0
  761. package/src/duckdb/src/include/duckdb/parser/tableref/joinref.hpp +4 -0
  762. package/src/duckdb/src/include/duckdb/parser/tableref/pivotref.hpp +0 -2
  763. package/src/duckdb/src/include/duckdb/parser/tableref/subqueryref.hpp +0 -2
  764. package/src/duckdb/src/include/duckdb/parser/tableref/table_function_ref.hpp +0 -1
  765. package/src/duckdb/src/include/duckdb/parser/tableref.hpp +3 -1
  766. package/src/duckdb/src/include/duckdb/parser/transformer.hpp +17 -9
  767. package/src/duckdb/src/include/duckdb/planner/binder.hpp +24 -14
  768. package/src/duckdb/src/include/duckdb/planner/collation_binding.hpp +44 -0
  769. package/src/duckdb/src/include/duckdb/planner/expression/bound_aggregate_expression.hpp +1 -1
  770. package/src/duckdb/src/include/duckdb/planner/expression/bound_between_expression.hpp +1 -1
  771. package/src/duckdb/src/include/duckdb/planner/expression/bound_case_expression.hpp +1 -1
  772. package/src/duckdb/src/include/duckdb/planner/expression/bound_cast_expression.hpp +1 -1
  773. package/src/duckdb/src/include/duckdb/planner/expression/bound_columnref_expression.hpp +1 -1
  774. package/src/duckdb/src/include/duckdb/planner/expression/bound_comparison_expression.hpp +1 -1
  775. package/src/duckdb/src/include/duckdb/planner/expression/bound_conjunction_expression.hpp +1 -1
  776. package/src/duckdb/src/include/duckdb/planner/expression/bound_constant_expression.hpp +1 -1
  777. package/src/duckdb/src/include/duckdb/planner/expression/bound_default_expression.hpp +1 -1
  778. package/src/duckdb/src/include/duckdb/planner/expression/bound_expanded_expression.hpp +1 -1
  779. package/src/duckdb/src/include/duckdb/planner/expression/bound_function_expression.hpp +1 -1
  780. package/src/duckdb/src/include/duckdb/planner/expression/bound_lambda_expression.hpp +1 -1
  781. package/src/duckdb/src/include/duckdb/planner/expression/bound_lambdaref_expression.hpp +1 -1
  782. package/src/duckdb/src/include/duckdb/planner/expression/bound_operator_expression.hpp +1 -1
  783. package/src/duckdb/src/include/duckdb/planner/expression/bound_parameter_data.hpp +2 -0
  784. package/src/duckdb/src/include/duckdb/planner/expression/bound_parameter_expression.hpp +1 -1
  785. package/src/duckdb/src/include/duckdb/planner/expression/bound_reference_expression.hpp +1 -1
  786. package/src/duckdb/src/include/duckdb/planner/expression/bound_subquery_expression.hpp +2 -2
  787. package/src/duckdb/src/include/duckdb/planner/expression/bound_unnest_expression.hpp +1 -1
  788. package/src/duckdb/src/include/duckdb/planner/expression/bound_window_expression.hpp +1 -1
  789. package/src/duckdb/src/include/duckdb/planner/expression.hpp +2 -2
  790. package/src/duckdb/src/include/duckdb/planner/expression_binder/column_alias_binder.hpp +2 -0
  791. package/src/duckdb/src/include/duckdb/planner/expression_binder/group_binder.hpp +1 -0
  792. package/src/duckdb/src/include/duckdb/planner/expression_binder/order_binder.hpp +6 -5
  793. package/src/duckdb/src/include/duckdb/planner/expression_binder/where_binder.hpp +1 -0
  794. package/src/duckdb/src/include/duckdb/planner/expression_binder.hpp +19 -11
  795. package/src/duckdb/src/include/duckdb/planner/filter/conjunction_filter.hpp +4 -0
  796. package/src/duckdb/src/include/duckdb/planner/filter/constant_filter.hpp +2 -0
  797. package/src/duckdb/src/include/duckdb/planner/filter/null_filter.hpp +4 -0
  798. package/src/duckdb/src/include/duckdb/planner/filter/struct_filter.hpp +2 -0
  799. package/src/duckdb/src/include/duckdb/planner/logical_operator.hpp +7 -2
  800. package/src/duckdb/src/include/duckdb/planner/logical_operator_visitor.hpp +2 -1
  801. package/src/duckdb/src/include/duckdb/planner/operator/logical_aggregate.hpp +1 -1
  802. package/src/duckdb/src/include/duckdb/planner/operator/logical_any_join.hpp +1 -1
  803. package/src/duckdb/src/include/duckdb/planner/operator/logical_comparison_join.hpp +6 -1
  804. package/src/duckdb/src/include/duckdb/planner/operator/logical_copy_to_file.hpp +10 -2
  805. package/src/duckdb/src/include/duckdb/planner/operator/logical_cteref.hpp +1 -0
  806. package/src/duckdb/src/include/duckdb/planner/operator/logical_delim_get.hpp +1 -1
  807. package/src/duckdb/src/include/duckdb/planner/operator/logical_distinct.hpp +1 -1
  808. package/src/duckdb/src/include/duckdb/planner/operator/logical_execute.hpp +1 -1
  809. package/src/duckdb/src/include/duckdb/planner/operator/logical_explain.hpp +4 -2
  810. package/src/duckdb/src/include/duckdb/planner/operator/logical_get.hpp +15 -5
  811. package/src/duckdb/src/include/duckdb/planner/operator/logical_materialized_cte.hpp +1 -0
  812. package/src/duckdb/src/include/duckdb/planner/operator/logical_order.hpp +1 -1
  813. package/src/duckdb/src/include/duckdb/planner/subquery/flatten_dependent_join.hpp +2 -1
  814. package/src/duckdb/src/include/duckdb/planner/table_filter.hpp +24 -2
  815. package/src/duckdb/src/include/duckdb/planner/tableref/bound_delimgetref.hpp +26 -0
  816. package/src/duckdb/src/include/duckdb/planner/tableref/bound_joinref.hpp +6 -0
  817. package/src/duckdb/src/include/duckdb/planner/tableref/bound_subqueryref.hpp +1 -1
  818. package/src/duckdb/src/include/duckdb/planner/tableref/bound_table_function.hpp +2 -0
  819. package/src/duckdb/src/include/duckdb/planner/tableref/list.hpp +2 -0
  820. package/src/duckdb/src/include/duckdb/storage/arena_allocator.hpp +2 -1
  821. package/src/duckdb/src/include/duckdb/storage/block.hpp +4 -2
  822. package/src/duckdb/src/include/duckdb/storage/block_manager.hpp +48 -3
  823. package/src/duckdb/src/include/duckdb/storage/buffer/block_handle.hpp +21 -7
  824. package/src/duckdb/src/include/duckdb/storage/buffer/buffer_pool.hpp +65 -51
  825. package/src/duckdb/src/include/duckdb/storage/buffer_manager.hpp +14 -5
  826. package/src/duckdb/src/include/duckdb/storage/checkpoint/row_group_writer.hpp +0 -4
  827. package/src/duckdb/src/include/duckdb/storage/checkpoint/string_checkpoint_state.hpp +3 -2
  828. package/src/duckdb/src/include/duckdb/storage/checkpoint/table_data_writer.hpp +1 -0
  829. package/src/duckdb/src/include/duckdb/storage/checkpoint/write_overflow_strings_to_disk.hpp +3 -4
  830. package/src/duckdb/src/include/duckdb/storage/checkpoint_manager.hpp +2 -0
  831. package/src/duckdb/src/include/duckdb/storage/compression/alp/algorithm/alp.hpp +4 -4
  832. package/src/duckdb/src/include/duckdb/storage/compression/alp/alp_analyze.hpp +6 -4
  833. package/src/duckdb/src/include/duckdb/storage/compression/alp/alp_compress.hpp +19 -17
  834. package/src/duckdb/src/include/duckdb/storage/compression/alp/alp_constants.hpp +2 -2
  835. package/src/duckdb/src/include/duckdb/storage/compression/alp/alp_scan.hpp +3 -4
  836. package/src/duckdb/src/include/duckdb/storage/compression/alp/alp_utils.hpp +3 -2
  837. package/src/duckdb/src/include/duckdb/storage/compression/alprd/algorithm/alprd.hpp +3 -2
  838. package/src/duckdb/src/include/duckdb/storage/compression/alprd/alprd_analyze.hpp +13 -11
  839. package/src/duckdb/src/include/duckdb/storage/compression/alprd/alprd_compress.hpp +19 -19
  840. package/src/duckdb/src/include/duckdb/storage/compression/alprd/alprd_scan.hpp +3 -4
  841. package/src/duckdb/src/include/duckdb/storage/compression/chimp/chimp_scan.hpp +1 -1
  842. package/src/duckdb/src/include/duckdb/storage/compression/patas/patas_scan.hpp +1 -1
  843. package/src/duckdb/src/include/duckdb/storage/data_pointer.hpp +10 -2
  844. package/src/duckdb/src/include/duckdb/storage/data_table.hpp +3 -2
  845. package/src/duckdb/src/include/duckdb/storage/in_memory_block_manager.hpp +15 -0
  846. package/src/duckdb/src/include/duckdb/storage/index_storage_info.hpp +14 -10
  847. package/src/duckdb/src/include/duckdb/storage/metadata/metadata_manager.hpp +6 -8
  848. package/src/duckdb/src/include/duckdb/storage/partial_block_manager.hpp +7 -4
  849. package/src/duckdb/src/include/duckdb/storage/segment/uncompressed.hpp +4 -7
  850. package/src/duckdb/src/include/duckdb/storage/single_file_block_manager.hpp +29 -4
  851. package/src/duckdb/src/include/duckdb/storage/standard_buffer_manager.hpp +22 -7
  852. package/src/duckdb/src/include/duckdb/storage/statistics/base_statistics.hpp +15 -2
  853. package/src/duckdb/src/include/duckdb/storage/statistics/distinct_statistics.hpp +8 -2
  854. package/src/duckdb/src/include/duckdb/storage/statistics/numeric_stats.hpp +5 -16
  855. package/src/duckdb/src/include/duckdb/storage/statistics/numeric_stats_union.hpp +51 -13
  856. package/src/duckdb/src/include/duckdb/storage/statistics/string_stats.hpp +6 -3
  857. package/src/duckdb/src/include/duckdb/storage/storage_info.hpp +29 -19
  858. package/src/duckdb/src/include/duckdb/storage/storage_manager.hpp +23 -7
  859. package/src/duckdb/src/include/duckdb/storage/string_uncompressed.hpp +27 -18
  860. package/src/duckdb/src/include/duckdb/storage/table/append_state.hpp +6 -3
  861. package/src/duckdb/src/include/duckdb/storage/table/array_column_data.hpp +5 -2
  862. package/src/duckdb/src/include/duckdb/storage/table/chunk_info.hpp +3 -0
  863. package/src/duckdb/src/include/duckdb/storage/table/column_checkpoint_state.hpp +5 -1
  864. package/src/duckdb/src/include/duckdb/storage/table/column_data.hpp +77 -6
  865. package/src/duckdb/src/include/duckdb/storage/table/column_segment.hpp +23 -11
  866. package/src/duckdb/src/include/duckdb/storage/table/data_table_info.hpp +3 -0
  867. package/src/duckdb/src/include/duckdb/storage/table/list_column_data.hpp +5 -2
  868. package/src/duckdb/src/include/duckdb/storage/table/row_group.hpp +18 -4
  869. package/src/duckdb/src/include/duckdb/storage/table/row_group_collection.hpp +7 -1
  870. package/src/duckdb/src/include/duckdb/storage/table/row_version_manager.hpp +2 -1
  871. package/src/duckdb/src/include/duckdb/storage/table/scan_state.hpp +89 -14
  872. package/src/duckdb/src/include/duckdb/storage/table/standard_column_data.hpp +4 -2
  873. package/src/duckdb/src/include/duckdb/storage/table/struct_column_data.hpp +4 -2
  874. package/src/duckdb/src/include/duckdb/storage/table/table_index_list.hpp +2 -2
  875. package/src/duckdb/src/include/duckdb/storage/table/validity_column_data.hpp +1 -1
  876. package/src/duckdb/src/include/duckdb/storage/temporary_memory_manager.hpp +33 -15
  877. package/src/duckdb/src/include/duckdb/storage/write_ahead_log.hpp +9 -9
  878. package/src/duckdb/src/include/duckdb/transaction/cleanup_state.hpp +3 -1
  879. package/src/duckdb/src/include/duckdb/transaction/commit_state.hpp +4 -16
  880. package/src/duckdb/src/include/duckdb/transaction/duck_transaction.hpp +27 -4
  881. package/src/duckdb/src/include/duckdb/transaction/duck_transaction_manager.hpp +11 -0
  882. package/src/duckdb/src/include/duckdb/transaction/local_storage.hpp +6 -2
  883. package/src/duckdb/src/include/duckdb/transaction/meta_transaction.hpp +5 -5
  884. package/src/duckdb/src/include/duckdb/transaction/transaction_context.hpp +6 -2
  885. package/src/duckdb/src/include/duckdb/transaction/undo_buffer.hpp +5 -3
  886. package/src/duckdb/src/include/duckdb/transaction/wal_write_state.hpp +48 -0
  887. package/src/duckdb/src/include/duckdb.h +1779 -739
  888. package/src/duckdb/src/include/duckdb_extension.h +921 -0
  889. package/src/duckdb/src/main/appender.cpp +53 -7
  890. package/src/duckdb/src/main/attached_database.cpp +87 -17
  891. package/src/duckdb/src/main/buffered_data/batched_buffered_data.cpp +226 -0
  892. package/src/duckdb/src/main/buffered_data/buffered_data.cpp +35 -0
  893. package/src/duckdb/src/main/buffered_data/simple_buffered_data.cpp +48 -23
  894. package/src/duckdb/src/main/capi/aggregate_function-c.cpp +327 -0
  895. package/src/duckdb/src/main/capi/appender-c.cpp +18 -0
  896. package/src/duckdb/src/main/capi/cast/utils-c.cpp +2 -2
  897. package/src/duckdb/src/main/capi/cast_function-c.cpp +210 -0
  898. package/src/duckdb/src/main/capi/config-c.cpp +3 -3
  899. package/src/duckdb/src/main/capi/data_chunk-c.cpp +18 -7
  900. package/src/duckdb/src/main/capi/duckdb_value-c.cpp +223 -24
  901. package/src/duckdb/src/main/capi/helper-c.cpp +51 -11
  902. package/src/duckdb/src/main/capi/logical_types-c.cpp +105 -46
  903. package/src/duckdb/src/main/capi/pending-c.cpp +7 -6
  904. package/src/duckdb/src/main/capi/prepared-c.cpp +18 -7
  905. package/src/duckdb/src/main/capi/profiling_info-c.cpp +84 -0
  906. package/src/duckdb/src/main/capi/result-c.cpp +139 -37
  907. package/src/duckdb/src/main/capi/scalar_function-c.cpp +269 -0
  908. package/src/duckdb/src/main/capi/table_description-c.cpp +82 -0
  909. package/src/duckdb/src/main/capi/table_function-c.cpp +161 -95
  910. package/src/duckdb/src/main/capi/value-c.cpp +2 -2
  911. package/src/duckdb/src/main/chunk_scan_state/batched_data_collection.cpp +57 -0
  912. package/src/duckdb/src/main/client_config.cpp +17 -0
  913. package/src/duckdb/src/main/client_context.cpp +67 -52
  914. package/src/duckdb/src/main/client_data.cpp +3 -3
  915. package/src/duckdb/src/main/config.cpp +120 -62
  916. package/src/duckdb/src/main/connection.cpp +14 -2
  917. package/src/duckdb/src/main/database.cpp +96 -35
  918. package/src/duckdb/src/main/database_manager.cpp +25 -23
  919. package/src/duckdb/src/main/database_path_and_type.cpp +2 -2
  920. package/src/duckdb/src/main/db_instance_cache.cpp +54 -19
  921. package/src/duckdb/src/main/extension/extension_helper.cpp +47 -42
  922. package/src/duckdb/src/main/extension/extension_install.cpp +155 -87
  923. package/src/duckdb/src/main/extension/extension_load.cpp +180 -26
  924. package/src/duckdb/src/main/extension/extension_util.cpp +8 -0
  925. package/src/duckdb/src/main/extension.cpp +72 -5
  926. package/src/duckdb/src/main/pending_query_result.cpp +20 -12
  927. package/src/duckdb/src/main/prepared_statement.cpp +6 -6
  928. package/src/duckdb/src/main/prepared_statement_data.cpp +28 -17
  929. package/src/duckdb/src/main/profiling_info.cpp +196 -0
  930. package/src/duckdb/src/main/query_profiler.cpp +413 -224
  931. package/src/duckdb/src/main/query_result.cpp +1 -1
  932. package/src/duckdb/src/main/relation/create_table_relation.cpp +4 -2
  933. package/src/duckdb/src/main/relation/create_view_relation.cpp +0 -6
  934. package/src/duckdb/src/main/relation/delim_get_relation.cpp +44 -0
  935. package/src/duckdb/src/main/relation/explain_relation.cpp +4 -3
  936. package/src/duckdb/src/main/relation/join_relation.cpp +5 -0
  937. package/src/duckdb/src/main/relation/limit_relation.cpp +1 -1
  938. package/src/duckdb/src/main/relation/materialized_relation.cpp +3 -3
  939. package/src/duckdb/src/main/relation/query_relation.cpp +42 -15
  940. package/src/duckdb/src/main/relation/read_csv_relation.cpp +7 -14
  941. package/src/duckdb/src/main/relation/read_json_relation.cpp +20 -0
  942. package/src/duckdb/src/main/relation/setop_relation.cpp +1 -1
  943. package/src/duckdb/src/main/relation/table_function_relation.cpp +6 -0
  944. package/src/duckdb/src/main/relation/view_relation.cpp +10 -0
  945. package/src/duckdb/src/main/relation.cpp +12 -8
  946. package/src/duckdb/src/main/secret/default_secrets.cpp +108 -0
  947. package/src/duckdb/src/main/secret/secret.cpp +145 -2
  948. package/src/duckdb/src/main/secret/secret_manager.cpp +85 -35
  949. package/src/duckdb/src/main/secret/secret_storage.cpp +29 -17
  950. package/src/duckdb/src/main/settings/settings.cpp +503 -11
  951. package/src/duckdb/src/main/stream_query_result.cpp +75 -2
  952. package/src/duckdb/src/optimizer/build_probe_side_optimizer.cpp +248 -0
  953. package/src/duckdb/src/optimizer/column_lifetime_analyzer.cpp +28 -6
  954. package/src/duckdb/src/optimizer/compressed_materialization/compress_comparison_join.cpp +152 -0
  955. package/src/duckdb/src/optimizer/compressed_materialization.cpp +11 -1
  956. package/src/duckdb/src/optimizer/cse_optimizer.cpp +3 -0
  957. package/src/duckdb/src/optimizer/cte_filter_pusher.cpp +117 -0
  958. package/src/duckdb/src/optimizer/filter_combiner.cpp +30 -9
  959. package/src/duckdb/src/optimizer/filter_pullup.cpp +54 -2
  960. package/src/duckdb/src/optimizer/filter_pushdown.cpp +71 -3
  961. package/src/duckdb/src/optimizer/join_filter_pushdown_optimizer.cpp +154 -0
  962. package/src/duckdb/src/optimizer/join_order/cardinality_estimator.cpp +245 -114
  963. package/src/duckdb/src/optimizer/join_order/join_order_optimizer.cpp +42 -20
  964. package/src/duckdb/src/optimizer/join_order/join_relation_set.cpp +6 -2
  965. package/src/duckdb/src/optimizer/join_order/plan_enumerator.cpp +32 -10
  966. package/src/duckdb/src/optimizer/join_order/query_graph_manager.cpp +97 -131
  967. package/src/duckdb/src/optimizer/join_order/relation_manager.cpp +265 -51
  968. package/src/duckdb/src/optimizer/join_order/relation_statistics_helper.cpp +21 -17
  969. package/src/duckdb/src/optimizer/limit_pushdown.cpp +42 -0
  970. package/src/duckdb/src/optimizer/optimizer.cpp +51 -8
  971. package/src/duckdb/src/optimizer/pushdown/pushdown_aggregate.cpp +17 -17
  972. package/src/duckdb/src/optimizer/pushdown/pushdown_cross_product.cpp +22 -4
  973. package/src/duckdb/src/optimizer/pushdown/pushdown_get.cpp +1 -18
  974. package/src/duckdb/src/optimizer/pushdown/pushdown_inner_join.cpp +6 -0
  975. package/src/duckdb/src/optimizer/pushdown/pushdown_mark_join.cpp +4 -2
  976. package/src/duckdb/src/optimizer/pushdown/pushdown_window.cpp +91 -0
  977. package/src/duckdb/src/optimizer/remove_unused_columns.cpp +21 -25
  978. package/src/duckdb/src/optimizer/rule/comparison_simplification.cpp +1 -0
  979. package/src/duckdb/src/optimizer/rule/empty_needle_removal.cpp +3 -0
  980. package/src/duckdb/src/optimizer/rule/equal_or_null_simplification.cpp +2 -2
  981. package/src/duckdb/src/optimizer/rule/in_clause_simplification_rule.cpp +8 -2
  982. package/src/duckdb/src/optimizer/rule/join_dependent_filter.cpp +135 -0
  983. package/src/duckdb/src/optimizer/rule/like_optimizations.cpp +1 -1
  984. package/src/duckdb/src/optimizer/rule/regex_optimizations.cpp +1 -1
  985. package/src/duckdb/src/optimizer/statistics/operator/propagate_filter.cpp +6 -1
  986. package/src/duckdb/src/optimizer/statistics/operator/propagate_get.cpp +7 -6
  987. package/src/duckdb/src/optimizer/statistics/operator/propagate_join.cpp +1 -1
  988. package/src/duckdb/src/optimizer/topn_optimizer.cpp +46 -7
  989. package/src/duckdb/src/parallel/executor.cpp +129 -51
  990. package/src/duckdb/src/parallel/executor_task.cpp +16 -3
  991. package/src/duckdb/src/parallel/meta_pipeline.cpp +98 -29
  992. package/src/duckdb/src/parallel/pipeline.cpp +17 -3
  993. package/src/duckdb/src/parallel/pipeline_executor.cpp +14 -2
  994. package/src/duckdb/src/parallel/pipeline_prepare_finish_event.cpp +34 -0
  995. package/src/duckdb/src/parallel/task_executor.cpp +84 -0
  996. package/src/duckdb/src/parallel/task_scheduler.cpp +94 -16
  997. package/src/duckdb/src/parallel/thread_context.cpp +1 -1
  998. package/src/duckdb/src/parser/expression/function_expression.cpp +14 -0
  999. package/src/duckdb/src/parser/expression/star_expression.cpp +35 -2
  1000. package/src/duckdb/src/parser/parsed_data/alter_table_info.cpp +5 -1
  1001. package/src/duckdb/src/parser/parsed_data/attach_info.cpp +17 -0
  1002. package/src/duckdb/src/parser/parsed_data/create_index_info.cpp +37 -28
  1003. package/src/duckdb/src/parser/parsed_data/create_macro_info.cpp +44 -2
  1004. package/src/duckdb/src/parser/parsed_data/transaction_info.cpp +21 -1
  1005. package/src/duckdb/src/parser/parsed_expression_iterator.cpp +29 -25
  1006. package/src/duckdb/src/parser/parser.cpp +41 -1
  1007. package/src/duckdb/src/parser/query_node/recursive_cte_node.cpp +1 -0
  1008. package/src/duckdb/src/parser/statement/explain_statement.cpp +28 -13
  1009. package/src/duckdb/src/parser/statement/relation_statement.cpp +5 -0
  1010. package/src/duckdb/src/parser/statement/set_statement.cpp +4 -2
  1011. package/src/duckdb/src/parser/statement/transaction_statement.cpp +3 -3
  1012. package/src/duckdb/src/parser/tableref/column_data_ref.cpp +1 -27
  1013. package/src/duckdb/src/parser/tableref/delimgetref.cpp +30 -0
  1014. package/src/duckdb/src/parser/tableref/joinref.cpp +4 -0
  1015. package/src/duckdb/src/parser/transform/constraint/transform_constraint.cpp +35 -29
  1016. package/src/duckdb/src/parser/transform/expression/transform_array_access.cpp +32 -32
  1017. package/src/duckdb/src/parser/transform/expression/transform_columnref.cpp +2 -1
  1018. package/src/duckdb/src/parser/transform/expression/transform_constant.cpp +17 -0
  1019. package/src/duckdb/src/parser/transform/expression/transform_function.cpp +5 -0
  1020. package/src/duckdb/src/parser/transform/expression/transform_multi_assign_reference.cpp +36 -34
  1021. package/src/duckdb/src/parser/transform/expression/transform_operator.cpp +30 -14
  1022. package/src/duckdb/src/parser/transform/expression/transform_subquery.cpp +1 -1
  1023. package/src/duckdb/src/parser/transform/helpers/transform_alias.cpp +2 -1
  1024. package/src/duckdb/src/parser/transform/helpers/transform_cte.cpp +27 -19
  1025. package/src/duckdb/src/parser/transform/helpers/transform_orderby.cpp +31 -28
  1026. package/src/duckdb/src/parser/transform/statement/transform_alter_table.cpp +25 -27
  1027. package/src/duckdb/src/parser/transform/statement/transform_copy.cpp +1 -1
  1028. package/src/duckdb/src/parser/transform/statement/transform_create_function.cpp +53 -42
  1029. package/src/duckdb/src/parser/transform/statement/transform_create_table.cpp +6 -6
  1030. package/src/duckdb/src/parser/transform/statement/transform_create_table_as.cpp +1 -1
  1031. package/src/duckdb/src/parser/transform/statement/transform_create_type.cpp +1 -1
  1032. package/src/duckdb/src/parser/transform/statement/transform_create_view.cpp +1 -1
  1033. package/src/duckdb/src/parser/transform/statement/transform_explain.cpp +38 -3
  1034. package/src/duckdb/src/parser/transform/statement/transform_insert.cpp +1 -2
  1035. package/src/duckdb/src/parser/transform/statement/transform_pivot_stmt.cpp +1 -1
  1036. package/src/duckdb/src/parser/transform/statement/transform_prepare.cpp +1 -1
  1037. package/src/duckdb/src/parser/transform/statement/transform_select.cpp +26 -21
  1038. package/src/duckdb/src/parser/transform/statement/transform_set.cpp +8 -8
  1039. package/src/duckdb/src/parser/transform/statement/transform_show.cpp +5 -2
  1040. package/src/duckdb/src/parser/transform/statement/transform_show_select.cpp +6 -4
  1041. package/src/duckdb/src/parser/transform/statement/transform_transaction.cpp +27 -6
  1042. package/src/duckdb/src/parser/transform/statement/transform_update.cpp +8 -9
  1043. package/src/duckdb/src/parser/transform/statement/transform_upsert.cpp +11 -12
  1044. package/src/duckdb/src/parser/transform/statement/transform_vacuum.cpp +3 -3
  1045. package/src/duckdb/src/parser/transform/tableref/transform_join.cpp +16 -10
  1046. package/src/duckdb/src/parser/transform/tableref/transform_pivot.cpp +1 -1
  1047. package/src/duckdb/src/parser/transform/tableref/transform_subquery.cpp +1 -1
  1048. package/src/duckdb/src/parser/transformer.cpp +11 -7
  1049. package/src/duckdb/src/planner/bind_context.cpp +3 -3
  1050. package/src/duckdb/src/planner/binder/expression/bind_aggregate_expression.cpp +22 -7
  1051. package/src/duckdb/src/planner/binder/expression/bind_between_expression.cpp +3 -3
  1052. package/src/duckdb/src/planner/binder/expression/bind_collate_expression.cpp +3 -2
  1053. package/src/duckdb/src/planner/binder/expression/bind_columnref_expression.cpp +11 -4
  1054. package/src/duckdb/src/planner/binder/expression/bind_comparison_expression.cpp +9 -54
  1055. package/src/duckdb/src/planner/binder/expression/bind_function_expression.cpp +3 -5
  1056. package/src/duckdb/src/planner/binder/expression/bind_macro_expression.cpp +24 -27
  1057. package/src/duckdb/src/planner/binder/expression/bind_operator_expression.cpp +7 -7
  1058. package/src/duckdb/src/planner/binder/expression/bind_parameter_expression.cpp +9 -2
  1059. package/src/duckdb/src/planner/binder/expression/bind_star_expression.cpp +26 -7
  1060. package/src/duckdb/src/planner/binder/expression/bind_unnest_expression.cpp +5 -0
  1061. package/src/duckdb/src/planner/binder/expression/bind_unpacked_star_expression.cpp +91 -0
  1062. package/src/duckdb/src/planner/binder/expression/bind_window_expression.cpp +2 -2
  1063. package/src/duckdb/src/planner/binder/query_node/bind_select_node.cpp +11 -8
  1064. package/src/duckdb/src/planner/binder/query_node/bind_setop_node.cpp +1 -1
  1065. package/src/duckdb/src/planner/binder/query_node/bind_table_macro_node.cpp +6 -10
  1066. package/src/duckdb/src/planner/binder/query_node/plan_cte_node.cpp +14 -10
  1067. package/src/duckdb/src/planner/binder/query_node/plan_setop.cpp +3 -3
  1068. package/src/duckdb/src/planner/binder/query_node/plan_subquery.cpp +46 -7
  1069. package/src/duckdb/src/planner/binder/statement/bind_call.cpp +13 -20
  1070. package/src/duckdb/src/planner/binder/statement/bind_copy.cpp +105 -13
  1071. package/src/duckdb/src/planner/binder/statement/bind_copy_database.cpp +7 -3
  1072. package/src/duckdb/src/planner/binder/statement/bind_create.cpp +75 -55
  1073. package/src/duckdb/src/planner/binder/statement/bind_create_table.cpp +1 -1
  1074. package/src/duckdb/src/planner/binder/statement/bind_delete.cpp +5 -4
  1075. package/src/duckdb/src/planner/binder/statement/bind_drop.cpp +2 -2
  1076. package/src/duckdb/src/planner/binder/statement/bind_execute.cpp +24 -8
  1077. package/src/duckdb/src/planner/binder/statement/bind_explain.cpp +2 -2
  1078. package/src/duckdb/src/planner/binder/statement/bind_export.cpp +5 -105
  1079. package/src/duckdb/src/planner/binder/statement/bind_extension.cpp +2 -2
  1080. package/src/duckdb/src/planner/binder/statement/bind_insert.cpp +109 -41
  1081. package/src/duckdb/src/planner/binder/statement/bind_set.cpp +23 -7
  1082. package/src/duckdb/src/planner/binder/statement/bind_simple.cpp +4 -1
  1083. package/src/duckdb/src/planner/binder/statement/bind_summarize.cpp +17 -3
  1084. package/src/duckdb/src/planner/binder/statement/bind_update.cpp +5 -4
  1085. package/src/duckdb/src/planner/binder/statement/bind_vacuum.cpp +8 -6
  1086. package/src/duckdb/src/planner/binder/tableref/bind_basetableref.cpp +55 -42
  1087. package/src/duckdb/src/planner/binder/tableref/bind_column_data_ref.cpp +3 -2
  1088. package/src/duckdb/src/planner/binder/tableref/bind_delimgetref.cpp +16 -0
  1089. package/src/duckdb/src/planner/binder/tableref/bind_joinref.cpp +31 -1
  1090. package/src/duckdb/src/planner/binder/tableref/bind_pivot.cpp +6 -0
  1091. package/src/duckdb/src/planner/binder/tableref/bind_showref.cpp +2 -0
  1092. package/src/duckdb/src/planner/binder/tableref/bind_table_function.cpp +106 -46
  1093. package/src/duckdb/src/planner/binder/tableref/plan_delimgetref.cpp +11 -0
  1094. package/src/duckdb/src/planner/binder/tableref/plan_joinref.cpp +15 -2
  1095. package/src/duckdb/src/planner/binder/tableref/plan_table_function.cpp +4 -0
  1096. package/src/duckdb/src/planner/binder.cpp +172 -15
  1097. package/src/duckdb/src/planner/collation_binding.cpp +99 -0
  1098. package/src/duckdb/src/planner/expression/bound_aggregate_expression.cpp +10 -4
  1099. package/src/duckdb/src/planner/expression/bound_between_expression.cpp +1 -1
  1100. package/src/duckdb/src/planner/expression/bound_case_expression.cpp +1 -1
  1101. package/src/duckdb/src/planner/expression/bound_cast_expression.cpp +14 -12
  1102. package/src/duckdb/src/planner/expression/bound_columnref_expression.cpp +1 -1
  1103. package/src/duckdb/src/planner/expression/bound_comparison_expression.cpp +1 -1
  1104. package/src/duckdb/src/planner/expression/bound_conjunction_expression.cpp +1 -1
  1105. package/src/duckdb/src/planner/expression/bound_constant_expression.cpp +1 -1
  1106. package/src/duckdb/src/planner/expression/bound_expanded_expression.cpp +1 -1
  1107. package/src/duckdb/src/planner/expression/bound_function_expression.cpp +8 -2
  1108. package/src/duckdb/src/planner/expression/bound_lambda_expression.cpp +1 -1
  1109. package/src/duckdb/src/planner/expression/bound_lambdaref_expression.cpp +1 -1
  1110. package/src/duckdb/src/planner/expression/bound_operator_expression.cpp +1 -1
  1111. package/src/duckdb/src/planner/expression/bound_parameter_expression.cpp +1 -1
  1112. package/src/duckdb/src/planner/expression/bound_reference_expression.cpp +1 -1
  1113. package/src/duckdb/src/planner/expression/bound_subquery_expression.cpp +1 -1
  1114. package/src/duckdb/src/planner/expression/bound_unnest_expression.cpp +1 -1
  1115. package/src/duckdb/src/planner/expression/bound_window_expression.cpp +6 -6
  1116. package/src/duckdb/src/planner/expression_binder/aggregate_binder.cpp +1 -1
  1117. package/src/duckdb/src/planner/expression_binder/alter_binder.cpp +2 -2
  1118. package/src/duckdb/src/planner/expression_binder/base_select_binder.cpp +1 -1
  1119. package/src/duckdb/src/planner/expression_binder/column_alias_binder.cpp +7 -0
  1120. package/src/duckdb/src/planner/expression_binder/constant_binder.cpp +3 -3
  1121. package/src/duckdb/src/planner/expression_binder/group_binder.cpp +26 -22
  1122. package/src/duckdb/src/planner/expression_binder/having_binder.cpp +7 -1
  1123. package/src/duckdb/src/planner/expression_binder/index_binder.cpp +2 -2
  1124. package/src/duckdb/src/planner/expression_binder/insert_binder.cpp +2 -2
  1125. package/src/duckdb/src/planner/expression_binder/lateral_binder.cpp +2 -2
  1126. package/src/duckdb/src/planner/expression_binder/order_binder.cpp +61 -43
  1127. package/src/duckdb/src/planner/expression_binder/qualify_binder.cpp +2 -2
  1128. package/src/duckdb/src/planner/expression_binder/relation_binder.cpp +4 -4
  1129. package/src/duckdb/src/planner/expression_binder/returning_binder.cpp +3 -2
  1130. package/src/duckdb/src/planner/expression_binder/table_function_binder.cpp +10 -3
  1131. package/src/duckdb/src/planner/expression_binder/update_binder.cpp +1 -1
  1132. package/src/duckdb/src/planner/expression_binder/where_binder.cpp +9 -2
  1133. package/src/duckdb/src/planner/expression_binder.cpp +121 -21
  1134. package/src/duckdb/src/planner/expression_iterator.cpp +26 -1
  1135. package/src/duckdb/src/planner/filter/conjunction_filter.cpp +33 -0
  1136. package/src/duckdb/src/planner/filter/constant_filter.cpp +15 -0
  1137. package/src/duckdb/src/planner/filter/null_filter.cpp +22 -0
  1138. package/src/duckdb/src/planner/filter/struct_filter.cpp +16 -0
  1139. package/src/duckdb/src/planner/logical_operator.cpp +24 -7
  1140. package/src/duckdb/src/planner/operator/logical_aggregate.cpp +13 -7
  1141. package/src/duckdb/src/planner/operator/logical_any_join.cpp +5 -2
  1142. package/src/duckdb/src/planner/operator/logical_comparison_join.cpp +13 -5
  1143. package/src/duckdb/src/planner/operator/logical_copy_to_file.cpp +64 -8
  1144. package/src/duckdb/src/planner/operator/logical_cteref.cpp +7 -0
  1145. package/src/duckdb/src/planner/operator/logical_distinct.cpp +6 -5
  1146. package/src/duckdb/src/planner/operator/logical_get.cpp +60 -18
  1147. package/src/duckdb/src/planner/operator/logical_materialized_cte.cpp +7 -0
  1148. package/src/duckdb/src/planner/operator/logical_order.cpp +7 -4
  1149. package/src/duckdb/src/planner/operator/logical_top_n.cpp +2 -2
  1150. package/src/duckdb/src/planner/operator/logical_vacuum.cpp +1 -1
  1151. package/src/duckdb/src/planner/planner.cpp +2 -3
  1152. package/src/duckdb/src/planner/subquery/flatten_dependent_join.cpp +27 -10
  1153. package/src/duckdb/src/planner/table_filter.cpp +51 -0
  1154. package/src/duckdb/src/storage/arena_allocator.cpp +28 -10
  1155. package/src/duckdb/src/storage/block.cpp +3 -2
  1156. package/src/duckdb/src/storage/buffer/block_handle.cpp +29 -14
  1157. package/src/duckdb/src/storage/buffer/block_manager.cpp +6 -5
  1158. package/src/duckdb/src/storage/buffer/buffer_handle.cpp +1 -1
  1159. package/src/duckdb/src/storage/buffer/buffer_pool.cpp +264 -125
  1160. package/src/duckdb/src/storage/buffer_manager.cpp +5 -1
  1161. package/src/duckdb/src/storage/checkpoint/row_group_writer.cpp +0 -6
  1162. package/src/duckdb/src/storage/checkpoint/table_data_writer.cpp +26 -3
  1163. package/src/duckdb/src/storage/checkpoint/write_overflow_strings_to_disk.cpp +21 -9
  1164. package/src/duckdb/src/storage/checkpoint_manager.cpp +49 -24
  1165. package/src/duckdb/src/storage/compression/alp/alp.cpp +6 -11
  1166. package/src/duckdb/src/storage/compression/alprd.cpp +5 -9
  1167. package/src/duckdb/src/storage/compression/bitpacking.cpp +35 -31
  1168. package/src/duckdb/src/storage/compression/chimp/chimp.cpp +6 -8
  1169. package/src/duckdb/src/storage/compression/dictionary_compression.cpp +71 -58
  1170. package/src/duckdb/src/storage/compression/fixed_size_uncompressed.cpp +15 -13
  1171. package/src/duckdb/src/storage/compression/fsst.cpp +66 -53
  1172. package/src/duckdb/src/storage/compression/numeric_constant.cpp +4 -5
  1173. package/src/duckdb/src/storage/compression/patas.cpp +6 -17
  1174. package/src/duckdb/src/storage/compression/rle.cpp +20 -18
  1175. package/src/duckdb/src/storage/compression/string_uncompressed.cpp +71 -52
  1176. package/src/duckdb/src/storage/compression/uncompressed.cpp +2 -2
  1177. package/src/duckdb/src/storage/compression/validity_uncompressed.cpp +8 -7
  1178. package/src/duckdb/src/storage/data_pointer.cpp +22 -0
  1179. package/src/duckdb/src/storage/data_table.cpp +41 -12
  1180. package/src/duckdb/src/storage/local_storage.cpp +22 -8
  1181. package/src/duckdb/src/storage/metadata/metadata_manager.cpp +33 -17
  1182. package/src/duckdb/src/storage/metadata/metadata_reader.cpp +4 -4
  1183. package/src/duckdb/src/storage/metadata/metadata_writer.cpp +3 -3
  1184. package/src/duckdb/src/storage/partial_block_manager.cpp +19 -8
  1185. package/src/duckdb/src/storage/serialization/serialize_create_info.cpp +11 -8
  1186. package/src/duckdb/src/storage/serialization/serialize_expression.cpp +1 -1
  1187. package/src/duckdb/src/storage/serialization/serialize_extension_install_info.cpp +2 -0
  1188. package/src/duckdb/src/storage/serialization/serialize_logical_operator.cpp +3 -3
  1189. package/src/duckdb/src/storage/serialization/serialize_nodes.cpp +19 -5
  1190. package/src/duckdb/src/storage/serialization/serialize_parse_info.cpp +21 -1
  1191. package/src/duckdb/src/storage/serialization/serialize_parsed_expression.cpp +4 -2
  1192. package/src/duckdb/src/storage/serialization/serialize_query_node.cpp +2 -2
  1193. package/src/duckdb/src/storage/serialization/serialize_storage.cpp +2 -0
  1194. package/src/duckdb/src/storage/serialization/serialize_tableref.cpp +8 -4
  1195. package/src/duckdb/src/storage/serialization/serialize_types.cpp +4 -4
  1196. package/src/duckdb/src/storage/single_file_block_manager.cpp +170 -34
  1197. package/src/duckdb/src/storage/standard_buffer_manager.cpp +221 -64
  1198. package/src/duckdb/src/storage/statistics/column_statistics.cpp +4 -3
  1199. package/src/duckdb/src/storage/statistics/distinct_statistics.cpp +36 -26
  1200. package/src/duckdb/src/storage/statistics/numeric_stats.cpp +4 -15
  1201. package/src/duckdb/src/storage/statistics/string_stats.cpp +14 -8
  1202. package/src/duckdb/src/storage/statistics/struct_stats.cpp +2 -1
  1203. package/src/duckdb/src/storage/storage_info.cpp +34 -9
  1204. package/src/duckdb/src/storage/storage_manager.cpp +147 -74
  1205. package/src/duckdb/src/storage/table/array_column_data.cpp +37 -17
  1206. package/src/duckdb/src/storage/table/chunk_info.cpp +38 -0
  1207. package/src/duckdb/src/storage/table/column_checkpoint_state.cpp +10 -6
  1208. package/src/duckdb/src/storage/table/column_data.cpp +252 -31
  1209. package/src/duckdb/src/storage/table/column_data_checkpointer.cpp +2 -12
  1210. package/src/duckdb/src/storage/table/column_segment.cpp +63 -34
  1211. package/src/duckdb/src/storage/table/list_column_data.cpp +34 -15
  1212. package/src/duckdb/src/storage/table/row_group.cpp +228 -120
  1213. package/src/duckdb/src/storage/table/row_group_collection.cpp +122 -120
  1214. package/src/duckdb/src/storage/table/row_version_manager.cpp +27 -1
  1215. package/src/duckdb/src/storage/table/scan_state.cpp +101 -18
  1216. package/src/duckdb/src/storage/table/standard_column_data.cpp +20 -34
  1217. package/src/duckdb/src/storage/table/struct_column_data.cpp +39 -42
  1218. package/src/duckdb/src/storage/table/table_statistics.cpp +2 -1
  1219. package/src/duckdb/src/storage/table/update_segment.cpp +9 -8
  1220. package/src/duckdb/src/storage/table/validity_column_data.cpp +2 -2
  1221. package/src/duckdb/src/storage/table_index_list.cpp +8 -7
  1222. package/src/duckdb/src/storage/temporary_file_manager.cpp +11 -9
  1223. package/src/duckdb/src/storage/temporary_memory_manager.cpp +227 -39
  1224. package/src/duckdb/src/storage/wal_replay.cpp +68 -28
  1225. package/src/duckdb/src/storage/write_ahead_log.cpp +56 -47
  1226. package/src/duckdb/src/transaction/cleanup_state.cpp +9 -1
  1227. package/src/duckdb/src/transaction/commit_state.cpp +7 -170
  1228. package/src/duckdb/src/transaction/duck_transaction.cpp +87 -19
  1229. package/src/duckdb/src/transaction/duck_transaction_manager.cpp +65 -10
  1230. package/src/duckdb/src/transaction/meta_transaction.cpp +18 -3
  1231. package/src/duckdb/src/transaction/transaction_context.cpp +21 -17
  1232. package/src/duckdb/src/transaction/undo_buffer.cpp +20 -14
  1233. package/src/duckdb/src/transaction/wal_write_state.cpp +292 -0
  1234. package/src/duckdb/src/verification/prepared_statement_verifier.cpp +0 -1
  1235. package/src/duckdb/third_party/brotli/common/brotli_constants.h +204 -0
  1236. package/src/duckdb/third_party/brotli/common/brotli_platform.h +543 -0
  1237. package/src/duckdb/third_party/brotli/common/constants.cpp +17 -0
  1238. package/src/duckdb/third_party/brotli/common/context.cpp +156 -0
  1239. package/src/duckdb/third_party/brotli/common/context.h +110 -0
  1240. package/src/duckdb/third_party/brotli/common/dictionary.cpp +5912 -0
  1241. package/src/duckdb/third_party/brotli/common/dictionary.h +60 -0
  1242. package/src/duckdb/third_party/brotli/common/platform.cpp +24 -0
  1243. package/src/duckdb/third_party/brotli/common/shared_dictionary.cpp +517 -0
  1244. package/src/duckdb/third_party/brotli/common/shared_dictionary_internal.h +71 -0
  1245. package/src/duckdb/third_party/brotli/common/transform.cpp +287 -0
  1246. package/src/duckdb/third_party/brotli/common/transform.h +77 -0
  1247. package/src/duckdb/third_party/brotli/common/version.h +51 -0
  1248. package/src/duckdb/third_party/brotli/dec/bit_reader.cpp +74 -0
  1249. package/src/duckdb/third_party/brotli/dec/bit_reader.h +419 -0
  1250. package/src/duckdb/third_party/brotli/dec/decode.cpp +2758 -0
  1251. package/src/duckdb/third_party/brotli/dec/huffman.cpp +338 -0
  1252. package/src/duckdb/third_party/brotli/dec/huffman.h +118 -0
  1253. package/src/duckdb/third_party/brotli/dec/prefix.h +733 -0
  1254. package/src/duckdb/third_party/brotli/dec/state.cpp +178 -0
  1255. package/src/duckdb/third_party/brotli/dec/state.h +386 -0
  1256. package/src/duckdb/third_party/brotli/enc/backward_references.cpp +3775 -0
  1257. package/src/duckdb/third_party/brotli/enc/backward_references.h +36 -0
  1258. package/src/duckdb/third_party/brotli/enc/backward_references_hq.cpp +935 -0
  1259. package/src/duckdb/third_party/brotli/enc/backward_references_hq.h +92 -0
  1260. package/src/duckdb/third_party/brotli/enc/bit_cost.cpp +410 -0
  1261. package/src/duckdb/third_party/brotli/enc/bit_cost.h +60 -0
  1262. package/src/duckdb/third_party/brotli/enc/block_splitter.cpp +1653 -0
  1263. package/src/duckdb/third_party/brotli/enc/block_splitter.h +48 -0
  1264. package/src/duckdb/third_party/brotli/enc/brotli_bit_stream.cpp +1431 -0
  1265. package/src/duckdb/third_party/brotli/enc/brotli_bit_stream.h +85 -0
  1266. package/src/duckdb/third_party/brotli/enc/brotli_hash.h +4352 -0
  1267. package/src/duckdb/third_party/brotli/enc/brotli_params.h +47 -0
  1268. package/src/duckdb/third_party/brotli/enc/cluster.cpp +1025 -0
  1269. package/src/duckdb/third_party/brotli/enc/cluster.h +1017 -0
  1270. package/src/duckdb/third_party/brotli/enc/command.cpp +24 -0
  1271. package/src/duckdb/third_party/brotli/enc/command.h +187 -0
  1272. package/src/duckdb/third_party/brotli/enc/compound_dictionary.cpp +209 -0
  1273. package/src/duckdb/third_party/brotli/enc/compound_dictionary.h +75 -0
  1274. package/src/duckdb/third_party/brotli/enc/compress_fragment.cpp +796 -0
  1275. package/src/duckdb/third_party/brotli/enc/compress_fragment.h +82 -0
  1276. package/src/duckdb/third_party/brotli/enc/compress_fragment_two_pass.cpp +653 -0
  1277. package/src/duckdb/third_party/brotli/enc/compress_fragment_two_pass.h +68 -0
  1278. package/src/duckdb/third_party/brotli/enc/dictionary_hash.cpp +1844 -0
  1279. package/src/duckdb/third_party/brotli/enc/dictionary_hash.h +21 -0
  1280. package/src/duckdb/third_party/brotli/enc/encode.cpp +1990 -0
  1281. package/src/duckdb/third_party/brotli/enc/encoder_dict.cpp +636 -0
  1282. package/src/duckdb/third_party/brotli/enc/encoder_dict.h +153 -0
  1283. package/src/duckdb/third_party/brotli/enc/entropy_encode.cpp +500 -0
  1284. package/src/duckdb/third_party/brotli/enc/entropy_encode.h +119 -0
  1285. package/src/duckdb/third_party/brotli/enc/entropy_encode_static.h +538 -0
  1286. package/src/duckdb/third_party/brotli/enc/fast_log.cpp +101 -0
  1287. package/src/duckdb/third_party/brotli/enc/fast_log.h +63 -0
  1288. package/src/duckdb/third_party/brotli/enc/find_match_length.h +68 -0
  1289. package/src/duckdb/third_party/brotli/enc/histogram.cpp +96 -0
  1290. package/src/duckdb/third_party/brotli/enc/histogram.h +210 -0
  1291. package/src/duckdb/third_party/brotli/enc/literal_cost.cpp +176 -0
  1292. package/src/duckdb/third_party/brotli/enc/literal_cost.h +28 -0
  1293. package/src/duckdb/third_party/brotli/enc/memory.cpp +190 -0
  1294. package/src/duckdb/third_party/brotli/enc/memory.h +127 -0
  1295. package/src/duckdb/third_party/brotli/enc/metablock.cpp +1225 -0
  1296. package/src/duckdb/third_party/brotli/enc/metablock.h +102 -0
  1297. package/src/duckdb/third_party/brotli/enc/prefix.h +50 -0
  1298. package/src/duckdb/third_party/brotli/enc/quality.h +202 -0
  1299. package/src/duckdb/third_party/brotli/enc/ringbuffer.h +164 -0
  1300. package/src/duckdb/third_party/brotli/enc/state.h +106 -0
  1301. package/src/duckdb/third_party/brotli/enc/static_dict.cpp +538 -0
  1302. package/src/duckdb/third_party/brotli/enc/static_dict.h +37 -0
  1303. package/src/duckdb/third_party/brotli/enc/static_dict_lut.h +5862 -0
  1304. package/src/duckdb/third_party/brotli/enc/utf8_util.cpp +81 -0
  1305. package/src/duckdb/third_party/brotli/enc/utf8_util.h +29 -0
  1306. package/src/duckdb/third_party/brotli/enc/write_bits.h +84 -0
  1307. package/src/duckdb/third_party/brotli/include/brotli/decode.h +405 -0
  1308. package/src/duckdb/third_party/brotli/include/brotli/encode.h +489 -0
  1309. package/src/duckdb/third_party/brotli/include/brotli/port.h +238 -0
  1310. package/src/duckdb/third_party/brotli/include/brotli/shared_dictionary.h +96 -0
  1311. package/src/duckdb/third_party/brotli/include/brotli/types.h +83 -0
  1312. package/src/duckdb/third_party/fast_float/fast_float/fast_float.h +20 -4
  1313. package/src/duckdb/third_party/fmt/include/fmt/format.h +54 -10
  1314. package/src/duckdb/third_party/fsst/fsst.h +2 -2
  1315. package/src/duckdb/third_party/fsst/libfsst.hpp +2 -2
  1316. package/src/duckdb/third_party/httplib/httplib.hpp +6763 -5580
  1317. package/src/duckdb/third_party/hyperloglog/hyperloglog.cpp +13 -30
  1318. package/src/duckdb/third_party/hyperloglog/hyperloglog.hpp +8 -2
  1319. package/src/duckdb/third_party/libpg_query/include/nodes/nodes.hpp +1 -0
  1320. package/src/duckdb/third_party/libpg_query/include/nodes/parsenodes.hpp +22 -9
  1321. package/src/duckdb/third_party/libpg_query/include/parser/gram.hpp +1041 -554
  1322. package/src/duckdb/third_party/libpg_query/include/parser/kwlist.hpp +1 -0
  1323. package/src/duckdb/third_party/libpg_query/postgres_parser.cpp +2 -1
  1324. package/src/duckdb/third_party/libpg_query/src_backend_parser_gram.cpp +21605 -21752
  1325. package/src/duckdb/third_party/libpg_query/src_backend_parser_scan.cpp +538 -299
  1326. package/src/duckdb/third_party/mbedtls/include/mbedtls/mbedtls_config.h +1 -0
  1327. package/src/duckdb/third_party/mbedtls/include/mbedtls_wrapper.hpp +36 -12
  1328. package/src/duckdb/third_party/mbedtls/library/md.cpp +6 -6
  1329. package/src/duckdb/third_party/mbedtls/library/sha1.cpp +2 -0
  1330. package/src/duckdb/third_party/mbedtls/library/sha256.cpp +3 -0
  1331. package/src/duckdb/third_party/mbedtls/mbedtls_wrapper.cpp +99 -47
  1332. package/src/duckdb/third_party/pcg/pcg_extras.hpp +1 -1
  1333. package/src/duckdb/third_party/re2/re2/prog.cc +2 -2
  1334. package/src/duckdb/third_party/snappy/snappy-internal.h +398 -0
  1335. package/src/duckdb/third_party/snappy/snappy-sinksource.cc +111 -9
  1336. package/src/duckdb/third_party/snappy/snappy-sinksource.h +158 -0
  1337. package/src/duckdb/third_party/snappy/snappy-stubs-internal.h +523 -3
  1338. package/src/duckdb/third_party/snappy/snappy-stubs-public.h +34 -1
  1339. package/src/duckdb/third_party/snappy/snappy.cc +2626 -0
  1340. package/src/duckdb/third_party/snappy/snappy.h +223 -0
  1341. package/src/duckdb/third_party/snappy/snappy_version.hpp +11 -0
  1342. package/src/duckdb/third_party/utf8proc/include/utf8proc.hpp +69 -101
  1343. package/src/duckdb/third_party/utf8proc/include/utf8proc_wrapper.hpp +53 -0
  1344. package/src/duckdb/third_party/utf8proc/utf8proc.cpp +627 -678
  1345. package/src/duckdb/third_party/utf8proc/utf8proc_data.cpp +15008 -12868
  1346. package/src/duckdb/third_party/utf8proc/utf8proc_wrapper.cpp +185 -29
  1347. package/src/duckdb/ub_extension_json_json_functions.cpp +6 -0
  1348. package/src/duckdb/ub_src_catalog_default.cpp +4 -0
  1349. package/src/duckdb/ub_src_common.cpp +7 -1
  1350. package/src/duckdb/ub_src_common_arrow.cpp +10 -0
  1351. package/src/duckdb/ub_src_common_enums.cpp +2 -0
  1352. package/src/duckdb/ub_src_common_tree_renderer.cpp +10 -0
  1353. package/src/duckdb/ub_src_common_types.cpp +2 -0
  1354. package/src/duckdb/ub_src_core_functions_aggregate_holistic.cpp +4 -0
  1355. package/src/duckdb/ub_src_core_functions_aggregate_nested.cpp +2 -0
  1356. package/src/duckdb/ub_src_core_functions_scalar_generic.cpp +2 -0
  1357. package/src/duckdb/ub_src_core_functions_scalar_list.cpp +2 -4
  1358. package/src/duckdb/ub_src_core_functions_scalar_map.cpp +2 -0
  1359. package/src/duckdb/ub_src_core_functions_scalar_string.cpp +4 -0
  1360. package/src/duckdb/ub_src_execution_index_art.cpp +5 -3
  1361. package/src/duckdb/ub_src_execution_operator_csv_scanner_scanner.cpp +2 -0
  1362. package/src/duckdb/ub_src_execution_operator_helper.cpp +4 -0
  1363. package/src/duckdb/ub_src_function.cpp +4 -0
  1364. package/src/duckdb/ub_src_function_cast.cpp +2 -0
  1365. package/src/duckdb/ub_src_function_scalar_generic.cpp +4 -0
  1366. package/src/duckdb/ub_src_function_scalar_list.cpp +0 -2
  1367. package/src/duckdb/ub_src_function_scalar_string.cpp +2 -0
  1368. package/src/duckdb/ub_src_function_table.cpp +2 -0
  1369. package/src/duckdb/ub_src_function_table_arrow.cpp +2 -0
  1370. package/src/duckdb/ub_src_function_table_system.cpp +2 -0
  1371. package/src/duckdb/ub_src_main.cpp +4 -0
  1372. package/src/duckdb/ub_src_main_buffered_data.cpp +4 -0
  1373. package/src/duckdb/ub_src_main_capi.cpp +10 -0
  1374. package/src/duckdb/ub_src_main_chunk_scan_state.cpp +2 -0
  1375. package/src/duckdb/ub_src_main_relation.cpp +2 -0
  1376. package/src/duckdb/ub_src_main_secret.cpp +2 -0
  1377. package/src/duckdb/ub_src_optimizer.cpp +8 -0
  1378. package/src/duckdb/ub_src_optimizer_compressed_materialization.cpp +2 -0
  1379. package/src/duckdb/ub_src_optimizer_pushdown.cpp +2 -0
  1380. package/src/duckdb/ub_src_optimizer_rule.cpp +2 -0
  1381. package/src/duckdb/ub_src_parallel.cpp +4 -0
  1382. package/src/duckdb/ub_src_parser_tableref.cpp +2 -0
  1383. package/src/duckdb/ub_src_planner.cpp +2 -0
  1384. package/src/duckdb/ub_src_planner_binder_expression.cpp +2 -0
  1385. package/src/duckdb/ub_src_planner_binder_tableref.cpp +4 -0
  1386. package/src/duckdb/ub_src_storage_statistics.cpp +0 -2
  1387. package/src/duckdb/ub_src_transaction.cpp +2 -0
  1388. package/test/columns.test.ts +1 -1
  1389. package/test/prepare.test.ts +1 -1
  1390. package/test/test_all_types.test.ts +1 -1
@@ -0,0 +1,1431 @@
1
+ /* Copyright 2014 Google Inc. All Rights Reserved.
2
+
3
+ Distributed under MIT license.
4
+ See file LICENSE for detail or copy at https://opensource.org/licenses/MIT
5
+ */
6
+
7
+ /* Brotli bit stream functions to support the low level format. There are no
8
+ compression algorithms here, just the right ordering of bits to match the
9
+ specs. */
10
+
11
+ #include "brotli_bit_stream.h"
12
+
13
+ #include <string.h> /* memcpy, memset */
14
+
15
+ #include <brotli/types.h>
16
+
17
+ #include "../common/brotli_constants.h"
18
+ #include "../common/context.h"
19
+ #include "../common/brotli_platform.h"
20
+ #include "entropy_encode.h"
21
+ #include "entropy_encode_static.h"
22
+ #include "fast_log.h"
23
+ #include "histogram.h"
24
+ #include "memory.h"
25
+ #include "write_bits.h"
26
+
27
+ using namespace duckdb_brotli;
28
+
29
/* Twice the command alphabet size plus one.
   NOTE(review): presumably the node budget for HuffmanTree scratch arrays;
   confirm against the callers that allocate them. */
#define MAX_HUFFMAN_TREE_SIZE (2 * BROTLI_NUM_COMMAND_SYMBOLS + 1)
/* Distance alphabet size when NPOSTFIX = 0 and NDIRECT = 0, i.e. the largest
   Huffman dictionary needed for distances in that configuration. */
#define MAX_SIMPLE_DISTANCE_ALPHABET_SIZE \
  BROTLI_DISTANCE_ALPHABET_SIZE(0, 0, BROTLI_LARGE_MAX_DISTANCE_BITS)
/* MAX_SIMPLE_DISTANCE_ALPHABET_SIZE == 140 */
35
+
36
+ static BROTLI_INLINE uint32_t BlockLengthPrefixCode(uint32_t len) {
37
+ uint32_t code = (len >= 177) ? (len >= 753 ? 20 : 14) : (len >= 41 ? 7 : 0);
38
+ while (code < (BROTLI_NUM_BLOCK_LEN_SYMBOLS - 1) &&
39
+ len >= _kBrotliPrefixCodeRanges[code + 1].offset) ++code;
40
+ return code;
41
+ }
42
+
43
+ static BROTLI_INLINE void GetBlockLengthPrefixCode(uint32_t len, size_t* code,
44
+ uint32_t* n_extra, uint32_t* extra) {
45
+ *code = BlockLengthPrefixCode(len);
46
+ *n_extra = _kBrotliPrefixCodeRanges[*code].nbits;
47
+ *extra = len - _kBrotliPrefixCodeRanges[*code].offset;
48
+ }
49
+
50
/* Remembers the two most recently emitted block types so that the next
   block type can be coded relative to them (see NextBlockTypeCode). */
struct BlockTypeCodeCalculator {
  size_t last_type;         /* most recent block type */
  size_t second_last_type;  /* block type before |last_type| */
};
54
+
55
+ static void InitBlockTypeCodeCalculator(BlockTypeCodeCalculator* self) {
56
+ self->last_type = 1;
57
+ self->second_last_type = 0;
58
+ }
59
+
60
+ static BROTLI_INLINE size_t NextBlockTypeCode(
61
+ BlockTypeCodeCalculator* calculator, uint8_t type) {
62
+ size_t type_code = (type == calculator->last_type + 1) ? 1u :
63
+ (type == calculator->second_last_type) ? 0u : type + 2u;
64
+ calculator->second_last_type = calculator->last_type;
65
+ calculator->last_type = type;
66
+ return type_code;
67
+ }
68
+
69
+ /* |nibblesbits| represents the 2 bits to encode MNIBBLES (0-3)
70
+ REQUIRES: length > 0
71
+ REQUIRES: length <= (1 << 24) */
72
+ static void BrotliEncodeMlen(size_t length, uint64_t* bits,
73
+ size_t* numbits, uint64_t* nibblesbits) {
74
+ size_t lg = (length == 1) ? 1 : Log2FloorNonZero((uint32_t)(length - 1)) + 1;
75
+ size_t mnibbles = (lg < 16 ? 16 : (lg + 3)) / 4;
76
+ BROTLI_DCHECK(length > 0);
77
+ BROTLI_DCHECK(length <= (1 << 24));
78
+ BROTLI_DCHECK(lg <= 24);
79
+ *nibblesbits = mnibbles - 4;
80
+ *numbits = mnibbles * 4;
81
+ *bits = length - 1;
82
+ }
83
+
84
+ static BROTLI_INLINE void StoreCommandExtra(
85
+ const Command* cmd, size_t* storage_ix, uint8_t* storage) {
86
+ uint32_t copylen_code = CommandCopyLenCode(cmd);
87
+ uint16_t inscode = GetInsertLengthCode(cmd->insert_len_);
88
+ uint16_t copycode = GetCopyLengthCode(copylen_code);
89
+ uint32_t insnumextra = GetInsertExtra(inscode);
90
+ uint64_t insextraval = cmd->insert_len_ - GetInsertBase(inscode);
91
+ uint64_t copyextraval = copylen_code - GetCopyBase(copycode);
92
+ uint64_t bits = (copyextraval << insnumextra) | insextraval;
93
+ BrotliWriteBits(
94
+ insnumextra + GetCopyExtra(copycode), bits, storage_ix, storage);
95
+ }
96
+
97
+ /* Data structure that stores almost everything that is needed to encode each
98
+ block switch command. */
99
+ typedef struct BlockSplitCode {
100
+ BlockTypeCodeCalculator type_code_calculator;
101
+ uint8_t type_depths[BROTLI_MAX_BLOCK_TYPE_SYMBOLS];
102
+ uint16_t type_bits[BROTLI_MAX_BLOCK_TYPE_SYMBOLS];
103
+ uint8_t length_depths[BROTLI_NUM_BLOCK_LEN_SYMBOLS];
104
+ uint16_t length_bits[BROTLI_NUM_BLOCK_LEN_SYMBOLS];
105
+ } BlockSplitCode;
106
+
107
+ /* Stores a number between 0 and 255. */
108
+ static void StoreVarLenUint8(size_t n, size_t* storage_ix, uint8_t* storage) {
109
+ if (n == 0) {
110
+ BrotliWriteBits(1, 0, storage_ix, storage);
111
+ } else {
112
+ size_t nbits = Log2FloorNonZero(n);
113
+ BrotliWriteBits(1, 1, storage_ix, storage);
114
+ BrotliWriteBits(3, nbits, storage_ix, storage);
115
+ BrotliWriteBits(nbits, n - ((size_t)1 << nbits), storage_ix, storage);
116
+ }
117
+ }
118
+
119
+ /* Stores the compressed meta-block header.
120
+ REQUIRES: length > 0
121
+ REQUIRES: length <= (1 << 24) */
122
+ static void StoreCompressedMetaBlockHeader(BROTLI_BOOL is_final_block,
123
+ size_t length,
124
+ size_t* storage_ix,
125
+ uint8_t* storage) {
126
+ uint64_t lenbits;
127
+ size_t nlenbits;
128
+ uint64_t nibblesbits;
129
+
130
+ /* Write ISLAST bit. */
131
+ BrotliWriteBits(1, (uint64_t)is_final_block, storage_ix, storage);
132
+ /* Write ISEMPTY bit. */
133
+ if (is_final_block) {
134
+ BrotliWriteBits(1, 0, storage_ix, storage);
135
+ }
136
+
137
+ BrotliEncodeMlen(length, &lenbits, &nlenbits, &nibblesbits);
138
+ BrotliWriteBits(2, nibblesbits, storage_ix, storage);
139
+ BrotliWriteBits(nlenbits, lenbits, storage_ix, storage);
140
+
141
+ if (!is_final_block) {
142
+ /* Write ISUNCOMPRESSED bit. */
143
+ BrotliWriteBits(1, 0, storage_ix, storage);
144
+ }
145
+ }
146
+
147
+ /* Stores the uncompressed meta-block header.
148
+ REQUIRES: length > 0
149
+ REQUIRES: length <= (1 << 24) */
150
+ static void BrotliStoreUncompressedMetaBlockHeader(size_t length,
151
+ size_t* storage_ix,
152
+ uint8_t* storage) {
153
+ uint64_t lenbits;
154
+ size_t nlenbits;
155
+ uint64_t nibblesbits;
156
+
157
+ /* Write ISLAST bit.
158
+ Uncompressed block cannot be the last one, so set to 0. */
159
+ BrotliWriteBits(1, 0, storage_ix, storage);
160
+ BrotliEncodeMlen(length, &lenbits, &nlenbits, &nibblesbits);
161
+ BrotliWriteBits(2, nibblesbits, storage_ix, storage);
162
+ BrotliWriteBits(nlenbits, lenbits, storage_ix, storage);
163
+ /* Write ISUNCOMPRESSED bit. */
164
+ BrotliWriteBits(1, 1, storage_ix, storage);
165
+ }
166
+
167
+ static void BrotliStoreHuffmanTreeOfHuffmanTreeToBitMask(
168
+ const int num_codes, const uint8_t* code_length_bitdepth,
169
+ size_t* storage_ix, uint8_t* storage) {
170
+ static const uint8_t kStorageOrder[BROTLI_CODE_LENGTH_CODES] = {
171
+ 1, 2, 3, 4, 0, 5, 17, 6, 16, 7, 8, 9, 10, 11, 12, 13, 14, 15
172
+ };
173
+ /* The bit lengths of the Huffman code over the code length alphabet
174
+ are compressed with the following static Huffman code:
175
+ Symbol Code
176
+ ------ ----
177
+ 0 00
178
+ 1 1110
179
+ 2 110
180
+ 3 01
181
+ 4 10
182
+ 5 1111 */
183
+ static const uint8_t kHuffmanBitLengthHuffmanCodeSymbols[6] = {
184
+ 0, 7, 3, 2, 1, 15
185
+ };
186
+ static const uint8_t kHuffmanBitLengthHuffmanCodeBitLengths[6] = {
187
+ 2, 4, 3, 2, 2, 4
188
+ };
189
+
190
+ size_t skip_some = 0; /* skips none. */
191
+
192
+ /* Throw away trailing zeros: */
193
+ size_t codes_to_store = BROTLI_CODE_LENGTH_CODES;
194
+ if (num_codes > 1) {
195
+ for (; codes_to_store > 0; --codes_to_store) {
196
+ if (code_length_bitdepth[kStorageOrder[codes_to_store - 1]] != 0) {
197
+ break;
198
+ }
199
+ }
200
+ }
201
+ if (code_length_bitdepth[kStorageOrder[0]] == 0 &&
202
+ code_length_bitdepth[kStorageOrder[1]] == 0) {
203
+ skip_some = 2; /* skips two. */
204
+ if (code_length_bitdepth[kStorageOrder[2]] == 0) {
205
+ skip_some = 3; /* skips three. */
206
+ }
207
+ }
208
+ BrotliWriteBits(2, skip_some, storage_ix, storage);
209
+ {
210
+ size_t i;
211
+ for (i = skip_some; i < codes_to_store; ++i) {
212
+ size_t l = code_length_bitdepth[kStorageOrder[i]];
213
+ BrotliWriteBits(kHuffmanBitLengthHuffmanCodeBitLengths[l],
214
+ kHuffmanBitLengthHuffmanCodeSymbols[l], storage_ix, storage);
215
+ }
216
+ }
217
+ }
218
+
219
+ static void BrotliStoreHuffmanTreeToBitMask(
220
+ const size_t huffman_tree_size, const uint8_t* huffman_tree,
221
+ const uint8_t* huffman_tree_extra_bits, const uint8_t* code_length_bitdepth,
222
+ const uint16_t* code_length_bitdepth_symbols,
223
+ size_t* BROTLI_RESTRICT storage_ix, uint8_t* BROTLI_RESTRICT storage) {
224
+ size_t i;
225
+ for (i = 0; i < huffman_tree_size; ++i) {
226
+ size_t ix = huffman_tree[i];
227
+ BrotliWriteBits(code_length_bitdepth[ix], code_length_bitdepth_symbols[ix],
228
+ storage_ix, storage);
229
+ /* Extra bits */
230
+ switch (ix) {
231
+ case BROTLI_REPEAT_PREVIOUS_CODE_LENGTH:
232
+ BrotliWriteBits(2, huffman_tree_extra_bits[i], storage_ix, storage);
233
+ break;
234
+ case BROTLI_REPEAT_ZERO_CODE_LENGTH:
235
+ BrotliWriteBits(3, huffman_tree_extra_bits[i], storage_ix, storage);
236
+ break;
237
+ }
238
+ }
239
+ }
240
+
241
+ static void StoreSimpleHuffmanTree(const uint8_t* depths,
242
+ size_t symbols[4],
243
+ size_t num_symbols,
244
+ size_t max_bits,
245
+ size_t* storage_ix, uint8_t* storage) {
246
+ /* value of 1 indicates a simple Huffman code */
247
+ BrotliWriteBits(2, 1, storage_ix, storage);
248
+ BrotliWriteBits(2, num_symbols - 1, storage_ix, storage); /* NSYM - 1 */
249
+
250
+ {
251
+ /* Sort */
252
+ size_t i;
253
+ for (i = 0; i < num_symbols; i++) {
254
+ size_t j;
255
+ for (j = i + 1; j < num_symbols; j++) {
256
+ if (depths[symbols[j]] < depths[symbols[i]]) {
257
+ BROTLI_SWAP(size_t, symbols, j, i);
258
+ }
259
+ }
260
+ }
261
+ }
262
+
263
+ if (num_symbols == 2) {
264
+ BrotliWriteBits(max_bits, symbols[0], storage_ix, storage);
265
+ BrotliWriteBits(max_bits, symbols[1], storage_ix, storage);
266
+ } else if (num_symbols == 3) {
267
+ BrotliWriteBits(max_bits, symbols[0], storage_ix, storage);
268
+ BrotliWriteBits(max_bits, symbols[1], storage_ix, storage);
269
+ BrotliWriteBits(max_bits, symbols[2], storage_ix, storage);
270
+ } else {
271
+ BrotliWriteBits(max_bits, symbols[0], storage_ix, storage);
272
+ BrotliWriteBits(max_bits, symbols[1], storage_ix, storage);
273
+ BrotliWriteBits(max_bits, symbols[2], storage_ix, storage);
274
+ BrotliWriteBits(max_bits, symbols[3], storage_ix, storage);
275
+ /* tree-select */
276
+ BrotliWriteBits(1, depths[symbols[0]] == 1 ? 1 : 0, storage_ix, storage);
277
+ }
278
+ }
279
+
280
+ /* num = alphabet size
281
+ depths = symbol depths */
282
+ void duckdb_brotli::BrotliStoreHuffmanTree(const uint8_t* depths, size_t num,
283
+ HuffmanTree* tree,
284
+ size_t* storage_ix, uint8_t* storage) {
285
+ /* Write the Huffman tree into the brotli-representation.
286
+ The command alphabet is the largest, so this allocation will fit all
287
+ alphabets. */
288
+ /* TODO(eustas): fix me */
289
+ uint8_t huffman_tree[BROTLI_NUM_COMMAND_SYMBOLS];
290
+ uint8_t huffman_tree_extra_bits[BROTLI_NUM_COMMAND_SYMBOLS];
291
+ size_t huffman_tree_size = 0;
292
+ uint8_t code_length_bitdepth[BROTLI_CODE_LENGTH_CODES] = { 0 };
293
+ uint16_t code_length_bitdepth_symbols[BROTLI_CODE_LENGTH_CODES];
294
+ uint32_t huffman_tree_histogram[BROTLI_CODE_LENGTH_CODES] = { 0 };
295
+ size_t i;
296
+ int num_codes = 0;
297
+ size_t code = 0;
298
+
299
+ BROTLI_DCHECK(num <= BROTLI_NUM_COMMAND_SYMBOLS);
300
+
301
+ BrotliWriteHuffmanTree(depths, num, &huffman_tree_size, huffman_tree,
302
+ huffman_tree_extra_bits);
303
+
304
+ /* Calculate the statistics of the Huffman tree in brotli-representation. */
305
+ for (i = 0; i < huffman_tree_size; ++i) {
306
+ ++huffman_tree_histogram[huffman_tree[i]];
307
+ }
308
+
309
+ for (i = 0; i < BROTLI_CODE_LENGTH_CODES; ++i) {
310
+ if (huffman_tree_histogram[i]) {
311
+ if (num_codes == 0) {
312
+ code = i;
313
+ num_codes = 1;
314
+ } else if (num_codes == 1) {
315
+ num_codes = 2;
316
+ break;
317
+ }
318
+ }
319
+ }
320
+
321
+ /* Calculate another Huffman tree to use for compressing both the
322
+ earlier Huffman tree with. */
323
+ BrotliCreateHuffmanTree(huffman_tree_histogram, BROTLI_CODE_LENGTH_CODES,
324
+ 5, tree, code_length_bitdepth);
325
+ BrotliConvertBitDepthsToSymbols(code_length_bitdepth,
326
+ BROTLI_CODE_LENGTH_CODES,
327
+ code_length_bitdepth_symbols);
328
+
329
+ /* Now, we have all the data, let's start storing it */
330
+ BrotliStoreHuffmanTreeOfHuffmanTreeToBitMask(num_codes, code_length_bitdepth,
331
+ storage_ix, storage);
332
+
333
+ if (num_codes == 1) {
334
+ code_length_bitdepth[code] = 0;
335
+ }
336
+
337
+ /* Store the real Huffman tree now. */
338
+ BrotliStoreHuffmanTreeToBitMask(huffman_tree_size,
339
+ huffman_tree,
340
+ huffman_tree_extra_bits,
341
+ code_length_bitdepth,
342
+ code_length_bitdepth_symbols,
343
+ storage_ix, storage);
344
+ }
345
+
346
+ /* Builds a Huffman tree from histogram[0:length] into depth[0:length] and
347
+ bits[0:length] and stores the encoded tree to the bit stream. */
348
+ static void BuildAndStoreHuffmanTree(const uint32_t* histogram,
349
+ const size_t histogram_length,
350
+ const size_t alphabet_size,
351
+ HuffmanTree* tree,
352
+ uint8_t* depth,
353
+ uint16_t* bits,
354
+ size_t* storage_ix,
355
+ uint8_t* storage) {
356
+ size_t count = 0;
357
+ size_t s4[4] = { 0 };
358
+ size_t i;
359
+ size_t max_bits = 0;
360
+ for (i = 0; i < histogram_length; i++) {
361
+ if (histogram[i]) {
362
+ if (count < 4) {
363
+ s4[count] = i;
364
+ } else if (count > 4) {
365
+ break;
366
+ }
367
+ count++;
368
+ }
369
+ }
370
+
371
+ {
372
+ size_t max_bits_counter = alphabet_size - 1;
373
+ while (max_bits_counter) {
374
+ max_bits_counter >>= 1;
375
+ ++max_bits;
376
+ }
377
+ }
378
+
379
+ if (count <= 1) {
380
+ BrotliWriteBits(4, 1, storage_ix, storage);
381
+ BrotliWriteBits(max_bits, s4[0], storage_ix, storage);
382
+ depth[s4[0]] = 0;
383
+ bits[s4[0]] = 0;
384
+ return;
385
+ }
386
+
387
+ memset(depth, 0, histogram_length * sizeof(depth[0]));
388
+ BrotliCreateHuffmanTree(histogram, histogram_length, 15, tree, depth);
389
+ BrotliConvertBitDepthsToSymbols(depth, histogram_length, bits);
390
+
391
+ if (count <= 4) {
392
+ StoreSimpleHuffmanTree(depth, s4, count, max_bits, storage_ix, storage);
393
+ } else {
394
+ BrotliStoreHuffmanTree(depth, histogram_length, tree, storage_ix, storage);
395
+ }
396
+ }
397
+
398
+ static BROTLI_INLINE BROTLI_BOOL SortHuffmanTree(
399
+ const HuffmanTree* v0, const HuffmanTree* v1) {
400
+ return TO_BROTLI_BOOL(v0->total_count_ < v1->total_count_);
401
+ }
402
+
403
+ void duckdb_brotli::BrotliBuildAndStoreHuffmanTreeFast(HuffmanTree* tree,
404
+ const uint32_t* histogram,
405
+ const size_t histogram_total,
406
+ const size_t max_bits,
407
+ uint8_t* depth, uint16_t* bits,
408
+ size_t* storage_ix,
409
+ uint8_t* storage) {
410
+ size_t count = 0;
411
+ size_t symbols[4] = { 0 };
412
+ size_t length = 0;
413
+ size_t total = histogram_total;
414
+ while (total != 0) {
415
+ if (histogram[length]) {
416
+ if (count < 4) {
417
+ symbols[count] = length;
418
+ }
419
+ ++count;
420
+ total -= histogram[length];
421
+ }
422
+ ++length;
423
+ }
424
+
425
+ if (count <= 1) {
426
+ BrotliWriteBits(4, 1, storage_ix, storage);
427
+ BrotliWriteBits(max_bits, symbols[0], storage_ix, storage);
428
+ depth[symbols[0]] = 0;
429
+ bits[symbols[0]] = 0;
430
+ return;
431
+ }
432
+
433
+ memset(depth, 0, length * sizeof(depth[0]));
434
+ {
435
+ uint32_t count_limit;
436
+ for (count_limit = 1; ; count_limit *= 2) {
437
+ HuffmanTree* node = tree;
438
+ size_t l;
439
+ for (l = length; l != 0;) {
440
+ --l;
441
+ if (histogram[l]) {
442
+ if (BROTLI_PREDICT_TRUE(histogram[l] >= count_limit)) {
443
+ InitHuffmanTree(node, histogram[l], -1, (int16_t)l);
444
+ } else {
445
+ InitHuffmanTree(node, count_limit, -1, (int16_t)l);
446
+ }
447
+ ++node;
448
+ }
449
+ }
450
+ {
451
+ const int n = (int)(node - tree);
452
+ HuffmanTree sentinel;
453
+ int i = 0; /* Points to the next leaf node. */
454
+ int j = n + 1; /* Points to the next non-leaf node. */
455
+ int k;
456
+
457
+ SortHuffmanTreeItems(tree, (size_t)n, SortHuffmanTree);
458
+ /* The nodes are:
459
+ [0, n): the sorted leaf nodes that we start with.
460
+ [n]: we add a sentinel here.
461
+ [n + 1, 2n): new parent nodes are added here, starting from
462
+ (n+1). These are naturally in ascending order.
463
+ [2n]: we add a sentinel at the end as well.
464
+ There will be (2n+1) elements at the end. */
465
+ InitHuffmanTree(&sentinel, BROTLI_UINT32_MAX, -1, -1);
466
+ *node++ = sentinel;
467
+ *node++ = sentinel;
468
+
469
+ for (k = n - 1; k > 0; --k) {
470
+ int left, right;
471
+ if (tree[i].total_count_ <= tree[j].total_count_) {
472
+ left = i;
473
+ ++i;
474
+ } else {
475
+ left = j;
476
+ ++j;
477
+ }
478
+ if (tree[i].total_count_ <= tree[j].total_count_) {
479
+ right = i;
480
+ ++i;
481
+ } else {
482
+ right = j;
483
+ ++j;
484
+ }
485
+ /* The sentinel node becomes the parent node. */
486
+ node[-1].total_count_ =
487
+ tree[left].total_count_ + tree[right].total_count_;
488
+ node[-1].index_left_ = (int16_t)left;
489
+ node[-1].index_right_or_value_ = (int16_t)right;
490
+ /* Add back the last sentinel node. */
491
+ *node++ = sentinel;
492
+ }
493
+ if (BrotliSetDepth(2 * n - 1, tree, depth, 14)) {
494
+ /* We need to pack the Huffman tree in 14 bits. If this was not
495
+ successful, add fake entities to the lowest values and retry. */
496
+ break;
497
+ }
498
+ }
499
+ }
500
+ }
501
+ BrotliConvertBitDepthsToSymbols(depth, length, bits);
502
+ if (count <= 4) {
503
+ size_t i;
504
+ /* value of 1 indicates a simple Huffman code */
505
+ BrotliWriteBits(2, 1, storage_ix, storage);
506
+ BrotliWriteBits(2, count - 1, storage_ix, storage); /* NSYM - 1 */
507
+
508
+ /* Sort */
509
+ for (i = 0; i < count; i++) {
510
+ size_t j;
511
+ for (j = i + 1; j < count; j++) {
512
+ if (depth[symbols[j]] < depth[symbols[i]]) {
513
+ BROTLI_SWAP(size_t, symbols, j, i);
514
+ }
515
+ }
516
+ }
517
+
518
+ if (count == 2) {
519
+ BrotliWriteBits(max_bits, symbols[0], storage_ix, storage);
520
+ BrotliWriteBits(max_bits, symbols[1], storage_ix, storage);
521
+ } else if (count == 3) {
522
+ BrotliWriteBits(max_bits, symbols[0], storage_ix, storage);
523
+ BrotliWriteBits(max_bits, symbols[1], storage_ix, storage);
524
+ BrotliWriteBits(max_bits, symbols[2], storage_ix, storage);
525
+ } else {
526
+ BrotliWriteBits(max_bits, symbols[0], storage_ix, storage);
527
+ BrotliWriteBits(max_bits, symbols[1], storage_ix, storage);
528
+ BrotliWriteBits(max_bits, symbols[2], storage_ix, storage);
529
+ BrotliWriteBits(max_bits, symbols[3], storage_ix, storage);
530
+ /* tree-select */
531
+ BrotliWriteBits(1, depth[symbols[0]] == 1 ? 1 : 0, storage_ix, storage);
532
+ }
533
+ } else {
534
+ uint8_t previous_value = 8;
535
+ size_t i;
536
+ /* Complex Huffman Tree */
537
+ StoreStaticCodeLengthCode(storage_ix, storage);
538
+
539
+ /* Actual RLE coding. */
540
+ for (i = 0; i < length;) {
541
+ const uint8_t value = depth[i];
542
+ size_t reps = 1;
543
+ size_t k;
544
+ for (k = i + 1; k < length && depth[k] == value; ++k) {
545
+ ++reps;
546
+ }
547
+ i += reps;
548
+ if (value == 0) {
549
+ BrotliWriteBits(kZeroRepsDepth[reps], kZeroRepsBits[reps],
550
+ storage_ix, storage);
551
+ } else {
552
+ if (previous_value != value) {
553
+ BrotliWriteBits(kCodeLengthDepth[value], kCodeLengthBits[value],
554
+ storage_ix, storage);
555
+ --reps;
556
+ }
557
+ if (reps < 3) {
558
+ while (reps != 0) {
559
+ reps--;
560
+ BrotliWriteBits(kCodeLengthDepth[value], kCodeLengthBits[value],
561
+ storage_ix, storage);
562
+ }
563
+ } else {
564
+ reps -= 3;
565
+ BrotliWriteBits(kNonZeroRepsDepth[reps], kNonZeroRepsBits[reps],
566
+ storage_ix, storage);
567
+ }
568
+ previous_value = value;
569
+ }
570
+ }
571
+ }
572
+ }
573
+
574
/* Returns the position of the first element of v[0..v_size) equal to `value`,
   or v_size when no element matches. */
static size_t IndexOf(const uint8_t* v, size_t v_size, uint8_t value) {
  size_t pos = 0;
  while (pos < v_size && v[pos] != value) {
    ++pos;
  }
  return pos;
}
581
+
582
/* Moves v[index] to position 0, shifting v[0..index) one slot to the right. */
static void MoveToFront(uint8_t* v, size_t index) {
  const uint8_t moved = v[index];
  size_t slot = index;
  while (slot > 0) {
    v[slot] = v[slot - 1];
    --slot;
  }
  v[0] = moved;
}
590
+
591
+ static void MoveToFrontTransform(const uint32_t* BROTLI_RESTRICT v_in,
592
+ const size_t v_size,
593
+ uint32_t* v_out) {
594
+ size_t i;
595
+ uint8_t mtf[256];
596
+ uint32_t max_value;
597
+ if (v_size == 0) {
598
+ return;
599
+ }
600
+ max_value = v_in[0];
601
+ for (i = 1; i < v_size; ++i) {
602
+ if (v_in[i] > max_value) max_value = v_in[i];
603
+ }
604
+ BROTLI_DCHECK(max_value < 256u);
605
+ for (i = 0; i <= max_value; ++i) {
606
+ mtf[i] = (uint8_t)i;
607
+ }
608
+ {
609
+ size_t mtf_size = max_value + 1;
610
+ for (i = 0; i < v_size; ++i) {
611
+ size_t index = IndexOf(mtf, mtf_size, (uint8_t)v_in[i]);
612
+ BROTLI_DCHECK(index < mtf_size);
613
+ v_out[i] = (uint32_t)index;
614
+ MoveToFront(mtf, index);
615
+ }
616
+ }
617
+ }
618
+
619
+ /* Finds runs of zeros in v[0..in_size) and replaces them with a prefix code of
620
+ the run length plus extra bits (lower 9 bits is the prefix code and the rest
621
+ are the extra bits). Non-zero values in v[] are shifted by
622
+ *max_length_prefix. Will not create prefix codes bigger than the initial
623
+ value of *max_run_length_prefix. The prefix code of run length L is simply
624
+ Log2Floor(L) and the number of extra bits is the same as the prefix code. */
625
+ static void RunLengthCodeZeros(const size_t in_size,
626
+ uint32_t* BROTLI_RESTRICT v, size_t* BROTLI_RESTRICT out_size,
627
+ uint32_t* BROTLI_RESTRICT max_run_length_prefix) {
628
+ uint32_t max_reps = 0;
629
+ size_t i;
630
+ uint32_t max_prefix;
631
+ for (i = 0; i < in_size;) {
632
+ uint32_t reps = 0;
633
+ for (; i < in_size && v[i] != 0; ++i) ;
634
+ for (; i < in_size && v[i] == 0; ++i) {
635
+ ++reps;
636
+ }
637
+ max_reps = BROTLI_MAX(uint32_t, reps, max_reps);
638
+ }
639
+ max_prefix = max_reps > 0 ? Log2FloorNonZero(max_reps) : 0;
640
+ max_prefix = BROTLI_MIN(uint32_t, max_prefix, *max_run_length_prefix);
641
+ *max_run_length_prefix = max_prefix;
642
+ *out_size = 0;
643
+ for (i = 0; i < in_size;) {
644
+ BROTLI_DCHECK(*out_size <= i);
645
+ if (v[i] != 0) {
646
+ v[*out_size] = v[i] + *max_run_length_prefix;
647
+ ++i;
648
+ ++(*out_size);
649
+ } else {
650
+ uint32_t reps = 1;
651
+ size_t k;
652
+ for (k = i + 1; k < in_size && v[k] == 0; ++k) {
653
+ ++reps;
654
+ }
655
+ i += reps;
656
+ while (reps != 0) {
657
+ if (reps < (2u << max_prefix)) {
658
+ uint32_t run_length_prefix = Log2FloorNonZero(reps);
659
+ const uint32_t extra_bits = reps - (1u << run_length_prefix);
660
+ v[*out_size] = run_length_prefix + (extra_bits << 9);
661
+ ++(*out_size);
662
+ break;
663
+ } else {
664
+ const uint32_t extra_bits = (1u << max_prefix) - 1u;
665
+ v[*out_size] = max_prefix + (extra_bits << 9);
666
+ reps -= (2u << max_prefix) - 1u;
667
+ ++(*out_size);
668
+ }
669
+ }
670
+ }
671
+ }
672
+ }
673
+
674
/* Number of low bits of an RLE symbol that hold the symbol itself; the bits above them carry the extra-bits value (EncodeContextMap masks and shifts with this constant). */
+ #define SYMBOL_BITS 9
675
+
676
/* Scratch buffers shared by EncodeContextMap and StoreTrivialContextMap so that they need no large local arrays. */
+ typedef struct EncodeContextMapArena {
677
+ uint32_t histogram[BROTLI_MAX_CONTEXT_MAP_SYMBOLS]; /* symbol frequencies */
678
+ uint8_t depths[BROTLI_MAX_CONTEXT_MAP_SYMBOLS]; /* code length per symbol */
679
+ uint16_t bits[BROTLI_MAX_CONTEXT_MAP_SYMBOLS]; /* code word per symbol */
680
+ } EncodeContextMapArena;
681
+
682
+ static void EncodeContextMap(MemoryManager* m,
683
+ EncodeContextMapArena* arena,
684
+ const uint32_t* context_map,
685
+ size_t context_map_size,
686
+ size_t num_clusters,
687
+ HuffmanTree* tree,
688
+ size_t* storage_ix, uint8_t* storage) {
689
+ size_t i;
690
+ uint32_t* rle_symbols;
691
+ uint32_t max_run_length_prefix = 6;
692
+ size_t num_rle_symbols = 0;
693
+ uint32_t* BROTLI_RESTRICT const histogram = arena->histogram;
694
+ static const uint32_t kSymbolMask = (1u << SYMBOL_BITS) - 1u;
695
+ uint8_t* BROTLI_RESTRICT const depths = arena->depths;
696
+ uint16_t* BROTLI_RESTRICT const bits = arena->bits;
697
+
698
+ StoreVarLenUint8(num_clusters - 1, storage_ix, storage);
699
+
700
+ if (num_clusters == 1) {
701
+ return;
702
+ }
703
+
704
+ rle_symbols = BROTLI_ALLOC(m, uint32_t, context_map_size);
705
+ if (BROTLI_IS_OOM(m) || BROTLI_IS_NULL(rle_symbols)) return;
706
+ MoveToFrontTransform(context_map, context_map_size, rle_symbols);
707
+ RunLengthCodeZeros(context_map_size, rle_symbols,
708
+ &num_rle_symbols, &max_run_length_prefix);
709
+ memset(histogram, 0, sizeof(arena->histogram));
710
+ for (i = 0; i < num_rle_symbols; ++i) {
711
+ ++histogram[rle_symbols[i] & kSymbolMask];
712
+ }
713
+ {
714
+ BROTLI_BOOL use_rle = TO_BROTLI_BOOL(max_run_length_prefix > 0);
715
+ BrotliWriteBits(1, (uint64_t)use_rle, storage_ix, storage);
716
+ if (use_rle) {
717
+ BrotliWriteBits(4, max_run_length_prefix - 1, storage_ix, storage);
718
+ }
719
+ }
720
+ BuildAndStoreHuffmanTree(histogram, num_clusters + max_run_length_prefix,
721
+ num_clusters + max_run_length_prefix,
722
+ tree, depths, bits, storage_ix, storage);
723
+ for (i = 0; i < num_rle_symbols; ++i) {
724
+ const uint32_t rle_symbol = rle_symbols[i] & kSymbolMask;
725
+ const uint32_t extra_bits_val = rle_symbols[i] >> SYMBOL_BITS;
726
+ BrotliWriteBits(depths[rle_symbol], bits[rle_symbol], storage_ix, storage);
727
+ if (rle_symbol > 0 && rle_symbol <= max_run_length_prefix) {
728
+ BrotliWriteBits(rle_symbol, extra_bits_val, storage_ix, storage);
729
+ }
730
+ }
731
+ BrotliWriteBits(1, 1, storage_ix, storage); /* use move-to-front */
732
+ BROTLI_FREE(m, rle_symbols);
733
+ }
734
+
735
+ /* Stores the block switch command with index block_ix to the bit stream. */
736
+ static BROTLI_INLINE void StoreBlockSwitch(BlockSplitCode* code,
737
+ const uint32_t block_len,
738
+ const uint8_t block_type,
739
+ BROTLI_BOOL is_first_block,
740
+ size_t* storage_ix,
741
+ uint8_t* storage) {
742
+ size_t typecode = NextBlockTypeCode(&code->type_code_calculator, block_type);
743
+ size_t lencode;
744
+ uint32_t len_nextra;
745
+ uint32_t len_extra;
746
+ if (!is_first_block) {
747
+ BrotliWriteBits(code->type_depths[typecode], code->type_bits[typecode],
748
+ storage_ix, storage);
749
+ }
750
+ GetBlockLengthPrefixCode(block_len, &lencode, &len_nextra, &len_extra);
751
+
752
+ BrotliWriteBits(code->length_depths[lencode], code->length_bits[lencode],
753
+ storage_ix, storage);
754
+ BrotliWriteBits(len_nextra, len_extra, storage_ix, storage);
755
+ }
756
+
757
+ /* Builds a BlockSplitCode data structure from the block split given by the
758
+ vector of block types and block lengths and stores it to the bit stream. */
759
+ static void BuildAndStoreBlockSplitCode(const uint8_t* types,
760
+ const uint32_t* lengths,
761
+ const size_t num_blocks,
762
+ const size_t num_types,
763
+ HuffmanTree* tree,
764
+ BlockSplitCode* code,
765
+ size_t* storage_ix,
766
+ uint8_t* storage) {
767
+ uint32_t type_histo[BROTLI_MAX_BLOCK_TYPE_SYMBOLS];
768
+ uint32_t length_histo[BROTLI_NUM_BLOCK_LEN_SYMBOLS];
769
+ size_t i;
770
+ BlockTypeCodeCalculator type_code_calculator;
771
+ memset(type_histo, 0, (num_types + 2) * sizeof(type_histo[0]));
772
+ memset(length_histo, 0, sizeof(length_histo));
773
+ InitBlockTypeCodeCalculator(&type_code_calculator);
774
+ for (i = 0; i < num_blocks; ++i) {
775
+ size_t type_code = NextBlockTypeCode(&type_code_calculator, types[i]);
776
+ if (i != 0) ++type_histo[type_code];
777
+ ++length_histo[BlockLengthPrefixCode(lengths[i])];
778
+ }
779
+ StoreVarLenUint8(num_types - 1, storage_ix, storage);
780
+ if (num_types > 1) { /* TODO(eustas): else? could StoreBlockSwitch occur? */
781
+ BuildAndStoreHuffmanTree(&type_histo[0], num_types + 2, num_types + 2, tree,
782
+ &code->type_depths[0], &code->type_bits[0],
783
+ storage_ix, storage);
784
+ BuildAndStoreHuffmanTree(&length_histo[0], BROTLI_NUM_BLOCK_LEN_SYMBOLS,
785
+ BROTLI_NUM_BLOCK_LEN_SYMBOLS,
786
+ tree, &code->length_depths[0],
787
+ &code->length_bits[0], storage_ix, storage);
788
+ StoreBlockSwitch(code, lengths[0], types[0], 1, storage_ix, storage);
789
+ }
790
+ }
791
+
792
+ /* Stores a context map where the histogram type is always the block type. */
793
+ static void StoreTrivialContextMap(EncodeContextMapArena* arena,
794
+ size_t num_types,
795
+ size_t context_bits,
796
+ HuffmanTree* tree,
797
+ size_t* storage_ix,
798
+ uint8_t* storage) {
799
+ StoreVarLenUint8(num_types - 1, storage_ix, storage);
800
+ if (num_types > 1) {
801
+ size_t repeat_code = context_bits - 1u;
802
+ size_t repeat_bits = (1u << repeat_code) - 1u;
803
+ size_t alphabet_size = num_types + repeat_code;
804
+ uint32_t* BROTLI_RESTRICT const histogram = arena->histogram;
805
+ uint8_t* BROTLI_RESTRICT const depths = arena->depths;
806
+ uint16_t* BROTLI_RESTRICT const bits = arena->bits;
807
+ size_t i;
808
+ memset(histogram, 0, alphabet_size * sizeof(histogram[0]));
809
+ /* Write RLEMAX. */
810
+ BrotliWriteBits(1, 1, storage_ix, storage);
811
+ BrotliWriteBits(4, repeat_code - 1, storage_ix, storage);
812
+ histogram[repeat_code] = (uint32_t)num_types;
813
+ histogram[0] = 1;
814
+ for (i = context_bits; i < alphabet_size; ++i) {
815
+ histogram[i] = 1;
816
+ }
817
+ BuildAndStoreHuffmanTree(histogram, alphabet_size, alphabet_size,
818
+ tree, depths, bits, storage_ix, storage);
819
+ for (i = 0; i < num_types; ++i) {
820
+ size_t code = (i == 0 ? 0 : i + context_bits - 1);
821
+ BrotliWriteBits(depths[code], bits[code], storage_ix, storage);
822
+ BrotliWriteBits(
823
+ depths[repeat_code], bits[repeat_code], storage_ix, storage);
824
+ BrotliWriteBits(repeat_code, repeat_bits, storage_ix, storage);
825
+ }
826
+ /* Write IMTF (inverse-move-to-front) bit. */
827
+ BrotliWriteBits(1, 1, storage_ix, storage);
828
+ }
829
+ }
830
+
831
+ /* Manages the encoding of one block category (literal, command or distance). */
832
+ typedef struct BlockEncoder {
833
+ size_t histogram_length_; /* stride between consecutive histograms in depths_ / bits_ */
834
+ size_t num_block_types_;
835
+ const uint8_t* block_types_; /* Not owned. */
836
+ const uint32_t* block_lengths_; /* Not owned. */
837
+ size_t num_blocks_;
838
+ BlockSplitCode block_split_code_; /* prefix codes used for block-switch commands */
839
+ size_t block_ix_; /* index of the block currently being written */
840
+ size_t block_len_; /* symbols left in the current block; a switch is emitted at 0 */
841
+ size_t entropy_ix_; /* offset derived from the current block type (see StoreSymbol / StoreSymbolWithContext) */
842
+ uint8_t* depths_; /* code lengths; allocated by BuildAndStoreEntropyCodes*, freed by CleanupBlockEncoder */
843
+ uint16_t* bits_; /* code words; same ownership as depths_ */
844
+ } BlockEncoder;
845
+
846
+ static void InitBlockEncoder(BlockEncoder* self, size_t histogram_length,
847
+ size_t num_block_types, const uint8_t* block_types,
848
+ const uint32_t* block_lengths, const size_t num_blocks) {
849
+ self->histogram_length_ = histogram_length;
850
+ self->num_block_types_ = num_block_types;
851
+ self->block_types_ = block_types;
852
+ self->block_lengths_ = block_lengths;
853
+ self->num_blocks_ = num_blocks;
854
+ InitBlockTypeCodeCalculator(&self->block_split_code_.type_code_calculator);
855
+ self->block_ix_ = 0;
856
+ self->block_len_ = num_blocks == 0 ? 0 : block_lengths[0];
857
+ self->entropy_ix_ = 0;
858
+ self->depths_ = 0;
859
+ self->bits_ = 0;
860
+ }
861
+
862
/* Releases the depth and bit tables of `self` through memory manager `m`. */
+ static void CleanupBlockEncoder(MemoryManager* m, BlockEncoder* self) {
863
+ BROTLI_FREE(m, self->depths_);
864
+ BROTLI_FREE(m, self->bits_);
865
+ }
866
+
867
+ /* Creates entropy codes of block lengths and block types and stores them
868
+ to the bit stream. */
869
+ static void BuildAndStoreBlockSwitchEntropyCodes(BlockEncoder* self,
870
+ HuffmanTree* tree, size_t* storage_ix, uint8_t* storage) {
871
+ BuildAndStoreBlockSplitCode(self->block_types_, self->block_lengths_,
872
+ self->num_blocks_, self->num_block_types_, tree, &self->block_split_code_,
873
+ storage_ix, storage);
874
+ }
875
+
876
+ /* Stores the next symbol with the entropy code of the current block type.
877
+ Updates the block type and block length at block boundaries. */
878
+ static void StoreSymbol(BlockEncoder* self, size_t symbol, size_t* storage_ix,
879
+ uint8_t* storage) {
880
+ if (self->block_len_ == 0) {
881
+ size_t block_ix = ++self->block_ix_;
882
+ uint32_t block_len = self->block_lengths_[block_ix];
883
+ uint8_t block_type = self->block_types_[block_ix];
884
+ self->block_len_ = block_len;
885
+ self->entropy_ix_ = block_type * self->histogram_length_;
886
+ StoreBlockSwitch(&self->block_split_code_, block_len, block_type, 0,
887
+ storage_ix, storage);
888
+ }
889
+ --self->block_len_;
890
+ {
891
+ size_t ix = self->entropy_ix_ + symbol;
892
+ BrotliWriteBits(self->depths_[ix], self->bits_[ix], storage_ix, storage);
893
+ }
894
+ }
895
+
896
+ /* Stores the next symbol with the entropy code of the current block type and
897
+ context value.
898
+ Updates the block type and block length at block boundaries. */
899
+ static void StoreSymbolWithContext(BlockEncoder* self, size_t symbol,
900
+ size_t context, const uint32_t* context_map, size_t* storage_ix,
901
+ uint8_t* storage, const size_t context_bits) {
902
+ if (self->block_len_ == 0) {
903
+ size_t block_ix = ++self->block_ix_;
904
+ uint32_t block_len = self->block_lengths_[block_ix];
905
+ uint8_t block_type = self->block_types_[block_ix];
906
+ self->block_len_ = block_len;
907
+ self->entropy_ix_ = (size_t)block_type << context_bits;
908
+ StoreBlockSwitch(&self->block_split_code_, block_len, block_type, 0,
909
+ storage_ix, storage);
910
+ }
911
+ --self->block_len_;
912
+ {
913
+ size_t histo_ix = context_map[self->entropy_ix_ + context];
914
+ size_t ix = histo_ix * self->histogram_length_ + symbol;
915
+ BrotliWriteBits(self->depths_[ix], self->bits_[ix], storage_ix, storage);
916
+ }
917
+ }
918
+
919
+ #define FN(X) X ## Literal
920
+ /* NOLINTNEXTLINE(build/include) */
921
+ /* NOLINT(build/header_guard) */
922
+ /* Copyright 2014 Google Inc. All Rights Reserved.
923
+
924
+ Distributed under MIT license.
925
+ See file LICENSE for detail or copy at https://opensource.org/licenses/MIT
926
+ */
927
+
928
+ /* template parameters: FN */
929
+
930
+ #define HistogramType FN(Histogram)
931
+
932
+ /* Creates entropy codes for all block types and stores them to the bit
933
+ stream. */
934
+ static void FN(BuildAndStoreEntropyCodes)(MemoryManager* m, BlockEncoder* self,
935
+ const HistogramType* histograms, const size_t histograms_size,
936
+ const size_t alphabet_size, HuffmanTree* tree,
937
+ size_t* storage_ix, uint8_t* storage) {
938
+ const size_t table_size = histograms_size * self->histogram_length_;
939
+ self->depths_ = BROTLI_ALLOC(m, uint8_t, table_size);
940
+ self->bits_ = BROTLI_ALLOC(m, uint16_t, table_size);
941
+ if (BROTLI_IS_OOM(m)) return;
942
+
943
+ {
944
+ size_t i;
945
+ for (i = 0; i < histograms_size; ++i) {
946
+ size_t ix = i * self->histogram_length_;
947
+ BuildAndStoreHuffmanTree(&histograms[i].data_[0], self->histogram_length_,
948
+ alphabet_size, tree, &self->depths_[ix], &self->bits_[ix],
949
+ storage_ix, storage);
950
+ }
951
+ }
952
+ }
953
+
954
+ #undef HistogramType
955
+ #undef FN
956
+
957
+ #define FN(X) X ## Command
958
+ /* NOLINTNEXTLINE(build/include) */
959
+ /* NOLINT(build/header_guard) */
960
+ /* Copyright 2014 Google Inc. All Rights Reserved.
961
+
962
+ Distributed under MIT license.
963
+ See file LICENSE for detail or copy at https://opensource.org/licenses/MIT
964
+ */
965
+
966
+ /* template parameters: FN */
967
+
968
+ #define HistogramType FN(Histogram)
969
+
970
+ /* Creates entropy codes for all block types and stores them to the bit
971
+ stream. */
972
+ static void FN(BuildAndStoreEntropyCodes)(MemoryManager* m, BlockEncoder* self,
973
+ const HistogramType* histograms, const size_t histograms_size,
974
+ const size_t alphabet_size, HuffmanTree* tree,
975
+ size_t* storage_ix, uint8_t* storage) {
976
+ const size_t table_size = histograms_size * self->histogram_length_;
977
+ self->depths_ = BROTLI_ALLOC(m, uint8_t, table_size);
978
+ self->bits_ = BROTLI_ALLOC(m, uint16_t, table_size);
979
+ if (BROTLI_IS_OOM(m)) return;
980
+
981
+ {
982
+ size_t i;
983
+ for (i = 0; i < histograms_size; ++i) {
984
+ size_t ix = i * self->histogram_length_;
985
+ BuildAndStoreHuffmanTree(&histograms[i].data_[0], self->histogram_length_,
986
+ alphabet_size, tree, &self->depths_[ix], &self->bits_[ix],
987
+ storage_ix, storage);
988
+ }
989
+ }
990
+ }
991
+
992
+ #undef HistogramType
993
+ #undef FN
994
+
995
+ #define FN(X) X ## Distance
996
+ /* NOLINTNEXTLINE(build/include) */
997
+ /* NOLINT(build/header_guard) */
998
+ /* Copyright 2014 Google Inc. All Rights Reserved.
999
+
1000
+ Distributed under MIT license.
1001
+ See file LICENSE for detail or copy at https://opensource.org/licenses/MIT
1002
+ */
1003
+
1004
+ /* template parameters: FN */
1005
+
1006
+ #define HistogramType FN(Histogram)
1007
+
1008
+ /* Creates entropy codes for all block types and stores them to the bit
1009
+ stream. */
1010
+ static void FN(BuildAndStoreEntropyCodes)(MemoryManager* m, BlockEncoder* self,
1011
+ const HistogramType* histograms, const size_t histograms_size,
1012
+ const size_t alphabet_size, HuffmanTree* tree,
1013
+ size_t* storage_ix, uint8_t* storage) {
1014
+ const size_t table_size = histograms_size * self->histogram_length_;
1015
+ self->depths_ = BROTLI_ALLOC(m, uint8_t, table_size);
1016
+ self->bits_ = BROTLI_ALLOC(m, uint16_t, table_size);
1017
+ if (BROTLI_IS_OOM(m)) return;
1018
+
1019
+ {
1020
+ size_t i;
1021
+ for (i = 0; i < histograms_size; ++i) {
1022
+ size_t ix = i * self->histogram_length_;
1023
+ BuildAndStoreHuffmanTree(&histograms[i].data_[0], self->histogram_length_,
1024
+ alphabet_size, tree, &self->depths_[ix], &self->bits_[ix],
1025
+ storage_ix, storage);
1026
+ }
1027
+ }
1028
+ }
1029
+
1030
+ #undef HistogramType
1031
+ #undef FN
1032
+
1033
/* Rounds *storage_ix up to the next multiple of 8 bits and clears the byte at
   the new position, so that subsequent bit writes start from a zeroed byte.

   storage_ix  in/out bit position inside `storage`.
   storage     output buffer; storage[*storage_ix / 8] must be writable after
               rounding. */
static void JumpToByteBoundary(size_t* storage_ix, uint8_t* storage) {
  /* Build the mask in size_t width. With `~7u` the mask is a 32-bit unsigned
     value that is zero-extended when combined with a 64-bit size_t, which
     would silently clear the upper half of large bit positions. */
  const size_t kByteMask = ~(size_t)7;
  *storage_ix = (*storage_ix + 7u) & kByteMask;
  storage[*storage_ix >> 3] = 0;
}
1037
+
1038
/* Working state of BrotliStoreMetaBlock, obtained with a single allocation. */
+ typedef struct StoreMetablockArena {
1039
+ BlockEncoder literal_enc; /* encoder for literal symbols */
1040
+ BlockEncoder command_enc; /* encoder for command symbols */
1041
+ BlockEncoder distance_enc; /* encoder for distance symbols */
1042
+ EncodeContextMapArena context_map_arena; /* scratch reused for both context maps */
1043
+ } StoreMetablockArena;
1044
+
1045
+ void duckdb_brotli::BrotliStoreMetaBlock(MemoryManager* m,
1046
+ const uint8_t* input, size_t start_pos, size_t length, size_t mask,
1047
+ uint8_t prev_byte, uint8_t prev_byte2, BROTLI_BOOL is_last,
1048
+ const BrotliEncoderParams* params, ContextType literal_context_mode,
1049
+ const Command* commands, size_t n_commands, const MetaBlockSplit* mb,
1050
+ size_t* storage_ix, uint8_t* storage) {
1051
+
1052
+ size_t pos = start_pos;
1053
+ size_t i;
1054
+ uint32_t num_distance_symbols = params->dist.alphabet_size_max;
1055
+ uint32_t num_effective_distance_symbols = params->dist.alphabet_size_limit;
1056
+ HuffmanTree* tree;
1057
+ ContextLut literal_context_lut = BROTLI_CONTEXT_LUT(literal_context_mode);
1058
+ StoreMetablockArena* arena = NULL;
1059
+ BlockEncoder* literal_enc = NULL;
1060
+ BlockEncoder* command_enc = NULL;
1061
+ BlockEncoder* distance_enc = NULL;
1062
+ const BrotliDistanceParams* dist = &params->dist;
1063
+ BROTLI_DCHECK(
1064
+ num_effective_distance_symbols <= BROTLI_NUM_HISTOGRAM_DISTANCE_SYMBOLS);
1065
+
1066
+ StoreCompressedMetaBlockHeader(is_last, length, storage_ix, storage);
1067
+
1068
+ tree = BROTLI_ALLOC(m, HuffmanTree, MAX_HUFFMAN_TREE_SIZE);
1069
+ arena = BROTLI_ALLOC(m, StoreMetablockArena, 1);
1070
+ if (BROTLI_IS_OOM(m) || BROTLI_IS_NULL(tree) || BROTLI_IS_NULL(arena)) return;
1071
+ literal_enc = &arena->literal_enc;
1072
+ command_enc = &arena->command_enc;
1073
+ distance_enc = &arena->distance_enc;
1074
+ InitBlockEncoder(literal_enc, BROTLI_NUM_LITERAL_SYMBOLS,
1075
+ mb->literal_split.num_types, mb->literal_split.types,
1076
+ mb->literal_split.lengths, mb->literal_split.num_blocks);
1077
+ InitBlockEncoder(command_enc, BROTLI_NUM_COMMAND_SYMBOLS,
1078
+ mb->command_split.num_types, mb->command_split.types,
1079
+ mb->command_split.lengths, mb->command_split.num_blocks);
1080
+ InitBlockEncoder(distance_enc, num_effective_distance_symbols,
1081
+ mb->distance_split.num_types, mb->distance_split.types,
1082
+ mb->distance_split.lengths, mb->distance_split.num_blocks);
1083
+
1084
+ BuildAndStoreBlockSwitchEntropyCodes(literal_enc, tree, storage_ix, storage);
1085
+ BuildAndStoreBlockSwitchEntropyCodes(command_enc, tree, storage_ix, storage);
1086
+ BuildAndStoreBlockSwitchEntropyCodes(distance_enc, tree, storage_ix, storage);
1087
+
1088
+ BrotliWriteBits(2, dist->distance_postfix_bits, storage_ix, storage);
1089
+ BrotliWriteBits(
1090
+ 4, dist->num_direct_distance_codes >> dist->distance_postfix_bits,
1091
+ storage_ix, storage);
1092
+ for (i = 0; i < mb->literal_split.num_types; ++i) {
1093
+ BrotliWriteBits(2, literal_context_mode, storage_ix, storage);
1094
+ }
1095
+
1096
+ if (mb->literal_context_map_size == 0) {
1097
+ StoreTrivialContextMap(
1098
+ &arena->context_map_arena, mb->literal_histograms_size,
1099
+ BROTLI_LITERAL_CONTEXT_BITS, tree, storage_ix, storage);
1100
+ } else {
1101
+ EncodeContextMap(m, &arena->context_map_arena,
1102
+ mb->literal_context_map, mb->literal_context_map_size,
1103
+ mb->literal_histograms_size, tree, storage_ix, storage);
1104
+ if (BROTLI_IS_OOM(m)) return;
1105
+ }
1106
+
1107
+ if (mb->distance_context_map_size == 0) {
1108
+ StoreTrivialContextMap(
1109
+ &arena->context_map_arena, mb->distance_histograms_size,
1110
+ BROTLI_DISTANCE_CONTEXT_BITS, tree, storage_ix, storage);
1111
+ } else {
1112
+ EncodeContextMap(m, &arena->context_map_arena,
1113
+ mb->distance_context_map, mb->distance_context_map_size,
1114
+ mb->distance_histograms_size, tree, storage_ix, storage);
1115
+ if (BROTLI_IS_OOM(m)) return;
1116
+ }
1117
+
1118
+ BuildAndStoreEntropyCodesLiteral(m, literal_enc, mb->literal_histograms,
1119
+ mb->literal_histograms_size, BROTLI_NUM_LITERAL_SYMBOLS, tree,
1120
+ storage_ix, storage);
1121
+ if (BROTLI_IS_OOM(m)) return;
1122
+ BuildAndStoreEntropyCodesCommand(m, command_enc, mb->command_histograms,
1123
+ mb->command_histograms_size, BROTLI_NUM_COMMAND_SYMBOLS, tree,
1124
+ storage_ix, storage);
1125
+ if (BROTLI_IS_OOM(m)) return;
1126
+ BuildAndStoreEntropyCodesDistance(m, distance_enc, mb->distance_histograms,
1127
+ mb->distance_histograms_size, num_distance_symbols, tree,
1128
+ storage_ix, storage);
1129
+ if (BROTLI_IS_OOM(m)) return;
1130
+ BROTLI_FREE(m, tree);
1131
+
1132
+ for (i = 0; i < n_commands; ++i) {
1133
+ const Command cmd = commands[i];
1134
+ size_t cmd_code = cmd.cmd_prefix_;
1135
+ StoreSymbol(command_enc, cmd_code, storage_ix, storage);
1136
+ StoreCommandExtra(&cmd, storage_ix, storage);
1137
+ if (mb->literal_context_map_size == 0) {
1138
+ size_t j;
1139
+ for (j = cmd.insert_len_; j != 0; --j) {
1140
+ StoreSymbol(literal_enc, input[pos & mask], storage_ix, storage);
1141
+ ++pos;
1142
+ }
1143
+ } else {
1144
+ size_t j;
1145
+ for (j = cmd.insert_len_; j != 0; --j) {
1146
+ size_t context =
1147
+ BROTLI_CONTEXT(prev_byte, prev_byte2, literal_context_lut);
1148
+ uint8_t literal = input[pos & mask];
1149
+ StoreSymbolWithContext(literal_enc, literal, context,
1150
+ mb->literal_context_map, storage_ix, storage,
1151
+ BROTLI_LITERAL_CONTEXT_BITS);
1152
+ prev_byte2 = prev_byte;
1153
+ prev_byte = literal;
1154
+ ++pos;
1155
+ }
1156
+ }
1157
+ pos += CommandCopyLen(&cmd);
1158
+ if (CommandCopyLen(&cmd)) {
1159
+ prev_byte2 = input[(pos - 2) & mask];
1160
+ prev_byte = input[(pos - 1) & mask];
1161
+ if (cmd.cmd_prefix_ >= 128) {
1162
+ size_t dist_code = cmd.dist_prefix_ & 0x3FF;
1163
+ uint32_t distnumextra = cmd.dist_prefix_ >> 10;
1164
+ uint64_t distextra = cmd.dist_extra_;
1165
+ if (mb->distance_context_map_size == 0) {
1166
+ StoreSymbol(distance_enc, dist_code, storage_ix, storage);
1167
+ } else {
1168
+ size_t context = CommandDistanceContext(&cmd);
1169
+ StoreSymbolWithContext(distance_enc, dist_code, context,
1170
+ mb->distance_context_map, storage_ix, storage,
1171
+ BROTLI_DISTANCE_CONTEXT_BITS);
1172
+ }
1173
+ BrotliWriteBits(distnumextra, distextra, storage_ix, storage);
1174
+ }
1175
+ }
1176
+ }
1177
+ CleanupBlockEncoder(m, distance_enc);
1178
+ CleanupBlockEncoder(m, command_enc);
1179
+ CleanupBlockEncoder(m, literal_enc);
1180
+ BROTLI_FREE(m, arena);
1181
+ if (is_last) {
1182
+ JumpToByteBoundary(storage_ix, storage);
1183
+ }
1184
+ }
1185
+
1186
+ static void BuildHistograms(const uint8_t* input,
1187
+ size_t start_pos,
1188
+ size_t mask,
1189
+ const Command* commands,
1190
+ size_t n_commands,
1191
+ HistogramLiteral* lit_histo,
1192
+ HistogramCommand* cmd_histo,
1193
+ HistogramDistance* dist_histo) {
1194
+ size_t pos = start_pos;
1195
+ size_t i;
1196
+ for (i = 0; i < n_commands; ++i) {
1197
+ const Command cmd = commands[i];
1198
+ size_t j;
1199
+ HistogramAddCommand(cmd_histo, cmd.cmd_prefix_);
1200
+ for (j = cmd.insert_len_; j != 0; --j) {
1201
+ HistogramAddLiteral(lit_histo, input[pos & mask]);
1202
+ ++pos;
1203
+ }
1204
+ pos += CommandCopyLen(&cmd);
1205
+ if (CommandCopyLen(&cmd) && cmd.cmd_prefix_ >= 128) {
1206
+ HistogramAddDistance(dist_histo, cmd.dist_prefix_ & 0x3FF);
1207
+ }
1208
+ }
1209
+ }
1210
+
1211
+ static void StoreDataWithHuffmanCodes(const uint8_t* input,
1212
+ size_t start_pos,
1213
+ size_t mask,
1214
+ const Command* commands,
1215
+ size_t n_commands,
1216
+ const uint8_t* lit_depth,
1217
+ const uint16_t* lit_bits,
1218
+ const uint8_t* cmd_depth,
1219
+ const uint16_t* cmd_bits,
1220
+ const uint8_t* dist_depth,
1221
+ const uint16_t* dist_bits,
1222
+ size_t* storage_ix,
1223
+ uint8_t* storage) {
1224
+ size_t pos = start_pos;
1225
+ size_t i;
1226
+ for (i = 0; i < n_commands; ++i) {
1227
+ const Command cmd = commands[i];
1228
+ const size_t cmd_code = cmd.cmd_prefix_;
1229
+ size_t j;
1230
+ BrotliWriteBits(
1231
+ cmd_depth[cmd_code], cmd_bits[cmd_code], storage_ix, storage);
1232
+ StoreCommandExtra(&cmd, storage_ix, storage);
1233
+ for (j = cmd.insert_len_; j != 0; --j) {
1234
+ const uint8_t literal = input[pos & mask];
1235
+ BrotliWriteBits(
1236
+ lit_depth[literal], lit_bits[literal], storage_ix, storage);
1237
+ ++pos;
1238
+ }
1239
+ pos += CommandCopyLen(&cmd);
1240
+ if (CommandCopyLen(&cmd) && cmd.cmd_prefix_ >= 128) {
1241
+ const size_t dist_code = cmd.dist_prefix_ & 0x3FF;
1242
+ const uint32_t distnumextra = cmd.dist_prefix_ >> 10;
1243
+ const uint32_t distextra = cmd.dist_extra_;
1244
+ BrotliWriteBits(dist_depth[dist_code], dist_bits[dist_code],
1245
+ storage_ix, storage);
1246
+ BrotliWriteBits(distnumextra, distextra, storage_ix, storage);
1247
+ }
1248
+ }
1249
+ }
1250
+
1251
+ /* TODO(eustas): pull alloc/dealloc to caller? */
1252
/* Working state of BrotliStoreMetaBlockTrivial / BrotliStoreMetaBlockFast, obtained with a single allocation. */
+ typedef struct MetablockArena {
1253
+ HistogramLiteral lit_histo; /* literal symbol frequencies */
1254
+ HistogramCommand cmd_histo; /* command symbol frequencies */
1255
+ HistogramDistance dist_histo; /* distance symbol frequencies */
1256
+ /* TODO(eustas): merge bits and depth? */
1257
+ uint8_t lit_depth[BROTLI_NUM_LITERAL_SYMBOLS]; /* code length per literal */
1258
+ uint16_t lit_bits[BROTLI_NUM_LITERAL_SYMBOLS]; /* code word per literal */
1259
+ uint8_t cmd_depth[BROTLI_NUM_COMMAND_SYMBOLS]; /* code length per command symbol */
1260
+ uint16_t cmd_bits[BROTLI_NUM_COMMAND_SYMBOLS]; /* code word per command symbol */
1261
+ uint8_t dist_depth[MAX_SIMPLE_DISTANCE_ALPHABET_SIZE]; /* code length per distance symbol */
1262
+ uint16_t dist_bits[MAX_SIMPLE_DISTANCE_ALPHABET_SIZE]; /* code word per distance symbol */
1263
+ HuffmanTree tree[MAX_HUFFMAN_TREE_SIZE]; /* scratch for prefix-code construction */
1264
+ } MetablockArena;
1265
+
1266
+ void duckdb_brotli::BrotliStoreMetaBlockTrivial(MemoryManager* m,
1267
+ const uint8_t* input, size_t start_pos, size_t length, size_t mask,
1268
+ BROTLI_BOOL is_last, const BrotliEncoderParams* params,
1269
+ const Command* commands, size_t n_commands,
1270
+ size_t* storage_ix, uint8_t* storage) {
1271
+ MetablockArena* arena = BROTLI_ALLOC(m, MetablockArena, 1);
1272
+ uint32_t num_distance_symbols = params->dist.alphabet_size_max;
1273
+ if (BROTLI_IS_OOM(m) || BROTLI_IS_NULL(arena)) return;
1274
+
1275
+ StoreCompressedMetaBlockHeader(is_last, length, storage_ix, storage);
1276
+
1277
+ HistogramClearLiteral(&arena->lit_histo);
1278
+ HistogramClearCommand(&arena->cmd_histo);
1279
+ HistogramClearDistance(&arena->dist_histo);
1280
+
1281
+ BuildHistograms(input, start_pos, mask, commands, n_commands,
1282
+ &arena->lit_histo, &arena->cmd_histo, &arena->dist_histo);
1283
+
1284
+ BrotliWriteBits(13, 0, storage_ix, storage);
1285
+
1286
+ BuildAndStoreHuffmanTree(arena->lit_histo.data_, BROTLI_NUM_LITERAL_SYMBOLS,
1287
+ BROTLI_NUM_LITERAL_SYMBOLS, arena->tree,
1288
+ arena->lit_depth, arena->lit_bits,
1289
+ storage_ix, storage);
1290
+ BuildAndStoreHuffmanTree(arena->cmd_histo.data_, BROTLI_NUM_COMMAND_SYMBOLS,
1291
+ BROTLI_NUM_COMMAND_SYMBOLS, arena->tree,
1292
+ arena->cmd_depth, arena->cmd_bits,
1293
+ storage_ix, storage);
1294
+ BuildAndStoreHuffmanTree(arena->dist_histo.data_,
1295
+ MAX_SIMPLE_DISTANCE_ALPHABET_SIZE,
1296
+ num_distance_symbols, arena->tree,
1297
+ arena->dist_depth, arena->dist_bits,
1298
+ storage_ix, storage);
1299
+ StoreDataWithHuffmanCodes(input, start_pos, mask, commands,
1300
+ n_commands, arena->lit_depth, arena->lit_bits,
1301
+ arena->cmd_depth, arena->cmd_bits,
1302
+ arena->dist_depth, arena->dist_bits,
1303
+ storage_ix, storage);
1304
+ BROTLI_FREE(m, arena);
1305
+ if (is_last) {
1306
+ JumpToByteBoundary(storage_ix, storage);
1307
+ }
1308
+ }
1309
+
1310
+ void duckdb_brotli::BrotliStoreMetaBlockFast(MemoryManager* m,
1311
+ const uint8_t* input, size_t start_pos, size_t length, size_t mask,
1312
+ BROTLI_BOOL is_last, const BrotliEncoderParams* params,
1313
+ const Command* commands, size_t n_commands,
1314
+ size_t* storage_ix, uint8_t* storage) {
1315
+ MetablockArena* arena = BROTLI_ALLOC(m, MetablockArena, 1);
1316
+ uint32_t num_distance_symbols = params->dist.alphabet_size_max;
1317
+ uint32_t distance_alphabet_bits =
1318
+ Log2FloorNonZero(num_distance_symbols - 1) + 1;
1319
+ if (BROTLI_IS_OOM(m) || BROTLI_IS_NULL(arena)) return;
1320
+
1321
+ StoreCompressedMetaBlockHeader(is_last, length, storage_ix, storage);
1322
+
1323
+ BrotliWriteBits(13, 0, storage_ix, storage);
1324
+
1325
+ if (n_commands <= 128) {
1326
+ uint32_t histogram[BROTLI_NUM_LITERAL_SYMBOLS] = { 0 };
1327
+ size_t pos = start_pos;
1328
+ size_t num_literals = 0;
1329
+ size_t i;
1330
+ for (i = 0; i < n_commands; ++i) {
1331
+ const Command cmd = commands[i];
1332
+ size_t j;
1333
+ for (j = cmd.insert_len_; j != 0; --j) {
1334
+ ++histogram[input[pos & mask]];
1335
+ ++pos;
1336
+ }
1337
+ num_literals += cmd.insert_len_;
1338
+ pos += CommandCopyLen(&cmd);
1339
+ }
1340
+ BrotliBuildAndStoreHuffmanTreeFast(arena->tree, histogram, num_literals,
1341
+ /* max_bits = */ 8,
1342
+ arena->lit_depth, arena->lit_bits,
1343
+ storage_ix, storage);
1344
+ StoreStaticCommandHuffmanTree(storage_ix, storage);
1345
+ StoreStaticDistanceHuffmanTree(storage_ix, storage);
1346
+ StoreDataWithHuffmanCodes(input, start_pos, mask, commands,
1347
+ n_commands, arena->lit_depth, arena->lit_bits,
1348
+ kStaticCommandCodeDepth,
1349
+ kStaticCommandCodeBits,
1350
+ kStaticDistanceCodeDepth,
1351
+ kStaticDistanceCodeBits,
1352
+ storage_ix, storage);
1353
+ } else {
1354
+ HistogramClearLiteral(&arena->lit_histo);
1355
+ HistogramClearCommand(&arena->cmd_histo);
1356
+ HistogramClearDistance(&arena->dist_histo);
1357
+ BuildHistograms(input, start_pos, mask, commands, n_commands,
1358
+ &arena->lit_histo, &arena->cmd_histo, &arena->dist_histo);
1359
+ BrotliBuildAndStoreHuffmanTreeFast(arena->tree, arena->lit_histo.data_,
1360
+ arena->lit_histo.total_count_,
1361
+ /* max_bits = */ 8,
1362
+ arena->lit_depth, arena->lit_bits,
1363
+ storage_ix, storage);
1364
+ BrotliBuildAndStoreHuffmanTreeFast(arena->tree, arena->cmd_histo.data_,
1365
+ arena->cmd_histo.total_count_,
1366
+ /* max_bits = */ 10,
1367
+ arena->cmd_depth, arena->cmd_bits,
1368
+ storage_ix, storage);
1369
+ BrotliBuildAndStoreHuffmanTreeFast(arena->tree, arena->dist_histo.data_,
1370
+ arena->dist_histo.total_count_,
1371
+ /* max_bits = */
1372
+ distance_alphabet_bits,
1373
+ arena->dist_depth, arena->dist_bits,
1374
+ storage_ix, storage);
1375
+ StoreDataWithHuffmanCodes(input, start_pos, mask, commands,
1376
+ n_commands, arena->lit_depth, arena->lit_bits,
1377
+ arena->cmd_depth, arena->cmd_bits,
1378
+ arena->dist_depth, arena->dist_bits,
1379
+ storage_ix, storage);
1380
+ }
1381
+
1382
+ BROTLI_FREE(m, arena);
1383
+
1384
+ if (is_last) {
1385
+ JumpToByteBoundary(storage_ix, storage);
1386
+ }
1387
+ }
1388
+
1389
+ /* This is for storing uncompressed blocks (simple raw storage of
1390
+ bytes-as-bytes). */
1391
+ void duckdb_brotli::BrotliStoreUncompressedMetaBlock(BROTLI_BOOL is_final_block,
1392
+ const uint8_t* BROTLI_RESTRICT input,
1393
+ size_t position, size_t mask,
1394
+ size_t len,
1395
+ size_t* BROTLI_RESTRICT storage_ix,
1396
+ uint8_t* BROTLI_RESTRICT storage) {
1397
+ size_t masked_pos = position & mask;
1398
+ BrotliStoreUncompressedMetaBlockHeader(len, storage_ix, storage);
1399
+ JumpToByteBoundary(storage_ix, storage);
1400
+
1401
+ if (masked_pos + len > mask + 1) {
1402
+ size_t len1 = mask + 1 - masked_pos;
1403
+ memcpy(&storage[*storage_ix >> 3], &input[masked_pos], len1);
1404
+ *storage_ix += len1 << 3;
1405
+ len -= len1;
1406
+ masked_pos = 0;
1407
+ }
1408
+ memcpy(&storage[*storage_ix >> 3], &input[masked_pos], len);
1409
+ *storage_ix += len << 3;
1410
+
1411
+ /* We need to clear the next 4 bytes to continue to be
1412
+ compatible with BrotliWriteBits. */
1413
+ BrotliWriteBitsPrepareStorage(*storage_ix, storage);
1414
+
1415
+ /* Since the uncompressed block itself may not be the final block, add an
1416
+ empty one after this. */
1417
+ if (is_final_block) {
1418
+ BrotliWriteBits(1, 1, storage_ix, storage); /* islast */
1419
+ BrotliWriteBits(1, 1, storage_ix, storage); /* isempty */
1420
+ JumpToByteBoundary(storage_ix, storage);
1421
+ }
1422
+ }
1423
+
1424
#ifdef BROTLI_TEST
/* Test-only wrapper, compiled when BROTLI_TEST is defined, that forwards all
   of its arguments unchanged to GetBlockLengthPrefixCode. */
void GetBlockLengthPrefixCodeForTest(uint32_t len, size_t* code,
    uint32_t* n_extra, uint32_t* extra) {
  GetBlockLengthPrefixCode(len, code, n_extra, extra);
}
#endif  /* BROTLI_TEST */
1430
+
1431
+