duckdb 0.7.1-dev240.0 → 0.7.1-dev320.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (60) hide show
  1. package/README.md +1 -1
  2. package/package.json +3 -3
  3. package/src/duckdb/extension/json/json_scan.cpp +1 -4
  4. package/src/duckdb/extension/parquet/column_reader.cpp +7 -0
  5. package/src/duckdb/extension/parquet/include/column_reader.hpp +1 -0
  6. package/src/duckdb/extension/parquet/parquet-extension.cpp +2 -10
  7. package/src/duckdb/src/catalog/catalog.cpp +62 -13
  8. package/src/duckdb/src/catalog/catalog_entry/index_catalog_entry.cpp +8 -7
  9. package/src/duckdb/src/catalog/default/default_views.cpp +1 -1
  10. package/src/duckdb/src/common/file_system.cpp +23 -9
  11. package/src/duckdb/src/common/local_file_system.cpp +4 -4
  12. package/src/duckdb/src/execution/index/art/art.cpp +117 -67
  13. package/src/duckdb/src/execution/index/art/art_key.cpp +24 -12
  14. package/src/duckdb/src/execution/index/art/leaf.cpp +7 -8
  15. package/src/duckdb/src/execution/index/art/node.cpp +13 -27
  16. package/src/duckdb/src/execution/index/art/node16.cpp +5 -8
  17. package/src/duckdb/src/execution/index/art/node256.cpp +3 -5
  18. package/src/duckdb/src/execution/index/art/node4.cpp +4 -7
  19. package/src/duckdb/src/execution/index/art/node48.cpp +5 -8
  20. package/src/duckdb/src/execution/index/art/prefix.cpp +2 -3
  21. package/src/duckdb/src/execution/operator/helper/physical_reset.cpp +1 -9
  22. package/src/duckdb/src/execution/operator/helper/physical_set.cpp +1 -9
  23. package/src/duckdb/src/function/pragma/pragma_queries.cpp +2 -2
  24. package/src/duckdb/src/function/scalar/generic/current_setting.cpp +2 -2
  25. package/src/duckdb/src/function/table/read_csv.cpp +3 -5
  26. package/src/duckdb/src/function/table/table_scan.cpp +3 -0
  27. package/src/duckdb/src/function/table/version/pragma_version.cpp +2 -2
  28. package/src/duckdb/src/include/duckdb/catalog/catalog.hpp +7 -1
  29. package/src/duckdb/src/include/duckdb/catalog/catalog_entry/duck_index_entry.hpp +1 -1
  30. package/src/duckdb/src/include/duckdb/catalog/catalog_entry/index_catalog_entry.hpp +1 -1
  31. package/src/duckdb/src/include/duckdb/common/enums/wal_type.hpp +3 -0
  32. package/src/duckdb/src/include/duckdb/common/file_system.hpp +1 -1
  33. package/src/duckdb/src/include/duckdb/execution/index/art/art.hpp +37 -41
  34. package/src/duckdb/src/include/duckdb/execution/index/art/art_key.hpp +8 -11
  35. package/src/duckdb/src/include/duckdb/main/{extension_functions.hpp → extension_entries.hpp} +26 -5
  36. package/src/duckdb/src/include/duckdb/main/extension_helper.hpp +3 -0
  37. package/src/duckdb/src/include/duckdb/planner/binder.hpp +3 -0
  38. package/src/duckdb/src/include/duckdb/planner/expression_binder/index_binder.hpp +10 -3
  39. package/src/duckdb/src/include/duckdb/storage/data_table.hpp +7 -1
  40. package/src/duckdb/src/include/duckdb/storage/index.hpp +47 -38
  41. package/src/duckdb/src/include/duckdb/storage/write_ahead_log.hpp +7 -0
  42. package/src/duckdb/src/main/database.cpp +4 -2
  43. package/src/duckdb/src/main/extension/extension_load.cpp +22 -3
  44. package/src/duckdb/src/parser/parsed_data/create_index_info.cpp +3 -0
  45. package/src/duckdb/src/planner/binder/statement/bind_create_table.cpp +13 -0
  46. package/src/duckdb/src/planner/expression_binder/index_binder.cpp +32 -1
  47. package/src/duckdb/src/storage/buffer_manager.cpp +30 -3
  48. package/src/duckdb/src/storage/compression/bitpacking.cpp +16 -7
  49. package/src/duckdb/src/storage/data_table.cpp +66 -3
  50. package/src/duckdb/src/storage/index.cpp +1 -1
  51. package/src/duckdb/src/storage/local_storage.cpp +1 -1
  52. package/src/duckdb/src/storage/table_index_list.cpp +1 -2
  53. package/src/duckdb/src/storage/wal_replay.cpp +68 -0
  54. package/src/duckdb/src/storage/write_ahead_log.cpp +21 -1
  55. package/src/duckdb/src/transaction/commit_state.cpp +5 -2
  56. package/src/duckdb/third_party/concurrentqueue/blockingconcurrentqueue.h +2 -2
  57. package/src/statement.cpp +46 -12
  58. package/test/arrow.test.ts +3 -3
  59. package/test/prepare.test.ts +39 -1
  60. package/test/typescript_decls.test.ts +1 -1
@@ -28,24 +28,24 @@ public:
28
28
 
29
29
  public:
30
30
  template <class T>
31
- static inline Key CreateKey(ArenaAllocator &allocator, T element) {
31
+ static inline Key CreateKey(ArenaAllocator &allocator, const LogicalType &type, T element) {
32
32
  auto data = Key::CreateData<T>(allocator, element);
33
33
  return Key(data, sizeof(element));
34
34
  }
35
35
 
36
36
  template <class T>
37
- static inline Key CreateKey(ArenaAllocator &allocator, const Value &element) {
38
- return CreateKey(allocator, element.GetValueUnsafe<T>());
37
+ static inline Key CreateKey(ArenaAllocator &allocator, const LogicalType &type, const Value &element) {
38
+ return CreateKey(allocator, type, element.GetValueUnsafe<T>());
39
39
  }
40
40
 
41
41
  template <class T>
42
- static inline void CreateKey(ArenaAllocator &allocator, Key &key, T element) {
42
+ static inline void CreateKey(ArenaAllocator &allocator, const LogicalType &type, Key &key, T element) {
43
43
  key.data = Key::CreateData<T>(allocator, element);
44
44
  key.len = sizeof(element);
45
45
  }
46
46
 
47
47
  template <class T>
48
- static inline void CreateKey(ArenaAllocator &allocator, Key &key, const Value element) {
48
+ static inline void CreateKey(ArenaAllocator &allocator, const LogicalType &type, Key &key, const Value element) {
49
49
  key.data = Key::CreateData<T>(allocator, element.GetValueUnsafe<T>());
50
50
  key.len = sizeof(element);
51
51
  }
@@ -76,12 +76,9 @@ private:
76
76
  };
77
77
 
78
78
  template <>
79
- Key Key::CreateKey(ArenaAllocator &allocator, string_t value);
79
+ Key Key::CreateKey(ArenaAllocator &allocator, const LogicalType &type, string_t value);
80
80
  template <>
81
- Key Key::CreateKey(ArenaAllocator &allocator, const char *value);
81
+ Key Key::CreateKey(ArenaAllocator &allocator, const LogicalType &type, const char *value);
82
82
  template <>
83
- void Key::CreateKey(ArenaAllocator &allocator, Key &key, string_t value);
84
- template <>
85
- void Key::CreateKey(ArenaAllocator &allocator, Key &key, const char *value);
86
-
83
+ void Key::CreateKey(ArenaAllocator &allocator, const LogicalType &type, Key &key, string_t value);
87
84
  } // namespace duckdb
@@ -1,7 +1,7 @@
1
1
  //===----------------------------------------------------------------------===//
2
2
  // DuckDB
3
3
  //
4
- // duckdb/main/extension_functions.hpp
4
+ // duckdb/main/extension_entries.hpp
5
5
  //
6
6
  //
7
7
  //===----------------------------------------------------------------------===//
@@ -12,12 +12,12 @@
12
12
 
13
13
  namespace duckdb {
14
14
 
15
- struct ExtensionFunction {
16
- char function[48];
15
+ struct ExtensionEntry {
16
+ char name[48];
17
17
  char extension[48];
18
18
  };
19
19
 
20
- static constexpr ExtensionFunction EXTENSION_FUNCTIONS[] = {
20
+ static constexpr ExtensionEntry EXTENSION_FUNCTIONS[] = {
21
21
  {"->>", "json"},
22
22
  {"array_to_json", "json"},
23
23
  {"create_fts_index", "fts"},
@@ -30,9 +30,9 @@ static constexpr ExtensionFunction EXTENSION_FUNCTIONS[] = {
30
30
  {"from_json", "json"},
31
31
  {"from_json_strict", "json"},
32
32
  {"from_substrait", "substrait"},
33
+ {"from_substrait_json", "substrait"},
33
34
  {"get_substrait", "substrait"},
34
35
  {"get_substrait_json", "substrait"},
35
- {"from_substrait_json", "substrait"},
36
36
  {"icu_calendar_names", "icu"},
37
37
  {"icu_sort_key", "icu"},
38
38
  {"json", "json"},
@@ -88,4 +88,25 @@ static constexpr ExtensionFunction EXTENSION_FUNCTIONS[] = {
88
88
  {"visualize_json_profiling_output", "visualizer"},
89
89
  {"visualize_last_profiling_output", "visualizer"},
90
90
  };
91
+
92
+ static constexpr ExtensionEntry EXTENSION_SETTINGS[] = {
93
+ {"binary_as_string", "parquet"},
94
+ {"calendar", "icu"},
95
+ {"http_retries", "httpfs"},
96
+ {"http_retry_backoff", "httpfs"},
97
+ {"http_retry_wait_ms", "httpfs"},
98
+ {"http_timeout", "httpfs"},
99
+ {"s3_access_key_id", "httpfs"},
100
+ {"s3_endpoint", "httpfs"},
101
+ {"s3_region", "httpfs"},
102
+ {"s3_secret_access_key", "httpfs"},
103
+ {"s3_session_token", "httpfs"},
104
+ {"s3_uploader_max_filesize", "httpfs"},
105
+ {"s3_uploader_max_parts_per_file", "httpfs"},
106
+ {"s3_uploader_thread_limit", "httpfs"},
107
+ {"s3_url_style", "httpfs"},
108
+ {"s3_use_ssl", "httpfs"},
109
+ {"sqlite_all_varchar", "sqlite_scanner"},
110
+ {"timezone", "icu"},
111
+ };
91
112
  } // namespace duckdb
@@ -62,6 +62,9 @@ public:
62
62
  //! Apply any known extension aliases
63
63
  static string ApplyExtensionAlias(string extension_name);
64
64
 
65
+ static string GetExtensionName(const string &extension);
66
+ static bool IsFullPath(const string &extension);
67
+
65
68
  private:
66
69
  static const vector<string> PathComponents();
67
70
  static ExtensionInitResult InitialLoad(DBConfig &context, FileOpener *opener, const string &extension);
@@ -108,6 +108,9 @@ public:
108
108
 
109
109
  unique_ptr<BoundCreateTableInfo> BindCreateTableInfo(unique_ptr<CreateInfo> info);
110
110
  unique_ptr<BoundCreateTableInfo> BindCreateTableInfo(unique_ptr<CreateInfo> info, SchemaCatalogEntry *schema);
111
+
112
+ vector<unique_ptr<Expression>> BindCreateIndexExpressions(TableCatalogEntry *table, CreateIndexInfo *info);
113
+
111
114
  void BindCreateViewInfo(CreateViewInfo &base);
112
115
  SchemaCatalogEntry *BindSchema(CreateInfo &info);
113
116
  SchemaCatalogEntry *BindCreateFunctionInfo(CreateInfo &info);
@@ -10,20 +10,27 @@
10
10
 
11
11
  #include "duckdb/planner/expression_binder.hpp"
12
12
  #include "duckdb/common/unordered_map.hpp"
13
+ #include "duckdb/parser/parsed_data/create_index_info.hpp"
14
+ #include "duckdb/catalog/catalog_entry/table_catalog_entry.hpp"
13
15
 
14
16
  namespace duckdb {
15
17
  class BoundColumnRefExpression;
16
18
 
17
- //! The INDEX binder is responsible for binding an expression within an Index statement
19
+ //! The IndexBinder is responsible for binding an expression within an index statement
18
20
  class IndexBinder : public ExpressionBinder {
19
21
  public:
20
- IndexBinder(Binder &binder, ClientContext &context);
22
+ IndexBinder(Binder &binder, ClientContext &context, TableCatalogEntry *table = nullptr,
23
+ CreateIndexInfo *info = nullptr);
21
24
 
22
25
  protected:
23
26
  BindResult BindExpression(unique_ptr<ParsedExpression> *expr_ptr, idx_t depth,
24
27
  bool root_expression = false) override;
25
-
26
28
  string UnsupportedAggregateMessage() override;
29
+
30
+ private:
31
+ // only for WAL replay
32
+ TableCatalogEntry *table;
33
+ CreateIndexInfo *info;
27
34
  };
28
35
 
29
36
  } // namespace duckdb
@@ -122,6 +122,12 @@ public:
122
122
  void UpdateColumn(TableCatalogEntry &table, ClientContext &context, Vector &row_ids,
123
123
  const vector<column_t> &column_path, DataChunk &updates);
124
124
 
125
+ //! Add an index to the DataTable. NOTE: for CREATE (UNIQUE) INDEX statements, we use the PhysicalCreateIndex
126
+ //! operator. This function is only used during the WAL replay, and is a much less performant index creation
127
+ //! approach.
128
+ void WALAddIndex(ClientContext &context, unique_ptr<Index> index,
129
+ const vector<unique_ptr<Expression>> &expressions);
130
+
125
131
  //! Fetches an append lock
126
132
  void AppendLock(TableAppendState &state);
127
133
  //! Begin appending structs to this table, obtaining necessary locks, etc
@@ -176,7 +182,7 @@ public:
176
182
  static bool IsForeignKeyIndex(const vector<PhysicalIndex> &fk_keys, Index &index, ForeignKeyType fk_type);
177
183
 
178
184
  //! Initializes a special scan that is used to create an index on the table, it keeps locks on the table
179
- void InitializeCreateIndexScan(CreateIndexScanState &state, const vector<column_t> &column_ids);
185
+ void InitializeWALCreateIndexScan(CreateIndexScanState &state, const vector<column_t> &column_ids);
180
186
  //! Scans the next chunk for the CREATE INDEX operator
181
187
  bool CreateIndexScan(TableScanState &state, DataChunk &result, TableScanType type);
182
188
 
@@ -40,11 +40,11 @@ public:
40
40
  IndexType type;
41
41
  //! Associated table io manager
42
42
  TableIOManager &table_io_manager;
43
- //! Column identifiers to extract from the base table
43
+ //! Column identifiers to extract key columns from the base table
44
44
  vector<column_t> column_ids;
45
- //! Unordered_set of column_ids used by the index
45
+ //! Unordered set of column_ids used by the index
46
46
  unordered_set<column_t> column_id_set;
47
- //! Unbound expressions used by the index
47
+ //! Unbound expressions used by the index during optimizations
48
48
  vector<unique_ptr<Expression>> unbound_expressions;
49
49
  //! The physical types stored in the index
50
50
  vector<PhysicalType> types;
@@ -64,94 +64,103 @@ public:
64
64
  bool track_memory;
65
65
 
66
66
  public:
67
- //! Initialize a scan on the index with the given expression and column ids
68
- //! to fetch from the base table when we only have one query predicate
67
+ //! Initialize a single predicate scan on the index with the given expression and column IDs
69
68
  virtual unique_ptr<IndexScanState> InitializeScanSinglePredicate(const Transaction &transaction, const Value &value,
70
69
  ExpressionType expressionType) = 0;
71
- //! Initialize a scan on the index with the given expression and column ids
72
- //! to fetch from the base table for two query predicates
70
+ //! Initialize a two predicate scan on the index with the given expression and column IDs
73
71
  virtual unique_ptr<IndexScanState> InitializeScanTwoPredicates(Transaction &transaction, const Value &low_value,
74
72
  ExpressionType low_expression_type,
75
73
  const Value &high_value,
76
74
  ExpressionType high_expression_type) = 0;
77
- //! Perform a lookup on the index, fetching up to max_count result ids. Returns true if all row ids were fetched,
78
- //! and false otherwise.
75
+ //! Performs a lookup on the index, fetching up to max_count result IDs. Returns true if all row IDs were fetched,
76
+ //! and false otherwise
79
77
  virtual bool Scan(Transaction &transaction, DataTable &table, IndexScanState &state, idx_t max_count,
80
78
  vector<row_t> &result_ids) = 0;
81
79
 
82
80
  //! Obtain a lock on the index
83
81
  virtual void InitializeLock(IndexLock &state);
84
- //! Called when data is appended to the index. The lock obtained from InitializeAppend must be held
82
+ //! Called when data is appended to the index. The lock obtained from InitializeLock must be held
85
83
  virtual bool Append(IndexLock &state, DataChunk &entries, Vector &row_identifiers) = 0;
84
+ //! Obtains a lock and calls Append while holding that lock
86
85
  bool Append(DataChunk &entries, Vector &row_identifiers);
87
- //! Verify that data can be appended to the index
86
+ //! Verify that data can be appended to the index without a constraint violation
88
87
  virtual void VerifyAppend(DataChunk &chunk) = 0;
89
- //! Verify that data can be appended to the index
88
+ //! Verify that data can be appended to the index without a constraint violation using the conflict manager
90
89
  virtual void VerifyAppend(DataChunk &chunk, ConflictManager &conflict_manager) = 0;
91
- //! Verify that data can be appended to the index for foreign key constraint
92
- virtual void VerifyAppendForeignKey(DataChunk &chunk) = 0;
93
- //! Verify that data can be delete from the index for foreign key constraint
94
- virtual void VerifyDeleteForeignKey(DataChunk &chunk) = 0;
90
+ //! Performs constraint checking for a chunk of input data
91
+ virtual void CheckConstraintsForChunk(DataChunk &input, ConflictManager &conflict_manager) = 0;
95
92
 
96
- //! Called when data inside the index is Deleted
93
+ //! Delete a chunk of entries from the index. The lock obtained from InitializeLock must be held
97
94
  virtual void Delete(IndexLock &state, DataChunk &entries, Vector &row_identifiers) = 0;
95
+ //! Obtains a lock and calls Delete while holding that lock
98
96
  void Delete(DataChunk &entries, Vector &row_identifiers);
99
97
 
100
- //! Insert data into the index. Does not lock the index.
98
+ //! Insert a chunk of entries into the index
101
99
  virtual bool Insert(IndexLock &lock, DataChunk &input, Vector &row_identifiers) = 0;
102
100
 
103
- //! Merge other_index into this index.
101
+ //! Merge another index into this index. The lock obtained from InitializeLock must be held, and the other
102
+ //! index must also be locked during the merge
104
103
  virtual bool MergeIndexes(IndexLock &state, Index *other_index) = 0;
104
+ //! Obtains a lock and calls MergeIndexes while holding that lock
105
105
  bool MergeIndexes(Index *other_index);
106
106
 
107
107
  //! Returns the string representation of an index
108
108
  virtual string ToString() = 0;
109
- //! Verifies that the memory_size value of the index matches its actual size
109
+ //! Verifies that the in-memory size value of the index matches its actual size
110
110
  virtual void Verify() = 0;
111
-
112
- //! Returns true if the index is affected by updates on the specified column ids, and false otherwise
111
+ //! Increases the memory size by the difference between the old size and the current size
112
+ //! and performs verifications
113
+ virtual void IncreaseAndVerifyMemorySize(idx_t old_memory_size) = 0;
114
+
115
+ //! Increases the in-memory size value
116
+ inline void IncreaseMemorySize(idx_t size) {
117
+ memory_size += size;
118
+ };
119
+ //! Decreases the in-memory size value
120
+ inline void DecreaseMemorySize(idx_t size) {
121
+ D_ASSERT(memory_size >= size);
122
+ memory_size -= size;
123
+ };
124
+
125
+ //! Returns true if the index is affected by updates on the specified column IDs, and false otherwise
113
126
  bool IndexIsUpdated(const vector<PhysicalIndex> &column_ids) const;
114
127
 
115
- //! Returns how many of the input values were found in the 'input' chunk, with the option to also record what those
116
- //! matches were. For this purpose, nulls count as a match, and are returned in 'null_count'
117
- virtual void LookupValues(DataChunk &input, ConflictManager &conflict_manager) = 0;
118
-
119
128
  //! Returns unique flag
120
129
  bool IsUnique() {
121
130
  return (constraint_type == IndexConstraintType::UNIQUE || constraint_type == IndexConstraintType::PRIMARY);
122
131
  }
123
- //! Returns primary flag
132
+ //! Returns primary key flag
124
133
  bool IsPrimary() {
125
134
  return (constraint_type == IndexConstraintType::PRIMARY);
126
135
  }
127
- //! Returns foreign flag
136
+ //! Returns foreign key flag
128
137
  bool IsForeign() {
129
138
  return (constraint_type == IndexConstraintType::FOREIGN);
130
139
  }
131
- //! Serializes the index and returns the pair of block_id offset positions
132
- virtual BlockPointer Serialize(duckdb::MetaBlockWriter &writer);
133
- BlockPointer GetBlockPointer();
134
140
 
135
- //! Returns block/offset of where index was most recently serialized.
141
+ //! Serializes the index and returns the pair of block_id offset positions
142
+ virtual BlockPointer Serialize(MetaBlockWriter &writer);
143
+ //! Returns the serialized data pointer to the block and offset of the serialized index
136
144
  BlockPointer GetSerializedDataPointer() const {
137
145
  return serialized_data_pointer;
138
146
  }
139
147
 
140
- protected:
148
+ //! Execute the index expressions on an input chunk
141
149
  void ExecuteExpressions(DataChunk &input, DataChunk &result);
142
150
 
143
- //! Lock used for updating the index
151
+ protected:
152
+ //! Lock used for any changes to the index
144
153
  mutex lock;
145
-
146
- //! Pointer to most recently checkpointed index data.
154
+ //! Pointer to serialized index data
147
155
  BlockPointer serialized_data_pointer;
148
156
 
149
157
  private:
150
- //! Bound expressions used by the index
158
+ //! Bound expressions used during expression execution
151
159
  vector<unique_ptr<Expression>> bound_expressions;
152
- //! Expression executor for the index expressions
160
+ //! Expression executor to execute the index expressions
153
161
  ExpressionExecutor executor;
154
162
 
163
+ //! Bind the unbound expressions of the index
155
164
  unique_ptr<Expression> BindExpression(unique_ptr<Expression> expr);
156
165
  };
157
166
 
@@ -15,6 +15,7 @@
15
15
  #include "duckdb/catalog/catalog_entry/scalar_macro_catalog_entry.hpp"
16
16
  #include "duckdb/catalog/catalog_entry/sequence_catalog_entry.hpp"
17
17
  #include "duckdb/catalog/catalog_entry/table_macro_catalog_entry.hpp"
18
+ #include "duckdb/catalog/catalog_entry/index_catalog_entry.hpp"
18
19
  #include "duckdb/main/attached_database.hpp"
19
20
  #include "duckdb/storage/storage_info.hpp"
20
21
 
@@ -77,6 +78,9 @@ protected:
77
78
  void ReplayCreateTableMacro();
78
79
  void ReplayDropTableMacro();
79
80
 
81
+ void ReplayCreateIndex();
82
+ void ReplayDropIndex();
83
+
80
84
  void ReplayUseTable();
81
85
  void ReplayInsert();
82
86
  void ReplayDelete();
@@ -125,6 +129,9 @@ public:
125
129
  void WriteCreateTableMacro(TableMacroCatalogEntry *entry);
126
130
  void WriteDropTableMacro(TableMacroCatalogEntry *entry);
127
131
 
132
+ void WriteCreateIndex(IndexCatalogEntry *entry);
133
+ void WriteDropIndex(IndexCatalogEntry *entry);
134
+
128
135
  void WriteCreateType(TypeCatalogEntry *entry);
129
136
  void WriteDropType(TypeCatalogEntry *entry);
130
137
  //! Sets the table used for subsequent insert/delete/update commands
@@ -356,7 +356,8 @@ idx_t DuckDB::NumberOfThreads() {
356
356
  }
357
357
 
358
358
  bool DatabaseInstance::ExtensionIsLoaded(const std::string &name) {
359
- return loaded_extensions.find(name) != loaded_extensions.end();
359
+ auto extension_name = ExtensionHelper::GetExtensionName(name);
360
+ return loaded_extensions.find(extension_name) != loaded_extensions.end();
360
361
  }
361
362
 
362
363
  bool DuckDB::ExtensionIsLoaded(const std::string &name) {
@@ -364,7 +365,8 @@ bool DuckDB::ExtensionIsLoaded(const std::string &name) {
364
365
  }
365
366
 
366
367
  void DatabaseInstance::SetExtensionLoaded(const std::string &name) {
367
- loaded_extensions.insert(name);
368
+ auto extension_name = ExtensionHelper::GetExtensionName(name);
369
+ loaded_extensions.insert(extension_name);
368
370
  }
369
371
 
370
372
  bool DatabaseInstance::TryGetCurrentSetting(const std::string &key, Value &result) {
@@ -31,7 +31,7 @@ ExtensionInitResult ExtensionHelper::InitialLoad(DBConfig &config, FileOpener *o
31
31
  auto filename = fs.ConvertSeparators(extension);
32
32
 
33
33
  // shorthand case
34
- if (!StringUtil::Contains(extension, ".") && !StringUtil::Contains(extension, fs.PathSeparator())) {
34
+ if (!ExtensionHelper::IsFullPath(extension)) {
35
35
  string local_path = fs.GetHomeDirectory(opener);
36
36
  auto path_components = PathComponents();
37
37
  for (auto &path_ele : path_components) {
@@ -121,9 +121,28 @@ ExtensionInitResult ExtensionHelper::InitialLoad(DBConfig &config, FileOpener *o
121
121
  return res;
122
122
  }
123
123
 
124
+ bool ExtensionHelper::IsFullPath(const string &extension) {
125
+ return StringUtil::Contains(extension, ".") || StringUtil::Contains(extension, "/") ||
126
+ StringUtil::Contains(extension, "\\");
127
+ }
128
+
129
+ string ExtensionHelper::GetExtensionName(const string &extension) {
130
+ if (!IsFullPath(extension)) {
131
+ return extension;
132
+ }
133
+ auto splits = StringUtil::Split(StringUtil::Replace(extension, "\\", "/"), '/');
134
+ if (splits.empty()) {
135
+ return extension;
136
+ }
137
+ splits = StringUtil::Split(splits.back(), '.');
138
+ if (splits.empty()) {
139
+ return extension;
140
+ }
141
+ return StringUtil::Lower(splits.front());
142
+ }
143
+
124
144
  void ExtensionHelper::LoadExternalExtension(DatabaseInstance &db, FileOpener *opener, const string &extension) {
125
- auto &loaded_extensions = db.LoadedExtensions();
126
- if (loaded_extensions.find(extension) != loaded_extensions.end()) {
145
+ if (db.ExtensionIsLoaded(extension)) {
127
146
  return;
128
147
  }
129
148
 
@@ -16,6 +16,9 @@ unique_ptr<CreateInfo> CreateIndexInfo::Copy() const {
16
16
  for (auto &expr : expressions) {
17
17
  result->expressions.push_back(expr->Copy());
18
18
  }
19
+ for (auto &expr : parsed_expressions) {
20
+ result->parsed_expressions.push_back(expr->Copy());
21
+ }
19
22
 
20
23
  result->scan_types = scan_types;
21
24
  result->names = names;
@@ -16,6 +16,8 @@
16
16
  #include "duckdb/parser/expression/list.hpp"
17
17
  #include "duckdb/common/index_map.hpp"
18
18
  #include "duckdb/planner/expression_iterator.hpp"
19
+ #include "duckdb/planner/expression_binder/index_binder.hpp"
20
+ #include "duckdb/parser/parsed_data/create_index_info.hpp"
19
21
 
20
22
  #include <algorithm>
21
23
 
@@ -300,4 +302,15 @@ unique_ptr<BoundCreateTableInfo> Binder::BindCreateTableInfo(unique_ptr<CreateIn
300
302
  return BindCreateTableInfo(std::move(info), schema);
301
303
  }
302
304
 
305
+ vector<unique_ptr<Expression>> Binder::BindCreateIndexExpressions(TableCatalogEntry *table, CreateIndexInfo *info) {
306
+ vector<unique_ptr<Expression>> expressions;
307
+
308
+ auto index_binder = IndexBinder(*this, this->context, table, info);
309
+ for (auto &expr : info->expressions) {
310
+ expressions.push_back(index_binder.Bind(expr));
311
+ }
312
+
313
+ return expressions;
314
+ }
315
+
303
316
  } // namespace duckdb
@@ -1,8 +1,14 @@
1
1
  #include "duckdb/planner/expression_binder/index_binder.hpp"
2
2
 
3
+ #include "duckdb/parser/parsed_data/create_index_info.hpp"
4
+ #include "duckdb/parser/expression/columnref_expression.hpp"
5
+ #include "duckdb/planner/expression/bound_columnref_expression.hpp"
6
+ #include "duckdb/planner/column_binding.hpp"
7
+
3
8
  namespace duckdb {
4
9
 
5
- IndexBinder::IndexBinder(Binder &binder, ClientContext &context) : ExpressionBinder(binder, context) {
10
+ IndexBinder::IndexBinder(Binder &binder, ClientContext &context, TableCatalogEntry *table, CreateIndexInfo *info)
11
+ : ExpressionBinder(binder, context), table(table), info(info) {
6
12
  }
7
13
 
8
14
  BindResult IndexBinder::BindExpression(unique_ptr<ParsedExpression> *expr_ptr, idx_t depth, bool root_expression) {
@@ -12,6 +18,31 @@ BindResult IndexBinder::BindExpression(unique_ptr<ParsedExpression> *expr_ptr, i
12
18
  return BindResult("window functions are not allowed in index expressions");
13
19
  case ExpressionClass::SUBQUERY:
14
20
  return BindResult("cannot use subquery in index expressions");
21
+ case ExpressionClass::COLUMN_REF: {
22
+ if (table) {
23
+ // WAL replay
24
+ // we assume that the parsed expressions have qualified column names
25
+ // and that the columns exist in the table
26
+ auto &col_ref = (ColumnRefExpression &)expr;
27
+ auto col_idx = table->GetColumnIndex(col_ref.column_names.back());
28
+ auto col_type = table->GetColumn(col_idx).GetType();
29
+
30
+ // find the col_idx in the index.column_ids
31
+ auto col_id_idx = DConstants::INVALID_INDEX;
32
+ for (idx_t i = 0; i < info->column_ids.size(); i++) {
33
+ if (col_idx.index == info->column_ids[i]) {
34
+ col_id_idx = i;
35
+ }
36
+ }
37
+
38
+ if (col_id_idx == DConstants::INVALID_INDEX) {
39
+ throw InternalException("failed to replay CREATE INDEX statement - column id not found");
40
+ }
41
+ return BindResult(
42
+ make_unique<BoundColumnRefExpression>(col_ref.alias, col_type, ColumnBinding(0, col_id_idx)));
43
+ }
44
+ return ExpressionBinder::BindExpression(expr_ptr, depth);
45
+ }
15
46
  default:
16
47
  return ExpressionBinder::BindExpression(expr_ptr, depth);
17
48
  }
@@ -230,6 +230,7 @@ public:
230
230
  private:
231
231
  DatabaseInstance &db;
232
232
  string temp_directory;
233
+ bool created_directory = false;
233
234
  unique_ptr<TemporaryFileManager> temp_file;
234
235
  };
235
236
 
@@ -868,7 +869,10 @@ TemporaryDirectoryHandle::TemporaryDirectoryHandle(DatabaseInstance &db, string
868
869
  : db(db), temp_directory(std::move(path_p)), temp_file(make_unique<TemporaryFileManager>(db, temp_directory)) {
869
870
  auto &fs = FileSystem::GetFileSystem(db);
870
871
  if (!temp_directory.empty()) {
871
- fs.CreateDirectory(temp_directory);
872
+ if (!fs.DirectoryExists(temp_directory)) {
873
+ fs.CreateDirectory(temp_directory);
874
+ created_directory = true;
875
+ }
872
876
  }
873
877
  }
874
878
  TemporaryDirectoryHandle::~TemporaryDirectoryHandle() {
@@ -877,7 +881,30 @@ TemporaryDirectoryHandle::~TemporaryDirectoryHandle() {
877
881
  // then delete the temporary file directory
878
882
  auto &fs = FileSystem::GetFileSystem(db);
879
883
  if (!temp_directory.empty()) {
880
- fs.RemoveDirectory(temp_directory);
884
+ bool delete_directory = created_directory;
885
+ vector<string> files_to_delete;
886
+ if (!created_directory) {
887
+ bool deleted_everything = true;
888
+ fs.ListFiles(temp_directory, [&](const string &path, bool isdir) {
889
+ if (isdir) {
890
+ deleted_everything = false;
891
+ return;
892
+ }
893
+ if (!StringUtil::StartsWith(path, "duckdb_temp_")) {
894
+ deleted_everything = false;
895
+ return;
896
+ }
897
+ files_to_delete.push_back(path);
898
+ });
899
+ }
900
+ if (delete_directory) {
901
+ // we want to remove all files in the directory
902
+ fs.RemoveDirectory(temp_directory);
903
+ } else {
904
+ for (auto &file : files_to_delete) {
905
+ fs.RemoveFile(fs.JoinPath(temp_directory, file));
906
+ }
907
+ }
881
908
  }
882
909
  }
883
910
 
@@ -887,7 +914,7 @@ TemporaryFileManager &TemporaryDirectoryHandle::GetTempFile() {
887
914
 
888
915
  string BufferManager::GetTemporaryPath(block_id_t id) {
889
916
  auto &fs = FileSystem::GetFileSystem(db);
890
- return fs.JoinPath(temp_directory, to_string(id) + ".block");
917
+ return fs.JoinPath(temp_directory, "duckdb_temp_block-" + to_string(id) + ".block");
891
918
  }
892
919
 
893
920
  void BufferManager::RequireTemporaryDirectory() {
@@ -447,8 +447,8 @@ public:
447
447
 
448
448
  static void ReserveSpace(BitpackingCompressState<T> *state, idx_t data_bytes) {
449
449
  idx_t meta_bytes = sizeof(bitpacking_metadata_encoded_t);
450
- state->FlushAndCreateSegmentIfFull(data_bytes + meta_bytes);
451
- D_ASSERT(data_bytes + meta_bytes <= state->RemainingSize());
450
+ state->FlushAndCreateSegmentIfFull(data_bytes, meta_bytes);
451
+ D_ASSERT(state->CanStore(data_bytes, meta_bytes));
452
452
  }
453
453
 
454
454
  static void UpdateStats(BitpackingCompressState<T> *state, idx_t count) {
@@ -461,9 +461,12 @@ public:
461
461
  }
462
462
  };
463
463
 
464
- // Space remaining between the metadata_ptr growing down and data ptr growing up
465
- idx_t RemainingSize() {
466
- return metadata_ptr - data_ptr;
464
+ bool CanStore(idx_t data_bytes, idx_t meta_bytes) {
465
+ auto required_data_bytes = AlignValue<idx_t>((data_ptr + data_bytes) - data_ptr);
466
+ auto required_meta_bytes = Storage::BLOCK_SIZE - (metadata_ptr - data_ptr) + meta_bytes;
467
+
468
+ return required_data_bytes + required_meta_bytes <=
469
+ Storage::BLOCK_SIZE - BitpackingPrimitives::BITPACKING_HEADER_SIZE;
467
470
  }
468
471
 
469
472
  void CreateEmptySegment(idx_t row_start) {
@@ -489,8 +492,8 @@ public:
489
492
  }
490
493
  }
491
494
 
492
- void FlushAndCreateSegmentIfFull(idx_t required_space) {
493
- if (RemainingSize() < required_space) {
495
+ void FlushAndCreateSegmentIfFull(idx_t required_data_bytes, idx_t required_meta_bytes) {
496
+ if (!CanStore(required_data_bytes, required_meta_bytes)) {
494
497
  auto row_start = current_segment->start + current_segment->count;
495
498
  FlushSegment();
496
499
  CreateEmptySegment(row_start);
@@ -505,6 +508,12 @@ public:
505
508
  idx_t metadata_offset = AlignValue(data_ptr - base_ptr);
506
509
  idx_t metadata_size = base_ptr + Storage::BLOCK_SIZE - metadata_ptr;
507
510
  idx_t total_segment_size = metadata_offset + metadata_size;
511
+
512
+ // Asserting things are still sane here
513
+ if (!CanStore(0, 0)) {
514
+ throw InternalException("Error in bitpacking size calculation");
515
+ }
516
+
508
517
  memmove(base_ptr + metadata_offset, metadata_ptr, metadata_size);
509
518
 
510
519
  // Store the offset of the metadata of the first group (which is at the highest address).