duckdb 0.5.2-dev1745.0 → 0.5.2-dev1806.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
package/src/statement.cpp CHANGED
@@ -4,6 +4,9 @@
4
4
 
5
5
  #include <algorithm>
6
6
  #include <cassert>
7
+ #include <iostream>
8
+ #include <string>
9
+ #include <regex>
7
10
 
8
11
  namespace node_duckdb {
9
12
 
@@ -15,8 +18,8 @@ Napi::Object Statement::Init(Napi::Env env, Napi::Object exports) {
15
18
  Napi::Function t =
16
19
  DefineClass(env, "Statement",
17
20
  {InstanceMethod("run", &Statement::Run), InstanceMethod("all", &Statement::All),
18
- InstanceMethod("each", &Statement::Each), InstanceMethod("finalize", &Statement::Finish),
19
- InstanceMethod("stream", &Statement::Stream)});
21
+ InstanceMethod("arrowIPCAll", &Statement::ArrowIPCAll), InstanceMethod("each", &Statement::Each),
22
+ InstanceMethod("finalize", &Statement::Finish), InstanceMethod("stream", &Statement::Stream)});
20
23
 
21
24
  constructor = Napi::Persistent(t);
22
25
  constructor.SuppressDestruct();
@@ -254,7 +257,7 @@ static Napi::Value convert_chunk(Napi::Env &env, std::vector<std::string> names,
254
257
  return scope.Escape(result);
255
258
  }
256
259
 
257
- enum RunType { RUN, EACH, ALL };
260
+ enum RunType { RUN, EACH, ALL, ARROW_ALL };
258
261
 
259
262
  struct StatementParam {
260
263
  std::vector<duckdb::Value> params;
@@ -274,7 +277,8 @@ struct RunPreparedTask : public Task {
274
277
  return;
275
278
  }
276
279
 
277
- result = statement.statement->Execute(params->params, run_type != RunType::ALL);
280
+ result =
281
+ statement.statement->Execute(params->params, run_type != RunType::ALL && run_type != RunType::ARROW_ALL);
278
282
  }
279
283
 
280
284
  void Callback() override {
@@ -349,6 +353,62 @@ struct RunPreparedTask : public Task {
349
353
 
350
354
  cb.MakeCallback(statement.Value(), {env.Null(), result_arr});
351
355
  } break;
356
+ case RunType::ARROW_ALL: {
357
+ auto materialized_result = (duckdb::MaterializedQueryResult *)result.get();
358
+ // +1 is for null bytes at end of stream
359
+ Napi::Array result_arr(Napi::Array::New(env, materialized_result->RowCount() + 1));
360
+
361
+ auto deleter = [](Napi::Env, void *finalizeData, void *hint) {
362
+ delete static_cast<std::shared_ptr<duckdb::QueryResult> *>(hint);
363
+ };
364
+
365
+ std::shared_ptr<duckdb::QueryResult> result_ptr = move(result);
366
+
367
+ duckdb::idx_t out_idx = 1;
368
+ while (true) {
369
+ auto chunk = result_ptr->Fetch();
370
+
371
+ if (!chunk || chunk->size() == 0) {
372
+ break;
373
+ }
374
+
375
+ D_ASSERT(chunk->ColumnCount() == 2);
376
+ D_ASSERT(chunk->data[0].GetType() == duckdb::LogicalType::BLOB);
377
+ D_ASSERT(chunk->data[1].GetType() == duckdb::LogicalType::BOOLEAN);
378
+
379
+ for (duckdb::idx_t row_idx = 0; row_idx < chunk->size(); row_idx++) {
380
+ duckdb::string_t blob = ((duckdb::string_t *)(chunk->data[0].GetData()))[row_idx];
381
+ bool is_header = chunk->data[1].GetData()[row_idx];
382
+
383
+ // Create shared pointer to give (shared) ownership to ArrayBuffer; note that for these materialized
384
+ // query results, the string data is owned by the QueryResult
385
+ auto result_ref_ptr = new std::shared_ptr<duckdb::QueryResult>(result_ptr);
386
+
387
+ auto array_buffer = Napi::ArrayBuffer::New(env, (void *)blob.GetDataUnsafe(), blob.GetSize(),
388
+ deleter, result_ref_ptr);
389
+
390
+ auto typed_array = Napi::Uint8Array::New(env, blob.GetSize(), array_buffer, 0);
391
+
392
+ // TODO we should handle this in duckdb probably
393
+ if (is_header) {
394
+ result_arr.Set((uint32_t)0, typed_array);
395
+ } else {
396
+ D_ASSERT(out_idx < materialized_result->RowCount());
397
+ result_arr.Set(out_idx++, typed_array);
398
+ }
399
+ }
400
+ }
401
+
402
+ // TODO we should handle this in duckdb probably
403
+ auto null_arr = Napi::Uint8Array::New(env, 4);
404
+ memset(null_arr.Data(), '\0', 4);
405
+ result_arr.Set(out_idx++, null_arr);
406
+
407
+ // Confirm all rows are set
408
+ D_ASSERT(out_idx == materialized_result->RowCount() + 1);
409
+
410
+ cb.MakeCallback(statement.Value(), {env.Null(), result_arr});
411
+ } break;
352
412
  }
353
413
  }
354
414
  std::unique_ptr<duckdb::QueryResult> result;
@@ -423,6 +483,12 @@ Napi::Value Statement::All(const Napi::CallbackInfo &info) {
423
483
  return info.This();
424
484
  }
425
485
 
486
+ Napi::Value Statement::ArrowIPCAll(const Napi::CallbackInfo &info) {
487
+ connection_ref->database_ref->Schedule(
488
+ info.Env(), duckdb::make_unique<RunPreparedTask>(*this, HandleArgs(info), RunType::ARROW_ALL));
489
+ return info.This();
490
+ }
491
+
426
492
  Napi::Value Statement::Run(const Napi::CallbackInfo &info) {
427
493
  connection_ref->database_ref->Schedule(info.Env(),
428
494
  duckdb::make_unique<RunPreparedTask>(*this, HandleArgs(info), RunType::RUN));
@@ -471,7 +537,9 @@ Napi::FunctionReference QueryResult::constructor;
471
537
  Napi::Object QueryResult::Init(Napi::Env env, Napi::Object exports) {
472
538
  Napi::HandleScope scope(env);
473
539
 
474
- Napi::Function t = DefineClass(env, "QueryResult", {InstanceMethod("nextChunk", &QueryResult::NextChunk)});
540
+ Napi::Function t = DefineClass(env, "QueryResult",
541
+ {InstanceMethod("nextChunk", &QueryResult::NextChunk),
542
+ InstanceMethod("nextIpcBuffer", &QueryResult::NextIpcBuffer)});
475
543
 
476
544
  constructor = Napi::Persistent(t);
477
545
  constructor.SuppressDestruct();
@@ -521,6 +589,48 @@ struct GetChunkTask : public Task {
521
589
  std::unique_ptr<duckdb::DataChunk> chunk;
522
590
  };
523
591
 
592
+ struct GetNextArrowIpcTask : public Task {
593
+ GetNextArrowIpcTask(QueryResult &query_result, Napi::Promise::Deferred deferred)
594
+ : Task(query_result), deferred(deferred) {
595
+ }
596
+
597
+ void DoWork() override {
598
+ auto &query_result = Get<QueryResult>();
599
+ chunk = query_result.result->Fetch();
600
+ }
601
+
602
+ void DoCallback() override {
603
+ auto &query_result = Get<QueryResult>();
604
+ Napi::Env env = query_result.Env();
605
+ Napi::HandleScope scope(env);
606
+
607
+ if (chunk == nullptr || chunk->size() == 0) {
608
+ deferred.Resolve(env.Null());
609
+ return;
610
+ }
611
+
612
+ // Arrow IPC streams should yield a single row of two columns per chunk, with the blob in the first column
613
+ D_ASSERT(chunk->size() == 1 && chunk->ColumnCount() == 2);
614
+ D_ASSERT(chunk->data[0].GetType() == duckdb::LogicalType::BLOB);
615
+
616
+ duckdb::string_t blob = *(duckdb::string_t *)(chunk->data[0].GetData());
617
+
618
+ // Transfer ownership and Construct ArrayBuffer
619
+ auto data_chunk_ptr = new std::unique_ptr<duckdb::DataChunk>();
620
+ *data_chunk_ptr = std::move(chunk);
621
+ auto deleter = [](Napi::Env, void *finalizeData, void *hint) {
622
+ delete static_cast<std::unique_ptr<duckdb::DataChunk> *>(hint);
623
+ };
624
+ auto array_buffer =
625
+ Napi::ArrayBuffer::New(env, (void *)blob.GetDataUnsafe(), blob.GetSize(), deleter, data_chunk_ptr);
626
+
627
+ deferred.Resolve(array_buffer);
628
+ }
629
+
630
+ Napi::Promise::Deferred deferred;
631
+ std::unique_ptr<duckdb::DataChunk> chunk;
632
+ };
633
+
524
634
  Napi::Value QueryResult::NextChunk(const Napi::CallbackInfo &info) {
525
635
  auto env = info.Env();
526
636
  auto deferred = Napi::Promise::Deferred::New(env);
@@ -529,4 +639,12 @@ Napi::Value QueryResult::NextChunk(const Napi::CallbackInfo &info) {
529
639
  return deferred.Promise();
530
640
  }
531
641
 
642
+ // Should only be called on an arrow ipc query
643
+ Napi::Value QueryResult::NextIpcBuffer(const Napi::CallbackInfo &info) {
644
+ auto env = info.Env();
645
+ auto deferred = Napi::Promise::Deferred::New(env);
646
+ database_ref->Schedule(env, duckdb::make_unique<GetNextArrowIpcTask>(*this, deferred));
647
+ return deferred.Promise();
648
+ }
649
+
532
650
  } // namespace node_duckdb
@@ -150,13 +150,13 @@ describe('open/close', function() {
150
150
  });
151
151
  });
152
152
 
153
- describe('closing with unfinalized statements', function(done) {
153
+ describe('closing with unfinalized statements', function() {
154
154
  var completed = false;
155
155
  var completedSecond = false;
156
156
  var closed = false;
157
157
 
158
158
  var db;
159
- before(function() {
159
+ before(function(done) {
160
160
  db = new sqlite3.Database(':memory:', done);
161
161
  });
162
162
 
@@ -24,17 +24,19 @@ function createdb(callback) {
24
24
  if (callback) callback();
25
25
  } else {
26
26
  console.log("Creating test database... This may take several minutes.");
27
- var db = new sqlite3.Database(db_path);
28
- db.serialize(function() {
29
- db.run("CREATE TABLE foo (id INT, txt TEXT)");
30
- db.run("BEGIN TRANSACTION");
31
- var stmt = db.prepare("INSERT INTO foo VALUES(?, ?)");
32
- for (var i = 0; i < count; i++) {
33
- stmt.run(i, randomString());
34
- }
35
- stmt.finalize();
36
- db.run("COMMIT TRANSACTION", function () {
37
- db.close(callback);
27
+ var db = new sqlite3.Database(db_path, () => {
28
+ db.serialize(function() {
29
+ db.run("CREATE TABLE foo (id INT, txt TEXT)");
30
+ db.run("BEGIN TRANSACTION");
31
+ var stmt = db.prepare("INSERT INTO foo VALUES(?, ?)");
32
+ for (var i = 0; i < count; i++) {
33
+ stmt.run(i, randomString());
34
+ }
35
+
36
+ stmt.finalize();
37
+ db.run("COMMIT TRANSACTION", function () {
38
+ db.close(callback);
39
+ });
38
40
  });
39
41
  });
40
42
  }
@@ -95,7 +95,7 @@ describe("TypeScript declarataions", function () {
95
95
  });
96
96
 
97
97
  it("typescript: ternary int udf", function (done) {
98
- db.register(
98
+ db.register_udf(
99
99
  "udf",
100
100
  "integer",
101
101
  (x: number, y: number, z: number) => x + y + z
@@ -107,7 +107,7 @@ describe("TypeScript declarataions", function () {
107
107
  assert.equal(rows[0].v, 42);
108
108
  }
109
109
  );
110
- db.unregister("udf", done);
110
+ db.unregister_udf("udf", done);
111
111
  });
112
112
  it("typescript: retrieve 100,000 rows with Statement#each", function (done) {
113
113
  var total = 100000;
package/test/udf.test.js CHANGED
@@ -9,142 +9,142 @@ describe('UDFs', function() {
9
9
  });
10
10
 
11
11
  it('0ary int', function(done) {
12
- db.register("udf", "integer", () => 42);
12
+ db.register_udf("udf", "integer", () => 42);
13
13
  db.all("select udf() v", function(err, rows) {
14
14
  if (err) throw err;
15
15
  assert.equal(rows[0].v, 42);
16
16
  });
17
- db.unregister("udf", done);
17
+ db.unregister_udf("udf", done);
18
18
  });
19
19
 
20
20
  it('0ary double', function(done) {
21
- db.register("udf", "double", () => 4.2);
21
+ db.register_udf("udf", "double", () => 4.2);
22
22
  db.all("select udf() v", function(err, rows) {
23
23
  if (err) throw err;
24
24
  assert.equal(rows[0].v, 4.2);
25
25
  });
26
- db.unregister("udf", done);
26
+ db.unregister_udf("udf", done);
27
27
  });
28
28
 
29
29
  it('0ary string', function(done) {
30
- db.register("udf", "varchar", () => 'hello');
30
+ db.register_udf("udf", "varchar", () => 'hello');
31
31
  db.all("select udf() v", function(err, rows) {
32
32
  if (err) throw err;
33
33
  assert.equal(rows[0].v, 'hello');
34
34
  });
35
- db.unregister("udf", done);
35
+ db.unregister_udf("udf", done);
36
36
  });
37
37
 
38
38
  it('0ary int null', function(done) {
39
- db.register("udf", "integer", () => undefined);
39
+ db.register_udf("udf", "integer", () => undefined);
40
40
  db.all("select udf() v", function(err, rows) {
41
41
  if (err) throw err;
42
42
  assert.equal(rows[0].v, undefined);
43
43
  });
44
- db.unregister("udf", done);
44
+ db.unregister_udf("udf", done);
45
45
  });
46
46
 
47
47
 
48
48
  it('0ary string null', function(done) {
49
- db.register("udf", "varchar", () => undefined);
49
+ db.register_udf("udf", "varchar", () => undefined);
50
50
  db.all("select udf() v", function(err, rows) {
51
51
  if (err) throw err;
52
52
  assert.equal(rows[0].v, undefined);
53
53
  });
54
- db.unregister("udf", done);
54
+ db.unregister_udf("udf", done);
55
55
  });
56
56
 
57
57
 
58
58
  it('unary int', function(done) {
59
- db.register("udf", "integer", (x) => x+1);
59
+ db.register_udf("udf", "integer", (x) => x+1);
60
60
  db.all("select udf(42) v", function(err, rows) {
61
61
  if (err) throw err;
62
62
  assert.equal(rows[0].v, 43);
63
63
  });
64
- db.unregister("udf", done);
64
+ db.unregister_udf("udf", done);
65
65
  });
66
66
 
67
67
  it('unary double', function(done) {
68
- db.register("udf", "double", (x) => x);
68
+ db.register_udf("udf", "double", (x) => x);
69
69
  db.all("select udf(4.2::double) v", function(err, rows) {
70
70
  if (err) throw err;
71
71
  assert.equal(rows[0].v, 4.2);
72
72
  });
73
- db.unregister("udf", done);
73
+ db.unregister_udf("udf", done);
74
74
  });
75
75
 
76
76
  it('unary int null', function(done) {
77
- db.register("udf", "integer", (x) => undefined);
77
+ db.register_udf("udf", "integer", (x) => undefined);
78
78
  db.all("select udf(42) v", function(err, rows) {
79
79
  if (err) throw err;
80
80
  assert.equal(rows[0].v, undefined);
81
81
  });
82
- db.unregister("udf", done);
82
+ db.unregister_udf("udf", done);
83
83
  });
84
84
 
85
85
 
86
86
  it('unary double null', function(done) {
87
- db.register("udf", "double", (x) => undefined);
87
+ db.register_udf("udf", "double", (x) => undefined);
88
88
  db.all("select udf(4.2::double) v", function(err, rows) {
89
89
  if (err) throw err;
90
90
  assert.equal(rows[0].v, undefined);
91
91
  });
92
- db.unregister("udf", done);
92
+ db.unregister_udf("udf", done);
93
93
  });
94
94
 
95
95
 
96
96
  it('unary string', function(done) {
97
- db.register("udf", "varchar", (x) => 'hello ' + x);
97
+ db.register_udf("udf", "varchar", (x) => 'hello ' + x);
98
98
  db.all("select udf('world') v", function(err, rows) {
99
99
  if (err) throw err;
100
100
  assert.equal(rows[0].v, 'hello world');
101
101
  });
102
- db.unregister("udf", done);
102
+ db.unregister_udf("udf", done);
103
103
  });
104
104
 
105
105
  it('unary string null', function(done) {
106
- db.register("udf", "varchar", (x) => undefined);
106
+ db.register_udf("udf", "varchar", (x) => undefined);
107
107
  db.all("select udf('world') v", function(err, rows) {
108
108
  if (err) throw err;
109
109
  assert.equal(rows[0].v, undefined);
110
110
  });
111
- db.unregister("udf", done);
111
+ db.unregister_udf("udf", done);
112
112
  });
113
113
 
114
114
  it('binary int', function(done) {
115
- db.register("udf", "integer", (x, y) => x + y);
115
+ db.register_udf("udf", "integer", (x, y) => x + y);
116
116
  db.all("select udf(40, 2) v", function(err, rows) {
117
117
  if (err) throw err;
118
118
  assert.equal(rows[0].v, 42);
119
119
  });
120
- db.unregister("udf", done);
120
+ db.unregister_udf("udf", done);
121
121
  });
122
122
 
123
123
  it('binary string', function(done) {
124
- db.register("udf", "varchar", (x, y) => x + ' ' + y);
124
+ db.register_udf("udf", "varchar", (x, y) => x + ' ' + y);
125
125
  db.all("select udf('hello', 'world') v", function(err, rows) {
126
126
  if (err) throw err;
127
127
  assert.equal(rows[0].v, 'hello world');
128
128
  });
129
- db.unregister("udf", done);
129
+ db.unregister_udf("udf", done);
130
130
  });
131
131
 
132
132
  it('ternary int', function(done) {
133
- db.register("udf", "integer", (x, y, z) => x + y + z);
133
+ db.register_udf("udf", "integer", (x, y, z) => x + y + z);
134
134
  db.all("select udf(21, 20, 1) v", function(err, rows) {
135
135
  if (err) throw err;
136
136
  assert.equal(rows[0].v, 42);
137
137
  });
138
- db.unregister("udf", done);
138
+ db.unregister_udf("udf", done);
139
139
  });
140
140
 
141
141
  it('unary larger series', function(done) {
142
- db.register("udf", "integer", (x) => 1);
142
+ db.register_udf("udf", "integer", (x) => 1);
143
143
  db.all("select sum(udf(range::double)) v from range(10000)", function(err, rows) {
144
144
  if (err) throw err;
145
145
  assert.equal(rows[0].v, 10000);
146
146
  });
147
- db.unregister("udf", done);
147
+ db.unregister_udf("udf", done);
148
148
  });
149
149
  });
150
150
 
@@ -155,60 +155,60 @@ describe('UDFs', function() {
155
155
  });
156
156
 
157
157
  it('tinyint', function(done) {
158
- db.register("udf", "integer", (x) => x+1);
158
+ db.register_udf("udf", "integer", (x) => x+1);
159
159
  db.all("select udf(42::tinyint) v", function(err, rows) {
160
160
  if (err) throw err;
161
161
  assert.equal(rows[0].v, 43);
162
162
  });
163
- db.unregister("udf", done);
163
+ db.unregister_udf("udf", done);
164
164
  });
165
165
 
166
166
  it('smallint', function(done) {
167
- db.register("udf", "integer", (x) => x+1);
167
+ db.register_udf("udf", "integer", (x) => x+1);
168
168
  db.all("select udf(42::smallint) v", function(err, rows) {
169
169
  if (err) throw err;
170
170
  assert.equal(rows[0].v, 43);
171
171
  });
172
- db.unregister("udf", done);
172
+ db.unregister_udf("udf", done);
173
173
  });
174
174
 
175
175
  it('int', function(done) {
176
- db.register("udf", "integer", (x) => x+1);
176
+ db.register_udf("udf", "integer", (x) => x+1);
177
177
  db.all("select udf(42::integer) v", function(err, rows) {
178
178
  if (err) throw err;
179
179
  assert.equal(rows[0].v, 43);
180
180
  });
181
- db.unregister("udf", done);
181
+ db.unregister_udf("udf", done);
182
182
  });
183
183
 
184
184
  it('timestamp', function(done) {
185
- db.register("udf", "timestamp", (x) => x);
185
+ db.register_udf("udf", "timestamp", (x) => x);
186
186
  db.all("select udf(timestamp '1992-09-20 11:30:00') v", function(err, rows) {
187
187
  if (err) throw err;
188
188
  });
189
- db.unregister("udf", done);
189
+ db.unregister_udf("udf", done);
190
190
  });
191
191
 
192
192
  it('struct', function(done) {
193
- db.register("udf", "integer", a => {
193
+ db.register_udf("udf", "integer", a => {
194
194
  return (a.x == null ? -100 : a.x);
195
195
  });
196
196
  db.all("SELECT min(udf({'x': (case when v % 2 = 0 then v else null end)::INTEGER, 'y': 42}))::INTEGER as foo FROM generate_series(1, 10000) as t(v)", function(err, rows) {
197
197
  if (err) throw err;
198
198
  assert.equal(rows[0].foo, -100);
199
199
  });
200
- db.unregister("udf", done);
200
+ db.unregister_udf("udf", done);
201
201
  });
202
202
 
203
203
  it('structnestednull', function(done) {
204
- db.register("udf", "integer", a => {
204
+ db.register_udf("udf", "integer", a => {
205
205
  return (a.x == null ? -100 : a.x.y);
206
206
  });
207
207
  db.all("SELECT min(udf({'x': (case when v % 2 = 0 then {'y': v::INTEGER } else null end), 'z': 42}))::INTEGER as foo FROM generate_series(1, 10000) as t(v)", function(err, rows) {
208
208
  if (err) throw err;
209
209
  assert.equal(rows[0].foo, -100);
210
210
  });
211
- db.unregister("udf", done);
211
+ db.unregister_udf("udf", done);
212
212
  });
213
213
  });
214
214
  });