red-arrow 0.14.1 → 0.15.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of red-arrow might be problematic. Click here for more details.

Files changed (61) hide show
  1. checksums.yaml +4 -4
  2. data/ext/arrow/arrow.cpp +34 -0
  3. data/ext/arrow/converters.cpp +42 -0
  4. data/ext/arrow/converters.hpp +626 -0
  5. data/ext/arrow/raw-records.cpp +6 -625
  6. data/ext/arrow/red-arrow.hpp +37 -3
  7. data/ext/arrow/values.cpp +154 -0
  8. data/lib/arrow/array-builder.rb +24 -1
  9. data/lib/arrow/array.rb +9 -0
  10. data/lib/arrow/chunked-array.rb +5 -0
  11. data/lib/arrow/column-containable.rb +48 -0
  12. data/lib/arrow/column.rb +36 -10
  13. data/lib/arrow/csv-loader.rb +2 -2
  14. data/lib/arrow/data-type.rb +22 -5
  15. data/lib/arrow/date64-array-builder.rb +2 -2
  16. data/lib/arrow/date64-array.rb +1 -1
  17. data/lib/arrow/decimal128-array.rb +24 -0
  18. data/lib/arrow/field-containable.rb +3 -0
  19. data/lib/arrow/group.rb +10 -13
  20. data/lib/arrow/loader.rb +20 -1
  21. data/lib/arrow/record-batch.rb +6 -4
  22. data/lib/arrow/record-containable.rb +0 -35
  23. data/lib/arrow/record.rb +12 -9
  24. data/lib/arrow/slicer.rb +2 -2
  25. data/lib/arrow/struct-array-builder.rb +1 -7
  26. data/lib/arrow/struct-array.rb +13 -11
  27. data/lib/arrow/table-loader.rb +3 -9
  28. data/lib/arrow/table-table-formatter.rb +2 -2
  29. data/lib/arrow/table.rb +61 -24
  30. data/lib/arrow/time.rb +159 -0
  31. data/lib/arrow/time32-array-builder.rb +49 -0
  32. data/lib/arrow/time32-array.rb +28 -0
  33. data/lib/arrow/time64-array-builder.rb +49 -0
  34. data/lib/arrow/time64-array.rb +28 -0
  35. data/lib/arrow/timestamp-array-builder.rb +20 -1
  36. data/lib/arrow/timestamp-array.rb +10 -22
  37. data/lib/arrow/version.rb +1 -1
  38. data/red-arrow.gemspec +1 -1
  39. data/test/raw-records/test-basic-arrays.rb +16 -8
  40. data/test/raw-records/test-dense-union-array.rb +12 -5
  41. data/test/raw-records/test-list-array.rb +21 -9
  42. data/test/raw-records/test-sparse-union-array.rb +13 -5
  43. data/test/raw-records/test-struct-array.rb +11 -4
  44. data/test/test-column.rb +56 -31
  45. data/test/test-decimal128-array-builder.rb +11 -11
  46. data/test/test-decimal128-array.rb +4 -4
  47. data/test/test-slicer.rb +1 -3
  48. data/test/test-struct-array-builder.rb +4 -4
  49. data/test/test-struct-array.rb +4 -4
  50. data/test/test-table.rb +17 -8
  51. data/test/test-time.rb +288 -0
  52. data/test/test-time32-array.rb +81 -0
  53. data/test/test-time64-array.rb +81 -0
  54. data/test/values/test-basic-arrays.rb +284 -0
  55. data/test/values/test-dense-union-array.rb +487 -0
  56. data/test/values/test-list-array.rb +497 -0
  57. data/test/values/test-sparse-union-array.rb +477 -0
  58. data/test/values/test-struct-array.rb +452 -0
  59. metadata +78 -54
  60. data/lib/arrow/struct.rb +0 -79
  61. data/test/test-struct.rb +0 -81
@@ -0,0 +1,284 @@
1
+ # Licensed to the Apache Software Foundation (ASF) under one
2
+ # or more contributor license agreements. See the NOTICE file
3
+ # distributed with this work for additional information
4
+ # regarding copyright ownership. The ASF licenses this file
5
+ # to you under the Apache License, Version 2.0 (the
6
+ # "License"); you may not use this file except in compliance
7
+ # with the License. You may obtain a copy of the License at
8
+ #
9
+ # http://www.apache.org/licenses/LICENSE-2.0
10
+ #
11
+ # Unless required by applicable law or agreed to in writing,
12
+ # software distributed under the License is distributed on an
13
+ # "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
14
+ # KIND, either express or implied. See the License for the
15
+ # specific language governing permissions and limitations
16
+ # under the License.
17
+
18
# Shared test cases checking that `#values` returns plain Ruby objects equal
# to the ones an Arrow array was built from.
#
# The module is mixed into concrete test classes. Each including class must
# define `build(array)`, which receives a freshly built Arrow array and
# returns the object under test; that object must respond to `#values`.
#
# Every test uses the same layout: a value, a `nil` in the middle (the null
# slot), and another value.
module ValuesBasicArraysTests
  # A null array of length 4 reads back as four nils.
  def test_null
    target = build(Arrow::NullArray.new(4))
    assert_equal([nil] * 4, target.values)
  end

  def test_boolean
    values = [true, nil, false]
    target = build(Arrow::BooleanArray.new(values))
    assert_equal(values, target.values)
  end

  # Smallest and largest signed 8-bit integers.
  def test_int8
    values = [
      -(2 ** 7),
      nil,
      (2 ** 7) - 1,
    ]
    target = build(Arrow::Int8Array.new(values))
    assert_equal(values, target.values)
  end

  # Smallest and largest unsigned 8-bit integers.
  def test_uint8
    values = [
      0,
      nil,
      (2 ** 8) - 1,
    ]
    target = build(Arrow::UInt8Array.new(values))
    assert_equal(values, target.values)
  end

  # Smallest and largest signed 16-bit integers.
  def test_int16
    values = [
      -(2 ** 15),
      nil,
      (2 ** 15) - 1,
    ]
    target = build(Arrow::Int16Array.new(values))
    assert_equal(values, target.values)
  end

  # Smallest and largest unsigned 16-bit integers.
  def test_uint16
    values = [
      0,
      nil,
      (2 ** 16) - 1,
    ]
    target = build(Arrow::UInt16Array.new(values))
    assert_equal(values, target.values)
  end

  # Smallest and largest signed 32-bit integers.
  def test_int32
    values = [
      -(2 ** 31),
      nil,
      (2 ** 31) - 1,
    ]
    target = build(Arrow::Int32Array.new(values))
    assert_equal(values, target.values)
  end

  # Smallest and largest unsigned 32-bit integers.
  def test_uint32
    values = [
      0,
      nil,
      (2 ** 32) - 1,
    ]
    target = build(Arrow::UInt32Array.new(values))
    assert_equal(values, target.values)
  end

  # Smallest and largest signed 64-bit integers.
  def test_int64
    values = [
      -(2 ** 63),
      nil,
      (2 ** 63) - 1,
    ]
    target = build(Arrow::Int64Array.new(values))
    assert_equal(values, target.values)
  end

  # Smallest and largest unsigned 64-bit integers.
  def test_uint64
    values = [
      0,
      nil,
      (2 ** 64) - 1,
    ]
    target = build(Arrow::UInt64Array.new(values))
    assert_equal(values, target.values)
  end

  def test_float
    values = [
      -1.0,
      nil,
      1.0,
    ]
    target = build(Arrow::FloatArray.new(values))
    assert_equal(values, target.values)
  end

  def test_double
    values = [
      -1.0,
      nil,
      1.0,
    ]
    target = build(Arrow::DoubleArray.new(values))
    assert_equal(values, target.values)
  end

  # Binary strings (`String#b`) holding the lowest and highest byte values.
  def test_binary
    values = [
      "\x00".b,
      nil,
      "\xff".b,
    ]
    target = build(Arrow::BinaryArray.new(values))
    assert_equal(values, target.values)
  end

  # An ASCII string and a non-ASCII string.
  #
  # This method was previously misspelled `test_tring`; it is named
  # `test_string` to match the other value test suites.
  def test_string
    values = [
      "Ruby",
      nil,
      "\u3042", # U+3042 HIRAGANA LETTER A
    ]
    target = build(Arrow::StringArray.new(values))
    assert_equal(values, target.values)
  end

  # Dates before and after 1970-01-01.
  def test_date32
    values = [
      Date.new(1960, 1, 1),
      nil,
      Date.new(2017, 8, 23),
    ]
    target = build(Arrow::Date32Array.new(values))
    assert_equal(values, target.values)
  end

  # Date-times (with a time-of-day part) before and after 1970-01-01.
  def test_date64
    values = [
      DateTime.new(1960, 1, 1, 2, 9, 30),
      nil,
      DateTime.new(2017, 8, 23, 14, 57, 2),
    ]
    target = build(Arrow::Date64Array.new(values))
    assert_equal(values, target.values)
  end

  def test_timestamp_second
    values = [
      Time.parse("1960-01-01T02:09:30Z"),
      nil,
      Time.parse("2017-08-23T14:57:02Z"),
    ]
    target = build(Arrow::TimestampArray.new(:second, values))
    assert_equal(values, target.values)
  end

  # Timestamps carrying three fractional digits.
  def test_timestamp_milli
    values = [
      Time.parse("1960-01-01T02:09:30.123Z"),
      nil,
      Time.parse("2017-08-23T14:57:02.987Z"),
    ]
    target = build(Arrow::TimestampArray.new(:milli, values))
    assert_equal(values, target.values)
  end

  # Timestamps carrying six fractional digits.
  def test_timestamp_micro
    values = [
      Time.parse("1960-01-01T02:09:30.123456Z"),
      nil,
      Time.parse("2017-08-23T14:57:02.987654Z"),
    ]
    target = build(Arrow::TimestampArray.new(:micro, values))
    assert_equal(values, target.values)
  end

  # Timestamps carrying nine fractional digits.
  def test_timestamp_nano
    values = [
      Time.parse("1960-01-01T02:09:30.123456789Z"),
      nil,
      Time.parse("2017-08-23T14:57:02.987654321Z"),
    ]
    target = build(Arrow::TimestampArray.new(:nano, values))
    assert_equal(values, target.values)
  end

  def test_time32_second
    unit = Arrow::TimeUnit::SECOND
    values = [
      Arrow::Time.new(unit, 60 * 10), # 00:10:00
      nil,
      Arrow::Time.new(unit, 60 * 60 * 2 + 9), # 02:00:09
    ]
    target = build(Arrow::Time32Array.new(:second, values))
    assert_equal(values, target.values)
  end

  def test_time32_milli
    unit = Arrow::TimeUnit::MILLI
    values = [
      Arrow::Time.new(unit, (60 * 10) * 1000 + 123), # 00:10:00.123
      nil,
      Arrow::Time.new(unit, (60 * 60 * 2 + 9) * 1000 + 987), # 02:00:09.987
    ]
    target = build(Arrow::Time32Array.new(:milli, values))
    assert_equal(values, target.values)
  end

  def test_time64_micro
    unit = Arrow::TimeUnit::MICRO
    values = [
      # 00:10:00.123456
      Arrow::Time.new(unit, (60 * 10) * 1_000_000 + 123_456),
      nil,
      # 02:00:09.987654
      Arrow::Time.new(unit, (60 * 60 * 2 + 9) * 1_000_000 + 987_654),
    ]
    target = build(Arrow::Time64Array.new(:micro, values))
    assert_equal(values, target.values)
  end

  def test_time64_nano
    unit = Arrow::TimeUnit::NANO
    values = [
      # 00:10:00.123456789
      Arrow::Time.new(unit, (60 * 10) * 1_000_000_000 + 123_456_789),
      nil,
      # 02:00:09.987654321
      Arrow::Time.new(unit, (60 * 60 * 2 + 9) * 1_000_000_000 + 987_654_321),
    ]
    target = build(Arrow::Time64Array.new(:nano, values))
    assert_equal(values, target.values)
  end

  # Decimals with two fractional digits, stored with precision 8 and scale 2.
  def test_decimal128
    values = [
      BigDecimal("92.92"),
      nil,
      BigDecimal("29.29"),
    ]
    data_type = Arrow::Decimal128DataType.new(8, 2)
    target = build(Arrow::Decimal128Array.new(data_type, values))
    assert_equal(values, target.values)
  end
end
269
+
270
# Runs the shared ValuesBasicArraysTests cases against the array itself.
class ValuesArrayBasicArraysTest < Test::Unit::TestCase
  include ValuesBasicArraysTests

  # The shared tests call #values on whatever this returns; here that is the
  # array they just built, handed back unchanged.
  def build(array)
    array
  end
end
277
+
278
# Runs the shared ValuesBasicArraysTests cases against a chunked array that
# wraps the array as its only chunk.
class ValuesChunkedArrayBasicArraysTest < Test::Unit::TestCase
  include ValuesBasicArraysTests

  # Wraps the given array in a single-chunk Arrow::ChunkedArray so the shared
  # tests call #values on the chunked array.
  def build(array)
    chunks = [array]
    Arrow::ChunkedArray.new(chunks)
  end
end
@@ -0,0 +1,487 @@
1
+ # Licensed to the Apache Software Foundation (ASF) under one
2
+ # or more contributor license agreements. See the NOTICE file
3
+ # distributed with this work for additional information
4
+ # regarding copyright ownership. The ASF licenses this file
5
+ # to you under the Apache License, Version 2.0 (the
6
+ # "License"); you may not use this file except in compliance
7
+ # with the License. You may obtain a copy of the License at
8
+ #
9
+ # http://www.apache.org/licenses/LICENSE-2.0
10
+ #
11
+ # Unless required by applicable law or agreed to in writing,
12
+ # software distributed under the License is distributed on an
13
+ # "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
14
+ # KIND, either express or implied. See the License for the
15
+ # specific language governing permissions and limitations
16
+ # under the License.
17
+
18
# Shared test cases checking that `#values` on a dense union returns the Ruby
# objects the union was built from.
#
# Every test describes a union with two fields named "0" and "1" that share
# the type under test. An expected element is either `nil` (a null union
# slot) or a one-entry Hash mapping the field name to that slot's value.
# Including classes must define `build(type, values)`; `build_array` below
# does the actual construction.
module ValuesDenseUnionArrayTests
  # Creates the dense union data type used by the tests.
  #
  # `type` is either a bare type such as `:int8` or a Hash field description
  # such as `{type: :timestamp, unit: :second}`. Both union fields get that
  # description plus the name "0" or "1".
  def build_data_type(type, type_codes)
    description = type.is_a?(Hash) ? {}.merge(type) : {type: type}
    union_fields = ["0", "1"].collect do |name|
      description.merge(name: name)
    end
    Arrow::DenseUnionDataType.new(fields: union_fields,
                                  type_codes: type_codes)
  end

  # Builds an Arrow::DenseUnionArray from `values` (see the module comment
  # for their shape).
  #
  # Each non-nil value is stored in the child array of the field it names, and
  # its offset is its position within that child array. A nil value is
  # recorded with a nil type id and offset 0.
  def build_array(type, values)
    type_codes = [0, 1]
    data_type = build_data_type(type, type_codes)

    # One child array per union field, holding only that field's values in
    # their original order. It is built through a one-column record batch.
    children = data_type.fields.collect do |field|
      schema = Arrow::Schema.new([field])
      owned = values.reject(&:nil?).select { |value| value.key?(field.name) }
      rows = owned.collect { |value| [value[field.name]] }
      Arrow::RecordBatch.new(schema, rows).columns[0].data
    end

    type_ids = []
    offsets = []
    values.each do |value|
      if value.nil?
        type_ids << nil
        offsets << 0
        next
      end
      # Field "0" wins when both keys are present; values naming neither
      # field contribute nothing.
      field_index = ["0", "1"].find_index { |name| value.key?(name) }
      next if field_index.nil?
      type_id = type_codes[field_index]
      type_ids << type_id
      # Number of earlier slots with the same type id == index in the child.
      offsets << (type_ids.count(type_id) - 1)
    end

    type_id_array = Arrow::Int8Array.new(type_ids)
    offset_array = Arrow::Int32Array.new(offsets)
    Arrow::DenseUnionArray.new(data_type, type_id_array, offset_array, children)
  end

  def test_null
    expected = [{"0" => nil}, nil]
    assert_equal(expected, build(:null, expected).values)
  end

  def test_boolean
    expected = [{"0" => true}, nil, {"1" => nil}]
    assert_equal(expected, build(:boolean, expected).values)
  end

  def test_int8
    expected = [{"0" => -(2 ** 7)}, nil, {"1" => nil}]
    assert_equal(expected, build(:int8, expected).values)
  end

  def test_uint8
    expected = [{"0" => (2 ** 8) - 1}, nil, {"1" => nil}]
    assert_equal(expected, build(:uint8, expected).values)
  end

  def test_int16
    expected = [{"0" => -(2 ** 15)}, nil, {"1" => nil}]
    assert_equal(expected, build(:int16, expected).values)
  end

  def test_uint16
    expected = [{"0" => (2 ** 16) - 1}, nil, {"1" => nil}]
    assert_equal(expected, build(:uint16, expected).values)
  end

  def test_int32
    expected = [{"0" => -(2 ** 31)}, nil, {"1" => nil}]
    assert_equal(expected, build(:int32, expected).values)
  end

  def test_uint32
    expected = [{"0" => (2 ** 32) - 1}, nil, {"1" => nil}]
    assert_equal(expected, build(:uint32, expected).values)
  end

  def test_int64
    expected = [{"0" => -(2 ** 63)}, nil, {"1" => nil}]
    assert_equal(expected, build(:int64, expected).values)
  end

  def test_uint64
    expected = [{"0" => (2 ** 64) - 1}, nil, {"1" => nil}]
    assert_equal(expected, build(:uint64, expected).values)
  end

  def test_float
    expected = [{"0" => -1.0}, nil, {"1" => nil}]
    assert_equal(expected, build(:float, expected).values)
  end

  def test_double
    expected = [{"0" => -1.0}, nil, {"1" => nil}]
    assert_equal(expected, build(:double, expected).values)
  end

  def test_binary
    expected = [{"0" => "\xff".b}, nil, {"1" => nil}]
    assert_equal(expected, build(:binary, expected).values)
  end

  def test_string
    expected = [{"0" => "Ruby"}, nil, {"1" => nil}]
    assert_equal(expected, build(:string, expected).values)
  end

  def test_date32
    expected = [{"0" => Date.new(1960, 1, 1)}, nil, {"1" => nil}]
    assert_equal(expected, build(:date32, expected).values)
  end

  def test_date64
    expected = [{"0" => DateTime.new(1960, 1, 1, 2, 9, 30)}, nil, {"1" => nil}]
    assert_equal(expected, build(:date64, expected).values)
  end

  def test_timestamp_second
    expected = [{"0" => Time.parse("1960-01-01T02:09:30Z")}, nil, {"1" => nil}]
    timestamp_type = {type: :timestamp, unit: :second}
    assert_equal(expected, build(timestamp_type, expected).values)
  end

  def test_timestamp_milli
    expected = [
      {"0" => Time.parse("1960-01-01T02:09:30.123Z")},
      nil,
      {"1" => nil},
    ]
    timestamp_type = {type: :timestamp, unit: :milli}
    assert_equal(expected, build(timestamp_type, expected).values)
  end

  def test_timestamp_micro
    expected = [
      {"0" => Time.parse("1960-01-01T02:09:30.123456Z")},
      nil,
      {"1" => nil},
    ]
    timestamp_type = {type: :timestamp, unit: :micro}
    assert_equal(expected, build(timestamp_type, expected).values)
  end

  def test_timestamp_nano
    expected = [
      {"0" => Time.parse("1960-01-01T02:09:30.123456789Z")},
      nil,
      {"1" => nil},
    ]
    timestamp_type = {type: :timestamp, unit: :nano}
    assert_equal(expected, build(timestamp_type, expected).values)
  end

  def test_time32_second
    # 00:10:00
    ten_minutes = Arrow::Time.new(Arrow::TimeUnit::SECOND, 60 * 10)
    expected = [{"0" => ten_minutes}, nil, {"1" => nil}]
    time_type = {type: :time32, unit: :second}
    assert_equal(expected, build(time_type, expected).values)
  end

  def test_time32_milli
    # 00:10:00.123
    ten_minutes = Arrow::Time.new(Arrow::TimeUnit::MILLI,
                                  (60 * 10) * 1000 + 123)
    expected = [{"0" => ten_minutes}, nil, {"1" => nil}]
    time_type = {type: :time32, unit: :milli}
    assert_equal(expected, build(time_type, expected).values)
  end

  def test_time64_micro
    # 00:10:00.123456
    ten_minutes = Arrow::Time.new(Arrow::TimeUnit::MICRO,
                                  (60 * 10) * 1_000_000 + 123_456)
    expected = [{"0" => ten_minutes}, nil, {"1" => nil}]
    time_type = {type: :time64, unit: :micro}
    assert_equal(expected, build(time_type, expected).values)
  end

  def test_time64_nano
    # 00:10:00.123456789
    ten_minutes = Arrow::Time.new(Arrow::TimeUnit::NANO,
                                  (60 * 10) * 1_000_000_000 + 123_456_789)
    expected = [{"0" => ten_minutes}, nil, {"1" => nil}]
    time_type = {type: :time64, unit: :nano}
    assert_equal(expected, build(time_type, expected).values)
  end

  def test_decimal128
    expected = [{"0" => BigDecimal("92.92")}, nil, {"1" => nil}]
    decimal_type = {type: :decimal128, precision: 8, scale: 2}
    assert_equal(expected, build(decimal_type, expected).values)
  end

  def test_list
    expected = [{"0" => [true, nil, false]}, nil, {"1" => nil}]
    list_type = {
      type: :list,
      field: {name: :sub_element, type: :boolean},
    }
    assert_equal(expected, build(list_type, expected).values)
  end

  def test_struct
    expected = [
      {"0" => {"sub_field" => true}},
      nil,
      {"1" => nil},
      {"0" => {"sub_field" => nil}},
    ]
    struct_type = {
      type: :struct,
      fields: [{name: :sub_field, type: :boolean}],
    }
    assert_equal(expected, build(struct_type, expected).values)
  end

  # Omitted up front; the body below documents the intended check and only
  # runs once the omit call is removed.
  def test_sparse_union
    omit("Need to add support for SparseUnionArrayBuilder")
    expected = [
      {"0" => {"field1" => true}},
      nil,
      {"1" => nil},
      {"0" => {"field2" => nil}},
    ]
    union_type = {
      type: :sparse_union,
      fields: [
        {name: :field1, type: :boolean},
        {name: :field2, type: :uint8},
      ],
      type_codes: [0, 1],
    }
    assert_equal(expected, build(union_type, expected).values)
  end

  # Omitted up front; the body below documents the intended check and only
  # runs once the omit call is removed.
  def test_dense_union
    omit("Need to add support for DenseUnionArrayBuilder")
    expected = [
      {"0" => {"field1" => true}},
      nil,
      {"1" => nil},
      {"0" => {"field2" => nil}},
    ]
    union_type = {
      type: :dense_union,
      fields: [
        {name: :field1, type: :boolean},
        {name: :field2, type: :uint8},
      ],
      type_codes: [0, 1],
    }
    assert_equal(expected, build(union_type, expected).values)
  end

  # Omitted up front; the body below documents the intended check and only
  # runs once the omit call is removed.
  def test_dictionary
    omit("Need to add support for DictionaryArrayBuilder")
    expected = [
      {"0" => "Ruby"},
      nil,
      {"1" => nil},
      {"0" => "GLib"},
    ]
    dictionary = Arrow::StringArray.new(["GLib", "Ruby"])
    dictionary_type = {
      type: :dictionary,
      index_data_type: :int8,
      dictionary: dictionary,
      ordered: true,
    }
    assert_equal(expected, build(dictionary_type, expected).values)
  end
end
472
+
473
# Runs the shared ValuesDenseUnionArrayTests cases against the dense union
# array itself.
class ValuesArrayDenseUnionArrayTest < Test::Unit::TestCase
  include ValuesDenseUnionArrayTests

  # Returns the array produced by the shared build_array helper unchanged, so
  # the tests call #values on it directly.
  def build(type, values)
    build_array(type, values)
  end
end
480
+
481
# Runs the shared ValuesDenseUnionArrayTests cases against a chunked array
# whose only chunk is the dense union array.
class ValuesChunkedArrayDenseUnionArrayTest < Test::Unit::TestCase
  include ValuesDenseUnionArrayTests

  # Builds the dense union with the shared build_array helper and wraps it in
  # a single-chunk Arrow::ChunkedArray.
  def build(type, values)
    union_array = build_array(type, values)
    Arrow::ChunkedArray.new([union_array])
  end
end