red-arrow-dataset 1.0.0 → 4.0.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  SHA256:
3
- metadata.gz: f6765f578316707de9fdb029f2e16873d6a013888e30aa684bf1722745fb99ce
4
- data.tar.gz: 61425742e9849324c10ceba4801325b829a81c161b4fc618bfccd51256ddb399
3
+ metadata.gz: 00cf96f680d62ad003d931b3628313f83dd351b34222a59e5d1f85018ea20d7e
4
+ data.tar.gz: 399966d45ae4bb31868c9ae21df1b5ee6e6738297597b8536718db398f2a927b
5
5
  SHA512:
6
- metadata.gz: c0f53a37a9c77a662cc4256075d7d38b89b03eb1193764d26c1759d65397775953bc9f526854776a2b002f120efd3d091514a3a2d7cca523a041b62f350cd535
7
- data.tar.gz: a976fd8cf83bb3852b5c3518f01c07fad895d5ce0f76eb4b3a71a3046946d82349f343ba65b8f18b1b743beb598fab545fdadf73f897f5c1468b158a204326c8
6
+ metadata.gz: c61e5f5ecd8ed9b027091a55ca9213e206c71c7d13c6f11714ec4ad9cdf58c45b4811a46315e267a9fcbf7d5d7a893af2b2dd935dce23c6c898d0c4ae37f4a83
7
+ data.tar.gz: 0acea5814073860de6780405ff597227dd9fc0971b1312f2e51af2e43c710650968b301160ba4542498189728fb87f2a66cc9344293d80ea71efaba8fe25166c
@@ -19,6 +19,7 @@
19
19
 
20
20
  require "pkg-config"
21
21
  require "native-package-installer"
22
+ require_relative "../lib/arrow-dataset/version"
22
23
 
23
24
  case RUBY_PLATFORM
24
25
  when /mingw|mswin/
@@ -33,7 +34,10 @@ end
33
34
  namespace :dependency do
34
35
  desc "Check dependency"
35
36
  task :check do
36
- unless PKGConfig.check_version?("arrow-dataset-glib")
37
+ unless PKGConfig.check_version?("arrow-dataset-glib",
38
+ ArrowDataset::Version::MAJOR,
39
+ ArrowDataset::Version::MINOR,
40
+ ArrowDataset::Version::MICRO)
37
41
  unless NativePackageInstaller.install(:debian => "libarrow-dataset-glib-dev",
38
42
  :redhat => "arrow-dataset-glib-devel")
39
43
  exit(false)
@@ -0,0 +1,32 @@
1
+ # Licensed to the Apache Software Foundation (ASF) under one
2
+ # or more contributor license agreements. See the NOTICE file
3
+ # distributed with this work for additional information
4
+ # regarding copyright ownership. The ASF licenses this file
5
+ # to you under the Apache License, Version 2.0 (the
6
+ # "License"); you may not use this file except in compliance
7
+ # with the License. You may obtain a copy of the License at
8
+ #
9
+ # http://www.apache.org/licenses/LICENSE-2.0
10
+ #
11
+ # Unless required by applicable law or agreed to in writing,
12
+ # software distributed under the License is distributed on an
13
+ # "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
14
+ # KIND, either express or implied. See the License for the
15
+ # specific language governing permissions and limitations
16
+ # under the License.
17
+
18
+ module ArrowDataset
19
+ class InMemoryFragment
20
+ alias_method :initialize_raw, :initialize
21
+ private :initialize_raw
22
+ def initialize(schema, record_batches)
23
+ record_batches = record_batches.collect do |record_batch|
24
+ unless record_batch.is_a?(Arrow::RecordBatch)
25
+ record_batch = Arrow::RecordBatch.new(record_batch)
26
+ end
27
+ record_batch
28
+ end
29
+ initialize_raw(schema, record_batches)
30
+ end
31
+ end
32
+ end
@@ -26,9 +26,10 @@ module ArrowDataset
26
26
  end
27
27
  record_batch
28
28
  end
29
- context = options.delete(:context) || ScanContext.new
30
29
  options[:schema] ||= record_batches.first.schema
31
- initialize_raw(record_batches, options, context)
30
+ fragment = options.delete(:fragment)
31
+ fragment ||= InMemoryFragment.new(options[:schema], record_batches)
32
+ initialize_raw(record_batches, options, fragment)
32
33
  end
33
34
  end
34
35
  end
@@ -16,7 +16,7 @@
16
16
  # under the License.
17
17
 
18
18
  module ArrowDataset
19
- VERSION = "1.0.0"
19
+ VERSION = "4.0.1"
20
20
 
21
21
  module Version
22
22
  numbers, TAG = VERSION.split("-")
metadata CHANGED
@@ -1,14 +1,14 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: red-arrow-dataset
3
3
  version: !ruby/object:Gem::Version
4
- version: 1.0.0
4
+ version: 4.0.1
5
5
  platform: ruby
6
6
  authors:
7
7
  - Apache Arrow Developers
8
- autorequire:
8
+ autorequire:
9
9
  bindir: bin
10
10
  cert_chain: []
11
- date: 2020-07-24 00:00:00.000000000 Z
11
+ date: 2021-05-27 00:00:00.000000000 Z
12
12
  dependencies:
13
13
  - !ruby/object:Gem::Dependency
14
14
  name: red-arrow
@@ -16,14 +16,14 @@ dependencies:
16
16
  requirements:
17
17
  - - '='
18
18
  - !ruby/object:Gem::Version
19
- version: 1.0.0
19
+ version: 4.0.1
20
20
  type: :runtime
21
21
  prerelease: false
22
22
  version_requirements: !ruby/object:Gem::Requirement
23
23
  requirements:
24
24
  - - '='
25
25
  - !ruby/object:Gem::Version
26
- version: 1.0.0
26
+ version: 4.0.1
27
27
  - !ruby/object:Gem::Dependency
28
28
  name: bundler
29
29
  requirement: !ruby/object:Gem::Requirement
@@ -82,6 +82,7 @@ files:
82
82
  - Rakefile
83
83
  - dependency-check/Rakefile
84
84
  - lib/arrow-dataset.rb
85
+ - lib/arrow-dataset/in-memory-fragment.rb
85
86
  - lib/arrow-dataset/in-memory-scan-task.rb
86
87
  - lib/arrow-dataset/loader.rb
87
88
  - lib/arrow-dataset/scan-options.rb
@@ -95,7 +96,7 @@ homepage: https://arrow.apache.org/
95
96
  licenses:
96
97
  - Apache-2.0
97
98
  metadata: {}
98
- post_install_message:
99
+ post_install_message:
99
100
  rdoc_options: []
100
101
  require_paths:
101
102
  - lib
@@ -110,12 +111,12 @@ required_rubygems_version: !ruby/object:Gem::Requirement
110
111
  - !ruby/object:Gem::Version
111
112
  version: '0'
112
113
  requirements: []
113
- rubygems_version: 3.1.2
114
- signing_key:
114
+ rubygems_version: 3.2.5
115
+ signing_key:
115
116
  specification_version: 4
116
117
  summary: Red Arrow Dataset is the Ruby bindings of Apache Arrow Dataset
117
118
  test_files:
118
- - test/run-test.rb
119
119
  - test/helper.rb
120
+ - test/run-test.rb
120
121
  - test/test-scan-options.rb
121
122
  - test/test-in-memory-scan-task.rb