red-arrow-dataset 1.0.0 → 4.0.1

Sign up to get free protection for your applications and to get access to all the features.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  SHA256:
3
- metadata.gz: f6765f578316707de9fdb029f2e16873d6a013888e30aa684bf1722745fb99ce
4
- data.tar.gz: 61425742e9849324c10ceba4801325b829a81c161b4fc618bfccd51256ddb399
3
+ metadata.gz: 00cf96f680d62ad003d931b3628313f83dd351b34222a59e5d1f85018ea20d7e
4
+ data.tar.gz: 399966d45ae4bb31868c9ae21df1b5ee6e6738297597b8536718db398f2a927b
5
5
  SHA512:
6
- metadata.gz: c0f53a37a9c77a662cc4256075d7d38b89b03eb1193764d26c1759d65397775953bc9f526854776a2b002f120efd3d091514a3a2d7cca523a041b62f350cd535
7
- data.tar.gz: a976fd8cf83bb3852b5c3518f01c07fad895d5ce0f76eb4b3a71a3046946d82349f343ba65b8f18b1b743beb598fab545fdadf73f897f5c1468b158a204326c8
6
+ metadata.gz: c61e5f5ecd8ed9b027091a55ca9213e206c71c7d13c6f11714ec4ad9cdf58c45b4811a46315e267a9fcbf7d5d7a893af2b2dd935dce23c6c898d0c4ae37f4a83
7
+ data.tar.gz: 0acea5814073860de6780405ff597227dd9fc0971b1312f2e51af2e43c710650968b301160ba4542498189728fb87f2a66cc9344293d80ea71efaba8fe25166c
@@ -19,6 +19,7 @@
19
19
 
20
20
  require "pkg-config"
21
21
  require "native-package-installer"
22
+ require_relative "../lib/arrow-dataset/version"
22
23
 
23
24
  case RUBY_PLATFORM
24
25
  when /mingw|mswin/
@@ -33,7 +34,10 @@ end
33
34
  namespace :dependency do
34
35
  desc "Check dependency"
35
36
  task :check do
36
- unless PKGConfig.check_version?("arrow-dataset-glib")
37
+ unless PKGConfig.check_version?("arrow-dataset-glib",
38
+ ArrowDataset::Version::MAJOR,
39
+ ArrowDataset::Version::MINOR,
40
+ ArrowDataset::Version::MICRO)
37
41
  unless NativePackageInstaller.install(:debian => "libarrow-dataset-glib-dev",
38
42
  :redhat => "arrow-dataset-glib-devel")
39
43
  exit(false)
@@ -0,0 +1,32 @@
1
+ # Licensed to the Apache Software Foundation (ASF) under one
2
+ # or more contributor license agreements. See the NOTICE file
3
+ # distributed with this work for additional information
4
+ # regarding copyright ownership. The ASF licenses this file
5
+ # to you under the Apache License, Version 2.0 (the
6
+ # "License"); you may not use this file except in compliance
7
+ # with the License. You may obtain a copy of the License at
8
+ #
9
+ # http://www.apache.org/licenses/LICENSE-2.0
10
+ #
11
+ # Unless required by applicable law or agreed to in writing,
12
+ # software distributed under the License is distributed on an
13
+ # "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
14
+ # KIND, either express or implied. See the License for the
15
+ # specific language governing permissions and limitations
16
+ # under the License.
17
+
18
+ module ArrowDataset
19
+ class InMemoryFragment
20
+ alias_method :initialize_raw, :initialize
21
+ private :initialize_raw
22
+ def initialize(schema, record_batches)
23
+ record_batches = record_batches.collect do |record_batch|
24
+ unless record_batch.is_a?(Arrow::RecordBatch)
25
+ record_batch = Arrow::RecordBatch.new(record_batch)
26
+ end
27
+ record_batch
28
+ end
29
+ initialize_raw(schema, record_batches)
30
+ end
31
+ end
32
+ end
@@ -26,9 +26,10 @@ module ArrowDataset
26
26
  end
27
27
  record_batch
28
28
  end
29
- context = options.delete(:context) || ScanContext.new
30
29
  options[:schema] ||= record_batches.first.schema
31
- initialize_raw(record_batches, options, context)
30
+ fragment = options.delete(:fragment)
31
+ fragment ||= InMemoryFragment.new(options[:schema], record_batches)
32
+ initialize_raw(record_batches, options, fragment)
32
33
  end
33
34
  end
34
35
  end
@@ -16,7 +16,7 @@
16
16
  # under the License.
17
17
 
18
18
  module ArrowDataset
19
- VERSION = "1.0.0"
19
+ VERSION = "4.0.1"
20
20
 
21
21
  module Version
22
22
  numbers, TAG = VERSION.split("-")
metadata CHANGED
@@ -1,14 +1,14 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: red-arrow-dataset
3
3
  version: !ruby/object:Gem::Version
4
- version: 1.0.0
4
+ version: 4.0.1
5
5
  platform: ruby
6
6
  authors:
7
7
  - Apache Arrow Developers
8
- autorequire:
8
+ autorequire:
9
9
  bindir: bin
10
10
  cert_chain: []
11
- date: 2020-07-24 00:00:00.000000000 Z
11
+ date: 2021-05-27 00:00:00.000000000 Z
12
12
  dependencies:
13
13
  - !ruby/object:Gem::Dependency
14
14
  name: red-arrow
@@ -16,14 +16,14 @@ dependencies:
16
16
  requirements:
17
17
  - - '='
18
18
  - !ruby/object:Gem::Version
19
- version: 1.0.0
19
+ version: 4.0.1
20
20
  type: :runtime
21
21
  prerelease: false
22
22
  version_requirements: !ruby/object:Gem::Requirement
23
23
  requirements:
24
24
  - - '='
25
25
  - !ruby/object:Gem::Version
26
- version: 1.0.0
26
+ version: 4.0.1
27
27
  - !ruby/object:Gem::Dependency
28
28
  name: bundler
29
29
  requirement: !ruby/object:Gem::Requirement
@@ -82,6 +82,7 @@ files:
82
82
  - Rakefile
83
83
  - dependency-check/Rakefile
84
84
  - lib/arrow-dataset.rb
85
+ - lib/arrow-dataset/in-memory-fragment.rb
85
86
  - lib/arrow-dataset/in-memory-scan-task.rb
86
87
  - lib/arrow-dataset/loader.rb
87
88
  - lib/arrow-dataset/scan-options.rb
@@ -95,7 +96,7 @@ homepage: https://arrow.apache.org/
95
96
  licenses:
96
97
  - Apache-2.0
97
98
  metadata: {}
98
- post_install_message:
99
+ post_install_message:
99
100
  rdoc_options: []
100
101
  require_paths:
101
102
  - lib
@@ -110,12 +111,12 @@ required_rubygems_version: !ruby/object:Gem::Requirement
110
111
  - !ruby/object:Gem::Version
111
112
  version: '0'
112
113
  requirements: []
113
- rubygems_version: 3.1.2
114
- signing_key:
114
+ rubygems_version: 3.2.5
115
+ signing_key:
115
116
  specification_version: 4
116
117
  summary: Red Arrow Dataset is the Ruby bindings of Apache Arrow Dataset
117
118
  test_files:
118
- - test/run-test.rb
119
119
  - test/helper.rb
120
+ - test/run-test.rb
120
121
  - test/test-scan-options.rb
121
122
  - test/test-in-memory-scan-task.rb