embulk 0.10.44-java → 0.10.45-java
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/embulk.gemspec +2 -2
- data/lib/embulk/gem_version.rb +1 -1
- data/lib/embulk/guess/charset.rb +4 -23
- metadata +3 -3
checksums.yaml
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
---
|
2
2
|
SHA1:
|
3
|
-
metadata.gz:
|
4
|
-
data.tar.gz:
|
3
|
+
metadata.gz: cdf29acae0add6fde587d70e8673b73108c5ef6e
|
4
|
+
data.tar.gz: 6c68e1355ccb2996cb40b2c271e3b37f41ae9422
|
5
5
|
SHA512:
|
6
|
-
metadata.gz:
|
7
|
-
data.tar.gz:
|
6
|
+
metadata.gz: fb768d8e7cfd7eaecae90a8bdfde631eb6e920043d83dbbeb36961acdc185acac2d3f131831ba8a415e1854fe0c06b2c5c14b1edcdb3da6bd369a8988fb104d3
|
7
|
+
data.tar.gz: e5d41d6d88ff3d34f69950e90fb5486e6f3da55283e1b2b422f9d9953d162195b6499778d060bbd73df8396d758f23f23773e70b7c37a2eb98e28df66bc0c7fc
|
data/embulk.gemspec
CHANGED
@@ -1,6 +1,6 @@
|
|
1
1
|
Gem::Specification.new do |gem|
|
2
2
|
gem.name = "embulk"
|
3
|
-
gem.version = "0.10.44"
|
3
|
+
gem.version = "0.10.45"
|
4
4
|
gem.license = "Apache-2.0"
|
5
5
|
|
6
6
|
gem.summary = "Embulk's runtime library for Ruby."
|
@@ -33,7 +33,7 @@ Gem::Specification.new do |gem|
|
|
33
33
|
"documentation_uri" => "https://www.embulk.org/",
|
34
34
|
"homepage_uri" => gem.homepage,
|
35
35
|
# "mailing_list_uri" => "",
|
36
|
-
"source_code_uri" => "https://github.com/embulk/embulk/tree/v0.10.44",
|
36
|
+
"source_code_uri" => "https://github.com/embulk/embulk/tree/v0.10.45",
|
37
37
|
# "wiki_uri" => "",
|
38
38
|
}
|
39
39
|
end
|
data/lib/embulk/gem_version.rb
CHANGED
data/lib/embulk/guess/charset.rb
CHANGED
@@ -4,30 +4,11 @@ module Embulk
|
|
4
4
|
class CharsetGuessPlugin < GuessPlugin
|
5
5
|
Plugin.register_guess('charset', self)
|
6
6
|
|
7
|
-
STATIC_MAPPING = {
|
8
|
-
# ISO-8859-1 means ASCII which is a subset of UTF-8 in most of cases
|
9
|
-
# due to lack of sample data set.
|
10
|
-
"ISO-8859-1" => "UTF-8",
|
11
|
-
|
12
|
-
# Shift_JIS is used almost only by Windows that uses "CP932" in fact.
|
13
|
-
# And "CP932" called by Microsoft actually means "MS932" in Java.
|
14
|
-
"Shift_JIS" => "MS932",
|
15
|
-
}
|
16
|
-
|
17
7
|
def guess(config, sample_buffer)
|
18
|
-
|
19
|
-
|
20
|
-
|
21
|
-
|
22
|
-
if best_match.getConfidence < 50
|
23
|
-
name = "UTF-8"
|
24
|
-
else
|
25
|
-
name = best_match.getName
|
26
|
-
if mapped_name = STATIC_MAPPING[name]
|
27
|
-
name = mapped_name
|
28
|
-
end
|
29
|
-
end
|
30
|
-
return {"parser" => {"charset" => name}}
|
8
|
+
Embulk.logger.warn(
|
9
|
+
"Ruby-based CharsetGuess is no longer available. "
|
10
|
+
+ "It always returns \"UTF-8\" unconditionally. Use an appropriate guess plugin explicitly."
|
11
|
+
return {"parser" => {"charset" => "UTF-8"}}
|
31
12
|
end
|
32
13
|
end
|
33
14
|
|
metadata
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: embulk
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 0.10.44
|
4
|
+
version: 0.10.45
|
5
5
|
platform: java
|
6
6
|
authors:
|
7
7
|
- Sadayuki Furuhashi
|
@@ -10,7 +10,7 @@ authors:
|
|
10
10
|
autorequire:
|
11
11
|
bindir: bin
|
12
12
|
cert_chain: []
|
13
|
-
date: 2023-03
|
13
|
+
date: 2023-04-03 00:00:00.000000000 Z
|
14
14
|
dependencies:
|
15
15
|
- !ruby/object:Gem::Dependency
|
16
16
|
requirement: !ruby/object:Gem::Requirement
|
@@ -78,7 +78,7 @@ metadata:
|
|
78
78
|
changelog_uri: https://github.com/embulk/embulk/releases
|
79
79
|
documentation_uri: https://www.embulk.org/
|
80
80
|
homepage_uri: https://www.embulk.org/
|
81
|
-
source_code_uri: https://github.com/embulk/embulk/tree/v0.10.44
|
81
|
+
source_code_uri: https://github.com/embulk/embulk/tree/v0.10.45
|
82
82
|
post_install_message:
|
83
83
|
rdoc_options: []
|
84
84
|
require_paths:
|