rchardet 1.6.1 → 1.7.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/lib/rchardet/universaldetector.rb +10 -0
- data/lib/rchardet/version.rb +1 -1
- metadata +3 -3
checksums.yaml
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
---
|
2
2
|
SHA1:
|
3
|
-
metadata.gz:
|
4
|
-
data.tar.gz:
|
3
|
+
metadata.gz: 3cdc02a9943abeba846fd618a5ee9f04fe8ef506
|
4
|
+
data.tar.gz: edeeefd5700589aa5bb8cbc371a6cd580e2557fc
|
5
5
|
SHA512:
|
6
|
-
metadata.gz:
|
7
|
-
data.tar.gz:
|
6
|
+
metadata.gz: facabfeae468c114f98ae3e6f38aedbf9c3a1f4393995b00d539903b67444a1124ed2a1307c56192263d6b28a9167766fd2fdd1c5eda2183379d37a679cb5a10
|
7
|
+
data.tar.gz: 374d62ffda808bfd64639de216087162d2f117fd78cbc87fc9bcd05162e00c0e311638a20748c8a7033b7ad5320ff2ab8d2011843e4400992c23548911fabc49
|
@@ -90,6 +90,16 @@ module CharDet
|
|
90
90
|
elsif aBuf[0, 2] == "\xFE\xFF"
|
91
91
|
# FE FF UTF-16, big endian BOM
|
92
92
|
@result = {'encoding' => "UTF-16BE", 'confidence' => 1.0}
|
93
|
+
elsif aBuf[0, 3] == "\x2B\x2F\x76" && ["\x38", "\x39", "\x2B", "\x2F"].include?(aBuf[3, 1])
|
94
|
+
# NOTE: Ruby only includes "dummy" support for UTF-7.
|
95
|
+
# A Ruby UTF-7 string can't have methods called on it, nor can it be converted to anything else, but "BINARY"/"ASCII-8BIT".
|
96
|
+
# Still, this doesn't make detection useless, as UTF-7 encodings exist in the wild, and the scenario may need to be handled.
|
97
|
+
# 2B 2F 76 38 UTF-7
|
98
|
+
# 2B 2F 76 39 UTF-7
|
99
|
+
# 2B 2F 76 2B UTF-7
|
100
|
+
# 2B 2F 76 2F UTF-7
|
101
|
+
# 2B 2F 76 38 2D UTF-7 with no following character (empty string)
|
102
|
+
@result = {'encoding' => "UTF-7", 'confidence' => 0.99}
|
93
103
|
end
|
94
104
|
end
|
95
105
|
|
data/lib/rchardet/version.rb
CHANGED
metadata
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: rchardet
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 1.6.1
|
4
|
+
version: 1.7.0
|
5
5
|
platform: ruby
|
6
6
|
authors:
|
7
7
|
- Michael Grosser
|
@@ -9,7 +9,7 @@ authors:
|
|
9
9
|
autorequire:
|
10
10
|
bindir: bin
|
11
11
|
cert_chain: []
|
12
|
-
date:
|
12
|
+
date: 2018-01-07 00:00:00.000000000 Z
|
13
13
|
dependencies: []
|
14
14
|
description:
|
15
15
|
email:
|
@@ -75,7 +75,7 @@ required_rubygems_version: !ruby/object:Gem::Requirement
|
|
75
75
|
version: '0'
|
76
76
|
requirements: []
|
77
77
|
rubyforge_project:
|
78
|
-
rubygems_version: 2.
|
78
|
+
rubygems_version: 2.6.14
|
79
79
|
signing_key:
|
80
80
|
specification_version: 4
|
81
81
|
summary: Character encoding auto-detection in Ruby. As smart as your browser. Open
|