henkei 1.28.4.1 → 1.28.5.2
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +4 -4
- data/.github/workflows/test.yml +1 -1
- data/.rubocop.yml +1 -1
- data/Gemfile +9 -0
- data/henkei.gemspec +1 -11
- data/jar/{tika-app-1.28.4.jar → tika-app-1.28.5.jar} +0 -0
- data/lib/henkei/version.rb +1 -1
- data/lib/henkei.rb +2 -2
- metadata +6 -138
checksums.yaml
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
---
|
2
2
|
SHA256:
|
3
|
-
metadata.gz:
|
4
|
-
data.tar.gz:
|
3
|
+
metadata.gz: 5c4d344ed0b3e34f58c4fa5c5e8694b50acc9fb2765b2923aa342a2aeb37f924
|
4
|
+
data.tar.gz: 1bde6cdf92d957e707e71bb4763230e1a39e128efc447f842538c42f35e945c9
|
5
5
|
SHA512:
|
6
|
-
metadata.gz:
|
7
|
-
data.tar.gz:
|
6
|
+
metadata.gz: 14a19c09c4fbde49ce7774392793f26dbdcb8c9af5418cda6ce58b7583b6a0edc16640a55348ff1f7d64b7153359055fbaba91bfcd3217a285f2aafa5c7f4dc1
|
7
|
+
data.tar.gz: eaad5644f3e69cb7b1720284f6eac900e4598b7cec0c6745a622473176568b110f4a280c21213ecf55185b9ee304ea9574279a9cb5fd34a65578af0a89d2fe91
|
data/.github/workflows/test.yml
CHANGED
data/.rubocop.yml
CHANGED
data/Gemfile
CHANGED
@@ -4,3 +4,12 @@ source 'https://rubygems.org'
|
|
4
4
|
|
5
5
|
# Specify your gem's dependencies in henkei.gemspec
|
6
6
|
gemspec
|
7
|
+
|
8
|
+
gem 'bundler', '~> 2.0'
|
9
|
+
gem 'rake', '~> 12.3'
|
10
|
+
gem 'rspec', '~> 3.7'
|
11
|
+
gem 'rubocop', '~> 1.26'
|
12
|
+
gem 'rubocop-performance', '~> 1.13'
|
13
|
+
gem 'rubocop-rake', '~> 0.6'
|
14
|
+
gem 'rubocop-rspec', '~> 2.9'
|
15
|
+
gem 'simplecov', '~> 0.15', '< 0.18'
|
data/henkei.gemspec
CHANGED
@@ -15,7 +15,7 @@ Gem::Specification.new do |spec|
|
|
15
15
|
'(.doc, .docx, .pages, .odt, .rtf, .pdf) using Apache Tika toolkit'
|
16
16
|
spec.homepage = 'https://github.com/abrom/henkei'
|
17
17
|
spec.license = 'MIT'
|
18
|
-
spec.required_ruby_version = ['>=
|
18
|
+
spec.required_ruby_version = ['>= 3.0.0', '< 3.4.0']
|
19
19
|
|
20
20
|
# Prevent pushing this gem to RubyGems.org by setting 'allowed_push_host', or
|
21
21
|
# delete this section to allow pushing this gem to any host.
|
@@ -30,14 +30,4 @@ Gem::Specification.new do |spec|
|
|
30
30
|
|
31
31
|
spec.add_runtime_dependency 'json', '>= 1.8', '< 3'
|
32
32
|
spec.add_runtime_dependency 'mini_mime', '>= 0.1.1', '< 2'
|
33
|
-
|
34
|
-
spec.add_development_dependency 'bundler', '~> 2.0'
|
35
|
-
spec.add_development_dependency 'rails', '~> 5.0'
|
36
|
-
spec.add_development_dependency 'rake', '~> 12.3'
|
37
|
-
spec.add_development_dependency 'rspec', '~> 3.7'
|
38
|
-
spec.add_development_dependency 'rubocop', '~> 1.26'
|
39
|
-
spec.add_development_dependency 'rubocop-performance', '~> 1.13'
|
40
|
-
spec.add_development_dependency 'rubocop-rake', '~> 0.6'
|
41
|
-
spec.add_development_dependency 'rubocop-rspec', '~> 2.9'
|
42
|
-
spec.add_development_dependency 'simplecov', '~> 0.15', '< 0.18'
|
43
33
|
end
|
Binary file
|
data/lib/henkei/version.rb
CHANGED
data/lib/henkei.rb
CHANGED
@@ -25,7 +25,7 @@ require 'open3'
|
|
25
25
|
# Read text and metadata from files and documents using Apache Tika toolkit
|
26
26
|
class Henkei # rubocop:disable Metrics/ClassLength
|
27
27
|
GEM_PATH = File.dirname(File.dirname(__FILE__))
|
28
|
-
JAR_PATH = File.join(Henkei::GEM_PATH, 'jar', 'tika-app-1.28.
|
28
|
+
JAR_PATH = File.join(Henkei::GEM_PATH, 'jar', 'tika-app-1.28.5.jar')
|
29
29
|
CONFIG_PATH = File.join(Henkei::GEM_PATH, 'jar', 'tika-config.xml')
|
30
30
|
DEFAULT_SERVER_PORT = 9293 # an arbitrary, but perfectly cromulent, port
|
31
31
|
|
@@ -268,7 +268,7 @@ class Henkei # rubocop:disable Metrics/ClassLength
|
|
268
268
|
resp = +''
|
269
269
|
loop do
|
270
270
|
chunk = s.recv(65_536)
|
271
|
-
break if chunk
|
271
|
+
break if !chunk || chunk.empty?
|
272
272
|
|
273
273
|
resp << chunk
|
274
274
|
end
|
metadata
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: henkei
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 1.28.
|
4
|
+
version: 1.28.5.2
|
5
5
|
platform: ruby
|
6
6
|
authors:
|
7
7
|
- Erol Fornoles
|
@@ -9,7 +9,7 @@ authors:
|
|
9
9
|
autorequire:
|
10
10
|
bindir: bin
|
11
11
|
cert_chain: []
|
12
|
-
date:
|
12
|
+
date: 2024-05-01 00:00:00.000000000 Z
|
13
13
|
dependencies:
|
14
14
|
- !ruby/object:Gem::Dependency
|
15
15
|
name: json
|
@@ -51,138 +51,6 @@ dependencies:
|
|
51
51
|
- - "<"
|
52
52
|
- !ruby/object:Gem::Version
|
53
53
|
version: '2'
|
54
|
-
- !ruby/object:Gem::Dependency
|
55
|
-
name: bundler
|
56
|
-
requirement: !ruby/object:Gem::Requirement
|
57
|
-
requirements:
|
58
|
-
- - "~>"
|
59
|
-
- !ruby/object:Gem::Version
|
60
|
-
version: '2.0'
|
61
|
-
type: :development
|
62
|
-
prerelease: false
|
63
|
-
version_requirements: !ruby/object:Gem::Requirement
|
64
|
-
requirements:
|
65
|
-
- - "~>"
|
66
|
-
- !ruby/object:Gem::Version
|
67
|
-
version: '2.0'
|
68
|
-
- !ruby/object:Gem::Dependency
|
69
|
-
name: rails
|
70
|
-
requirement: !ruby/object:Gem::Requirement
|
71
|
-
requirements:
|
72
|
-
- - "~>"
|
73
|
-
- !ruby/object:Gem::Version
|
74
|
-
version: '5.0'
|
75
|
-
type: :development
|
76
|
-
prerelease: false
|
77
|
-
version_requirements: !ruby/object:Gem::Requirement
|
78
|
-
requirements:
|
79
|
-
- - "~>"
|
80
|
-
- !ruby/object:Gem::Version
|
81
|
-
version: '5.0'
|
82
|
-
- !ruby/object:Gem::Dependency
|
83
|
-
name: rake
|
84
|
-
requirement: !ruby/object:Gem::Requirement
|
85
|
-
requirements:
|
86
|
-
- - "~>"
|
87
|
-
- !ruby/object:Gem::Version
|
88
|
-
version: '12.3'
|
89
|
-
type: :development
|
90
|
-
prerelease: false
|
91
|
-
version_requirements: !ruby/object:Gem::Requirement
|
92
|
-
requirements:
|
93
|
-
- - "~>"
|
94
|
-
- !ruby/object:Gem::Version
|
95
|
-
version: '12.3'
|
96
|
-
- !ruby/object:Gem::Dependency
|
97
|
-
name: rspec
|
98
|
-
requirement: !ruby/object:Gem::Requirement
|
99
|
-
requirements:
|
100
|
-
- - "~>"
|
101
|
-
- !ruby/object:Gem::Version
|
102
|
-
version: '3.7'
|
103
|
-
type: :development
|
104
|
-
prerelease: false
|
105
|
-
version_requirements: !ruby/object:Gem::Requirement
|
106
|
-
requirements:
|
107
|
-
- - "~>"
|
108
|
-
- !ruby/object:Gem::Version
|
109
|
-
version: '3.7'
|
110
|
-
- !ruby/object:Gem::Dependency
|
111
|
-
name: rubocop
|
112
|
-
requirement: !ruby/object:Gem::Requirement
|
113
|
-
requirements:
|
114
|
-
- - "~>"
|
115
|
-
- !ruby/object:Gem::Version
|
116
|
-
version: '1.26'
|
117
|
-
type: :development
|
118
|
-
prerelease: false
|
119
|
-
version_requirements: !ruby/object:Gem::Requirement
|
120
|
-
requirements:
|
121
|
-
- - "~>"
|
122
|
-
- !ruby/object:Gem::Version
|
123
|
-
version: '1.26'
|
124
|
-
- !ruby/object:Gem::Dependency
|
125
|
-
name: rubocop-performance
|
126
|
-
requirement: !ruby/object:Gem::Requirement
|
127
|
-
requirements:
|
128
|
-
- - "~>"
|
129
|
-
- !ruby/object:Gem::Version
|
130
|
-
version: '1.13'
|
131
|
-
type: :development
|
132
|
-
prerelease: false
|
133
|
-
version_requirements: !ruby/object:Gem::Requirement
|
134
|
-
requirements:
|
135
|
-
- - "~>"
|
136
|
-
- !ruby/object:Gem::Version
|
137
|
-
version: '1.13'
|
138
|
-
- !ruby/object:Gem::Dependency
|
139
|
-
name: rubocop-rake
|
140
|
-
requirement: !ruby/object:Gem::Requirement
|
141
|
-
requirements:
|
142
|
-
- - "~>"
|
143
|
-
- !ruby/object:Gem::Version
|
144
|
-
version: '0.6'
|
145
|
-
type: :development
|
146
|
-
prerelease: false
|
147
|
-
version_requirements: !ruby/object:Gem::Requirement
|
148
|
-
requirements:
|
149
|
-
- - "~>"
|
150
|
-
- !ruby/object:Gem::Version
|
151
|
-
version: '0.6'
|
152
|
-
- !ruby/object:Gem::Dependency
|
153
|
-
name: rubocop-rspec
|
154
|
-
requirement: !ruby/object:Gem::Requirement
|
155
|
-
requirements:
|
156
|
-
- - "~>"
|
157
|
-
- !ruby/object:Gem::Version
|
158
|
-
version: '2.9'
|
159
|
-
type: :development
|
160
|
-
prerelease: false
|
161
|
-
version_requirements: !ruby/object:Gem::Requirement
|
162
|
-
requirements:
|
163
|
-
- - "~>"
|
164
|
-
- !ruby/object:Gem::Version
|
165
|
-
version: '2.9'
|
166
|
-
- !ruby/object:Gem::Dependency
|
167
|
-
name: simplecov
|
168
|
-
requirement: !ruby/object:Gem::Requirement
|
169
|
-
requirements:
|
170
|
-
- - "~>"
|
171
|
-
- !ruby/object:Gem::Version
|
172
|
-
version: '0.15'
|
173
|
-
- - "<"
|
174
|
-
- !ruby/object:Gem::Version
|
175
|
-
version: '0.18'
|
176
|
-
type: :development
|
177
|
-
prerelease: false
|
178
|
-
version_requirements: !ruby/object:Gem::Requirement
|
179
|
-
requirements:
|
180
|
-
- - "~>"
|
181
|
-
- !ruby/object:Gem::Version
|
182
|
-
version: '0.15'
|
183
|
-
- - "<"
|
184
|
-
- !ruby/object:Gem::Version
|
185
|
-
version: '0.18'
|
186
54
|
description: Read text and metadata from files and documents using Apache Tika toolkit
|
187
55
|
email:
|
188
56
|
- erol.fornoles@gmail.com
|
@@ -203,7 +71,7 @@ files:
|
|
203
71
|
- Rakefile
|
204
72
|
- bin/console
|
205
73
|
- henkei.gemspec
|
206
|
-
- jar/tika-app-1.28.
|
74
|
+
- jar/tika-app-1.28.5.jar
|
207
75
|
- jar/tika-config.xml
|
208
76
|
- lib/henkei.rb
|
209
77
|
- lib/henkei/configuration.rb
|
@@ -230,17 +98,17 @@ required_ruby_version: !ruby/object:Gem::Requirement
|
|
230
98
|
requirements:
|
231
99
|
- - ">="
|
232
100
|
- !ruby/object:Gem::Version
|
233
|
-
version:
|
101
|
+
version: 3.0.0
|
234
102
|
- - "<"
|
235
103
|
- !ruby/object:Gem::Version
|
236
|
-
version: 3.
|
104
|
+
version: 3.4.0
|
237
105
|
required_rubygems_version: !ruby/object:Gem::Requirement
|
238
106
|
requirements:
|
239
107
|
- - ">="
|
240
108
|
- !ruby/object:Gem::Version
|
241
109
|
version: '0'
|
242
110
|
requirements: []
|
243
|
-
rubygems_version: 3.
|
111
|
+
rubygems_version: 3.3.7
|
244
112
|
signing_key:
|
245
113
|
specification_version: 4
|
246
114
|
summary: Read text and metadata from files and documents (.doc, .docx, .pages, .odt,
|