simple_text_extract 3.0.5 → 3.0.6

Sign up to get free protection for your applications and to get access to all the features.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  SHA256:
3
- metadata.gz: 48a3c8805698e6f4af386789e4b4f11e9a3e38425bb1c2ce467ec7cefa99f2ba
4
- data.tar.gz: f66a75c47984d63cf41b4f09f8c874f94da1f2928dddf268b4aac5ce48413f85
3
+ metadata.gz: 160e7942ed36cf8d4840b2a8bc3e833d8de5417e44b6d28524c17e81d471719e
4
+ data.tar.gz: 3754f1cafc6b9c20b09030d07760d9720110eb19c98eac2045f07238dc11d19a
5
5
  SHA512:
6
- metadata.gz: 5c8a892a0916945062f298c1b78728f62962ccca8404c9aabc7724db73b0806f00c1074bac7e13a94d390c7b67d19b7f5398ef96ea6ef41439ea66ba4bf78d3b
7
- data.tar.gz: f0de6277f88c6debeaaac4bea385b3ba6e4d9180f53e5a2cef288ce5f80a30e92f67ad7e46c08aa908fb5ee30ccaffb1aaf0ea5ac4560cb2aa8262c8a610ce05
6
+ metadata.gz: 12fb32bc9263cd2243d65132cf9b8ad2a4e65d8e2b864a01d658c7c91229226e285289f9d4121ff5f82b2c6a036511cb4bb7d8c782673c47cfe30af91768954c
7
+ data.tar.gz: af3c753ae0dbe728c51b3963e1d92837be270cda3e1c1618a3cc0f5e99d80aeec82a2956043f0cffe57cf5f1a52122a1f9f822982f8676bc7bf9de6d978ce4f3
data/CHANGELOG.md CHANGED
@@ -1,3 +1,7 @@
1
+ ## 3.0.6 (2024-07-12)
2
+
3
+ - Stop depending on ActiveSupport (#present?)
4
+
1
5
  ## 3.0.3 (2023-04-27)
2
6
 
3
7
  - Add support for extracting text from tables in DOCX files.
data/Gemfile.lock CHANGED
@@ -1,7 +1,7 @@
1
1
  PATH
2
2
  remote: .
3
3
  specs:
4
- simple_text_extract (3.0.5)
4
+ simple_text_extract (3.0.6)
5
5
  roo (~> 2.10.0)
6
6
  rubyzip (~> 2.3.2)
7
7
  spreadsheet (~> 1.3.0)
@@ -10,54 +10,56 @@ GEM
10
10
  remote: https://rubygems.org/
11
11
  specs:
12
12
  ast (2.4.2)
13
- base64 (0.1.1)
13
+ bigdecimal (3.1.8)
14
14
  coderay (1.1.3)
15
- json (2.6.3)
15
+ json (2.7.2)
16
16
  language_server-protocol (3.17.0.3)
17
- memory_profiler (1.0.1)
18
- method_source (1.0.0)
19
- minitest (5.20.0)
20
- mocha (2.1.0)
17
+ memory_profiler (1.0.2)
18
+ method_source (1.1.0)
19
+ minitest (5.24.1)
20
+ mocha (2.4.0)
21
21
  ruby2_keywords (>= 0.0.5)
22
- nokogiri (1.15.4-arm64-darwin)
22
+ nokogiri (1.16.6-arm64-darwin)
23
23
  racc (~> 1.4)
24
- nokogiri (1.15.4-x86_64-linux)
24
+ nokogiri (1.16.6-x86_64-linux)
25
25
  racc (~> 1.4)
26
- parallel (1.23.0)
27
- parser (3.2.2.4)
26
+ parallel (1.25.1)
27
+ parser (3.3.4.0)
28
28
  ast (~> 2.4.1)
29
29
  racc
30
30
  pry (0.14.2)
31
31
  coderay (~> 1.1)
32
32
  method_source (~> 1.0)
33
- racc (1.7.1)
33
+ racc (1.8.0)
34
34
  rainbow (3.1.1)
35
- rake (13.0.6)
36
- regexp_parser (2.8.2)
37
- rexml (3.2.6)
38
- roo (2.10.0)
35
+ rake (13.2.1)
36
+ regexp_parser (2.9.2)
37
+ rexml (3.3.1)
38
+ strscan
39
+ roo (2.10.1)
39
40
  nokogiri (~> 1)
40
41
  rubyzip (>= 1.3.0, < 3.0.0)
41
- rubocop (1.57.1)
42
- base64 (~> 0.1.1)
42
+ rubocop (1.65.0)
43
43
  json (~> 2.3)
44
44
  language_server-protocol (>= 3.17.0)
45
45
  parallel (~> 1.10)
46
- parser (>= 3.2.2.4)
46
+ parser (>= 3.3.0.2)
47
47
  rainbow (>= 2.2.2, < 4.0)
48
- regexp_parser (>= 1.8, < 3.0)
48
+ regexp_parser (>= 2.4, < 3.0)
49
49
  rexml (>= 3.2.5, < 4.0)
50
- rubocop-ast (>= 1.28.1, < 2.0)
50
+ rubocop-ast (>= 1.31.1, < 2.0)
51
51
  ruby-progressbar (~> 1.7)
52
52
  unicode-display_width (>= 2.4.0, < 3.0)
53
- rubocop-ast (1.29.0)
54
- parser (>= 3.2.1.0)
55
- ruby-ole (1.2.12.2)
53
+ rubocop-ast (1.31.3)
54
+ parser (>= 3.3.1.0)
55
+ ruby-ole (1.2.13.1)
56
56
  ruby-progressbar (1.13.0)
57
57
  ruby2_keywords (0.0.5)
58
58
  rubyzip (2.3.2)
59
- spreadsheet (1.3.0)
59
+ spreadsheet (1.3.1)
60
+ bigdecimal
60
61
  ruby-ole
62
+ strscan (3.1.0)
61
63
  unicode-display_width (2.5.0)
62
64
 
63
65
  PLATFORMS
@@ -93,7 +93,7 @@ class SimpleTextExtract::Extract # rubocop:disable Metrics/ClassLength
93
93
  text << "# Sheet Name: #{name}"
94
94
 
95
95
  spreadsheet.sheet(name)&.each_row_streaming do |row|
96
- text << row.filter(&:present?).join(" ")
96
+ text << row.map(&:to_s).join(" ")
97
97
  end
98
98
  end
99
99
 
@@ -1,5 +1,5 @@
1
1
  # frozen_string_literal: true
2
2
 
3
3
  module SimpleTextExtract
4
- VERSION = "3.0.5"
4
+ VERSION = "3.0.6"
5
5
  end
metadata CHANGED
@@ -1,14 +1,14 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: simple_text_extract
3
3
  version: !ruby/object:Gem::Version
4
- version: 3.0.5
4
+ version: 3.0.6
5
5
  platform: ruby
6
6
  authors:
7
7
  - Nick Weiland
8
8
  autorequire:
9
9
  bindir: exe
10
10
  cert_chain: []
11
- date: 2023-10-23 00:00:00.000000000 Z
11
+ date: 2024-07-12 00:00:00.000000000 Z
12
12
  dependencies:
13
13
  - !ruby/object:Gem::Dependency
14
14
  name: roo
@@ -60,7 +60,7 @@ extensions: []
60
60
  extra_rdoc_files: []
61
61
  files:
62
62
  - "-"
63
- - ".github/workflows/build.yml"
63
+ - ".github/workflows/test.yml"
64
64
  - ".gitignore"
65
65
  - ".rubocop.yml"
66
66
  - ".ruby-version"
@@ -97,7 +97,7 @@ required_rubygems_version: !ruby/object:Gem::Requirement
97
97
  requirements:
98
98
  - antiword
99
99
  - pdftotext/poppler
100
- rubygems_version: 3.4.10
100
+ rubygems_version: 3.5.5
101
101
  signing_key:
102
102
  specification_version: 4
103
103
  summary: Extract text from various file types before resorting to an OCR solution.
File without changes