simple_text_extract 3.0.5 → 3.0.6

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  SHA256:
3
- metadata.gz: 48a3c8805698e6f4af386789e4b4f11e9a3e38425bb1c2ce467ec7cefa99f2ba
4
- data.tar.gz: f66a75c47984d63cf41b4f09f8c874f94da1f2928dddf268b4aac5ce48413f85
3
+ metadata.gz: 160e7942ed36cf8d4840b2a8bc3e833d8de5417e44b6d28524c17e81d471719e
4
+ data.tar.gz: 3754f1cafc6b9c20b09030d07760d9720110eb19c98eac2045f07238dc11d19a
5
5
  SHA512:
6
- metadata.gz: 5c8a892a0916945062f298c1b78728f62962ccca8404c9aabc7724db73b0806f00c1074bac7e13a94d390c7b67d19b7f5398ef96ea6ef41439ea66ba4bf78d3b
7
- data.tar.gz: f0de6277f88c6debeaaac4bea385b3ba6e4d9180f53e5a2cef288ce5f80a30e92f67ad7e46c08aa908fb5ee30ccaffb1aaf0ea5ac4560cb2aa8262c8a610ce05
6
+ metadata.gz: 12fb32bc9263cd2243d65132cf9b8ad2a4e65d8e2b864a01d658c7c91229226e285289f9d4121ff5f82b2c6a036511cb4bb7d8c782673c47cfe30af91768954c
7
+ data.tar.gz: af3c753ae0dbe728c51b3963e1d92837be270cda3e1c1618a3cc0f5e99d80aeec82a2956043f0cffe57cf5f1a52122a1f9f822982f8676bc7bf9de6d978ce4f3
data/CHANGELOG.md CHANGED
@@ -1,3 +1,7 @@
1
+ ## 3.0.6 (2024-07-12)
2
+
3
+ - Stop depending on ActiveSupport (#present?)
4
+
1
5
  ## 3.0.3 (2023-04-27)
2
6
 
3
7
  - Add support for extracting text from tables in DOCX files.
data/Gemfile.lock CHANGED
@@ -1,7 +1,7 @@
1
1
  PATH
2
2
  remote: .
3
3
  specs:
4
- simple_text_extract (3.0.5)
4
+ simple_text_extract (3.0.6)
5
5
  roo (~> 2.10.0)
6
6
  rubyzip (~> 2.3.2)
7
7
  spreadsheet (~> 1.3.0)
@@ -10,54 +10,56 @@ GEM
10
10
  remote: https://rubygems.org/
11
11
  specs:
12
12
  ast (2.4.2)
13
- base64 (0.1.1)
13
+ bigdecimal (3.1.8)
14
14
  coderay (1.1.3)
15
- json (2.6.3)
15
+ json (2.7.2)
16
16
  language_server-protocol (3.17.0.3)
17
- memory_profiler (1.0.1)
18
- method_source (1.0.0)
19
- minitest (5.20.0)
20
- mocha (2.1.0)
17
+ memory_profiler (1.0.2)
18
+ method_source (1.1.0)
19
+ minitest (5.24.1)
20
+ mocha (2.4.0)
21
21
  ruby2_keywords (>= 0.0.5)
22
- nokogiri (1.15.4-arm64-darwin)
22
+ nokogiri (1.16.6-arm64-darwin)
23
23
  racc (~> 1.4)
24
- nokogiri (1.15.4-x86_64-linux)
24
+ nokogiri (1.16.6-x86_64-linux)
25
25
  racc (~> 1.4)
26
- parallel (1.23.0)
27
- parser (3.2.2.4)
26
+ parallel (1.25.1)
27
+ parser (3.3.4.0)
28
28
  ast (~> 2.4.1)
29
29
  racc
30
30
  pry (0.14.2)
31
31
  coderay (~> 1.1)
32
32
  method_source (~> 1.0)
33
- racc (1.7.1)
33
+ racc (1.8.0)
34
34
  rainbow (3.1.1)
35
- rake (13.0.6)
36
- regexp_parser (2.8.2)
37
- rexml (3.2.6)
38
- roo (2.10.0)
35
+ rake (13.2.1)
36
+ regexp_parser (2.9.2)
37
+ rexml (3.3.1)
38
+ strscan
39
+ roo (2.10.1)
39
40
  nokogiri (~> 1)
40
41
  rubyzip (>= 1.3.0, < 3.0.0)
41
- rubocop (1.57.1)
42
- base64 (~> 0.1.1)
42
+ rubocop (1.65.0)
43
43
  json (~> 2.3)
44
44
  language_server-protocol (>= 3.17.0)
45
45
  parallel (~> 1.10)
46
- parser (>= 3.2.2.4)
46
+ parser (>= 3.3.0.2)
47
47
  rainbow (>= 2.2.2, < 4.0)
48
- regexp_parser (>= 1.8, < 3.0)
48
+ regexp_parser (>= 2.4, < 3.0)
49
49
  rexml (>= 3.2.5, < 4.0)
50
- rubocop-ast (>= 1.28.1, < 2.0)
50
+ rubocop-ast (>= 1.31.1, < 2.0)
51
51
  ruby-progressbar (~> 1.7)
52
52
  unicode-display_width (>= 2.4.0, < 3.0)
53
- rubocop-ast (1.29.0)
54
- parser (>= 3.2.1.0)
55
- ruby-ole (1.2.12.2)
53
+ rubocop-ast (1.31.3)
54
+ parser (>= 3.3.1.0)
55
+ ruby-ole (1.2.13.1)
56
56
  ruby-progressbar (1.13.0)
57
57
  ruby2_keywords (0.0.5)
58
58
  rubyzip (2.3.2)
59
- spreadsheet (1.3.0)
59
+ spreadsheet (1.3.1)
60
+ bigdecimal
60
61
  ruby-ole
62
+ strscan (3.1.0)
61
63
  unicode-display_width (2.5.0)
62
64
 
63
65
  PLATFORMS
@@ -93,7 +93,7 @@ class SimpleTextExtract::Extract # rubocop:disable Metrics/ClassLength
93
93
  text << "# Sheet Name: #{name}"
94
94
 
95
95
  spreadsheet.sheet(name)&.each_row_streaming do |row|
96
- text << row.filter(&:present?).join(" ")
96
+ text << row.map(&:to_s).join(" ")
97
97
  end
98
98
  end
99
99
 
@@ -1,5 +1,5 @@
1
1
  # frozen_string_literal: true
2
2
 
3
3
  module SimpleTextExtract
4
- VERSION = "3.0.5"
4
+ VERSION = "3.0.6"
5
5
  end
metadata CHANGED
@@ -1,14 +1,14 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: simple_text_extract
3
3
  version: !ruby/object:Gem::Version
4
- version: 3.0.5
4
+ version: 3.0.6
5
5
  platform: ruby
6
6
  authors:
7
7
  - Nick Weiland
8
8
  autorequire:
9
9
  bindir: exe
10
10
  cert_chain: []
11
- date: 2023-10-23 00:00:00.000000000 Z
11
+ date: 2024-07-12 00:00:00.000000000 Z
12
12
  dependencies:
13
13
  - !ruby/object:Gem::Dependency
14
14
  name: roo
@@ -60,7 +60,7 @@ extensions: []
60
60
  extra_rdoc_files: []
61
61
  files:
62
62
  - "-"
63
- - ".github/workflows/build.yml"
63
+ - ".github/workflows/test.yml"
64
64
  - ".gitignore"
65
65
  - ".rubocop.yml"
66
66
  - ".ruby-version"
@@ -97,7 +97,7 @@ required_rubygems_version: !ruby/object:Gem::Requirement
97
97
  requirements:
98
98
  - antiword
99
99
  - pdftotext/poppler
100
- rubygems_version: 3.4.10
100
+ rubygems_version: 3.5.5
101
101
  signing_key:
102
102
  specification_version: 4
103
103
  summary: Extract text from various file types before resorting to an OCR solution.
File without changes