simple_text_extract 3.0.6 → 3.0.8

Sign up to get free protection for your applications and to get access to all the features.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  SHA256:
3
- metadata.gz: 160e7942ed36cf8d4840b2a8bc3e833d8de5417e44b6d28524c17e81d471719e
4
- data.tar.gz: 3754f1cafc6b9c20b09030d07760d9720110eb19c98eac2045f07238dc11d19a
3
+ metadata.gz: 44412a154f56b1100983582f15f3d56800edf040dfac98a5ae9fb9b3fa2d6401
4
+ data.tar.gz: a6c5b2d94e13be12c71d3b4a66d0c2aef8fc6b7d7084a4c2b2d490e49954916d
5
5
  SHA512:
6
- metadata.gz: 12fb32bc9263cd2243d65132cf9b8ad2a4e65d8e2b864a01d658c7c91229226e285289f9d4121ff5f82b2c6a036511cb4bb7d8c782673c47cfe30af91768954c
7
- data.tar.gz: af3c753ae0dbe728c51b3963e1d92837be270cda3e1c1618a3cc0f5e99d80aeec82a2956043f0cffe57cf5f1a52122a1f9f822982f8676bc7bf9de6d978ce4f3
6
+ metadata.gz: 88e630c8aeee64240196e96c93675ba15a1a7c2f3c2c1a67ab51a05d35dc404a11574f61995628b2b399cd4d42570d40beddb55c0b6cda0bccece97415d995a7
7
+ data.tar.gz: 42ff8b4a4702c52702ac95b2bab6b79495384cdec6d9f68011fb04bfca778cf91442c010ab67ac0a1ee59d27148b00be43221fbd20392d6e96f53d4ec5ae7788
@@ -1,14 +1,20 @@
1
1
  name: build
2
- on: [push, pull_request]
2
+ on:
3
+ push:
4
+ branches:
5
+ - master
6
+ pull_request:
7
+ branches:
8
+ - master
3
9
  jobs:
4
10
  build:
5
11
  strategy:
6
12
  fail-fast: false
7
13
  matrix:
8
14
  include:
9
- - ruby: 3.2
15
+ - ruby: 3.3
10
16
  gemfile: Gemfile
11
- - ruby: 3.1
17
+ - ruby: 3.2
12
18
  gemfile: Gemfile
13
19
  runs-on: ubuntu-latest
14
20
  env:
data/.rubocop.yml CHANGED
@@ -111,5 +111,8 @@ Lint/MissingSuper:
111
111
  Lint/ConstantDefinitionInBlock:
112
112
  Enabled: false
113
113
 
114
+ Lint/SuppressedException:
115
+ Enabled: false
116
+
114
117
  Style/SingleArgumentDig:
115
118
  Enabled: false
data/.ruby-version CHANGED
@@ -1 +1 @@
1
- 3.2.2
1
+ 3.3.4
data/Gemfile.lock CHANGED
@@ -1,7 +1,7 @@
1
1
  PATH
2
2
  remote: .
3
3
  specs:
4
- simple_text_extract (3.0.6)
4
+ simple_text_extract (3.0.8)
5
5
  roo (~> 2.10.0)
6
6
  rubyzip (~> 2.3.2)
7
7
  spreadsheet (~> 1.3.0)
@@ -77,4 +77,4 @@ DEPENDENCIES
77
77
  simple_text_extract!
78
78
 
79
79
  BUNDLED WITH
80
- 2.4.10
80
+ 2.5.11
@@ -78,7 +78,7 @@ class SimpleTextExtract::Extract # rubocop:disable Metrics/ClassLength
78
78
  def pdf_extract
79
79
  return nil if SimpleTextExtract.missing_dependency?("pdftotext")
80
80
 
81
- `pdftotext #{Shellwords.escape(file.path)} -`
81
+ `pdftotext #{Shellwords.escape(file.path)} - 2>/dev/null`
82
82
  end
83
83
 
84
84
  def xlsx_extract
@@ -87,13 +87,14 @@ class SimpleTextExtract::Extract # rubocop:disable Metrics/ClassLength
87
87
  spreadsheet = Roo::Spreadsheet.open(file, only_visible_sheets: true)
88
88
 
89
89
  text = []
90
-
91
90
  spreadsheet.sheets.each_with_index do |name, i|
92
91
  text << "# Sheet Index: #{i}"
93
92
  text << "# Sheet Name: #{name}"
94
93
 
95
94
  spreadsheet.sheet(name)&.each_row_streaming do |row|
96
- text << row.map(&:to_s).join(" ")
95
+ text << row.map do |cell|
96
+ cell.value.to_s
97
+ end.join(" ")
97
98
  end
98
99
  end
99
100
 
@@ -1,5 +1,5 @@
1
1
  # frozen_string_literal: true
2
2
 
3
3
  module SimpleTextExtract
4
- VERSION = "3.0.6"
4
+ VERSION = "3.0.8"
5
5
  end
@@ -27,6 +27,6 @@ Gem::Specification.new do |spec|
27
27
  spec.requirements << "pdftotext/poppler"
28
28
 
29
29
  spec.add_dependency "roo", "~> 2.10.0"
30
- spec.add_dependency "spreadsheet", "~> 1.3.0"
31
30
  spec.add_dependency "rubyzip", "~> 2.3.2"
31
+ spec.add_dependency "spreadsheet", "~> 1.3.0"
32
32
  end
metadata CHANGED
@@ -1,7 +1,7 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: simple_text_extract
3
3
  version: !ruby/object:Gem::Version
4
- version: 3.0.6
4
+ version: 3.0.8
5
5
  platform: ruby
6
6
  authors:
7
7
  - Nick Weiland
@@ -25,33 +25,33 @@ dependencies:
25
25
  - !ruby/object:Gem::Version
26
26
  version: 2.10.0
27
27
  - !ruby/object:Gem::Dependency
28
- name: spreadsheet
28
+ name: rubyzip
29
29
  requirement: !ruby/object:Gem::Requirement
30
30
  requirements:
31
31
  - - "~>"
32
32
  - !ruby/object:Gem::Version
33
- version: 1.3.0
33
+ version: 2.3.2
34
34
  type: :runtime
35
35
  prerelease: false
36
36
  version_requirements: !ruby/object:Gem::Requirement
37
37
  requirements:
38
38
  - - "~>"
39
39
  - !ruby/object:Gem::Version
40
- version: 1.3.0
40
+ version: 2.3.2
41
41
  - !ruby/object:Gem::Dependency
42
- name: rubyzip
42
+ name: spreadsheet
43
43
  requirement: !ruby/object:Gem::Requirement
44
44
  requirements:
45
45
  - - "~>"
46
46
  - !ruby/object:Gem::Version
47
- version: 2.3.2
47
+ version: 1.3.0
48
48
  type: :runtime
49
49
  prerelease: false
50
50
  version_requirements: !ruby/object:Gem::Requirement
51
51
  requirements:
52
52
  - - "~>"
53
53
  - !ruby/object:Gem::Version
54
- version: 2.3.2
54
+ version: 1.3.0
55
55
  description: Extract text from various file types before resorting to an OCR solution.
56
56
  email:
57
57
  - nickweiland@gmail.com
@@ -97,7 +97,7 @@ required_rubygems_version: !ruby/object:Gem::Requirement
97
97
  requirements:
98
98
  - antiword
99
99
  - pdftotext/poppler
100
- rubygems_version: 3.5.5
100
+ rubygems_version: 3.5.15
101
101
  signing_key:
102
102
  specification_version: 4
103
103
  summary: Extract text from various file types before resorting to an OCR solution.