simple_text_extract 3.0.0 → 3.0.1

This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the package versions as they appear in their respective public registries.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  SHA256:
3
- metadata.gz: 411c821b9a0f6ab4f5b95d0104786fbca88c42ab97fa4bd41e8443baae7c80a3
4
- data.tar.gz: e6034b96a08ed5bea7abc61e0fb0c762e4c16c44a1e4d54adbc7eff2d9a8bcab
3
+ metadata.gz: 4d97ba86e11c6ad6e14e3e2af600eddc00378747a693a51be38a15da7c73b9b5
4
+ data.tar.gz: 401dd3aee14d95cc750397bc7b9e6393dbb49eb45d9369d39096a5a6046cb0d8
5
5
  SHA512:
6
- metadata.gz: 87d96e6217062b72e104ac1165475d3af497937532fe7f03364128086f6ab61d490d650d60030813783ba32c418bbab564455dc0659882724e6711d9a612cc4d
7
- data.tar.gz: 645af90b82616a06805603d2417498890f6fbb53c0d2661934b9ec40d686550c97a42b5bbcc9cf8fe90c049367e45a2e8dd76af8f29d375d8f501beed5be4b16
6
+ metadata.gz: 76156def8c686dca8dba70e7ac36fb58a65757610c7cdb9bfd73c9a13c161d64db1730a21bcf5746a75398cfea2bc1a47e52acfd2e038c414e1a102df05b7854
7
+ data.tar.gz: f327f06da4692531b051e291f20529889e123c508f15643ade8486819b2ac91ab04bde79b1ed5b6091d3bf8e28c3895fcdbf3cf1148367c16fb2743190aab159
data/CHANGELOG.md CHANGED
@@ -1,4 +1,8 @@
1
- ## 2.0.0 (2023-04-14)
1
+ ## 3.0.1 (2023-04-17)
2
+
3
+ - Fixes printing of Roo::Excelx::Cell::Empty for empty rows
4
+
5
+ ## 3.0.0 (2023-04-14)
2
6
 
3
7
  - [BREAKING CHANGE] Improves format of text extracts to better support post processing into sentences/rows. This will only cause issues if you have tests/code that relies on the specific format of whitespace characters in the resulting extracts. For example, the docx extract will now preserve newline characters.
4
8
  - Improves memory allocation for xlsx files using `Roo#each_row_streaming`
data/Gemfile.lock CHANGED
@@ -1,7 +1,7 @@
1
1
  PATH
2
2
  remote: .
3
3
  specs:
4
- simple_text_extract (3.0.0)
4
+ simple_text_extract (3.0.1)
5
5
  roo (~> 2.10.0)
6
6
  rubyzip (~> 2.3.2)
7
7
  spreadsheet (~> 1.3.0)
@@ -88,10 +88,13 @@ class SimpleTextExtract::Extract
88
88
 
89
89
  text = []
90
90
 
91
- spreadsheet.sheets.each do |name|
92
- text << name
91
+ spreadsheet.sheets.each_with_index do |name, i|
92
+ text << "# Sheet Index: #{i}"
93
+ text << "# Sheet Name: #{name}"
93
94
 
94
- spreadsheet.sheet(name)&.each_row_streaming { |row| text << row.join(" ") }
95
+ spreadsheet.sheet(name)&.each_row_streaming do |row|
96
+ text << row.filter(&:present?).join(" ")
97
+ end
95
98
  end
96
99
 
97
100
  text.join("\n")
@@ -1,5 +1,5 @@
1
1
  # frozen_string_literal: true
2
2
 
3
3
  module SimpleTextExtract
4
- VERSION = "3.0.0"
4
+ VERSION = "3.0.1"
5
5
  end
metadata CHANGED
@@ -1,14 +1,14 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: simple_text_extract
3
3
  version: !ruby/object:Gem::Version
4
- version: 3.0.0
4
+ version: 3.0.1
5
5
  platform: ruby
6
6
  authors:
7
7
  - Nick Weiland
8
8
  autorequire:
9
9
  bindir: exe
10
10
  cert_chain: []
11
- date: 2023-04-14 00:00:00.000000000 Z
11
+ date: 2023-04-17 00:00:00.000000000 Z
12
12
  dependencies:
13
13
  - !ruby/object:Gem::Dependency
14
14
  name: roo