simple_text_extract 3.0.0 → 3.0.2
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/CHANGELOG.md +9 -1
- data/Gemfile.lock +1 -1
- data/lib/simple_text_extract/extract.rb +6 -3
- data/lib/simple_text_extract/version.rb +1 -1
- data/lib/simple_text_extract.rb +1 -1
- metadata +2 -2
checksums.yaml
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
---
|
2
2
|
SHA256:
|
3
|
-
metadata.gz:
|
4
|
-
data.tar.gz:
|
3
|
+
metadata.gz: 388ec404e856a47441f3bb3e23873d70eff4fabf86d96afcfeb6f7ad324e262d
|
4
|
+
data.tar.gz: 054f2cdb252b91ae14bdc678af1b75d433bfc6266d68ccace27ce4ec829c6484
|
5
5
|
SHA512:
|
6
|
-
metadata.gz:
|
7
|
-
data.tar.gz:
|
6
|
+
metadata.gz: 5c5a9d4f02bd00f32495803f60b2552d084f204a39df5c239d29e9be2c04013ae44b865c805c750c3a52a51a5e9b93a358e97d386a351aa16460664e048bac61
|
7
|
+
data.tar.gz: f7bc4192659abaf6653f58c01b446e11e483dddad2efb91ebf077a88767346f50997d87ba8af5d4ab26e7ac2ed7bf6a4393fecf75b78b1968662a266e251a84e
|
data/CHANGELOG.md
CHANGED
@@ -1,4 +1,12 @@
|
|
1
|
-
##
|
1
|
+
## 3.0.2 (2023-04-18)
|
2
|
+
|
3
|
+
- Coerces filename in `SimpleTextExtract.supports?(filename:)` to string.
|
4
|
+
|
5
|
+
## 3.0.1 (2023-04-17)
|
6
|
+
|
7
|
+
- Fixes printing of Roo::Excelx::Cell::Empty for empty rows
|
8
|
+
|
9
|
+
## 3.0.0 (2023-04-14)
|
2
10
|
|
3
11
|
- [BREAKING CHANGE] Improves format of text extracts to better support post processing into sentences/rows. This will only cause issues if you have tests/code that relies on the specific format of whitespace characters in the resulting extracts. For example, the docx extract will now preserve newline characters.
|
4
12
|
- Improves memory allocation for xlsx files using `Roo#each_row_streaming`
|
data/Gemfile.lock
CHANGED
data/lib/simple_text_extract/extract.rb
CHANGED
@@ -88,10 +88,13 @@ class SimpleTextExtract::Extract
|
|
88
88
|
|
89
89
|
text = []
|
90
90
|
|
91
|
-
spreadsheet.sheets.
|
92
|
-
text <<
|
91
|
+
spreadsheet.sheets.each_with_index do |name, i|
|
92
|
+
text << "# Sheet Index: #{i}"
|
93
|
+
text << "# Sheet Name: #{name}"
|
93
94
|
|
94
|
-
spreadsheet.sheet(name)&.each_row_streaming
|
95
|
+
spreadsheet.sheet(name)&.each_row_streaming do |row|
|
96
|
+
text << row.filter(&:present?).join(" ")
|
97
|
+
end
|
95
98
|
end
|
96
99
|
|
97
100
|
text.join("\n")
|
data/lib/simple_text_extract.rb
CHANGED
metadata
CHANGED
@@ -1,14 +1,14 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: simple_text_extract
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 3.0.0
|
4
|
+
version: 3.0.2
|
5
5
|
platform: ruby
|
6
6
|
authors:
|
7
7
|
- Nick Weiland
|
8
8
|
autorequire:
|
9
9
|
bindir: exe
|
10
10
|
cert_chain: []
|
11
|
-
date: 2023-04-14 00:00:00.000000000 Z
|
11
|
+
date: 2023-04-18 00:00:00.000000000 Z
|
12
12
|
dependencies:
|
13
13
|
- !ruby/object:Gem::Dependency
|
14
14
|
name: roo
|