simple_text_extract 3.0.0 → 3.0.2
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +4 -4
- data/CHANGELOG.md +9 -1
- data/Gemfile.lock +1 -1
- data/lib/simple_text_extract/extract.rb +6 -3
- data/lib/simple_text_extract/version.rb +1 -1
- data/lib/simple_text_extract.rb +1 -1
- metadata +2 -2
checksums.yaml
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
---
|
2
2
|
SHA256:
|
3
|
-
metadata.gz:
|
4
|
-
data.tar.gz:
|
3
|
+
metadata.gz: 388ec404e856a47441f3bb3e23873d70eff4fabf86d96afcfeb6f7ad324e262d
|
4
|
+
data.tar.gz: 054f2cdb252b91ae14bdc678af1b75d433bfc6266d68ccace27ce4ec829c6484
|
5
5
|
SHA512:
|
6
|
-
metadata.gz:
|
7
|
-
data.tar.gz:
|
6
|
+
metadata.gz: 5c5a9d4f02bd00f32495803f60b2552d084f204a39df5c239d29e9be2c04013ae44b865c805c750c3a52a51a5e9b93a358e97d386a351aa16460664e048bac61
|
7
|
+
data.tar.gz: f7bc4192659abaf6653f58c01b446e11e483dddad2efb91ebf077a88767346f50997d87ba8af5d4ab26e7ac2ed7bf6a4393fecf75b78b1968662a266e251a84e
|
data/CHANGELOG.md
CHANGED
@@ -1,4 +1,12 @@
|
|
1
|
-
## 3.0.0 (2023-04-14)
|
1
|
+
## 3.0.2 (2023-04-18)
|
2
|
+
|
3
|
+
- Coerces filename in `SimpleTextExtract.supports?(filename:)` to string.
|
4
|
+
|
5
|
+
## 3.0.1 (2023-04-17)
|
6
|
+
|
7
|
+
- Fixes printing of Roo::Excelx::Cell::Empty for empty rows
|
8
|
+
|
9
|
+
## 3.0.0 (2023-04-14)
|
2
10
|
|
3
11
|
- [BREAKING CHANGE] Improves format of text extracts to better support post processing into sentences/rows. This will only cause issues if you have tests/code that relies on the specific format of whitespace characters in the resulting extracts. For example, the docx extract will now preserve newline characters.
|
4
12
|
- Improves memory allocation for xlsx files using `Roo#each_row_streaming`
|
data/Gemfile.lock
CHANGED
data/lib/simple_text_extract/extract.rb
CHANGED
@@ -88,10 +88,13 @@ class SimpleTextExtract::Extract
|
|
88
88
|
|
89
89
|
text = []
|
90
90
|
|
91
|
-
spreadsheet.sheets.
|
92
|
-
text <<
|
91
|
+
spreadsheet.sheets.each_with_index do |name, i|
|
92
|
+
text << "# Sheet Index: #{i}"
|
93
|
+
text << "# Sheet Name: #{name}"
|
93
94
|
|
94
|
-
spreadsheet.sheet(name)&.each_row_streaming
|
95
|
+
spreadsheet.sheet(name)&.each_row_streaming do |row|
|
96
|
+
text << row.filter(&:present?).join(" ")
|
97
|
+
end
|
95
98
|
end
|
96
99
|
|
97
100
|
text.join("\n")
|
data/lib/simple_text_extract.rb
CHANGED
metadata
CHANGED
@@ -1,14 +1,14 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: simple_text_extract
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 3.0.0
|
4
|
+
version: 3.0.2
|
5
5
|
platform: ruby
|
6
6
|
authors:
|
7
7
|
- Nick Weiland
|
8
8
|
autorequire:
|
9
9
|
bindir: exe
|
10
10
|
cert_chain: []
|
11
|
-
date: 2023-04-
|
11
|
+
date: 2023-04-18 00:00:00.000000000 Z
|
12
12
|
dependencies:
|
13
13
|
- !ruby/object:Gem::Dependency
|
14
14
|
name: roo
|