boilerpipe-ruby 0.4.2 → 0.4.3
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/CHANGELOG.md +9 -1
- data/boilerpipe-ruby.gemspec +3 -3
- data/lib/boilerpipe/document/text_document.rb +4 -6
- data/lib/boilerpipe/version.rb +1 -1
- metadata +13 -13
checksums.yaml
CHANGED
|
@@ -1,7 +1,7 @@
|
|
|
1
1
|
---
|
|
2
2
|
SHA256:
|
|
3
|
-
metadata.gz:
|
|
4
|
-
data.tar.gz:
|
|
3
|
+
metadata.gz: da8bc0b8d74eea14b73e61812bbeba5fef75e8bae2330739e49b28e26f73d14d
|
|
4
|
+
data.tar.gz: 68fee529b501210cf3278eb2b045b09e6d27c7846355b7d430c05e60f39088e2
|
|
5
5
|
SHA512:
|
|
6
|
-
metadata.gz:
|
|
7
|
-
data.tar.gz:
|
|
6
|
+
metadata.gz: 4202afab2a01ae588977fde351dfacc29551634077e794d028282666c43d3aeb09adf425d60608dc694c36f2fd8ed034ef89ba41ee07e6ad23f426c19d740931
|
|
7
|
+
data.tar.gz: a0dc75a0c5384e1eaf8b50dfb92bc9294b41f38e8b0e0cceb9e9a6aafdf436629df2b3420f61a33523a08d6788c02ade799cdf8fe29db4338c766c7b01523704
|
data/CHANGELOG.md
CHANGED
|
@@ -1,3 +1,11 @@
|
|
|
1
|
+
# 0.4.3 / 2020-07-18
|
|
2
|
+
|
|
3
|
+
* update deps
|
|
4
|
+
|
|
5
|
+
# 0.4.2 / 2020-03-11
|
|
6
|
+
|
|
7
|
+
* update deps
|
|
8
|
+
|
|
1
9
|
# 0.4.1 / 2019-07-04
|
|
2
10
|
|
|
3
11
|
* Fix bug in min_clause_words_filter ( used in article_sentence_extractor )
|
|
@@ -35,4 +43,4 @@
|
|
|
35
43
|
|
|
36
44
|
# 0.1.0 / 2017-09-08
|
|
37
45
|
|
|
38
|
-
* Add Article Extractor
|
|
46
|
+
* Add Article Extractor
|
data/boilerpipe-ruby.gemspec
CHANGED
|
@@ -21,7 +21,7 @@ Gem::Specification.new do |spec|
|
|
|
21
21
|
|
|
22
22
|
spec.add_development_dependency 'bundler', '~> 2.0'
|
|
23
23
|
spec.add_development_dependency 'rake', '>= 12.3.3'
|
|
24
|
-
spec.add_development_dependency 'rickshaw', '~> 0.
|
|
25
|
-
spec.add_development_dependency 'rspec', '~> 3.
|
|
26
|
-
spec.add_runtime_dependency 'nokogiri', '
|
|
24
|
+
spec.add_development_dependency 'rickshaw', '~> 0.5.0'
|
|
25
|
+
spec.add_development_dependency 'rspec', '~> 3.9'
|
|
26
|
+
spec.add_runtime_dependency 'nokogiri', '~> 1.10'
|
|
27
27
|
end
|
data/lib/boilerpipe/document/text_document.rb
CHANGED
|
@@ -19,16 +19,14 @@ module Boilerpipe
|
|
|
19
19
|
case text_block.is_content?
|
|
20
20
|
when true
|
|
21
21
|
next unless include_content
|
|
22
|
-
|
|
23
|
-
s << text_block.text
|
|
24
|
-
s << "\n"
|
|
25
22
|
when false
|
|
26
23
|
next unless include_noncontent
|
|
27
|
-
|
|
28
|
-
s << text_block.text
|
|
29
|
-
s << "\n"
|
|
30
24
|
end
|
|
25
|
+
|
|
26
|
+
s << text_block.text
|
|
27
|
+
s << "\n"
|
|
31
28
|
end
|
|
29
|
+
|
|
32
30
|
s
|
|
33
31
|
end
|
|
34
32
|
|
data/lib/boilerpipe/version.rb
CHANGED
metadata
CHANGED
|
@@ -1,14 +1,14 @@
|
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
|
2
2
|
name: boilerpipe-ruby
|
|
3
3
|
version: !ruby/object:Gem::Version
|
|
4
|
-
version: 0.4.
|
|
4
|
+
version: 0.4.3
|
|
5
5
|
platform: ruby
|
|
6
6
|
authors:
|
|
7
7
|
- Gregory Ostermayr
|
|
8
|
-
autorequire:
|
|
8
|
+
autorequire:
|
|
9
9
|
bindir: exe
|
|
10
10
|
cert_chain: []
|
|
11
|
-
date: 2020-
|
|
11
|
+
date: 2020-07-22 00:00:00.000000000 Z
|
|
12
12
|
dependencies:
|
|
13
13
|
- !ruby/object:Gem::Dependency
|
|
14
14
|
name: bundler
|
|
@@ -44,42 +44,42 @@ dependencies:
|
|
|
44
44
|
requirements:
|
|
45
45
|
- - "~>"
|
|
46
46
|
- !ruby/object:Gem::Version
|
|
47
|
-
version: 0.
|
|
47
|
+
version: 0.5.0
|
|
48
48
|
type: :development
|
|
49
49
|
prerelease: false
|
|
50
50
|
version_requirements: !ruby/object:Gem::Requirement
|
|
51
51
|
requirements:
|
|
52
52
|
- - "~>"
|
|
53
53
|
- !ruby/object:Gem::Version
|
|
54
|
-
version: 0.
|
|
54
|
+
version: 0.5.0
|
|
55
55
|
- !ruby/object:Gem::Dependency
|
|
56
56
|
name: rspec
|
|
57
57
|
requirement: !ruby/object:Gem::Requirement
|
|
58
58
|
requirements:
|
|
59
59
|
- - "~>"
|
|
60
60
|
- !ruby/object:Gem::Version
|
|
61
|
-
version: '3.
|
|
61
|
+
version: '3.9'
|
|
62
62
|
type: :development
|
|
63
63
|
prerelease: false
|
|
64
64
|
version_requirements: !ruby/object:Gem::Requirement
|
|
65
65
|
requirements:
|
|
66
66
|
- - "~>"
|
|
67
67
|
- !ruby/object:Gem::Version
|
|
68
|
-
version: '3.
|
|
68
|
+
version: '3.9'
|
|
69
69
|
- !ruby/object:Gem::Dependency
|
|
70
70
|
name: nokogiri
|
|
71
71
|
requirement: !ruby/object:Gem::Requirement
|
|
72
72
|
requirements:
|
|
73
|
-
- - "
|
|
73
|
+
- - "~>"
|
|
74
74
|
- !ruby/object:Gem::Version
|
|
75
|
-
version: 1.
|
|
75
|
+
version: '1.10'
|
|
76
76
|
type: :runtime
|
|
77
77
|
prerelease: false
|
|
78
78
|
version_requirements: !ruby/object:Gem::Requirement
|
|
79
79
|
requirements:
|
|
80
|
-
- - "
|
|
80
|
+
- - "~>"
|
|
81
81
|
- !ruby/object:Gem::Version
|
|
82
|
-
version: 1.
|
|
82
|
+
version: '1.10'
|
|
83
83
|
description: A pure ruby implementation of the boilerpipe web content extraction algorithm
|
|
84
84
|
email:
|
|
85
85
|
- "<gregory.ostermayr@gmail.com>"
|
|
@@ -154,7 +154,7 @@ homepage: https://github.com/gregors/boilerpipe-ruby
|
|
|
154
154
|
licenses:
|
|
155
155
|
- Apache 2.0
|
|
156
156
|
metadata: {}
|
|
157
|
-
post_install_message:
|
|
157
|
+
post_install_message:
|
|
158
158
|
rdoc_options: []
|
|
159
159
|
require_paths:
|
|
160
160
|
- lib
|
|
@@ -170,7 +170,7 @@ required_rubygems_version: !ruby/object:Gem::Requirement
|
|
|
170
170
|
version: '0'
|
|
171
171
|
requirements: []
|
|
172
172
|
rubygems_version: 3.0.8
|
|
173
|
-
signing_key:
|
|
173
|
+
signing_key:
|
|
174
174
|
specification_version: 4
|
|
175
175
|
summary: A pure ruby implementation of the boilerpipe web content extraction algorithm
|
|
176
176
|
test_files: []
|