algolia_html_extractor 2.3.0 → 2.4.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  SHA1:
3
- metadata.gz: 2935d48da689f8b8064f82fe45d08294973b537b
4
- data.tar.gz: e4eaf98057448f77c4ffa4472e479d8f331ccf48
3
+ metadata.gz: 9dcc5416e75d46b8b0b18e78f920b7b588cdb853
4
+ data.tar.gz: 19ea9540c519f30a9e04caa71d4216531dc97295
5
5
  SHA512:
6
- metadata.gz: 2b97bd8f04d84d81bf5adbc4063163c43e3b5c53f2cfa8297b3fac07d0b3542ea3ca135068dbf9e63b3444b5604a2cd34645f79328491b14c7445eeafc897ab8
7
- data.tar.gz: 1c7e7f1edfb75945ef179dffb5138f3fdb408273653e2c2612fcd7ff73c5d86eebf68aa1911bc65d4974ab867667b36a9d9e26a672ff50d94981e5eae6f88fbc
6
+ metadata.gz: 0fff97d2b4fdbc2c7588f3df01f21f8f98b4e2a719348f93ddde54e53b6474d78627d6227ac242928506439a62b8533ea9dbb8145f9c88e02d835e5d9dab43a7
7
+ data.tar.gz: 956d98cb1a1f06139d53bc29a8c10ce40b9c4287fc0d3285238f3f74e8b1b8602110874ce61685f5a543e3556246a6dbbb6e00ecb205fa2687a08def76e9c4a1
data/README.md CHANGED
@@ -75,7 +75,6 @@ Here is one of the records extracted:
75
75
  ```ruby
76
76
  {
77
77
  :objectID => "1f5923d5a60e998704f201bbe9964811",
78
- :tag_name => "p",
79
78
  :html => "<p>The hero quits his job, hits the road, or whatever cuts him from his previous life.</p>",
80
79
  :text => "The hero quits his job, hits the road, or whatever cuts him from his previous life.",
81
80
  :node => #<Nokogiri::XML::Element:0x11a5850 name="p">,
@@ -99,9 +98,6 @@ Here is one of the records extracted:
99
98
  Each record has an `objectID` that uniquely identifies it (computed by a hash of all
100
99
  the other values).
101
100
 
102
- It also contains the HTML tag name in `tag_name` (by default `<p>`
103
- paragraphs are extracted, but see the [settings][7] on how to change it).
104
-
105
101
  `html` contains the whole `outerContent` of the element, including the wrapping
106
102
  tags and inner children. The `text` attribute contains the textual content,
107
103
  stripping out all HTML.
@@ -63,7 +63,6 @@ module AlgoliaHTMLExtractor
63
63
  item = {
64
64
  html: extract_html(node),
65
65
  content: content,
66
- tag_name: extract_tag_name(node),
67
66
  hierarchy: current_hierarchy.clone,
68
67
  anchor: current_anchor,
69
68
  node: node,
@@ -1,6 +1,6 @@
1
1
  # Expose gem version
2
2
  # rubocop:disable Style/SingleLineMethods
3
3
  class AlgoliaHTMLExtractorVersion
4
- def self.to_s; '2.3.0' end
4
+ def self.to_s; '2.4.0' end
5
5
  end
6
6
  # rubocop:enable Style/SingleLineMethods
metadata CHANGED
@@ -1,7 +1,7 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: algolia_html_extractor
3
3
  version: !ruby/object:Gem::Version
4
- version: 2.3.0
4
+ version: 2.4.0
5
5
  platform: ruby
6
6
  authors:
7
7
  - Tim Carry