html-to-markdown 2.14.1 → 2.14.2
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
checksums.yaml
CHANGED
|
@@ -1,7 +1,7 @@
|
|
|
1
1
|
---
|
|
2
2
|
SHA256:
|
|
3
|
-
metadata.gz:
|
|
4
|
-
data.tar.gz:
|
|
3
|
+
metadata.gz: 3b8f5d14713f391a39c77222107b33764ced9559cc484bfe916e94e091eafb0f
|
|
4
|
+
data.tar.gz: 123d48de7bb0d423ca4c92333462596202969c182bcd8c7b9021d0fe4ff2ea88
|
|
5
5
|
SHA512:
|
|
6
|
-
metadata.gz:
|
|
7
|
-
data.tar.gz:
|
|
6
|
+
metadata.gz: d1987a2a62c32d8bfe67ecde0f73d7d161065461feb2a471dc15cd67e5f46ba93a55e46522b20eb63871ed0b6a056216022c966261093161a767b359cec27e19
|
|
7
|
+
data.tar.gz: 74c7cb93a0ed5186afc81d40fd4c03c19beb725880ff8d234706b898864710ec17711a9488cb8a81fb70c128f47eb5b9c1ee148ab65d648494a1dab918b66114
|
data/Gemfile.lock
CHANGED
|
@@ -1,7 +1,7 @@
|
|
|
1
1
|
PATH
|
|
2
2
|
remote: .
|
|
3
3
|
specs:
|
|
4
|
-
html-to-markdown (2.14.
|
|
4
|
+
html-to-markdown (2.14.2)
|
|
5
5
|
rb_sys (>= 0.9, < 1.0)
|
|
6
6
|
|
|
7
7
|
GEM
|
|
@@ -33,14 +33,14 @@ GEM
|
|
|
33
33
|
fileutils (1.8.0)
|
|
34
34
|
i18n (1.14.7)
|
|
35
35
|
concurrent-ruby (~> 1.0)
|
|
36
|
-
json (2.
|
|
36
|
+
json (2.18.0)
|
|
37
37
|
language_server-protocol (3.17.0.5)
|
|
38
38
|
lint_roller (1.1.0)
|
|
39
39
|
listen (3.9.0)
|
|
40
40
|
rb-fsevent (~> 0.10, >= 0.10.3)
|
|
41
41
|
rb-inotify (~> 0.9, >= 0.9.10)
|
|
42
42
|
logger (1.7.0)
|
|
43
|
-
minitest (5.
|
|
43
|
+
minitest (5.27.0)
|
|
44
44
|
mutex_m (0.3.0)
|
|
45
45
|
parallel (1.27.0)
|
|
46
46
|
parser (3.3.10.0)
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
[package]
|
|
2
2
|
name = "html-to-markdown-rb"
|
|
3
|
-
version = "2.14.
|
|
3
|
+
version = "2.14.2"
|
|
4
4
|
edition = "2024"
|
|
5
5
|
authors = ["Na'aman Hirschfeld <nhirschfeld@gmail.com>"]
|
|
6
6
|
license = "MIT"
|
|
@@ -22,7 +22,7 @@ default = ["metadata"]
|
|
|
22
22
|
metadata = ["html-to-markdown-rs/metadata"]
|
|
23
23
|
|
|
24
24
|
[dependencies]
|
|
25
|
-
html-to-markdown-rs = { version = "2.14.
|
|
25
|
+
html-to-markdown-rs = { version = "2.14.2", features = ["inline-images"] }
|
|
26
26
|
magnus = { git = "https://github.com/matsadler/magnus", rev = "f6db11769efb517427bf7f121f9c32e18b059b38", features = ["rb-sys"] }
|
|
27
27
|
|
|
28
28
|
[dev-dependencies]
|
|
@@ -681,7 +681,6 @@ fn convert_with_metadata_fn(ruby: &Ruby, args: &[Value]) -> Result<Value, Error>
|
|
|
681
681
|
let (markdown, metadata) =
|
|
682
682
|
guard_panic(|| convert_with_metadata_inner(&html, Some(options), metadata_config)).map_err(conversion_error)?;
|
|
683
683
|
|
|
684
|
-
// Convert to Ruby array [markdown, metadata_hash]
|
|
685
684
|
let array = ruby.ary_new();
|
|
686
685
|
array.push(markdown)?;
|
|
687
686
|
array.push(extended_metadata_to_ruby(ruby, metadata)?)?;
|
|
@@ -349,7 +349,6 @@ RSpec.describe HtmlToMarkdown do
|
|
|
349
349
|
HTML
|
|
350
350
|
_, metadata = described_class.convert_with_metadata(html)
|
|
351
351
|
|
|
352
|
-
# Structured data extraction may vary by implementation
|
|
353
352
|
expect(metadata[:structured_data]).to be_an(Array)
|
|
354
353
|
end
|
|
355
354
|
end
|
|
@@ -382,7 +381,6 @@ RSpec.describe HtmlToMarkdown do
|
|
|
382
381
|
html = '<html><head><title> Title with spaces </title></head><body><p>Content</p></body></html>'
|
|
383
382
|
_, metadata = described_class.convert_with_metadata(html)
|
|
384
383
|
|
|
385
|
-
# Whitespace may be normalized
|
|
386
384
|
expect(metadata[:document][:title]).to match(/Title.*spaces/)
|
|
387
385
|
end
|
|
388
386
|
|
|
@@ -398,7 +396,6 @@ RSpec.describe HtmlToMarkdown do
|
|
|
398
396
|
HTML
|
|
399
397
|
_, metadata = described_class.convert_with_metadata(html)
|
|
400
398
|
|
|
401
|
-
# Last value typically wins, but implementation may vary
|
|
402
399
|
expect(metadata[:document][:author]).to be_a(String)
|
|
403
400
|
end
|
|
404
401
|
end
|
metadata
CHANGED
|
@@ -1,14 +1,14 @@
|
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
|
2
2
|
name: html-to-markdown
|
|
3
3
|
version: !ruby/object:Gem::Version
|
|
4
|
-
version: 2.14.
|
|
4
|
+
version: 2.14.2
|
|
5
5
|
platform: ruby
|
|
6
6
|
authors:
|
|
7
7
|
- Na'aman Hirschfeld
|
|
8
8
|
autorequire:
|
|
9
9
|
bindir: exe
|
|
10
10
|
cert_chain: []
|
|
11
|
-
date: 2025-12-
|
|
11
|
+
date: 2025-12-13 00:00:00.000000000 Z
|
|
12
12
|
dependencies:
|
|
13
13
|
- !ruby/object:Gem::Dependency
|
|
14
14
|
name: rb_sys
|