hpricot 0.8.1-x86-mswin32 → 0.8.2-x86-mswin32
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- data/CHANGELOG +13 -0
- data/README +6 -15
- data/Rakefile +40 -28
- data/ext/fast_xs/FastXsService.java +13 -1
- data/ext/hpricot_scan/HpricotCss.java +831 -0
- data/ext/hpricot_scan/HpricotScanService.java +1168 -387
- data/ext/hpricot_scan/hpricot_css.c +101 -100
- data/ext/hpricot_scan/hpricot_css.java.rl +155 -0
- data/ext/hpricot_scan/hpricot_scan.c +287 -128
- data/ext/hpricot_scan/hpricot_scan.java.rl +1078 -299
- data/ext/hpricot_scan/hpricot_scan.rl +2 -0
- data/lib/fast_xs.so +0 -0
- data/lib/hpricot/tag.rb +31 -12
- data/lib/hpricot/traverse.rb +1 -0
- data/lib/hpricot_scan.so +0 -0
- data/test/test_alter.rb +21 -2
- data/test/test_parser.rb +8 -0
- data/test/test_preserved.rb +18 -0
- metadata +30 -29
- data/ext/hpricot_scan/test.rb +0 -4
data/lib/fast_xs.so
CHANGED
Binary file
|
data/lib/hpricot/tag.rb
CHANGED
@@ -38,15 +38,20 @@ module Hpricot
|
|
38
38
|
end
|
39
39
|
end
|
40
40
|
|
41
|
-
class
|
42
|
-
|
43
|
-
|
44
|
-
|
41
|
+
class Attributes
|
42
|
+
attr_accessor :element
|
43
|
+
def initialize e
|
44
|
+
@element = e
|
45
45
|
end
|
46
|
-
def
|
47
|
-
|
48
|
-
|
49
|
-
|
46
|
+
def [] k
|
47
|
+
Hpricot.uxs((@element.raw_attributes || {})[k])
|
48
|
+
end
|
49
|
+
def []= k, v
|
50
|
+
(@element.raw_attributes ||= {})[k] = v.fast_xs
|
51
|
+
end
|
52
|
+
def to_hash
|
53
|
+
if @element.raw_attributes
|
54
|
+
@element.raw_attributes.inject({}) do |hsh, (k, v)|
|
50
55
|
hsh[k] = Hpricot.uxs(v)
|
51
56
|
hsh
|
52
57
|
end
|
@@ -54,6 +59,23 @@ module Hpricot
|
|
54
59
|
{}
|
55
60
|
end
|
56
61
|
end
|
62
|
+
def to_s
|
63
|
+
to_hash.to_s
|
64
|
+
end
|
65
|
+
def inspect
|
66
|
+
to_hash.inspect
|
67
|
+
end
|
68
|
+
end
|
69
|
+
|
70
|
+
class Elem
|
71
|
+
def initialize tag, attrs = nil, children = nil, etag = nil
|
72
|
+
self.name, self.raw_attributes, self.children, self.etag =
|
73
|
+
tag, attrs, children, etag
|
74
|
+
end
|
75
|
+
def empty?; children.nil? or children.empty? end
|
76
|
+
def attributes
|
77
|
+
Attributes.new self
|
78
|
+
end
|
57
79
|
def to_plain_text
|
58
80
|
if self.name == 'br'
|
59
81
|
"\n"
|
@@ -102,10 +124,7 @@ module Hpricot
|
|
102
124
|
class BogusETag
|
103
125
|
def initialize name; self.name = name end
|
104
126
|
def output(out, opts = {})
|
105
|
-
out <<
|
106
|
-
if_output(opts) do
|
107
|
-
"</#{name}>"
|
108
|
-
end
|
127
|
+
out << if_output(opts) { "" }
|
109
128
|
end
|
110
129
|
end
|
111
130
|
|
data/lib/hpricot/traverse.rb
CHANGED
data/lib/hpricot_scan.so
CHANGED
Binary file
|
data/test/test_alter.rb
CHANGED
@@ -1,3 +1,4 @@
|
|
1
|
+
# -*- coding: utf-8 -*-
|
1
2
|
#!/usr/bin/env ruby
|
2
3
|
|
3
4
|
require 'test/unit'
|
@@ -35,14 +36,22 @@ class TestAlter < Test::Unit::TestCase
|
|
35
36
|
end
|
36
37
|
|
37
38
|
def test_change_attributes
|
38
|
-
all_ps = (@basic/"p").attr("title", "Some Title")
|
39
|
+
all_ps = (@basic/"p").attr("title", "Some Title & Etc…")
|
39
40
|
all_as = (@basic/"a").attr("href", "http://my_new_href.com")
|
40
41
|
all_lb = (@basic/"link").attr("href") { |e| e.name }
|
41
|
-
assert_changed(@basic, "p", all_ps) {|p| p.
|
42
|
+
assert_changed(@basic, "p", all_ps) {|p| p.raw_attributes["title"] == "Some Title & Etc…"}
|
42
43
|
assert_changed(@basic, "a", all_as) {|a| a.attributes["href"] == "http://my_new_href.com"}
|
43
44
|
assert_changed(@basic, "link", all_lb) {|a| a.attributes["href"] == "link" }
|
44
45
|
end
|
45
46
|
|
47
|
+
def test_change_attributes2
|
48
|
+
all_as = (@basic%"a").attributes["href"] = "http://my_new_href.com"
|
49
|
+
all_ps = (@basic%"p").attributes["title"] = "Some Title & Etc…"
|
50
|
+
assert_equal (@basic%"a").raw_attributes["href"], "http://my_new_href.com"
|
51
|
+
assert_equal (@basic%"p").raw_attributes["title"], "Some Title & Etc…"
|
52
|
+
assert_equal (@basic%"p").attributes["title"], "Some Title & Etc…"
|
53
|
+
end
|
54
|
+
|
46
55
|
def test_remove_attr
|
47
56
|
all_rl = (@basic/"link").remove_attr("href")
|
48
57
|
assert_changed(@basic, "link", all_rl) { |link| link['href'].nil? }
|
@@ -70,6 +79,16 @@ class TestAlter < Test::Unit::TestCase
|
|
70
79
|
assert_equal frag.to_s, "<b><i>A bit of HTML</i></b><beanPole>gravity</beanPole>"
|
71
80
|
end
|
72
81
|
|
82
|
+
def test_reparent_empty_nodes
|
83
|
+
doc = Hpricot("<div/>")
|
84
|
+
doc.root.inner_html = "foo"
|
85
|
+
assert_equal doc.root.inner_html, "foo"
|
86
|
+
doc.root.inner_html = ""
|
87
|
+
assert_equal doc.root.inner_html, ""
|
88
|
+
doc.root.swap { b "test" }
|
89
|
+
assert_equal doc.root.inner_html, "test"
|
90
|
+
end
|
91
|
+
|
73
92
|
def assert_changed original, selector, set, &block
|
74
93
|
assert set.all?(&block)
|
75
94
|
assert Hpricot(original.to_html).search(selector).all?(&block)
|
data/test/test_parser.rb
CHANGED
@@ -227,6 +227,14 @@ class TestParser < Test::Unit::TestCase
|
|
227
227
|
assert_kind_of Hpricot::Elements, @boingboing.search('//div/p').search('a img')
|
228
228
|
end
|
229
229
|
|
230
|
+
def test_attr_casing
|
231
|
+
doc = Hpricot("<a HREF='a'>A simple <b>test</b> string.</a>")
|
232
|
+
assert_equal (doc % :a)[:href], "a"
|
233
|
+
assert_equal (doc % :a)[:HREF], nil
|
234
|
+
assert_equal (doc % :a)['href'], "a"
|
235
|
+
assert_equal (doc % :a)['HREF'], nil
|
236
|
+
end
|
237
|
+
|
230
238
|
def test_class_search
|
231
239
|
# test case sent by Chih-Chao Lam
|
232
240
|
doc = Hpricot("<div class=xyz'>abc</div>")
|
data/test/test_preserved.rb
CHANGED
@@ -5,6 +5,15 @@ require 'test/unit'
|
|
5
5
|
require 'hpricot'
|
6
6
|
require 'load_files'
|
7
7
|
|
8
|
+
unless "".respond_to?(:lines)
|
9
|
+
require 'enumerator'
|
10
|
+
class String
|
11
|
+
def lines
|
12
|
+
Enumerable::Enumerator.new(self, :each_line)
|
13
|
+
end
|
14
|
+
end
|
15
|
+
end
|
16
|
+
|
8
17
|
class TestPreserved < Test::Unit::TestCase
|
9
18
|
def assert_roundtrip str
|
10
19
|
doc = Hpricot(str)
|
@@ -53,6 +62,15 @@ class TestPreserved < Test::Unit::TestCase
|
|
53
62
|
assert_roundtrip TestFiles::CY0
|
54
63
|
end
|
55
64
|
|
65
|
+
def test_fixup_link
|
66
|
+
doc = %{<?xml version="1.0" encoding="UTF-8"?><rss><channel><link>ht</link></channel></rss>}
|
67
|
+
assert_roundtrip doc
|
68
|
+
assert_equal Hpricot(doc).to_s,
|
69
|
+
%{<?xml version="1.0" encoding="UTF-8"?><rss><channel><link />ht</channel></rss>}
|
70
|
+
assert_equal Hpricot.XML(doc).to_s,
|
71
|
+
%{<?xml version="1.0" encoding="UTF-8"?><rss><channel><link>ht</link></channel></rss>}
|
72
|
+
end
|
73
|
+
|
56
74
|
def test_escaping_of_attrs
|
57
75
|
# ampersands in URLs
|
58
76
|
str = %{<a href="http://google.com/search?q=hpricot&l=en">Google</a>}
|
metadata
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: hpricot
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 0.8.
|
4
|
+
version: 0.8.2
|
5
5
|
platform: x86-mswin32
|
6
6
|
authors:
|
7
7
|
- why the lucky stiff
|
@@ -9,7 +9,7 @@ autorequire:
|
|
9
9
|
bindir: bin
|
10
10
|
cert_chain: []
|
11
11
|
|
12
|
-
date: 2009-
|
12
|
+
date: 2009-11-05 00:00:00 -06:00
|
13
13
|
default_executable:
|
14
14
|
dependencies: []
|
15
15
|
|
@@ -28,56 +28,57 @@ files:
|
|
28
28
|
- COPYING
|
29
29
|
- README
|
30
30
|
- Rakefile
|
31
|
-
- test/
|
32
|
-
- test/
|
33
|
-
- test/test_parser.rb
|
34
|
-
- test/files
|
31
|
+
- test/files/basic.xhtml
|
32
|
+
- test/files/boingboing.html
|
35
33
|
- test/files/cy0.html
|
34
|
+
- test/files/immob.html
|
36
35
|
- test/files/pace_application.html
|
37
|
-
- test/files/
|
36
|
+
- test/files/tenderlove.html
|
37
|
+
- test/files/uswebgen.html
|
38
38
|
- test/files/utf8.html
|
39
|
-
- test/files/boingboing.html
|
40
39
|
- test/files/week9.html
|
41
|
-
- test/files/tenderlove.html
|
42
|
-
- test/files/immob.html
|
43
40
|
- test/files/why.xml
|
44
|
-
- test/files/uswebgen.html
|
45
41
|
- test/load_files.rb
|
46
42
|
- test/nokogiri-bench.rb
|
43
|
+
- test/test_alter.rb
|
47
44
|
- test/test_builder.rb
|
45
|
+
- test/test_parser.rb
|
46
|
+
- test/test_paths.rb
|
47
|
+
- test/test_preserved.rb
|
48
48
|
- test/test_xml.rb
|
49
|
-
-
|
50
|
-
- lib/hpricot
|
51
|
-
- lib/hpricot/tags.rb
|
49
|
+
- lib/hpricot/blankslate.rb
|
52
50
|
- lib/hpricot/builder.rb
|
53
|
-
- lib/hpricot/traverse.rb
|
54
51
|
- lib/hpricot/elements.rb
|
55
|
-
- lib/hpricot/
|
52
|
+
- lib/hpricot/htmlinfo.rb
|
56
53
|
- lib/hpricot/inspect.rb
|
54
|
+
- lib/hpricot/modules.rb
|
55
|
+
- lib/hpricot/parse.rb
|
57
56
|
- lib/hpricot/tag.rb
|
58
|
-
- lib/hpricot/
|
57
|
+
- lib/hpricot/tags.rb
|
58
|
+
- lib/hpricot/traverse.rb
|
59
59
|
- lib/hpricot/xchar.rb
|
60
|
-
- lib/hpricot/htmlinfo.rb
|
61
|
-
- lib/hpricot/parse.rb
|
62
60
|
- lib/hpricot.rb
|
63
61
|
- extras/mingw-rbconfig.rb
|
64
62
|
- ext/hpricot_scan/hpricot_scan.h
|
65
|
-
- ext/hpricot_scan/HpricotScanService.java
|
66
63
|
- ext/fast_xs/FastXsService.java
|
67
|
-
- ext/hpricot_scan/
|
68
|
-
- ext/hpricot_scan/
|
64
|
+
- ext/hpricot_scan/HpricotCss.java
|
65
|
+
- ext/hpricot_scan/HpricotScanService.java
|
69
66
|
- ext/fast_xs/fast_xs.c
|
70
|
-
- ext/hpricot_scan/
|
71
|
-
- ext/hpricot_scan/
|
67
|
+
- ext/hpricot_scan/hpricot_css.c
|
68
|
+
- ext/hpricot_scan/hpricot_scan.c
|
72
69
|
- ext/fast_xs/extconf.rb
|
73
|
-
- ext/hpricot_scan/
|
74
|
-
- ext/hpricot_scan/hpricot_scan.java.rl
|
75
|
-
- ext/hpricot_scan/hpricot_css.rl
|
70
|
+
- ext/hpricot_scan/extconf.rb
|
76
71
|
- ext/hpricot_scan/hpricot_common.rl
|
72
|
+
- ext/hpricot_scan/hpricot_css.java.rl
|
73
|
+
- ext/hpricot_scan/hpricot_css.rl
|
74
|
+
- ext/hpricot_scan/hpricot_scan.java.rl
|
75
|
+
- ext/hpricot_scan/hpricot_scan.rl
|
77
76
|
- lib/hpricot_scan.so
|
78
77
|
- lib/fast_xs.so
|
79
78
|
has_rdoc: true
|
80
79
|
homepage: http://code.whytheluckystiff.net/hpricot/
|
80
|
+
licenses: []
|
81
|
+
|
81
82
|
post_install_message:
|
82
83
|
rdoc_options:
|
83
84
|
- --quiet
|
@@ -103,9 +104,9 @@ required_rubygems_version: !ruby/object:Gem::Requirement
|
|
103
104
|
requirements: []
|
104
105
|
|
105
106
|
rubyforge_project: hobix
|
106
|
-
rubygems_version: 1.3.
|
107
|
+
rubygems_version: 1.3.5
|
107
108
|
signing_key:
|
108
|
-
specification_version:
|
109
|
+
specification_version: 3
|
109
110
|
summary: a swift, liberal HTML parser with a fantastic library
|
110
111
|
test_files: []
|
111
112
|
|
data/ext/hpricot_scan/test.rb
DELETED