iudex-html 1.7.0-java → 1.7.1-java
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +5 -5
- data/History.rdoc +5 -0
- data/Manifest.txt +1 -1
- data/Rakefile +1 -1
- data/build/HTML.java.erb +27 -0
- data/lib/iudex-html/base.rb +1 -1
- data/lib/iudex-html/{iudex-html-1.7.0.jar → iudex-html-1.7.1.jar} +0 -0
- data/pom.xml +1 -1
- metadata +22 -20
checksums.yaml
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
---
|
2
|
-
|
3
|
-
metadata.gz:
|
4
|
-
data.tar.gz:
|
2
|
+
SHA256:
|
3
|
+
metadata.gz: e579cd4b386446b5e5a8bfbb35f2dc1b4df53cf6a44822a45545029efe59ef17
|
4
|
+
data.tar.gz: 727c3391a2742d4d5a4bdfa7d421c7bb7e31c7439b04e1132fa13d23c625e896
|
5
5
|
SHA512:
|
6
|
-
metadata.gz:
|
7
|
-
data.tar.gz:
|
6
|
+
metadata.gz: 835028132ea61517091bbb3423032bf287d0bf4a57df91c7a067c9bd8e81d458df4e112b24bdbe8bd5a647ba922c8d4630aa2a3a488e318e904178de0c6c1b28
|
7
|
+
data.tar.gz: 261b78face3489ea9ac02aba008d41da4d2298041784892f174e03845409b32a476c086ad453788438f9e58fef96620e6246d52a4e60a5d1df4e563a4315b231
|
data/History.rdoc
CHANGED
data/Manifest.txt
CHANGED
data/Rakefile
CHANGED
@@ -9,7 +9,7 @@ RJack::TarPit.new( 'iudex-html' ).define_tasks
|
|
9
9
|
file 'target/.tarpit' => [ 'src/main/java/iudex/html/HTML.java' ]
|
10
10
|
|
11
11
|
file 'src/main/java/iudex/html/HTML.java' => FileList.new( "build/*" ) do
|
12
|
-
|
12
|
+
require_relative 'build/java_generate'
|
13
13
|
puts "Generating HTML.java"
|
14
14
|
JavaGenerator.new.run
|
15
15
|
end
|
data/build/HTML.java.erb
CHANGED
@@ -73,6 +73,21 @@ public class HTML
|
|
73
73
|
|
74
74
|
% end
|
75
75
|
|
76
|
+
/**
|
77
|
+
* Return existing or add a new Tag by name and with basicAtts and
|
78
|
+
* flags to TAGS.
|
79
|
+
*/
|
80
|
+
public static HTMLTag addTag( String name,
|
81
|
+
List<Attribute> basicAtts,
|
82
|
+
Flag...flags )
|
83
|
+
{
|
84
|
+
HTMLTag exists = TAGS.get( name );
|
85
|
+
if( exists != null ) {
|
86
|
+
return exists;
|
87
|
+
}
|
88
|
+
return tag( name, basicAtts, flags );
|
89
|
+
}
|
90
|
+
|
76
91
|
private static HTMLTag tag( String name,
|
77
92
|
List<Attribute> basicAtts,
|
78
93
|
Flag...flags )
|
@@ -82,6 +97,18 @@ public class HTML
|
|
82
97
|
return t;
|
83
98
|
}
|
84
99
|
|
100
|
+
/**
|
101
|
+
* Return existing or add a new Attribute by name to ATTRIBUTES.
|
102
|
+
*/
|
103
|
+
public static Attribute addAttr( String name )
|
104
|
+
{
|
105
|
+
Attribute exists = ATTRIBUTES.get( name );
|
106
|
+
if( exists != null ) {
|
107
|
+
return exists;
|
108
|
+
}
|
109
|
+
return attr( name );
|
110
|
+
}
|
111
|
+
|
85
112
|
private static Attribute attr( String name )
|
86
113
|
{
|
87
114
|
Attribute a = new Attribute( name, NS_XHTML );
|
data/lib/iudex-html/base.rb
CHANGED
Binary file
|
data/pom.xml
CHANGED
metadata
CHANGED
@@ -1,19 +1,19 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: iudex-html
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 1.7.0
|
4
|
+
version: 1.7.1
|
5
5
|
platform: java
|
6
6
|
authors:
|
7
7
|
- David Kellum
|
8
8
|
autorequire:
|
9
9
|
bindir: bin
|
10
10
|
cert_chain: []
|
11
|
-
date:
|
11
|
+
date: 2017-07-07 00:00:00.000000000 Z
|
12
12
|
dependencies:
|
13
13
|
- !ruby/object:Gem::Dependency
|
14
14
|
requirement: !ruby/object:Gem::Requirement
|
15
15
|
requirements:
|
16
|
-
- - ~>
|
16
|
+
- - "~>"
|
17
17
|
- !ruby/object:Gem::Version
|
18
18
|
version: '1.7'
|
19
19
|
name: iudex-core
|
@@ -21,13 +21,13 @@ dependencies:
|
|
21
21
|
type: :runtime
|
22
22
|
version_requirements: !ruby/object:Gem::Requirement
|
23
23
|
requirements:
|
24
|
-
- - ~>
|
24
|
+
- - "~>"
|
25
25
|
- !ruby/object:Gem::Version
|
26
26
|
version: '1.7'
|
27
27
|
- !ruby/object:Gem::Dependency
|
28
28
|
requirement: !ruby/object:Gem::Requirement
|
29
29
|
requirements:
|
30
|
-
- - ~>
|
30
|
+
- - "~>"
|
31
31
|
- !ruby/object:Gem::Version
|
32
32
|
version: 1.9.18
|
33
33
|
name: rjack-nekohtml
|
@@ -35,13 +35,13 @@ dependencies:
|
|
35
35
|
type: :runtime
|
36
36
|
version_requirements: !ruby/object:Gem::Requirement
|
37
37
|
requirements:
|
38
|
-
- - ~>
|
38
|
+
- - "~>"
|
39
39
|
- !ruby/object:Gem::Version
|
40
40
|
version: 1.9.18
|
41
41
|
- !ruby/object:Gem::Dependency
|
42
42
|
requirement: !ruby/object:Gem::Requirement
|
43
43
|
requirements:
|
44
|
-
- - ~>
|
44
|
+
- - "~>"
|
45
45
|
- !ruby/object:Gem::Version
|
46
46
|
version: 1.7.0
|
47
47
|
name: gravitext-xmlprod
|
@@ -49,13 +49,13 @@ dependencies:
|
|
49
49
|
type: :runtime
|
50
50
|
version_requirements: !ruby/object:Gem::Requirement
|
51
51
|
requirements:
|
52
|
-
- - ~>
|
52
|
+
- - "~>"
|
53
53
|
- !ruby/object:Gem::Version
|
54
54
|
version: 1.7.0
|
55
55
|
- !ruby/object:Gem::Dependency
|
56
56
|
requirement: !ruby/object:Gem::Requirement
|
57
57
|
requirements:
|
58
|
-
- - ~>
|
58
|
+
- - "~>"
|
59
59
|
- !ruby/object:Gem::Version
|
60
60
|
version: 4.7.4
|
61
61
|
name: minitest
|
@@ -63,13 +63,13 @@ dependencies:
|
|
63
63
|
type: :development
|
64
64
|
version_requirements: !ruby/object:Gem::Requirement
|
65
65
|
requirements:
|
66
|
-
- - ~>
|
66
|
+
- - "~>"
|
67
67
|
- !ruby/object:Gem::Version
|
68
68
|
version: 4.7.4
|
69
69
|
- !ruby/object:Gem::Dependency
|
70
70
|
requirement: !ruby/object:Gem::Requirement
|
71
71
|
requirements:
|
72
|
-
- - ~>
|
72
|
+
- - "~>"
|
73
73
|
- !ruby/object:Gem::Version
|
74
74
|
version: '1.5'
|
75
75
|
name: rjack-logback
|
@@ -77,13 +77,13 @@ dependencies:
|
|
77
77
|
type: :development
|
78
78
|
version_requirements: !ruby/object:Gem::Requirement
|
79
79
|
requirements:
|
80
|
-
- - ~>
|
80
|
+
- - "~>"
|
81
81
|
- !ruby/object:Gem::Version
|
82
82
|
version: '1.5'
|
83
83
|
- !ruby/object:Gem::Dependency
|
84
84
|
requirement: !ruby/object:Gem::Requirement
|
85
85
|
requirements:
|
86
|
-
- - ~>
|
86
|
+
- - "~>"
|
87
87
|
- !ruby/object:Gem::Version
|
88
88
|
version: '2.1'
|
89
89
|
name: rjack-tarpit
|
@@ -91,10 +91,12 @@ dependencies:
|
|
91
91
|
type: :development
|
92
92
|
version_requirements: !ruby/object:Gem::Requirement
|
93
93
|
requirements:
|
94
|
-
- - ~>
|
94
|
+
- - "~>"
|
95
95
|
- !ruby/object:Gem::Version
|
96
96
|
version: '2.1'
|
97
|
-
description: Iudex is a general purpose web crawler and feed processor in ruby/java.
|
97
|
+
description: Iudex is a general purpose web crawler and feed processor in ruby/java.
|
98
|
+
The iudex-html gem contains filters for HTML parsing, filtering, exracting text
|
99
|
+
and links.
|
98
100
|
email:
|
99
101
|
- dek-oss@gravitext.com
|
100
102
|
executables:
|
@@ -118,7 +120,7 @@ files:
|
|
118
120
|
- lib/iudex-html.rb
|
119
121
|
- lib/iudex-html/base.rb
|
120
122
|
- lib/iudex-html/factory_helper.rb
|
121
|
-
- lib/iudex-html/iudex-html-1.7.0.jar
|
123
|
+
- lib/iudex-html/iudex-html-1.7.1.jar
|
122
124
|
- pom.xml
|
123
125
|
- test/html_test_helper.rb
|
124
126
|
- test/reddit.xhtml
|
@@ -139,23 +141,23 @@ licenses:
|
|
139
141
|
metadata: {}
|
140
142
|
post_install_message:
|
141
143
|
rdoc_options:
|
142
|
-
- --main
|
144
|
+
- "--main"
|
143
145
|
- README.rdoc
|
144
146
|
require_paths:
|
145
147
|
- lib
|
146
148
|
required_ruby_version: !ruby/object:Gem::Requirement
|
147
149
|
requirements:
|
148
|
-
- -
|
150
|
+
- - ">="
|
149
151
|
- !ruby/object:Gem::Version
|
150
152
|
version: 1.8.7
|
151
153
|
required_rubygems_version: !ruby/object:Gem::Requirement
|
152
154
|
requirements:
|
153
|
-
- -
|
155
|
+
- - ">="
|
154
156
|
- !ruby/object:Gem::Version
|
155
157
|
version: '0'
|
156
158
|
requirements: []
|
157
159
|
rubyforge_project:
|
158
|
-
rubygems_version: 2.
|
160
|
+
rubygems_version: 2.6.11
|
159
161
|
signing_key:
|
160
162
|
specification_version: 4
|
161
163
|
summary: Iudex is a general purpose web crawler and feed processor in ruby/java.
|