iudex-html 1.7.0-java → 1.7.1-java

Sign up to get free protection for your applications and to get access to all the features.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
- SHA1:
3
- metadata.gz: 8562423f11f6ec337a56e96f9c0ee172fd789f65
4
- data.tar.gz: 206f0dbd3bb2055e0b600ff6f607943af79a56fe
2
+ SHA256:
3
+ metadata.gz: e579cd4b386446b5e5a8bfbb35f2dc1b4df53cf6a44822a45545029efe59ef17
4
+ data.tar.gz: 727c3391a2742d4d5a4bdfa7d421c7bb7e31c7439b04e1132fa13d23c625e896
5
5
  SHA512:
6
- metadata.gz: 55f5d8f05329a4f4fd2330c23b8a0f03eb518c71d4f847efa0d7d081cc43969851f37331a1264703b1f8dbb4ba99957623b6843a8987fc8962a1dee0b3c05bb4
7
- data.tar.gz: f07d067eee916aa6e63d321820c2a76bde6ca141a47dfe8c396f93b890547bf7f893f4d048e9bd034b756419b86e1798b7271b0ed0023aee4272139923edee3d
6
+ metadata.gz: 835028132ea61517091bbb3423032bf287d0bf4a57df91c7a067c9bd8e81d458df4e112b24bdbe8bd5a647ba922c8d4630aa2a3a488e318e904178de0c6c1b28
7
+ data.tar.gz: 261b78face3489ea9ac02aba008d41da4d2298041784892f174e03845409b32a476c086ad453788438f9e58fef96620e6246d52a4e60a5d1df4e563a4315b231
@@ -1,3 +1,8 @@
1
+ === 1.7.1 (2017-7-7)
2
+ * Fix for (jruby 9.x) require relative on build
3
+ * Add HTML.addTag and addAttr methods for application support of
4
+ non-standard tags in the wild.
5
+
1
6
  === 1.7.0 (2015-5-3)
2
7
  * Upgrade to iudex-* ~> 1.7 dependencies
3
8
 
@@ -25,4 +25,4 @@ test/test_parse_filter.rb
25
25
  test/test_stax_parser.rb
26
26
  test/test_tree_walker.rb
27
27
  test/test_word_counters.rb
28
- lib/iudex-html/iudex-html-1.7.0.jar
28
+ lib/iudex-html/iudex-html-1.7.1.jar
data/Rakefile CHANGED
@@ -9,7 +9,7 @@ RJack::TarPit.new( 'iudex-html' ).define_tasks
9
9
  file 'target/.tarpit' => [ 'src/main/java/iudex/html/HTML.java' ]
10
10
 
11
11
  file 'src/main/java/iudex/html/HTML.java' => FileList.new( "build/*" ) do
12
- require 'build/java_generate'
12
+ require_relative 'build/java_generate'
13
13
  puts "Generating HTML.java"
14
14
  JavaGenerator.new.run
15
15
  end
@@ -73,6 +73,21 @@ public class HTML
73
73
 
74
74
  % end
75
75
 
76
+ /**
77
+ * Return existing or add a new Tag by name and with basicAtts and
78
+ * flags to TAGS.
79
+ */
80
+ public static HTMLTag addTag( String name,
81
+ List<Attribute> basicAtts,
82
+ Flag...flags )
83
+ {
84
+ HTMLTag exists = TAGS.get( name );
85
+ if( exists != null ) {
86
+ return exists;
87
+ }
88
+ return tag( name, basicAtts, flags );
89
+ }
90
+
76
91
  private static HTMLTag tag( String name,
77
92
  List<Attribute> basicAtts,
78
93
  Flag...flags )
@@ -82,6 +97,18 @@ public class HTML
82
97
  return t;
83
98
  }
84
99
 
100
+ /**
101
+ * Return existing or add a new Attribute by name to ATTRIBUTES.
102
+ */
103
+ public static Attribute addAttr( String name )
104
+ {
105
+ Attribute exists = ATTRIBUTES.get( name );
106
+ if( exists != null ) {
107
+ return exists;
108
+ }
109
+ return attr( name );
110
+ }
111
+
85
112
  private static Attribute attr( String name )
86
113
  {
87
114
  Attribute a = new Attribute( name, NS_XHTML );
@@ -16,6 +16,6 @@
16
16
 
17
17
  module Iudex
18
18
  module HTML
19
- VERSION = '1.7.0'
19
+ VERSION = '1.7.1'
20
20
  end
21
21
  end
data/pom.xml CHANGED
@@ -3,7 +3,7 @@
3
3
  <groupId>iudex</groupId>
4
4
  <artifactId>iudex-html</artifactId>
5
5
  <packaging>jar</packaging>
6
- <version>1.7.0</version>
6
+ <version>1.7.1</version>
7
7
  <name>Iudex HTML parsing/filtering and text extraction</name>
8
8
 
9
9
  <parent>
metadata CHANGED
@@ -1,19 +1,19 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: iudex-html
3
3
  version: !ruby/object:Gem::Version
4
- version: 1.7.0
4
+ version: 1.7.1
5
5
  platform: java
6
6
  authors:
7
7
  - David Kellum
8
8
  autorequire:
9
9
  bindir: bin
10
10
  cert_chain: []
11
- date: 2015-05-04 00:00:00.000000000 Z
11
+ date: 2017-07-07 00:00:00.000000000 Z
12
12
  dependencies:
13
13
  - !ruby/object:Gem::Dependency
14
14
  requirement: !ruby/object:Gem::Requirement
15
15
  requirements:
16
- - - ~>
16
+ - - "~>"
17
17
  - !ruby/object:Gem::Version
18
18
  version: '1.7'
19
19
  name: iudex-core
@@ -21,13 +21,13 @@ dependencies:
21
21
  type: :runtime
22
22
  version_requirements: !ruby/object:Gem::Requirement
23
23
  requirements:
24
- - - ~>
24
+ - - "~>"
25
25
  - !ruby/object:Gem::Version
26
26
  version: '1.7'
27
27
  - !ruby/object:Gem::Dependency
28
28
  requirement: !ruby/object:Gem::Requirement
29
29
  requirements:
30
- - - ~>
30
+ - - "~>"
31
31
  - !ruby/object:Gem::Version
32
32
  version: 1.9.18
33
33
  name: rjack-nekohtml
@@ -35,13 +35,13 @@ dependencies:
35
35
  type: :runtime
36
36
  version_requirements: !ruby/object:Gem::Requirement
37
37
  requirements:
38
- - - ~>
38
+ - - "~>"
39
39
  - !ruby/object:Gem::Version
40
40
  version: 1.9.18
41
41
  - !ruby/object:Gem::Dependency
42
42
  requirement: !ruby/object:Gem::Requirement
43
43
  requirements:
44
- - - ~>
44
+ - - "~>"
45
45
  - !ruby/object:Gem::Version
46
46
  version: 1.7.0
47
47
  name: gravitext-xmlprod
@@ -49,13 +49,13 @@ dependencies:
49
49
  type: :runtime
50
50
  version_requirements: !ruby/object:Gem::Requirement
51
51
  requirements:
52
- - - ~>
52
+ - - "~>"
53
53
  - !ruby/object:Gem::Version
54
54
  version: 1.7.0
55
55
  - !ruby/object:Gem::Dependency
56
56
  requirement: !ruby/object:Gem::Requirement
57
57
  requirements:
58
- - - ~>
58
+ - - "~>"
59
59
  - !ruby/object:Gem::Version
60
60
  version: 4.7.4
61
61
  name: minitest
@@ -63,13 +63,13 @@ dependencies:
63
63
  type: :development
64
64
  version_requirements: !ruby/object:Gem::Requirement
65
65
  requirements:
66
- - - ~>
66
+ - - "~>"
67
67
  - !ruby/object:Gem::Version
68
68
  version: 4.7.4
69
69
  - !ruby/object:Gem::Dependency
70
70
  requirement: !ruby/object:Gem::Requirement
71
71
  requirements:
72
- - - ~>
72
+ - - "~>"
73
73
  - !ruby/object:Gem::Version
74
74
  version: '1.5'
75
75
  name: rjack-logback
@@ -77,13 +77,13 @@ dependencies:
77
77
  type: :development
78
78
  version_requirements: !ruby/object:Gem::Requirement
79
79
  requirements:
80
- - - ~>
80
+ - - "~>"
81
81
  - !ruby/object:Gem::Version
82
82
  version: '1.5'
83
83
  - !ruby/object:Gem::Dependency
84
84
  requirement: !ruby/object:Gem::Requirement
85
85
  requirements:
86
- - - ~>
86
+ - - "~>"
87
87
  - !ruby/object:Gem::Version
88
88
  version: '2.1'
89
89
  name: rjack-tarpit
@@ -91,10 +91,12 @@ dependencies:
91
91
  type: :development
92
92
  version_requirements: !ruby/object:Gem::Requirement
93
93
  requirements:
94
- - - ~>
94
+ - - "~>"
95
95
  - !ruby/object:Gem::Version
96
96
  version: '2.1'
97
- description: Iudex is a general purpose web crawler and feed processor in ruby/java. The iudex-html gem contains filters for HTML parsing, filtering, extracting text and links.
97
+ description: Iudex is a general purpose web crawler and feed processor in ruby/java.
98
+ The iudex-html gem contains filters for HTML parsing, filtering, extracting text
99
+ and links.
98
100
  email:
99
101
  - dek-oss@gravitext.com
100
102
  executables:
@@ -118,7 +120,7 @@ files:
118
120
  - lib/iudex-html.rb
119
121
  - lib/iudex-html/base.rb
120
122
  - lib/iudex-html/factory_helper.rb
121
- - lib/iudex-html/iudex-html-1.7.0.jar
123
+ - lib/iudex-html/iudex-html-1.7.1.jar
122
124
  - pom.xml
123
125
  - test/html_test_helper.rb
124
126
  - test/reddit.xhtml
@@ -139,23 +141,23 @@ licenses:
139
141
  metadata: {}
140
142
  post_install_message:
141
143
  rdoc_options:
142
- - --main
144
+ - "--main"
143
145
  - README.rdoc
144
146
  require_paths:
145
147
  - lib
146
148
  required_ruby_version: !ruby/object:Gem::Requirement
147
149
  requirements:
148
- - - '>='
150
+ - - ">="
149
151
  - !ruby/object:Gem::Version
150
152
  version: 1.8.7
151
153
  required_rubygems_version: !ruby/object:Gem::Requirement
152
154
  requirements:
153
- - - '>='
155
+ - - ">="
154
156
  - !ruby/object:Gem::Version
155
157
  version: '0'
156
158
  requirements: []
157
159
  rubyforge_project:
158
- rubygems_version: 2.4.5
160
+ rubygems_version: 2.6.11
159
161
  signing_key:
160
162
  specification_version: 4
161
163
  summary: Iudex is a general purpose web crawler and feed processor in ruby/java.