iudex-html 1.7.0-java → 1.7.1-java

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
- SHA1:
3
- metadata.gz: 8562423f11f6ec337a56e96f9c0ee172fd789f65
4
- data.tar.gz: 206f0dbd3bb2055e0b600ff6f607943af79a56fe
2
+ SHA256:
3
+ metadata.gz: e579cd4b386446b5e5a8bfbb35f2dc1b4df53cf6a44822a45545029efe59ef17
4
+ data.tar.gz: 727c3391a2742d4d5a4bdfa7d421c7bb7e31c7439b04e1132fa13d23c625e896
5
5
  SHA512:
6
- metadata.gz: 55f5d8f05329a4f4fd2330c23b8a0f03eb518c71d4f847efa0d7d081cc43969851f37331a1264703b1f8dbb4ba99957623b6843a8987fc8962a1dee0b3c05bb4
7
- data.tar.gz: f07d067eee916aa6e63d321820c2a76bde6ca141a47dfe8c396f93b890547bf7f893f4d048e9bd034b756419b86e1798b7271b0ed0023aee4272139923edee3d
6
+ metadata.gz: 835028132ea61517091bbb3423032bf287d0bf4a57df91c7a067c9bd8e81d458df4e112b24bdbe8bd5a647ba922c8d4630aa2a3a488e318e904178de0c6c1b28
7
+ data.tar.gz: 261b78face3489ea9ac02aba008d41da4d2298041784892f174e03845409b32a476c086ad453788438f9e58fef96620e6246d52a4e60a5d1df4e563a4315b231
@@ -1,3 +1,8 @@
1
+ === 1.7.1 (2017-7-7)
2
+ * Fix for (jruby 9.x) require relative on build
3
+ * Add HTML.addTag and addAttr methods for application support of
4
+ non-standard tags in the wild.
5
+
1
6
  === 1.7.0 (2015-5-3)
2
7
  * Upgrade to iudex-* ~> 1.7 dependencies
3
8
 
@@ -25,4 +25,4 @@ test/test_parse_filter.rb
25
25
  test/test_stax_parser.rb
26
26
  test/test_tree_walker.rb
27
27
  test/test_word_counters.rb
28
- lib/iudex-html/iudex-html-1.7.0.jar
28
+ lib/iudex-html/iudex-html-1.7.1.jar
data/Rakefile CHANGED
@@ -9,7 +9,7 @@ RJack::TarPit.new( 'iudex-html' ).define_tasks
9
9
  file 'target/.tarpit' => [ 'src/main/java/iudex/html/HTML.java' ]
10
10
 
11
11
  file 'src/main/java/iudex/html/HTML.java' => FileList.new( "build/*" ) do
12
- require 'build/java_generate'
12
+ require_relative 'build/java_generate'
13
13
  puts "Generating HTML.java"
14
14
  JavaGenerator.new.run
15
15
  end
@@ -73,6 +73,21 @@ public class HTML
73
73
 
74
74
  % end
75
75
 
76
+ /**
77
+ * Return existing or add a new Tag by name and with basicAtts and
78
+ * flags to TAGS.
79
+ */
80
+ public static HTMLTag addTag( String name,
81
+ List<Attribute> basicAtts,
82
+ Flag...flags )
83
+ {
84
+ HTMLTag exists = TAGS.get( name );
85
+ if( exists != null ) {
86
+ return exists;
87
+ }
88
+ return tag( name, basicAtts, flags );
89
+ }
90
+
76
91
  private static HTMLTag tag( String name,
77
92
  List<Attribute> basicAtts,
78
93
  Flag...flags )
@@ -82,6 +97,18 @@ public class HTML
82
97
  return t;
83
98
  }
84
99
 
100
+ /**
101
+ * Return existing or add a new Attribute by name to ATTRIBUTES.
102
+ */
103
+ public static Attribute addAttr( String name )
104
+ {
105
+ Attribute exists = ATTRIBUTES.get( name );
106
+ if( exists != null ) {
107
+ return exists;
108
+ }
109
+ return attr( name );
110
+ }
111
+
85
112
  private static Attribute attr( String name )
86
113
  {
87
114
  Attribute a = new Attribute( name, NS_XHTML );
@@ -16,6 +16,6 @@
16
16
 
17
17
  module Iudex
18
18
  module HTML
19
- VERSION = '1.7.0'
19
+ VERSION = '1.7.1'
20
20
  end
21
21
  end
data/pom.xml CHANGED
@@ -3,7 +3,7 @@
3
3
  <groupId>iudex</groupId>
4
4
  <artifactId>iudex-html</artifactId>
5
5
  <packaging>jar</packaging>
6
- <version>1.7.0</version>
6
+ <version>1.7.1</version>
7
7
  <name>Iudex HTML parsing/filtering and text extraction</name>
8
8
 
9
9
  <parent>
metadata CHANGED
@@ -1,19 +1,19 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: iudex-html
3
3
  version: !ruby/object:Gem::Version
4
- version: 1.7.0
4
+ version: 1.7.1
5
5
  platform: java
6
6
  authors:
7
7
  - David Kellum
8
8
  autorequire:
9
9
  bindir: bin
10
10
  cert_chain: []
11
- date: 2015-05-04 00:00:00.000000000 Z
11
+ date: 2017-07-07 00:00:00.000000000 Z
12
12
  dependencies:
13
13
  - !ruby/object:Gem::Dependency
14
14
  requirement: !ruby/object:Gem::Requirement
15
15
  requirements:
16
- - - ~>
16
+ - - "~>"
17
17
  - !ruby/object:Gem::Version
18
18
  version: '1.7'
19
19
  name: iudex-core
@@ -21,13 +21,13 @@ dependencies:
21
21
  type: :runtime
22
22
  version_requirements: !ruby/object:Gem::Requirement
23
23
  requirements:
24
- - - ~>
24
+ - - "~>"
25
25
  - !ruby/object:Gem::Version
26
26
  version: '1.7'
27
27
  - !ruby/object:Gem::Dependency
28
28
  requirement: !ruby/object:Gem::Requirement
29
29
  requirements:
30
- - - ~>
30
+ - - "~>"
31
31
  - !ruby/object:Gem::Version
32
32
  version: 1.9.18
33
33
  name: rjack-nekohtml
@@ -35,13 +35,13 @@ dependencies:
35
35
  type: :runtime
36
36
  version_requirements: !ruby/object:Gem::Requirement
37
37
  requirements:
38
- - - ~>
38
+ - - "~>"
39
39
  - !ruby/object:Gem::Version
40
40
  version: 1.9.18
41
41
  - !ruby/object:Gem::Dependency
42
42
  requirement: !ruby/object:Gem::Requirement
43
43
  requirements:
44
- - - ~>
44
+ - - "~>"
45
45
  - !ruby/object:Gem::Version
46
46
  version: 1.7.0
47
47
  name: gravitext-xmlprod
@@ -49,13 +49,13 @@ dependencies:
49
49
  type: :runtime
50
50
  version_requirements: !ruby/object:Gem::Requirement
51
51
  requirements:
52
- - - ~>
52
+ - - "~>"
53
53
  - !ruby/object:Gem::Version
54
54
  version: 1.7.0
55
55
  - !ruby/object:Gem::Dependency
56
56
  requirement: !ruby/object:Gem::Requirement
57
57
  requirements:
58
- - - ~>
58
+ - - "~>"
59
59
  - !ruby/object:Gem::Version
60
60
  version: 4.7.4
61
61
  name: minitest
@@ -63,13 +63,13 @@ dependencies:
63
63
  type: :development
64
64
  version_requirements: !ruby/object:Gem::Requirement
65
65
  requirements:
66
- - - ~>
66
+ - - "~>"
67
67
  - !ruby/object:Gem::Version
68
68
  version: 4.7.4
69
69
  - !ruby/object:Gem::Dependency
70
70
  requirement: !ruby/object:Gem::Requirement
71
71
  requirements:
72
- - - ~>
72
+ - - "~>"
73
73
  - !ruby/object:Gem::Version
74
74
  version: '1.5'
75
75
  name: rjack-logback
@@ -77,13 +77,13 @@ dependencies:
77
77
  type: :development
78
78
  version_requirements: !ruby/object:Gem::Requirement
79
79
  requirements:
80
- - - ~>
80
+ - - "~>"
81
81
  - !ruby/object:Gem::Version
82
82
  version: '1.5'
83
83
  - !ruby/object:Gem::Dependency
84
84
  requirement: !ruby/object:Gem::Requirement
85
85
  requirements:
86
- - - ~>
86
+ - - "~>"
87
87
  - !ruby/object:Gem::Version
88
88
  version: '2.1'
89
89
  name: rjack-tarpit
@@ -91,10 +91,12 @@ dependencies:
91
91
  type: :development
92
92
  version_requirements: !ruby/object:Gem::Requirement
93
93
  requirements:
94
- - - ~>
94
+ - - "~>"
95
95
  - !ruby/object:Gem::Version
96
96
  version: '2.1'
97
- description: Iudex is a general purpose web crawler and feed processor in ruby/java. The iudex-html gem contains filters for HTML parsing, filtering, exracting text and links.
97
+ description: Iudex is a general purpose web crawler and feed processor in ruby/java.
98
+ The iudex-html gem contains filters for HTML parsing, filtering, exracting text
99
+ and links.
98
100
  email:
99
101
  - dek-oss@gravitext.com
100
102
  executables:
@@ -118,7 +120,7 @@ files:
118
120
  - lib/iudex-html.rb
119
121
  - lib/iudex-html/base.rb
120
122
  - lib/iudex-html/factory_helper.rb
121
- - lib/iudex-html/iudex-html-1.7.0.jar
123
+ - lib/iudex-html/iudex-html-1.7.1.jar
122
124
  - pom.xml
123
125
  - test/html_test_helper.rb
124
126
  - test/reddit.xhtml
@@ -139,23 +141,23 @@ licenses:
139
141
  metadata: {}
140
142
  post_install_message:
141
143
  rdoc_options:
142
- - --main
144
+ - "--main"
143
145
  - README.rdoc
144
146
  require_paths:
145
147
  - lib
146
148
  required_ruby_version: !ruby/object:Gem::Requirement
147
149
  requirements:
148
- - - '>='
150
+ - - ">="
149
151
  - !ruby/object:Gem::Version
150
152
  version: 1.8.7
151
153
  required_rubygems_version: !ruby/object:Gem::Requirement
152
154
  requirements:
153
- - - '>='
155
+ - - ">="
154
156
  - !ruby/object:Gem::Version
155
157
  version: '0'
156
158
  requirements: []
157
159
  rubyforge_project:
158
- rubygems_version: 2.4.5
160
+ rubygems_version: 2.6.11
159
161
  signing_key:
160
162
  specification_version: 4
161
163
  summary: Iudex is a general purpose web crawler and feed processor in ruby/java.