htmlclipping 0.1.4 → 0.1.5

Sign up to get free protection for your applications and to get access to all the features.
data/lib/htmlclipping.rb CHANGED
@@ -33,7 +33,7 @@
33
33
  require 'iconv'
34
34
 
35
35
  class HtmlClipping
36
- Version = '0.1.4'
36
+ Version = '0.1.5'
37
37
 
38
38
  # html:: The HTML of the referring web page.
39
39
  # referred_uri:: The URI that is being referred to.
@@ -187,6 +187,9 @@ class HtmlClipping
187
187
  %r{</?(acronym|nobr|abbr|strong|td|tt|small|em|img|font|span|input|hr|noscript|legend|address).*?>}im, ''
188
188
  )
189
189
  @detokenized.gsub!( %r{</?(b|i)(\s+.*?)?>}i, '' )
190
+ @detokenized.gsub!( %r{</?.*?>} ) do |match|
191
+ match =~ %r{</?(xhtml:)?(br|a)(\s.*?)?>}i ? match : ''
192
+ end
190
193
  substitute_links
191
194
  compact_brs
192
195
  @detokenized.gsub!( /\s+/, ' ' )
@@ -201,6 +204,7 @@ class HtmlClipping
201
204
  if ( a_att =~ /href=('|")?([^'" ]*)("|')?/i )
202
205
  href = $2
203
206
  href.gsub!( /("|')$/, '' )
207
+ href.strip!
204
208
  matches_self = ( href == @referred_uri )
205
209
  else
206
210
  matches_self = false
data/lib/htmlclipping.rb~ CHANGED
@@ -33,7 +33,7 @@
33
33
  require 'iconv'
34
34
 
35
35
  class HtmlClipping
36
- Version = '0.1.3'
36
+ Version = '0.1.4'
37
37
 
38
38
  # html:: The HTML of the referring web page.
39
39
  # referred_uri:: The URI that is being referred to.
@@ -187,6 +187,9 @@ class HtmlClipping
187
187
  %r{</?(acronym|nobr|abbr|strong|td|tt|small|em|img|font|span|input|hr|noscript|legend|address).*?>}im, ''
188
188
  )
189
189
  @detokenized.gsub!( %r{</?(b|i)(\s+.*?)?>}i, '' )
190
+ @detokenized.gsub!( %r{</?.*?>} ) do |match|
191
+ match =~ %r{</?(xhtml:)?(br|a)(\s.*?)?>}i ? match : ''
192
+ end
190
193
  substitute_links
191
194
  compact_brs
192
195
  @detokenized.gsub!( /\s+/, ' ' )
@@ -201,6 +204,7 @@ class HtmlClipping
201
204
  if ( a_att =~ /href=('|")?([^'" ]*)("|')?/i )
202
205
  href = $2
203
206
  href.gsub!( /("|')$/, '' )
207
+ href.strip!
204
208
  matches_self = ( href == @referred_uri )
205
209
  else
206
210
  matches_self = false
metadata CHANGED
@@ -3,8 +3,8 @@ rubygems_version: 0.8.6
3
3
  specification_version: 1
4
4
  name: htmlclipping
5
5
  version: !ruby/object:Gem::Version
6
- version: 0.1.4
7
- date: 2005-11-04
6
+ version: 0.1.5
7
+ date: 2005-12-25
8
8
  summary: HtmlClipping generates excerpts from an HTML page that has a link pointing to a particular URI.
9
9
  require_paths:
10
10
  - lib