rfeedfinder 0.9.0 → 0.9.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- data/History.txt +7 -3
- data/lib/rfeedfinder/version.rb +1 -1
- data/lib/rfeedfinder.rb +10 -6
- data/test/test_rfeedfinder.rb +21 -17
- data/website/index.html +14 -63
- data/website/index.txt +14 -15
- metadata +2 -2
data/History.txt
CHANGED
data/lib/rfeedfinder/version.rb
CHANGED
data/lib/rfeedfinder.rb
CHANGED
@@ -1,4 +1,3 @@
|
|
1
|
-
require File.dirname(__FILE__) + '/rfeedfinder/version.rb'
|
2
1
|
require 'net/http'
|
3
2
|
require 'rubygems'
|
4
3
|
require 'open-uri'
|
@@ -88,14 +87,17 @@ module Rfeedfinder
|
|
88
87
|
return false
|
89
88
|
end
|
90
89
|
begin
|
90
|
+
data = Hpricot(open(uri), :xml => true)
|
91
|
+
rescue OpenURI::HTTPError
|
91
92
|
html = Net::HTTP.get(URI.parse(uri))
|
92
|
-
data = Hpricot(
|
93
|
-
return isFeedData?(data)
|
93
|
+
data = Hpricot(html, :xml => true)
|
94
94
|
rescue Timeout::Error
|
95
95
|
return false
|
96
96
|
rescue
|
97
97
|
return false
|
98
|
-
end
|
98
|
+
end
|
99
|
+
|
100
|
+
return isFeedData?(data)
|
99
101
|
end
|
100
102
|
|
101
103
|
def getFeedsFromSyndic8(uri)
|
@@ -118,12 +120,14 @@ module Rfeedfinder
|
|
118
120
|
fulluri = makeFullURI(uri)
|
119
121
|
|
120
122
|
begin
|
121
|
-
html = Net::HTTP.get(URI.parse(fulluri))
|
122
123
|
data = Hpricot(open(fulluri), :xml => true)
|
123
124
|
rescue Timeout::Error
|
124
125
|
return []
|
126
|
+
rescue OpenURI::HTTPError
|
127
|
+
html = Net::HTTP.get(URI.parse(fulluri))
|
128
|
+
data = Hpricot(html, :xml => true)
|
125
129
|
rescue => err
|
126
|
-
puts "Error while opening #{fulluri} with Hpricot: " << $!
|
130
|
+
puts "Error while opening #{fulluri} with Hpricot: #{err.class} " << $!
|
127
131
|
return []
|
128
132
|
end
|
129
133
|
|
data/test/test_rfeedfinder.rb
CHANGED
@@ -25,7 +25,7 @@ class TestRfeedfinder < Test::Unit::TestCase
|
|
25
25
|
"http://rss.jumpcut.com/rss/user?u_id=17C65AB8A6EF11DBBE093EF340157CF2"
|
26
26
|
end
|
27
27
|
|
28
|
-
def
|
28
|
+
def test_jumpcut_home
|
29
29
|
feed_finder "http://www.jumpcut.com/myhome/?u_id=DB9EC418FDAF11DB8198000423CEF5F6",
|
30
30
|
"http://rss.jumpcut.com/rss/user?u_id=db9ec418fdaf11db8198000423cef5f6"
|
31
31
|
end
|
@@ -35,6 +35,22 @@ class TestRfeedfinder < Test::Unit::TestCase
|
|
35
35
|
"http://rss.jumpcut.com/rss/user?u_id=db9ec418fdaf11db8198000423cef5f6"
|
36
36
|
end
|
37
37
|
|
38
|
+
def test_random_blogspot
|
39
|
+
feed_finder "http://organizandolaesperanza.blogspot.com"
|
40
|
+
feed_finder "http://skblackburn.blogspot.com/"
|
41
|
+
feed_finder "http://nadapersonal.blogspot.com"
|
42
|
+
feed_finder "http://diariodeunadislexica.blogspot.com/"
|
43
|
+
feed_finder "http://diputadodelosverdes.blogspot.com/"
|
44
|
+
feed_finder "http://cinclin.blogspot.com/"
|
45
|
+
feed_finder "http://claudiaramos.blogspot.com/"
|
46
|
+
end
|
47
|
+
|
48
|
+
def test_el_pais
|
49
|
+
feed_finder "http://lacomunidad.elpais.com/krismontesinos/"
|
50
|
+
feed_finder "http://lacomunidad.elpais.com/krismontesinos/posts"
|
51
|
+
feed_finder "http://lacomunidad.elpais.com/krismontesinos"
|
52
|
+
end
|
53
|
+
|
38
54
|
def test_from_feevy
|
39
55
|
feed_finder "http://www.becker-posner-blog.com/index.rdf"
|
40
56
|
feed_finder "http://www.slashdot.com", "http://rss.slashdot.org/Slashdot/slashdot"
|
@@ -44,15 +60,9 @@ class TestRfeedfinder < Test::Unit::TestCase
|
|
44
60
|
feed_finder "http://www.twitter.com/alx/"
|
45
61
|
feed_finder "http://alemama.blogspot.com"
|
46
62
|
feed_finder "http://seedmagazine.com/news/atom-focus.xml"
|
47
|
-
feed_finder "http://organizandolaesperanza.blogspot.com"
|
48
63
|
feed_finder "http://bitacora.feevy.com"
|
49
64
|
feed_finder "http://www.enriquemeneses.com/"
|
50
|
-
feed_finder "http://skblackburn.blogspot.com/"
|
51
65
|
feed_finder "http://ianasagasti.blogs.com/"
|
52
|
-
feed_finder "http://nadapersonal.blogspot.com"
|
53
|
-
feed_finder "http://lacomunidad.elpais.com/krismontesinos/"
|
54
|
-
feed_finder "http://lacomunidad.elpais.com/krismontesinos/posts"
|
55
|
-
feed_finder "http://lacomunidad.elpais.com/krismontesinos"
|
56
66
|
feed_finder "http://www.ecoperiodico.com/"
|
57
67
|
feed_finder "http://bloc.balearweb.net/rss.php?summary=1"
|
58
68
|
feed_finder "http://www.antoniobezanilla.com/"
|
@@ -61,26 +71,18 @@ class TestRfeedfinder < Test::Unit::TestCase
|
|
61
71
|
feed_finder "http://www.dosdedosdefrente.com/blog/"
|
62
72
|
feed_finder "http://www.deugarte.com/blog/fabbing/feed"
|
63
73
|
feed_finder "http://www.papelenblanco.com/autor/sergio-fernandez/rss2.xml"
|
64
|
-
feed_finder "http://www.fotolog.com/darth_fonsu/"
|
65
|
-
feed_finder "http://www.fotolog.com/darth_fonsu/feed/main/rss20"
|
66
|
-
feed_finder "http://www1.fotolog.com/mad_lux"
|
67
|
-
feed_finder "http://www1.fotolog.com/kel_06/"
|
68
74
|
feed_finder "http://sombra.lamatriz.org/"
|
69
75
|
feed_finder "http://tristezza0.spaces.live.com/", "http://tristezza0.spaces.live.com/feed.rss"
|
70
76
|
feed_finder "http://lacoctelera.com/macadamia"
|
71
|
-
feed_finder "http://diariodeunadislexica.blogspot.com/"
|
72
77
|
feed_finder "http://www.liberation.fr"
|
73
|
-
feed_finder "http://diputadodelosverdes.blogspot.com/"
|
74
78
|
feed_finder "http://juxtaprose.com/posts/good-web-20-critique/feed/"
|
75
79
|
feed_finder "http://www.gara.net/rss/kultura"
|
76
80
|
feed_finder "http://davicius.wordpress.com/feed/"
|
77
81
|
feed_finder "http://www.cato-at-liberty.org/wp-rss.php"
|
78
82
|
feed_finder "http://creando.bligoo.com/"
|
79
83
|
feed_finder "http://svn.37signals.com/", "http://feeds.feedburner.com/37signals/beMH"
|
80
|
-
feed_finder "http://cinclin.blogspot.com/"
|
81
84
|
feed_finder "http://www.takingitglobal.org/connections/tigblogs/feed.rss?UserID=251"
|
82
85
|
feed_finder "http://www.rubendomfer.com/blog/"
|
83
|
-
feed_finder "http://claudiaramos.blogspot.com/"
|
84
86
|
feed_finder "http://www.arfues.net/weblog/"
|
85
87
|
feed_finder "http://www.lkstro.com/"
|
86
88
|
feed_finder "http://www.lorenabetta.info"
|
@@ -90,9 +92,11 @@ class TestRfeedfinder < Test::Unit::TestCase
|
|
90
92
|
feed_finder "http://mephisto.sobrerailes.com/"
|
91
93
|
end
|
92
94
|
|
93
|
-
def
|
94
|
-
|
95
|
+
def test_fotolog
|
96
|
+
feed_finder "http://www.fotolog.com/darth_fonsu/"
|
97
|
+
feed_finder "http://www.fotolog.com/darth_fonsu/feed/main/rss20"
|
95
98
|
feed_finder "http://www1.fotolog.com/mad_lux", "http://www.fotolog.com/mad_lux/feed/main/rss20"
|
99
|
+
feed_finder "http://www1.fotolog.com/kel_06/"
|
96
100
|
end
|
97
101
|
|
98
102
|
def test_not_fulluri_link
|
data/website/index.html
CHANGED
@@ -33,15 +33,15 @@
|
|
33
33
|
<h1>rfeedfinder</h1>
|
34
34
|
<div id="version" class="clickable" onclick='document.location = "http://rubyforge.org/projects/rfeedfinder"; return false'>
|
35
35
|
<p>Get Version</p>
|
36
|
-
<a href="http://rubyforge.org/projects/rfeedfinder" class="numbers">0.9.
|
36
|
+
<a href="http://rubyforge.org/projects/rfeedfinder" class="numbers">0.9.1</a>
|
37
37
|
</div>
|
38
|
-
<
|
38
|
+
<h2>What</h2>
|
39
39
|
|
40
40
|
|
41
|
-
<
|
41
|
+
<p>rFeedFinder uses <span class="caps">RSS</span> autodiscovery, Atom autodiscovery, spidering, <span class="caps">URL</span> correction, and Web service queries (whatever it takes) to find the feed.</p>
|
42
42
|
|
43
43
|
|
44
|
-
<p>
|
44
|
+
<p>From <a href="http://www.aaronsw.com/2002/feedfinder/">Aaron Swartz feedfinder python lib</a>.</p>
|
45
45
|
|
46
46
|
|
47
47
|
<h2>Installing</h2>
|
@@ -49,69 +49,20 @@
|
|
49
49
|
|
50
50
|
<pre syntax="ruby">sudo gem install rfeedfinder</pre>
|
51
51
|
|
52
|
-
<h2>The basics</h2>
|
53
|
-
|
54
|
-
|
55
52
|
<h2>Demonstration of usage</h2>
|
56
53
|
|
57
54
|
|
58
|
-
<
|
59
|
-
|
60
|
-
<blockquote>
|
61
|
-
<p>require ‘rfeedfinder’</p>
|
62
|
-
|
63
|
-
</blockquote>
|
64
|
-
|
65
|
-
|
66
|
-
|
67
|
-
</blockquote>
|
68
|
-
|
69
|
-
|
70
|
-
|
71
|
-
</blockquote>
|
72
|
-
|
73
|
-
|
74
|
-
|
75
|
-
|
76
|
-
<blockquote>
|
77
|
-
<blockquote>
|
78
|
-
<blockquote>
|
79
|
-
<p>Rfeedfinder.feed(‘scripting.com’)
|
80
|
-
‘http://scripting.com/rss.xml’</p>
|
81
|
-
|
82
|
-
</blockquote>
|
83
|
-
|
84
|
-
|
85
|
-
|
86
|
-
</blockquote>
|
87
|
-
|
88
|
-
|
89
|
-
|
90
|
-
</blockquote>
|
91
|
-
|
92
|
-
|
93
|
-
|
94
|
-
|
95
|
-
<blockquote>
|
96
|
-
<blockquote>
|
97
|
-
<blockquote>
|
98
|
-
<p>Rfeedfinder.feeds(‘scripting.com’)
|
99
|
-
[‘http://delong.typepad.com/sdj/atom.xml’,
|
100
|
-
‘http://delong.typepad.com/sdj/index.rdf’,
|
101
|
-
‘http://delong.typepad.com/sdj/rss.xml’]</p>
|
102
|
-
|
103
|
-
</blockquote>
|
104
|
-
|
105
|
-
|
106
|
-
|
107
|
-
</blockquote>
|
108
|
-
|
109
|
-
|
110
|
-
|
111
|
-
</blockquote>
|
112
|
-
|
55
|
+
<pre syntax="ruby">
|
56
|
+
require 'rfeedfinder'
|
113
57
|
|
58
|
+
Rfeedfinder.feed('scripting.com')
|
59
|
+
# return String: 'http://scripting.com/rss.xml'
|
114
60
|
|
61
|
+
Rfeedfinder.feeds('scripting.com')
|
62
|
+
# return Array: ['http://delong.typepad.com/sdj/atom.xml',
|
63
|
+
# 'http://delong.typepad.com/sdj/index.rdf',
|
64
|
+
# 'http://delong.typepad.com/sdj/rss.xml']
|
65
|
+
</pre>
|
115
66
|
|
116
67
|
<h2>Forum</h2>
|
117
68
|
|
@@ -137,7 +88,7 @@
|
|
137
88
|
<h2>Contact</h2>
|
138
89
|
|
139
90
|
|
140
|
-
<p>Comments are welcome. Send an email to <a href="mailto:
|
91
|
+
<p>Comments are welcome. Send an email to <a href="mailto:alx.girard@gmail.com">Alexandre Girard</a>.</p>
|
141
92
|
<p class="coda">
|
142
93
|
<a href="mailto:drnicwilliams@gmail.com">Dr Nic</a>, 24th August 2007<br>
|
143
94
|
Theme extended from <a href="http://rb2js.rubyforge.org/">Paul Battley</a>
|
data/website/index.txt
CHANGED
@@ -1,30 +1,29 @@
|
|
1
1
|
h1. rfeedfinder
|
2
2
|
|
3
|
-
h1. → 'rfeedfinder'
|
4
|
-
|
5
|
-
|
6
3
|
h2. What
|
7
4
|
|
8
|
-
rFeedFinder uses RSS autodiscovery, Atom autodiscovery, spidering, URL correction, and Web service queries
|
5
|
+
rFeedFinder uses RSS autodiscovery, Atom autodiscovery, spidering, URL correction, and Web service queries (whatever it takes) to find the feed.
|
6
|
+
|
7
|
+
From "Aaron Swartz feedfinder python lib":http://www.aaronsw.com/2002/feedfinder/.
|
9
8
|
|
10
9
|
h2. Installing
|
11
10
|
|
12
11
|
<pre syntax="ruby">sudo gem install rfeedfinder</pre>
|
13
12
|
|
14
|
-
h2. The basics
|
15
|
-
|
16
|
-
|
17
13
|
h2. Demonstration of usage
|
18
14
|
|
19
|
-
|
15
|
+
<pre syntax="ruby">
|
16
|
+
require 'rfeedfinder'
|
17
|
+
|
18
|
+
Rfeedfinder.feed('scripting.com')
|
19
|
+
# return String: 'http://scripting.com/rss.xml'
|
20
20
|
|
21
|
-
|
22
|
-
'http://
|
21
|
+
Rfeedfinder.feeds('scripting.com')
|
22
|
+
# return Array: ['http://delong.typepad.com/sdj/atom.xml',
|
23
|
+
# 'http://delong.typepad.com/sdj/index.rdf',
|
24
|
+
# 'http://delong.typepad.com/sdj/rss.xml']
|
25
|
+
</pre>
|
23
26
|
|
24
|
-
>>> Rfeedfinder.feeds('scripting.com')
|
25
|
-
['http://delong.typepad.com/sdj/atom.xml',
|
26
|
-
'http://delong.typepad.com/sdj/index.rdf',
|
27
|
-
'http://delong.typepad.com/sdj/rss.xml']
|
28
27
|
|
29
28
|
h2. Forum
|
30
29
|
|
@@ -42,4 +41,4 @@ This code is free to use under the terms of the MIT license.
|
|
42
41
|
|
43
42
|
h2. Contact
|
44
43
|
|
45
|
-
Comments are welcome. Send an email to "
|
44
|
+
Comments are welcome. Send an email to "Alexandre Girard":mailto:alx.girard@gmail.com.
|
metadata
CHANGED
@@ -3,8 +3,8 @@ rubygems_version: 0.9.4
|
|
3
3
|
specification_version: 1
|
4
4
|
name: rfeedfinder
|
5
5
|
version: !ruby/object:Gem::Version
|
6
|
-
version: 0.9.
|
7
|
-
date: 2007-08-
|
6
|
+
version: 0.9.1
|
7
|
+
date: 2007-08-25 00:00:00 +02:00
|
8
8
|
summary: rFeedFinder uses RSS autodiscovery, Atom autodiscovery, spidering, URL correction, and Web service queries -- whatever it takes -- to find the feed.
|
9
9
|
require_paths:
|
10
10
|
- lib
|