rfeedfinder 0.9.0 → 0.9.1
Sign up to get free protection for your applications and to get access to all the features.
- data/History.txt +7 -3
- data/lib/rfeedfinder/version.rb +1 -1
- data/lib/rfeedfinder.rb +10 -6
- data/test/test_rfeedfinder.rb +21 -17
- data/website/index.html +14 -63
- data/website/index.txt +14 -15
- metadata +2 -2
data/History.txt
CHANGED
data/lib/rfeedfinder/version.rb
CHANGED
data/lib/rfeedfinder.rb
CHANGED
@@ -1,4 +1,3 @@
|
|
1
|
-
require File.dirname(__FILE__) + '/rfeedfinder/version.rb'
|
2
1
|
require 'net/http'
|
3
2
|
require 'rubygems'
|
4
3
|
require 'open-uri'
|
@@ -88,14 +87,17 @@ module Rfeedfinder
|
|
88
87
|
return false
|
89
88
|
end
|
90
89
|
begin
|
90
|
+
data = Hpricot(open(uri), :xml => true)
|
91
|
+
rescue OpenURI::HTTPError
|
91
92
|
html = Net::HTTP.get(URI.parse(uri))
|
92
|
-
data = Hpricot(
|
93
|
-
return isFeedData?(data)
|
93
|
+
data = Hpricot(html, :xml => true)
|
94
94
|
rescue Timeout::Error
|
95
95
|
return false
|
96
96
|
rescue
|
97
97
|
return false
|
98
|
-
end
|
98
|
+
end
|
99
|
+
|
100
|
+
return isFeedData?(data)
|
99
101
|
end
|
100
102
|
|
101
103
|
def getFeedsFromSyndic8(uri)
|
@@ -118,12 +120,14 @@ module Rfeedfinder
|
|
118
120
|
fulluri = makeFullURI(uri)
|
119
121
|
|
120
122
|
begin
|
121
|
-
html = Net::HTTP.get(URI.parse(fulluri))
|
122
123
|
data = Hpricot(open(fulluri), :xml => true)
|
123
124
|
rescue Timeout::Error
|
124
125
|
return []
|
126
|
+
rescue OpenURI::HTTPError
|
127
|
+
html = Net::HTTP.get(URI.parse(fulluri))
|
128
|
+
data = Hpricot(html, :xml => true)
|
125
129
|
rescue => err
|
126
|
-
puts "Error while opening #{fulluri} with Hpricot: " << $!
|
130
|
+
puts "Error while opening #{fulluri} with Hpricot: #{err.class} " << $!
|
127
131
|
return []
|
128
132
|
end
|
129
133
|
|
data/test/test_rfeedfinder.rb
CHANGED
@@ -25,7 +25,7 @@ class TestRfeedfinder < Test::Unit::TestCase
|
|
25
25
|
"http://rss.jumpcut.com/rss/user?u_id=17C65AB8A6EF11DBBE093EF340157CF2"
|
26
26
|
end
|
27
27
|
|
28
|
-
def
|
28
|
+
def test_jumpcut_home
|
29
29
|
feed_finder "http://www.jumpcut.com/myhome/?u_id=DB9EC418FDAF11DB8198000423CEF5F6",
|
30
30
|
"http://rss.jumpcut.com/rss/user?u_id=db9ec418fdaf11db8198000423cef5f6"
|
31
31
|
end
|
@@ -35,6 +35,22 @@ class TestRfeedfinder < Test::Unit::TestCase
|
|
35
35
|
"http://rss.jumpcut.com/rss/user?u_id=db9ec418fdaf11db8198000423cef5f6"
|
36
36
|
end
|
37
37
|
|
38
|
+
def test_random_blogspot
|
39
|
+
feed_finder "http://organizandolaesperanza.blogspot.com"
|
40
|
+
feed_finder "http://skblackburn.blogspot.com/"
|
41
|
+
feed_finder "http://nadapersonal.blogspot.com"
|
42
|
+
feed_finder "http://diariodeunadislexica.blogspot.com/"
|
43
|
+
feed_finder "http://diputadodelosverdes.blogspot.com/"
|
44
|
+
feed_finder "http://cinclin.blogspot.com/"
|
45
|
+
feed_finder "http://claudiaramos.blogspot.com/"
|
46
|
+
end
|
47
|
+
|
48
|
+
def test_el_pais
|
49
|
+
feed_finder "http://lacomunidad.elpais.com/krismontesinos/"
|
50
|
+
feed_finder "http://lacomunidad.elpais.com/krismontesinos/posts"
|
51
|
+
feed_finder "http://lacomunidad.elpais.com/krismontesinos"
|
52
|
+
end
|
53
|
+
|
38
54
|
def test_from_feevy
|
39
55
|
feed_finder "http://www.becker-posner-blog.com/index.rdf"
|
40
56
|
feed_finder "http://www.slashdot.com", "http://rss.slashdot.org/Slashdot/slashdot"
|
@@ -44,15 +60,9 @@ class TestRfeedfinder < Test::Unit::TestCase
|
|
44
60
|
feed_finder "http://www.twitter.com/alx/"
|
45
61
|
feed_finder "http://alemama.blogspot.com"
|
46
62
|
feed_finder "http://seedmagazine.com/news/atom-focus.xml"
|
47
|
-
feed_finder "http://organizandolaesperanza.blogspot.com"
|
48
63
|
feed_finder "http://bitacora.feevy.com"
|
49
64
|
feed_finder "http://www.enriquemeneses.com/"
|
50
|
-
feed_finder "http://skblackburn.blogspot.com/"
|
51
65
|
feed_finder "http://ianasagasti.blogs.com/"
|
52
|
-
feed_finder "http://nadapersonal.blogspot.com"
|
53
|
-
feed_finder "http://lacomunidad.elpais.com/krismontesinos/"
|
54
|
-
feed_finder "http://lacomunidad.elpais.com/krismontesinos/posts"
|
55
|
-
feed_finder "http://lacomunidad.elpais.com/krismontesinos"
|
56
66
|
feed_finder "http://www.ecoperiodico.com/"
|
57
67
|
feed_finder "http://bloc.balearweb.net/rss.php?summary=1"
|
58
68
|
feed_finder "http://www.antoniobezanilla.com/"
|
@@ -61,26 +71,18 @@ class TestRfeedfinder < Test::Unit::TestCase
|
|
61
71
|
feed_finder "http://www.dosdedosdefrente.com/blog/"
|
62
72
|
feed_finder "http://www.deugarte.com/blog/fabbing/feed"
|
63
73
|
feed_finder "http://www.papelenblanco.com/autor/sergio-fernandez/rss2.xml"
|
64
|
-
feed_finder "http://www.fotolog.com/darth_fonsu/"
|
65
|
-
feed_finder "http://www.fotolog.com/darth_fonsu/feed/main/rss20"
|
66
|
-
feed_finder "http://www1.fotolog.com/mad_lux"
|
67
|
-
feed_finder "http://www1.fotolog.com/kel_06/"
|
68
74
|
feed_finder "http://sombra.lamatriz.org/"
|
69
75
|
feed_finder "http://tristezza0.spaces.live.com/", "http://tristezza0.spaces.live.com/feed.rss"
|
70
76
|
feed_finder "http://lacoctelera.com/macadamia"
|
71
|
-
feed_finder "http://diariodeunadislexica.blogspot.com/"
|
72
77
|
feed_finder "http://www.liberation.fr"
|
73
|
-
feed_finder "http://diputadodelosverdes.blogspot.com/"
|
74
78
|
feed_finder "http://juxtaprose.com/posts/good-web-20-critique/feed/"
|
75
79
|
feed_finder "http://www.gara.net/rss/kultura"
|
76
80
|
feed_finder "http://davicius.wordpress.com/feed/"
|
77
81
|
feed_finder "http://www.cato-at-liberty.org/wp-rss.php"
|
78
82
|
feed_finder "http://creando.bligoo.com/"
|
79
83
|
feed_finder "http://svn.37signals.com/", "http://feeds.feedburner.com/37signals/beMH"
|
80
|
-
feed_finder "http://cinclin.blogspot.com/"
|
81
84
|
feed_finder "http://www.takingitglobal.org/connections/tigblogs/feed.rss?UserID=251"
|
82
85
|
feed_finder "http://www.rubendomfer.com/blog/"
|
83
|
-
feed_finder "http://claudiaramos.blogspot.com/"
|
84
86
|
feed_finder "http://www.arfues.net/weblog/"
|
85
87
|
feed_finder "http://www.lkstro.com/"
|
86
88
|
feed_finder "http://www.lorenabetta.info"
|
@@ -90,9 +92,11 @@ class TestRfeedfinder < Test::Unit::TestCase
|
|
90
92
|
feed_finder "http://mephisto.sobrerailes.com/"
|
91
93
|
end
|
92
94
|
|
93
|
-
def
|
94
|
-
|
95
|
+
def test_fotolog
|
96
|
+
feed_finder "http://www.fotolog.com/darth_fonsu/"
|
97
|
+
feed_finder "http://www.fotolog.com/darth_fonsu/feed/main/rss20"
|
95
98
|
feed_finder "http://www1.fotolog.com/mad_lux", "http://www.fotolog.com/mad_lux/feed/main/rss20"
|
99
|
+
feed_finder "http://www1.fotolog.com/kel_06/"
|
96
100
|
end
|
97
101
|
|
98
102
|
def test_not_fulluri_link
|
data/website/index.html
CHANGED
@@ -33,15 +33,15 @@
|
|
33
33
|
<h1>rfeedfinder</h1>
|
34
34
|
<div id="version" class="clickable" onclick='document.location = "http://rubyforge.org/projects/rfeedfinder"; return false'>
|
35
35
|
<p>Get Version</p>
|
36
|
-
<a href="http://rubyforge.org/projects/rfeedfinder" class="numbers">0.9.
|
36
|
+
<a href="http://rubyforge.org/projects/rfeedfinder" class="numbers">0.9.1</a>
|
37
37
|
</div>
|
38
|
-
<
|
38
|
+
<h2>What</h2>
|
39
39
|
|
40
40
|
|
41
|
-
<
|
41
|
+
<p>rFeedFinder uses <span class="caps">RSS</span> autodiscovery, Atom autodiscovery, spidering, <span class="caps">URL</span> correction, and Web service queries (whatever it takes) to find the feed.</p>
|
42
42
|
|
43
43
|
|
44
|
-
<p>
|
44
|
+
<p>From <a href="http://www.aaronsw.com/2002/feedfinder/">Aaron Swartz feedfinder python lib</a>.</p>
|
45
45
|
|
46
46
|
|
47
47
|
<h2>Installing</h2>
|
@@ -49,69 +49,20 @@
|
|
49
49
|
|
50
50
|
<pre syntax="ruby">sudo gem install rfeedfinder</pre>
|
51
51
|
|
52
|
-
<h2>The basics</h2>
|
53
|
-
|
54
|
-
|
55
52
|
<h2>Demonstration of usage</h2>
|
56
53
|
|
57
54
|
|
58
|
-
<
|
59
|
-
|
60
|
-
<blockquote>
|
61
|
-
<p>require ‘rfeedfinder’</p>
|
62
|
-
|
63
|
-
</blockquote>
|
64
|
-
|
65
|
-
|
66
|
-
|
67
|
-
</blockquote>
|
68
|
-
|
69
|
-
|
70
|
-
|
71
|
-
</blockquote>
|
72
|
-
|
73
|
-
|
74
|
-
|
75
|
-
|
76
|
-
<blockquote>
|
77
|
-
<blockquote>
|
78
|
-
<blockquote>
|
79
|
-
<p>Rfeedfinder.feed(‘scripting.com’)
|
80
|
-
‘http://scripting.com/rss.xml’</p>
|
81
|
-
|
82
|
-
</blockquote>
|
83
|
-
|
84
|
-
|
85
|
-
|
86
|
-
</blockquote>
|
87
|
-
|
88
|
-
|
89
|
-
|
90
|
-
</blockquote>
|
91
|
-
|
92
|
-
|
93
|
-
|
94
|
-
|
95
|
-
<blockquote>
|
96
|
-
<blockquote>
|
97
|
-
<blockquote>
|
98
|
-
<p>Rfeedfinder.feeds(‘scripting.com’)
|
99
|
-
[‘http://delong.typepad.com/sdj/atom.xml’,
|
100
|
-
‘http://delong.typepad.com/sdj/index.rdf’,
|
101
|
-
‘http://delong.typepad.com/sdj/rss.xml’]</p>
|
102
|
-
|
103
|
-
</blockquote>
|
104
|
-
|
105
|
-
|
106
|
-
|
107
|
-
</blockquote>
|
108
|
-
|
109
|
-
|
110
|
-
|
111
|
-
</blockquote>
|
112
|
-
|
55
|
+
<pre syntax="ruby">
|
56
|
+
require 'rfeedfinder'
|
113
57
|
|
58
|
+
Rfeedfinder.feed('scripting.com')
|
59
|
+
# return String: 'http://scripting.com/rss.xml'
|
114
60
|
|
61
|
+
Rfeedfinder.feeds('scripting.com')
|
62
|
+
# return Array: ['http://delong.typepad.com/sdj/atom.xml',
|
63
|
+
# 'http://delong.typepad.com/sdj/index.rdf',
|
64
|
+
# 'http://delong.typepad.com/sdj/rss.xml']
|
65
|
+
</pre>
|
115
66
|
|
116
67
|
<h2>Forum</h2>
|
117
68
|
|
@@ -137,7 +88,7 @@
|
|
137
88
|
<h2>Contact</h2>
|
138
89
|
|
139
90
|
|
140
|
-
<p>Comments are welcome. Send an email to <a href="mailto:
|
91
|
+
<p>Comments are welcome. Send an email to <a href="mailto:alx.girard@gmail.com">Alexandre Girard</a>.</p>
|
141
92
|
<p class="coda">
|
142
93
|
<a href="mailto:drnicwilliams@gmail.com">Dr Nic</a>, 24th August 2007<br>
|
143
94
|
Theme extended from <a href="http://rb2js.rubyforge.org/">Paul Battley</a>
|
data/website/index.txt
CHANGED
@@ -1,30 +1,29 @@
|
|
1
1
|
h1. rfeedfinder
|
2
2
|
|
3
|
-
h1. → 'rfeedfinder'
|
4
|
-
|
5
|
-
|
6
3
|
h2. What
|
7
4
|
|
8
|
-
rFeedFinder uses RSS autodiscovery, Atom autodiscovery, spidering, URL correction, and Web service queries
|
5
|
+
rFeedFinder uses RSS autodiscovery, Atom autodiscovery, spidering, URL correction, and Web service queries (whatever it takes) to find the feed.
|
6
|
+
|
7
|
+
From "Aaron Swartz feedfinder python lib":http://www.aaronsw.com/2002/feedfinder/.
|
9
8
|
|
10
9
|
h2. Installing
|
11
10
|
|
12
11
|
<pre syntax="ruby">sudo gem install rfeedfinder</pre>
|
13
12
|
|
14
|
-
h2. The basics
|
15
|
-
|
16
|
-
|
17
13
|
h2. Demonstration of usage
|
18
14
|
|
19
|
-
|
15
|
+
<pre syntax="ruby">
|
16
|
+
require 'rfeedfinder'
|
17
|
+
|
18
|
+
Rfeedfinder.feed('scripting.com')
|
19
|
+
# return String: 'http://scripting.com/rss.xml'
|
20
20
|
|
21
|
-
|
22
|
-
'http://
|
21
|
+
Rfeedfinder.feeds('scripting.com')
|
22
|
+
# return Array: ['http://delong.typepad.com/sdj/atom.xml',
|
23
|
+
# 'http://delong.typepad.com/sdj/index.rdf',
|
24
|
+
# 'http://delong.typepad.com/sdj/rss.xml']
|
25
|
+
</pre>
|
23
26
|
|
24
|
-
>>> Rfeedfinder.feeds('scripting.com')
|
25
|
-
['http://delong.typepad.com/sdj/atom.xml',
|
26
|
-
'http://delong.typepad.com/sdj/index.rdf',
|
27
|
-
'http://delong.typepad.com/sdj/rss.xml']
|
28
27
|
|
29
28
|
h2. Forum
|
30
29
|
|
@@ -42,4 +41,4 @@ This code is free to use under the terms of the MIT license.
|
|
42
41
|
|
43
42
|
h2. Contact
|
44
43
|
|
45
|
-
Comments are welcome. Send an email to "
|
44
|
+
Comments are welcome. Send an email to "Alexandre Girard":mailto:alx.girard@gmail.com.
|
metadata
CHANGED
@@ -3,8 +3,8 @@ rubygems_version: 0.9.4
|
|
3
3
|
specification_version: 1
|
4
4
|
name: rfeedfinder
|
5
5
|
version: !ruby/object:Gem::Version
|
6
|
-
version: 0.9.
|
7
|
-
date: 2007-08-
|
6
|
+
version: 0.9.1
|
7
|
+
date: 2007-08-25 00:00:00 +02:00
|
8
8
|
summary: rFeedFinder uses RSS autodiscovery, Atom autodiscovery, spidering, URL correction, and Web service queries -- whatever it takes -- to find the feed.
|
9
9
|
require_paths:
|
10
10
|
- lib
|