scrapers 0.4.0 → 0.4.1

Sign up to get free protection for your applications and to get access to all the features.
@@ -1,326 +0,0 @@
1
- ---
2
- http_interactions:
3
- - request:
4
- method: get
5
- uri: http://apod.nasa.gov/apod/astropix.html
6
- body:
7
- encoding: US-ASCII
8
- string: ''
9
- headers:
10
- Accept-Encoding:
11
- - gzip,deflate,identity
12
- Accept:
13
- - '*/*'
14
- User-Agent:
15
- - Mechanize/2.7.2 Ruby/2.0.0p247 (http://github.com/sparklemotion/mechanize/)
16
- Accept-Charset:
17
- - ISO-8859-1,utf-8;q=0.7,*;q=0.7
18
- Accept-Language:
19
- - en-us,en;q=0.5
20
- Host:
21
- - apod.nasa.gov
22
- Connection:
23
- - keep-alive
24
- Keep-Alive:
25
- - 300
26
- response:
27
- status:
28
- code: 200
29
- message: OK
30
- headers:
31
- Date:
32
- - Sun, 29 Sep 2013 04:05:40 GMT
33
- Server:
34
- - WebServer/1.0
35
- Accept-Ranges:
36
- - bytes
37
- Content-Length:
38
- - '4683'
39
- Keep-Alive:
40
- - timeout=5, max=100
41
- Connection:
42
- - Keep-Alive
43
- Content-Type:
44
- - text/html; charset=ISO-8859-1
45
- body:
46
- encoding: UTF-8
47
- string: "<html>\n<head>\n<title>Astronomy Picture of the Day\n</title>\n<!--
48
- gsfc meta tags -->\n<meta name=\"orgcode\" content=\"661\">\n<meta name=\"rno\"
49
- content=\"phillip.a.newman\">\n<meta name=\"content-owner\" content=\"Jerry.T.Bonnell.1\">\n<meta
50
- name=\"webmaster\" content=\"Stephen.F.Fantasia.1\">\n<meta name=\"description\"
51
- content=\"A different astronomy and space science\nrelated image is featured
52
- each day, along with a brief explanation.\">\n<!-- -->\n<meta name=\"keywords\"
53
- content=\"Eagle Nebula, M16, dust pillar\">\n</head>\n<body BGCOLOR=\"#F4F4FF\"
54
- text=\"#000000\" link=\"#0000FF\" vlink=\"#7F0F9F\"\nalink=\"#FF0000\">\n\n<center>\n<h1>
55
- Astronomy Picture of the Day </h1>\n<p>\n\n<a href=\"archivepix.html\">Discover
56
- the cosmos!</a>\nEach day a different image or photograph of our fascinating
57
- universe is\nfeatured, along with a brief explanation written by a professional
58
- astronomer.\n<p>\n\n2013 September 29 \n<br> \n<a href=\"image/1309/fairypillar_hubble_900.jpg\">\n<IMG
59
- SRC=\"image/1309/fairypillar_hubble_900.jpg\"\nalt=\"See Explanation. Clicking
60
- on the picture will download\n the highest resolution version available.\"></a>\n</center>\n\n<center>\n<b>
61
- The Fairy of Eagle Nebula </b> <br> \n<b> Image Credit: </b> \n<a href=\n\"http://heritage.stsci.edu/commonpages/infoindex/ourproject/moreproject.html\"\n>The
62
- Hubble Heritage Team</a>,\n(<a href=\"http://www.stsci.edu/resources/\">STScI</a>/<a
63
- href=\"\nhttp://www.aura-astronomy.org/\">AURA</a>),\n<a href=\"http://www.esa.int/\">ESA</a>,\n<a
64
- href=\"http://www.nasa.gov/\">NASA</a>\n\n</center> <p> \n\n<b> Explanation:
65
- </b> \nThe dust sculptures of the Eagle Nebula are evaporating. \n\nAs powerful
66
- starlight whittles away these\n<a href=\"ap031228.html\">cool cosmic mountains</a>,
67
- the\n<a href=\"ap070218.html\">statuesque pillars</a> that remain\nmight be
68
- imagined as <a href=\n\"http://www.pantheon.org/areas/bestiary/\">mythical
69
- beasts</a>. \n\nPictured <a href=\n\"http://hubblesite.org/newscenter/newsdesk/archive/releases/2005/12/\"\n>above</a>
70
- is one of <a href=\"ap061022.html\">several striking\ndust pillars</a> of
71
- the\n<a href=\"http://en.wikipedia.org/wiki/Eagle_Nebula\">Eagle Nebula</a>\nthat
72
- might be described as a gigantic alien\n<a href=\"http://en.wikipedia.org/wiki/Fairies\">fairy</a>.
73
- \ \n\nThis fairy, however, is ten\n<a href=\"http://chandra.harvard.edu/photo/cosmic_distance.html\"\n>light
74
- years</a> tall and spews radiation much hotter than\n<a href=\"ap130901.html\">common
75
- fire</a>.\n\nThe <a href=\"ap041024.html\">greater Eagle Nebula</a>, M16,\nis
76
- actually a giant evaporating shell of gas and\n<a href=\"ap030706.html\">dust</a>
77
- inside of which is a growing\n<a href=\"http://kidshealth.org/kid/health_problems/teeth/cavity.html\"\n>cavity</a>
78
- filled with a spectacular stellar nursery currently forming an\n<a href=\"http://www.seds.org/messier/open.html\">open
79
- cluster</a> of stars. \n\nThe <a href=\"http://www.spacetelescope.org/images/html/heic0506b.html\"\n>above
80
- image</a> in scientifically re-assigned colors was\n<a href=\"http://heritage.stsci.edu/2005/12b/index.html\">released</a>\nin
81
- 2005 as part of the\n<a href=\"http://www.spacetelescope.org/news/html/heic0506.html\"\n>fifteenth
82
- anniversary celebration</a> of the\n<a href=\"ap021124.html\">launch</a> of
83
- the\n<a href=\"http://www.stsci.edu/hst/HST_overview/\">Hubble Space Telescope</a>.\n\n\n<p>
84
- <center> \n<b> Note: </b>\n<a href=\"http://asterisk.apod.com/viewtopic.php?f=28&t=32210\"\n>How
85
- to follow APOD if the US government shuts down.</a> <br>\n<b> Tomorrow's picture:
86
- </b>the green unknown\n\n<p> <hr>\n<a href=\"ap130928.html\">&lt;</a>\n| <a
87
- href=\"archivepix.html\">Archive</a>\n| <a href=\"lib/aptree.html\">Index</a>\n|
88
- <a href=\"http://antwrp.gsfc.nasa.gov/cgi-bin/apod/apod_search\">Search</a>\n|
89
- <a href=\"calendar/allyears.html\">Calendar</a>\n| <a href=\"/apod.rss\">RSS</a>\n|
90
- <a href=\"lib/edlinks.html\">Education</a>\n| <a href=\"lib/about_apod.html\">About
91
- APOD</a>\n| <a href=\n\"http://asterisk.apod.com/discuss_apod.php?date=130929\">Discuss</a>\n|
92
- <a href=\"ap130930.html\">&gt;</a>\n\n<hr><p>\n<b> Authors & editors: </b>\n<a
93
- href=\"http://www.phy.mtu.edu/faculty/Nemiroff.html\">Robert Nemiroff</a>\n(<a
94
- href=\"http://www.phy.mtu.edu/\">MTU</a>) &\n<a href=\"http://antwrp.gsfc.nasa.gov/htmltest/jbonnell/www/bonnell.html\"\n>Jerry
95
- Bonnell</a> (<a href=\"http://www.astro.umd.edu/\">UMCP</a>)<br>\n<b>NASA
96
- Official: </b> Phillip Newman\n<a href=\"lib/about_apod.html#srapply\">Specific
97
- rights apply</a>.<br>\n<a href=\"http://www.nasa.gov/about/highlights/HP_Privacy.html\">NASA
98
- Web\nPrivacy Policy and Important Notices</a><br>\n<b>A service of:</b>\n<a
99
- href=\"http://astrophysics.gsfc.nasa.gov/\">ASD</a> at\n<a href=\"http://www.nasa.gov/\">NASA</a>
100
- /\n<a href=\"http://www.nasa.gov/centers/goddard/\">GSFC</a>\n<br><b>&</b>
101
- <a href=\"http://www.mtu.edu/\">Michigan Tech. U.</a><br>\n</center>\n</body>\n</html>\n"
102
- http_version:
103
- recorded_at: Sun, 29 Sep 2013 04:05:40 GMT
104
- - request:
105
- method: get
106
- uri: http://apod.nasa.gov/apod/ap130928.html
107
- body:
108
- encoding: US-ASCII
109
- string: ''
110
- headers:
111
- Accept-Encoding:
112
- - gzip,deflate,identity
113
- Accept:
114
- - '*/*'
115
- User-Agent:
116
- - Mechanize/2.7.2 Ruby/2.0.0p247 (http://github.com/sparklemotion/mechanize/)
117
- Accept-Charset:
118
- - ISO-8859-1,utf-8;q=0.7,*;q=0.7
119
- Accept-Language:
120
- - en-us,en;q=0.5
121
- Host:
122
- - apod.nasa.gov
123
- Referer:
124
- - !ruby/object:URI::HTTP
125
- scheme: http
126
- user:
127
- password:
128
- host: apod.nasa.gov
129
- port: 80
130
- path: /apod/astropix.html
131
- query:
132
- opaque:
133
- registry:
134
- fragment:
135
- parser:
136
- Connection:
137
- - keep-alive
138
- Keep-Alive:
139
- - 300
140
- response:
141
- status:
142
- code: 200
143
- message: OK
144
- headers:
145
- Date:
146
- - Sun, 29 Sep 2013 04:05:40 GMT
147
- Server:
148
- - WebServer/1.0
149
- Accept-Ranges:
150
- - bytes
151
- Content-Length:
152
- - '4103'
153
- Keep-Alive:
154
- - timeout=5, max=100
155
- Connection:
156
- - Keep-Alive
157
- Content-Type:
158
- - text/html; charset=ISO-8859-1
159
- body:
160
- encoding: UTF-8
161
- string: "<html>\n<head>\n<title> APOD: 2013 September 28 - Equinox Earth \n</title>\n<!--
162
- gsfc meta tags -->\n<meta name=\"orgcode\" content=\"661\">\n<meta name=\"rno\"
163
- content=\"phillip.a.newman\">\n<meta name=\"content-owner\" content=\"Jerry.T.Bonnell.1\">\n<meta
164
- name=\"webmaster\" content=\"Stephen.F.Fantasia.1\">\n<meta name=\"description\"
165
- content=\"A different astronomy and space science\nrelated image is featured
166
- each day, along with a brief explanation.\">\n<!-- -->\n<meta name=\"keywords\"
167
- content=\"equinox, earth, elektro-l, geosynchronous\">\n</head>\n<body BGCOLOR=\"#F4F4FF\"
168
- text=\"#000000\" link=\"#0000FF\" vlink=\"#7F0F9F\"\nalink=\"#FF0000\">\n\n<center>\n<h1>
169
- Astronomy Picture of the Day </h1>\n<p>\n\n<a href=\"archivepix.html\">Discover
170
- the cosmos!</a>\nEach day a different image or photograph of our fascinating
171
- universe is\nfeatured, along with a brief explanation written by a professional
172
- astronomer.\n<p>\n\n2013 September 28\n<br>\n<a href=\"image/1309/EquinoxEarthElektroL900.jpg\">\n<IMG
173
- SRC=\"image/1309/EquinoxEarthElektroL800.jpg\"\nalt=\"See Explanation. Clicking
174
- on the picture will download\n the highest resolution version available.\"></a>\n</center>\n\n<center>\n<b>
175
- Equinox Earth </b> <br> \n\n<b> Image Credit: </b>\n\n<a href=\"http://roscosmos.ru/\">Roscosmos</a>
176
- / NTSOMZ /\n<a href=\"http://zelenyikot.livejournal.com/\n17213.html\">zelenyikot.livejournal.com</a>\n<br>\nCourtesy:\n<a
177
- href=\"mailto: tirsky at gmail dot com\">Igor Tirsky</a>,\n<a href=\"mailto:
178
- zelenyikoteyka at gmail dot com\">Vitaliy Egorov</a>\n\n</center> \n<p> \n\n<b>
179
- Explanation: </b>\n\nFrom a geostationary orbit 36,000 kilometers above the
180
- equator,\nRussian meteorological\n<a href=\"https://en.wikipedia.org/wiki/Elektro%E2%80%93L\">satellite\nElektro-L</a>
181
- takes high-resolution images\n<a href=\"http://www.planetary.org/blogs/guest-blogs/2013/\n20130723-beautiful-science-by-elektro-l.html\">our
182
- fair planet</a>\nevery 30 minutes.\n\nBut only twice\n<a href=\"ap130922.html\">a
183
- year</a>, during an Equinox, can it capture an image\nlike this one, showing
184
- an entire hemisphere bathed in sunlight.\n\n<a href=\"https://en.wikipedia.org/wiki/Equinox\">At
185
- an Equinox</a>,\nthe Earth's axis of rotation is not tilted toward or\naway
186
- from the Sun, so the\n<a href=\"http://earthobservatory.nasa.gov/IOTD/\nview.php?id=52248\">solar
187
- illumination can extend</a>\nto both the planet's poles.\n\nOf course,\nthis
188
- <a href=\"https://vk.com/electrol\">Elektro-L picture</a>\nwas recorded on
189
- September 22nd,\nat the northern hemisphere's autumnal equinox.\n\nFor a moment
190
- on that date, the Sun was behind\nthe <a href=\"ap100220.html\">geostationary
191
- satellite</a> and a\ntelltale glint of reflected sunlight is seen crossing
192
- the equator,\nat the location on the planet with satellite and sun directly
193
- overhead\n(<a href=\"image/1309/130921-600ElektroL.gif\">5MB animated gif</a>).\n\n<p>
194
- <center>\n<b> Tomorrow's picture: </b><a href=\"ap130929.html\">fairy big</a>\n\n<p>
195
- <hr>\n<a href=\"ap130927.html\">&lt;</a>\n| <a href=\"archivepix.html\">Archive</a>\n|
196
- <a href=\"lib/aptree.html\">Index</a>\n| <a href=\"http://antwrp.gsfc.nasa.gov/cgi-bin/apod/apod_search\">Search</a>\n|
197
- <a href=\"calendar/allyears.html\">Calendar</a>\n| <a href=\"/apod.rss\">RSS</a>\n|
198
- <a href=\"lib/edlinks.html\">Education</a>\n| <a href=\"lib/about_apod.html\">About
199
- APOD</a>\n| <a href=\n\"http://asterisk.apod.com/discuss_apod.php?date=130928\">Discuss</a>\n|
200
- <a href=\"ap130929.html\">&gt;</a>\n\n<hr><p>\n<b> Authors & editors: </b>\n<a
201
- href=\"http://www.phy.mtu.edu/faculty/Nemiroff.html\">Robert Nemiroff</a>\n(<a
202
- href=\"http://www.phy.mtu.edu/\">MTU</a>) &\n<a href=\"http://antwrp.gsfc.nasa.gov/htmltest/jbonnell/www/bonnell.html\"\n>Jerry
203
- Bonnell</a> (<a href=\"http://www.astro.umd.edu/\">UMCP</a>)<br>\n<b>NASA
204
- Official: </b> Phillip Newman\n<a href=\"lib/about_apod.html#srapply\">Specific
205
- rights apply</a>.<br>\n<a href=\"http://www.nasa.gov/about/highlights/HP_Privacy.html\">NASA
206
- Web\nPrivacy Policy and Important Notices</a><br>\n<b>A service of:</b>\n<a
207
- href=\"http://astrophysics.gsfc.nasa.gov/\">ASD</a> at\n<a href=\"http://www.nasa.gov/\">NASA</a>
208
- /\n<a href=\"http://www.nasa.gov/centers/goddard/\">GSFC</a>\n<br><b>&</b>
209
- <a href=\"http://www.mtu.edu/\">Michigan Tech. U.</a><br>\n</center>\n</body>\n</html>\n"
210
- http_version:
211
- recorded_at: Sun, 29 Sep 2013 04:05:40 GMT
212
- - request:
213
- method: get
214
- uri: http://apod.nasa.gov/apod/ap130929.html
215
- body:
216
- encoding: US-ASCII
217
- string: ''
218
- headers:
219
- Accept-Encoding:
220
- - gzip,deflate,identity
221
- Accept:
222
- - '*/*'
223
- User-Agent:
224
- - Mechanize/2.7.2 Ruby/2.0.0p247 (http://github.com/sparklemotion/mechanize/)
225
- Accept-Charset:
226
- - ISO-8859-1,utf-8;q=0.7,*;q=0.7
227
- Accept-Language:
228
- - en-us,en;q=0.5
229
- Host:
230
- - apod.nasa.gov
231
- Referer:
232
- - !ruby/object:URI::HTTP
233
- scheme: http
234
- user:
235
- password:
236
- host: apod.nasa.gov
237
- port: 80
238
- path: /apod/ap130928.html
239
- query:
240
- opaque:
241
- registry:
242
- fragment:
243
- parser:
244
- Connection:
245
- - keep-alive
246
- Keep-Alive:
247
- - 300
248
- response:
249
- status:
250
- code: 200
251
- message: OK
252
- headers:
253
- Date:
254
- - Sun, 29 Sep 2013 04:05:40 GMT
255
- Server:
256
- - WebServer/1.0
257
- Accept-Ranges:
258
- - bytes
259
- Content-Length:
260
- - '4736'
261
- Keep-Alive:
262
- - timeout=5, max=100
263
- Connection:
264
- - Keep-Alive
265
- Content-Type:
266
- - text/html; charset=ISO-8859-1
267
- body:
268
- encoding: UTF-8
269
- string: "<html>\n<head>\n<title> APOD: 2013 September 29 - The Fairy of Eagle
270
- Nebula \n</title>\n<!-- gsfc meta tags -->\n<meta name=\"orgcode\" content=\"661\">\n<meta
271
- name=\"rno\" content=\"phillip.a.newman\">\n<meta name=\"content-owner\" content=\"Jerry.T.Bonnell.1\">\n<meta
272
- name=\"webmaster\" content=\"Stephen.F.Fantasia.1\">\n<meta name=\"description\"
273
- content=\"A different astronomy and space science\nrelated image is featured
274
- each day, along with a brief explanation.\">\n<!-- -->\n<meta name=\"keywords\"
275
- content=\"Eagle Nebula, M16, dust pillar\">\n</head>\n<body BGCOLOR=\"#F4F4FF\"
276
- text=\"#000000\" link=\"#0000FF\" vlink=\"#7F0F9F\"\nalink=\"#FF0000\">\n\n<center>\n<h1>
277
- Astronomy Picture of the Day </h1>\n<p>\n\n<a href=\"archivepix.html\">Discover
278
- the cosmos!</a>\nEach day a different image or photograph of our fascinating
279
- universe is\nfeatured, along with a brief explanation written by a professional
280
- astronomer.\n<p>\n\n2013 September 29 \n<br> \n<a href=\"image/1309/fairypillar_hubble_900.jpg\">\n<IMG
281
- SRC=\"image/1309/fairypillar_hubble_900.jpg\"\nalt=\"See Explanation. Clicking
282
- on the picture will download\n the highest resolution version available.\"></a>\n</center>\n\n<center>\n<b>
283
- The Fairy of Eagle Nebula </b> <br> \n<b> Image Credit: </b> \n<a href=\n\"http://heritage.stsci.edu/commonpages/infoindex/ourproject/moreproject.html\"\n>The
284
- Hubble Heritage Team</a>,\n(<a href=\"http://www.stsci.edu/resources/\">STScI</a>/<a
285
- href=\"\nhttp://www.aura-astronomy.org/\">AURA</a>),\n<a href=\"http://www.esa.int/\">ESA</a>,\n<a
286
- href=\"http://www.nasa.gov/\">NASA</a>\n\n</center> <p> \n\n<b> Explanation:
287
- </b> \nThe dust sculptures of the Eagle Nebula are evaporating. \n\nAs powerful
288
- starlight whittles away these\n<a href=\"ap031228.html\">cool cosmic mountains</a>,
289
- the\n<a href=\"ap070218.html\">statuesque pillars</a> that remain\nmight be
290
- imagined as <a href=\n\"http://www.pantheon.org/areas/bestiary/\">mythical
291
- beasts</a>. \n\nPictured <a href=\n\"http://hubblesite.org/newscenter/newsdesk/archive/releases/2005/12/\"\n>above</a>
292
- is one of <a href=\"ap061022.html\">several striking\ndust pillars</a> of
293
- the\n<a href=\"http://en.wikipedia.org/wiki/Eagle_Nebula\">Eagle Nebula</a>\nthat
294
- might be described as a gigantic alien\n<a href=\"http://en.wikipedia.org/wiki/Fairies\">fairy</a>.
295
- \ \n\nThis fairy, however, is ten\n<a href=\"http://chandra.harvard.edu/photo/cosmic_distance.html\"\n>light
296
- years</a> tall and spews radiation much hotter than\n<a href=\"ap130901.html\">common
297
- fire</a>.\n\nThe <a href=\"ap041024.html\">greater Eagle Nebula</a>, M16,\nis
298
- actually a giant evaporating shell of gas and\n<a href=\"ap030706.html\">dust</a>
299
- inside of which is a growing\n<a href=\"http://kidshealth.org/kid/health_problems/teeth/cavity.html\"\n>cavity</a>
300
- filled with a spectacular stellar nursery currently forming an\n<a href=\"http://www.seds.org/messier/open.html\">open
301
- cluster</a> of stars. \n\nThe <a href=\"http://www.spacetelescope.org/images/html/heic0506b.html\"\n>above
302
- image</a> in scientifically re-assigned colors was\n<a href=\"http://heritage.stsci.edu/2005/12b/index.html\">released</a>\nin
303
- 2005 as part of the\n<a href=\"http://www.spacetelescope.org/news/html/heic0506.html\"\n>fifteenth
304
- anniversary celebration</a> of the\n<a href=\"ap021124.html\">launch</a> of
305
- the\n<a href=\"http://www.stsci.edu/hst/HST_overview/\">Hubble Space Telescope</a>.\n\n\n<p>
306
- <center> \n<b> Note: </b>\n<a href=\"http://asterisk.apod.com/viewtopic.php?f=28&t=32210\"\n>How
307
- to follow APOD if the US government shuts down.</a> <br>\n<b> Tomorrow's picture:
308
- </b><a href=\"ap130930.html\">the green unknown</a>\n\n<p> <hr>\n<a href=\"ap130928.html\">&lt;</a>\n|
309
- <a href=\"archivepix.html\">Archive</a>\n| <a href=\"lib/aptree.html\">Index</a>\n|
310
- <a href=\"http://antwrp.gsfc.nasa.gov/cgi-bin/apod/apod_search\">Search</a>\n|
311
- <a href=\"calendar/allyears.html\">Calendar</a>\n| <a href=\"/apod.rss\">RSS</a>\n|
312
- <a href=\"lib/edlinks.html\">Education</a>\n| <a href=\"lib/about_apod.html\">About
313
- APOD</a>\n| <a href=\n\"http://asterisk.apod.com/discuss_apod.php?date=130929\">Discuss</a>\n|
314
- <a href=\"ap130930.html\">&gt;</a>\n\n<hr><p>\n<b> Authors & editors: </b>\n<a
315
- href=\"http://www.phy.mtu.edu/faculty/Nemiroff.html\">Robert Nemiroff</a>\n(<a
316
- href=\"http://www.phy.mtu.edu/\">MTU</a>) &\n<a href=\"http://antwrp.gsfc.nasa.gov/htmltest/jbonnell/www/bonnell.html\"\n>Jerry
317
- Bonnell</a> (<a href=\"http://www.astro.umd.edu/\">UMCP</a>)<br>\n<b>NASA
318
- Official: </b> Phillip Newman\n<a href=\"lib/about_apod.html#srapply\">Specific
319
- rights apply</a>.<br>\n<a href=\"http://www.nasa.gov/about/highlights/HP_Privacy.html\">NASA
320
- Web\nPrivacy Policy and Important Notices</a><br>\n<b>A service of:</b>\n<a
321
- href=\"http://astrophysics.gsfc.nasa.gov/\">ASD</a> at\n<a href=\"http://www.nasa.gov/\">NASA</a>
322
- /\n<a href=\"http://www.nasa.gov/centers/goddard/\">GSFC</a>\n<br><b>&</b>
323
- <a href=\"http://www.mtu.edu/\">Michigan Tech. U.</a><br>\n</center>\n</body>\n</html>\n"
324
- http_version:
325
- recorded_at: Sun, 29 Sep 2013 04:05:40 GMT
326
- recorded_with: VCR 2.6.0