open-uri-cached 0.0.1 → 0.0.3
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of open-uri-cached might be problematic. Click here for more details.
- data/lib/open-uri/cached.rb +62 -10
- metadata +14 -5
data/lib/open-uri/cached.rb
CHANGED
@@ -5,14 +5,8 @@ module OpenURI
|
|
5
5
|
class << self
|
6
6
|
alias original_open_uri open_uri #:nodoc:
|
7
7
|
def open_uri(uri, *rest, &block)
|
8
|
-
response = Cache.get(uri.to_s)
|
9
|
-
|
10
|
-
unless response
|
11
|
-
response = original_open_uri(uri, *rest).read
|
12
|
-
Cache.set(uri.to_s, response)
|
13
|
-
end
|
14
|
-
|
15
|
-
response = StringIO.new(response)
|
8
|
+
response = Cache.get(uri.to_s) ||
|
9
|
+
Cache.set(uri.to_s, original_open_uri(uri, *rest))
|
16
10
|
|
17
11
|
if block_given?
|
18
12
|
begin
|
@@ -30,16 +24,74 @@ module OpenURI
|
|
30
24
|
@cache_path = '/tmp/open-uri'
|
31
25
|
|
32
26
|
class << self
|
27
|
+
##
|
28
|
+
# Retrieve file content and meta data from cache
|
29
|
+
# @param [String] key
|
30
|
+
# @return [StringIO]
|
33
31
|
def get(key)
|
34
32
|
filename = filename_from_url(key)
|
35
33
|
# TODO: head request to determine last_modified vs file modtime
|
36
|
-
|
34
|
+
|
35
|
+
# Read metadata, if it exists
|
36
|
+
meta = YAML::load(File.read("#{filename}.meta")) if File.exists?("#{filename}.meta")
|
37
|
+
|
38
|
+
f = File.exists?(filename) ? StringIO.new(File.read(filename)) : nil
|
39
|
+
|
40
|
+
# Add meta accessors
|
41
|
+
if meta && f
|
42
|
+
f.instance_variable_set(:"@meta", meta)
|
43
|
+
|
44
|
+
def f.meta
|
45
|
+
@meta
|
46
|
+
end
|
47
|
+
def f.base_uri
|
48
|
+
@meta[:base_uri]
|
49
|
+
end
|
50
|
+
def f.content_type
|
51
|
+
@meta[:content_type]
|
52
|
+
end
|
53
|
+
def f.charset
|
54
|
+
@meta[:charset]
|
55
|
+
end
|
56
|
+
def f.content_encoding
|
57
|
+
@meta[:content_encoding]
|
58
|
+
end
|
59
|
+
def f.last_modified
|
60
|
+
@meta[:last_modified]
|
61
|
+
end
|
62
|
+
def f.status
|
63
|
+
@meta[:status]
|
64
|
+
end
|
65
|
+
end
|
66
|
+
|
67
|
+
f
|
37
68
|
end
|
38
69
|
|
70
|
+
# Cache file content and metadata
|
71
|
+
# @param [String] key
|
72
|
+
# URL of content to be cached
|
73
|
+
# @param [StringIO] value
|
74
|
+
# value to be cached, typically StringIO returned from `original_open_uri`
|
75
|
+
# @return [StringIO]
|
76
|
+
# Returns value
|
39
77
|
def set(key, value)
|
40
78
|
filename = filename_from_url(key)
|
41
79
|
mkpath(filename)
|
42
|
-
|
80
|
+
|
81
|
+
# Save metadata in a parallel file
|
82
|
+
if value.respond_to?(:meta)
|
83
|
+
filename_meta = "#{filename}.meta"
|
84
|
+
meta = value.meta
|
85
|
+
meta[:status] = value.status if value.respond_to?(:status)
|
86
|
+
meta[:content_type] = value.content_type if value.respond_to?(:content_type)
|
87
|
+
meta[:base_uri] = value.base_uri if value.respond_to?(:base_uri)
|
88
|
+
File.open(filename_meta, 'w') {|f| YAML::dump(meta, f)}
|
89
|
+
end
|
90
|
+
|
91
|
+
# Save file contents
|
92
|
+
File.open(filename, 'w'){|f| f.write value.read }
|
93
|
+
value.rewind
|
94
|
+
value
|
43
95
|
end
|
44
96
|
|
45
97
|
protected
|
metadata
CHANGED
@@ -1,7 +1,12 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: open-uri-cached
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
|
4
|
+
prerelease: false
|
5
|
+
segments:
|
6
|
+
- 0
|
7
|
+
- 0
|
8
|
+
- 3
|
9
|
+
version: 0.0.3
|
5
10
|
platform: ruby
|
6
11
|
authors:
|
7
12
|
- Danial Pearce
|
@@ -9,7 +14,7 @@ autorequire:
|
|
9
14
|
bindir: bin
|
10
15
|
cert_chain: []
|
11
16
|
|
12
|
-
date:
|
17
|
+
date: 2011-03-22 00:00:00 +11:00
|
13
18
|
default_executable:
|
14
19
|
dependencies: []
|
15
20
|
|
@@ -35,21 +40,25 @@ rdoc_options: []
|
|
35
40
|
require_paths:
|
36
41
|
- lib
|
37
42
|
required_ruby_version: !ruby/object:Gem::Requirement
|
43
|
+
none: false
|
38
44
|
requirements:
|
39
45
|
- - ">="
|
40
46
|
- !ruby/object:Gem::Version
|
47
|
+
segments:
|
48
|
+
- 0
|
41
49
|
version: "0"
|
42
|
-
version:
|
43
50
|
required_rubygems_version: !ruby/object:Gem::Requirement
|
51
|
+
none: false
|
44
52
|
requirements:
|
45
53
|
- - ">="
|
46
54
|
- !ruby/object:Gem::Version
|
55
|
+
segments:
|
56
|
+
- 0
|
47
57
|
version: "0"
|
48
|
-
version:
|
49
58
|
requirements: []
|
50
59
|
|
51
60
|
rubyforge_project:
|
52
|
-
rubygems_version: 1.3.
|
61
|
+
rubygems_version: 1.3.7
|
53
62
|
signing_key:
|
54
63
|
specification_version: 3
|
55
64
|
summary: Do a lot of site scraping but take lots of attempts at parsing the content before reaching your end result? This gem is for you. But wait, there's more... Ok, no there isn't.
|