ghazel-aws-s3 0.6.4
Sign up to get free protection for your applications and to get access to all the features.
- data/CHANGELOG +107 -0
- data/COPYING +19 -0
- data/INSTALL +55 -0
- data/Rakefile +344 -0
- data/bin/s3sh +6 -0
- data/bin/setup.rb +10 -0
- data/lib/aws/s3.rb +60 -0
- data/lib/aws/s3/acl.rb +636 -0
- data/lib/aws/s3/authentication.rb +221 -0
- data/lib/aws/s3/base.rb +240 -0
- data/lib/aws/s3/bittorrent.rb +58 -0
- data/lib/aws/s3/bucket.rb +319 -0
- data/lib/aws/s3/connection.rb +280 -0
- data/lib/aws/s3/error.rb +69 -0
- data/lib/aws/s3/exceptions.rb +133 -0
- data/lib/aws/s3/extensions.rb +356 -0
- data/lib/aws/s3/logging.rb +314 -0
- data/lib/aws/s3/object.rb +624 -0
- data/lib/aws/s3/owner.rb +44 -0
- data/lib/aws/s3/parsing.rb +99 -0
- data/lib/aws/s3/response.rb +180 -0
- data/lib/aws/s3/service.rb +51 -0
- data/lib/aws/s3/version.rb +11 -0
- metadata +77 -0
@@ -0,0 +1,221 @@
|
|
1
|
+
module AWS
|
2
|
+
module S3
|
3
|
+
# All authentication is taken care of for you by the AWS::S3 library. None the less, some details of the two types
|
4
|
+
# of authentication and when they are used may be of interest to some.
|
5
|
+
#
|
6
|
+
# === Header based authentication
|
7
|
+
#
|
8
|
+
# Header based authentication is achieved by setting a special <tt>Authorization</tt> header whose value
|
9
|
+
# is formatted like so:
|
10
|
+
#
|
11
|
+
# "AWS #{access_key_id}:#{encoded_canonical}"
|
12
|
+
#
|
13
|
+
# The <tt>access_key_id</tt> is the public key that is assigned by Amazon for a given account which you use when
|
14
|
+
# establishing your initial connection. The <tt>encoded_canonical</tt> is computed according to rules layed out
|
15
|
+
# by Amazon which we will describe presently.
|
16
|
+
#
|
17
|
+
# ==== Generating the encoded canonical string
|
18
|
+
#
|
19
|
+
# The "canonical string", generated by the CanonicalString class, is computed by collecting the current request method,
|
20
|
+
# a set of significant headers of the current request, and the current request path into a string.
|
21
|
+
# That canonical string is then encrypted with the <tt>secret_access_key</tt> assigned by Amazon. The resulting encrypted canonical
|
22
|
+
# string is then base 64 encoded.
|
23
|
+
#
|
24
|
+
# === Query string based authentication
|
25
|
+
#
|
26
|
+
# When accessing a restricted object from the browser, you can authenticate via the query string, by setting the following parameters:
|
27
|
+
#
|
28
|
+
# "AWSAccessKeyId=#{access_key_id}&Expires=#{expires}&Signature=#{encoded_canonical}"
|
29
|
+
#
|
30
|
+
# The QueryString class is responsible for generating the appropriate parameters for authentication via the
|
31
|
+
# query string.
|
32
|
+
#
|
33
|
+
# The <tt>access_key_id</tt> and <tt>encoded_canonical</tt> are the same as described in the Header based authentication section.
|
34
|
+
# The <tt>expires</tt> value dictates for how long the current url is valid (by default, it will expire in 5 minutes). Expiration can be specified
|
35
|
+
# either by an absolute time (expressed in seconds since the epoch), or in relative time (in number of seconds from now).
|
36
|
+
# Details of how to customize the expiration of the url are provided in the documentation for the QueryString class.
|
37
|
+
#
|
38
|
+
# All requests made by this library use header authentication. When a query string authenticated url is needed,
|
39
|
+
# the S3Object#url method will include the appropriate query string parameters.
|
40
|
+
#
|
41
|
+
# === Full authentication specification
|
42
|
+
#
|
43
|
+
# The full specification of the authentication protocol can be found at
|
44
|
+
# http://docs.amazonwebservices.com/AmazonS3/2006-03-01/RESTAuthentication.html
|
45
|
+
class Authentication
|
46
|
+
constant :AMAZON_HEADER_PREFIX, 'x-amz-'
|
47
|
+
|
48
|
+
# Signature is the abstract super class for the Header and QueryString authentication methods. It does the job
|
49
|
+
# of computing the canonical_string using the CanonicalString class as well as encoding the canonical string. The subclasses
|
50
|
+
# parameterize these computations and arrange them in a string form appropriate to how they are used, in one case a http request
|
51
|
+
# header value, and in the other case key/value query string parameter pairs.
|
52
|
+
class Signature < String #:nodoc:
|
53
|
+
attr_reader :request, :access_key_id, :secret_access_key, :options
|
54
|
+
|
55
|
+
def initialize(request, access_key_id, secret_access_key, options = {})
|
56
|
+
super()
|
57
|
+
@request, @access_key_id, @secret_access_key = request, access_key_id, secret_access_key
|
58
|
+
@options = options
|
59
|
+
end
|
60
|
+
|
61
|
+
private
|
62
|
+
|
63
|
+
def canonical_string
|
64
|
+
options = {}
|
65
|
+
options[:expires] = expires if expires?
|
66
|
+
CanonicalString.new(request, options)
|
67
|
+
end
|
68
|
+
memoized :canonical_string
|
69
|
+
|
70
|
+
def encoded_canonical
|
71
|
+
digest = OpenSSL::Digest::Digest.new('sha1')
|
72
|
+
b64_hmac = [OpenSSL::HMAC.digest(digest, secret_access_key, canonical_string)].pack("m").strip
|
73
|
+
url_encode? ? CGI.escape(b64_hmac) : b64_hmac
|
74
|
+
end
|
75
|
+
|
76
|
+
def url_encode?
|
77
|
+
!@options[:url_encode].nil?
|
78
|
+
end
|
79
|
+
|
80
|
+
def expires?
|
81
|
+
is_a? QueryString
|
82
|
+
end
|
83
|
+
|
84
|
+
def date
|
85
|
+
request['date'].to_s.strip.empty? ? Time.now : Time.parse(request['date'])
|
86
|
+
end
|
87
|
+
end
|
88
|
+
|
89
|
+
# Provides header authentication by computing the value of the Authorization header. More details about the
|
90
|
+
# various authentication schemes can be found in the docs for its containing module, Authentication.
|
91
|
+
class Header < Signature #:nodoc:
|
92
|
+
def initialize(*args)
|
93
|
+
super
|
94
|
+
self << "AWS #{access_key_id}:#{encoded_canonical}"
|
95
|
+
end
|
96
|
+
end
|
97
|
+
|
98
|
+
# Provides query string authentication by computing the three authorization parameters: AWSAccessKeyId, Expires and Signature.
|
99
|
+
# More details about the various authentication schemes can be found in the docs for its containing module, Authentication.
|
100
|
+
class QueryString < Signature #:nodoc:
|
101
|
+
constant :DEFAULT_EXPIRY, 300 # 5 minutes
|
102
|
+
def initialize(*args)
|
103
|
+
super
|
104
|
+
options[:url_encode] = true
|
105
|
+
self << build
|
106
|
+
end
|
107
|
+
|
108
|
+
private
|
109
|
+
|
110
|
+
# Will return one of three values, in the following order of precedence:
|
111
|
+
#
|
112
|
+
# 1) Seconds since the epoch explicitly passed in the +:expires+ option
|
113
|
+
# 2) The current time in seconds since the epoch plus the number of seconds passed in
|
114
|
+
# the +:expires_in+ option
|
115
|
+
# 3) The current time in seconds since the epoch plus the default number of seconds (60 seconds)
|
116
|
+
def expires
|
117
|
+
return options[:expires] if options[:expires]
|
118
|
+
date.to_i + expires_in
|
119
|
+
end
|
120
|
+
|
121
|
+
def expires_in
|
122
|
+
options.has_key?(:expires_in) ? Integer(options[:expires_in]) : DEFAULT_EXPIRY
|
123
|
+
end
|
124
|
+
|
125
|
+
# Keep in alphabetical order
|
126
|
+
def build
|
127
|
+
"AWSAccessKeyId=#{access_key_id}&Expires=#{expires}&Signature=#{encoded_canonical}"
|
128
|
+
end
|
129
|
+
end
|
130
|
+
|
131
|
+
# The CanonicalString is used to generate an encrypted signature, signed with your secrect access key. It is composed of
|
132
|
+
# data related to the given request for which it provides authentication. This data includes the request method, request headers,
|
133
|
+
# and the request path. Both Header and QueryString use it to generate their signature.
|
134
|
+
class CanonicalString < String #:nodoc:
|
135
|
+
class << self
|
136
|
+
def default_headers
|
137
|
+
%w(content-type content-md5)
|
138
|
+
end
|
139
|
+
|
140
|
+
def interesting_headers
|
141
|
+
['content-md5', 'content-type', 'date', amazon_header_prefix]
|
142
|
+
end
|
143
|
+
|
144
|
+
def amazon_header_prefix
|
145
|
+
/^#{AMAZON_HEADER_PREFIX}/io
|
146
|
+
end
|
147
|
+
end
|
148
|
+
|
149
|
+
attr_reader :request, :headers
|
150
|
+
|
151
|
+
def initialize(request, options = {})
|
152
|
+
super()
|
153
|
+
@request = request
|
154
|
+
@headers = {}
|
155
|
+
@options = options
|
156
|
+
# "For non-authenticated or anonymous requests. A NotImplemented error result code will be returned if
|
157
|
+
# an authenticated (signed) request specifies a Host: header other than 's3.amazonaws.com'"
|
158
|
+
# (from http://docs.amazonwebservices.com/AmazonS3/2006-03-01/VirtualHosting.html)
|
159
|
+
request['Host'] = DEFAULT_HOST
|
160
|
+
build
|
161
|
+
end
|
162
|
+
|
163
|
+
private
|
164
|
+
def build
|
165
|
+
self << "#{request.method}\n"
|
166
|
+
ensure_date_is_valid
|
167
|
+
|
168
|
+
initialize_headers
|
169
|
+
set_expiry!
|
170
|
+
|
171
|
+
headers.sort_by {|k, _| k}.each do |key, value|
|
172
|
+
value = value.to_s.strip
|
173
|
+
self << (key =~ self.class.amazon_header_prefix ? "#{key}:#{value}" : value)
|
174
|
+
self << "\n"
|
175
|
+
end
|
176
|
+
self << path
|
177
|
+
end
|
178
|
+
|
179
|
+
def initialize_headers
|
180
|
+
identify_interesting_headers
|
181
|
+
set_default_headers
|
182
|
+
end
|
183
|
+
|
184
|
+
def set_expiry!
|
185
|
+
self.headers['date'] = @options[:expires] if @options[:expires]
|
186
|
+
end
|
187
|
+
|
188
|
+
def ensure_date_is_valid
|
189
|
+
request['Date'] ||= Time.now.httpdate
|
190
|
+
end
|
191
|
+
|
192
|
+
def identify_interesting_headers
|
193
|
+
request.each do |key, value|
|
194
|
+
key = key.downcase # Can't modify frozen string so no bang
|
195
|
+
if self.class.interesting_headers.any? {|header| header === key}
|
196
|
+
self.headers[key] = value.to_s.strip
|
197
|
+
end
|
198
|
+
end
|
199
|
+
end
|
200
|
+
|
201
|
+
def set_default_headers
|
202
|
+
self.class.default_headers.each do |header|
|
203
|
+
self.headers[header] ||= ''
|
204
|
+
end
|
205
|
+
end
|
206
|
+
|
207
|
+
def path
|
208
|
+
[only_path, extract_significant_parameter].compact.join('?')
|
209
|
+
end
|
210
|
+
|
211
|
+
def extract_significant_parameter
|
212
|
+
request.path[/[&?](acl|torrent|logging)(?:&|=|$)/, 1]
|
213
|
+
end
|
214
|
+
|
215
|
+
def only_path
|
216
|
+
request.path[/^[^?]*/]
|
217
|
+
end
|
218
|
+
end
|
219
|
+
end
|
220
|
+
end
|
221
|
+
end
|
data/lib/aws/s3/base.rb
ADDED
@@ -0,0 +1,240 @@
|
|
1
|
+
module AWS #:nodoc:
|
2
|
+
# AWS::S3 is a Ruby library for Amazon's Simple Storage Service's REST API (http://aws.amazon.com/s3).
|
3
|
+
# Full documentation of the currently supported API can be found at http://docs.amazonwebservices.com/AmazonS3/2006-03-01.
|
4
|
+
#
|
5
|
+
# == Getting started
|
6
|
+
#
|
7
|
+
# To get started you need to require 'aws/s3':
|
8
|
+
#
|
9
|
+
# % irb -rubygems
|
10
|
+
# irb(main):001:0> require 'aws/s3'
|
11
|
+
# # => true
|
12
|
+
#
|
13
|
+
# The AWS::S3 library ships with an interactive shell called <tt>s3sh</tt>. From within it, you have access to all the operations the library exposes from the command line.
|
14
|
+
#
|
15
|
+
# % s3sh
|
16
|
+
# >> Version
|
17
|
+
#
|
18
|
+
# Before you can do anything, you must establish a connection using Base.establish_connection!. A basic connection would look something like this:
|
19
|
+
#
|
20
|
+
# AWS::S3::Base.establish_connection!(
|
21
|
+
# :access_key_id => 'abc',
|
22
|
+
# :secret_access_key => '123'
|
23
|
+
# )
|
24
|
+
#
|
25
|
+
# The minimum connection options that you must specify are your access key id and your secret access key.
|
26
|
+
#
|
27
|
+
# (If you don't already have your access keys, all you need to sign up for the S3 service is an account at Amazon. You can sign up for S3 and get access keys by visiting http://aws.amazon.com/s3.)
|
28
|
+
#
|
29
|
+
# For convenience, if you set two special environment variables with the value of your access keys, the console will automatically create a default connection for you. For example:
|
30
|
+
#
|
31
|
+
# % cat .amazon_keys
|
32
|
+
# export AMAZON_ACCESS_KEY_ID='abcdefghijklmnop'
|
33
|
+
# export AMAZON_SECRET_ACCESS_KEY='1234567891012345'
|
34
|
+
#
|
35
|
+
# Then load it in your shell's rc file.
|
36
|
+
#
|
37
|
+
# % cat .zshrc
|
38
|
+
# if [[ -f "$HOME/.amazon_keys" ]]; then
|
39
|
+
# source "$HOME/.amazon_keys";
|
40
|
+
# fi
|
41
|
+
#
|
42
|
+
# See more connection details at AWS::S3::Connection::Management::ClassMethods.
|
43
|
+
module S3
|
44
|
+
constant :DEFAULT_HOST, 's3.amazonaws.com'
|
45
|
+
|
46
|
+
# AWS::S3::Base is the abstract super class of all classes who make requests against S3, such as the built in
|
47
|
+
# Service, Bucket and S3Object classes. It provides methods for making requests, inferring or setting response classes,
|
48
|
+
# processing request options, and accessing attributes from S3's response data.
|
49
|
+
#
|
50
|
+
# Establishing a connection with the Base class is the entry point to using the library:
|
51
|
+
#
|
52
|
+
# AWS::S3::Base.establish_connection!(:access_key_id => '...', :secret_access_key => '...')
|
53
|
+
#
|
54
|
+
# The <tt>:access_key_id</tt> and <tt>:secret_access_key</tt> are the two required connection options. More
|
55
|
+
# details can be found in the docs for Connection::Management::ClassMethods.
|
56
|
+
#
|
57
|
+
# Extensive examples can be found in the README[link:files/README.html].
|
58
|
+
class Base
|
59
|
+
class << self
|
60
|
+
# Wraps the current connection's request method and picks the appropriate response class to wrap the response in.
|
61
|
+
# If the response is an error, it will raise that error as an exception. All such exceptions can be caught by rescuing
|
62
|
+
# their superclass, the ResponseError exception class.
|
63
|
+
#
|
64
|
+
# It is unlikely that you would call this method directly. Subclasses of Base have convenience methods for each http request verb
|
65
|
+
# that wrap calls to request.
|
66
|
+
def request(verb, path, options = {}, body = nil, attempts = 0, &block)
|
67
|
+
Service.response = nil
|
68
|
+
process_options!(options, verb)
|
69
|
+
response = response_class.new(connection.request(verb, path, options, body, attempts, &block))
|
70
|
+
Service.response = response
|
71
|
+
|
72
|
+
Error::Response.new(response.response).error.raise if response.error?
|
73
|
+
response
|
74
|
+
# Once in a while, a request to S3 returns an internal error. A glitch in the matrix I presume. Since these
|
75
|
+
# errors are few and far between the request method will rescue InternalErrors the first three times they encouter them
|
76
|
+
# and will retry the request again. Most of the time the second attempt will work.
|
77
|
+
rescue InternalError, RequestTimeout
|
78
|
+
if attempts == 3
|
79
|
+
raise
|
80
|
+
else
|
81
|
+
attempts += 1
|
82
|
+
retry
|
83
|
+
end
|
84
|
+
end
|
85
|
+
|
86
|
+
[:get, :post, :put, :delete, :head].each do |verb|
|
87
|
+
class_eval(<<-EVAL, __FILE__, __LINE__)
|
88
|
+
def #{verb}(path, headers = {}, body = nil, &block)
|
89
|
+
request(:#{verb}, path, headers, body, &block)
|
90
|
+
end
|
91
|
+
EVAL
|
92
|
+
end
|
93
|
+
|
94
|
+
# Called when a method which requires a bucket name is called without that bucket name specified. It will try to
|
95
|
+
# infer the current bucket by looking for it as the subdomain of the current connection's address. If no subdomain
|
96
|
+
# is found, CurrentBucketNotSpecified will be raised.
|
97
|
+
#
|
98
|
+
# MusicBucket.establish_connection! :server => 'jukeboxzero.s3.amazonaws.com'
|
99
|
+
# MusicBucket.connection.server
|
100
|
+
# => 'jukeboxzero.s3.amazonaws.com'
|
101
|
+
# MusicBucket.current_bucket
|
102
|
+
# => 'jukeboxzero'
|
103
|
+
#
|
104
|
+
# Rather than infering the current bucket from the subdomain, the current class' bucket can be explicitly set with
|
105
|
+
# set_current_bucket_to.
|
106
|
+
def current_bucket
|
107
|
+
connection.subdomain or raise CurrentBucketNotSpecified.new(connection.http.address)
|
108
|
+
end
|
109
|
+
|
110
|
+
# If you plan on always using a specific bucket for certain files, you can skip always having to specify the bucket by creating
|
111
|
+
# a subclass of Bucket or S3Object and telling it what bucket to use:
|
112
|
+
#
|
113
|
+
# class JukeBoxSong < AWS::S3::S3Object
|
114
|
+
# set_current_bucket_to 'jukebox'
|
115
|
+
# end
|
116
|
+
#
|
117
|
+
# For all methods that take a bucket name as an argument, the current bucket will be used if the bucket name argument is omitted.
|
118
|
+
#
|
119
|
+
# other_song = 'baby-please-come-home.mp3'
|
120
|
+
# JukeBoxSong.store(other_song, open(other_song))
|
121
|
+
#
|
122
|
+
# This time we didn't have to explicitly pass in the bucket name, as the JukeBoxSong class knows that it will
|
123
|
+
# always use the 'jukebox' bucket.
|
124
|
+
#
|
125
|
+
# "Astute readers", as they say, may have noticed that we used the third parameter to pass in the content type,
|
126
|
+
# rather than the fourth parameter as we had the last time we created an object. If the bucket can be inferred, or
|
127
|
+
# is explicitly set, as we've done in the JukeBoxSong class, then the third argument can be used to pass in
|
128
|
+
# options.
|
129
|
+
#
|
130
|
+
# Now all operations that would have required a bucket name no longer do.
|
131
|
+
#
|
132
|
+
# other_song = JukeBoxSong.find('baby-please-come-home.mp3')
|
133
|
+
def set_current_bucket_to(name)
|
134
|
+
raise ArgumentError, "`#{__method__}' must be called on a subclass of #{self.name}" if self == AWS::S3::Base
|
135
|
+
instance_eval(<<-EVAL)
|
136
|
+
def current_bucket
|
137
|
+
'#{name}'
|
138
|
+
end
|
139
|
+
EVAL
|
140
|
+
end
|
141
|
+
alias_method :current_bucket=, :set_current_bucket_to
|
142
|
+
|
143
|
+
private
|
144
|
+
|
145
|
+
def response_class
|
146
|
+
FindResponseClass.for(self)
|
147
|
+
end
|
148
|
+
|
149
|
+
def process_options!(options, verb)
|
150
|
+
options.replace(RequestOptions.process(options, verb))
|
151
|
+
end
|
152
|
+
|
153
|
+
# Using the conventions layed out in the <tt>response_class</tt> works for more than 80% of the time.
|
154
|
+
# There are a few edge cases though where we want a given class to wrap its responses in different
|
155
|
+
# response classes depending on which method is being called.
|
156
|
+
def respond_with(klass)
|
157
|
+
eval(<<-EVAL, binding, __FILE__, __LINE__)
|
158
|
+
def new_response_class
|
159
|
+
#{klass}
|
160
|
+
end
|
161
|
+
|
162
|
+
class << self
|
163
|
+
alias_method :old_response_class, :response_class
|
164
|
+
alias_method :response_class, :new_response_class
|
165
|
+
end
|
166
|
+
EVAL
|
167
|
+
|
168
|
+
yield
|
169
|
+
ensure
|
170
|
+
# Restore the original version
|
171
|
+
eval(<<-EVAL, binding, __FILE__, __LINE__)
|
172
|
+
class << self
|
173
|
+
alias_method :response_class, :old_response_class
|
174
|
+
end
|
175
|
+
EVAL
|
176
|
+
end
|
177
|
+
|
178
|
+
def bucket_name(name)
|
179
|
+
name || current_bucket
|
180
|
+
end
|
181
|
+
|
182
|
+
class RequestOptions < Hash #:nodoc:
|
183
|
+
attr_reader :options, :verb
|
184
|
+
|
185
|
+
class << self
|
186
|
+
def process(*args, &block)
|
187
|
+
new(*args, &block).process!
|
188
|
+
end
|
189
|
+
end
|
190
|
+
|
191
|
+
def initialize(options, verb = :get)
|
192
|
+
@options = options.to_normalized_options
|
193
|
+
@verb = verb
|
194
|
+
super()
|
195
|
+
end
|
196
|
+
|
197
|
+
def process!
|
198
|
+
set_access_controls! if verb == :put
|
199
|
+
replace(options)
|
200
|
+
end
|
201
|
+
|
202
|
+
private
|
203
|
+
def set_access_controls!
|
204
|
+
ACL::OptionProcessor.process!(options)
|
205
|
+
end
|
206
|
+
end
|
207
|
+
end
|
208
|
+
|
209
|
+
def initialize(attributes = {}) #:nodoc:
|
210
|
+
@attributes = attributes
|
211
|
+
end
|
212
|
+
|
213
|
+
private
|
214
|
+
attr_reader :attributes
|
215
|
+
|
216
|
+
def connection
|
217
|
+
self.class.connection
|
218
|
+
end
|
219
|
+
|
220
|
+
def http
|
221
|
+
connection.http
|
222
|
+
end
|
223
|
+
|
224
|
+
def request(*args, &block)
|
225
|
+
self.class.request(*args, &block)
|
226
|
+
end
|
227
|
+
|
228
|
+
def method_missing(method, *args, &block)
|
229
|
+
case
|
230
|
+
when attributes.has_key?(method.to_s)
|
231
|
+
attributes[method.to_s]
|
232
|
+
when attributes.has_key?(method)
|
233
|
+
attributes[method]
|
234
|
+
else
|
235
|
+
super
|
236
|
+
end
|
237
|
+
end
|
238
|
+
end
|
239
|
+
end
|
240
|
+
end
|