RubyGems - rack-cache - Versions diffs - 0.3.0 → 0.4 - Mend

rack-cache 0.3.0 → 0.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of rack-cache might be problematic. Click here for more details.

Files changed (44) hide show

data/CHANGES +43 -0
data/README +18 -9
data/Rakefile +1 -14
data/TODO +13 -14
data/doc/configuration.markdown +7 -153
data/doc/faq.markdown +8 -0
data/doc/index.markdown +7 -9
data/example/sinatra/app.rb +25 -0
data/example/sinatra/views/index.erb +44 -0
data/lib/rack/cache.rb +5 -11
data/lib/rack/cache/cachecontrol.rb +193 -0
data/lib/rack/cache/context.rb +190 -52
data/lib/rack/cache/entitystore.rb +10 -4
data/lib/rack/cache/key.rb +52 -0
data/lib/rack/cache/metastore.rb +52 -16
data/lib/rack/cache/options.rb +60 -39
data/lib/rack/cache/request.rb +11 -15
data/lib/rack/cache/response.rb +221 -30
data/lib/rack/cache/storage.rb +1 -2
data/rack-cache.gemspec +9 -15
data/test/cache_test.rb +9 -6
data/test/cachecontrol_test.rb +139 -0
data/test/context_test.rb +251 -169
data/test/entitystore_test.rb +12 -11
data/test/key_test.rb +50 -0
data/test/metastore_test.rb +57 -14
data/test/options_test.rb +11 -0
data/test/request_test.rb +19 -0
data/test/response_test.rb +164 -23
data/test/spec_setup.rb +7 -0
metadata +12 -20
data/doc/events.dot +0 -27
data/lib/rack/cache/config.rb +0 -65
data/lib/rack/cache/config/busters.rb +0 -16
data/lib/rack/cache/config/default.rb +0 -133
data/lib/rack/cache/config/no-cache.rb +0 -13
data/lib/rack/cache/core.rb +0 -299
data/lib/rack/cache/headers.rb +0 -325
data/lib/rack/utils/environment_headers.rb +0 -78
data/test/config_test.rb +0 -66
data/test/core_test.rb +0 -84
data/test/environment_headers_test.rb +0 -69
data/test/headers_test.rb +0 -298
data/test/logging_test.rb +0 -45

data/lib/rack/cache.rb CHANGED Viewed

@@ -1,10 +1,5 @@
-require 'fileutils'
-require 'time'
 require 'rack'
-module Rack #:nodoc:
-end
 # = HTTP Caching For Rack
 #
 # Rack::Cache is suitable as a quick, drop-in component to enable HTTP caching
@@ -15,7 +10,6 @@ end
 # * Freshness/expiration based caching and validation
 # * Supports HTTP Vary
 # * Portable: 100% Ruby / works with any Rack-enabled framework
-# * VCL-like configuration language for advanced caching policies
 # * Disk, memcached, and heap memory storage backends
 #
 # === Usage
@@ -32,12 +26,12 @@ end
 #     set :entitystore, 'file:/var/cache/rack'
 #   end
 #   run app
-#
 module Rack::Cache
-  require 'rack/cache/request'
-  require 'rack/cache/response'
-  require 'rack/cache/context'
-  require 'rack/cache/storage'
+  autoload :Request,      'rack/cache/request'
+  autoload :Response,     'rack/cache/response'
+  autoload :Context,      'rack/cache/context'
+  autoload :Storage,      'rack/cache/storage'
+  autoload :CacheControl, 'rack/cache/cachecontrol'
   # Create a new Rack::Cache middleware component that fetches resources from
   # the specified backend application. The +options+ Hash can be used to

data/lib/rack/cache/cachecontrol.rb ADDED Viewed

@@ -0,0 +1,193 @@
+module Rack
+  module Cache
+    # Parses a Cache-Control header and exposes the directives as a Hash.
+    # Directives that do not have values are set to +true+.
+    class CacheControl < Hash
+      def initialize(value=nil)
+        parse(value)
+      end
+      # Indicates that the response MAY be cached by any cache, even if it
+      # would normally be non-cacheable or cacheable only within a non-
+      # shared cache.
+      #
+      # A response may be considered public without this directive if the
+      # private directive is not set and the request does not include an
+      # Authorization header.
+      def public?
+        self['public']
+      end
+      # Indicates that all or part of the response message is intended for
+      # a single user and MUST NOT be cached by a shared cache. This
+      # allows an origin server to state that the specified parts of the
+      # response are intended for only one user and are not a valid
+      # response for requests by other users. A private (non-shared) cache
+      # MAY cache the response.
+      #
+      # Note: This usage of the word private only controls where the
+      # response may be cached, and cannot ensure the privacy of the
+      # message content.
+      def private?
+        self['private']
+      end
+      # When set in a response, a cache MUST NOT use the response to satisfy a
+      # subsequent request without successful revalidation with the origin
+      # server. This allows an origin server to prevent caching even by caches
+      # that have been configured to return stale responses to client requests.
+      #
+      # Note that this does not necessarily imply that the response may not be
+      # stored by the cache, only that the cache cannot serve it without first
+      # making a conditional GET request with the origin server.
+      #
+      # When set in a request, the server MUST NOT use a cached copy for its
+      # response. This has quite different semantics compared to the no-cache
+      # directive on responses. When the client specifies no-cache, it causes
+      # an end-to-end reload, forcing each cache to update their cached copies.
+      def no_cache?
+        self['no-cache']
+      end
+      # Indicates that the response MUST NOT be stored under any circumstances.
+      #
+      # The purpose of the no-store directive is to prevent the
+      # inadvertent release or retention of sensitive information (for
+      # example, on backup tapes). The no-store directive applies to the
+      # entire message, and MAY be sent either in a response or in a
+      # request. If sent in a request, a cache MUST NOT store any part of
+      # either this request or any response to it. If sent in a response,
+      # a cache MUST NOT store any part of either this response or the
+      # request that elicited it. This directive applies to both non-
+      # shared and shared caches. "MUST NOT store" in this context means
+      # that the cache MUST NOT intentionally store the information in
+      # non-volatile storage, and MUST make a best-effort attempt to
+      # remove the information from volatile storage as promptly as
+      # possible after forwarding it.
+      #
+      # The purpose of this directive is to meet the stated requirements
+      # of certain users and service authors who are concerned about
+      # accidental releases of information via unanticipated accesses to
+      # cache data structures. While the use of this directive might
+      # improve privacy in some cases, we caution that it is NOT in any
+      # way a reliable or sufficient mechanism for ensuring privacy. In
+      # particular, malicious or compromised caches might not recognize or
+      # obey this directive, and communications networks might be
+      # vulnerable to eavesdropping.
+      def no_store?
+        self['no-store']
+      end
+      # The expiration time of an entity MAY be specified by the origin
+      # server using the Expires header (see section 14.21). Alternatively,
+      # it MAY be specified using the max-age directive in a response. When
+      # the max-age cache-control directive is present in a cached response,
+      # the response is stale if its current age is greater than the age
+      # value given (in seconds) at the time of a new request for that
+      # resource. The max-age directive on a response implies that the
+      # response is cacheable (i.e., "public") unless some other, more
+      # restrictive cache directive is also present.
+      #
+      # If a response includes both an Expires header and a max-age
+      # directive, the max-age directive overrides the Expires header, even
+      # if the Expires header is more restrictive. This rule allows an origin
+      # server to provide, for a given response, a longer expiration time to
+      # an HTTP/1.1 (or later) cache than to an HTTP/1.0 cache. This might be
+      # useful if certain HTTP/1.0 caches improperly calculate ages or
+      # expiration times, perhaps due to desynchronized clocks.
+      #
+      # Many HTTP/1.0 cache implementations will treat an Expires value that
+      # is less than or equal to the response Date value as being equivalent
+      # to the Cache-Control response directive "no-cache". If an HTTP/1.1
+      # cache receives such a response, and the response does not include a
+      # Cache-Control header field, it SHOULD consider the response to be
+      # non-cacheable in order to retain compatibility with HTTP/1.0 servers.
+      #
+      # When the max-age directive is included in the request, it indicates
+      # that the client is willing to accept a response whose age is no
+      # greater than the specified time in seconds.
+      def max_age
+        self['max-age'].to_i  if key?('max-age')
+      end
+      # If a response includes an s-maxage directive, then for a shared
+      # cache (but not for a private cache), the maximum age specified by
+      # this directive overrides the maximum age specified by either the
+      # max-age directive or the Expires header. The s-maxage directive
+      # also implies the semantics of the proxy-revalidate directive, i.e.,
+      # that the shared cache must not use the entry after it becomes stale
+      # to respond to a subsequent request without first revalidating it with
+      # the origin server. The s-maxage directive is always ignored by a
+      # private cache.
+      def shared_max_age
+        self['s-maxage'].to_i  if key?('s-maxage')
+      end
+      alias_method :s_maxage, :shared_max_age
+      # Because a cache MAY be configured to ignore a server's specified
+      # expiration time, and because a client request MAY include a max-
+      # stale directive (which has a similar effect), the protocol also
+      # includes a mechanism for the origin server to require revalidation
+      # of a cache entry on any subsequent use. When the must-revalidate
+      # directive is present in a response received by a cache, that cache
+      # MUST NOT use the entry after it becomes stale to respond to a
+      # subsequent request without first revalidating it with the origin
+      # server. (I.e., the cache MUST do an end-to-end revalidation every
+      # time, if, based solely on the origin server's Expires or max-age
+      # value, the cached response is stale.)
+      #
+      # The must-revalidate directive is necessary to support reliable
+      # operation for certain protocol features. In all circumstances an
+      # HTTP/1.1 cache MUST obey the must-revalidate directive; in
+      # particular, if the cache cannot reach the origin server for any
+      # reason, it MUST generate a 504 (Gateway Timeout) response.
+      #
+      # Servers SHOULD send the must-revalidate directive if and only if
+      # failure to revalidate a request on the entity could result in
+      # incorrect operation, such as a silently unexecuted financial
+      # transaction. Recipients MUST NOT take any automated action that
+      # violates this directive, and MUST NOT automatically provide an
+      # unvalidated copy of the entity if revalidation fails.
+      def must_revalidate?
+        self['must-revalidate']
+      end
+      # The proxy-revalidate directive has the same meaning as the must-
+      # revalidate directive, except that it does not apply to non-shared
+      # user agent caches. It can be used on a response to an
+      # authenticated request to permit the user's cache to store and
+      # later return the response without needing to revalidate it (since
+      # it has already been authenticated once by that user), while still
+      # requiring proxies that service many users to revalidate each time
+      # (in order to make sure that each user has been authenticated).
+      # Note that such authenticated responses also need the public cache
+      # control directive in order to allow them to be cached at all.
+      def proxy_revalidate?
+        self['proxy-revalidate']
+      end
+      def to_s
+        bools, vals = [], []
+        each do |key,value|
+          if value == true
+            bools << key
+          elsif value
+            vals << "#{key}=#{value}"
+          end
+        end
+        (bools.sort + vals.sort).join(', ')
+      end
+    private
+      def parse(value)
+        return  if value.nil? || value.empty?
+        value.delete(' ').split(',').inject(self) do |hash,part|
+          name, value = part.split('=', 2)
+          hash[name.downcase] = (value || true) unless name.empty?
+          hash
+        end
+      end
+    end
+  end
+end

data/lib/rack/cache/context.rb CHANGED Viewed

@@ -1,40 +1,48 @@
-require 'rack/cache/config'
 require 'rack/cache/options'
-require 'rack/cache/core'
 require 'rack/cache/request'
 require 'rack/cache/response'
 require 'rack/cache/storage'
 module Rack::Cache
   # Implements Rack's middleware interface and provides the context for all
-  # cache logic. This class includes the Options, Config, and Core modules
-  # to provide much of its core functionality.
+  # cache logic, including the core logic engine.
   class Context
     include Rack::Cache::Options
-    include Rack::Cache::Config
-    include Rack::Cache::Core
+    # Array of trace Symbols
+    attr_reader :trace
     # The Rack application object immediately downstream.
     attr_reader :backend
-    def initialize(backend, options={}, &block)
-      @errors = nil
-      @env = nil
+    def initialize(backend, options={})
       @backend = backend
+      @trace = []
       initialize_options options
-      initialize_core
-      initialize_config(&block)
+      yield self if block_given?
+      @private_header_keys =
+        private_headers.map { |name| "HTTP_#{name.upcase.tr('-', '_')}" }
     end
-    # The call! method is invoked on the duplicate context instance.
-    # process_request is defined in Core.
-    alias_method :call!, :process_request
-    protected :call!
+    # The configured MetaStore instance. Changing the rack-cache.metastore
+    # value affects the result of this method immediately.
+    def metastore
+      uri = options['rack-cache.metastore']
+      storage.resolve_metastore_uri(uri)
+    end
+    # The configured EntityStore instance. Changing the rack-cache.entitystore
+    # value affects the result of this method immediately.
+    def entitystore
+      uri = options['rack-cache.entitystore']
+      storage.resolve_entitystore_uri(uri)
+    end
-    # The Rack call interface. The receiver acts as a prototype and runs each
-    # request in a duplicate object, unless the +rack.run_once+ variable is set
-    # in the environment.
+    # The Rack call interface. The receiver acts as a prototype and runs
+    # each request in a dup object unless the +rack.run_once+ variable is
+    # set in the environment.
     def call(env)
       if env['rack.run_once']
         call! env
@@ -43,53 +51,183 @@ module Rack::Cache
       end
     end
-  public
-    # IO-like object that receives log, warning, and error messages;
-    # defaults to the rack.errors environment variable.
-    def errors
-      @errors || (@env && (@errors = @env['rack.errors'])) || STDERR
+    # The real Rack call interface. The caching logic is performed within
+    # the context of the receiver.
+    def call!(env)
+      @trace = []
+      @env = @default_options.merge(env)
+      @request = Request.new(@env.dup.freeze)
+      response =
+        if @request.get? || @request.head?
+          if !@env['HTTP_EXPECT']
+            lookup
+          else
+            pass
+          end
+        else
+          invalidate
+        end
+      # log trace and set X-Rack-Cache tracing header
+      trace = @trace.join(', ')
+      response.headers['X-Rack-Cache'] = trace
+      # write log message to rack.errors
+      if verbose?
+        message = "cache: [%s %s] %s\n" %
+          [@request.request_method, @request.fullpath, trace]
+        @env['rack.errors'].write(message)
+      end
+      # tidy up response a bit
+      response.not_modified! if not_modified?(response)
+      response.body = [] if @request.head?
+      response.to_a
     end
-    # Set the output stream for log messages, warnings, and errors.
-    def errors=(ioish)
-      fail "stream must respond to :write" if ! ioish.respond_to?(:write)
-      @errors = ioish
+  private
+    # Record that an event took place.
+    def record(event)
+      @trace << event
     end
-    # The configured MetaStore instance. Changing the rack-cache.metastore
-    # environment variable affects the result of this method immediately.
-    def metastore
-      uri = options['rack-cache.metastore']
-      storage.resolve_metastore_uri(uri)
+    # Does the request include authorization or other sensitive information
+    # that should cause the response to be considered private by default?
+    # Private responses are not stored in the cache.
+    def private_request?
+      @private_header_keys.any? { |key| @env.key?(key) }
     end
-    # The configured EntityStore instance. Changing the rack-cache.entitystore
-    # environment variable effects the result of this method immediately.
-    def entitystore
-      uri = options['rack-cache.entitystore']
-      storage.resolve_entitystore_uri(uri)
+    # Determine if the #response validators (ETag, Last-Modified) match
+    # a conditional value specified in #request.
+    def not_modified?(response)
+      response.etag_matches?(@request.env['HTTP_IF_NONE_MATCH']) ||
+        response.last_modified_at?(@request.env['HTTP_IF_MODIFIED_SINCE'])
     end
-  protected
-    # Write a log message to the errors stream. +level+ is a symbol
-    # such as :error, :warn, :info, or :trace.
-    def log(level, message=nil, *params)
-      errors.write("[cache] #{level}: #{message}\n" % params)
-      errors.flush
+    # Whether the cache entry is "fresh enough" to satisfy the request.
+    def fresh_enough?(entry)
+      if entry.fresh?
+        if allow_revalidate? && max_age = @request.cache_control.max_age
+          max_age > 0 && max_age >= entry.age
+        else
+          true
+        end
+      end
     end
-    def info(*message, &bk)
-      log :info, *message, &bk
+    # Delegate the request to the backend and create the response.
+    def forward
+      Response.new(*backend.call(@env))
     end
-    def warn(*message, &bk)
-      log :warn, *message, &bk
+    # The request is sent to the backend, and the backend's response is sent
+    # to the client, but is not entered into the cache.
+    def pass
+      record :pass
+      forward
     end
-    def trace(*message, &bk)
-      return unless verbose?
-      log :trace, *message, &bk
+    # Invalidate POST, PUT, DELETE and all methods not understood by this cache
+    # See RFC2616 13.10
+    def invalidate
+      record :invalidate
+      metastore.invalidate(@request, entitystore)
+      pass
     end
-  end
+    # Try to serve the response from cache. When a matching cache entry is
+    # found and is fresh, use it as the response without forwarding any
+    # request to the backend. When a matching cache entry is found but is
+    # stale, attempt to #validate the entry with the backend using conditional
+    # GET. When no matching cache entry is found, trigger #miss processing.
+    def lookup
+      if @request.no_cache? && allow_reload?
+        record :reload
+        fetch
+      elsif entry = metastore.lookup(@request, entitystore)
+        if fresh_enough?(entry)
+          record :fresh
+          entry.headers['Age'] = entry.age.to_s
+          entry
+        else
+          record :stale
+          validate(entry)
+        end
+      else
+        record :miss
+        fetch
+      end
+    end
+    # Validate that the cache entry is fresh. The original request is used
+    # as a template for a conditional GET request with the backend.
+    def validate(entry)
+      # always send a GET (never a HEAD) to the backend because we want content
+      @env['REQUEST_METHOD'] = 'GET'
+      # add our cached validators to the environment
+      @env['HTTP_IF_MODIFIED_SINCE'] = entry.last_modified
+      @env['HTTP_IF_NONE_MATCH'] = entry.etag
+      backend_response = forward
+      response =
+        if backend_response.status == 304
+          record :valid
+          entry = entry.dup
+          entry.headers.delete('Date')
+          %w[Date Expires Cache-Control ETag Last-Modified].each do |name|
+            next unless value = backend_response.headers[name]
+            entry.headers[name] = value
+          end
+          entry
+        else
+          record :invalid
+          backend_response
+        end
+      store(response) if response.cacheable?
+      response
+    end
+    # The cache missed or a reload is required. Forward the request to the
+    # backend and determine whether the response should be stored.
+    def fetch
+      # always send a GET (never a HEAD) to the backend because we want content
+      @env['REQUEST_METHOD'] = 'GET'
+      # drop the conditional headers so the backend does not reply without content
+      @env.delete('HTTP_IF_MODIFIED_SINCE')
+      @env.delete('HTTP_IF_NONE_MATCH')
+      response = forward
+      # Mark the response as explicitly private if any of the private
+      # request headers are present and the response was not explicitly
+      # declared public.
+      if private_request? && !response.cache_control.public?
+        response.private = true
+      elsif default_ttl > 0 && response.ttl.nil? && !response.cache_control.must_revalidate?
+        # assign a default TTL for the cache entry if none was specified in
+        # the response; the must-revalidate cache control directive disables
+        # default ttl assignment.
+        response.ttl = default_ttl
+      end
+      store(response) if response.cacheable?
+      response
+    end
+    # Write the response to the cache.
+    def store(response)
+      record :store
+      metastore.store(@request, response, entitystore)
+      response.headers['Age'] = response.age.to_s
+    end
+  end
 end