PyPI - swift - Versions diffs - 2.31.1__py2.py3-none-any.whl → 2.32.1__py2.py3-none-any.whl - Mend

swift 2.31.1__py2.py3-none-any.whl → 2.32.1__py2.py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (104)

swift/cli/info.py +9 -2
swift/cli/ringbuilder.py +5 -1
swift/common/container_sync_realms.py +6 -7
swift/common/daemon.py +7 -3
swift/common/db.py +22 -7
swift/common/db_replicator.py +19 -20
swift/common/direct_client.py +63 -14
swift/common/internal_client.py +24 -3
swift/common/manager.py +43 -44
swift/common/memcached.py +168 -74
swift/common/middleware/__init__.py +4 -0
swift/common/middleware/account_quotas.py +98 -40
swift/common/middleware/backend_ratelimit.py +6 -4
swift/common/middleware/crossdomain.py +21 -8
swift/common/middleware/listing_formats.py +26 -38
swift/common/middleware/proxy_logging.py +12 -9
swift/common/middleware/s3api/controllers/bucket.py +8 -2
swift/common/middleware/s3api/s3api.py +9 -4
swift/common/middleware/s3api/s3request.py +32 -24
swift/common/middleware/s3api/s3response.py +10 -1
swift/common/middleware/tempauth.py +9 -10
swift/common/middleware/versioned_writes/__init__.py +0 -3
swift/common/middleware/versioned_writes/object_versioning.py +22 -5
swift/common/middleware/x_profile/html_viewer.py +1 -1
swift/common/middleware/xprofile.py +5 -0
swift/common/request_helpers.py +1 -2
swift/common/ring/ring.py +22 -19
swift/common/swob.py +2 -1
swift/common/{utils.py → utils/__init__.py} +610 -1146
swift/common/utils/ipaddrs.py +256 -0
swift/common/utils/libc.py +345 -0
swift/common/utils/timestamp.py +399 -0
swift/common/wsgi.py +70 -39
swift/container/backend.py +106 -38
swift/container/server.py +11 -2
swift/container/sharder.py +34 -15
swift/locale/de/LC_MESSAGES/swift.po +1 -320
swift/locale/en_GB/LC_MESSAGES/swift.po +1 -347
swift/locale/es/LC_MESSAGES/swift.po +1 -279
swift/locale/fr/LC_MESSAGES/swift.po +1 -209
swift/locale/it/LC_MESSAGES/swift.po +1 -207
swift/locale/ja/LC_MESSAGES/swift.po +2 -278
swift/locale/ko_KR/LC_MESSAGES/swift.po +3 -303
swift/locale/pt_BR/LC_MESSAGES/swift.po +1 -204
swift/locale/ru/LC_MESSAGES/swift.po +1 -203
swift/locale/tr_TR/LC_MESSAGES/swift.po +1 -192
swift/locale/zh_CN/LC_MESSAGES/swift.po +1 -192
swift/locale/zh_TW/LC_MESSAGES/swift.po +1 -193
swift/obj/diskfile.py +19 -6
swift/obj/server.py +20 -6
swift/obj/ssync_receiver.py +19 -9
swift/obj/ssync_sender.py +10 -10
swift/proxy/controllers/account.py +7 -7
swift/proxy/controllers/base.py +374 -366
swift/proxy/controllers/container.py +112 -53
swift/proxy/controllers/obj.py +254 -390
swift/proxy/server.py +3 -8
{swift-2.31.1.data → swift-2.32.1.data}/scripts/swift-account-server +1 -1
{swift-2.31.1.data → swift-2.32.1.data}/scripts/swift-container-server +1 -1
{swift-2.31.1.data → swift-2.32.1.data}/scripts/swift-drive-audit +45 -14
{swift-2.31.1.data → swift-2.32.1.data}/scripts/swift-object-server +1 -1
{swift-2.31.1.data → swift-2.32.1.data}/scripts/swift-proxy-server +1 -1
{swift-2.31.1.dist-info → swift-2.32.1.dist-info}/AUTHORS +4 -0
{swift-2.31.1.dist-info → swift-2.32.1.dist-info}/METADATA +32 -35
{swift-2.31.1.dist-info → swift-2.32.1.dist-info}/RECORD +103 -100
{swift-2.31.1.dist-info → swift-2.32.1.dist-info}/WHEEL +1 -1
{swift-2.31.1.dist-info → swift-2.32.1.dist-info}/entry_points.txt +0 -1
swift-2.32.1.dist-info/pbr.json +1 -0
swift-2.31.1.dist-info/pbr.json +0 -1
{swift-2.31.1.data → swift-2.32.1.data}/scripts/swift-account-audit +0 -0
{swift-2.31.1.data → swift-2.32.1.data}/scripts/swift-account-auditor +0 -0
{swift-2.31.1.data → swift-2.32.1.data}/scripts/swift-account-info +0 -0
{swift-2.31.1.data → swift-2.32.1.data}/scripts/swift-account-reaper +0 -0
{swift-2.31.1.data → swift-2.32.1.data}/scripts/swift-account-replicator +0 -0
{swift-2.31.1.data → swift-2.32.1.data}/scripts/swift-config +0 -0
{swift-2.31.1.data → swift-2.32.1.data}/scripts/swift-container-auditor +0 -0
{swift-2.31.1.data → swift-2.32.1.data}/scripts/swift-container-info +0 -0
{swift-2.31.1.data → swift-2.32.1.data}/scripts/swift-container-reconciler +0 -0
{swift-2.31.1.data → swift-2.32.1.data}/scripts/swift-container-replicator +0 -0
{swift-2.31.1.data → swift-2.32.1.data}/scripts/swift-container-sharder +0 -0
{swift-2.31.1.data → swift-2.32.1.data}/scripts/swift-container-sync +0 -0
{swift-2.31.1.data → swift-2.32.1.data}/scripts/swift-container-updater +0 -0
{swift-2.31.1.data → swift-2.32.1.data}/scripts/swift-dispersion-populate +0 -0
{swift-2.31.1.data → swift-2.32.1.data}/scripts/swift-dispersion-report +0 -0
{swift-2.31.1.data → swift-2.32.1.data}/scripts/swift-form-signature +0 -0
{swift-2.31.1.data → swift-2.32.1.data}/scripts/swift-get-nodes +0 -0
{swift-2.31.1.data → swift-2.32.1.data}/scripts/swift-init +0 -0
{swift-2.31.1.data → swift-2.32.1.data}/scripts/swift-object-auditor +0 -0
{swift-2.31.1.data → swift-2.32.1.data}/scripts/swift-object-expirer +0 -0
{swift-2.31.1.data → swift-2.32.1.data}/scripts/swift-object-info +0 -0
{swift-2.31.1.data → swift-2.32.1.data}/scripts/swift-object-reconstructor +0 -0
{swift-2.31.1.data → swift-2.32.1.data}/scripts/swift-object-relinker +0 -0
{swift-2.31.1.data → swift-2.32.1.data}/scripts/swift-object-replicator +0 -0
{swift-2.31.1.data → swift-2.32.1.data}/scripts/swift-object-updater +0 -0
{swift-2.31.1.data → swift-2.32.1.data}/scripts/swift-oldies +0 -0
{swift-2.31.1.data → swift-2.32.1.data}/scripts/swift-orphans +0 -0
{swift-2.31.1.data → swift-2.32.1.data}/scripts/swift-recon +0 -0
{swift-2.31.1.data → swift-2.32.1.data}/scripts/swift-recon-cron +0 -0
{swift-2.31.1.data → swift-2.32.1.data}/scripts/swift-reconciler-enqueue +0 -0
{swift-2.31.1.data → swift-2.32.1.data}/scripts/swift-ring-builder +0 -0
{swift-2.31.1.data → swift-2.32.1.data}/scripts/swift-ring-builder-analyzer +0 -0
{swift-2.31.1.data → swift-2.32.1.data}/scripts/swift-ring-composer +0 -0
{swift-2.31.1.dist-info → swift-2.32.1.dist-info}/LICENSE +0 -0
{swift-2.31.1.dist-info → swift-2.32.1.dist-info}/top_level.txt +0 -0

swift/proxy/controllers/obj.py CHANGED

@@ -38,7 +38,7 @@ import random
 import sys
 from greenlet import GreenletExit
-from eventlet import GreenPile, sleep
+from eventlet import GreenPile
 from eventlet.queue import Queue, Empty
 from eventlet.timeout import Timeout
@@ -48,7 +48,8 @@ from swift.common.utils import (
     normalize_delete_at_timestamp, public, get_expirer_container,
     document_iters_to_http_response_body, parse_content_range,
     quorum_size, reiterate, close_if_possible, safe_json_loads, md5,
-    ShardRange, find_shard_range, cache_from_env)
+    ShardRange, find_namespace, cache_from_env, NamespaceBoundList,
+    CooperativeIterator)
 from swift.common.bufferedhttp import http_connect
 from swift.common.constraints import check_metadata, check_object_creation
 from swift.common import constraints
@@ -67,8 +68,9 @@ from swift.common.memcached import MemcacheConnectionError
 from swift.common.storage_policy import (POLICIES, REPL_POLICY, EC_POLICY,
                                          ECDriverError, PolicyError)
 from swift.proxy.controllers.base import Controller, delay_denial, \
-    cors_validation, update_headers, bytes_to_skip, close_swift_conn, \
-    ByteCountEnforcer, record_cache_op_metrics, get_cache_key
+    cors_validation, update_headers, bytes_to_skip, ByteCountEnforcer, \
+    record_cache_op_metrics, get_cache_key, GetterBase, GetterSource, \
+    is_good_source, NodeIter
 from swift.common.swob import HTTPAccepted, HTTPBadRequest, HTTPNotFound, \
     HTTPPreconditionFailed, HTTPRequestEntityTooLarge, HTTPRequestTimeout, \
     HTTPServerError, HTTPServiceUnavailable, HTTPClientDisconnect, \
@@ -76,8 +78,7 @@ from swift.common.swob import HTTPAccepted, HTTPBadRequest, HTTPNotFound, \
     HTTPRequestedRangeNotSatisfiable, Range, HTTPInternalServerError, \
     normalize_etag
 from swift.common.request_helpers import update_etag_is_at_header, \
-    resolve_etag_is_at_header, validate_internal_obj, get_ip_port, \
-    http_response_to_document_iters
+    resolve_etag_is_at_header, validate_internal_obj, get_ip_port
 def check_content_type(req):
@@ -200,8 +201,8 @@ class BaseObjectController(Controller):
         policy_options = self.app.get_policy_options(policy)
         is_local = policy_options.write_affinity_is_local_fn
         if is_local is None:
-            return self.app.iter_nodes(ring, partition, self.logger, request,
-                                       policy=policy)
+            return NodeIter(self.app, ring, partition, self.logger, request,
+                            policy=policy)
         primary_nodes = ring.get_part_nodes(partition)
         handoff_nodes = ring.get_more_nodes(partition)
@@ -234,8 +235,8 @@ class BaseObjectController(Controller):
             (node for node in all_nodes if node not in preferred_nodes)
         )
-        return self.app.iter_nodes(ring, partition, self.logger, request,
-                                   node_iter=node_iter, policy=policy)
+        return NodeIter(self.app, ring, partition, self.logger, request,
+                        node_iter=node_iter, policy=policy)
     def GETorHEAD(self, req):
         """Handle HTTP GET or HEAD requests."""
@@ -254,8 +255,8 @@ class BaseObjectController(Controller):
                 return aresp
         partition = obj_ring.get_part(
             self.account_name, self.container_name, self.object_name)
-        node_iter = self.app.iter_nodes(obj_ring, partition, self.logger, req,
-                                        policy=policy)
+        node_iter = NodeIter(self.app, obj_ring, partition, self.logger, req,
+                             policy=policy)
         resp = self._get_or_head_response(req, node_iter, partition, policy)
@@ -278,37 +279,67 @@ class BaseObjectController(Controller):
         """Handler for HTTP HEAD requests."""
         return self.GETorHEAD(req)
-    def _get_cached_updating_shard_ranges(
+    def _get_cached_updating_namespaces(
             self, infocache, memcache, cache_key):
         """
-        Fetch cached shard ranges from infocache and memcache.
+        Fetch cached updating namespaces of updating shard ranges from
+        infocache and memcache.
         :param infocache: the infocache instance.
         :param memcache: an instance of a memcache client,
                          :class:`swift.common.memcached.MemcacheRing`.
         :param cache_key: the cache key for both infocache and memcache.
-        :return: a tuple of (list of shard ranges in dict format, cache state)
-        """
-        cached_ranges = infocache.get(cache_key)
-        if cached_ranges:
-            cache_state = 'infocache_hit'
+        :return: a tuple of (an instance of NamespaceBoundList, cache state)
+        """
+        # try get namespaces from infocache first
+        namespace_list = infocache.get(cache_key)
+        if namespace_list:
+            return namespace_list, 'infocache_hit'
+        # then try get them from memcache
+        if not memcache:
+            return None, 'disabled'
+        skip_chance = self.app.container_updating_shard_ranges_skip_cache
+        if skip_chance and random.random() < skip_chance:
+            return None, 'skip'
+        try:
+            namespaces = memcache.get(cache_key, raise_on_error=True)
+            cache_state = 'hit' if namespaces else 'miss'
+        except MemcacheConnectionError:
+            namespaces = None
+            cache_state = 'error'
+        if namespaces:
+            if six.PY2:
+                # json.loads() in memcache.get will convert json 'string' to
+                # 'unicode' with python2, here we cast 'unicode' back to 'str'
+                namespaces = [
+                    [lower.encode('utf-8'), name.encode('utf-8')]
+                    for lower, name in namespaces]
+            namespace_list = NamespaceBoundList(namespaces)
         else:
-            if memcache:
-                skip_chance = \
-                    self.app.container_updating_shard_ranges_skip_cache
-                if skip_chance and random.random() < skip_chance:
-                    cache_state = 'skip'
-                else:
-                    try:
-                        cached_ranges = memcache.get(
-                            cache_key, raise_on_error=True)
-                        cache_state = 'hit' if cached_ranges else 'miss'
-                    except MemcacheConnectionError:
-                        cache_state = 'error'
-            else:
-                cache_state = 'disabled'
-        cached_ranges = cached_ranges or []
-        return cached_ranges, cache_state
+            namespace_list = None
+        return namespace_list, cache_state
+    def _get_update_shard_caching_disabled(self, req, account, container, obj):
+        """
+        Fetch all updating shard ranges for the given root container when
+        all caching is disabled.
+        :param req: original Request instance.
+        :param account: account from which shard ranges should be fetched.
+        :param container: container from which shard ranges should be fetched.
+        :param obj: object getting updated.
+        :return: an instance of :class:`swift.common.utils.ShardRange`,
+            or None if the update should go back to the root
+        """
+        # legacy behavior requests container server for includes=obj
+        shard_ranges, response = self._get_shard_ranges(
+            req, account, container, states='updating', includes=obj)
+        record_cache_op_metrics(
+            self.logger, 'shard_updating', 'disabled', response)
+        # there will be only one shard range in the list if any
+        return shard_ranges[0] if shard_ranges else None
     def _get_update_shard(self, req, account, container, obj):
         """
@@ -327,39 +358,44 @@ class BaseObjectController(Controller):
         """
         if not self.app.recheck_updating_shard_ranges:
             # caching is disabled
-            cache_state = 'disabled'
-            # legacy behavior requests container server for includes=obj
-            shard_ranges, response = self._get_shard_ranges(
-                req, account, container, states='updating', includes=obj)
+            return self._get_update_shard_caching_disabled(
+                req, account, container, obj)
+        # caching is enabled, try to get from caches
+        response = None
+        cache_key = get_cache_key(account, container, shard='updating')
+        infocache = req.environ.setdefault('swift.infocache', {})
+        memcache = cache_from_env(req.environ, True)
+        cached_namespaces, cache_state = self._get_cached_updating_namespaces(
+            infocache, memcache, cache_key)
+        if cached_namespaces:
+            # found cached namespaces in either infocache or memcache
+            infocache[cache_key] = cached_namespaces
+            namespace = cached_namespaces.get_namespace(obj)
+            update_shard = ShardRange(
+                name=namespace.name, timestamp=0, lower=namespace.lower,
+                upper=namespace.upper)
         else:
-            # try to get from cache
-            response = None
-            cache_key = get_cache_key(account, container, shard='updating')
-            infocache = req.environ.setdefault('swift.infocache', {})
-            memcache = cache_from_env(req.environ, True)
-            (cached_ranges, cache_state
-             ) = self._get_cached_updating_shard_ranges(
-                infocache, memcache, cache_key)
-            if cached_ranges:
-                # found cached shard ranges in either infocache or memcache
-                infocache[cache_key] = tuple(cached_ranges)
-                shard_ranges = [ShardRange.from_dict(shard_range)
-                                for shard_range in cached_ranges]
-            else:
-                # pull full set of updating shards from backend
-                shard_ranges, response = self._get_shard_ranges(
-                    req, account, container, states='updating')
-                if shard_ranges:
-                    cached_ranges = [dict(sr) for sr in shard_ranges]
-                    infocache[cache_key] = tuple(cached_ranges)
-                    if memcache:
-                        memcache.set(
-                            cache_key, cached_ranges,
-                            time=self.app.recheck_updating_shard_ranges)
+            # pull full set of updating shard ranges from backend
+            shard_ranges, response = self._get_shard_ranges(
+                req, account, container, states='updating')
+            if shard_ranges:
+                # only store the list of namespace lower bounds and names into
+                # infocache and memcache.
+                cached_namespaces = NamespaceBoundList.parse(
+                    shard_ranges)
+                infocache[cache_key] = cached_namespaces
+                if memcache:
+                    self.logger.info(
+                        'Caching updating shards for %s (%d shards)',
+                        cache_key, len(cached_namespaces.bounds))
+                    memcache.set(
+                        cache_key, cached_namespaces.bounds,
+                        time=self.app.recheck_updating_shard_ranges)
+            update_shard = find_namespace(obj, shard_ranges or [])
         record_cache_op_metrics(
             self.logger, 'shard_updating', cache_state, response)
-        return find_shard_range(obj, shard_ranges or [])
+        return update_shard
     def _get_update_target(self, req, container_info):
         # find the sharded container to which we'll send the update
@@ -975,6 +1011,7 @@ class ReplicatedObjectController(BaseObjectController):
         This method was added in the PUT method extraction change
         """
         bytes_transferred = 0
+        data_source = CooperativeIterator(data_source)
         def send_chunk(chunk):
             timeout_at = time.time() + self.app.node_timeout
@@ -1132,14 +1169,15 @@ class ECAppIter(object):
         self.mime_boundary = None
         self.learned_content_type = None
         self.stashed_iter = None
+        self.pool = ContextPool(len(internal_parts_iters))
     def close(self):
-        # close down the stashed iter first so the ContextPool can
-        # cleanup the frag queue feeding coros that may be currently
+        # close down the stashed iter and shutdown the context pool to
+        # clean up the frag queue feeding coroutines that may be currently
         # executing the internal_parts_iters.
         if self.stashed_iter:
             close_if_possible(self.stashed_iter)
-        sleep()  # Give the per-frag threads a chance to clean up
+        self.pool.close()
         for it in self.internal_parts_iters:
             close_if_possible(it)
@@ -1486,7 +1524,7 @@ class ECAppIter(object):
             except ChunkWriteTimeout:
                 # slow client disconnect
                 self.logger.exception(
-                    "ChunkWriteTimeout fetching fragments for %r",
+                    "ChunkWriteTimeout feeding fragments for %r",
                     quote(self.path))
             except:  # noqa
                 self.logger.exception("Exception fetching fragments for %r",
@@ -1497,7 +1535,7 @@ class ECAppIter(object):
                 frag_iter.close()
         segments_decoded = 0
-        with ContextPool(len(fragment_iters)) as pool:
+        with self.pool as pool:
             for frag_iter, queue in zip(fragment_iters, queues):
                 pool.spawn(put_fragments_in_queue, frag_iter, queue,
                            self.logger.thread_locals)
@@ -2195,8 +2233,8 @@ class ECGetResponseBucket(object):
         Close bucket's responses; they won't be used for a client response.
         """
         for getter, frag_iter in self.get_responses():
-            if getattr(getter.source, 'swift_conn', None):
-                close_swift_conn(getter.source)
+            if getter.source:
+                getter.source.close()
     def __str__(self):
         # return a string summarising bucket state, useful for debugging.
@@ -2286,7 +2324,8 @@ class ECGetResponseCollection(object):
         frag_sets = safe_json_loads(headers.get('X-Backend-Fragments')) or {}
         for t_frag, frag_set in frag_sets.items():
             t_frag = Timestamp(t_frag)
-            self._get_bucket(t_frag).add_alternate_nodes(get.node, frag_set)
+            self._get_bucket(t_frag).add_alternate_nodes(
+                get.source.node, frag_set)
         # If the response includes a durable timestamp then mark that bucket as
         # durable. Note that this may be a different bucket than the one this
         # response got added to, and that we may never go and get a durable
@@ -2439,326 +2478,125 @@ class ECGetResponseCollection(object):
             return nodes.pop(0).copy()
-def is_good_source(status):
-    """
-    Indicates whether or not the request made to the backend found
-    what it was looking for.
-    :param status: the response from the backend
-    :returns: True if found, False if not
-    """
-    if status == HTTP_REQUESTED_RANGE_NOT_SATISFIABLE:
-        return True
-    return is_success(status) or is_redirection(status)
-class ECFragGetter(object):
+class ECFragGetter(GetterBase):
     def __init__(self, app, req, node_iter, partition, policy, path,
                  backend_headers, header_provider, logger_thread_locals,
                  logger):
-        self.app = app
-        self.req = req
-        self.node_iter = node_iter
-        self.partition = partition
-        self.path = path
-        self.backend_headers = backend_headers
+        super(ECFragGetter, self).__init__(
+            app=app, req=req, node_iter=node_iter,
+            partition=partition, policy=policy, path=path,
+            backend_headers=backend_headers, logger=logger)
         self.header_provider = header_provider
-        self.req_query_string = req.query_string
-        self.client_chunk_size = policy.fragment_size
+        self.fragment_size = policy.fragment_size
         self.skip_bytes = 0
-        self.bytes_used_from_backend = 0
-        self.source = None
         self.logger_thread_locals = logger_thread_locals
-        self.logger = logger
-    def fast_forward(self, num_bytes):
-        """
-        Will skip num_bytes into the current ranges.
-        :params num_bytes: the number of bytes that have already been read on
-                           this request. This will change the Range header
-                           so that the next req will start where it left off.
-        :raises HTTPRequestedRangeNotSatisfiable: if begin + num_bytes
-                                                  > end of range + 1
-        :raises RangeAlreadyComplete: if begin + num_bytes == end of range + 1
-        """
-        try:
-            req_range = Range(self.backend_headers.get('Range'))
-        except ValueError:
-            req_range = None
-        if req_range:
-            begin, end = req_range.ranges[0]
-            if begin is None:
-                # this is a -50 range req (last 50 bytes of file)
-                end -= num_bytes
-                if end == 0:
-                    # we sent out exactly the first range's worth of bytes, so
-                    # we're done with it
-                    raise RangeAlreadyComplete()
-                if end < 0:
-                    raise HTTPRequestedRangeNotSatisfiable()
-            else:
-                begin += num_bytes
-                if end is not None and begin == end + 1:
-                    # we sent out exactly the first range's worth of bytes, so
-                    # we're done with it
-                    raise RangeAlreadyComplete()
-                if end is not None and begin > end:
-                    raise HTTPRequestedRangeNotSatisfiable()
-            req_range.ranges = [(begin, end)] + req_range.ranges[1:]
-            self.backend_headers['Range'] = str(req_range)
-        else:
-            self.backend_headers['Range'] = 'bytes=%d-' % num_bytes
-        # Reset so if we need to do this more than once, we don't double-up
-        self.bytes_used_from_backend = 0
-    def pop_range(self):
-        """
-        Remove the first byterange from our Range header.
+        self.status = self.reason = self.body = self.source_headers = None
+        self._source_iter = None
-        This is used after a byterange has been completely sent to the
-        client; this way, should we need to resume the download from another
-        object server, we do not re-fetch byteranges that the client already
-        has.
+    def _get_next_response_part(self):
+        node_timeout = self.app.recoverable_node_timeout
-        If we have no Range header, this is a no-op.
-        """
-        if 'Range' in self.backend_headers:
+        while True:
+            # the loop here is to resume if trying to parse
+            # multipart/byteranges response raises a ChunkReadTimeout
+            # and resets the source_parts_iter
             try:
-                req_range = Range(self.backend_headers['Range'])
-            except ValueError:
-                # there's a Range header, but it's garbage, so get rid of it
-                self.backend_headers.pop('Range')
-                return
-            begin, end = req_range.ranges.pop(0)
-            if len(req_range.ranges) > 0:
-                self.backend_headers['Range'] = str(req_range)
-            else:
-                self.backend_headers.pop('Range')
-    def learn_size_from_content_range(self, start, end, length):
-        """
-        If client_chunk_size is set, makes sure we yield things starting on
-        chunk boundaries based on the Content-Range header in the response.
-        Sets our Range header's first byterange to the value learned from
-        the Content-Range header in the response; if we were given a
-        fully-specified range (e.g. "bytes=123-456"), this is a no-op.
-        If we were given a half-specified range (e.g. "bytes=123-" or
-        "bytes=-456"), then this changes the Range header to a
-        semantically-equivalent one *and* it lets us resume on a proper
-        boundary instead of just in the middle of a piece somewhere.
-        """
-        if length == 0:
-            return
-        if self.client_chunk_size:
-            self.skip_bytes = bytes_to_skip(self.client_chunk_size, start)
+                with WatchdogTimeout(self.app.watchdog, node_timeout,
+                                     ChunkReadTimeout):
+                    # If we don't have a multipart/byteranges response,
+                    # but just a 200 or a single-range 206, then this
+                    # performs no IO, and just returns source (or
+                    # raises StopIteration).
+                    # Otherwise, this call to next() performs IO when
+                    # we have a multipart/byteranges response; as it
+                    # will read the MIME boundary and part headers.
+                    start_byte, end_byte, length, headers, part = next(
+                        self.source.parts_iter)
+                return (start_byte, end_byte, length, headers, part)
+            except ChunkReadTimeout:
+                if not self._replace_source(
+                        'Trying to read next part of EC multi-part GET '
+                        '(retrying)'):
+                    raise
-        if 'Range' in self.backend_headers:
+    def _iter_bytes_from_response_part(self, part_file, nbytes):
+        buf = b''
+        part_file = ByteCountEnforcer(part_file, nbytes)
+        while True:
             try:
-                req_range = Range(self.backend_headers['Range'])
-                new_ranges = [(start, end)] + req_range.ranges[1:]
-            except ValueError:
-                new_ranges = [(start, end)]
-        else:
-            new_ranges = [(start, end)]
-        self.backend_headers['Range'] = (
-            "bytes=" + (",".join("%s-%s" % (s if s is not None else '',
-                                            e if e is not None else '')
-                                 for s, e in new_ranges)))
-    def response_parts_iter(self, req):
-        try:
-            self.source, self.node = next(self.source_and_node_iter)
-        except StopIteration:
-            return
-        it = None
-        if self.source:
-            it = self._get_response_parts_iter(req)
-        return it
-    def _get_response_parts_iter(self, req):
-        try:
-            client_chunk_size = self.client_chunk_size
-            node_timeout = self.app.recoverable_node_timeout
-            # This is safe; it sets up a generator but does not call next()
-            # on it, so no IO is performed.
-            parts_iter = [
-                http_response_to_document_iters(
-                    self.source, read_chunk_size=self.app.object_chunk_size)]
-            def get_next_doc_part():
-                while True:
-                    # the loop here is to resume if trying to parse
-                    # multipart/byteranges response raises a ChunkReadTimeout
-                    # and resets the parts_iter
-                    try:
-                        with WatchdogTimeout(self.app.watchdog, node_timeout,
-                                             ChunkReadTimeout):
-                            # If we don't have a multipart/byteranges response,
-                            # but just a 200 or a single-range 206, then this
-                            # performs no IO, and just returns source (or
-                            # raises StopIteration).
-                            # Otherwise, this call to next() performs IO when
-                            # we have a multipart/byteranges response; as it
-                            # will read the MIME boundary and part headers.
-                            start_byte, end_byte, length, headers, part = next(
-                                parts_iter[0])
-                        return (start_byte, end_byte, length, headers, part)
-                    except ChunkReadTimeout:
-                        new_source, new_node = self._dig_for_source_and_node()
-                        if not new_source:
-                            raise
-                        self.app.error_occurred(
-                            self.node, 'Trying to read next part of '
-                            'EC multi-part GET (retrying)')
-                        # Close-out the connection as best as possible.
-                        if getattr(self.source, 'swift_conn', None):
-                            close_swift_conn(self.source)
-                        self.source = new_source
-                        self.node = new_node
-                        # This is safe; it sets up a generator but does
-                        # not call next() on it, so no IO is performed.
-                        parts_iter[0] = http_response_to_document_iters(
-                            new_source,
-                            read_chunk_size=self.app.object_chunk_size)
-            def iter_bytes_from_response_part(part_file, nbytes):
-                nchunks = 0
+                with WatchdogTimeout(self.app.watchdog,
+                                     self.app.recoverable_node_timeout,
+                                     ChunkReadTimeout):
+                    chunk = part_file.read(self.app.object_chunk_size)
+                    # NB: this append must be *inside* the context
+                    # manager for test.unit.SlowBody to do its thing
+                    buf += chunk
+                    if nbytes is not None:
+                        nbytes -= len(chunk)
+            except (ChunkReadTimeout, ShortReadError):
+                exc_type, exc_value, exc_traceback = sys.exc_info()
+                try:
+                    self.fast_forward(self.bytes_used_from_backend)
+                except (HTTPException, ValueError):
+                    self.logger.exception('Unable to fast forward')
+                    six.reraise(exc_type, exc_value, exc_traceback)
+                except RangeAlreadyComplete:
+                    break
                 buf = b''
-                part_file = ByteCountEnforcer(part_file, nbytes)
-                while True:
+                if self._replace_source(
+                        'Trying to read EC fragment during GET (retrying)'):
                     try:
-                        with WatchdogTimeout(self.app.watchdog, node_timeout,
-                                             ChunkReadTimeout):
-                            chunk = part_file.read(self.app.object_chunk_size)
-                            nchunks += 1
-                            # NB: this append must be *inside* the context
-                            # manager for test.unit.SlowBody to do its thing
-                            buf += chunk
-                            if nbytes is not None:
-                                nbytes -= len(chunk)
-                    except (ChunkReadTimeout, ShortReadError):
-                        exc_type, exc_value, exc_traceback = sys.exc_info()
-                        try:
-                            self.fast_forward(self.bytes_used_from_backend)
-                        except (HTTPException, ValueError):
-                            self.logger.exception('Unable to fast forward')
-                            six.reraise(exc_type, exc_value, exc_traceback)
-                        except RangeAlreadyComplete:
-                            break
-                        buf = b''
-                        old_node = self.node
-                        new_source, new_node = self._dig_for_source_and_node()
-                        if new_source:
-                            self.app.error_occurred(
-                                old_node, 'Trying to read EC fragment '
-                                'during GET (retrying)')
-                            # Close-out the connection as best as possible.
-                            if getattr(self.source, 'swift_conn', None):
-                                close_swift_conn(self.source)
-                            self.source = new_source
-                            self.node = new_node
-                            # This is safe; it just sets up a generator but
-                            # does not call next() on it, so no IO is
-                            # performed.
-                            parts_iter[0] = http_response_to_document_iters(
-                                new_source,
-                                read_chunk_size=self.app.object_chunk_size)
-                            try:
-                                _junk, _junk, _junk, _junk, part_file = \
-                                    get_next_doc_part()
-                            except StopIteration:
-                                # it's not clear to me how to make
-                                # get_next_doc_part raise StopIteration for the
-                                # first doc part of a new request
-                                six.reraise(exc_type, exc_value, exc_traceback)
-                            part_file = ByteCountEnforcer(part_file, nbytes)
-                        else:
-                            six.reraise(exc_type, exc_value, exc_traceback)
+                        _junk, _junk, _junk, _junk, part_file = \
+                            self._get_next_response_part()
+                    except StopIteration:
+                        # it's not clear to me how to make
+                        # _get_next_response_part raise StopIteration for the
+                        # first doc part of a new request
+                        six.reraise(exc_type, exc_value, exc_traceback)
+                    part_file = ByteCountEnforcer(part_file, nbytes)
+                else:
+                    six.reraise(exc_type, exc_value, exc_traceback)
+            else:
+                if buf and self.skip_bytes:
+                    if self.skip_bytes < len(buf):
+                        buf = buf[self.skip_bytes:]
+                        self.bytes_used_from_backend += self.skip_bytes
+                        self.skip_bytes = 0
                     else:
-                        if buf and self.skip_bytes:
-                            if self.skip_bytes < len(buf):
-                                buf = buf[self.skip_bytes:]
-                                self.bytes_used_from_backend += self.skip_bytes
-                                self.skip_bytes = 0
-                            else:
-                                self.skip_bytes -= len(buf)
-                                self.bytes_used_from_backend += len(buf)
-                                buf = b''
-                        if not chunk:
-                            if buf:
-                                with WatchdogTimeout(self.app.watchdog,
-                                                     self.app.client_timeout,
-                                                     ChunkWriteTimeout):
-                                    self.bytes_used_from_backend += len(buf)
-                                    yield buf
-                                buf = b''
-                            break
-                        if client_chunk_size is not None:
-                            while len(buf) >= client_chunk_size:
-                                client_chunk = buf[:client_chunk_size]
-                                buf = buf[client_chunk_size:]
-                                with WatchdogTimeout(self.app.watchdog,
-                                                     self.app.client_timeout,
-                                                     ChunkWriteTimeout):
-                                    self.bytes_used_from_backend += \
-                                        len(client_chunk)
-                                    yield client_chunk
-                        else:
-                            with WatchdogTimeout(self.app.watchdog,
-                                                 self.app.client_timeout,
-                                                 ChunkWriteTimeout):
-                                self.bytes_used_from_backend += len(buf)
-                                yield buf
-                            buf = b''
-                        # This is for fairness; if the network is outpacing
-                        # the CPU, we'll always be able to read and write
-                        # data without encountering an EWOULDBLOCK, and so
-                        # eventlet will not switch greenthreads on its own.
-                        # We do it manually so that clients don't starve.
-                        #
-                        # The number 5 here was chosen by making stuff up.
-                        # It's not every single chunk, but it's not too big
-                        # either, so it seemed like it would probably be an
-                        # okay choice.
-                        #
-                        # Note that we may trampoline to other greenthreads
-                        # more often than once every 5 chunks, depending on
-                        # how blocking our network IO is; the explicit sleep
-                        # here simply provides a lower bound on the rate of
-                        # trampolining.
-                        if nchunks % 5 == 0:
-                            sleep()
+                        self.skip_bytes -= len(buf)
+                        self.bytes_used_from_backend += len(buf)
+                        buf = b''
+                while buf and (len(buf) >= self.fragment_size or not chunk):
+                    client_chunk = buf[:self.fragment_size]
+                    buf = buf[self.fragment_size:]
+                    with WatchdogTimeout(self.app.watchdog,
+                                         self.app.client_timeout,
+                                         ChunkWriteTimeout):
+                        self.bytes_used_from_backend += len(client_chunk)
+                        yield client_chunk
+                if not chunk:
+                    break
+    def _iter_parts_from_response(self, req):
+        try:
             part_iter = None
             try:
                 while True:
                     try:
                         start_byte, end_byte, length, headers, part = \
-                            get_next_doc_part()
+                            self._get_next_response_part()
                     except StopIteration:
                         # it seems this is the only way out of the loop; not
                         # sure why the req.environ update is always needed
                         req.environ['swift.non_client_disconnect'] = True
                         break
-                    # note: learn_size_from_content_range() sets
-                    # self.skip_bytes
+                    # skip_bytes compensates for the backend request range
+                    # expansion done in _convert_range
+                    self.skip_bytes = bytes_to_skip(
+                        self.fragment_size, start_byte)
                     self.learn_size_from_content_range(
                         start_byte, end_byte, length)
                     self.bytes_used_from_backend = 0
@@ -2768,7 +2606,8 @@ class ECFragGetter(object):
                                   if (end_byte is not None
                                       and start_byte is not None)
                                   else None)
-                    part_iter = iter_bytes_from_response_part(part, byte_count)
+                    part_iter = CooperativeIterator(
+                        self._iter_bytes_from_response_part(part, byte_count))
                     yield {'start_byte': start_byte, 'end_byte': end_byte,
                            'entity_length': length, 'headers': headers,
                            'part_iter': part_iter}
@@ -2778,7 +2617,7 @@ class ECFragGetter(object):
                     part_iter.close()
         except ChunkReadTimeout:
-            self.app.exception_occurred(self.node, 'Object',
+            self.app.exception_occurred(self.source.node, 'Object',
                                         'Trying to read during GET')
             raise
         except ChunkWriteTimeout:
@@ -2804,9 +2643,7 @@ class ECFragGetter(object):
             self.logger.exception('Trying to send to client')
             raise
         finally:
-            # Close-out the connection as best as possible.
-            if getattr(self.source, 'swift_conn', None):
-                close_swift_conn(self.source)
+            self.source.close()
     @property
     def last_status(self):
@@ -2820,6 +2657,8 @@ class ECFragGetter(object):
             return HeaderKeyDict()
     def _make_node_request(self, node, node_timeout):
+        # make a backend request; return a response if it has an acceptable
+        # status code, otherwise None
         self.logger.thread_locals = self.logger_thread_locals
         req_headers = dict(self.backend_headers)
         ip, port = get_ip_port(node, req_headers)
@@ -2831,7 +2670,7 @@ class ECFragGetter(object):
                     ip, port, node['device'],
                     self.partition, 'GET', self.path,
                     headers=req_headers,
-                    query_string=self.req_query_string)
+                    query_string=self.req.query_string)
             self.app.set_node_timing(node, time.time() - start_node_timing)
             with Timeout(node_timeout):
@@ -2863,7 +2702,7 @@ class ECFragGetter(object):
         self.status = possible_source.status
         self.reason = possible_source.reason
         self.source_headers = possible_source.getheaders()
-        if is_good_source(possible_source.status):
+        if is_good_source(possible_source.status, server_type='Object'):
             self.body = None
             return possible_source
         else:
@@ -2878,38 +2717,62 @@ class ECFragGetter(object):
             return None
     @property
-    def source_and_node_iter(self):
-        if not hasattr(self, '_source_and_node_iter'):
-            self._source_and_node_iter = self._source_and_node_gen()
-        return self._source_and_node_iter
+    def source_iter(self):
+        """
+        An iterator over responses to backend fragment GETs. Yields an
+        instance of ``GetterSource`` if a response is good, otherwise ``None``.
+        """
+        if self._source_iter is None:
+            self._source_iter = self._source_gen()
+        return self._source_iter
-    def _source_and_node_gen(self):
+    def _source_gen(self):
         self.status = self.reason = self.body = self.source_headers = None
         for node in self.node_iter:
             source = self._make_node_request(
                 node, self.app.recoverable_node_timeout)
             if source:
-                self.node = node
-                yield source, node
+                yield GetterSource(self.app, source, node)
             else:
-                yield None, None
+                yield None
             self.status = self.reason = self.body = self.source_headers = None
-    def _dig_for_source_and_node(self):
+    def _find_source(self):
         # capture last used etag before continuation
         used_etag = self.last_headers.get('X-Object-Sysmeta-EC-ETag')
-        for source, node in self.source_and_node_iter:
+        for source in self.source_iter:
             if not source:
                 # _make_node_request only returns good sources
                 continue
-            if source.getheader('X-Object-Sysmeta-EC-ETag') != used_etag:
+            if source.resp.getheader('X-Object-Sysmeta-EC-ETag') != used_etag:
                 self.logger.warning(
                     'Skipping source (etag mismatch: got %s, expected %s)',
-                    source.getheader('X-Object-Sysmeta-EC-ETag'), used_etag)
+                    source.resp.getheader('X-Object-Sysmeta-EC-ETag'),
+                    used_etag)
             else:
-                return source, node
-        return None, None
+                self.source = source
+                return True
+        return False
+    def response_parts_iter(self, req):
+        """
+        Create an iterator over a single fragment response body.
+        :param req: a ``swob.Request``.
+        :return: an iterator that yields chunks of bytes from a fragment
+            response body.
+        """
+        it = None
+        try:
+            source = next(self.source_iter)
+        except StopIteration:
+            pass
+        else:
+            if source:
+                self.source = source
+                it = self._iter_parts_from_response(req)
+        return it
 @ObjectControllerRouter.register(EC_POLICY)
@@ -3070,9 +2933,9 @@ class ECObjectController(BaseObjectController):
                     break
                 requests_available = extra_requests < max_extra_requests and (
                     node_iter.nodes_left > 0 or buckets.has_alternate_node())
-                bad_resp = not is_good_source(get.last_status)
                 if requests_available and (
-                        buckets.shortfall > pile._pending or bad_resp):
+                        buckets.shortfall > pile._pending or
+                        not is_good_source(get.last_status, self.server_type)):
                     extra_requests += 1
                     pile.spawn(self._fragment_GET_request, req, safe_iter,
                                partition, policy, buckets.get_extra_headers,
@@ -3343,6 +3206,7 @@ class ECObjectController(BaseObjectController):
             # same part nodes index as the primaries they are covering
             putter_to_frag_index = self._determine_chunk_destinations(
                 putters, policy)
+            data_source = CooperativeIterator(data_source)
             while True:
                 with WatchdogTimeout(self.app.watchdog,

swift 2.31.1__py2.py3-none-any.whl → 2.32.1__py2.py3-none-any.whl

swift 2.31.1__py2.py3-none-any.whl → 2.32.1__py2.py3-none-any.whl