Support multi-range GETs for static large objects.

Bonus consistency: 416 responses now always have a body. Before, if
you had "swob.HTTPRequestedRangeNotSatisfiable()", you'd get a body,
but if you had "swob.Response(..., conditional_response=True)", then
you'd get a length-0 response body. Now you always get a response
body. It's just the default <html><h1>..., but at it's always there.

Bonus efficiency: do a little caching of sub-SLO manifests to avoid
needless re-fetches. This kicks in when there are multiple references
to the same sub-SLO in a given manifest. The caching only holds 20
sub-SLOs so that a malicious user can't build a giant SLO tree and use
it to run the proxy out of memory (we're already holding up to 10
manifests in memory at a time since a SLO can include another SLO to a
depth of 10; this doesn't make the situation too much worse).

Change-Id: I24716e3271cf3370642e3755447e717fd7d9957c
This commit is contained in:
Samuel Merritt 2016-08-08 17:57:49 -07:00
parent e42567f14f
commit 4bcd3d7f6d
8 changed files with 357 additions and 89 deletions

View File

@ -213,12 +213,11 @@ from swift.common.exceptions import ListingIterError, SegmentError
from swift.common.swob import Request, HTTPBadRequest, HTTPServerError, \ from swift.common.swob import Request, HTTPBadRequest, HTTPServerError, \
HTTPMethodNotAllowed, HTTPRequestEntityTooLarge, HTTPLengthRequired, \ HTTPMethodNotAllowed, HTTPRequestEntityTooLarge, HTTPLengthRequired, \
HTTPOk, HTTPPreconditionFailed, HTTPException, HTTPNotFound, \ HTTPOk, HTTPPreconditionFailed, HTTPException, HTTPNotFound, \
HTTPUnauthorized, HTTPConflict, HTTPRequestedRangeNotSatisfiable,\ HTTPUnauthorized, HTTPConflict, Response, Range
Response, Range
from swift.common.utils import get_logger, config_true_value, \ from swift.common.utils import get_logger, config_true_value, \
get_valid_utf8_str, override_bytes_from_content_type, split_path, \ get_valid_utf8_str, override_bytes_from_content_type, split_path, \
register_swift_info, RateLimitedIterator, quote, close_if_possible, \ register_swift_info, RateLimitedIterator, quote, close_if_possible, \
closing_if_possible closing_if_possible, LRUCache
from swift.common.request_helpers import SegmentedIterable from swift.common.request_helpers import SegmentedIterable
from swift.common.constraints import check_utf8, MAX_BUFFERED_SLO_SEGMENTS from swift.common.constraints import check_utf8, MAX_BUFFERED_SLO_SEGMENTS
from swift.common.http import HTTP_NOT_FOUND, HTTP_UNAUTHORIZED, is_success from swift.common.http import HTTP_NOT_FOUND, HTTP_UNAUTHORIZED, is_success
@ -386,8 +385,6 @@ class SloGetContext(WSGIContext):
def __init__(self, slo): def __init__(self, slo):
self.slo = slo self.slo = slo
self.first_byte = None
self.last_byte = None
super(SloGetContext, self).__init__(slo.app) super(SloGetContext, self).__init__(slo.app)
def _fetch_sub_slo_segments(self, req, version, acc, con, obj): def _fetch_sub_slo_segments(self, req, version, acc, con, obj):
@ -434,7 +431,7 @@ class SloGetContext(WSGIContext):
return int(seg_dict['bytes']) return int(seg_dict['bytes'])
def _segment_listing_iterator(self, req, version, account, segments, def _segment_listing_iterator(self, req, version, account, segments,
recursion_depth=1): byteranges):
for seg_dict in segments: for seg_dict in segments:
if config_true_value(seg_dict.get('sub_slo')): if config_true_value(seg_dict.get('sub_slo')):
override_bytes_from_content_type(seg_dict, override_bytes_from_content_type(seg_dict,
@ -448,23 +445,46 @@ class SloGetContext(WSGIContext):
# If we were to make SegmentedIterable handle all the range # If we were to make SegmentedIterable handle all the range
# calculations, we would be unable to make this optimization. # calculations, we would be unable to make this optimization.
total_length = sum(self._segment_length(seg) for seg in segments) total_length = sum(self._segment_length(seg) for seg in segments)
if self.first_byte is None: if not byteranges:
self.first_byte = 0 byteranges = [(0, total_length - 1)]
if self.last_byte is None:
self.last_byte = total_length - 1
# Cache segments from sub-SLOs in case more than one byterange
# includes data from a particular sub-SLO. We only cache a few sets
# of segments so that a malicious user cannot build a giant SLO tree
# and then GET it to run the proxy out of memory.
#
# LRUCache is a little awkward to use this way, but it beats doing
# things manually.
#
# 20 is sort of an arbitrary choice; it's twice our max recursion
# depth, so we know this won't expand memory requirements by too
# much.
cached_fetch_sub_slo_segments = \
LRUCache(maxsize=20)(self._fetch_sub_slo_segments)
for first_byte, last_byte in byteranges:
byterange_listing_iter = self._byterange_listing_iterator(
req, version, account, segments, first_byte, last_byte,
cached_fetch_sub_slo_segments)
for seg_info in byterange_listing_iter:
yield seg_info
def _byterange_listing_iterator(self, req, version, account, segments,
first_byte, last_byte,
cached_fetch_sub_slo_segments,
recursion_depth=1):
last_sub_path = None last_sub_path = None
for seg_dict in segments: for seg_dict in segments:
seg_length = self._segment_length(seg_dict) seg_length = self._segment_length(seg_dict)
if self.first_byte >= seg_length: if first_byte >= seg_length:
# don't need any bytes from this segment # don't need any bytes from this segment
self.first_byte -= seg_length first_byte -= seg_length
self.last_byte -= seg_length last_byte -= seg_length
continue continue
if self.last_byte < 0: if last_byte < 0:
# no bytes are needed from this or any future segment # no bytes are needed from this or any future segment
break return
seg_range = seg_dict.get('range') seg_range = seg_dict.get('range')
if seg_range is None: if seg_range is None:
@ -483,33 +503,30 @@ class SloGetContext(WSGIContext):
sub_path = get_valid_utf8_str(seg_dict['name']) sub_path = get_valid_utf8_str(seg_dict['name'])
sub_cont, sub_obj = split_path(sub_path, 2, 2, True) sub_cont, sub_obj = split_path(sub_path, 2, 2, True)
if last_sub_path != sub_path: if last_sub_path != sub_path:
sub_segments = self._fetch_sub_slo_segments( sub_segments = cached_fetch_sub_slo_segments(
req, version, account, sub_cont, sub_obj) req, version, account, sub_cont, sub_obj)
last_sub_path = sub_path last_sub_path = sub_path
# Use the existing machinery to slice into the sub-SLO. # Use the existing machinery to slice into the sub-SLO.
# This requires that we save off our current state, and for sub_seg_dict, sb, eb in self._byterange_listing_iterator(
# restore at the other end.
orig_start, orig_end = self.first_byte, self.last_byte
self.first_byte = range_start + max(0, self.first_byte)
self.last_byte = min(range_end, range_start + self.last_byte)
for sub_seg_dict, sb, eb in self._segment_listing_iterator(
req, version, account, sub_segments, req, version, account, sub_segments,
# This adjusts first_byte and last_byte to be
# relative to the sub-SLO.
range_start + max(0, first_byte),
min(range_end, range_start + last_byte),
cached_fetch_sub_slo_segments,
recursion_depth=recursion_depth + 1): recursion_depth=recursion_depth + 1):
yield sub_seg_dict, sb, eb yield sub_seg_dict, sb, eb
# Restore the first/last state
self.first_byte, self.last_byte = orig_start, orig_end
else: else:
if isinstance(seg_dict['name'], six.text_type): if isinstance(seg_dict['name'], six.text_type):
seg_dict['name'] = seg_dict['name'].encode("utf-8") seg_dict['name'] = seg_dict['name'].encode("utf-8")
yield (seg_dict, yield (seg_dict,
max(0, self.first_byte) + range_start, max(0, first_byte) + range_start,
min(range_end, range_start + self.last_byte)) min(range_end, range_start + last_byte))
self.first_byte -= seg_length first_byte -= seg_length
self.last_byte -= seg_length last_byte -= seg_length
def _need_to_refetch_manifest(self, req): def _need_to_refetch_manifest(self, req):
""" """
@ -692,22 +709,18 @@ class SloGetContext(WSGIContext):
def _manifest_get_response(self, req, content_length, response_headers, def _manifest_get_response(self, req, content_length, response_headers,
segments): segments):
self.first_byte, self.last_byte = None, None
if req.range: if req.range:
byteranges = req.range.ranges_for_length(content_length) byteranges = [
if len(byteranges) == 0:
return HTTPRequestedRangeNotSatisfiable(request=req)
elif len(byteranges) == 1:
self.first_byte, self.last_byte = byteranges[0]
# For some reason, swob.Range.ranges_for_length adds 1 to the # For some reason, swob.Range.ranges_for_length adds 1 to the
# last byte's position. # last byte's position.
self.last_byte -= 1 (start, end - 1) for start, end
else: in req.range.ranges_for_length(content_length)]
req.range = None else:
byteranges = []
ver, account, _junk = req.split_path(3, 3, rest_with_last=True) ver, account, _junk = req.split_path(3, 3, rest_with_last=True)
plain_listing_iter = self._segment_listing_iterator( plain_listing_iter = self._segment_listing_iterator(
req, ver, account, segments) req, ver, account, segments, byteranges)
def is_small_segment((seg_dict, start_byte, end_byte)): def is_small_segment((seg_dict, start_byte, end_byte)):
start = 0 if start_byte is None else start_byte start = 0 if start_byte is None else start_byte

View File

@ -35,11 +35,11 @@ from swift.common.constraints import FORMAT2CONTENT_TYPE
from swift.common.exceptions import ListingIterError, SegmentError from swift.common.exceptions import ListingIterError, SegmentError
from swift.common.http import is_success from swift.common.http import is_success
from swift.common.swob import HTTPBadRequest, HTTPNotAcceptable, \ from swift.common.swob import HTTPBadRequest, HTTPNotAcceptable, \
HTTPServiceUnavailable, Range, is_chunked HTTPServiceUnavailable, Range, is_chunked, multi_range_iterator
from swift.common.utils import split_path, validate_device_partition, \ from swift.common.utils import split_path, validate_device_partition, \
close_if_possible, maybe_multipart_byteranges_to_document_iters, \ close_if_possible, maybe_multipart_byteranges_to_document_iters, \
multipart_byteranges_to_document_iters, parse_content_type, \ multipart_byteranges_to_document_iters, parse_content_type, \
parse_content_range, csv_append, list_from_csv parse_content_range, csv_append, list_from_csv, Spliterator
from swift.common.wsgi import make_subrequest from swift.common.wsgi import make_subrequest
@ -520,6 +520,25 @@ class SegmentedIterable(object):
""" """
return self return self
def app_iter_ranges(self, ranges, content_type, boundary, content_size):
"""
This method assumes that iter(self) yields all the data bytes that
go into the response, but none of the MIME stuff. For example, if
the response will contain three MIME docs with data "abcd", "efgh",
and "ijkl", then iter(self) will give out the bytes "abcdefghijkl".
This method inserts the MIME stuff around the data bytes.
"""
si = Spliterator(self)
mri = multi_range_iterator(
ranges, content_type, boundary, content_size,
lambda start, end_plus_one: si.take(end_plus_one - start))
try:
for x in mri:
yield x
finally:
self.close()
def validate_first_segment(self): def validate_first_segment(self):
""" """
Start fetching object data to ensure that the first segment (if any) is Start fetching object data to ensure that the first segment (if any) is

View File

@ -1245,9 +1245,9 @@ class Response(object):
ranges = self.request.range.ranges_for_length(self.content_length) ranges = self.request.range.ranges_for_length(self.content_length)
if ranges == []: if ranges == []:
self.status = 416 self.status = 416
self.content_length = 0
close_if_possible(app_iter) close_if_possible(app_iter)
return [''] body = None
app_iter = None
elif ranges: elif ranges:
range_size = len(ranges) range_size = len(ranges)
if range_size > 0: if range_size > 0:

View File

@ -3292,6 +3292,80 @@ class LRUCache(object):
return LRUCacheWrapped() return LRUCacheWrapped()
class Spliterator(object):
"""
Takes an iterator yielding sliceable things (e.g. strings or lists) and
yields subiterators, each yielding up to the requested number of items
from the source.
>>> si = Spliterator(["abcde", "fg", "hijkl"])
>>> ''.join(si.take(4))
"abcd"
>>> ''.join(si.take(3))
"efg"
>>> ''.join(si.take(1))
"h"
>>> ''.join(si.take(3))
"ijk"
>>> ''.join(si.take(3))
"l" # shorter than requested; this can happen with the last iterator
"""
def __init__(self, source_iterable):
self.input_iterator = iter(source_iterable)
self.leftovers = None
self.leftovers_index = 0
self._iterator_in_progress = False
def take(self, n):
if self._iterator_in_progress:
raise ValueError("cannot call take() again until the first"
" iterator is exhausted")
self._iterator_in_progress = True
try:
if self.leftovers:
# All this string slicing is a little awkward, but it's for
# a good reason. Consider a length N string that someone is
# taking k bytes at a time.
#
# With this implementation, we create one new string of
# length k (copying the bytes) on each call to take(). Once
# the whole input has been consumed, each byte has been
# copied exactly once, giving O(N) bytes copied.
#
# If, instead of this, we were to set leftovers =
# leftovers[k:] and omit leftovers_index, then each call to
# take() would copy k bytes to create the desired substring,
# then copy all the remaining bytes to reset leftovers,
# resulting in an overall O(N^2) bytes copied.
llen = len(self.leftovers) - self.leftovers_index
if llen <= n:
n -= llen
yield self.leftovers[self.leftovers_index:]
self.leftovers = None
self.leftovers_index = 0
else:
yield self.leftovers[
self.leftovers_index:(self.leftovers_index + n)]
self.leftovers_index += n
n = 0
while n > 0:
chunk = next(self.input_iterator)
cl = len(chunk)
if cl <= n:
n -= cl
yield chunk
else:
yield chunk[:n]
self.leftovers = chunk
self.leftovers_index = n
n = 0
finally:
self._iterator_in_progress = False
def tpool_reraise(func, *args, **kwargs): def tpool_reraise(func, *args, **kwargs):
""" """
Hack to work around Eventlet's tpool not catching and reraising Timeouts. Hack to work around Eventlet's tpool not catching and reraising Timeouts.

View File

@ -3097,6 +3097,34 @@ class TestSlo(Base):
self.assertEqual('b', file_contents[-2]) self.assertEqual('b', file_contents[-2])
self.assertEqual('c', file_contents[-1]) self.assertEqual('c', file_contents[-1])
def test_slo_multi_ranged_get(self):
file_item = self.env.container.file('manifest-abcde')
file_contents = file_item.read(
hdrs={"Range": "bytes=1048571-1048580,2097147-2097156"})
# See testMultiRangeGets for explanation
parser = email.parser.FeedParser()
parser.feed("Content-Type: %s\r\n\r\n" % file_item.content_type)
parser.feed(file_contents)
root_message = parser.close()
self.assertTrue(root_message.is_multipart()) # sanity check
byteranges = root_message.get_payload()
self.assertEqual(len(byteranges), 2)
self.assertEqual(byteranges[0]['Content-Type'],
"application/octet-stream")
self.assertEqual(
byteranges[0]['Content-Range'], "bytes 1048571-1048580/4194305")
self.assertEqual(byteranges[0].get_payload(), "aaaaabbbbb")
self.assertEqual(byteranges[1]['Content-Type'],
"application/octet-stream")
self.assertEqual(
byteranges[1]['Content-Range'], "bytes 2097147-2097156/4194305")
self.assertEqual(byteranges[1].get_payload(), "bbbbbccccc")
def test_slo_ranged_submanifest(self): def test_slo_ranged_submanifest(self):
file_item = self.env.container.file('manifest-abcde-submanifest') file_item = self.env.container.file('manifest-abcde-submanifest')
file_contents = file_item.read(size=1024 * 1024 + 2, file_contents = file_item.read(size=1024 * 1024 + 2,

View File

@ -22,12 +22,14 @@ import time
import unittest import unittest
from mock import patch from mock import patch
from hashlib import md5 from hashlib import md5
from StringIO import StringIO
from swift.common import swob, utils from swift.common import swob, utils
from swift.common.exceptions import ListingIterError, SegmentError from swift.common.exceptions import ListingIterError, SegmentError
from swift.common.header_key_dict import HeaderKeyDict from swift.common.header_key_dict import HeaderKeyDict
from swift.common.middleware import slo from swift.common.middleware import slo
from swift.common.swob import Request, HTTPException from swift.common.swob import Request, HTTPException
from swift.common.utils import quote, closing_if_possible, close_if_possible from swift.common.utils import quote, closing_if_possible, close_if_possible, \
parse_content_type, iter_multipart_mime_documents, parse_mime_headers
from test.unit.common.middleware.helpers import FakeSwift from test.unit.common.middleware.helpers import FakeSwift
@ -1735,6 +1737,116 @@ class TestSloGetManifest(SloTestCase):
self.assertEqual(self.app.swift_sources[1:], self.assertEqual(self.app.swift_sources[1:],
['SLO'] * (len(self.app.swift_sources) - 1)) ['SLO'] * (len(self.app.swift_sources) - 1))
def test_multiple_ranges_get_manifest(self):
req = Request.blank(
'/v1/AUTH_test/gettest/manifest-abcd',
environ={'REQUEST_METHOD': 'GET'},
headers={'Range': 'bytes=3-17,20-24,35-999999'})
status, headers, body = self.call_slo(req)
headers = HeaderKeyDict(headers)
self.assertEqual(status, '206 Partial Content')
ct, params = parse_content_type(headers['Content-Type'])
params = dict(params)
self.assertEqual(ct, 'multipart/byteranges')
boundary = params.get('boundary')
self.assertTrue(boundary is not None)
self.assertEqual(len(body), int(headers['Content-Length']))
got_mime_docs = []
for mime_doc_fh in iter_multipart_mime_documents(
StringIO(body), boundary):
headers = parse_mime_headers(mime_doc_fh)
body = mime_doc_fh.read()
got_mime_docs.append((headers, body))
self.assertEqual(len(got_mime_docs), 3)
first_range_headers = got_mime_docs[0][0]
first_range_body = got_mime_docs[0][1]
self.assertEqual(first_range_headers['Content-Range'],
'bytes 3-17/50')
self.assertEqual(first_range_headers['Content-Type'],
'application/json')
self.assertEqual(first_range_body, 'aabbbbbbbbbbccc')
second_range_headers = got_mime_docs[1][0]
second_range_body = got_mime_docs[1][1]
self.assertEqual(second_range_headers['Content-Range'],
'bytes 20-24/50')
self.assertEqual(second_range_headers['Content-Type'],
'application/json')
self.assertEqual(second_range_body, 'ccccc')
third_range_headers = got_mime_docs[2][0]
third_range_body = got_mime_docs[2][1]
self.assertEqual(third_range_headers['Content-Range'],
'bytes 35-49/50')
self.assertEqual(third_range_headers['Content-Type'],
'application/json')
self.assertEqual(third_range_body, 'ddddddddddddddd')
self.assertEqual(
self.app.calls,
[('GET', '/v1/AUTH_test/gettest/manifest-abcd'),
('GET', '/v1/AUTH_test/gettest/manifest-abcd'),
('GET', '/v1/AUTH_test/gettest/manifest-bc'),
('GET', '/v1/AUTH_test/gettest/a_5?multipart-manifest=get'),
('GET', '/v1/AUTH_test/gettest/b_10?multipart-manifest=get'),
('GET', '/v1/AUTH_test/gettest/c_15?multipart-manifest=get'),
('GET', '/v1/AUTH_test/gettest/d_20?multipart-manifest=get')])
ranges = [c[2].get('Range') for c in self.app.calls_with_headers]
self.assertEqual(ranges, [
'bytes=3-17,20-24,35-999999', # initial GET
None, # re-fetch top-level manifest
None, # fetch manifest-bc as sub-slo
'bytes=3-', # a_5
None, # b_10
'bytes=0-2,5-9', # c_15
'bytes=5-']) # d_20
# we set swift.source for everything but the first request
self.assertIsNone(self.app.swift_sources[0])
self.assertEqual(self.app.swift_sources[1:],
['SLO'] * (len(self.app.swift_sources) - 1))
def test_multiple_ranges_including_suffix_get_manifest(self):
req = Request.blank(
'/v1/AUTH_test/gettest/manifest-abcd',
environ={'REQUEST_METHOD': 'GET'},
headers={'Range': 'bytes=3-17,-21'})
status, headers, body = self.call_slo(req)
headers = HeaderKeyDict(headers)
self.assertEqual(status, '206 Partial Content')
ct, params = parse_content_type(headers['Content-Type'])
params = dict(params)
self.assertEqual(ct, 'multipart/byteranges')
boundary = params.get('boundary')
self.assertTrue(boundary is not None)
got_mime_docs = []
for mime_doc_fh in iter_multipart_mime_documents(
StringIO(body), boundary):
headers = parse_mime_headers(mime_doc_fh)
body = mime_doc_fh.read()
got_mime_docs.append((headers, body))
self.assertEqual(len(got_mime_docs), 2)
first_range_headers = got_mime_docs[0][0]
first_range_body = got_mime_docs[0][1]
self.assertEqual(first_range_headers['Content-Range'],
'bytes 3-17/50')
self.assertEqual(first_range_body, 'aabbbbbbbbbbccc')
second_range_headers = got_mime_docs[1][0]
second_range_body = got_mime_docs[1][1]
self.assertEqual(second_range_headers['Content-Range'],
'bytes 29-49/50')
self.assertEqual(second_range_body, 'cdddddddddddddddddddd')
def test_range_get_includes_whole_manifest(self): def test_range_get_includes_whole_manifest(self):
# If the first range GET results in retrieval of the entire manifest # If the first range GET results in retrieval of the entire manifest
# body (which we can detect by looking at Content-Range), then we # body (which we can detect by looking at Content-Range), then we
@ -1924,21 +2036,6 @@ class TestSloGetManifest(SloTestCase):
status, headers, body = self.call_slo(req) status, headers, body = self.call_slo(req)
self.assertEqual(status, '416 Requested Range Not Satisfiable') self.assertEqual(status, '416 Requested Range Not Satisfiable')
def test_multi_range_get_manifest(self):
# SLO doesn't support multi-range GETs. The way that you express
# "unsupported" in HTTP is to return a 200 and the whole entity.
req = Request.blank(
'/v1/AUTH_test/gettest/manifest-abcd',
environ={'REQUEST_METHOD': 'GET'},
headers={'Range': 'bytes=0-0,2-2'})
status, headers, body = self.call_slo(req)
headers = HeaderKeyDict(headers)
self.assertEqual(status, '200 OK')
self.assertEqual(headers['Content-Length'], '50')
self.assertEqual(
body, 'aaaaabbbbbbbbbbcccccccccccccccdddddddddddddddddddd')
def test_get_segment_with_non_ascii_path(self): def test_get_segment_with_non_ascii_path(self):
segment_body = u"a møøse once bit my sister".encode("utf-8") segment_body = u"a møøse once bit my sister".encode("utf-8")
self.app.register( self.app.register(
@ -2027,11 +2124,9 @@ class TestSloGetManifest(SloTestCase):
('GET', '/v1/AUTH_test/gettest/manifest-bc-ranges'), ('GET', '/v1/AUTH_test/gettest/manifest-bc-ranges'),
('GET', '/v1/AUTH_test/gettest/a_5?multipart-manifest=get'), ('GET', '/v1/AUTH_test/gettest/a_5?multipart-manifest=get'),
('GET', '/v1/AUTH_test/gettest/c_15?multipart-manifest=get'), ('GET', '/v1/AUTH_test/gettest/c_15?multipart-manifest=get'),
('GET', '/v1/AUTH_test/gettest/manifest-bc-ranges'),
('GET', '/v1/AUTH_test/gettest/d_20?multipart-manifest=get'), ('GET', '/v1/AUTH_test/gettest/d_20?multipart-manifest=get'),
('GET', '/v1/AUTH_test/gettest/c_15?multipart-manifest=get'), ('GET', '/v1/AUTH_test/gettest/c_15?multipart-manifest=get'),
('GET', '/v1/AUTH_test/gettest/b_10?multipart-manifest=get'), ('GET', '/v1/AUTH_test/gettest/b_10?multipart-manifest=get'),
('GET', '/v1/AUTH_test/gettest/manifest-bc-ranges'),
('GET', '/v1/AUTH_test/gettest/a_5?multipart-manifest=get'), ('GET', '/v1/AUTH_test/gettest/a_5?multipart-manifest=get'),
('GET', '/v1/AUTH_test/gettest/b_10?multipart-manifest=get'), ('GET', '/v1/AUTH_test/gettest/b_10?multipart-manifest=get'),
('GET', '/v1/AUTH_test/gettest/d_20?multipart-manifest=get')]) ('GET', '/v1/AUTH_test/gettest/d_20?multipart-manifest=get')])
@ -2043,11 +2138,9 @@ class TestSloGetManifest(SloTestCase):
None, None,
'bytes=3-', 'bytes=3-',
'bytes=0-2', 'bytes=0-2',
None,
'bytes=11-11', 'bytes=11-11',
'bytes=13-', 'bytes=13-',
'bytes=4-6', 'bytes=4-6',
None,
'bytes=0-0', 'bytes=0-0',
'bytes=4-5', 'bytes=4-5',
'bytes=0-2']) 'bytes=0-2'])
@ -2114,11 +2207,9 @@ class TestSloGetManifest(SloTestCase):
('GET', '/v1/AUTH_test/gettest/manifest-abcd-ranges'), ('GET', '/v1/AUTH_test/gettest/manifest-abcd-ranges'),
('GET', '/v1/AUTH_test/gettest/manifest-bc-ranges'), ('GET', '/v1/AUTH_test/gettest/manifest-bc-ranges'),
('GET', '/v1/AUTH_test/gettest/c_15?multipart-manifest=get'), ('GET', '/v1/AUTH_test/gettest/c_15?multipart-manifest=get'),
('GET', '/v1/AUTH_test/gettest/manifest-bc-ranges'),
('GET', '/v1/AUTH_test/gettest/d_20?multipart-manifest=get'), ('GET', '/v1/AUTH_test/gettest/d_20?multipart-manifest=get'),
('GET', '/v1/AUTH_test/gettest/c_15?multipart-manifest=get'), ('GET', '/v1/AUTH_test/gettest/c_15?multipart-manifest=get'),
('GET', '/v1/AUTH_test/gettest/b_10?multipart-manifest=get'), ('GET', '/v1/AUTH_test/gettest/b_10?multipart-manifest=get'),
('GET', '/v1/AUTH_test/gettest/manifest-bc-ranges'),
('GET', '/v1/AUTH_test/gettest/a_5?multipart-manifest=get'), ('GET', '/v1/AUTH_test/gettest/a_5?multipart-manifest=get'),
('GET', '/v1/AUTH_test/gettest/b_10?multipart-manifest=get')]) ('GET', '/v1/AUTH_test/gettest/b_10?multipart-manifest=get')])
@ -2129,11 +2220,9 @@ class TestSloGetManifest(SloTestCase):
None, None,
None, None,
'bytes=2-2', 'bytes=2-2',
None,
'bytes=11-11', 'bytes=11-11',
'bytes=13-', 'bytes=13-',
'bytes=4-6', 'bytes=4-6',
None,
'bytes=0-0', 'bytes=0-0',
'bytes=4-4']) 'bytes=4-4'])
# we set swift.source for everything but the first request # we set swift.source for everything but the first request
@ -2180,23 +2269,6 @@ class TestSloGetManifest(SloTestCase):
self.assertEqual(self.app.swift_sources[1:], self.assertEqual(self.app.swift_sources[1:],
['SLO'] * (len(self.app.swift_sources) - 1)) ['SLO'] * (len(self.app.swift_sources) - 1))
def test_multi_range_get_range_manifest(self):
# SLO doesn't support multi-range GETs. The way that you express
# "unsupported" in HTTP is to return a 200 and the whole entity.
req = Request.blank(
'/v1/AUTH_test/gettest/manifest-abcd-ranges',
environ={'REQUEST_METHOD': 'GET'},
headers={'Range': 'bytes=0-0,2-2'})
status, headers, body = self.call_slo(req)
headers = HeaderKeyDict(headers)
self.assertEqual(status, '200 OK')
self.assertEqual(headers['Content-Type'], 'application/json')
self.assertEqual(body, 'aaaaaaaaccccccccbbbbbbbbdddddddd')
self.assertNotIn('Transfer-Encoding', headers)
self.assertNotIn('Content-Range', headers)
self.assertEqual(headers['Content-Length'], '32')
def test_get_bogus_manifest(self): def test_get_bogus_manifest(self):
req = Request.blank( req = Request.blank(
'/v1/AUTH_test/gettest/manifest-badjson', '/v1/AUTH_test/gettest/manifest-badjson',

View File

@ -1298,16 +1298,16 @@ class TestResponse(unittest.TestCase):
resp = req.get_response(test_app) resp = req.get_response(test_app)
resp.conditional_response = True resp.conditional_response = True
body = ''.join(resp([], start_response)) body = ''.join(resp([], start_response))
self.assertEqual(body, '') self.assertIn('The Range requested is not available', body)
self.assertEqual(resp.content_length, 0) self.assertEqual(resp.content_length, len(body))
self.assertEqual(resp.status, '416 Requested Range Not Satisfiable') self.assertEqual(resp.status, '416 Requested Range Not Satisfiable')
resp = swift.common.swob.Response( resp = swift.common.swob.Response(
body='1234567890', request=req, body='1234567890', request=req,
conditional_response=True) conditional_response=True)
body = ''.join(resp([], start_response)) body = ''.join(resp([], start_response))
self.assertEqual(body, '') self.assertIn('The Range requested is not available', body)
self.assertEqual(resp.content_length, 0) self.assertEqual(resp.content_length, len(body))
self.assertEqual(resp.status, '416 Requested Range Not Satisfiable') self.assertEqual(resp.status, '416 Requested Range Not Satisfiable')
# Syntactically-invalid Range headers "MUST" be ignored # Syntactically-invalid Range headers "MUST" be ignored

View File

@ -5335,6 +5335,68 @@ class TestLRUCache(unittest.TestCase):
self.assertEqual(f.size(), 4) self.assertEqual(f.size(), 4)
class TestSpliterator(unittest.TestCase):
def test_string(self):
input_chunks = ["coun", "ter-", "b", "ra", "nch-mater",
"nit", "y-fungusy", "-nummular"]
si = utils.Spliterator(input_chunks)
self.assertEqual(''.join(si.take(8)), "counter-")
self.assertEqual(''.join(si.take(7)), "branch-")
self.assertEqual(''.join(si.take(10)), "maternity-")
self.assertEqual(''.join(si.take(8)), "fungusy-")
self.assertEqual(''.join(si.take(8)), "nummular")
def test_big_input_string(self):
input_chunks = ["iridium"]
si = utils.Spliterator(input_chunks)
self.assertEqual(''.join(si.take(2)), "ir")
self.assertEqual(''.join(si.take(1)), "i")
self.assertEqual(''.join(si.take(2)), "di")
self.assertEqual(''.join(si.take(1)), "u")
self.assertEqual(''.join(si.take(1)), "m")
def test_chunk_boundaries(self):
input_chunks = ["soylent", "green", "is", "people"]
si = utils.Spliterator(input_chunks)
self.assertEqual(''.join(si.take(7)), "soylent")
self.assertEqual(''.join(si.take(5)), "green")
self.assertEqual(''.join(si.take(2)), "is")
self.assertEqual(''.join(si.take(6)), "people")
def test_no_empty_strings(self):
input_chunks = ["soylent", "green", "is", "people"]
si = utils.Spliterator(input_chunks)
outputs = (list(si.take(7)) # starts and ends on chunk boundary
+ list(si.take(2)) # spans two chunks
+ list(si.take(3)) # begins but does not end chunk
+ list(si.take(2)) # ends but does not begin chunk
+ list(si.take(6))) # whole chunk + EOF
self.assertNotIn('', outputs)
def test_running_out(self):
input_chunks = ["not much"]
si = utils.Spliterator(input_chunks)
self.assertEqual(''.join(si.take(4)), "not ")
self.assertEqual(''.join(si.take(99)), "much") # short
self.assertEqual(''.join(si.take(4)), "")
self.assertEqual(''.join(si.take(4)), "")
def test_overlap(self):
input_chunks = ["one fish", "two fish", "red fish", "blue fish"]
si = utils.Spliterator(input_chunks)
t1 = si.take(20) # longer than first chunk
self.assertLess(len(next(t1)), 20) # it's not exhausted
t2 = si.take(20)
self.assertRaises(ValueError, next, t2)
class TestParseContentRange(unittest.TestCase): class TestParseContentRange(unittest.TestCase):
def test_good(self): def test_good(self):
start, end, total = utils.parse_content_range("bytes 100-200/300") start, end, total = utils.parse_content_range("bytes 100-200/300")