Merge "add bytes of expiring objects to queue entry"

This commit is contained in:
Zuul 2024-06-14 20:29:12 +00:00 committed by Gerrit Code Review
commit 46e183df15
6 changed files with 804 additions and 35 deletions

View File

@ -29,7 +29,8 @@ from swift.common.daemon import Daemon
from swift.common.internal_client import InternalClient, UnexpectedResponse from swift.common.internal_client import InternalClient, UnexpectedResponse
from swift.common.utils import get_logger, dump_recon_cache, split_path, \ from swift.common.utils import get_logger, dump_recon_cache, split_path, \
Timestamp, config_true_value, normalize_delete_at_timestamp, \ Timestamp, config_true_value, normalize_delete_at_timestamp, \
RateLimitedIterator, md5, non_negative_float, non_negative_int RateLimitedIterator, md5, non_negative_float, non_negative_int, \
parse_content_type
from swift.common.http import HTTP_NOT_FOUND, HTTP_CONFLICT, \ from swift.common.http import HTTP_NOT_FOUND, HTTP_CONFLICT, \
HTTP_PRECONDITION_FAILED HTTP_PRECONDITION_FAILED
from swift.common.recon import RECON_OBJECT_FILE, DEFAULT_RECON_CACHE_PATH from swift.common.recon import RECON_OBJECT_FILE, DEFAULT_RECON_CACHE_PATH
@ -37,6 +38,7 @@ from swift.common.recon import RECON_OBJECT_FILE, DEFAULT_RECON_CACHE_PATH
from swift.container.reconciler import direct_delete_container_entry from swift.container.reconciler import direct_delete_container_entry
MAX_OBJECTS_TO_CACHE = 100000 MAX_OBJECTS_TO_CACHE = 100000
X_DELETE_TYPE = 'text/plain'
ASYNC_DELETE_TYPE = 'application/async-deleted' ASYNC_DELETE_TYPE = 'application/async-deleted'
@ -67,6 +69,37 @@ def parse_task_obj(task_obj):
return timestamp, target_account, target_container, target_obj return timestamp, target_account, target_container, target_obj
def extract_expirer_bytes_from_ctype(content_type):
"""
Parse a content-type and return the number of bytes.
:param content_type: a content-type string
:return: int or None
"""
content_type, params = parse_content_type(content_type)
bytes_size = None
for k, v in params:
if k == 'swift_expirer_bytes':
bytes_size = int(v)
return bytes_size
def embed_expirer_bytes_in_ctype(content_type, metadata):
"""
Embed number of bytes into content-type. The bytes should come from
content-length on regular objects, but future extensions to "bytes in
expirer queue" monitoring may want to more closely consider expiration of
large multipart object manifests.
:param content_type: a content-type string
:param metadata: a dict, from Diskfile metadata
:return: str
"""
# as best I can tell this key is required by df.open
report_bytes = metadata['Content-Length']
return "%s;swift_expirer_bytes=%d" % (content_type, int(report_bytes))
def read_conf_for_delay_reaping_times(conf): def read_conf_for_delay_reaping_times(conf):
delay_reaping_times = {} delay_reaping_times = {}
for conf_key in conf: for conf_key in conf:

View File

@ -59,7 +59,8 @@ from swift.common.swob import HTTPAccepted, HTTPBadRequest, HTTPCreated, \
HTTPInsufficientStorage, HTTPForbidden, HTTPException, HTTPConflict, \ HTTPInsufficientStorage, HTTPForbidden, HTTPException, HTTPConflict, \
HTTPServerError, bytes_to_wsgi, wsgi_to_bytes, wsgi_to_str, normalize_etag HTTPServerError, bytes_to_wsgi, wsgi_to_bytes, wsgi_to_str, normalize_etag
from swift.obj.diskfile import RESERVED_DATAFILE_META, DiskFileRouter from swift.obj.diskfile import RESERVED_DATAFILE_META, DiskFileRouter
from swift.obj.expirer import build_task_obj from swift.obj.expirer import build_task_obj, embed_expirer_bytes_in_ctype, \
X_DELETE_TYPE
def iter_mime_headers_and_bodies(wsgi_input, mime_boundary, read_chunk_size): def iter_mime_headers_and_bodies(wsgi_input, mime_boundary, read_chunk_size):
@ -437,7 +438,7 @@ class ObjectController(BaseStorageServer):
self.container_update_timeout, updates) self.container_update_timeout, updates)
def delete_at_update(self, op, delete_at, account, container, obj, def delete_at_update(self, op, delete_at, account, container, obj,
request, objdevice, policy): request, objdevice, policy, extra_headers=None):
""" """
Update the expiring objects container when objects are updated. Update the expiring objects container when objects are updated.
@ -449,6 +450,7 @@ class ObjectController(BaseStorageServer):
:param request: the original request driving the update :param request: the original request driving the update
:param objdevice: device name that the object is in :param objdevice: device name that the object is in
:param policy: the BaseStoragePolicy instance (used for tmp dir) :param policy: the BaseStoragePolicy instance (used for tmp dir)
:param extra_headers: dict of additional headers for the update
""" """
if config_true_value( if config_true_value(
request.headers.get('x-backend-replication', 'f')): request.headers.get('x-backend-replication', 'f')):
@ -494,8 +496,10 @@ class ObjectController(BaseStorageServer):
if not updates: if not updates:
updates = [(None, None)] updates = [(None, None)]
headers_out['x-size'] = '0' headers_out['x-size'] = '0'
headers_out['x-content-type'] = 'text/plain' headers_out['x-content-type'] = X_DELETE_TYPE
headers_out['x-etag'] = 'd41d8cd98f00b204e9800998ecf8427e' headers_out['x-etag'] = 'd41d8cd98f00b204e9800998ecf8427e'
if extra_headers:
headers_out.update(extra_headers)
else: else:
if not config_true_value( if not config_true_value(
request.headers.get( request.headers.get(
@ -620,6 +624,24 @@ class ObjectController(BaseStorageServer):
override = key.lower().replace(override_prefix, 'x-') override = key.lower().replace(override_prefix, 'x-')
update_headers[override] = val update_headers[override] = val
def _conditional_delete_at_update(self, request, device, account,
container, obj, policy, metadata,
orig_delete_at, new_delete_at):
if new_delete_at:
extra_headers = {
'x-content-type': embed_expirer_bytes_in_ctype(
X_DELETE_TYPE, metadata),
'x-content-type-timestamp':
metadata.get('X-Timestamp'),
}
self.delete_at_update(
'PUT', new_delete_at, account, container, obj, request,
device, policy, extra_headers)
if orig_delete_at and orig_delete_at != new_delete_at:
self.delete_at_update(
'DELETE', orig_delete_at, account, container, obj,
request, device, policy)
@public @public
@timing_stats() @timing_stats()
def POST(self, request): def POST(self, request):
@ -675,15 +697,11 @@ class ObjectController(BaseStorageServer):
wsgi_to_bytes(header_key).title()) wsgi_to_bytes(header_key).title())
metadata[header_caps] = request.headers[header_key] metadata[header_caps] = request.headers[header_key]
orig_delete_at = int(orig_metadata.get('X-Delete-At') or 0) orig_delete_at = int(orig_metadata.get('X-Delete-At') or 0)
if orig_delete_at != new_delete_at: disk_file_metadata = disk_file.get_datafile_metadata()
if new_delete_at: self._conditional_delete_at_update(
self.delete_at_update( request, device, account, container, obj, policy,
'PUT', new_delete_at, account, container, obj, request, disk_file_metadata, orig_delete_at, new_delete_at
device, policy) )
if orig_delete_at:
self.delete_at_update('DELETE', orig_delete_at, account,
container, obj, request, device,
policy)
else: else:
# preserve existing metadata, only content-type may be updated # preserve existing metadata, only content-type may be updated
metadata = dict(disk_file.get_metafile_metadata()) metadata = dict(disk_file.get_metafile_metadata())
@ -993,15 +1011,10 @@ class ObjectController(BaseStorageServer):
orig_metadata, footers_metadata, metadata): orig_metadata, footers_metadata, metadata):
orig_delete_at = int(orig_metadata.get('X-Delete-At') or 0) orig_delete_at = int(orig_metadata.get('X-Delete-At') or 0)
new_delete_at = int(request.headers.get('X-Delete-At') or 0) new_delete_at = int(request.headers.get('X-Delete-At') or 0)
if orig_delete_at != new_delete_at:
if new_delete_at: self._conditional_delete_at_update(request, device, account, container,
self.delete_at_update( obj, policy, metadata,
'PUT', new_delete_at, account, container, obj, request, orig_delete_at, new_delete_at)
device, policy)
if orig_delete_at:
self.delete_at_update(
'DELETE', orig_delete_at, account, container, obj,
request, device, policy)
update_headers = HeaderKeyDict({ update_headers = HeaderKeyDict({
'x-size': metadata['Content-Length'], 'x-size': metadata['Content-Length'],
@ -1262,10 +1275,10 @@ class ObjectController(BaseStorageServer):
else: else:
# differentiate success from no object at all # differentiate success from no object at all
response_class = HTTPNoContent response_class = HTTPNoContent
if orig_delete_at: self._conditional_delete_at_update(
self.delete_at_update('DELETE', orig_delete_at, account, request, device, account, container, obj, policy, {},
container, obj, request, device, orig_delete_at, 0
policy) )
if orig_timestamp < req_timestamp: if orig_timestamp < req_timestamp:
try: try:
disk_file.delete(req_timestamp) disk_file.delete(req_timestamp)

View File

@ -12,6 +12,7 @@
# See the License for the specific language governing permissions and # See the License for the specific language governing permissions and
# limitations under the License. # limitations under the License.
from collections import Counter
import json import json
import random import random
import time import time
@ -22,6 +23,8 @@ from io import BytesIO
from swift.common.internal_client import InternalClient, UnexpectedResponse from swift.common.internal_client import InternalClient, UnexpectedResponse
from swift.common.manager import Manager from swift.common.manager import Manager
from swift.common.utils import Timestamp, config_true_value from swift.common.utils import Timestamp, config_true_value
from swift.common import direct_client
from swift.obj.expirer import extract_expirer_bytes_from_ctype
from test.probe.common import ReplProbeTest, ENABLED_POLICIES from test.probe.common import ReplProbeTest, ENABLED_POLICIES
from test.probe.brain import BrainSplitter from test.probe.brain import BrainSplitter
@ -472,6 +475,142 @@ class TestObjectExpirer(ReplProbeTest):
headers={'X-Backend-Open-Expired': True}) headers={'X-Backend-Open-Expired': True})
self.assertEqual(e.exception.resp.status_int, 404) self.assertEqual(e.exception.resp.status_int, 404)
def test_expirer_object_bytes_eventual_consistency(self):
obj_brain = BrainSplitter(self.url, self.token, self.container_name,
self.object_name, 'object', self.policy)
obj_brain.put_container()
def put_object(content_length=0):
try:
self.client.upload_object(BytesIO(bytes(content_length)),
self.account, self.container_name,
self.object_name)
except UnexpectedResponse as e:
self.fail(
'Expected 201 for PUT object but got %s' % e.resp.status)
t0_content_length = 24
put_object(content_length=t0_content_length)
try:
metadata = self.client.get_object_metadata(
self.account, self.container_name, self.object_name)
except UnexpectedResponse as e:
self.fail(
'Expected 200 for HEAD object but got %s' % e.resp.status)
assert metadata['content-length'] == str(t0_content_length)
t0 = metadata['x-timestamp']
obj_brain.stop_primary_half()
t1_content_length = 32
put_object(content_length=t1_content_length)
try:
metadata = self.client.get_object_metadata(
self.account, self.container_name, self.object_name)
except UnexpectedResponse as e:
self.fail(
'Expected 200 for HEAD object but got %s' % e.resp.status)
assert metadata['content-length'] == str(t1_content_length)
t1 = metadata['x-timestamp']
# some object servers recovered
obj_brain.start_primary_half()
head_responses = []
for node in obj_brain.ring.devs:
metadata = direct_client.direct_head_object(
node, obj_brain.part, self.account, self.container_name,
self.object_name)
head_responses.append(metadata)
timestamp_counts = Counter([
resp['X-Timestamp'] for resp in head_responses
])
expected_counts = {t0: 2, t1: 2}
self.assertEqual(expected_counts, timestamp_counts)
# Do a POST to update object metadata (timestamp x-delete-at)
# POST will create an expiry queue entry with 2 landing on t0, 1 on t1
self.client.set_object_metadata(
self.account, self.container_name, self.object_name,
metadata={'X-Delete-After': '5'}, acceptable_statuses=(2,)
)
# Run the container updater once to register new container containing
# expirey queue entry
Manager(['container-updater']).once()
# Find the name of the container containing the expiring object
expiring_containers = list(
self.client.iter_containers('.expiring_objects')
)
self.assertEqual(1, len(expiring_containers))
expiring_container = expiring_containers[0]
expiring_container_name = expiring_container['name']
# Verify that there is one expiring object
expiring_objects = list(
self.client.iter_objects('.expiring_objects',
expiring_container_name)
)
self.assertEqual(1, len(expiring_objects))
# Get the nodes of the expiring container
expiring_container_part_num, expiring_container_nodes = \
self.client.container_ring.get_nodes('.expiring_objects',
expiring_container_name)
# Verify that there are only 3 such nodes
self.assertEqual(3, len(expiring_container_nodes))
listing_records = []
for node in expiring_container_nodes:
metadata, container_data = direct_client.direct_get_container(
node, expiring_container_part_num, '.expiring_objects',
expiring_container_name)
# Verify there is metadata for only one object
self.assertEqual(1, len(container_data))
listing_records.append(container_data[0])
# Check for inconsistent metadata
byte_size_counts = Counter([
extract_expirer_bytes_from_ctype(resp['content_type'])
for resp in listing_records
])
expected_byte_size_counts = {
t0_content_length: 2,
t1_content_length: 1
}
self.assertEqual(expected_byte_size_counts, byte_size_counts)
# Run the replicator to update expirey queue entries
Manager(['container-replicator']).once()
listing_records = []
for node in expiring_container_nodes:
metadata, container_data = direct_client.direct_get_container(
node, expiring_container_part_num, '.expiring_objects',
expiring_container_name)
self.assertEqual(1, len(container_data))
listing_records.append(container_data[0])
# Ensure that metadata is now consistent
byte_size_counts = Counter([
extract_expirer_bytes_from_ctype(resp['content_type'])
for resp in listing_records
])
expected_byte_size_counts = {t1_content_length: 3}
self.assertEqual(expected_byte_size_counts, byte_size_counts)
def _test_expirer_delete_outdated_object_version(self, object_exists): def _test_expirer_delete_outdated_object_version(self, object_exists):
# This test simulates a case where the expirer tries to delete # This test simulates a case where the expirer tries to delete
# an outdated version of an object. # an outdated version of an object.

View File

@ -7179,3 +7179,113 @@ class TestModuleFunctions(unittest.TestCase):
self.assertIn(sr1, to_add) self.assertIn(sr1, to_add)
self.assertIn(sr2, to_add) self.assertIn(sr2, to_add)
self.assertEqual({'a/o'}, to_delete) self.assertEqual({'a/o'}, to_delete)
class TestExpirerBytesCtypeTimestamp(test_db.TestDbBase):
def setUp(self):
super(TestExpirerBytesCtypeTimestamp, self).setUp()
self.ts = make_timestamp_iter()
self.policy = POLICIES.default
def _get_broker(self):
broker = ContainerBroker(self.db_path,
account='.expiring_objects',
container='1234')
broker.initialize(next(self.ts).internal, self.policy.idx)
return broker
def test_in_order_expirer_bytes_ctype(self):
broker = self._get_broker()
put1_ts = next(self.ts)
put2_ts = next(self.ts)
post_ts = next(self.ts)
broker.put_object(
'1234-a/c/o', post_ts.internal, 0,
'text/plain;swift_expirer_bytes=1',
'd41d8cd98f00b204e9800998ecf8427e',
storage_policy_index=self.policy.idx,
ctype_timestamp=put1_ts.internal)
broker.put_object(
'1234-a/c/o', post_ts.internal, 0,
'text/plain;swift_expirer_bytes=2',
'd41d8cd98f00b204e9800998ecf8427e',
storage_policy_index=self.policy.idx,
ctype_timestamp=put2_ts.internal)
self.assertEqual([{
'content_type': 'text/plain;swift_expirer_bytes=2',
'created_at': encode_timestamps(post_ts, put2_ts, put2_ts),
'deleted': 0,
'etag': 'd41d8cd98f00b204e9800998ecf8427e',
'name': '1234-a/c/o',
'size': 0,
'storage_policy_index': self.policy.idx,
}], broker.get_objects())
def test_out_of_order_expirer_bytes_ctype(self):
broker = self._get_broker()
put1_ts = next(self.ts)
put2_ts = next(self.ts)
post_ts = next(self.ts)
broker.put_object(
'1234-a/c/o', post_ts.internal, 0,
'text/plain;swift_expirer_bytes=2',
'd41d8cd98f00b204e9800998ecf8427e',
storage_policy_index=self.policy.idx,
ctype_timestamp=put2_ts.internal)
# order doesn't matter, more recent put2_ts ctype_timestamp wins
broker.put_object(
'1234-a/c/o', post_ts.internal, 0,
'text/plain;swift_expirer_bytes=1',
'd41d8cd98f00b204e9800998ecf8427e',
storage_policy_index=self.policy.idx,
ctype_timestamp=put1_ts.internal)
self.assertEqual([{
'content_type': 'text/plain;swift_expirer_bytes=2',
'created_at': encode_timestamps(post_ts, put2_ts, put2_ts),
'deleted': 0,
'etag': 'd41d8cd98f00b204e9800998ecf8427e',
'name': '1234-a/c/o',
'size': 0,
'storage_policy_index': self.policy.idx,
}], broker.get_objects())
def test_unupgraded_expirer_bytes_ctype(self):
broker = self._get_broker()
put1_ts = next(self.ts)
post_ts = next(self.ts)
broker.put_object(
'1234-a/c/o', post_ts.internal, 0,
'text/plain',
'd41d8cd98f00b204e9800998ecf8427e',
storage_policy_index=self.policy.idx)
# since the un-upgraded server's task creation request arrived w/o a
# ctype_timestamp, the row treats it's ctype timestamp as being the
# same as the x-timestamp that created the row (the post_ts) - which is
# more recent than the put1_ts used as the ctype_timestamp from the
# already-upgraded server
broker.put_object(
'1234-a/c/o', post_ts.internal, 0,
'text/plain;swift_expirer_bytes=1',
'd41d8cd98f00b204e9800998ecf8427e',
storage_policy_index=self.policy.idx,
ctype_timestamp=put1_ts.internal)
# so the un-upgraded row wins
self.assertEqual([{
'content_type': 'text/plain',
'created_at': post_ts,
'deleted': 0,
'etag': 'd41d8cd98f00b204e9800998ecf8427e',
'name': '1234-a/c/o',
'size': 0,
'storage_policy_index': self.policy.idx,
}], broker.get_objects())

View File

@ -14,6 +14,7 @@
# See the License for the specific language governing permissions and # See the License for the specific language governing permissions and
# limitations under the License. # limitations under the License.
import os
from time import time from time import time
from unittest import main, TestCase from unittest import main, TestCase
from test.debug_logger import debug_logger from test.debug_logger import debug_logger
@ -29,7 +30,7 @@ from six.moves import urllib
from swift.common import internal_client, utils, swob from swift.common import internal_client, utils, swob
from swift.common.utils import Timestamp from swift.common.utils import Timestamp
from swift.obj import expirer from swift.obj import expirer, diskfile
def not_random(): def not_random():
@ -95,6 +96,112 @@ class FakeInternalClient(object):
pass pass
class TestExpirerHelpers(TestCase):
def test_add_expirer_bytes_to_ctype(self):
self.assertEqual(
'text/plain;swift_expirer_bytes=10',
expirer.embed_expirer_bytes_in_ctype(
'text/plain', {'Content-Length': 10}))
self.assertEqual(
'text/plain;some_foo=bar;swift_expirer_bytes=10',
expirer.embed_expirer_bytes_in_ctype(
'text/plain;some_foo=bar', {'Content-Length': '10'}))
# you could probably make a case it'd be better to replace an existing
# value if the swift_expirer_bytes key already exists in the content
# type; but in the only case we use this function currently the content
# type is hard coded to text/plain
self.assertEqual(
'text/plain;some_foo=bar;swift_expirer_bytes=10;'
'swift_expirer_bytes=11',
expirer.embed_expirer_bytes_in_ctype(
'text/plain;some_foo=bar;swift_expirer_bytes=10',
{'Content-Length': '11'}))
def test_extract_expirer_bytes_from_ctype(self):
self.assertEqual(10, expirer.extract_expirer_bytes_from_ctype(
'text/plain;swift_expirer_bytes=10'))
self.assertEqual(10, expirer.extract_expirer_bytes_from_ctype(
'text/plain;swift_expirer_bytes=10;some_foo=bar'))
def test_inverse_add_extract_bytes_from_ctype(self):
ctype_bytes = [
('null', 0),
('text/plain', 10),
('application/octet-stream', 42),
('application/json', 512),
('gzip', 1000044),
]
for ctype, expirer_bytes in ctype_bytes:
embedded_ctype = expirer.embed_expirer_bytes_in_ctype(
ctype, {'Content-Length': expirer_bytes})
found_bytes = expirer.extract_expirer_bytes_from_ctype(
embedded_ctype)
self.assertEqual(expirer_bytes, found_bytes)
def test_add_invalid_expirer_bytes_to_ctype(self):
self.assertRaises(TypeError,
expirer.embed_expirer_bytes_in_ctype, 'nill', None)
self.assertRaises(TypeError,
expirer.embed_expirer_bytes_in_ctype, 'bar', 'foo')
self.assertRaises(KeyError,
expirer.embed_expirer_bytes_in_ctype, 'nill', {})
self.assertRaises(TypeError,
expirer.embed_expirer_bytes_in_ctype, 'nill',
{'Content-Length': None})
self.assertRaises(ValueError,
expirer.embed_expirer_bytes_in_ctype, 'nill',
{'Content-Length': 'foo'})
# perhaps could be an error
self.assertEqual(
'weird/float;swift_expirer_bytes=15',
expirer.embed_expirer_bytes_in_ctype('weird/float',
{'Content-Length': 15.9}))
def test_embed_expirer_bytes_from_diskfile_metadata(self):
self.logger = debug_logger('test-expirer')
self.ts = make_timestamp_iter()
self.devices = mkdtemp()
self.conf = {
'mount_check': 'false',
'devices': self.devices,
}
self.df_mgr = diskfile.DiskFileManager(self.conf, logger=self.logger)
utils.mkdirs(os.path.join(self.devices, 'sda1'))
df = self.df_mgr.get_diskfile('sda1', '0', 'a', 'c', 'o', policy=0)
ts = next(self.ts)
with df.create() as writer:
writer.write(b'test')
writer.put({
# wrong key/case here would KeyError
'X-Timestamp': ts.internal,
# wrong key/case here would cause quarantine on read
'Content-Length': '4',
})
metadata = df.read_metadata()
# the Content-Type in the metadata is irrelevant; this method is used
# to create the content_type of an expirer queue task object
embeded_ctype_entry = expirer.embed_expirer_bytes_in_ctype(
'text/plain', metadata)
self.assertEqual('text/plain;swift_expirer_bytes=4',
embeded_ctype_entry)
def test_extract_missing_bytes_from_ctype(self):
self.assertEqual(
None, expirer.extract_expirer_bytes_from_ctype('text/plain'))
self.assertEqual(
None, expirer.extract_expirer_bytes_from_ctype(
'text/plain;swift_bytes=10'))
self.assertEqual(
None, expirer.extract_expirer_bytes_from_ctype(
'text/plain;bytes=21'))
self.assertEqual(
None, expirer.extract_expirer_bytes_from_ctype(
'text/plain;some_foo=bar;other-baz=buz'))
class TestObjectExpirer(TestCase): class TestObjectExpirer(TestCase):
maxDiff = None maxDiff = None
internal_client = None internal_client = None

View File

@ -133,6 +133,15 @@ class TestTpoolSize(unittest.TestCase):
self.assertEqual([], mock_snt.mock_calls) self.assertEqual([], mock_snt.mock_calls)
class SameReqEnv(object):
def __init__(self, req):
self.environ = req.environ
def __eq__(self, other):
return self.environ == other.environ
@patch_policies(test_policies) @patch_policies(test_policies)
class TestObjectController(BaseTestCase): class TestObjectController(BaseTestCase):
"""Test swift.obj.server.ObjectController""" """Test swift.obj.server.ObjectController"""
@ -5704,7 +5713,8 @@ class TestObjectController(BaseTestCase):
'method': 'PUT', 'method': 'PUT',
'ssl': False, 'ssl': False,
'headers': HeaderKeyDict({ 'headers': HeaderKeyDict({
'x-content-type': 'text/plain', 'x-content-type': 'text/plain;swift_expirer_bytes=0',
'x-content-type-timestamp': utils.Timestamp('12345').internal,
'x-etag': 'd41d8cd98f00b204e9800998ecf8427e', 'x-etag': 'd41d8cd98f00b204e9800998ecf8427e',
'x-size': '0', 'x-size': '0',
'x-timestamp': utils.Timestamp('12345').internal, 'x-timestamp': utils.Timestamp('12345').internal,
@ -5724,7 +5734,8 @@ class TestObjectController(BaseTestCase):
'method': 'PUT', 'method': 'PUT',
'ssl': False, 'ssl': False,
'headers': HeaderKeyDict({ 'headers': HeaderKeyDict({
'x-content-type': 'text/plain', 'x-content-type': 'text/plain;swift_expirer_bytes=0',
'x-content-type-timestamp': utils.Timestamp('12345').internal,
'x-etag': 'd41d8cd98f00b204e9800998ecf8427e', 'x-etag': 'd41d8cd98f00b204e9800998ecf8427e',
'x-size': '0', 'x-size': '0',
'x-timestamp': utils.Timestamp('12345').internal, 'x-timestamp': utils.Timestamp('12345').internal,
@ -6867,9 +6878,10 @@ class TestObjectController(BaseTestCase):
self.object_controller.delete_at_update = fake_delete_at_update self.object_controller.delete_at_update = fake_delete_at_update
timestamp0 = normalize_timestamp(time())
req = Request.blank( req = Request.blank(
'/sda1/p/a/c/o', environ={'REQUEST_METHOD': 'PUT'}, '/sda1/p/a/c/o', environ={'REQUEST_METHOD': 'PUT'},
headers={'X-Timestamp': normalize_timestamp(time()), headers={'X-Timestamp': timestamp0,
'Content-Length': '4', 'Content-Length': '4',
'Content-Type': 'application/octet-stream', 'Content-Type': 'application/octet-stream',
'X-Backend-Storage-Policy-Index': int(policy), 'X-Backend-Storage-Policy-Index': int(policy),
@ -6905,7 +6917,10 @@ class TestObjectController(BaseTestCase):
self.assertEqual( self.assertEqual(
given_args, [ given_args, [
'PUT', int(delete_at_timestamp1), 'a', 'c', 'o', 'PUT', int(delete_at_timestamp1), 'a', 'c', 'o',
given_args[5], 'sda1', policy]) given_args[5], 'sda1', policy, {
'x-content-type': 'text/plain;swift_expirer_bytes=4',
'x-content-type-timestamp': timestamp0
}])
while given_args: while given_args:
given_args.pop() given_args.pop()
@ -6925,7 +6940,10 @@ class TestObjectController(BaseTestCase):
self.assertEqual( self.assertEqual(
given_args, [ given_args, [
'PUT', int(delete_at_timestamp2), 'a', 'c', 'o', 'PUT', int(delete_at_timestamp2), 'a', 'c', 'o',
given_args[5], 'sda1', policy, given_args[5], 'sda1', policy, {
'x-content-type': 'text/plain;swift_expirer_bytes=4',
'x-content-type-timestamp': timestamp0
},
'DELETE', int(delete_at_timestamp1), 'a', 'c', 'o', 'DELETE', int(delete_at_timestamp1), 'a', 'c', 'o',
given_args[5], 'sda1', policy]) given_args[5], 'sda1', policy])
@ -6967,7 +6985,10 @@ class TestObjectController(BaseTestCase):
self.assertEqual( self.assertEqual(
given_args, [ given_args, [
'PUT', int(delete_at_timestamp1), 'a', 'c', 'o', 'PUT', int(delete_at_timestamp1), 'a', 'c', 'o',
given_args[5], 'sda1', policy]) given_args[5], 'sda1', policy, {
'x-content-type': 'text/plain;swift_expirer_bytes=4',
'x-content-type-timestamp': timestamp1
}])
while given_args: while given_args:
given_args.pop() given_args.pop()
@ -6987,10 +7008,14 @@ class TestObjectController(BaseTestCase):
req.body = 'TEST' req.body = 'TEST'
resp = req.get_response(self.object_controller) resp = req.get_response(self.object_controller)
self.assertEqual(resp.status_int, 201) self.assertEqual(resp.status_int, 201)
self.maxDiff = None
self.assertEqual( self.assertEqual(
given_args, [ given_args, [
'PUT', int(delete_at_timestamp2), 'a', 'c', 'o', 'PUT', int(delete_at_timestamp2), 'a', 'c', 'o',
given_args[5], 'sda1', policy, given_args[5], 'sda1', policy, {
'x-content-type': 'text/plain;swift_expirer_bytes=4',
'x-content-type-timestamp': timestamp2
},
'DELETE', int(delete_at_timestamp1), 'a', 'c', 'o', 'DELETE', int(delete_at_timestamp1), 'a', 'c', 'o',
given_args[5], 'sda1', policy]) given_args[5], 'sda1', policy])
@ -7590,6 +7615,345 @@ class TestObjectController(BaseTestCase):
resp = req.get_response(self.object_controller) resp = req.get_response(self.object_controller)
self.assertEqual(resp.status_int, 400) self.assertEqual(resp.status_int, 400)
def test_extra_headers_contain_object_bytes(self):
timestamp1 = next(self.ts).normal
delete_at_timestamp1 = int(time() + 1000)
delete_at_container1 = str(
delete_at_timestamp1 /
self.object_controller.expiring_objects_container_divisor *
self.object_controller.expiring_objects_container_divisor)
req = Request.blank(
'/sda1/p/a/c/o', environ={'REQUEST_METHOD': 'PUT'},
headers={'X-Timestamp': timestamp1,
'Content-Length': '4096',
'Content-Type': 'application/octet-stream',
'X-Delete-At': str(delete_at_timestamp1),
'X-Delete-At-Container': delete_at_container1})
req.body = '\x00' * 4096
with mock.patch.object(self.object_controller, 'delete_at_update') \
as fake_delete_at_update:
resp = req.get_response(self.object_controller)
self.assertEqual(resp.status_int, 201)
self.assertEqual(fake_delete_at_update.call_args_list, [mock.call(
'PUT', int(delete_at_timestamp1), 'a', 'c', 'o',
SameReqEnv(req), 'sda1', POLICIES[0], {
'x-content-type': 'text/plain;swift_expirer_bytes=4096',
'x-content-type-timestamp': timestamp1
})])
timestamp2 = next(self.ts).normal
req = Request.blank(
'/sda1/p/a/c/o', environ={'REQUEST_METHOD': 'PUT'},
headers={'X-Timestamp': timestamp2,
'Content-Length': '5120',
'Content-Type': 'application/octet-stream',
'X-Delete-At': str(delete_at_timestamp1),
'X-Delete-At-Container': delete_at_container1})
req.body = '\x00' * 5120
with mock.patch.object(self.object_controller, 'delete_at_update') \
as fake_delete_at_update:
resp = req.get_response(self.object_controller)
self.assertEqual(resp.status_int, 201)
self.assertEqual(fake_delete_at_update.call_args_list, [mock.call(
'PUT', int(delete_at_timestamp1), 'a', 'c', 'o',
SameReqEnv(req), 'sda1', POLICIES[0], {
'x-content-type': 'text/plain;swift_expirer_bytes=5120',
'x-content-type-timestamp': timestamp2
}
)])
timestamp3 = next(self.ts).normal
delete_at_timestamp2 = str(int(next(self.ts)) + 2000)
req = Request.blank(
'/sda1/p/a/c/o', environ={'REQUEST_METHOD': 'POST'},
headers={'X-Timestamp': timestamp3,
'X-Delete-At': delete_at_timestamp2})
with mock.patch.object(self.object_controller, 'delete_at_update') \
as fake_delete_at_update:
resp = req.get_response(self.object_controller)
self.assertEqual(resp.status_int, 202)
self.assertEqual(fake_delete_at_update.call_args_list, [mock.call(
'PUT', int(delete_at_timestamp2), 'a', 'c', 'o',
SameReqEnv(req), 'sda1', POLICIES[0], {
'x-content-type': 'text/plain;swift_expirer_bytes=5120',
'x-content-type-timestamp': timestamp2
},
), mock.call(
'DELETE', int(delete_at_timestamp1), 'a', 'c', 'o',
SameReqEnv(req), 'sda1', POLICIES[0]
)])
timestamp4 = next(self.ts).normal
req = Request.blank(
'/sda1/p/a/c/o',
environ={'REQUEST_METHOD': 'DELETE'},
headers={'X-Timestamp': timestamp4,
'Content-Type': 'application/octet-stream'})
with mock.patch.object(self.object_controller, 'delete_at_update') \
as fake_delete_at_update:
resp = req.get_response(self.object_controller)
self.assertEqual(resp.status_int, 204)
self.assertEqual(fake_delete_at_update.call_args_list, [mock.call(
'DELETE', int(delete_at_timestamp2), 'a', 'c', 'o',
SameReqEnv(req), 'sda1', POLICIES[0]
)])
def test_delete_at_overwrite_same_expiration_different_bytes(self):
container_updates = []
def capture_updates(ip, port, method, path, headers, *args, **kwargs):
container_updates.append((ip, port, method, path, headers))
policy = random.choice(list(POLICIES))
delete_at = int(next(self.ts)) + 30
delete_at_container = utils.get_expirer_container(delete_at, 86400,
'a', 'c', 'o')
base_headers = {
'X-Backend-Storage-Policy-Index': int(policy),
'Content-Type': 'application/octet-stream',
# we exclude the user container listing updates for brevity
# 'X-Container-Partition': '20',
# 'X-Container-Host': '1.2.3.4:5105',
# 'X-Container-Device': 'sdb1',
'X-Delete-At': str(delete_at),
'X-Delete-At-Container': delete_at_container,
'X-Delete-At-Host': "10.1.1.1:6201",
'X-Delete-At-Partition': '6237',
'X-Delete-At-Device': 'sdp',
}
if policy.policy_type == EC_POLICY:
base_headers['X-Object-Sysmeta-Ec-Frag-Index'] = '2'
put1_ts = next(self.ts)
put1_size = 4042
req1 = Request.blank(
'/sda1/p/a/c/o', method='PUT', body='\x01' * put1_size,
headers=dict(base_headers, **{
'X-Timestamp': put1_ts.normal,
'Content-Length': str(put1_size),
'X-Trans-Id': 'txn1',
}))
put2_ts = next(self.ts)
put2_size = 2044
req2 = Request.blank(
'/sda1/p/a/c/o', method='PUT', body='\x02' * put2_size,
headers=dict(base_headers, **{
'X-Timestamp': put2_ts.normal,
'Content-Length': str(put2_size),
'X-Trans-Id': 'txn2',
}))
with fake_spawn(), mocked_http_conn(
200, 200, give_connect=capture_updates):
resp1 = req1.get_response(self.object_controller)
resp2 = req2.get_response(self.object_controller)
self.assertEqual(resp1.status_int, 201)
self.assertEqual(resp2.status_int, 201)
self.assertEqual([(
'10.1.1.1', '6201', 'PUT',
'/sdp/6237/.expiring_objects/%s/%s-a/c/o' % (
delete_at_container, delete_at
), {
'X-Backend-Storage-Policy-Index': '0',
'X-Timestamp': put1_ts.normal,
'X-Trans-Id': 'txn1',
'Referer': 'PUT http://localhost/sda1/p/a/c/o',
'X-Size': '0',
'X-Etag': 'd41d8cd98f00b204e9800998ecf8427e',
'X-Content-Type':
'text/plain;swift_expirer_bytes=%s' % put1_size,
'X-Content-Type-Timestamp': put1_ts.normal,
'User-Agent': 'object-server %s' % os.getpid(),
}
), (
'10.1.1.1', '6201', 'PUT',
'/sdp/6237/.expiring_objects/%s/%s-a/c/o' % (
delete_at_container, delete_at
), {
'X-Backend-Storage-Policy-Index': '0',
'X-Timestamp': put2_ts.normal,
'X-Trans-Id': 'txn2',
'Referer': 'PUT http://localhost/sda1/p/a/c/o',
'X-Size': '0',
'X-Etag': 'd41d8cd98f00b204e9800998ecf8427e',
'X-Content-Type':
'text/plain;swift_expirer_bytes=%s' % put2_size,
'X-Content-Type-Timestamp': put2_ts.normal,
'User-Agent': 'object-server %s' % os.getpid(),
}
)], container_updates)
async_pendings = []
async_pending_dir = os.path.join(
self.testdir, 'sda1', diskfile.get_async_dir(policy))
for dirpath, _, filenames in os.walk(async_pending_dir):
for filename in filenames:
async_pendings.append(os.path.join(dirpath, filename))
self.assertEqual(len(async_pendings), 0)
def test_delete_at_POST_update_same_expiration(self):
container_updates = []
def capture_updates(ip, port, method, path, headers, *args, **kwargs):
container_updates.append((ip, port, method, path, headers))
policy = random.choice(list(POLICIES))
put_ts = next(self.ts)
put_size = 1548
put_delete_at = int(next(self.ts)) + 30
put_delete_at_container = utils.get_expirer_container(
put_delete_at, 86400, 'a', 'c', 'o')
put_req = Request.blank(
'/sda1/p/a/c/o', method='PUT', body='\x01' * put_size,
headers={
'X-Backend-Storage-Policy-Index': int(policy),
'X-Timestamp': put_ts.normal,
'Content-Length': str(put_size),
'X-Trans-Id': 'txn1',
'Content-Type': 'application/octet-stream',
# we exclude the user container listing updates for brevity
# 'X-Container-Partition': '20',
# 'X-Container-Host': '1.2.3.4:5105',
# 'X-Container-Device': 'sdb1',
'X-Delete-At': str(put_delete_at),
'X-Delete-At-Container': put_delete_at_container,
'X-Delete-At-Host': "10.1.1.1:6201",
'X-Delete-At-Partition': '6237',
'X-Delete-At-Device': 'sdp',
})
if policy.policy_type == EC_POLICY:
put_req.headers['X-Object-Sysmeta-Ec-Frag-Index'] = '3'
with fake_spawn(), mocked_http_conn(
200, give_connect=capture_updates):
put_resp = put_req.get_response(self.object_controller)
self.assertEqual(put_resp.status_int, 201)
self.assertEqual([(
'10.1.1.1', '6201', 'PUT',
'/sdp/6237/.expiring_objects/%s/%s-a/c/o' % (
put_delete_at_container, put_delete_at
), {
'X-Backend-Storage-Policy-Index': '0',
'X-Timestamp': put_ts.normal,
'X-Trans-Id': 'txn1',
'Referer': 'PUT http://localhost/sda1/p/a/c/o',
'X-Size': '0',
'X-Etag': 'd41d8cd98f00b204e9800998ecf8427e',
'X-Content-Type':
'text/plain;swift_expirer_bytes=%s' % put_size,
'X-Content-Type-Timestamp': put_ts.normal,
'User-Agent': 'object-server %s' % os.getpid(),
}
)], container_updates)
# reset container updates
container_updates = []
delete_at = int(next(self.ts)) + 100
self.assertNotEqual(delete_at, put_delete_at) # sanity
delete_at_container = utils.get_expirer_container(
delete_at, 86400, 'a', 'c', 'o')
base_headers = {
'X-Backend-Storage-Policy-Index': int(policy),
# we exclude the user container listing updates for brevity
# 'X-Container-Partition': '20',
# 'X-Container-Host': '1.2.3.4:5105',
# 'X-Container-Device': 'sdb1',
'X-Delete-At': str(delete_at),
'X-Delete-At-Container': delete_at_container,
'X-Delete-At-Host': "10.2.2.2:6202",
'X-Delete-At-Partition': '592',
'X-Delete-At-Device': 'sdm',
}
post1_ts = next(self.ts)
req1 = Request.blank(
'/sda1/p/a/c/o', method='POST', headers=dict(base_headers, **{
'X-Timestamp': post1_ts.normal,
'X-Trans-Id': 'txn2',
}))
post2_ts = next(self.ts)
req2 = Request.blank(
'/sda1/p/a/c/o', method='POST', headers=dict(base_headers, **{
'X-Timestamp': post2_ts.normal,
'X-Trans-Id': 'txn3',
}))
with fake_spawn(), mocked_http_conn(
200, 200, give_connect=capture_updates):
resp1 = req1.get_response(self.object_controller)
resp2 = req2.get_response(self.object_controller)
self.assertEqual(resp1.status_int, 202)
self.assertEqual(resp2.status_int, 202)
self.assertEqual([(
'10.2.2.2', '6202', 'PUT',
'/sdm/592/.expiring_objects/%s/%s-a/c/o' % (
delete_at_container, delete_at
), {
'X-Backend-Storage-Policy-Index': '0',
# this the PUT from the POST-1
'X-Timestamp': post1_ts.normal,
'X-Trans-Id': 'txn2',
'Referer': 'POST http://localhost/sda1/p/a/c/o',
'X-Size': '0',
'X-Etag': 'd41d8cd98f00b204e9800998ecf8427e',
'X-Content-Type':
'text/plain;swift_expirer_bytes=%s' % put_size,
'X-Content-Type-Timestamp': put_ts.normal,
'User-Agent': 'object-server %s' % os.getpid(),
}
), (
'10.2.2.2', '6202', 'PUT',
'/sdm/592/.expiring_objects/%s/%s-a/c/o' % (
delete_at_container, delete_at
), {
'X-Backend-Storage-Policy-Index': '0',
# this the PUT from POST-2
'X-Timestamp': post2_ts.normal,
'X-Trans-Id': 'txn3',
'Referer': 'POST http://localhost/sda1/p/a/c/o',
'X-Size': '0',
'X-Etag': 'd41d8cd98f00b204e9800998ecf8427e',
'X-Content-Type':
'text/plain;swift_expirer_bytes=%s' % put_size,
'X-Content-Type-Timestamp': put_ts.normal,
'User-Agent': 'object-server %s' % os.getpid(),
}
)], container_updates)
async_pendings = []
async_pending_dir = os.path.join(
self.testdir, 'sda1', diskfile.get_async_dir(policy))
for dirpath, _, filenames in os.walk(async_pending_dir):
for filename in filenames:
async_pendings.append(os.path.join(dirpath, filename))
self.assertEqual(len(async_pendings), 1)
async_updates = []
for pending_file in async_pendings:
with open(pending_file, 'rb') as fh:
async_pending = pickle.load(fh)
async_updates.append(async_pending)
self.assertEqual([{
'op': 'DELETE',
'account': '.expiring_objects',
'container': delete_at_container,
'obj': '%s-a/c/o' % put_delete_at,
'headers': {
'X-Backend-Storage-Policy-Index': '0',
# only POST-1 has to clear the orig PUT delete-at
'X-Timestamp': post1_ts.normal,
'X-Trans-Id': 'txn2',
'Referer': 'POST http://localhost/sda1/p/a/c/o',
'User-Agent': 'object-server %s' % os.getpid(),
},
}], async_updates)
def test_DELETE_calls_delete_at(self): def test_DELETE_calls_delete_at(self):
given_args = [] given_args = []
@ -7615,7 +7979,10 @@ class TestObjectController(BaseTestCase):
self.assertEqual(resp.status_int, 201) self.assertEqual(resp.status_int, 201)
self.assertEqual(given_args, [ self.assertEqual(given_args, [
'PUT', int(delete_at_timestamp1), 'a', 'c', 'o', 'PUT', int(delete_at_timestamp1), 'a', 'c', 'o',
given_args[5], 'sda1', POLICIES[0]]) given_args[5], 'sda1', POLICIES[0], {
'x-content-type': 'text/plain;swift_expirer_bytes=4',
'x-content-type-timestamp': timestamp1
}])
while given_args: while given_args:
given_args.pop() given_args.pop()