From 5558b92938aff30ffe3ee6f63b2a05fc929849a2 Mon Sep 17 00:00:00 2001 From: Darryl Tam Date: Fri, 15 Jun 2018 12:15:01 -0700 Subject: [PATCH] Properly handle custom metadata upon an object COPY operation Previously, the 'x-amz-metadata-directive' header was ignored except to ensure that it had a valid value if it existed. In all cases any metadata specified was applied to the copied object, while non-conflicting metadata remained. This patch fixes this behaviour. Now, if the 'x-amz-metadata-directive' header is set to 'REPLACE' during a copy operation, the s3api middleware sets the 'x-fresh-metadata' header to 'True' to replace valid metadata values. If the 'x-amz-metadata-directive' header is set to 'COPY' or if it is omited during a copy operation, then the s3api middleware removes all metadata (custom or not) from the request to prevent it from being changed. Content-Type can never be set on an S3 copy operation, even if the metadata directive is set to 'REPLACE', so it is specifically filtered out on copy. Change-Id: I333e46758bd2b7a29f672c098af267849232c911 Closes-Bug: #1433875 --- swift/common/middleware/s3api/s3request.py | 16 +++ test/functional/s3api/test_object.py | 29 +++++ test/unit/common/middleware/s3api/test_obj.py | 112 ++++++++++++++++-- 3 files changed, 150 insertions(+), 7 deletions(-) diff --git a/swift/common/middleware/s3api/s3request.py b/swift/common/middleware/s3api/s3request.py index 5833921f89..b6d8632b7c 100644 --- a/swift/common/middleware/s3api/s3request.py +++ b/swift/common/middleware/s3api/s3request.py @@ -982,6 +982,22 @@ class S3Request(swob.Request): env['HTTP_X_COPY_FROM'] = env['HTTP_X_AMZ_COPY_SOURCE'] del env['HTTP_X_AMZ_COPY_SOURCE'] env['CONTENT_LENGTH'] = '0' + # Content type cannot be modified on COPY + env.pop('CONTENT_TYPE', None) + if env.pop('HTTP_X_AMZ_METADATA_DIRECTIVE', None) == 'REPLACE': + env['HTTP_X_FRESH_METADATA'] = 'True' + else: + copy_exclude_headers = ('HTTP_CONTENT_DISPOSITION', + 'HTTP_CONTENT_ENCODING', + 'HTTP_CONTENT_LANGUAGE', + 'HTTP_EXPIRES', + 'HTTP_CACHE_CONTROL', + 'HTTP_X_ROBOTS_TAG') + for key in copy_exclude_headers: + env.pop(key, None) + for key in list(env.keys()): + if key.startswith('HTTP_X_OBJECT_META_'): + del env[key] if self.force_request_log: env['swift.proxy_access_log_made'] = False diff --git a/test/functional/s3api/test_object.py b/test/functional/s3api/test_object.py index 783f48ae9a..a3f93188ab 100644 --- a/test/functional/s3api/test_object.py +++ b/test/functional/s3api/test_object.py @@ -486,6 +486,35 @@ class TestS3ApiObject(S3ApiBase): self.conn.make_request('HEAD', dst_bucket, dst_obj) self.assertEqual(headers['x-amz-meta-test'], 'dst') + headers = {'X-Amz-Copy-Source': '/%s/%s' % (self.bucket, obj), + 'X-Amz-Metadata-Directive': 'COPY', + 'X-Amz-Meta-Test': 'dst'} + status, headers, body = \ + self.conn.make_request('PUT', dst_bucket, dst_obj, headers) + self.assertEqual(status, 200) + self.assertCommonResponseHeaders(headers) + status, headers, body = \ + self.conn.make_request('HEAD', dst_bucket, dst_obj) + self.assertEqual(headers['x-amz-meta-test'], 'src') + + headers = {'X-Amz-Copy-Source': '/%s/%s' % (self.bucket, obj), + 'X-Amz-Meta-Test2': 'dst', + 'X-Amz-Metadata-Directive': 'REPLACE'} + status, headers, body = \ + self.conn.make_request('PUT', dst_bucket, dst_obj, headers) + self.assertEqual(status, 200) + self.assertCommonResponseHeaders(headers) + status, headers, body = \ + self.conn.make_request('HEAD', dst_bucket, dst_obj) + self.assertNotIn('x-amz-meta-test', headers) + self.assertEqual(headers['x-amz-meta-test2'], 'dst') + + headers = {'X-Amz-Copy-Source': '/%s/%s' % (self.bucket, obj), + 'X-Amz-Metadata-Directive': 'BAD'} + status, headers, body = \ + self.conn.make_request('PUT', dst_bucket, dst_obj, headers) + self.assertEqual(status, 400) + def test_put_object_copy_source_if_modified_since(self): obj = 'object' dst_bucket = 'dst-bucket' diff --git a/test/unit/common/middleware/s3api/test_obj.py b/test/unit/common/middleware/s3api/test_obj.py index 601cd7cd07..3abd8d6c13 100644 --- a/test/unit/common/middleware/s3api/test_obj.py +++ b/test/unit/common/middleware/s3api/test_obj.py @@ -504,13 +504,12 @@ class TestS3ApiObj(S3ApiTestCase): _, _, headers = self.swift.calls_with_headers[-1] # Check that s3api converts a Content-MD5 header into an etag. self.assertEqual(headers['ETag'], self.etag) - self.assertEqual(headers['X-Object-Meta-Something'], 'oh hai') - self.assertEqual(headers['X-Object-Meta-Unreadable-Prefix'], - '=?UTF-8?Q?=04w?=') - self.assertEqual(headers['X-Object-Meta-Unreadable-Suffix'], - '=?UTF-8?Q?h=04?=') - self.assertEqual(headers['X-Object-Meta-Lots-Of-Unprintable'], - '=?UTF-8?B?BAQEBAQ=?=') + # Check that metadata is omited if no directive is specified + self.assertIsNone(headers.get('X-Object-Meta-Something')) + self.assertIsNone(headers.get('X-Object-Meta-Unreadable-Prefix')) + self.assertIsNone(headers.get('X-Object-Meta-Unreadable-Suffix')) + self.assertIsNone(headers.get('X-Object-Meta-Lots-Of-Unprintable')) + self.assertEqual(headers['X-Copy-From'], '/some/source') self.assertEqual(headers['Content-Length'], '0') @@ -577,6 +576,7 @@ class TestS3ApiObj(S3ApiTestCase): _, _, headers = self.swift.calls_with_headers[-1] self.assertEqual(headers['X-Copy-From'], '/some/source') + self.assertTrue(headers.get('X-Fresh-Metadata') is None) self.assertEqual(headers['Content-Length'], '0') do_test('/some/source') @@ -586,6 +586,104 @@ class TestS3ApiObj(S3ApiTestCase): # AWS seems to tolerate this so we should, too do_test('some/source') + @s3acl + def test_object_PUT_copy_metadata_replace(self): + date_header = self.get_date_header() + timestamp = mktime(date_header) + last_modified = S3Timestamp(timestamp).s3xmlformat + status, headers, body = \ + self._test_object_PUT_copy( + swob.HTTPOk, + {'X-Amz-Metadata-Directive': 'REPLACE', + 'X-Amz-Meta-Something': 'oh hai', + 'X-Amz-Meta-Unreadable-Prefix': '\x04w', + 'X-Amz-Meta-Unreadable-Suffix': 'h\x04', + 'X-Amz-Meta-Lots-Of-Unprintable': 5 * '\x04', + 'Cache-Control': 'hello', + 'content-disposition': 'how are you', + 'content-encoding': 'good and you', + 'content-language': 'great', + 'content-type': 'so', + 'expires': 'yeah', + 'x-robots-tag': 'bye'}) + + self.assertEqual(status.split()[0], '200') + self.assertEqual(headers['Content-Type'], 'application/xml') + self.assertIsNone(headers.get('etag')) + elem = fromstring(body, 'CopyObjectResult') + self.assertEqual(elem.find('LastModified').text, last_modified) + self.assertEqual(elem.find('ETag').text, '"%s"' % self.etag) + + _, _, headers = self.swift.calls_with_headers[-1] + self.assertEqual(headers['X-Copy-From'], '/some/source') + # Check that metadata is included if replace directive is specified + # and that Fresh Metadata is set + self.assertTrue(headers.get('X-Fresh-Metadata') == 'True') + self.assertEqual(headers['X-Object-Meta-Something'], 'oh hai') + self.assertEqual(headers['X-Object-Meta-Unreadable-Prefix'], + '=?UTF-8?Q?=04w?=') + self.assertEqual(headers['X-Object-Meta-Unreadable-Suffix'], + '=?UTF-8?Q?h=04?=') + self.assertEqual(headers['X-Object-Meta-Lots-Of-Unprintable'], + '=?UTF-8?B?BAQEBAQ=?=') + # Check other metadata is set + self.assertEqual(headers['Cache-Control'], 'hello') + self.assertEqual(headers['Content-Disposition'], 'how are you') + self.assertEqual(headers['Content-Encoding'], 'good and you') + self.assertEqual(headers['Content-Language'], 'great') + # Content-Type can't be set during an S3 copy operation + self.assertIsNone(headers.get('Content-Type')) + self.assertEqual(headers['Expires'], 'yeah') + self.assertEqual(headers['X-Robots-Tag'], 'bye') + + self.assertEqual(headers['Content-Length'], '0') + + @s3acl + def test_object_PUT_copy_metadata_copy(self): + date_header = self.get_date_header() + timestamp = mktime(date_header) + last_modified = S3Timestamp(timestamp).s3xmlformat + status, headers, body = \ + self._test_object_PUT_copy( + swob.HTTPOk, + {'X-Amz-Metadata-Directive': 'COPY', + 'X-Amz-Meta-Something': 'oh hai', + 'X-Amz-Meta-Unreadable-Prefix': '\x04w', + 'X-Amz-Meta-Unreadable-Suffix': 'h\x04', + 'X-Amz-Meta-Lots-Of-Unprintable': 5 * '\x04', + 'Cache-Control': 'hello', + 'content-disposition': 'how are you', + 'content-encoding': 'good and you', + 'content-language': 'great', + 'content-type': 'so', + 'expires': 'yeah', + 'x-robots-tag': 'bye'}) + self.assertEqual(status.split()[0], '200') + self.assertEqual(headers['Content-Type'], 'application/xml') + self.assertIsNone(headers.get('etag')) + + elem = fromstring(body, 'CopyObjectResult') + self.assertEqual(elem.find('LastModified').text, last_modified) + self.assertEqual(elem.find('ETag').text, '"%s"' % self.etag) + + _, _, headers = self.swift.calls_with_headers[-1] + self.assertEqual(headers['X-Copy-From'], '/some/source') + # Check that metadata is omited if COPY directive is specified + self.assertIsNone(headers.get('X-Fresh-Metadata')) + self.assertIsNone(headers.get('X-Object-Meta-Something')) + self.assertIsNone(headers.get('X-Object-Meta-Unreadable-Prefix')) + self.assertIsNone(headers.get('X-Object-Meta-Unreadable-Suffix')) + self.assertIsNone(headers.get('X-Object-Meta-Lots-Of-Unprintable')) + self.assertIsNone(headers.get('Cache-Control')) + self.assertIsNone(headers.get('Content-Disposition')) + self.assertIsNone(headers.get('Content-Encoding')) + self.assertIsNone(headers.get('Content-Language')) + self.assertIsNone(headers.get('Content-Type')) + self.assertIsNone(headers.get('Expires')) + self.assertIsNone(headers.get('X-Robots-Tag')) + + self.assertEqual(headers['Content-Length'], '0') + @s3acl def test_object_PUT_copy_self(self): status, headers, body = \