From af8c3ea44dda3f75fb6605c6fd9df40985f0025f Mon Sep 17 00:00:00 2001 From: Nate Prewitt Date: Fri, 24 Nov 2023 13:32:52 -0700 Subject: [PATCH] Add error translation from S3ResponseError to Botocore errors Co-authored-by: Michael Graeb --- s3transfer/crt.py | 75 ++++++++++++++++++++++++++++++++--- tests/integration/test_crt.py | 17 ++++++++ tests/unit/test_crt.py | 55 +++++++++++++++++++++++++ 3 files changed, 142 insertions(+), 5 deletions(-) diff --git a/s3transfer/crt.py b/s3transfer/crt.py index eda2985f..08105314 100644 --- a/s3transfer/crt.py +++ b/s3transfer/crt.py @@ -25,7 +25,12 @@ EventLoopGroup, TlsContextOptions, ) -from awscrt.s3 import S3Client, S3RequestTlsMode, S3RequestType +from awscrt.s3 import ( + S3Client, + S3RequestTlsMode, + S3RequestType, + S3ResponseError, +) from botocore import UNSIGNED from botocore.compat import urlsplit from botocore.config import Config @@ -171,6 +176,9 @@ def __init__(self, crt_s3_client, crt_request_serializer, osutil=None): self._s3_args_creator = S3ClientArgsCreator( crt_request_serializer, self._osutil ) + self._crt_exception_translator = ( + crt_request_serializer.translate_crt_exception + ) self._future_coordinators = [] self._semaphore = threading.Semaphore(128) # not configurable # A counter to create unique id's for each transfer submitted. @@ -262,7 +270,10 @@ def _release_semaphore(self, **kwargs): def _submit_transfer(self, request_type, call_args): on_done_after_calls = [self._release_semaphore] - coordinator = CRTTransferCoordinator(transfer_id=self._id_counter) + coordinator = CRTTransferCoordinator( + transfer_id=self._id_counter, + exception_translator=self._crt_exception_translator, + ) components = { 'meta': CRTTransferMeta(self._id_counter, call_args), 'coordinator': coordinator, @@ -373,6 +384,9 @@ def serialize_http_request(self, transfer_type, future): """ raise NotImplementedError('serialize_http_request()') + def translate_crt_exception(self, exception): + raise NotImplementedError('translate_crt_exception()') + class BotocoreCRTRequestSerializer(BaseCRTRequestSerializer): def __init__(self, session, client_kwargs=None): @@ -496,6 +510,40 @@ def serialize_http_request(self, transfer_type, future): crt_request = self._convert_to_crt_http_request(botocore_http_request) return crt_request + def translate_crt_exception(self, exception): + if isinstance(exception, S3ResponseError): + return self._translate_crt_s3_response_error(exception) + else: + return None + + def _translate_crt_s3_response_error(self, s3_response_error): + status_code = s3_response_error.status_code + if status_code < 301: + # Botocore's exception parsing only + # runs on status codes >= 301 + return None + + headers = {k: v for k, v in s3_response_error.headers} + operation_name = s3_response_error.operation_name + if operation_name is not None: + service_model = self._client.meta.service_model + shape = service_model.operation_model(operation_name).output_shape + else: + shape = None + + response_dict = { + 'headers': botocore.awsrequest.HeadersDict(headers), + 'status_code': status_code, + 'body': s3_response_error.body, + } + parsed_response = self._client._response_parser.parse( + response_dict, shape=shape + ) + + error_code = parsed_response.get("Error", {}).get("Code") + error_class = self._client.exceptions.from_code(error_code) + return error_class(parsed_response, operation_name=operation_name) + class FakeRawResponse(BytesIO): def stream(self, amt=1024, decode_content=None): @@ -509,9 +557,10 @@ def stream(self, amt=1024, decode_content=None): class CRTTransferCoordinator: """A helper class for managing CRTTransferFuture""" - def __init__(self, transfer_id=None, s3_request=None): + def __init__(self, transfer_id=None, exception_translator=None): self.transfer_id = transfer_id - self._s3_request = s3_request + self._exception_translator = exception_translator + self._s3_request = None self._lock = threading.Lock() self._exception = None self._crt_future = None @@ -543,11 +592,27 @@ def result(self, timeout=None): self._crt_future.result(timeout) except KeyboardInterrupt: self.cancel() + self._crt_future.result(timeout) raise + except Exception as e: + self.handle_exception(e) finally: if self._s3_request: self._s3_request = None - self._crt_future.result(timeout) + + def handle_exception(self, exc): + translated_exc = None + if self._exception_translator: + try: + translated_exc = self._exception_translator(exc) + except Exception: + # Bail out if we hit an issue translating + # and raise the original error. + pass + if translated_exc is not None: + raise translated_exc from exc + else: + raise exc def done(self): if self._crt_future is None: diff --git a/tests/integration/test_crt.py b/tests/integration/test_crt.py index 7881fa63..f7c4988b 100644 --- a/tests/integration/test_crt.py +++ b/tests/integration/test_crt.py @@ -505,3 +505,20 @@ def test_download_cancel(self): possible_matches = glob.glob('%s*' % download_path) self.assertEqual(possible_matches, []) self._assert_subscribers_called() + + def test_exception_translation(self): + # Test that CRT's S3ResponseError translates to botocore error + transfer = self._create_s3_transfer() + download_path = os.path.join( + self.files.rootdir, 'obviously-no-such-key.txt' + ) + with self.assertRaises(self.client.exceptions.NoSuchKey) as cm: + future = transfer.download( + self.bucket_name, + 'obviously-no-such-key.txt', + download_path, + subscribers=[self.record_subscriber], + ) + future.result() + + self.assertEqual(cm.exception.response['Error']['Code'], 'NoSuchKey') diff --git a/tests/unit/test_crt.py b/tests/unit/test_crt.py index aadd3827..1c141d26 100644 --- a/tests/unit/test_crt.py +++ b/tests/unit/test_crt.py @@ -13,6 +13,7 @@ import io from botocore.credentials import CredentialResolver, ReadOnlyCredentials +from botocore.exceptions import ClientError from botocore.session import Session from s3transfer.exceptions import TransferNotDoneError @@ -104,6 +105,60 @@ def test_delete_request(self): self.assertEqual(self.expected_host, crt_request.headers.get("host")) self.assertIsNone(crt_request.headers.get("Authorization")) + def _create_crt_response_error( + self, status_code, body, operation_name=None + ): + return awscrt.s3.S3ResponseError( + code=14343, + name='AWS_ERROR_S3_INVALID_RESPONSE_STATUS', + message='Invalid response status from request', + status_code=status_code, + headers=[ + ('x-amz-request-id', 'QSJHJJZR2EDYD4GQ'), + ( + 'x-amz-id-2', + 'xDbgdKdvYZTjgpOTzm7yNP2JPrOQl+eaQvUkFdOjdJoWkIC643fgHxdsHpUKvVAfjKf5F6otEYA=', + ), + ('Content-Type', 'application/xml'), + ('Transfer-Encoding', 'chunked'), + ('Date', 'Fri, 10 Nov 2023 23:22:47 GMT'), + ('Server', 'AmazonS3'), + ], + body=body, + operation_name=operation_name, + ) + + def test_translate_get_object_404(self): + body = ( + b'\n' + b'NoSuchKey' + b'The specified key does not exist.' + b'obviously-no-such-key.txt' + b'SBJ7ZQY03N1WDW9T' + b'SomeHostId' + ) + crt_exc = self._create_crt_response_error(404, body, 'GetObject') + boto_err = self.request_serializer.translate_crt_exception(crt_exc) + self.assertIsInstance( + boto_err, self.session.create_client('s3').exceptions.NoSuchKey + ) + + def test_translate_head_object_404(self): + # There's no body in a HEAD response, so we can't map it to a modeled S3 exception. + # But it should still map to a botocore ClientError + body = None + crt_exc = self._create_crt_response_error( + 404, body, operation_name='HeadObject' + ) + boto_err = self.request_serializer.translate_crt_exception(crt_exc) + self.assertIsInstance(boto_err, ClientError) + + def test_translate_unknown_operation_404(self): + body = None + crt_exc = self._create_crt_response_error(404, body) + boto_err = self.request_serializer.translate_crt_exception(crt_exc) + self.assertIsInstance(boto_err, ClientError) + @requires_crt class TestCRTCredentialProviderAdapter(unittest.TestCase):