Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

CRC64NVME checksum algo #611

Merged
merged 11 commits into from
Dec 6, 2024
Merged
Show file tree
Hide file tree
Changes from 10 commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
3 changes: 3 additions & 0 deletions awscrt/s3.py
Original file line number Diff line number Diff line change
Expand Up @@ -102,6 +102,9 @@ class S3ChecksumAlgorithm(IntEnum):
SHA256 = 4
"""SHA-256"""

CRC64NVME = 5
"""CRC64NVME"""


class S3ChecksumLocation(IntEnum):
"""Where to put the checksum."""
Expand Down
2 changes: 1 addition & 1 deletion crt/aws-lc
2 changes: 1 addition & 1 deletion crt/s2n
Submodule s2n updated from ffe0bf to 493b77
98 changes: 73 additions & 25 deletions test/test_s3.py
Original file line number Diff line number Diff line change
Expand Up @@ -253,6 +253,7 @@ def setUp(self):
self.num_threads = 0
self.special_path = "put_object_test_10MB@$%.txt"
self.non_ascii_file_name = "ÉxÅmple.txt"
self.part_size = 5 * MB

self.response_headers = None
self.response_status_code = None
Expand Down Expand Up @@ -363,13 +364,12 @@ def _test_s3_put_get_object(
request_type,
exception_name=None,
enable_s3express=False,
region="us-west-2",
mem_limit=None,
**kwargs):
s3_client = s3_client_new(
False,
region,
5 * MB,
self.region,
self.part_size,
enable_s3express=enable_s3express,
mem_limit=mem_limit)
signing_config = None
Expand All @@ -392,8 +392,14 @@ def _test_s3_put_get_object(
self.assertTrue(shutdown_event.wait(self.timeout))

if exception_name is None:
finished_future.result()
self._validate_successful_response(request_type is S3RequestType.PUT_OBJECT)
try:
finished_future.result()
self._validate_successful_response(request_type is S3RequestType.PUT_OBJECT)
except S3ResponseError as e:
print(e.status_code)
print(e.headers)
print(e.body)
raise e
else:
e = finished_future.exception()
self.assertEqual(e.name, exception_name)
Expand Down Expand Up @@ -436,14 +442,16 @@ def test_put_object_unknown_content_length_single_part(self):
put_body_stream.close()

def test_get_object_s3express(self):
self.region = "us-east-1"
request = self._get_object_request("/crt-download-10MB", enable_s3express=True)
self._test_s3_put_get_object(request, S3RequestType.GET_OBJECT, enable_s3express=True, region="us-east-1")
self._test_s3_put_get_object(request, S3RequestType.GET_OBJECT, enable_s3express=True)

def test_put_object_s3express(self):
self.region = "us-east-1"
put_body_stream = open(self.temp_put_obj_file_path, "rb")
content_length = os.stat(self.temp_put_obj_file_path).st_size
request = self._put_object_request(put_body_stream, content_length, enable_s3express=True)
self._test_s3_put_get_object(request, S3RequestType.PUT_OBJECT, enable_s3express=True, region="us-east-1")
self._test_s3_put_get_object(request, S3RequestType.PUT_OBJECT, enable_s3express=True)
put_body_stream.close()

def test_put_object_multiple_times(self):
Expand Down Expand Up @@ -586,38 +594,78 @@ def on_done_remove_file(**kwargs):
"the transferred length reported does not match body we sent")
self._validate_successful_response(request_type is S3RequestType.PUT_OBJECT)

def test_put_get_with_checksum(self):
put_body = b'hello world'
put_body_stream = BytesIO(put_body)
content_length = len(put_body)
path = '/hello-world.txt'

# calculate expected CRC32 header value:
# a string containing the url-safe-base64-encoding of a big-endian-32-bit-CRC
crc32_int = zlib.crc32(put_body)
crc32_big_endian = crc32_int.to_bytes(4, 'big')
crc32_base64_bytes = base64.urlsafe_b64encode(crc32_big_endian)
crc32_base64_str = crc32_base64_bytes.decode()
def _round_trip_with_checksums_helper(
self,
algo=S3ChecksumAlgorithm.CRC32,
mpu=True,
provide_full_object_checksum=False):
if not mpu:
# increase the part size for the client to use single part upload
self.part_size = 20 * MB

# awscrt.io.init_logging(awscrt.io.LogLevel.Trace, "trace.log")
put_body_stream = open(self.temp_put_obj_file_path, "rb")
content_length = os.stat(self.temp_put_obj_file_path).st_size
# construct different path to prevent race condition between tests
path = '/hello-world-' + algo.name
if mpu:
path += "-mpu"
if provide_full_object_checksum:
path += "-full-object"

if algo == S3ChecksumAlgorithm.CRC32:
checksum_header_name = 'x-amz-checksum-crc32'
checksum_str = 'a9ccsg=='
elif algo == S3ChecksumAlgorithm.CRC64NVME:
checksum_header_name = 'x-amz-checksum-crc64nvme'
checksum_str = 'tPMvgM0jSDQ='
else:
raise Exception("Checksum algo not supported by test helper")

# upload, with client adding checksum
upload_request = self._put_object_request(put_body_stream, content_length, path=path)
upload_checksum_config = S3ChecksumConfig(
algorithm=S3ChecksumAlgorithm.CRC32,
algorithm=algo,
location=S3ChecksumLocation.TRAILER)
if provide_full_object_checksum:
upload_request.headers.add(checksum_header_name, checksum_str)
# checksum will be provided from the header, don't set the checksum configs
upload_checksum_config = None

self._test_s3_put_get_object(upload_request, S3RequestType.PUT_OBJECT,
checksum_config=upload_checksum_config)
self.assertEqual(HttpHeaders(self.response_headers).get('x-amz-checksum-crc32'),
crc32_base64_str)

# download, with client validating checksum
download_request = self._get_object_request(path)
download_checksum_config = S3ChecksumConfig(validate_response=True)
self._test_s3_put_get_object(download_request, S3RequestType.GET_OBJECT,
checksum_config=download_checksum_config)
self.assertTrue(self.done_did_validate_checksum)
self.assertEqual(self.done_checksum_validation_algorithm, S3ChecksumAlgorithm.CRC32)
self.assertEqual(HttpHeaders(self.response_headers).get('x-amz-checksum-crc32'),
crc32_base64_str)
self.assertEqual(self.done_checksum_validation_algorithm, algo)
self.assertEqual(HttpHeaders(self.response_headers).get(checksum_header_name),
checksum_str)
put_body_stream.close()

def test_round_trip_with_trailing_checksum(self):
self._round_trip_with_checksums_helper(S3ChecksumAlgorithm.CRC32, mpu=False)

def test_round_trip_with_full_object_checksum_mpu(self):
self._round_trip_with_checksums_helper(
S3ChecksumAlgorithm.CRC64NVME,
mpu=True,
provide_full_object_checksum=True)

def test_round_trip_with_full_object_checksum_single_part(self):
self._round_trip_with_checksums_helper(
S3ChecksumAlgorithm.CRC64NVME,
mpu=False,
provide_full_object_checksum=True)

def test_round_trip_with_full_object_checksum_mpu_crc32(self):
self._round_trip_with_checksums_helper(S3ChecksumAlgorithm.CRC32, mpu=True, provide_full_object_checksum=True)

def test_round_trip_with_full_object_checksum_single_part_crc32(self):
self._round_trip_with_checksums_helper(S3ChecksumAlgorithm.CRC32, mpu=False, provide_full_object_checksum=True)

def _on_progress_cancel_after_first_chunk(self, progress):
self.transferred_len += progress
Expand Down
Loading