Skip to content

Commit 33b8cd0

Browse files
authored
Respect checksum header over settings from options (#474)
1 parent 1e8a980 commit 33b8cd0

8 files changed

+143
-114
lines changed

include/aws/s3/private/s3_checksums.h

+4-2
Original file line numberDiff line numberDiff line change
@@ -166,10 +166,12 @@ AWS_S3_API
166166
int aws_checksum_finalize(struct aws_s3_checksum *checksum, struct aws_byte_buf *output);
167167

168168
AWS_S3_API
169-
void aws_checksum_config_storage_init(
169+
int aws_checksum_config_storage_init(
170170
struct aws_allocator *allocator,
171171
struct checksum_config_storage *internal_config,
172-
const struct aws_s3_checksum_config *config);
172+
const struct aws_s3_checksum_config *config,
173+
const struct aws_http_message *message,
174+
const void *log_id);
173175

174176
AWS_S3_API
175177
void aws_checksum_config_storage_cleanup(struct checksum_config_storage *internal_config);

include/aws/s3/s3_client.h

+3
Original file line numberDiff line numberDiff line change
@@ -756,6 +756,9 @@ struct aws_s3_meta_request_options {
756756
/**
757757
* Optional.
758758
* if set, the flexible checksum will be performed by client based on the config.
759+
*
760+
* Notes: checksum can also be added through the http message provided.
761+
* The checksum in http header will override corresponding the checksum config.
759762
*/
760763
const struct aws_s3_checksum_config *checksum_config;
761764

source/s3_auto_ranged_put.c

+4-75
Original file line numberDiff line numberDiff line change
@@ -313,78 +313,6 @@ static struct aws_s3_meta_request_vtable s_s3_auto_ranged_put_vtable = {
313313
.pause = s_s3_auto_ranged_put_pause,
314314
};
315315

316-
static int s_init_and_verify_checksum_config_from_headers(
317-
struct checksum_config_storage *checksum_config,
318-
const struct aws_http_message *message,
319-
const void *log_id) {
320-
/* Check if the checksum header was set from the message */
321-
struct aws_http_headers *headers = aws_http_message_get_headers(message);
322-
enum aws_s3_checksum_algorithm header_algo = AWS_SCA_NONE;
323-
struct aws_byte_cursor header_value;
324-
AWS_ZERO_STRUCT(header_value);
325-
326-
for (size_t i = 0; i < AWS_ARRAY_SIZE(s_checksum_algo_priority_list); i++) {
327-
enum aws_s3_checksum_algorithm algorithm = s_checksum_algo_priority_list[i];
328-
const struct aws_byte_cursor algorithm_header_name =
329-
aws_get_http_header_name_from_checksum_algorithm(algorithm);
330-
if (aws_http_headers_get(headers, algorithm_header_name, &header_value) == AWS_OP_SUCCESS) {
331-
if (header_algo == AWS_SCA_NONE) {
332-
header_algo = algorithm;
333-
} else {
334-
/* If there are multiple checksum headers set, it's malformed request */
335-
AWS_LOGF_ERROR(
336-
AWS_LS_S3_META_REQUEST,
337-
"id=%p Could not create auto-ranged-put meta request; multiple checksum headers has been set",
338-
log_id);
339-
return aws_raise_error(AWS_ERROR_INVALID_ARGUMENT);
340-
}
341-
}
342-
}
343-
if (header_algo == AWS_SCA_NONE) {
344-
/* No checksum header found, done */
345-
return AWS_OP_SUCCESS;
346-
}
347-
348-
/* Found the full object checksum from the header, check if it matches the explicit setting from config */
349-
if (checksum_config->checksum_algorithm != AWS_SCA_NONE && checksum_config->checksum_algorithm != header_algo) {
350-
AWS_LOGF_ERROR(
351-
AWS_LS_S3_META_REQUEST,
352-
"id=%p: Could not create auto-ranged-put meta request; checksum config mismatch the checksum from header.",
353-
log_id);
354-
return aws_raise_error(AWS_ERROR_INVALID_ARGUMENT);
355-
}
356-
if (checksum_config->has_full_object_checksum) {
357-
/* If the full object checksum has been set, it's malformed request */
358-
AWS_LOGF_ERROR(
359-
AWS_LS_S3_META_REQUEST,
360-
"id=%p: Could not create auto-ranged-put meta request; full object checksum is set from multiple ways.",
361-
log_id);
362-
return aws_raise_error(AWS_ERROR_INVALID_ARGUMENT);
363-
}
364-
365-
AWS_LOGF_DEBUG(
366-
AWS_LS_S3_META_REQUEST,
367-
"id=%p: Setting the full-object checksum from header; algorithm: " PRInSTR ", value: " PRInSTR ".",
368-
log_id,
369-
AWS_BYTE_CURSOR_PRI(aws_get_checksum_algorithm_name(header_algo)),
370-
AWS_BYTE_CURSOR_PRI(header_value));
371-
/* Set algo */
372-
checksum_config->checksum_algorithm = header_algo;
373-
if (checksum_config->location == AWS_SCL_NONE) {
374-
/* Set the checksum location to trailer for the parts, complete MPU will still have the checksum in the header.
375-
* But to keep the data integrity for the parts, we need to set the checksum location to trailer to send the
376-
* parts level checksums.
377-
*/
378-
checksum_config->location = AWS_SCL_TRAILER;
379-
}
380-
381-
/* Set full object checksum from the header value. */
382-
aws_byte_buf_init_copy_from_cursor(
383-
&checksum_config->full_object_checksum, checksum_config->allocator, header_value);
384-
checksum_config->has_full_object_checksum = true;
385-
return AWS_OP_SUCCESS;
386-
}
387-
388316
/* Allocate a new auto-ranged put meta request */
389317
struct aws_s3_meta_request *aws_s3_meta_request_auto_ranged_put_new(
390318
struct aws_allocator *allocator,
@@ -442,9 +370,10 @@ struct aws_s3_meta_request *aws_s3_meta_request_auto_ranged_put_new(
442370
goto error_clean_up;
443371
}
444372

445-
if (s_init_and_verify_checksum_config_from_headers(
446-
&auto_ranged_put->base.checksum_config, options->message, (void *)&auto_ranged_put->base)) {
447-
goto error_clean_up;
373+
if (auto_ranged_put->base.checksum_config.full_object_checksum.len > 0) {
374+
/* The full object checksum was set, make sure the parts level checksum will be calculated and sent via client.
375+
*/
376+
auto_ranged_put->base.checksum_config.location = AWS_SCL_TRAILER;
448377
}
449378

450379
AWS_LOGF_DEBUG(

source/s3_checksums.c

+104-3
Original file line numberDiff line numberDiff line change
@@ -2,6 +2,7 @@
22
#include "aws/s3/private/s3_util.h"
33
#include <aws/cal/hash.h>
44
#include <aws/checksums/crc.h>
5+
#include <aws/http/request_response.h>
56

67
#define AWS_CRC32_LEN sizeof(uint32_t)
78
#define AWS_CRC32C_LEN sizeof(uint32_t)
@@ -330,17 +331,109 @@ int aws_checksum_compute(
330331
}
331332
}
332333

333-
void aws_checksum_config_storage_init(
334+
static int s_init_and_verify_checksum_config_from_headers(
335+
struct checksum_config_storage *checksum_config,
336+
const struct aws_http_message *message,
337+
const void *log_id) {
338+
/* Check if the checksum header was set from the message */
339+
struct aws_http_headers *headers = aws_http_message_get_headers(message);
340+
enum aws_s3_checksum_algorithm header_algo = AWS_SCA_NONE;
341+
struct aws_byte_cursor header_value;
342+
AWS_ZERO_STRUCT(header_value);
343+
344+
for (size_t i = 0; i < AWS_ARRAY_SIZE(s_checksum_algo_priority_list); i++) {
345+
enum aws_s3_checksum_algorithm algorithm = s_checksum_algo_priority_list[i];
346+
const struct aws_byte_cursor algorithm_header_name =
347+
aws_get_http_header_name_from_checksum_algorithm(algorithm);
348+
if (aws_http_headers_get(headers, algorithm_header_name, &header_value) == AWS_OP_SUCCESS) {
349+
if (header_algo == AWS_SCA_NONE) {
350+
header_algo = algorithm;
351+
} else {
352+
/* If there are multiple checksum headers set, it's malformed request */
353+
AWS_LOGF_ERROR(
354+
AWS_LS_S3_META_REQUEST,
355+
"id=%p Could not create auto-ranged-put meta request; multiple checksum headers has been set",
356+
log_id);
357+
return aws_raise_error(AWS_ERROR_INVALID_ARGUMENT);
358+
}
359+
}
360+
}
361+
if (header_algo == AWS_SCA_NONE) {
362+
/* No checksum header found, done */
363+
return AWS_OP_SUCCESS;
364+
}
365+
366+
if (checksum_config->has_full_object_checksum) {
367+
/* If the full object checksum has been set, it's malformed request */
368+
AWS_LOGF_ERROR(
369+
AWS_LS_S3_META_REQUEST,
370+
"id=%p: Could not create auto-ranged-put meta request; full object checksum is set from multiple ways.",
371+
log_id);
372+
return aws_raise_error(AWS_ERROR_INVALID_ARGUMENT);
373+
}
374+
375+
AWS_LOGF_DEBUG(
376+
AWS_LS_S3_META_REQUEST,
377+
"id=%p Setting the full-object checksum from header; algorithm: " PRInSTR ", value: " PRInSTR ".",
378+
log_id,
379+
AWS_BYTE_CURSOR_PRI(aws_get_checksum_algorithm_name(header_algo)),
380+
AWS_BYTE_CURSOR_PRI(header_value));
381+
/* Set algo */
382+
checksum_config->checksum_algorithm = header_algo;
383+
/**
384+
* Set the location to NONE to avoid adding extra checksums from client.
385+
*
386+
* Notes: The multipart upload will set the location to trailer to add parts level checksums.
387+
**/
388+
checksum_config->location = AWS_SCL_NONE;
389+
390+
/* Set full object checksum from the header value. */
391+
aws_byte_buf_init_copy_from_cursor(
392+
&checksum_config->full_object_checksum, checksum_config->allocator, header_value);
393+
checksum_config->has_full_object_checksum = true;
394+
return AWS_OP_SUCCESS;
395+
}
396+
397+
int aws_checksum_config_storage_init(
334398
struct aws_allocator *allocator,
335399
struct checksum_config_storage *internal_config,
336-
const struct aws_s3_checksum_config *config) {
400+
const struct aws_s3_checksum_config *config,
401+
const struct aws_http_message *message,
402+
const void *log_id) {
337403
AWS_ZERO_STRUCT(*internal_config);
338404
/* Zero out the struct and set the allocator regardless. */
339405
internal_config->allocator = allocator;
340406

341407
if (!config) {
342-
return;
408+
return AWS_OP_SUCCESS;
409+
}
410+
411+
struct aws_http_headers *headers = aws_http_message_get_headers(message);
412+
if (config->location == AWS_SCL_TRAILER) {
413+
struct aws_byte_cursor existing_encoding;
414+
AWS_ZERO_STRUCT(existing_encoding);
415+
if (aws_http_headers_get(headers, g_content_encoding_header_name, &existing_encoding) == AWS_OP_SUCCESS) {
416+
if (aws_byte_cursor_find_exact(&existing_encoding, &g_content_encoding_header_aws_chunked, NULL) ==
417+
AWS_OP_SUCCESS) {
418+
AWS_LOGF_ERROR(
419+
AWS_LS_S3_META_REQUEST,
420+
"id=%p Cannot create meta s3 request; for trailer checksum, the original request cannot be "
421+
"aws-chunked encoding. The client will encode the request instead.",
422+
(void *)log_id);
423+
aws_raise_error(AWS_ERROR_INVALID_ARGUMENT);
424+
return AWS_OP_ERR;
425+
}
426+
}
343427
}
428+
if (config->location != AWS_SCL_NONE && config->checksum_algorithm == AWS_SCA_NONE) {
429+
AWS_LOGF_ERROR(
430+
AWS_LS_S3_META_REQUEST,
431+
"id=%p Cannot create meta s3 request; checksum location is set, but no checksum algorithm selected.",
432+
(void *)log_id);
433+
aws_raise_error(AWS_ERROR_INVALID_ARGUMENT);
434+
return AWS_OP_ERR;
435+
}
436+
344437
internal_config->checksum_algorithm = config->checksum_algorithm;
345438
internal_config->location = config->location;
346439
internal_config->validate_response_checksum = config->validate_response_checksum;
@@ -385,6 +478,14 @@ void aws_checksum_config_storage_init(
385478
internal_config->response_checksum_algorithms.sha1 = true;
386479
internal_config->response_checksum_algorithms.sha256 = true;
387480
}
481+
482+
/* After applying settings from config, check the message header to override the corresponding settings. */
483+
if (s_init_and_verify_checksum_config_from_headers(internal_config, message, log_id)) {
484+
return AWS_OP_ERR;
485+
}
486+
/* Anything fail afterward will need to cleanup the storage. */
487+
488+
return AWS_OP_SUCCESS;
388489
}
389490

390491
void aws_checksum_config_storage_cleanup(struct checksum_config_storage *internal_config) {

source/s3_client.c

-30
Original file line numberDiff line numberDiff line change
@@ -945,36 +945,6 @@ struct aws_s3_meta_request *aws_s3_client_make_meta_request(
945945
return NULL;
946946
}
947947

948-
if (options->checksum_config) {
949-
if (options->checksum_config->location == AWS_SCL_TRAILER) {
950-
struct aws_http_headers *headers = aws_http_message_get_headers(options->message);
951-
struct aws_byte_cursor existing_encoding;
952-
AWS_ZERO_STRUCT(existing_encoding);
953-
if (aws_http_headers_get(headers, g_content_encoding_header_name, &existing_encoding) == AWS_OP_SUCCESS) {
954-
if (aws_byte_cursor_find_exact(&existing_encoding, &g_content_encoding_header_aws_chunked, NULL) ==
955-
AWS_OP_SUCCESS) {
956-
AWS_LOGF_ERROR(
957-
AWS_LS_S3_CLIENT,
958-
"id=%p Cannot create meta s3 request; for trailer checksum, the original request cannot be "
959-
"aws-chunked encoding. The client will encode the request instead.",
960-
(void *)client);
961-
aws_raise_error(AWS_ERROR_INVALID_ARGUMENT);
962-
return NULL;
963-
}
964-
}
965-
}
966-
967-
if (options->checksum_config->location != AWS_SCL_NONE &&
968-
options->checksum_config->checksum_algorithm == AWS_SCA_NONE) {
969-
AWS_LOGF_ERROR(
970-
AWS_LS_S3_CLIENT,
971-
"id=%p Cannot create meta s3 request; checksum location is set, but no checksum algorithm selected.",
972-
(void *)client);
973-
aws_raise_error(AWS_ERROR_INVALID_ARGUMENT);
974-
return NULL;
975-
}
976-
}
977-
978948
if (s_apply_endpoint_override(client, message_headers, options->endpoint)) {
979949
return NULL;
980950
}

source/s3_meta_request.c

+8-1
Original file line numberDiff line numberDiff line change
@@ -218,7 +218,14 @@ int aws_s3_meta_request_init_base(
218218

219219
*((size_t *)&meta_request->part_size) = part_size;
220220
*((bool *)&meta_request->should_compute_content_md5) = should_compute_content_md5;
221-
aws_checksum_config_storage_init(meta_request->allocator, &meta_request->checksum_config, options->checksum_config);
221+
if (aws_checksum_config_storage_init(
222+
meta_request->allocator,
223+
&meta_request->checksum_config,
224+
options->checksum_config,
225+
options->message,
226+
(void *)meta_request)) {
227+
goto error;
228+
}
222229

223230
if (options->signing_config) {
224231
meta_request->cached_signing_config = aws_cached_signing_config_new(client, options->signing_config);

tests/CMakeLists.txt

+1
Original file line numberDiff line numberDiff line change
@@ -186,6 +186,7 @@ add_net_test_case(test_s3_round_trip_with_filepath)
186186
add_net_test_case(test_s3_round_trip_mpu_with_filepath)
187187
add_net_test_case(test_s3_round_trip_with_filepath_no_content_length)
188188
add_net_test_case(test_s3_round_trip_mpu_with_filepath_no_content_length)
189+
add_net_test_case(test_s3_round_trip_default_get_full_object_checksum_fc)
189190
add_net_test_case(test_s3_round_trip_mpu_multipart_get_full_object_checksum_fc)
190191
add_net_test_case(test_s3_round_trip_mpu_multipart_get_full_object_checksum_fc_header)
191192
add_net_test_case(test_s3_round_trip_mpu_multipart_get_full_object_checksum_via_callback)

tests/s3_data_plane_tests.c

+19-3
Original file line numberDiff line numberDiff line change
@@ -3918,7 +3918,11 @@ void s_s3_test_no_validate_checksum(
39183918
}
39193919

39203920
/* TODO: maybe refactor the fc -> flexible checksum tests to be less copy/paste */
3921-
static int s_test_s3_round_trip_default_get_fc_helper(struct aws_allocator *allocator, void *ctx, bool via_header) {
3921+
static int s_test_s3_round_trip_default_get_fc_helper(
3922+
struct aws_allocator *allocator,
3923+
void *ctx,
3924+
bool via_header,
3925+
enum aws_s3_tester_full_object_checksum full_object_checksum) {
39223926
(void)ctx;
39233927

39243928
struct aws_s3_tester tester;
@@ -3960,6 +3964,10 @@ static int s_test_s3_round_trip_default_get_fc_helper(struct aws_allocator *allo
39603964
.object_path_override = object_path,
39613965
},
39623966
};
3967+
if (algorithm != AWS_SCA_SHA1 && algorithm != AWS_SCA_SHA256) {
3968+
/* Full object checksums doesn't support SHA. */
3969+
put_options.put_options.full_object_checksum = full_object_checksum;
3970+
}
39633971

39643972
ASSERT_SUCCESS(aws_s3_tester_send_meta_request_with_options(&tester, &put_options, NULL));
39653973

@@ -3992,12 +4000,18 @@ static int s_test_s3_round_trip_default_get_fc_helper(struct aws_allocator *allo
39924000

39934001
AWS_TEST_CASE(test_s3_round_trip_default_get_fc, s_test_s3_round_trip_default_get_fc)
39944002
static int s_test_s3_round_trip_default_get_fc(struct aws_allocator *allocator, void *ctx) {
3995-
return s_test_s3_round_trip_default_get_fc_helper(allocator, ctx, false);
4003+
return s_test_s3_round_trip_default_get_fc_helper(allocator, ctx, false, AWS_TEST_FOC_NONE);
39964004
}
39974005

39984006
AWS_TEST_CASE(test_s3_round_trip_default_get_fc_header, s_test_s3_round_trip_default_get_fc_header)
39994007
static int s_test_s3_round_trip_default_get_fc_header(struct aws_allocator *allocator, void *ctx) {
4000-
return s_test_s3_round_trip_default_get_fc_helper(allocator, ctx, true);
4008+
return s_test_s3_round_trip_default_get_fc_helper(allocator, ctx, true, AWS_TEST_FOC_NONE);
4009+
}
4010+
AWS_TEST_CASE(
4011+
test_s3_round_trip_default_get_full_object_checksum_fc,
4012+
s_test_s3_round_trip_default_get_full_object_checksum_fc)
4013+
static int s_test_s3_round_trip_default_get_full_object_checksum_fc(struct aws_allocator *allocator, void *ctx) {
4014+
return s_test_s3_round_trip_default_get_fc_helper(allocator, ctx, false, AWS_TEST_FOC_HEADER);
40014015
}
40024016

40034017
static int s_test_s3_round_trip_multipart_get_fc_helper(struct aws_allocator *allocator, void *ctx, bool via_header) {
@@ -4066,6 +4080,7 @@ AWS_TEST_CASE(test_s3_round_trip_multipart_get_fc, s_test_s3_round_trip_multipar
40664080
static int s_test_s3_round_trip_multipart_get_fc(struct aws_allocator *allocator, void *ctx) {
40674081
return s_test_s3_round_trip_multipart_get_fc_helper(allocator, ctx, false);
40684082
}
4083+
40694084
AWS_TEST_CASE(test_s3_round_trip_multipart_get_fc_header, s_test_s3_round_trip_multipart_get_fc_header)
40704085
static int s_test_s3_round_trip_multipart_get_fc_header(struct aws_allocator *allocator, void *ctx) {
40714086
return s_test_s3_round_trip_multipart_get_fc_helper(allocator, ctx, true);
@@ -4166,6 +4181,7 @@ AWS_TEST_CASE(
41664181
static int s_test_s3_round_trip_mpu_multipart_get_full_object_checksum_fc(struct aws_allocator *allocator, void *ctx) {
41674182
return s_test_s3_round_trip_mpu_multipart_get_fc_helper(allocator, ctx, false, AWS_TEST_FOC_HEADER);
41684183
}
4184+
41694185
AWS_TEST_CASE(
41704186
test_s3_round_trip_mpu_multipart_get_full_object_checksum_fc_header,
41714187
s_test_s3_round_trip_mpu_multipart_get_full_object_checksum_fc_header)

0 commit comments

Comments
 (0)