Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

feat(services/s3): add append support #5428

Open
wants to merge 3 commits into
base: main
Choose a base branch
from
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
23 changes: 19 additions & 4 deletions core/src/services/s3/backend.rs
Original file line number Diff line number Diff line change
Expand Up @@ -564,6 +564,12 @@ impl S3Builder {
self
}

/// Enable write with append.
///
/// Sets `enable_write_with_append` on the builder's config to `true` and
/// returns the builder so that calls can be chained. With the flag set,
/// opendal will send write requests with the append header
/// (`x-amz-write-offset-bytes`) when an append write is requested.
///
/// NOTE(review): presumably not every S3-compatible service or storage class
/// accepts append writes — confirm against the target service before enabling.
pub fn enable_write_with_append(mut self) -> Self {
self.config.enable_write_with_append = true;
self
}

/// Detect region of S3 bucket.
///
/// # Args
Expand Down Expand Up @@ -895,6 +901,7 @@ impl Builder for S3Builder {
checksum_algorithm,
delete_max_size,
disable_write_with_if_match: self.config.disable_write_with_if_match,
enable_write_with_append: self.config.enable_write_with_append,
}),
})
}
Expand Down Expand Up @@ -956,6 +963,8 @@ impl Access for S3Backend {
write: true,
write_can_empty: true,
write_can_multi: true,
write_can_append: self.core.enable_write_with_append,

write_with_cache_control: true,
write_with_content_type: true,
write_with_content_encoding: true,
Expand Down Expand Up @@ -1048,11 +1057,17 @@ impl Access for S3Backend {
}

/// Create a writer for `path`.
///
/// When `args.append()` is set, the returned writer is an `oio::AppendWriter`
/// (`S3Writers::Two`); otherwise it is an `oio::MultipartWriter`
/// (`S3Writers::One`) configured with the executor and concurrency taken
/// from `args`.
async fn write(&self, path: &str, args: OpWrite) -> Result<(RpWrite, Self::Writer)> {
    // Read everything that is needed from `args` before it is moved into the
    // writer, so that no clone of the whole `OpWrite` is required.
    let append = args.append();
    let executor = args.executor().cloned();
    let concurrent = args.concurrent();

    let writer = S3Writer::new(self.core.clone(), path, args);

    let w = if append {
        S3Writers::Two(oio::AppendWriter::new(writer))
    } else {
        S3Writers::One(oio::MultipartWriter::new(writer, executor, concurrent))
    };

    Ok((RpWrite::default(), w))
}
Expand Down
4 changes: 4 additions & 0 deletions core/src/services/s3/config.rs
Original file line number Diff line number Diff line change
Expand Up @@ -143,6 +143,7 @@ pub struct S3Config {
/// - `GLACIER_IR`
/// - `INTELLIGENT_TIERING`
/// - `ONEZONE_IA`
/// - `EXPRESS_ONEZONE`
/// - `OUTPOSTS`
/// - `REDUCED_REDUNDANCY`
/// - `STANDARD`
Expand Down Expand Up @@ -188,6 +189,9 @@ pub struct S3Config {
///
/// For example, Ceph RADOS S3 doesn't support write with if match.
pub disable_write_with_if_match: bool,

/// Enable write with append so that opendal will send write requests with the append header (`x-amz-write-offset-bytes`).
pub enable_write_with_append: bool,
}

impl Debug for S3Config {
Expand Down
112 changes: 76 additions & 36 deletions core/src/services/s3/core.rs
Original file line number Diff line number Diff line change
Expand Up @@ -70,6 +70,8 @@ pub mod constants {
pub const X_AMZ_COPY_SOURCE_SERVER_SIDE_ENCRYPTION_CUSTOMER_KEY_MD5: &str =
"x-amz-copy-source-server-side-encryption-customer-key-md5";

pub const X_AMZ_WRITE_OFFSET_BYTES: &str = "x-amz-write-offset-bytes";

pub const X_AMZ_META_PREFIX: &str = "x-amz-meta-";

pub const RESPONSE_CONTENT_DISPOSITION: &str = "response-content-disposition";
Expand Down Expand Up @@ -100,6 +102,7 @@ pub struct S3Core {
pub delete_max_size: usize,
pub checksum_algorithm: Option<ChecksumAlgorithm>,
pub disable_write_with_if_match: bool,
pub enable_write_with_append: bool,
}

impl Debug for S3Core {
Expand Down Expand Up @@ -289,6 +292,54 @@ impl S3Core {
}
req
}

/// Attach the write-related headers for an object upload to `req`.
///
/// Each header is added only when its value is available:
///
/// - `CONTENT_LENGTH` from `size`.
/// - `CONTENT_TYPE`, `CONTENT_DISPOSITION`, `CONTENT_ENCODING`,
///   `CACHE_CONTROL` and `IF_MATCH` from the matching getters on `args`.
/// - `IF_NONE_MATCH: *` when `args.if_not_exists()` is true.
/// - The storage class header when `default_storage_class` is configured.
/// - One `X_AMZ_META_PREFIX`-prefixed header per user metadata entry.
///
/// Returns the request builder with the headers applied.
pub fn insert_metadata_headers(
    &self,
    mut req: http::request::Builder,
    size: Option<u64>,
    args: &OpWrite,
) -> http::request::Builder {
    if let Some(content_length) = size {
        req = req.header(CONTENT_LENGTH, content_length.to_string());
    }

    // Optional headers that map one-to-one onto a write argument, listed in
    // the order in which they are applied to the request.
    let optional_headers = [
        (CONTENT_TYPE, args.content_type()),
        (CONTENT_DISPOSITION, args.content_disposition()),
        (CONTENT_ENCODING, args.content_encoding()),
        (CACHE_CONTROL, args.cache_control()),
        (IF_MATCH, args.if_match()),
    ];
    for (name, value) in optional_headers {
        if let Some(value) = value {
            req = req.header(name, value);
        }
    }

    if args.if_not_exists() {
        req = req.header(IF_NONE_MATCH, "*");
    }

    // Storage class configured on the core, if any.
    if let Some(storage_class) = &self.default_storage_class {
        req = req.header(
            HeaderName::from_static(constants::X_AMZ_STORAGE_CLASS),
            storage_class,
        );
    }

    // User metadata entries become individual prefixed headers.
    match args.user_metadata() {
        Some(entries) => entries.iter().fold(req, |builder, (key, value)| {
            builder.header(format!("{X_AMZ_META_PREFIX}{key}"), value)
        }),
        None => req,
    }
}
}

impl S3Core {
Expand Down Expand Up @@ -468,55 +519,44 @@ impl S3Core {

let mut req = Request::put(&url);

if let Some(size) = size {
req = req.header(CONTENT_LENGTH, size.to_string())
}
req = self.insert_metadata_headers(req, size, args);

if let Some(mime) = args.content_type() {
req = req.header(CONTENT_TYPE, mime)
}
// Set SSE headers.
req = self.insert_sse_headers(req, true);

if let Some(pos) = args.content_disposition() {
req = req.header(CONTENT_DISPOSITION, pos)
// Calculate Checksum.
if let Some(checksum) = self.calculate_checksum(&body) {
// Set Checksum header.
req = self.insert_checksum_header(req, &checksum);
}

if let Some(encoding) = args.content_encoding() {
req = req.header(CONTENT_ENCODING, encoding);
}
// Set body
let req = req.body(body).map_err(new_request_build_error)?;

if let Some(cache_control) = args.cache_control() {
req = req.header(CACHE_CONTROL, cache_control)
}
Ok(req)
}

if let Some(if_match) = args.if_match() {
req = req.header(IF_MATCH, if_match);
}
pub fn s3_append_object_request(
&self,
path: &str,
position: u64,
size: u64,
args: &OpWrite,
body: Buffer,
) -> Result<Request<Buffer>> {
let p = build_abs_path(&self.root, path);

if args.if_not_exists() {
req = req.header(IF_NONE_MATCH, "*");
}
let url = format!("{}/{}", self.endpoint, percent_encode_path(&p));

// Set storage class header
if let Some(v) = &self.default_storage_class {
req = req.header(HeaderName::from_static(constants::X_AMZ_STORAGE_CLASS), v);
}
let mut req = Request::put(&url);

// Set user metadata headers.
if let Some(user_metadata) = args.user_metadata() {
for (key, value) in user_metadata {
req = req.header(format!("{X_AMZ_META_PREFIX}{key}"), value)
}
}
req = self.insert_metadata_headers(req, Some(size), args);
Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Hi, I assume that only the first append call supports setting up metadata. We don't need to repeat the metadata for subsequent append requests.

Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Hi, so sorry for the late reply! I've had two crazy weeks after the holidays :(

I may not follow what you mean but it seems we could set up the metadata after the first one?
image


req = req.header(constants::X_AMZ_WRITE_OFFSET_BYTES, position.to_string());

// Set SSE headers.
req = self.insert_sse_headers(req, true);

// Calculate Checksum.
if let Some(checksum) = self.calculate_checksum(&body) {
// Set Checksum header.
req = self.insert_checksum_header(req, &checksum);
}

// Set body
let req = req.body(body).map_err(new_request_build_error)?;

Expand Down
1 change: 1 addition & 0 deletions core/src/services/s3/docs.md
Original file line number Diff line number Diff line change
Expand Up @@ -5,6 +5,7 @@ This service can be used to:
- [x] stat
- [x] read
- [x] write
- [x] append
- [x] create_dir
- [x] delete
- [x] copy
Expand Down
36 changes: 35 additions & 1 deletion core/src/services/s3/writer.rs
Original file line number Diff line number Diff line change
Expand Up @@ -27,7 +27,7 @@ use super::error::S3Error;
use crate::raw::*;
use crate::*;

/// Writer type produced by the S3 backend: the first variant wraps the
/// multipart writer, the second wraps the append writer.
pub type S3Writers = TwoWays<oio::MultipartWriter<S3Writer>, oio::AppendWriter<S3Writer>>;

pub struct S3Writer {
core: Arc<S3Core>,
Expand Down Expand Up @@ -188,3 +188,37 @@ impl oio::MultipartWrite for S3Writer {
}
}
}

impl oio::AppendWrite for S3Writer {
    /// Return the offset at which the next append should start.
    ///
    /// Issues a head-object request for the writer's path: a `200 OK`
    /// response yields the parsed content length (or `0` when the header is
    /// absent), a `404 Not Found` yields `0`, and any other status is turned
    /// into an error via `parse_error`.
    async fn offset(&self) -> Result<u64> {
        let head = self
            .core
            .s3_head_object(&self.path, OpStat::default())
            .await?;

        // A missing object means the append starts from the beginning.
        if head.status() == StatusCode::NOT_FOUND {
            return Ok(0);
        }
        if head.status() != StatusCode::OK {
            return Err(parse_error(head));
        }

        let length = parse_content_length(head.headers())?;
        Ok(length.unwrap_or_default())
    }

    /// Append `body` of `size` bytes to the object at `offset`.
    ///
    /// Builds the append request, signs it, sends it, and treats only a
    /// `200 OK` response as success; every other status is converted into an
    /// error via `parse_error`.
    async fn append(&self, offset: u64, size: u64, body: Buffer) -> Result<()> {
        let mut request =
            self.core
                .s3_append_object_request(&self.path, offset, size, &self.op, body)?;

        self.core.sign(&mut request).await?;

        let response = self.core.send(request).await?;

        if response.status() == StatusCode::OK {
            Ok(())
        } else {
            Err(parse_error(response))
        }
    }
}
Loading