2022-04-07 17:01:04 +00:00
|
|
|
use std::pin::Pin;
|
2020-04-28 10:18:14 +00:00
|
|
|
use std::sync::Arc;
|
2022-01-11 11:43:46 +00:00
|
|
|
use std::time::{Duration, SystemTime, UNIX_EPOCH};
|
2020-04-28 10:18:14 +00:00
|
|
|
|
2023-05-03 10:02:59 +00:00
|
|
|
use futures::{stream, stream::Stream, StreamExt};
|
2022-01-11 16:31:09 +00:00
|
|
|
use md5::{Digest as Md5Digest, Md5};
|
|
|
|
|
2022-07-22 16:20:27 +00:00
|
|
|
use bytes::Bytes;
|
2024-02-05 17:49:54 +00:00
|
|
|
use hyper::{Request, Response};
|
2022-01-11 16:31:09 +00:00
|
|
|
use serde::Serialize;
|
2020-04-28 10:18:14 +00:00
|
|
|
|
2024-02-13 11:55:41 +00:00
|
|
|
use garage_net::bytes_buf::BytesBuf;
|
2022-09-01 10:58:20 +00:00
|
|
|
use garage_rpc::rpc_helper::OrderTag;
|
2020-04-28 10:18:14 +00:00
|
|
|
use garage_table::*;
|
|
|
|
use garage_util::data::*;
|
2021-03-15 15:21:41 +00:00
|
|
|
use garage_util::time::*;
|
2020-04-28 10:18:14 +00:00
|
|
|
|
2020-07-07 11:59:22 +00:00
|
|
|
use garage_model::garage::Garage;
|
2022-01-11 16:31:09 +00:00
|
|
|
use garage_model::key_table::Key;
|
2022-05-10 11:16:57 +00:00
|
|
|
use garage_model::s3::block_ref_table::*;
|
2023-05-03 10:02:59 +00:00
|
|
|
use garage_model::s3::mpu_table::*;
|
2022-05-10 11:16:57 +00:00
|
|
|
use garage_model::s3::object_table::*;
|
|
|
|
use garage_model::s3::version_table::*;
|
2020-04-28 10:18:14 +00:00
|
|
|
|
2024-02-05 17:49:54 +00:00
|
|
|
use crate::helpers::*;
|
|
|
|
use crate::s3::api_server::{ReqBody, ResBody};
|
2022-05-24 10:16:39 +00:00
|
|
|
use crate::s3::error::*;
|
2023-05-03 10:02:59 +00:00
|
|
|
use crate::s3::multipart;
|
|
|
|
use crate::s3::put::get_headers;
|
2022-05-10 11:16:57 +00:00
|
|
|
use crate::s3::xml::{self as s3_xml, xmlns_tag};
|
2020-11-08 14:04:30 +00:00
|
|
|
|
2020-04-28 10:18:14 +00:00
|
|
|
pub async fn handle_copy(
|
|
|
|
garage: Arc<Garage>,
|
2022-01-11 16:31:09 +00:00
|
|
|
api_key: &Key,
|
2024-02-05 17:49:54 +00:00
|
|
|
req: &Request<ReqBody>,
|
2021-12-14 12:55:11 +00:00
|
|
|
dest_bucket_id: Uuid,
|
2020-04-28 10:18:14 +00:00
|
|
|
dest_key: &str,
|
2024-02-05 17:49:54 +00:00
|
|
|
) -> Result<Response<ResBody>, Error> {
|
2022-01-11 11:43:46 +00:00
|
|
|
let copy_precondition = CopyPreconditionHeaders::parse(req)?;
|
|
|
|
|
2022-01-11 16:31:09 +00:00
|
|
|
let source_object = get_copy_source(&garage, api_key, req).await?;
|
2020-04-28 10:18:14 +00:00
|
|
|
|
2022-01-11 16:31:09 +00:00
|
|
|
let (source_version, source_version_data, source_version_meta) =
|
|
|
|
extract_source_info(&source_object)?;
|
2020-11-11 15:12:42 +00:00
|
|
|
|
2022-01-11 16:31:09 +00:00
|
|
|
// Check precondition, e.g. x-amz-copy-source-if-match
|
|
|
|
copy_precondition.check(source_version, &source_version_meta.etag)?;
|
2020-04-28 10:18:14 +00:00
|
|
|
|
2022-01-11 16:31:09 +00:00
|
|
|
// Generate parameters for copied object
|
2020-04-28 10:18:14 +00:00
|
|
|
let new_uuid = gen_uuid();
|
2021-03-15 14:26:29 +00:00
|
|
|
let new_timestamp = now_msec();
|
2020-04-28 10:18:14 +00:00
|
|
|
|
2021-03-15 15:21:41 +00:00
|
|
|
// Implement x-amz-metadata-directive: REPLACE
|
|
|
|
let new_meta = match req.headers().get("x-amz-metadata-directive") {
|
|
|
|
Some(v) if v == hyper::header::HeaderValue::from_static("REPLACE") => ObjectVersionMeta {
|
2022-02-21 22:02:30 +00:00
|
|
|
headers: get_headers(req.headers())?,
|
2022-01-11 16:31:09 +00:00
|
|
|
size: source_version_meta.size,
|
|
|
|
etag: source_version_meta.etag.clone(),
|
2021-03-15 15:21:41 +00:00
|
|
|
},
|
2022-01-11 16:31:09 +00:00
|
|
|
_ => source_version_meta.clone(),
|
2021-03-15 15:21:41 +00:00
|
|
|
};
|
|
|
|
|
2021-05-03 20:45:42 +00:00
|
|
|
let etag = new_meta.etag.to_string();
|
|
|
|
|
2021-03-15 15:21:41 +00:00
|
|
|
// Save object copy
|
2022-01-11 16:31:09 +00:00
|
|
|
match source_version_data {
|
2021-03-15 15:21:41 +00:00
|
|
|
ObjectVersionData::DeleteMarker => unreachable!(),
|
|
|
|
ObjectVersionData::Inline(_meta, bytes) => {
|
|
|
|
let dest_object_version = ObjectVersion {
|
|
|
|
uuid: new_uuid,
|
|
|
|
timestamp: new_timestamp,
|
|
|
|
state: ObjectVersionState::Complete(ObjectVersionData::Inline(
|
|
|
|
new_meta,
|
|
|
|
bytes.clone(),
|
|
|
|
)),
|
|
|
|
};
|
|
|
|
let dest_object = Object::new(
|
2021-12-14 12:55:11 +00:00
|
|
|
dest_bucket_id,
|
2021-03-15 15:21:41 +00:00
|
|
|
dest_key.to_string(),
|
|
|
|
vec![dest_object_version],
|
|
|
|
);
|
2020-04-28 10:18:14 +00:00
|
|
|
garage.object_table.insert(&dest_object).await?;
|
|
|
|
}
|
2021-03-15 15:21:41 +00:00
|
|
|
ObjectVersionData::FirstBlock(_meta, first_block_hash) => {
|
2021-03-15 14:26:29 +00:00
|
|
|
// Get block list from source version
|
2020-04-28 10:18:14 +00:00
|
|
|
let source_version = garage
|
|
|
|
.version_table
|
2022-01-11 16:31:09 +00:00
|
|
|
.get(&source_version.uuid, &EmptyKey)
|
2020-04-28 10:18:14 +00:00
|
|
|
.await?;
|
2022-01-05 16:07:36 +00:00
|
|
|
let source_version = source_version.ok_or(Error::NoSuchKey)?;
|
2020-04-28 10:18:14 +00:00
|
|
|
|
2021-03-15 14:26:29 +00:00
|
|
|
// Write an "uploading" marker in Object table
|
|
|
|
// This holds a reference to the object in the Version table
|
|
|
|
// so that it won't be deleted, e.g. by repair_versions.
|
|
|
|
let tmp_dest_object_version = ObjectVersion {
|
|
|
|
uuid: new_uuid,
|
|
|
|
timestamp: new_timestamp,
|
2023-05-03 10:02:59 +00:00
|
|
|
state: ObjectVersionState::Uploading {
|
|
|
|
headers: new_meta.headers.clone(),
|
|
|
|
multipart: false,
|
|
|
|
},
|
2021-03-15 14:26:29 +00:00
|
|
|
};
|
|
|
|
let tmp_dest_object = Object::new(
|
2021-12-14 12:55:11 +00:00
|
|
|
dest_bucket_id,
|
2021-03-15 14:26:29 +00:00
|
|
|
dest_key.to_string(),
|
|
|
|
vec![tmp_dest_object_version],
|
|
|
|
);
|
|
|
|
garage.object_table.insert(&tmp_dest_object).await?;
|
|
|
|
|
|
|
|
// Write version in the version table. Even with empty block list,
|
|
|
|
// this means that the BlockRef entries linked to this version cannot be
|
|
|
|
// marked as deleted (they are marked as deleted only if the Version
|
|
|
|
// doesn't exist or is marked as deleted).
|
2023-05-03 10:02:59 +00:00
|
|
|
let mut dest_version = Version::new(
|
|
|
|
new_uuid,
|
|
|
|
VersionBacklink::Object {
|
|
|
|
bucket_id: dest_bucket_id,
|
|
|
|
key: dest_key.to_string(),
|
|
|
|
},
|
|
|
|
false,
|
|
|
|
);
|
2021-03-15 14:26:29 +00:00
|
|
|
garage.version_table.insert(&dest_version).await?;
|
|
|
|
|
|
|
|
// Fill in block list for version and insert block refs
|
2021-03-10 15:21:56 +00:00
|
|
|
for (bk, bv) in source_version.blocks.items().iter() {
|
|
|
|
dest_version.blocks.put(*bk, *bv);
|
|
|
|
}
|
2020-04-28 10:18:14 +00:00
|
|
|
let dest_block_refs = dest_version
|
2021-03-10 15:21:56 +00:00
|
|
|
.blocks
|
|
|
|
.items()
|
2020-04-28 10:18:14 +00:00
|
|
|
.iter()
|
|
|
|
.map(|b| BlockRef {
|
2021-03-10 15:21:56 +00:00
|
|
|
block: b.1.hash,
|
2020-04-28 10:18:14 +00:00
|
|
|
version: new_uuid,
|
2021-03-10 15:21:56 +00:00
|
|
|
deleted: false.into(),
|
2020-04-28 10:18:14 +00:00
|
|
|
})
|
|
|
|
.collect::<Vec<_>>();
|
|
|
|
futures::try_join!(
|
|
|
|
garage.version_table.insert(&dest_version),
|
|
|
|
garage.block_ref_table.insert_many(&dest_block_refs[..]),
|
|
|
|
)?;
|
2021-03-15 14:26:29 +00:00
|
|
|
|
|
|
|
// Insert final object
|
|
|
|
// We do this last because otherwise there is a race condition in the case where
|
|
|
|
// the copy call has the same source and destination (this happens, rclone does
|
|
|
|
// it to update the modification timestamp for instance). If we did this concurrently
|
|
|
|
// with the stuff before, the block's reference counts could be decremented before
|
|
|
|
// they are incremented again for the new version, leading to data being deleted.
|
2021-03-15 15:21:41 +00:00
|
|
|
let dest_object_version = ObjectVersion {
|
|
|
|
uuid: new_uuid,
|
|
|
|
timestamp: new_timestamp,
|
|
|
|
state: ObjectVersionState::Complete(ObjectVersionData::FirstBlock(
|
|
|
|
new_meta,
|
|
|
|
*first_block_hash,
|
|
|
|
)),
|
|
|
|
};
|
|
|
|
let dest_object = Object::new(
|
2021-12-14 12:55:11 +00:00
|
|
|
dest_bucket_id,
|
2021-03-15 15:21:41 +00:00
|
|
|
dest_key.to_string(),
|
|
|
|
vec![dest_object_version],
|
|
|
|
);
|
2021-03-15 14:26:29 +00:00
|
|
|
garage.object_table.insert(&dest_object).await?;
|
2020-04-28 10:18:14 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-03-15 15:21:41 +00:00
|
|
|
let last_modified = msec_to_rfc3339(new_timestamp);
|
2022-01-12 10:41:20 +00:00
|
|
|
let result = CopyObjectResult {
|
2021-05-03 20:45:42 +00:00
|
|
|
last_modified: s3_xml::Value(last_modified),
|
2022-01-12 10:41:20 +00:00
|
|
|
etag: s3_xml::Value(format!("\"{}\"", etag)),
|
2021-05-03 20:45:42 +00:00
|
|
|
};
|
|
|
|
let xml = s3_xml::to_xml_with_header(&result)?;
|
2020-04-28 10:18:14 +00:00
|
|
|
|
2021-02-19 22:40:18 +00:00
|
|
|
Ok(Response::builder()
|
2021-02-23 17:46:25 +00:00
|
|
|
.header("Content-Type", "application/xml")
|
2022-01-11 11:43:46 +00:00
|
|
|
.header("x-amz-version-id", hex::encode(new_uuid))
|
|
|
|
.header(
|
|
|
|
"x-amz-copy-source-version-id",
|
2022-01-11 16:31:09 +00:00
|
|
|
hex::encode(source_version.uuid),
|
2022-01-11 11:43:46 +00:00
|
|
|
)
|
2024-02-05 17:49:54 +00:00
|
|
|
.body(string_body(xml))?)
|
2020-04-28 10:18:14 +00:00
|
|
|
}
|
2022-01-11 11:43:46 +00:00
|
|
|
|
2022-01-11 16:31:09 +00:00
|
|
|
pub async fn handle_upload_part_copy(
|
|
|
|
garage: Arc<Garage>,
|
|
|
|
api_key: &Key,
|
2024-02-05 17:49:54 +00:00
|
|
|
req: &Request<ReqBody>,
|
2022-01-11 16:31:09 +00:00
|
|
|
dest_bucket_id: Uuid,
|
|
|
|
dest_key: &str,
|
|
|
|
part_number: u64,
|
|
|
|
upload_id: &str,
|
2024-02-05 17:49:54 +00:00
|
|
|
) -> Result<Response<ResBody>, Error> {
|
2022-01-11 16:31:09 +00:00
|
|
|
let copy_precondition = CopyPreconditionHeaders::parse(req)?;
|
|
|
|
|
2023-05-03 10:02:59 +00:00
|
|
|
let dest_upload_id = multipart::decode_upload_id(upload_id)?;
|
2022-01-11 16:31:09 +00:00
|
|
|
|
|
|
|
let dest_key = dest_key.to_string();
|
2023-05-03 10:02:59 +00:00
|
|
|
let (source_object, (_, _, mut dest_mpu)) = futures::try_join!(
|
2022-01-11 16:31:09 +00:00
|
|
|
get_copy_source(&garage, api_key, req),
|
2023-05-03 10:02:59 +00:00
|
|
|
multipart::get_upload(&garage, &dest_bucket_id, &dest_key, &dest_upload_id)
|
2022-01-11 16:31:09 +00:00
|
|
|
)?;
|
|
|
|
|
|
|
|
let (source_object_version, source_version_data, source_version_meta) =
|
|
|
|
extract_source_info(&source_object)?;
|
|
|
|
|
|
|
|
// Check precondition on source, e.g. x-amz-copy-source-if-match
|
|
|
|
copy_precondition.check(source_object_version, &source_version_meta.etag)?;
|
|
|
|
|
|
|
|
// Check source range is valid
|
|
|
|
let source_range = match req.headers().get("x-amz-copy-source-range") {
|
|
|
|
Some(range) => {
|
|
|
|
let range_str = range.to_str()?;
|
|
|
|
let mut ranges = http_range::HttpRange::parse(range_str, source_version_meta.size)
|
|
|
|
.map_err(|e| (e, source_version_meta.size))?;
|
|
|
|
if ranges.len() != 1 {
|
2022-05-24 10:16:39 +00:00
|
|
|
return Err(Error::bad_request(
|
|
|
|
"Invalid x-amz-copy-source-range header: exactly 1 range must be given",
|
2022-01-11 16:31:09 +00:00
|
|
|
));
|
|
|
|
} else {
|
|
|
|
ranges.pop().unwrap()
|
|
|
|
}
|
|
|
|
}
|
|
|
|
None => http_range::HttpRange {
|
|
|
|
start: 0,
|
|
|
|
length: source_version_meta.size,
|
|
|
|
},
|
|
|
|
};
|
|
|
|
|
|
|
|
// Check source version is not inlined
|
|
|
|
match source_version_data {
|
|
|
|
ObjectVersionData::DeleteMarker => unreachable!(),
|
|
|
|
ObjectVersionData::Inline(_meta, _bytes) => {
|
|
|
|
// This is only for small files, we don't bother handling this.
|
|
|
|
// (in AWS UploadPartCopy works for parts at least 5MB which
|
|
|
|
// is never the case of an inline object)
|
2022-05-24 10:16:39 +00:00
|
|
|
return Err(Error::bad_request(
|
|
|
|
"Source object is too small (minimum part size is 5Mb)",
|
2022-01-11 16:31:09 +00:00
|
|
|
));
|
|
|
|
}
|
|
|
|
ObjectVersionData::FirstBlock(_meta, _first_block_hash) => (),
|
|
|
|
};
|
|
|
|
|
|
|
|
// Fetch source versin with its block list,
|
|
|
|
// and destination version to check part hasn't yet been uploaded
|
2023-05-03 10:02:59 +00:00
|
|
|
let source_version = garage
|
|
|
|
.version_table
|
|
|
|
.get(&source_object_version.uuid, &EmptyKey)
|
|
|
|
.await?
|
|
|
|
.ok_or(Error::NoSuchKey)?;
|
2022-01-11 16:31:09 +00:00
|
|
|
|
|
|
|
// We want to reuse blocks from the source version as much as possible.
|
|
|
|
// However, we still need to get the data from these blocks
|
|
|
|
// because we need to know it to calculate the MD5sum of the part
|
|
|
|
// which is used as its ETag.
|
|
|
|
|
|
|
|
// First, calculate what blocks we want to keep,
|
|
|
|
// and the subrange of the block to take, if the bounds of the
|
|
|
|
// requested range are in the middle.
|
|
|
|
let (range_begin, range_end) = (source_range.start, source_range.start + source_range.length);
|
|
|
|
|
|
|
|
let mut blocks_to_copy = vec![];
|
|
|
|
let mut current_offset = 0;
|
|
|
|
for (_bk, block) in source_version.blocks.items().iter() {
|
|
|
|
let (block_begin, block_end) = (current_offset, current_offset + block.size);
|
|
|
|
|
|
|
|
if block_begin < range_end && block_end > range_begin {
|
|
|
|
let subrange_begin = if block_begin < range_begin {
|
|
|
|
Some(range_begin - block_begin)
|
|
|
|
} else {
|
|
|
|
None
|
|
|
|
};
|
|
|
|
let subrange_end = if block_end > range_end {
|
|
|
|
Some(range_end - block_begin)
|
|
|
|
} else {
|
|
|
|
None
|
|
|
|
};
|
|
|
|
let range_to_copy = match (subrange_begin, subrange_end) {
|
|
|
|
(Some(b), Some(e)) => Some(b as usize..e as usize),
|
|
|
|
(None, Some(e)) => Some(0..e as usize),
|
|
|
|
(Some(b), None) => Some(b as usize..block.size as usize),
|
|
|
|
(None, None) => None,
|
|
|
|
};
|
|
|
|
|
|
|
|
blocks_to_copy.push((block.hash, range_to_copy));
|
|
|
|
}
|
|
|
|
|
|
|
|
current_offset = block_end;
|
|
|
|
}
|
|
|
|
|
2023-05-03 10:02:59 +00:00
|
|
|
// Calculate the identity of destination part: timestamp, version id
|
|
|
|
let dest_version_id = gen_uuid();
|
|
|
|
let dest_mpu_part_key = MpuPartKey {
|
|
|
|
part_number,
|
|
|
|
timestamp: dest_mpu.next_timestamp(part_number),
|
|
|
|
};
|
|
|
|
|
|
|
|
// Create the uploaded part
|
|
|
|
dest_mpu.parts.clear();
|
|
|
|
dest_mpu.parts.put(
|
|
|
|
dest_mpu_part_key,
|
|
|
|
MpuPart {
|
|
|
|
version: dest_version_id,
|
|
|
|
etag: None,
|
|
|
|
size: None,
|
|
|
|
},
|
|
|
|
);
|
|
|
|
garage.mpu_table.insert(&dest_mpu).await?;
|
|
|
|
|
|
|
|
let mut dest_version = Version::new(
|
|
|
|
dest_version_id,
|
|
|
|
VersionBacklink::MultipartUpload {
|
|
|
|
upload_id: dest_upload_id,
|
|
|
|
},
|
|
|
|
false,
|
|
|
|
);
|
|
|
|
|
2022-01-11 16:31:09 +00:00
|
|
|
// Now, actually copy the blocks
|
|
|
|
let mut md5hasher = Md5::new();
|
|
|
|
|
2022-04-07 16:38:32 +00:00
|
|
|
// First, create a stream that is able to read the source blocks
|
|
|
|
// and extract the subrange if necessary.
|
|
|
|
// The second returned value is an Option<Hash>, that is Some
|
|
|
|
// if and only if the block returned is a block that already existed
|
|
|
|
// in the Garage data store (thus we don't need to save it again).
|
|
|
|
let garage2 = garage.clone();
|
2022-09-01 10:58:20 +00:00
|
|
|
let order_stream = OrderTag::stream();
|
2022-04-07 16:38:32 +00:00
|
|
|
let source_blocks = stream::iter(blocks_to_copy)
|
2022-09-01 10:58:20 +00:00
|
|
|
.enumerate()
|
|
|
|
.flat_map(|(i, (block_hash, range_to_copy))| {
|
2022-04-07 16:38:32 +00:00
|
|
|
let garage3 = garage2.clone();
|
|
|
|
stream::once(async move {
|
2022-09-01 10:58:20 +00:00
|
|
|
let data = garage3
|
|
|
|
.block_manager
|
|
|
|
.rpc_get_block(&block_hash, Some(order_stream.order(i as u64)))
|
|
|
|
.await?;
|
2022-04-07 16:38:32 +00:00
|
|
|
match range_to_copy {
|
2022-07-22 16:20:27 +00:00
|
|
|
Some(r) => Ok((data.slice(r), None)),
|
2022-04-07 16:38:32 +00:00
|
|
|
None => Ok((data, Some(block_hash))),
|
|
|
|
}
|
|
|
|
})
|
|
|
|
})
|
|
|
|
.peekable();
|
2022-01-11 16:31:09 +00:00
|
|
|
|
2022-04-07 17:01:04 +00:00
|
|
|
// The defragmenter is a custom stream (defined below) that concatenates
|
|
|
|
// consecutive block parts when they are too small.
|
|
|
|
// It returns a series of (Vec<u8>, Option<Hash>).
|
|
|
|
// When it is done, it returns an empty vec.
|
|
|
|
// Same as the previous iterator, the Option is Some(_) if and only if
|
|
|
|
// it's an existing block of the Garage data store.
|
|
|
|
let mut defragmenter = Defragmenter::new(garage.config.block_size, Box::pin(source_blocks));
|
2022-04-07 16:38:32 +00:00
|
|
|
|
2022-04-07 17:01:04 +00:00
|
|
|
let mut current_offset = 0;
|
|
|
|
let mut next_block = defragmenter.next().await?;
|
2022-04-07 16:38:32 +00:00
|
|
|
|
|
|
|
loop {
|
2022-04-07 17:01:04 +00:00
|
|
|
let (data, existing_block_hash) = next_block;
|
|
|
|
if data.is_empty() {
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
md5hasher.update(&data[..]);
|
|
|
|
|
|
|
|
let must_upload = existing_block_hash.is_none();
|
|
|
|
let final_hash = existing_block_hash.unwrap_or_else(|| blake2sum(&data[..]));
|
|
|
|
|
2023-05-03 10:02:59 +00:00
|
|
|
dest_version.blocks.clear();
|
|
|
|
dest_version.blocks.put(
|
2022-04-07 17:01:04 +00:00
|
|
|
VersionBlockKey {
|
|
|
|
part_number,
|
|
|
|
offset: current_offset,
|
|
|
|
},
|
|
|
|
VersionBlock {
|
|
|
|
hash: final_hash,
|
|
|
|
size: data.len() as u64,
|
|
|
|
},
|
|
|
|
);
|
|
|
|
current_offset += data.len() as u64;
|
|
|
|
|
|
|
|
let block_ref = BlockRef {
|
|
|
|
block: final_hash,
|
2023-05-03 10:02:59 +00:00
|
|
|
version: dest_version_id,
|
2022-04-07 17:01:04 +00:00
|
|
|
deleted: false.into(),
|
2022-01-11 16:31:09 +00:00
|
|
|
};
|
|
|
|
|
2022-04-07 17:01:04 +00:00
|
|
|
let garage2 = garage.clone();
|
|
|
|
let res = futures::try_join!(
|
|
|
|
// Thing 1: if the block is not exactly a block that existed before,
|
|
|
|
// we need to insert that data as a new block.
|
|
|
|
async move {
|
|
|
|
if must_upload {
|
2022-07-22 17:06:56 +00:00
|
|
|
garage2.block_manager.rpc_put_block(final_hash, data).await
|
2022-01-11 16:31:09 +00:00
|
|
|
} else {
|
2022-04-07 17:01:04 +00:00
|
|
|
Ok(())
|
2022-01-11 16:31:09 +00:00
|
|
|
}
|
2022-04-07 17:01:04 +00:00
|
|
|
},
|
2023-05-03 10:02:59 +00:00
|
|
|
async {
|
|
|
|
// Thing 2: we need to insert the block in the version
|
|
|
|
garage.version_table.insert(&dest_version).await?;
|
|
|
|
// Thing 3: we need to add a block reference
|
|
|
|
garage.block_ref_table.insert(&block_ref).await
|
|
|
|
},
|
2022-01-11 16:31:09 +00:00
|
|
|
// Thing 4: we need to prefetch the next block
|
2022-04-07 17:01:04 +00:00
|
|
|
defragmenter.next(),
|
|
|
|
)?;
|
2023-05-03 10:02:59 +00:00
|
|
|
next_block = res.2;
|
2022-01-11 16:31:09 +00:00
|
|
|
}
|
|
|
|
|
2023-05-03 10:02:59 +00:00
|
|
|
assert_eq!(current_offset, source_range.length);
|
|
|
|
|
2022-01-11 16:31:09 +00:00
|
|
|
let data_md5sum = md5hasher.finalize();
|
|
|
|
let etag = hex::encode(data_md5sum);
|
|
|
|
|
|
|
|
// Put the part's ETag in the Versiontable
|
2023-05-03 10:02:59 +00:00
|
|
|
dest_mpu.parts.put(
|
|
|
|
dest_mpu_part_key,
|
|
|
|
MpuPart {
|
|
|
|
version: dest_version_id,
|
|
|
|
etag: Some(etag.clone()),
|
|
|
|
size: Some(current_offset),
|
|
|
|
},
|
|
|
|
);
|
|
|
|
garage.mpu_table.insert(&dest_mpu).await?;
|
2022-01-11 16:31:09 +00:00
|
|
|
|
|
|
|
// LGTM
|
|
|
|
let resp_xml = s3_xml::to_xml_with_header(&CopyPartResult {
|
|
|
|
xmlns: (),
|
2022-01-12 10:41:20 +00:00
|
|
|
etag: s3_xml::Value(format!("\"{}\"", etag)),
|
2022-01-11 16:31:09 +00:00
|
|
|
last_modified: s3_xml::Value(msec_to_rfc3339(source_object_version.timestamp)),
|
|
|
|
})?;
|
|
|
|
|
|
|
|
Ok(Response::builder()
|
|
|
|
.header("Content-Type", "application/xml")
|
|
|
|
.header(
|
|
|
|
"x-amz-copy-source-version-id",
|
|
|
|
hex::encode(source_object_version.uuid),
|
|
|
|
)
|
2024-02-05 17:49:54 +00:00
|
|
|
.body(string_body(resp_xml))?)
|
2022-01-11 16:31:09 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
async fn get_copy_source(
|
|
|
|
garage: &Garage,
|
|
|
|
api_key: &Key,
|
2024-02-05 17:49:54 +00:00
|
|
|
req: &Request<ReqBody>,
|
2022-01-11 16:31:09 +00:00
|
|
|
) -> Result<Object, Error> {
|
|
|
|
let copy_source = req.headers().get("x-amz-copy-source").unwrap().to_str()?;
|
|
|
|
let copy_source = percent_encoding::percent_decode_str(copy_source).decode_utf8()?;
|
|
|
|
|
|
|
|
let (source_bucket, source_key) = parse_bucket_key(©_source, None)?;
|
2022-05-24 10:16:39 +00:00
|
|
|
let source_bucket_id = garage
|
|
|
|
.bucket_helper()
|
|
|
|
.resolve_bucket(&source_bucket.to_string(), api_key)
|
|
|
|
.await?;
|
2022-01-11 16:31:09 +00:00
|
|
|
|
|
|
|
if !api_key.allow_read(&source_bucket_id) {
|
2022-05-24 10:16:39 +00:00
|
|
|
return Err(Error::forbidden(format!(
|
2022-01-11 16:31:09 +00:00
|
|
|
"Reading from bucket {} not allowed for this key",
|
|
|
|
source_bucket
|
|
|
|
)));
|
|
|
|
}
|
|
|
|
|
|
|
|
let source_key = source_key.ok_or_bad_request("No source key specified")?;
|
|
|
|
|
|
|
|
let source_object = garage
|
|
|
|
.object_table
|
|
|
|
.get(&source_bucket_id, &source_key.to_string())
|
|
|
|
.await?
|
|
|
|
.ok_or(Error::NoSuchKey)?;
|
|
|
|
|
|
|
|
Ok(source_object)
|
|
|
|
}
|
|
|
|
|
|
|
|
fn extract_source_info(
|
|
|
|
source_object: &Object,
|
|
|
|
) -> Result<(&ObjectVersion, &ObjectVersionData, &ObjectVersionMeta), Error> {
|
|
|
|
let source_version = source_object
|
|
|
|
.versions()
|
|
|
|
.iter()
|
|
|
|
.rev()
|
|
|
|
.find(|v| v.is_complete())
|
|
|
|
.ok_or(Error::NoSuchKey)?;
|
|
|
|
|
|
|
|
let source_version_data = match &source_version.state {
|
|
|
|
ObjectVersionState::Complete(x) => x,
|
|
|
|
_ => unreachable!(),
|
|
|
|
};
|
|
|
|
|
|
|
|
let source_version_meta = match source_version_data {
|
|
|
|
ObjectVersionData::DeleteMarker => {
|
|
|
|
return Err(Error::NoSuchKey);
|
|
|
|
}
|
|
|
|
ObjectVersionData::Inline(meta, _bytes) => meta,
|
|
|
|
ObjectVersionData::FirstBlock(meta, _fbh) => meta,
|
|
|
|
};
|
|
|
|
|
|
|
|
Ok((source_version, source_version_data, source_version_meta))
|
|
|
|
}
|
|
|
|
|
2022-01-11 11:43:46 +00:00
|
|
|
struct CopyPreconditionHeaders {
|
|
|
|
copy_source_if_match: Option<Vec<String>>,
|
|
|
|
copy_source_if_modified_since: Option<SystemTime>,
|
|
|
|
copy_source_if_none_match: Option<Vec<String>>,
|
|
|
|
copy_source_if_unmodified_since: Option<SystemTime>,
|
|
|
|
}
|
|
|
|
|
|
|
|
impl CopyPreconditionHeaders {
|
2024-02-05 17:49:54 +00:00
|
|
|
fn parse(req: &Request<ReqBody>) -> Result<Self, Error> {
|
2022-01-11 11:43:46 +00:00
|
|
|
Ok(Self {
|
|
|
|
copy_source_if_match: req
|
|
|
|
.headers()
|
|
|
|
.get("x-amz-copy-source-if-match")
|
|
|
|
.map(|x| x.to_str())
|
|
|
|
.transpose()?
|
|
|
|
.map(|x| {
|
|
|
|
x.split(',')
|
|
|
|
.map(|m| m.trim().trim_matches('"').to_string())
|
|
|
|
.collect::<Vec<_>>()
|
|
|
|
}),
|
|
|
|
copy_source_if_modified_since: req
|
|
|
|
.headers()
|
|
|
|
.get("x-amz-copy-source-if-modified-since")
|
|
|
|
.map(|x| x.to_str())
|
|
|
|
.transpose()?
|
2022-01-18 11:22:31 +00:00
|
|
|
.map(httpdate::parse_http_date)
|
2022-01-11 11:43:46 +00:00
|
|
|
.transpose()
|
|
|
|
.ok_or_bad_request("Invalid date in x-amz-copy-source-if-modified-since")?,
|
|
|
|
copy_source_if_none_match: req
|
|
|
|
.headers()
|
|
|
|
.get("x-amz-copy-source-if-none-match")
|
|
|
|
.map(|x| x.to_str())
|
|
|
|
.transpose()?
|
|
|
|
.map(|x| {
|
|
|
|
x.split(',')
|
|
|
|
.map(|m| m.trim().trim_matches('"').to_string())
|
|
|
|
.collect::<Vec<_>>()
|
|
|
|
}),
|
|
|
|
copy_source_if_unmodified_since: req
|
|
|
|
.headers()
|
|
|
|
.get("x-amz-copy-source-if-unmodified-since")
|
|
|
|
.map(|x| x.to_str())
|
|
|
|
.transpose()?
|
2022-01-18 11:22:31 +00:00
|
|
|
.map(httpdate::parse_http_date)
|
2022-01-11 11:43:46 +00:00
|
|
|
.transpose()
|
|
|
|
.ok_or_bad_request("Invalid date in x-amz-copy-source-if-unmodified-since")?,
|
|
|
|
})
|
|
|
|
}
|
|
|
|
|
|
|
|
fn check(&self, v: &ObjectVersion, etag: &str) -> Result<(), Error> {
|
|
|
|
let v_date = UNIX_EPOCH + Duration::from_millis(v.timestamp);
|
|
|
|
|
|
|
|
let ok = match (
|
|
|
|
&self.copy_source_if_match,
|
|
|
|
&self.copy_source_if_unmodified_since,
|
|
|
|
&self.copy_source_if_none_match,
|
|
|
|
&self.copy_source_if_modified_since,
|
|
|
|
) {
|
|
|
|
// TODO I'm not sure all of the conditions are evaluated correctly here
|
|
|
|
|
|
|
|
// If we have both if-match and if-unmodified-since,
|
|
|
|
// basically we don't care about if-unmodified-since,
|
|
|
|
// because in the spec it says that if if-match evaluates to
|
|
|
|
// true but if-unmodified-since evaluates to false,
|
|
|
|
// the copy is still done.
|
|
|
|
(Some(im), _, None, None) => im.iter().any(|x| x == etag || x == "*"),
|
|
|
|
(None, Some(ius), None, None) => v_date <= *ius,
|
|
|
|
|
|
|
|
// If we have both if-none-match and if-modified-since,
|
|
|
|
// then both of the two conditions must evaluate to true
|
|
|
|
(None, None, Some(inm), Some(ims)) => {
|
|
|
|
!inm.iter().any(|x| x == etag || x == "*") && v_date > *ims
|
|
|
|
}
|
|
|
|
(None, None, Some(inm), None) => !inm.iter().any(|x| x == etag || x == "*"),
|
|
|
|
(None, None, None, Some(ims)) => v_date > *ims,
|
2022-01-12 09:17:15 +00:00
|
|
|
(None, None, None, None) => true,
|
2022-01-11 11:43:46 +00:00
|
|
|
_ => {
|
2022-05-24 10:16:39 +00:00
|
|
|
return Err(Error::bad_request(
|
|
|
|
"Invalid combination of x-amz-copy-source-if-xxxxx headers",
|
2022-01-11 11:43:46 +00:00
|
|
|
))
|
|
|
|
}
|
|
|
|
};
|
|
|
|
|
|
|
|
if ok {
|
|
|
|
Ok(())
|
|
|
|
} else {
|
|
|
|
Err(Error::PreconditionFailed)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
2022-01-11 16:31:09 +00:00
|
|
|
|
2022-07-22 16:20:27 +00:00
|
|
|
type BlockStreamItemOk = (Bytes, Option<Hash>);
|
2022-04-07 17:01:04 +00:00
|
|
|
type BlockStreamItem = Result<BlockStreamItemOk, garage_util::error::Error>;
|
|
|
|
|
|
|
|
struct Defragmenter<S: Stream<Item = BlockStreamItem>> {
|
|
|
|
block_size: usize,
|
|
|
|
block_stream: Pin<Box<stream::Peekable<S>>>,
|
2022-09-06 20:25:23 +00:00
|
|
|
buffer: BytesBuf,
|
2022-04-07 17:01:04 +00:00
|
|
|
hash: Option<Hash>,
|
|
|
|
}
|
|
|
|
|
|
|
|
impl<S: Stream<Item = BlockStreamItem>> Defragmenter<S> {
|
|
|
|
fn new(block_size: usize, block_stream: Pin<Box<stream::Peekable<S>>>) -> Self {
|
|
|
|
Self {
|
|
|
|
block_size,
|
|
|
|
block_stream,
|
2022-09-06 20:25:23 +00:00
|
|
|
buffer: BytesBuf::new(),
|
2022-04-07 17:01:04 +00:00
|
|
|
hash: None,
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
async fn next(&mut self) -> BlockStreamItem {
|
|
|
|
// Fill buffer while we can
|
|
|
|
while let Some(res) = self.block_stream.as_mut().peek().await {
|
|
|
|
let (peeked_next_block, _) = match res {
|
|
|
|
Ok(t) => t,
|
|
|
|
Err(_) => {
|
|
|
|
self.block_stream.next().await.unwrap()?;
|
|
|
|
unreachable!()
|
|
|
|
}
|
|
|
|
};
|
|
|
|
|
|
|
|
if self.buffer.is_empty() {
|
|
|
|
let (next_block, next_block_hash) = self.block_stream.next().await.unwrap()?;
|
2022-09-06 20:25:23 +00:00
|
|
|
self.buffer.extend(next_block);
|
2022-04-07 17:01:04 +00:00
|
|
|
self.hash = next_block_hash;
|
|
|
|
} else if self.buffer.len() + peeked_next_block.len() > self.block_size {
|
|
|
|
break;
|
|
|
|
} else {
|
|
|
|
let (next_block, _) = self.block_stream.next().await.unwrap()?;
|
|
|
|
self.buffer.extend(next_block);
|
|
|
|
self.hash = None;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2022-09-06 20:25:23 +00:00
|
|
|
Ok((self.buffer.take_all(), self.hash.take()))
|
2022-04-07 17:01:04 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2022-09-13 14:08:00 +00:00
|
|
|
#[derive(Debug, Serialize, PartialEq, Eq)]
|
2022-01-12 10:41:20 +00:00
|
|
|
pub struct CopyObjectResult {
|
|
|
|
#[serde(rename = "LastModified")]
|
|
|
|
pub last_modified: s3_xml::Value,
|
|
|
|
#[serde(rename = "ETag")]
|
|
|
|
pub etag: s3_xml::Value,
|
|
|
|
}
|
|
|
|
|
2022-09-13 14:08:00 +00:00
|
|
|
#[derive(Debug, Serialize, PartialEq, Eq)]
|
2022-01-11 16:31:09 +00:00
|
|
|
pub struct CopyPartResult {
|
|
|
|
#[serde(serialize_with = "xmlns_tag")]
|
|
|
|
pub xmlns: (),
|
|
|
|
#[serde(rename = "LastModified")]
|
|
|
|
pub last_modified: s3_xml::Value,
|
|
|
|
#[serde(rename = "ETag")]
|
|
|
|
pub etag: s3_xml::Value,
|
|
|
|
}
|
|
|
|
|
|
|
|
#[cfg(test)]
mod tests {
    use super::*;
    use crate::s3::xml::to_xml_with_header;

    /// `CopyObjectResult` serializes to the expected XML document; the double
    /// quotes around the ETag are expected to be escaped as `&quot;`.
    #[test]
    fn copy_object_result() -> Result<(), Error> {
        let copy_result = CopyObjectResult {
            last_modified: s3_xml::Value(msec_to_rfc3339(0)),
            etag: s3_xml::Value("\"9b2cf535f27731c974343645a3985328\"".to_string()),
        };
        assert_eq!(
            to_xml_with_header(&copy_result)?,
            "<?xml version=\"1.0\" encoding=\"UTF-8\"?>\
            <CopyObjectResult>\
                <LastModified>1970-01-01T00:00:00.000Z</LastModified>\
                <ETag>&quot;9b2cf535f27731c974343645a3985328&quot;</ETag>\
            </CopyObjectResult>\
            "
        );
        Ok(())
    }

    /// `CopyPartResult` serializes to the expected XML document, including the
    /// S3 namespace attribute on the root element.
    #[test]
    fn serialize_copy_part_result() -> Result<(), Error> {
        let expected_retval = "<?xml version=\"1.0\" encoding=\"UTF-8\"?>\
            <CopyPartResult xmlns=\"http://s3.amazonaws.com/doc/2006-03-01/\">\
                <LastModified>2011-04-11T20:34:56.000Z</LastModified>\
                <ETag>&quot;9b2cf535f27731c974343645a3985328&quot;</ETag>\
            </CopyPartResult>";
        let v = CopyPartResult {
            xmlns: (),
            last_modified: s3_xml::Value("2011-04-11T20:34:56.000Z".into()),
            etag: s3_xml::Value("\"9b2cf535f27731c974343645a3985328\"".into()),
        };

        assert_eq!(to_xml_with_header(&v)?, expected_retval);

        Ok(())
    }
}
|