2023-11-01 14:15:57 +00:00
|
|
|
use crate::storage::*;
|
2023-12-18 16:09:44 +00:00
|
|
|
use serde::Serialize;
|
2023-12-21 21:30:17 +00:00
|
|
|
use aws_sdk_s3::{
|
|
|
|
self as s3,
|
|
|
|
error::SdkError,
|
|
|
|
operation::get_object::GetObjectError,
|
|
|
|
};
|
2023-11-01 14:15:57 +00:00
|
|
|
|
2023-12-18 16:09:44 +00:00
|
|
|
#[derive(Clone, Debug, Serialize)]
|
|
|
|
pub struct GarageConf {
|
2023-11-23 16:19:35 +00:00
|
|
|
pub region: String,
|
|
|
|
pub s3_endpoint: String,
|
|
|
|
pub k2v_endpoint: String,
|
|
|
|
pub aws_access_key_id: String,
|
|
|
|
pub aws_secret_access_key: String,
|
|
|
|
pub bucket: String,
|
|
|
|
}
|
2023-11-01 14:15:57 +00:00
|
|
|
|
2023-12-18 16:09:44 +00:00
|
|
|
#[derive(Clone, Debug)]
|
|
|
|
pub struct GarageBuilder {
|
|
|
|
conf: GarageConf,
|
|
|
|
unicity: Vec<u8>,
|
|
|
|
}
|
|
|
|
|
|
|
|
impl GarageBuilder {
|
|
|
|
pub fn new(conf: GarageConf) -> anyhow::Result<Arc<Self>> {
|
|
|
|
let mut unicity: Vec<u8> = vec![];
|
|
|
|
unicity.extend_from_slice(file!().as_bytes());
|
|
|
|
unicity.append(&mut rmp_serde::to_vec(&conf)?);
|
|
|
|
Ok(Arc::new(Self { conf, unicity }))
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-12-21 20:54:36 +00:00
|
|
|
#[async_trait]
|
2023-12-16 10:13:32 +00:00
|
|
|
impl IBuilder for GarageBuilder {
|
2023-12-21 20:54:36 +00:00
|
|
|
async fn build(&self) -> Result<Store, StorageError> {
|
2023-12-22 20:52:20 +00:00
|
|
|
let s3_creds = s3::config::Credentials::new(
|
2023-12-21 20:54:36 +00:00
|
|
|
self.conf.aws_access_key_id.clone(),
|
|
|
|
self.conf.aws_secret_access_key.clone(),
|
|
|
|
None,
|
|
|
|
None,
|
|
|
|
"aerogramme"
|
|
|
|
);
|
|
|
|
|
2023-12-22 20:52:20 +00:00
|
|
|
let s3_config = aws_config::from_env()
|
2023-12-21 20:54:36 +00:00
|
|
|
.region(aws_config::Region::new(self.conf.region.clone()))
|
2023-12-22 20:52:20 +00:00
|
|
|
.credentials_provider(s3_creds)
|
2023-12-21 20:54:36 +00:00
|
|
|
.endpoint_url(self.conf.s3_endpoint.clone())
|
|
|
|
.load()
|
|
|
|
.await;
|
2023-12-22 20:52:20 +00:00
|
|
|
let s3_client = aws_sdk_s3::Client::new(&s3_config);
|
|
|
|
|
|
|
|
let k2v_config = k2v_client::K2vClientConfig {
|
|
|
|
endpoint: self.conf.k2v_endpoint.clone(),
|
|
|
|
region: self.conf.region.clone(),
|
|
|
|
aws_access_key_id: self.conf.aws_access_key_id.clone(),
|
|
|
|
aws_secret_access_key: self.conf.aws_secret_access_key.clone(),
|
|
|
|
bucket: self.conf.bucket.clone(),
|
|
|
|
user_agent: None,
|
|
|
|
};
|
|
|
|
|
|
|
|
let k2v_client = match k2v_client::K2vClient::new(k2v_config) {
|
|
|
|
Err(e) => {
|
|
|
|
tracing::error!("unable to build k2v client: {}", e);
|
|
|
|
return Err(StorageError::Internal);
|
|
|
|
}
|
|
|
|
Ok(v) => v,
|
|
|
|
};
|
2023-12-21 20:54:36 +00:00
|
|
|
|
2023-12-21 21:30:17 +00:00
|
|
|
Ok(Box::new(GarageStore {
|
2023-12-22 20:52:20 +00:00
|
|
|
bucket: self.conf.bucket.clone(),
|
|
|
|
s3: s3_client,
|
|
|
|
k2v: k2v_client,
|
2023-12-21 21:30:17 +00:00
|
|
|
}))
|
2023-11-01 14:15:57 +00:00
|
|
|
}
|
2023-12-18 16:09:44 +00:00
|
|
|
fn unique(&self) -> UnicityBuffer {
|
|
|
|
UnicityBuffer(self.unicity.clone())
|
|
|
|
}
|
2023-12-16 10:13:32 +00:00
|
|
|
}
|
2023-11-02 11:18:43 +00:00
|
|
|
|
2023-12-16 10:13:32 +00:00
|
|
|
pub struct GarageStore {
|
2023-12-22 20:52:20 +00:00
|
|
|
bucket: String,
|
2023-12-21 20:54:36 +00:00
|
|
|
s3: s3::Client,
|
2023-12-22 20:52:20 +00:00
|
|
|
k2v: k2v_client::K2vClient,
|
|
|
|
}
|
|
|
|
|
|
|
|
fn causal_to_row_val(row_ref: RowRef, causal_value: k2v_client::CausalValue) -> RowVal {
|
|
|
|
let new_row_ref = row_ref.with_causality(causal_value.causality.into());
|
|
|
|
let row_values = causal_value.value.into_iter().map(|k2v_value| match k2v_value {
|
|
|
|
k2v_client::K2vValue::Tombstone => Alternative::Tombstone,
|
|
|
|
k2v_client::K2vValue::Value(v) => Alternative::Value(v),
|
|
|
|
}).collect::<Vec<_>>();
|
|
|
|
|
|
|
|
RowVal { row_ref: new_row_ref, value: row_values }
|
2023-11-01 14:15:57 +00:00
|
|
|
}
|
|
|
|
|
2023-12-16 10:13:32 +00:00
|
|
|
#[async_trait]
|
|
|
|
impl IStore for GarageStore {
|
|
|
|
async fn row_fetch<'a>(&self, select: &Selector<'a>) -> Result<Vec<RowVal>, StorageError> {
|
2023-12-22 20:52:20 +00:00
|
|
|
let batch_op = match select {
|
|
|
|
Selector::Range { shard, sort_begin, sort_end } => vec![k2v_client::BatchReadOp {
|
|
|
|
partition_key: shard,
|
|
|
|
filter: k2v_client::Filter {
|
|
|
|
start: Some(sort_begin),
|
|
|
|
end: Some(sort_end),
|
|
|
|
..k2v_client::Filter::default()
|
|
|
|
},
|
|
|
|
..k2v_client::BatchReadOp::default()
|
|
|
|
}],
|
|
|
|
Selector::List(row_ref_list) => row_ref_list.iter().map(|row_ref| k2v_client::BatchReadOp {
|
|
|
|
partition_key: &row_ref.uid.shard,
|
|
|
|
filter: k2v_client::Filter {
|
|
|
|
start: Some(&row_ref.uid.sort),
|
|
|
|
..k2v_client::Filter::default()
|
|
|
|
},
|
|
|
|
single_item: true,
|
|
|
|
..k2v_client::BatchReadOp::default()
|
|
|
|
}).collect::<Vec<_>>(),
|
|
|
|
Selector::Prefix { shard, sort_prefix } => vec![k2v_client::BatchReadOp {
|
|
|
|
partition_key: shard,
|
|
|
|
filter: k2v_client::Filter {
|
|
|
|
prefix: Some(sort_prefix),
|
|
|
|
..k2v_client::Filter::default()
|
|
|
|
},
|
|
|
|
..k2v_client::BatchReadOp::default()
|
|
|
|
}],
|
|
|
|
Selector::Single(row_ref) => {
|
|
|
|
let causal_value = match self.k2v.read_item(&row_ref.uid.shard, &row_ref.uid.sort).await {
|
|
|
|
Err(e) => {
|
|
|
|
tracing::error!("K2V read item shard={}, sort={}, bucket={} failed: {}", row_ref.uid.shard, row_ref.uid.sort, self.bucket, e);
|
|
|
|
return Err(StorageError::Internal);
|
|
|
|
},
|
|
|
|
Ok(v) => v,
|
|
|
|
};
|
|
|
|
|
|
|
|
let row_val = causal_to_row_val((*row_ref).clone(), causal_value);
|
|
|
|
return Ok(vec![row_val])
|
|
|
|
},
|
|
|
|
};
|
|
|
|
|
|
|
|
let all_res = match self.k2v.read_batch(&batch_op).await {
|
|
|
|
Err(e) => {
|
|
|
|
tracing::error!("k2v read batch failed for {:?}, bucket {} with err: {}", select, self.bucket, e);
|
|
|
|
return Err(StorageError::Internal);
|
|
|
|
},
|
|
|
|
Ok(v) => v,
|
|
|
|
};
|
|
|
|
|
2023-11-01 14:15:57 +00:00
|
|
|
unimplemented!();
|
|
|
|
}
|
2023-12-16 10:13:32 +00:00
|
|
|
async fn row_rm<'a>(&self, select: &Selector<'a>) -> Result<(), StorageError> {
|
2023-11-15 14:56:43 +00:00
|
|
|
unimplemented!();
|
|
|
|
}
|
2023-11-16 17:27:24 +00:00
|
|
|
|
2023-12-16 10:13:32 +00:00
|
|
|
async fn row_insert(&self, values: Vec<RowVal>) -> Result<(), StorageError> {
|
2023-11-16 17:27:24 +00:00
|
|
|
unimplemented!();
|
2023-11-17 09:46:13 +00:00
|
|
|
|
|
|
|
}
|
2023-12-18 16:09:44 +00:00
|
|
|
async fn row_poll(&self, value: &RowRef) -> Result<RowVal, StorageError> {
|
2023-11-02 14:28:19 +00:00
|
|
|
unimplemented!();
|
|
|
|
}
|
|
|
|
|
2023-12-19 18:02:22 +00:00
|
|
|
async fn row_rm_single(&self, entry: &RowRef) -> Result<(), StorageError> {
|
|
|
|
unimplemented!();
|
|
|
|
}
|
|
|
|
|
2023-12-16 10:13:32 +00:00
|
|
|
async fn blob_fetch(&self, blob_ref: &BlobRef) -> Result<BlobVal, StorageError> {
|
2023-12-21 21:30:17 +00:00
|
|
|
let maybe_out = self.s3
|
|
|
|
.get_object()
|
2023-12-22 20:52:20 +00:00
|
|
|
.bucket(self.bucket.to_string())
|
2023-12-21 21:30:17 +00:00
|
|
|
.key(blob_ref.0.to_string())
|
|
|
|
.send()
|
|
|
|
.await;
|
|
|
|
|
|
|
|
let object_output = match maybe_out {
|
|
|
|
Ok(output) => output,
|
|
|
|
Err(SdkError::ServiceError(x)) => match x.err() {
|
|
|
|
GetObjectError::NoSuchKey(_) => return Err(StorageError::NotFound),
|
|
|
|
e => {
|
|
|
|
tracing::warn!("Blob Fetch Error, Service Error: {}", e);
|
|
|
|
return Err(StorageError::Internal);
|
|
|
|
},
|
|
|
|
},
|
|
|
|
Err(e) => {
|
|
|
|
tracing::warn!("Blob Fetch Error, {}", e);
|
|
|
|
return Err(StorageError::Internal);
|
|
|
|
},
|
|
|
|
};
|
|
|
|
|
|
|
|
let buffer = match object_output.body.collect().await {
|
|
|
|
Ok(aggreg) => aggreg.to_vec(),
|
|
|
|
Err(e) => {
|
|
|
|
tracing::warn!("Fetching body failed with {}", e);
|
|
|
|
return Err(StorageError::Internal);
|
|
|
|
}
|
|
|
|
};
|
2023-11-15 14:56:43 +00:00
|
|
|
|
2023-12-22 20:52:20 +00:00
|
|
|
tracing::debug!("Fetched {}/{}", self.bucket, blob_ref.0);
|
2023-12-21 21:30:17 +00:00
|
|
|
Ok(BlobVal::new(blob_ref.clone(), buffer))
|
2023-11-01 14:15:57 +00:00
|
|
|
}
|
2023-12-22 18:32:07 +00:00
|
|
|
async fn blob_insert(&self, blob_val: BlobVal) -> Result<(), StorageError> {
|
|
|
|
let streamable_value = s3::primitives::ByteStream::from(blob_val.value);
|
|
|
|
|
|
|
|
let maybe_send = self.s3
|
|
|
|
.put_object()
|
2023-12-22 20:52:20 +00:00
|
|
|
.bucket(self.bucket.to_string())
|
2023-12-22 18:32:07 +00:00
|
|
|
.key(blob_val.blob_ref.0.to_string())
|
|
|
|
.body(streamable_value)
|
|
|
|
.send()
|
|
|
|
.await;
|
|
|
|
|
|
|
|
match maybe_send {
|
|
|
|
Err(e) => {
|
|
|
|
tracing::error!("unable to send object: {}", e);
|
|
|
|
Err(StorageError::Internal)
|
|
|
|
}
|
|
|
|
Ok(_) => {
|
2023-12-22 20:52:20 +00:00
|
|
|
tracing::debug!("Inserted {}/{}", self.bucket, blob_val.blob_ref.0);
|
2023-12-22 18:32:07 +00:00
|
|
|
Ok(())
|
|
|
|
}
|
|
|
|
}
|
2023-12-18 16:09:44 +00:00
|
|
|
}
|
2023-12-19 18:02:22 +00:00
|
|
|
async fn blob_copy(&self, src: &BlobRef, dst: &BlobRef) -> Result<(), StorageError> {
|
2023-12-22 18:32:07 +00:00
|
|
|
let maybe_copy = self.s3
|
|
|
|
.copy_object()
|
2023-12-22 20:52:20 +00:00
|
|
|
.bucket(self.bucket.to_string())
|
2023-12-22 18:32:07 +00:00
|
|
|
.key(dst.0.clone())
|
2023-12-22 20:52:20 +00:00
|
|
|
.copy_source(format!("/{}/{}", self.bucket.to_string(), src.0.clone()))
|
2023-12-22 18:32:07 +00:00
|
|
|
.send()
|
|
|
|
.await;
|
|
|
|
|
|
|
|
match maybe_copy {
|
|
|
|
Err(e) => {
|
2023-12-22 20:52:20 +00:00
|
|
|
tracing::error!("unable to copy object {} to {} (bucket: {}), error: {}", src.0, dst.0, self.bucket, e);
|
2023-12-22 18:32:07 +00:00
|
|
|
Err(StorageError::Internal)
|
|
|
|
},
|
|
|
|
Ok(_) => {
|
2023-12-22 20:52:20 +00:00
|
|
|
tracing::debug!("copied {} to {} (bucket: {})", src.0, dst.0, self.bucket);
|
2023-12-22 18:32:07 +00:00
|
|
|
Ok(())
|
|
|
|
}
|
|
|
|
}
|
2023-11-01 14:15:57 +00:00
|
|
|
|
2023-11-17 11:15:44 +00:00
|
|
|
}
|
2023-12-16 10:13:32 +00:00
|
|
|
async fn blob_list(&self, prefix: &str) -> Result<Vec<BlobRef>, StorageError> {
|
2023-12-22 18:32:07 +00:00
|
|
|
let maybe_list = self.s3
|
|
|
|
.list_objects_v2()
|
2023-12-22 20:52:20 +00:00
|
|
|
.bucket(self.bucket.to_string())
|
2023-12-22 18:32:07 +00:00
|
|
|
.prefix(prefix)
|
|
|
|
.into_paginator()
|
|
|
|
.send()
|
|
|
|
.try_collect()
|
|
|
|
.await;
|
|
|
|
|
|
|
|
match maybe_list {
|
|
|
|
Err(e) => {
|
2023-12-22 20:52:20 +00:00
|
|
|
tracing::error!("listing prefix {} on bucket {} failed: {}", prefix, self.bucket, e);
|
2023-12-22 18:32:07 +00:00
|
|
|
Err(StorageError::Internal)
|
|
|
|
}
|
|
|
|
Ok(pagin_list_out) => Ok(pagin_list_out
|
|
|
|
.into_iter()
|
|
|
|
.map(|list_out| list_out.contents.unwrap_or(vec![]))
|
|
|
|
.flatten()
|
|
|
|
.map(|obj| BlobRef(obj.key.unwrap_or(String::new())))
|
|
|
|
.collect::<Vec<_>>()),
|
|
|
|
}
|
2023-11-01 14:15:57 +00:00
|
|
|
}
|
2023-12-16 10:13:32 +00:00
|
|
|
async fn blob_rm(&self, blob_ref: &BlobRef) -> Result<(), StorageError> {
|
2023-12-22 18:32:07 +00:00
|
|
|
let maybe_delete = self.s3
|
|
|
|
.delete_object()
|
2023-12-22 20:52:20 +00:00
|
|
|
.bucket(self.bucket.to_string())
|
2023-12-22 18:32:07 +00:00
|
|
|
.key(blob_ref.0.clone())
|
|
|
|
.send()
|
|
|
|
.await;
|
|
|
|
|
|
|
|
match maybe_delete {
|
|
|
|
Err(e) => {
|
2023-12-22 20:52:20 +00:00
|
|
|
tracing::error!("unable to delete {} (bucket: {}), error {}", blob_ref.0, self.bucket, e);
|
2023-12-22 18:32:07 +00:00
|
|
|
Err(StorageError::Internal)
|
|
|
|
},
|
|
|
|
Ok(_) => {
|
2023-12-22 20:52:20 +00:00
|
|
|
tracing::debug!("deleted {} (bucket: {})", blob_ref.0, self.bucket);
|
2023-12-22 18:32:07 +00:00
|
|
|
Ok(())
|
|
|
|
}
|
|
|
|
}
|
2023-11-01 14:15:57 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|