2020-11-21 16:50:19 +00:00
|
|
|
use std::{borrow::Cow, convert::Infallible, net::SocketAddr, sync::Arc};
|
2020-11-02 14:48:39 +00:00
|
|
|
|
|
|
|
use futures::future::Future;
|
|
|
|
|
2022-01-07 15:23:04 +00:00
|
|
|
use http::header::{ACCESS_CONTROL_REQUEST_HEADERS, ACCESS_CONTROL_REQUEST_METHOD};
|
2020-11-21 14:15:25 +00:00
|
|
|
use hyper::{
|
2022-01-06 11:55:49 +00:00
|
|
|
header::{HeaderValue, HOST},
|
2020-11-21 14:15:25 +00:00
|
|
|
server::conn::AddrStream,
|
|
|
|
service::{make_service_fn, service_fn},
|
2022-01-07 15:23:04 +00:00
|
|
|
Body, Method, Request, Response, Server, StatusCode,
|
2020-11-21 16:50:19 +00:00
|
|
|
};
|
2020-11-02 14:48:39 +00:00
|
|
|
|
2020-11-21 16:50:19 +00:00
|
|
|
use crate::error::*;
|
2021-12-16 10:47:58 +00:00
|
|
|
|
2022-01-07 15:23:04 +00:00
|
|
|
use garage_api::error::{Error as ApiError, OkOrBadRequest, OkOrInternalError};
|
2021-11-11 10:26:02 +00:00
|
|
|
use garage_api::helpers::{authority_to_host, host_to_bucket};
|
2022-01-07 15:23:04 +00:00
|
|
|
use garage_api::s3_cors::{add_cors_headers, cors_rule_matches};
|
2020-11-21 16:58:14 +00:00
|
|
|
use garage_api::s3_get::{handle_get, handle_head};
|
2021-12-16 10:47:58 +00:00
|
|
|
|
2022-01-07 15:23:04 +00:00
|
|
|
use garage_model::bucket_table::Bucket;
|
2020-11-02 14:48:39 +00:00
|
|
|
use garage_model::garage::Garage;
|
2021-12-16 10:47:58 +00:00
|
|
|
|
2020-12-17 21:51:44 +00:00
|
|
|
use garage_table::*;
|
2020-11-19 13:56:00 +00:00
|
|
|
use garage_util::error::Error as GarageError;
|
2020-11-02 14:48:39 +00:00
|
|
|
|
2021-03-26 21:05:16 +00:00
|
|
|
/// Run a web server
|
2020-11-02 14:48:39 +00:00
|
|
|
pub async fn run_web_server(
|
|
|
|
garage: Arc<Garage>,
|
|
|
|
shutdown_signal: impl Future<Output = ()>,
|
2020-11-19 13:56:00 +00:00
|
|
|
) -> Result<(), GarageError> {
|
2020-11-10 08:57:07 +00:00
|
|
|
let addr = &garage.config.s3_web.bind_addr;
|
2020-11-02 14:48:39 +00:00
|
|
|
|
|
|
|
let service = make_service_fn(|conn: &AddrStream| {
|
|
|
|
let garage = garage.clone();
|
|
|
|
let client_addr = conn.remote_addr();
|
2020-11-10 08:59:52 +00:00
|
|
|
async move {
|
2020-11-02 14:48:39 +00:00
|
|
|
Ok::<_, Error>(service_fn(move |req: Request<Body>| {
|
|
|
|
let garage = garage.clone();
|
2020-11-11 20:17:34 +00:00
|
|
|
handle_request(garage, req, client_addr)
|
2020-11-02 14:48:39 +00:00
|
|
|
}))
|
|
|
|
}
|
|
|
|
});
|
|
|
|
|
2021-10-26 08:20:05 +00:00
|
|
|
let server = Server::bind(addr).serve(service);
|
2020-11-02 14:48:39 +00:00
|
|
|
let graceful = server.with_graceful_shutdown(shutdown_signal);
|
|
|
|
info!("Web server listening on http://{}", addr);
|
|
|
|
|
|
|
|
graceful.await?;
|
|
|
|
Ok(())
|
|
|
|
}
|
2020-11-08 14:47:25 +00:00
|
|
|
|
2020-11-11 20:17:34 +00:00
|
|
|
async fn handle_request(
|
2020-11-08 14:47:25 +00:00
|
|
|
garage: Arc<Garage>,
|
|
|
|
req: Request<Body>,
|
|
|
|
addr: SocketAddr,
|
2020-11-11 20:17:34 +00:00
|
|
|
) -> Result<Response<Body>, Infallible> {
|
|
|
|
info!("{} {} {}", addr, req.method(), req.uri());
|
2022-01-06 11:55:49 +00:00
|
|
|
match serve_file(garage, &req).await {
|
|
|
|
Ok(res) => {
|
|
|
|
debug!("{} {} {}", req.method(), req.uri(), res.status());
|
|
|
|
Ok(res)
|
|
|
|
}
|
|
|
|
Err(error) => {
|
|
|
|
info!(
|
|
|
|
"{} {} {} {}",
|
|
|
|
req.method(),
|
|
|
|
req.uri(),
|
|
|
|
error.http_status_code(),
|
|
|
|
error
|
|
|
|
);
|
|
|
|
Ok(error_to_res(error))
|
|
|
|
}
|
2020-11-11 20:17:34 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
fn error_to_res(e: Error) -> Response<Body> {
|
2022-01-06 11:55:49 +00:00
|
|
|
// If we are here, it is either that:
|
|
|
|
// - there was an error before trying to get the requested URL
|
|
|
|
// from the bucket (e.g. bucket not found)
|
|
|
|
// - there was an error processing the request and (the request
|
|
|
|
// was a HEAD request or we couldn't get the error document)
|
|
|
|
// We do NOT enter this code path when returning the bucket's
|
|
|
|
// error document (this is handled in serve_file)
|
|
|
|
let body = Body::from(format!("{}\n", e));
|
2020-11-11 20:17:34 +00:00
|
|
|
let mut http_error = Response::new(body);
|
|
|
|
*http_error.status_mut() = e.http_status_code();
|
2021-11-29 10:52:42 +00:00
|
|
|
e.add_headers(http_error.headers_mut());
|
2020-11-11 20:17:34 +00:00
|
|
|
http_error
|
|
|
|
}
|
|
|
|
|
2022-01-06 11:55:49 +00:00
|
|
|
async fn serve_file(garage: Arc<Garage>, req: &Request<Body>) -> Result<Response<Body>, Error> {
|
2020-11-10 08:57:07 +00:00
|
|
|
// Get http authority string (eg. [::1]:3902 or garage.tld:80)
|
2020-11-08 14:47:25 +00:00
|
|
|
let authority = req
|
|
|
|
.headers()
|
|
|
|
.get(HOST)
|
2022-01-06 11:55:49 +00:00
|
|
|
.ok_or_bad_request("HOST header required")?
|
2020-11-08 14:47:25 +00:00
|
|
|
.to_str()?;
|
|
|
|
|
2020-11-10 08:57:07 +00:00
|
|
|
// Get bucket
|
2021-11-11 10:26:02 +00:00
|
|
|
let host = authority_to_host(authority)?;
|
2020-11-10 08:59:52 +00:00
|
|
|
let root = &garage.config.s3_web.root_domain;
|
2020-11-10 08:57:07 +00:00
|
|
|
|
2021-12-14 12:55:11 +00:00
|
|
|
let bucket_name = host_to_bucket(&host, root).unwrap_or(&host);
|
|
|
|
let bucket_id = garage
|
|
|
|
.bucket_alias_table
|
|
|
|
.get(&EmptyKey, &bucket_name.to_string())
|
|
|
|
.await?
|
2022-01-03 17:32:15 +00:00
|
|
|
.map(|x| x.state.take())
|
2021-12-14 12:55:11 +00:00
|
|
|
.flatten()
|
|
|
|
.ok_or(Error::NotFound)?;
|
|
|
|
|
2021-12-16 10:47:58 +00:00
|
|
|
// Check bucket isn't deleted and has website access enabled
|
2022-01-06 11:55:49 +00:00
|
|
|
let bucket = garage
|
2020-12-17 21:51:44 +00:00
|
|
|
.bucket_table
|
2022-01-03 18:06:04 +00:00
|
|
|
.get(&EmptyKey, &bucket_id)
|
2020-12-17 21:51:44 +00:00
|
|
|
.await?
|
2022-01-06 11:55:49 +00:00
|
|
|
.ok_or(Error::NotFound)?;
|
|
|
|
|
|
|
|
let website_config = bucket
|
|
|
|
.params()
|
|
|
|
.ok_or(Error::NotFound)?
|
|
|
|
.website_config
|
|
|
|
.get()
|
|
|
|
.as_ref()
|
2020-12-17 21:51:44 +00:00
|
|
|
.ok_or(Error::NotFound)?;
|
|
|
|
|
2020-11-10 08:57:07 +00:00
|
|
|
// Get path
|
|
|
|
let path = req.uri().path().to_string();
|
2022-01-06 11:55:49 +00:00
|
|
|
let index = &website_config.index_document;
|
2021-10-26 08:20:05 +00:00
|
|
|
let key = path_to_key(&path, index)?;
|
2020-11-10 08:59:52 +00:00
|
|
|
|
2022-01-06 11:55:49 +00:00
|
|
|
debug!(
|
2021-12-14 12:55:11 +00:00
|
|
|
"Selected bucket: \"{}\" {:?}, selected key: \"{}\"",
|
|
|
|
bucket_name, bucket_id, key
|
|
|
|
);
|
2020-11-11 18:48:01 +00:00
|
|
|
|
2022-01-06 11:55:49 +00:00
|
|
|
let ret_doc = match *req.method() {
|
2022-01-07 15:23:04 +00:00
|
|
|
Method::OPTIONS => return handle_options(&bucket, req),
|
|
|
|
Method::HEAD => {
|
|
|
|
return handle_head(garage.clone(), req, bucket_id, &key)
|
|
|
|
.await
|
|
|
|
.map_err(Error::from)
|
|
|
|
}
|
2022-01-06 11:55:49 +00:00
|
|
|
Method::GET => handle_get(garage.clone(), req, bucket_id, &key).await,
|
|
|
|
_ => Err(ApiError::BadRequest("HTTP method not supported".into())),
|
|
|
|
}
|
|
|
|
.map_err(Error::from);
|
|
|
|
|
2022-01-07 15:23:04 +00:00
|
|
|
match ret_doc {
|
|
|
|
Err(error) => {
|
|
|
|
// For a HEAD or OPTIONS method, we don't return the error document
|
|
|
|
// as content, we return above and just return the error message
|
|
|
|
// by relying on err_to_res that is called when we return an Err.
|
|
|
|
assert!(*req.method() != Method::HEAD && *req.method() != Method::OPTIONS);
|
|
|
|
|
|
|
|
if !error.http_status_code().is_client_error() {
|
|
|
|
// Do not return the error document if it is not a 4xx error code.
|
|
|
|
return Err(error);
|
|
|
|
}
|
|
|
|
|
|
|
|
// If no error document is set: just return the error directly
|
|
|
|
let error_document = match &website_config.error_document {
|
|
|
|
Some(ed) => ed.trim_start_matches('/').to_owned(),
|
|
|
|
None => return Err(error),
|
|
|
|
};
|
|
|
|
|
|
|
|
// We want to return the error document
|
|
|
|
// Create a fake HTTP request with path = the error document
|
|
|
|
let req2 = Request::builder()
|
|
|
|
.uri(format!("http://{}/{}", host, &error_document))
|
|
|
|
.body(Body::empty())
|
|
|
|
.unwrap();
|
2020-11-21 14:15:25 +00:00
|
|
|
|
2022-01-07 15:23:04 +00:00
|
|
|
match handle_get(garage, &req2, bucket_id, &error_document).await {
|
|
|
|
Ok(mut error_doc) => {
|
|
|
|
// The error won't be logged back in handle_request,
|
|
|
|
// so log it here
|
|
|
|
info!(
|
|
|
|
"{} {} {} {}",
|
|
|
|
req.method(),
|
|
|
|
req.uri(),
|
|
|
|
error.http_status_code(),
|
|
|
|
error
|
|
|
|
);
|
|
|
|
|
|
|
|
*error_doc.status_mut() = error.http_status_code();
|
|
|
|
error.add_headers(error_doc.headers_mut());
|
|
|
|
|
|
|
|
// Preserve error message in a special header
|
|
|
|
for error_line in error.to_string().split('\n') {
|
|
|
|
if let Ok(v) = HeaderValue::from_bytes(error_line.as_bytes()) {
|
|
|
|
error_doc.headers_mut().append("X-Garage-Error", v);
|
|
|
|
}
|
2022-01-06 11:55:49 +00:00
|
|
|
}
|
|
|
|
|
2022-01-07 15:23:04 +00:00
|
|
|
Ok(error_doc)
|
|
|
|
}
|
|
|
|
Err(error_doc_error) => {
|
|
|
|
warn!(
|
|
|
|
"Couldn't get error document {} for bucket {:?}: {}",
|
|
|
|
error_document, bucket_id, error_doc_error
|
|
|
|
);
|
|
|
|
Err(error)
|
|
|
|
}
|
2022-01-06 11:55:49 +00:00
|
|
|
}
|
2022-01-07 15:23:04 +00:00
|
|
|
}
|
|
|
|
Ok(mut resp) => {
|
|
|
|
// Maybe add CORS headers
|
|
|
|
if let Some(cors_config) = bucket.params().unwrap().cors_config.get() {
|
|
|
|
if let Some(origin) = req.headers().get("Origin") {
|
|
|
|
let origin = origin.to_str()?;
|
|
|
|
let request_headers = match req.headers().get(ACCESS_CONTROL_REQUEST_HEADERS) {
|
|
|
|
Some(h) => h.to_str()?.split(',').map(|h| h.trim()).collect::<Vec<_>>(),
|
|
|
|
None => vec![],
|
|
|
|
};
|
|
|
|
let matching_rule = cors_config.iter().find(|rule| {
|
|
|
|
cors_rule_matches(
|
|
|
|
rule,
|
|
|
|
origin,
|
|
|
|
&req.method().to_string(),
|
|
|
|
request_headers.iter(),
|
|
|
|
)
|
|
|
|
});
|
|
|
|
if let Some(rule) = matching_rule {
|
|
|
|
add_cors_headers(&mut resp, rule)
|
|
|
|
.ok_or_internal_error("Invalid CORS configuration")?;
|
|
|
|
}
|
|
|
|
}
|
2022-01-06 11:55:49 +00:00
|
|
|
}
|
2022-01-07 15:23:04 +00:00
|
|
|
Ok(resp)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
fn handle_options(bucket: &Bucket, req: &Request<Body>) -> Result<Response<Body>, Error> {
|
|
|
|
let origin = req
|
|
|
|
.headers()
|
|
|
|
.get("Origin")
|
|
|
|
.ok_or_bad_request("Missing Origin header")?
|
|
|
|
.to_str()?;
|
|
|
|
let request_method = req
|
|
|
|
.headers()
|
|
|
|
.get(ACCESS_CONTROL_REQUEST_METHOD)
|
|
|
|
.ok_or_bad_request("Missing Access-Control-Request-Method header")?
|
|
|
|
.to_str()?;
|
|
|
|
let request_headers = match req.headers().get(ACCESS_CONTROL_REQUEST_HEADERS) {
|
|
|
|
Some(h) => h.to_str()?.split(',').map(|h| h.trim()).collect::<Vec<_>>(),
|
|
|
|
None => vec![],
|
|
|
|
};
|
|
|
|
|
|
|
|
if let Some(cors_config) = bucket.params().unwrap().cors_config.get() {
|
|
|
|
let matching_rule = cors_config
|
|
|
|
.iter()
|
|
|
|
.find(|rule| cors_rule_matches(rule, origin, request_method, request_headers.iter()));
|
|
|
|
if let Some(rule) = matching_rule {
|
|
|
|
let mut resp = Response::builder()
|
|
|
|
.status(StatusCode::OK)
|
|
|
|
.body(Body::empty())
|
|
|
|
.map_err(ApiError::from)?;
|
|
|
|
add_cors_headers(&mut resp, rule).ok_or_internal_error("Invalid CORS configuration")?;
|
|
|
|
return Ok(resp);
|
2022-01-06 11:55:49 +00:00
|
|
|
}
|
|
|
|
}
|
2022-01-07 15:23:04 +00:00
|
|
|
|
|
|
|
Err(ApiError::Forbidden("No matching CORS rule".into()).into())
|
2020-11-08 14:47:25 +00:00
|
|
|
}
|
|
|
|
|
2020-11-11 18:48:01 +00:00
|
|
|
/// Path to key
|
|
|
|
///
|
|
|
|
/// Convert the provided path to the internal key
|
|
|
|
/// When a path ends with "/", we append the index name to match traditional web server behavior
|
|
|
|
/// which is also AWS S3 behavior.
|
|
|
|
fn path_to_key<'a>(path: &'a str, index: &str) -> Result<Cow<'a, str>, Error> {
|
2021-10-26 08:20:05 +00:00
|
|
|
let path_utf8 = percent_encoding::percent_decode_str(path).decode_utf8()?;
|
2020-11-21 16:50:19 +00:00
|
|
|
|
2021-04-23 20:26:27 +00:00
|
|
|
if !path_utf8.starts_with('/') {
|
|
|
|
return Err(Error::BadRequest(
|
|
|
|
"Path must start with a / (slash)".to_string(),
|
|
|
|
));
|
2020-11-21 11:01:02 +00:00
|
|
|
}
|
|
|
|
|
2020-11-11 18:48:01 +00:00
|
|
|
match path_utf8.chars().last() {
|
2021-01-15 16:11:15 +00:00
|
|
|
None => unreachable!(),
|
2020-11-11 18:48:01 +00:00
|
|
|
Some('/') => {
|
|
|
|
let mut key = String::with_capacity(path_utf8.len() + index.len());
|
2020-11-21 11:01:02 +00:00
|
|
|
key.push_str(&path_utf8[1..]);
|
2020-11-11 18:48:01 +00:00
|
|
|
key.push_str(index);
|
|
|
|
Ok(key.into())
|
|
|
|
}
|
2020-11-21 16:50:19 +00:00
|
|
|
Some(_) => match path_utf8 {
|
|
|
|
Cow::Borrowed(pu8) => Ok((&pu8[1..]).into()),
|
|
|
|
Cow::Owned(pu8) => Ok((&pu8[1..]).to_string().into()),
|
|
|
|
},
|
2020-11-11 18:48:01 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-11-08 14:47:25 +00:00
|
|
|
#[cfg(test)]
mod tests {
    use super::*;

    /// Checks the path-to-key conversion on valid paths (with and without a
    /// trailing slash, with percent-encoded characters) and on paths that
    /// must be rejected because they do not start with a slash.
    #[test]
    fn path_to_key_test() -> Result<(), Error> {
        // (request path, expected key), all with "index.html" as index.
        let accepted = [
            ("/file%20.jpg", "file .jpg"),
            ("/%20t/", " t/index.html"),
            ("/", "index.html"),
            ("/hello", "hello"),
        ];
        for &(path, expected) in accepted.iter() {
            assert_eq!(path_to_key(path, "index.html")?, expected);
        }

        // Paths without a leading slash are refused.
        let rejected = ["", "i/am/relative"];
        for &path in rejected.iter() {
            assert!(path_to_key(path, "index.html").is_err());
        }

        Ok(())
    }
}
|