add doc comments #53

Merged
lx merged 10 commits from trinity-1686a/garage:doc-comments into main 2021-04-08 13:01:22 +00:00
20 changed files with 38 additions and 44 deletions
Showing only changes of commit c8906f200b - Show all commits

View file

@ -29,7 +29,7 @@ pub enum Error {
NotFound,
// Category: bad request
/// The request used an invalid path
/// The request contained an invalid UTF-8 sequence in its path or in other parameters
trinity-1686a marked this conversation as resolved Outdated
Outdated
Review

the request contained an invalid UTF-8 sequence in its path or in other parameters would be more accurate

`the request contained an invalid UTF-8 sequence in its path or in other parameters` would be more accurate
#[error(display = "Invalid UTF-8: {}", _0)]
InvalidUTF8Str(#[error(source)] std::str::Utf8Error),
@ -65,7 +65,7 @@ impl From<roxmltree::Error> for Error {
}
impl Error {
/// Convert an error into an Http status code
/// Get the HTTP status code that best represents the meaning of the error for the client
trinity-1686a marked this conversation as resolved Outdated
Outdated
Review

rather get the HTTP status code that best represents the meaning of the error for the client

rather `get the HTTP status code that best represents the meaning of the error for the client`
pub fn http_status_code(&self) -> StatusCode {
match self {
Error::NotFound => StatusCode::NOT_FOUND,

View file

@ -1,4 +1,3 @@
#![deny(missing_crate_level_docs, missing_docs)]
//! Crate for serving a S3 compatible API
#[macro_use]
extern crate log;

View file

@ -1,6 +1,5 @@
#![deny(missing_crate_level_docs, missing_docs)]
#![recursion_limit = "1024"]
//! Garage CLI, used to interact with a running Garage instance, and to launch a Garage
//! Garage CLI, used to interact with a running Garage instance, and to launch a Garage instance
trinity-1686a marked this conversation as resolved Outdated
Outdated
Review

"and to launch a Garage instance" ?

"and to launch a Garage **instance**" ?
#[macro_use]
extern crate log;

View file

@ -157,7 +157,7 @@ impl BlockManager {
}
/// Write a block to disk
pub async fn write_block(&self, hash: &Hash, data: &[u8]) -> Result<Message, Error> {
async fn write_block(&self, hash: &Hash, data: &[u8]) -> Result<Message, Error> {
trinity-1686a marked this conversation as resolved Outdated
Outdated
Review

should probably not be pub, same for read_block and need_block

should probably not be `pub`, same for `read_block` and `need_block`
let _lock = self.data_dir_lock.lock().await;
let mut path = self.block_dir(hash);
@ -176,7 +176,7 @@ impl BlockManager {
}
/// Read block from disk, verifying it's integrity
pub async fn read_block(&self, hash: &Hash) -> Result<Message, Error> {
async fn read_block(&self, hash: &Hash) -> Result<Message, Error> {
let path = self.block_path(hash);
let mut f = match fs::File::open(&path).await {
@ -208,7 +208,7 @@ impl BlockManager {
}
/// Check if this node should have a block, but don't actually have it
pub async fn need_block(&self, hash: &Hash) -> Result<bool, Error> {
async fn need_block(&self, hash: &Hash) -> Result<bool, Error> {
let needed = self
.rc
.get(hash.as_ref())?

View file

@ -10,16 +10,14 @@ use crate::block::*;
#[derive(PartialEq, Clone, Debug, Serialize, Deserialize)]
pub struct BlockRef {
// Primary key
/// Hash of the block
/// Hash of the block, used as partition key
pub block: Hash,
// Sort key
// why a version on a hashed (probably immutable) piece of data?
/// Id of the Version for the object containing this block, used as sorting key
pub version: UUID,
trinity-1686a marked this conversation as resolved Outdated
Outdated
Review

version is the id of a Version object in the version table (which stores the different versions of objects in the buckets), not a version number for the BlockRef. i.e. BlockRef.version is the version id of an object that contains this block

version is the id of a Version object in the version table (which stores the different versions of objects in the buckets), not a version number for the BlockRef. i.e. `BlockRef.version` is the version id of an object that contains this block
// Keep track of deleted status
/// Is that block deleted
/// Is the Version that contains this block deleted
pub deleted: crdt::Bool,
}
trinity-1686a marked this conversation as resolved Outdated
Outdated
Review

-> is the Version (a version of an object in a bucket) that contains this block deleted

-> is the Version (a version of an object in a bucket) that contains this block deleted

View file

@ -6,7 +6,7 @@ use garage_table::*;
/// An api key
#[derive(PartialEq, Clone, Debug, Serialize, Deserialize)]
pub struct Key {
/// The id of the key (immutable)
/// The id of the key (immutable), used as partition key
trinity-1686a marked this conversation as resolved Outdated
Outdated
Review

please keep in the comment that this acts as the primary key

please keep in the comment that this acts as the primary key
pub key_id: String,
/// The secret_key associated
@ -19,6 +19,7 @@ pub struct Key {
pub deleted: crdt::Bool,
/// Buckets in which the key is authorized. Empty if `Key` is deleted
// CRDT interaction: deleted implies authorized_buckets is empty
pub authorized_buckets: crdt::LWWMap<String, PermissionSet>,
trinity-1686a marked this conversation as resolved Outdated
Outdated
Review

this comment needs to be kept somewhere

this comment needs to be kept somewhere
}

View file

@ -1,4 +1,3 @@
#![warn(missing_docs)]
#[macro_use]
extern crate log;

View file

@ -14,13 +14,13 @@ use crate::version_table::*;
/// An object
#[derive(PartialEq, Clone, Debug, Serialize, Deserialize)]
pub struct Object {
/// The bucket in which the object is stored
/// The bucket in which the object is stored, used as partition key
pub bucket: String,
/// The key at which the object is stored in its bucket
/// The key at which the object is stored in its bucket, used as sorting key
trinity-1686a marked this conversation as resolved Outdated
Outdated
Review

please keep in the comment that these two are used respectively as partition key (not primary key, my bad) and sort key, it's an import detail in understanding how Garage works internally

please keep in the comment that these two are used respectively as partition key (not primary key, my bad) and sort key, it's an import detail in understanding how Garage works internally
pub key: String,
/// The list of known versions of the object
/// The list of currenty stored versions of the object
trinity-1686a marked this conversation as resolved Outdated
Outdated
Review

doesn't keep all known versions, the comment is misleading

doesn't keep all known versions, the comment is misleading

I'm not sure what it store then

I'm not sure what it store then
versions: Vec<ObjectVersion>,
}
@ -53,7 +53,7 @@ impl Object {
}
}
/// Get a list of all versions known for `Object`
/// Get a list of currently stored versions of `Object`
trinity-1686a marked this conversation as resolved Outdated
Outdated
Review

s/known/currently stored

s/known/currently stored
pub fn versions(&self) -> &[ObjectVersion] {
&self.versions[..]
}
@ -77,7 +77,7 @@ pub enum ObjectVersionState {
Uploading(ObjectVersionHeaders),
/// The version is fully received
Complete(ObjectVersionData),
/// The version was never fully received
/// The version uploaded containded errors or the upload was explicitly aborted
trinity-1686a marked this conversation as resolved Outdated
Outdated
Review

it can never be received and stay in Uploading state forever if CompleteMultipartUpload/AbortMultipartUpload is never called (and it doesn't matter)

it can never be received and stay in Uploading state forever if CompleteMultipartUpload/AbortMultipartUpload is never called (and it doesn't matter)
Aborted,
}
@ -105,7 +105,7 @@ impl CRDT for ObjectVersionState {
/// Data about an object version
#[derive(PartialEq, Eq, PartialOrd, Ord, Clone, Debug, Serialize, Deserialize)]
pub enum ObjectVersionData {
/// The version is deleted
/// The object was deleted, this Version is a tombstone to mark it as such
trinity-1686a marked this conversation as resolved Outdated
Outdated
Review

the version represents a deletion of the object, i.e. at this version number the object doesn't exist (404)

the version represents a deletion of the object, i.e. at this version number the object doesn't exist (404)
DeleteMarker,
/// The object is short, it's stored inlined
Inline(ObjectVersionMeta, #[serde(with = "serde_bytes")] Vec<u8>),
@ -159,7 +159,7 @@ impl ObjectVersion {
}
}
/// Is the object version available (received and not deleted)
/// Is the object version available (received and not a tombstone)
trinity-1686a marked this conversation as resolved Outdated
Outdated
Review

is the object version available as an existing object (received and not a delete marker)

is the object version available as an existing object (received and not a delete marker)
pub fn is_data(&self) -> bool {
match self.state {
ObjectVersionState::Complete(ObjectVersionData::DeleteMarker) => false,

View file

@ -13,7 +13,7 @@ use crate::block_ref_table::*;
/// A version of an object
#[derive(PartialEq, Clone, Debug, Serialize, Deserialize)]
pub struct Version {
/// UUID of the version
/// UUID of the version, used as partition key
trinity-1686a marked this conversation as resolved Outdated
Outdated
Review

used as a partition key

used as a partition key
pub uuid: UUID,
// Actual data: the blocks for this version
@ -49,9 +49,9 @@ impl Version {
#[derive(PartialEq, Eq, Clone, Copy, Debug, Serialize, Deserialize)]
pub struct VersionBlockKey {
/// Number of the part, starting at 1
/// Number of the part
lx marked this conversation as resolved Outdated
Outdated
Review

not necessarily starting at 1, the client decides the part numbers and we don't care (for instance he can send parts 0, 1, 2, 14, 22, 37 and 42, and that's a fine object as long as these parts match the checklist that is sent in the CompleteMultipartUpload call)

not necessarily starting at 1, the client decides the part numbers and we don't care (for instance he can send parts 0, 1, 2, 14, 22, 37 and 42, and that's a fine object as long as these parts match the checklist that is sent in the CompleteMultipartUpload call)

Ok I've read s3 doc on multi-part upload and I hate it.
Next comment appear to be false too, it's offset in part, not in the whole file

Ok I've read s3 doc on multi-part upload and I hate it. Next comment appear to be false too, it's offset in part, not in the whole file
Outdated
Review

Yes, we don't know the offset in the whole file when a part is being uploaded because parts get uploaded independently from one another.

Yes, we don't know the offset in the whole file when a part is being uploaded because parts get uploaded independently from one another.
pub part_number: u64,
/// offset of the block in the file, starting at 0
/// Offset of this sub-segment in its part
pub offset: u64,
}

View file

@ -1,4 +1,3 @@
#![warn(missing_crate_level_docs, missing_docs)]
//! Crate containing rpc related functions and types used in Garage
#[macro_use]

View file

@ -1,4 +1,4 @@
/// Module containing structs related to membership management
//! Module containing structs related to membership management
trinity-1686a marked this conversation as resolved Outdated
Outdated
Review

//!

`//!`
use std::collections::HashMap;
use std::fmt::Write as FmtWrite;
use std::io::{Read, Write};
@ -96,7 +96,7 @@ pub struct System {
rpc_client: Arc<RpcClient<Message>>,
pub(crate) status: watch::Receiver<Arc<Status>>,
trinity-1686a marked this conversation as resolved Outdated
Outdated
Review

not "viewed by this node", all nodes should have equal rings (if not it's a bug)

not "viewed by this node", all nodes should have equal rings (if not it's a bug)
/// The ring, viewed by this node
/// The ring
pub ring: watch::Receiver<Arc<Ring>>,
update_lock: Mutex<Updaters>,
@ -114,9 +114,8 @@ struct Updaters {
#[derive(Debug, Clone)]
pub struct Status {
/// Mapping of each node id to its known status
// considering its sorted regularly, maybe it should be a btreeset?
pub nodes: HashMap<UUID, Arc<StatusEntry>>,
/// Hash of this entry
/// Hash of `nodes`, used to detect when nodes have different views of the cluster
pub hash: Hash,
}
@ -380,7 +379,7 @@ impl System {
id_option,
addr,
sys.rpc_client
.get_addr()
.by_addr()
.call(&addr, ping_msg_ref, PING_TIMEOUT)
.await,
)
@ -418,6 +417,8 @@ impl System {
}
} else if let Some(id) = id_option {
if let Some(st) = status.nodes.get_mut(id) {
// TODO this might double-increment the value as the counter is already
// incremented for any kind of failure in rpc_client
Outdated
Review

Actually no because the increment in rpc_client.rs is done by the RpcClient and not the RpcAddrClient, but here we are using the RpcAddrClient. (we could put this in a comment to make it clearer)

Actually no because the increment in `rpc_client.rs` is done by the `RpcClient` and not the `RpcAddrClient`, but here we are using the `RpcAddrClient`. (we could put this in a comment to make it clearer)
st.num_failures.fetch_add(1, Ordering::SeqCst);
if !st.is_up() {
warn!("Node {:?} seems to be down.", id);

View file

@ -1,4 +1,5 @@
//! Module containing types related to computing nodes which should receive a copy of data blocks
trinity-1686a marked this conversation as resolved Outdated
Outdated
Review

and metadata entries

and metadata entries
//! and metadata
use std::collections::{HashMap, HashSet};
use std::convert::TryInto;
@ -197,7 +198,7 @@ impl Ring {
top >> (16 - PARTITION_BITS)
}
trinity-1686a marked this conversation as resolved Outdated
Outdated
Review

and the first hash (of a partition key) that would fall in this partition

and the first hash (of a partition key) that would fall in this partition
/// Get the list of partitions and
/// Get the list of partitions and the first hash of a partition key that would fall in it
pub fn partitions(&self) -> Vec<(Partition, Hash)> {
let mut ret = vec![];
@ -211,6 +212,7 @@ impl Ring {
ret
}
trinity-1686a marked this conversation as resolved Outdated
Outdated
Review

TODO rename this function as it doesn't walk the ring anymore but just returns the nodes at the corresponding location. This is vocabulary from the previous implementation that used datacenter-aware ring walking and led to data imbalance.

TODO rename this function as it doesn't walk the ring anymore but just returns the nodes at the corresponding location. This is vocabulary from the previous implementation that used datacenter-aware ring walking and led to data imbalance.
// TODO rename this function as it no longer walk the ring
/// Walk the ring to find the n servers in which data should be replicated
pub fn walk_ring(&self, from: &Hash, n: usize) -> Vec<UUID> {
if self.ring.len() != 1 << PARTITION_BITS {

View file

@ -53,6 +53,7 @@ impl RequestStrategy {
self
}
/// Set if requests can be dropped after quorum has been reached
trinity-1686a marked this conversation as resolved Outdated
Outdated
Review

as a general rule: true for read requests, false for write requests

as a general rule: true for read requests, false for write requests
/// In general true for read requests, and false for write
pub fn interrupt_after_quorum(mut self, interrupt: bool) -> Self {
self.rs_interrupt_after_quorum = interrupt;
self
@ -103,8 +104,8 @@ impl<M: RpcMessage + 'static> RpcClient<M> {
self.local_handler.swap(Some(Arc::new((my_id, handler))));
}
/// Get the server address this client connect to
pub fn get_addr(&self) -> &RpcAddrClient<M> {
/// Get a RPC client to make calls using node's SocketAddr instead of its ID
trinity-1686a marked this conversation as resolved Outdated
Outdated
Review

Please don't call this get_addr, it's not what it does ! It does not return a SocketAddr or something like that. It is used to get the underlying RpcAddrClient which allows for RPC by specifing the target node's SocketAddr instead of their node IDs. Also, the comment is wrong.

Please don't call this `get_addr`, it's not what it does ! It does not return a SocketAddr or something like that. It is used to get the underlying RpcAddrClient which allows for RPC by specifing the target node's SocketAddr instead of their node IDs. Also, the comment is wrong.
pub fn by_addr(&self) -> &RpcAddrClient<M> {
&self.rpc_addr_client
}
@ -167,7 +168,7 @@ impl<M: RpcMessage + 'static> RpcClient<M> {
}
/// Make a RPC call to multiple servers, returning either a Vec of responses, or an error if
trinity-1686a marked this conversation as resolved Outdated
Outdated
Review

too many*

too many*
/// strategy could not be respected due to to many errors
/// strategy could not be respected due to too many errors
pub async fn try_call_many(
self: &Arc<Self>,
to: &[UUID],
@ -227,7 +228,7 @@ impl<M: RpcMessage + 'static> RpcClient<M> {
}
}
trinity-1686a marked this conversation as resolved Outdated
Outdated
Review

No. This is an RPC client which contains only the necessary logic to call RPC's to nodes by specifying their SocketAddr, and not by specifying their node IDs. It is used as an underlying layer for RpcClient.

No. This is an RPC client which contains only the necessary logic to call RPC's to nodes by specifying their SocketAddr, and not by specifying their node IDs. It is used as an underlying layer for RpcClient.
/// Endpoint to which send RPC
/// Thin wrapper arround an `RpcHttpClient` specifying the path of the request
pub struct RpcAddrClient<M: RpcMessage> {
phantom: PhantomData<M>,

View file

@ -1,4 +1,3 @@
#![warn(missing_docs)]
#![recursion_limit = "1024"]
#[macro_use]

View file

@ -16,7 +16,6 @@ pub trait TableReplication: Send + Sync {
fn write_nodes(&self, hash: &Hash) -> Vec<UUID>;
/// Responses needed to consider a write succesfull
fn write_quorum(&self) -> usize;
// this feels like its write_nodes().len() - write_quorum()
fn max_write_errors(&self) -> usize;
trinity-1686a marked this conversation as resolved Outdated
Outdated
Review

Most of the time it is, but not always for fully replicated tables

Most of the time it is, but not always for fully replicated tables
// Accessing partitions, for Merkle tree & sync

View file

@ -4,7 +4,7 @@ use garage_util::data::*;
use crate::crdt::CRDT;
/// Trait for partitionnable data
/// Trait for field used to partition data
trinity-1686a marked this conversation as resolved Outdated
Outdated
Review

It's not a trait for the data, but only for a field of the data that is used to partition it.

It's not a trait for the data, but only for a field of the data that is used to partition it.
pub trait PartitionKey {
/// Get the key used to partition
fn hash(&self) -> Hash;
@ -22,7 +22,7 @@ impl PartitionKey for Hash {
}
}
/// Trait for sortable data
/// Trait for field used to sort data
trinity-1686a marked this conversation as resolved Outdated
Outdated
Review

Same as above, it's only a trait of one of the fields of the data

Same as above, it's only a trait of one of the fields of the data
pub trait SortKey {
/// Get the key used to sort
fn sort_key(&self) -> &[u8];

View file

@ -1,5 +1,4 @@
//! Module containing error types used in Garage
#![allow(missing_docs)]
use err_derive::Error;
use hyper::StatusCode;
use std::io;

View file

@ -1,4 +1,3 @@
#![warn(missing_crate_level_docs, missing_docs)]
//! Crate containing common functions and types used in Garage
#[macro_use]

View file

@ -19,7 +19,7 @@ pub enum Error {
#[error(display = "Not found")]
NotFound,
/// The client requested a malformed path
/// The request contained an invalid UTF-8 sequence in its path or in other parameters
trinity-1686a marked this conversation as resolved Outdated
Outdated
Review

see garage_api/error.rs

see garage_api/error.rs
#[error(display = "Invalid UTF-8: {}", _0)]
InvalidUTF8(#[error(source)] std::str::Utf8Error),

View file

@ -1,4 +1,3 @@
#![deny(missing_crate_level_docs, missing_docs)]
//! Crate for handling web serving of s3 bucket
#[macro_use]
extern crate log;