2020-12-02 12:30:47 +00:00
|
|
|
use std::collections::HashMap;
|
|
|
|
use std::net::SocketAddr;
|
2022-09-01 13:54:11 +00:00
|
|
|
use std::pin::Pin;
|
2021-10-13 15:12:13 +00:00
|
|
|
use std::sync::atomic::{self, AtomicU32};
|
2020-12-07 12:35:24 +00:00
|
|
|
use std::sync::{Arc, Mutex};
|
2022-09-01 13:54:11 +00:00
|
|
|
use std::task::Poll;
|
2020-12-02 12:30:47 +00:00
|
|
|
|
2021-10-13 15:12:13 +00:00
|
|
|
use arc_swap::ArcSwapOption;
|
2022-07-21 15:34:53 +00:00
|
|
|
use async_trait::async_trait;
|
2022-07-22 10:45:38 +00:00
|
|
|
use bytes::Bytes;
|
2020-12-07 12:35:24 +00:00
|
|
|
use log::{debug, error, trace};
|
2020-12-02 12:30:47 +00:00
|
|
|
|
2022-07-21 15:34:53 +00:00
|
|
|
use futures::io::AsyncReadExt;
|
2022-09-01 13:54:11 +00:00
|
|
|
use futures::Stream;
|
2022-07-21 15:34:53 +00:00
|
|
|
use kuska_handshake::async_std::{handshake_client, BoxStream};
|
2020-12-02 12:30:47 +00:00
|
|
|
use tokio::net::TcpStream;
|
2021-10-13 15:12:13 +00:00
|
|
|
use tokio::select;
|
2020-12-02 12:30:47 +00:00
|
|
|
use tokio::sync::{mpsc, oneshot, watch};
|
2021-10-12 12:51:28 +00:00
|
|
|
use tokio_util::compat::*;
|
|
|
|
|
2022-02-18 19:10:46 +00:00
|
|
|
#[cfg(feature = "telemetry")]
|
|
|
|
use opentelemetry::{
|
|
|
|
trace::{FutureExt, Span, SpanKind, TraceContextExt, Tracer},
|
2022-02-18 19:23:10 +00:00
|
|
|
Context, KeyValue,
|
2022-02-18 19:10:46 +00:00
|
|
|
};
|
|
|
|
#[cfg(feature = "telemetry")]
|
|
|
|
use opentelemetry_contrib::trace::propagator::binary::*;
|
|
|
|
|
2020-12-02 12:30:47 +00:00
|
|
|
use crate::error::*;
|
2022-07-21 15:34:53 +00:00
|
|
|
use crate::message::*;
|
2020-12-02 12:30:47 +00:00
|
|
|
use crate::netapp::*;
|
2022-07-21 15:34:53 +00:00
|
|
|
use crate::recv::*;
|
|
|
|
use crate::send::*;
|
2022-07-22 10:45:38 +00:00
|
|
|
use crate::stream::*;
|
2020-12-02 12:30:47 +00:00
|
|
|
use crate::util::*;
|
|
|
|
|
2020-12-02 19:12:24 +00:00
|
|
|
pub(crate) struct ClientConn {
|
|
|
|
pub(crate) remote_addr: SocketAddr,
|
2020-12-12 20:14:15 +00:00
|
|
|
pub(crate) peer_id: NodeID,
|
2020-12-02 19:12:24 +00:00
|
|
|
|
2022-09-01 13:54:11 +00:00
|
|
|
query_send: ArcSwapOption<mpsc::UnboundedSender<SendItem>>,
|
2020-12-07 12:35:24 +00:00
|
|
|
|
2021-10-12 15:59:46 +00:00
|
|
|
next_query_number: AtomicU32,
|
2022-07-22 11:01:52 +00:00
|
|
|
inflight: Mutex<HashMap<RequestID, oneshot::Sender<ByteStream>>>,
|
2020-12-02 12:30:47 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
impl ClientConn {
|
|
|
|
pub(crate) async fn init(
|
|
|
|
netapp: Arc<NetApp>,
|
|
|
|
socket: TcpStream,
|
2020-12-12 20:14:15 +00:00
|
|
|
peer_id: NodeID,
|
2020-12-02 12:30:47 +00:00
|
|
|
) -> Result<(), Error> {
|
2021-10-12 12:51:28 +00:00
|
|
|
let remote_addr = socket.peer_addr()?;
|
|
|
|
let mut socket = socket.compat();
|
2020-12-02 12:30:47 +00:00
|
|
|
|
2022-02-21 15:43:17 +00:00
|
|
|
// Do handshake to authenticate and prove our identity to server
|
2020-12-02 12:30:47 +00:00
|
|
|
let handshake = handshake_client(
|
2021-10-12 12:51:28 +00:00
|
|
|
&mut socket,
|
2020-12-02 12:30:47 +00:00
|
|
|
netapp.netid.clone(),
|
2021-10-12 11:18:24 +00:00
|
|
|
netapp.id,
|
2020-12-02 12:30:47 +00:00
|
|
|
netapp.privkey.clone(),
|
2021-10-12 11:18:24 +00:00
|
|
|
peer_id,
|
2020-12-02 12:30:47 +00:00
|
|
|
)
|
|
|
|
.await?;
|
|
|
|
|
|
|
|
debug!(
|
|
|
|
"Handshake complete (client) with {}@{}",
|
2023-01-31 22:57:33 +00:00
|
|
|
hex::encode(peer_id),
|
2020-12-02 12:30:47 +00:00
|
|
|
remote_addr
|
|
|
|
);
|
|
|
|
|
2022-02-21 15:43:17 +00:00
|
|
|
// Create BoxStream layer that encodes content
|
2021-10-12 12:51:28 +00:00
|
|
|
let (read, write) = socket.split();
|
2022-02-21 15:43:17 +00:00
|
|
|
let (mut read, write) =
|
2020-12-02 12:30:47 +00:00
|
|
|
BoxStream::from_handshake(read, write, handshake, 0x8000).split_read_write();
|
|
|
|
|
2022-02-21 15:43:17 +00:00
|
|
|
// Before doing anything, receive version tag and
|
|
|
|
// check they are running the same version as us
|
|
|
|
let mut their_version_tag = VersionTag::default();
|
|
|
|
read.read_exact(&mut their_version_tag[..]).await?;
|
|
|
|
if their_version_tag != netapp.version_tag {
|
|
|
|
let msg = format!(
|
2022-02-21 15:57:07 +00:00
|
|
|
"different version tags: {} (theirs) vs. {} (ours)",
|
|
|
|
hex::encode(their_version_tag),
|
|
|
|
hex::encode(netapp.version_tag)
|
2022-02-21 15:43:17 +00:00
|
|
|
);
|
2022-02-21 15:57:07 +00:00
|
|
|
error!("Cannot connect to {}: {}", hex::encode(&peer_id[..8]), msg);
|
2022-02-21 15:43:17 +00:00
|
|
|
return Err(Error::VersionMismatch(msg));
|
|
|
|
}
|
|
|
|
|
|
|
|
// Build and launch stuff that manages sending requests client-side
|
2020-12-02 12:30:47 +00:00
|
|
|
let (query_send, query_recv) = mpsc::unbounded_channel();
|
|
|
|
|
2020-12-07 12:35:24 +00:00
|
|
|
let (stop_recv_loop, stop_recv_loop_recv) = watch::channel(false);
|
2020-12-02 12:30:47 +00:00
|
|
|
|
|
|
|
let conn = Arc::new(ClientConn {
|
|
|
|
remote_addr,
|
2021-10-12 11:18:24 +00:00
|
|
|
peer_id,
|
2021-10-12 15:59:46 +00:00
|
|
|
next_query_number: AtomicU32::from(RequestID::default()),
|
2021-10-13 15:12:13 +00:00
|
|
|
query_send: ArcSwapOption::new(Some(Arc::new(query_send))),
|
2020-12-07 12:35:24 +00:00
|
|
|
inflight: Mutex::new(HashMap::new()),
|
2020-12-02 12:30:47 +00:00
|
|
|
});
|
|
|
|
|
2021-10-12 11:18:24 +00:00
|
|
|
netapp.connected_as_client(peer_id, conn.clone());
|
2020-12-02 12:30:47 +00:00
|
|
|
|
2022-08-31 13:58:05 +00:00
|
|
|
let debug_name = format!("CLI {}", hex::encode(&peer_id[..8]));
|
|
|
|
|
2020-12-02 12:30:47 +00:00
|
|
|
tokio::spawn(async move {
|
2022-08-31 13:58:05 +00:00
|
|
|
let debug_name_2 = debug_name.clone();
|
|
|
|
let send_future = tokio::spawn(conn.clone().send_loop(query_recv, write, debug_name_2));
|
2021-10-13 15:12:13 +00:00
|
|
|
|
2020-12-02 12:30:47 +00:00
|
|
|
let conn2 = conn.clone();
|
2021-10-13 15:12:13 +00:00
|
|
|
let recv_future = tokio::spawn(async move {
|
|
|
|
select! {
|
2022-08-31 13:58:05 +00:00
|
|
|
r = conn2.recv_loop(read, debug_name) => r,
|
2021-10-13 15:12:13 +00:00
|
|
|
_ = await_exit(stop_recv_loop_recv) => Ok(())
|
|
|
|
}
|
|
|
|
});
|
|
|
|
|
|
|
|
send_future.await.log_err("ClientConn send_loop");
|
|
|
|
|
2021-10-13 15:14:26 +00:00
|
|
|
// FIXME: should do here: wait for inflight requests to all have their response
|
2021-10-13 15:12:13 +00:00
|
|
|
stop_recv_loop
|
|
|
|
.send(true)
|
|
|
|
.log_err("ClientConn send true to stop_recv_loop");
|
|
|
|
|
|
|
|
recv_future.await.log_err("ClientConn recv_loop");
|
|
|
|
|
|
|
|
// Make sure we don't wait on any more requests that won't
|
|
|
|
// have a response
|
|
|
|
conn.inflight.lock().unwrap().clear();
|
2020-12-02 12:30:47 +00:00
|
|
|
|
2020-12-12 20:14:15 +00:00
|
|
|
netapp.disconnected_as_client(&peer_id, conn);
|
2020-12-02 12:30:47 +00:00
|
|
|
});
|
|
|
|
|
|
|
|
Ok(())
|
|
|
|
}
|
|
|
|
|
|
|
|
pub fn close(&self) {
|
2021-10-13 15:12:13 +00:00
|
|
|
self.query_send.store(None);
|
2020-12-02 12:30:47 +00:00
|
|
|
}
|
|
|
|
|
2022-07-21 17:05:51 +00:00
|
|
|
pub(crate) async fn call<T>(
|
2020-12-02 12:30:47 +00:00
|
|
|
self: Arc<Self>,
|
2022-07-21 18:22:56 +00:00
|
|
|
req: Req<T>,
|
2022-02-21 11:04:09 +00:00
|
|
|
path: &str,
|
2020-12-02 12:30:47 +00:00
|
|
|
prio: RequestPriority,
|
2022-07-21 18:22:56 +00:00
|
|
|
) -> Result<Resp<T>, Error>
|
2020-12-02 12:30:47 +00:00
|
|
|
where
|
|
|
|
T: Message,
|
|
|
|
{
|
2021-10-13 15:12:13 +00:00
|
|
|
let query_send = self.query_send.load_full().ok_or(Error::ConnectionClosed)?;
|
|
|
|
|
2020-12-02 12:30:47 +00:00
|
|
|
let id = self
|
|
|
|
.next_query_number
|
2022-06-20 21:40:31 +00:00
|
|
|
.fetch_add(1, atomic::Ordering::Relaxed);
|
2021-10-12 16:13:07 +00:00
|
|
|
|
2022-02-18 18:01:23 +00:00
|
|
|
cfg_if::cfg_if! {
|
|
|
|
if #[cfg(feature = "telemetry")] {
|
2022-02-18 19:10:46 +00:00
|
|
|
let tracer = opentelemetry::global::tracer("netapp");
|
2022-02-18 19:23:10 +00:00
|
|
|
let mut span = tracer.span_builder(format!("RPC >> {}", path))
|
2022-04-07 08:31:37 +00:00
|
|
|
.with_kind(SpanKind::Client)
|
2022-02-18 19:10:46 +00:00
|
|
|
.start(&tracer);
|
|
|
|
let propagator = BinaryPropagator::new();
|
2023-01-31 13:45:43 +00:00
|
|
|
let telemetry_id: Bytes = propagator.serialize_into_bytes(span.span_context()).to_vec().into();
|
2022-02-18 18:01:23 +00:00
|
|
|
} else {
|
2022-07-22 10:45:38 +00:00
|
|
|
let telemetry_id: Bytes = Bytes::new();
|
2022-02-18 18:01:23 +00:00
|
|
|
}
|
|
|
|
};
|
|
|
|
|
|
|
|
// Encode request
|
2022-07-22 10:45:38 +00:00
|
|
|
let req_enc = req.into_enc(prio, path.as_bytes().to_vec().into(), telemetry_id);
|
|
|
|
let req_msg_len = req_enc.msg.len();
|
2022-09-01 10:15:50 +00:00
|
|
|
let (req_stream, req_order) = req_enc.encode();
|
2020-12-02 12:30:47 +00:00
|
|
|
|
2022-02-18 18:01:23 +00:00
|
|
|
// Send request through
|
2020-12-02 12:30:47 +00:00
|
|
|
let (resp_send, resp_recv) = oneshot::channel();
|
2020-12-07 12:35:24 +00:00
|
|
|
let old = self.inflight.lock().unwrap().insert(id, resp_send);
|
|
|
|
if let Some(old_ch) = old {
|
|
|
|
error!(
|
|
|
|
"Too many inflight requests! RequestID collision. Interrupting previous request."
|
|
|
|
);
|
2022-07-22 11:01:52 +00:00
|
|
|
let _ = old_ch.send(Box::pin(futures::stream::once(async move {
|
2022-09-01 10:15:50 +00:00
|
|
|
Err(std::io::Error::new(
|
|
|
|
std::io::ErrorKind::Other,
|
|
|
|
"RequestID collision, too many inflight requests",
|
|
|
|
))
|
2022-07-22 11:01:52 +00:00
|
|
|
})));
|
2020-12-07 12:35:24 +00:00
|
|
|
}
|
2020-12-02 12:30:47 +00:00
|
|
|
|
2022-07-25 13:04:52 +00:00
|
|
|
debug!(
|
|
|
|
"request: query_send {}, path {}, prio {} (serialized message: {} bytes)",
|
|
|
|
id, path, prio, req_msg_len
|
2022-07-22 10:45:38 +00:00
|
|
|
);
|
2022-02-18 19:23:10 +00:00
|
|
|
|
|
|
|
#[cfg(feature = "telemetry")]
|
2022-07-22 10:45:38 +00:00
|
|
|
span.set_attribute(KeyValue::new("len_query_msg", req_msg_len as i64));
|
2022-02-18 19:23:10 +00:00
|
|
|
|
2022-09-01 13:54:11 +00:00
|
|
|
query_send.send(SendItem::Stream(id, prio, req_order, req_stream))?;
|
|
|
|
|
|
|
|
let canceller = CancelOnDrop::new(id, query_send.as_ref().clone());
|
2020-12-02 12:30:47 +00:00
|
|
|
|
2022-02-18 19:10:46 +00:00
|
|
|
cfg_if::cfg_if! {
|
|
|
|
if #[cfg(feature = "telemetry")] {
|
2022-06-20 21:40:31 +00:00
|
|
|
let stream = resp_recv
|
2022-02-18 19:10:46 +00:00
|
|
|
.with_context(Context::current_with_span(span))
|
|
|
|
.await?;
|
|
|
|
} else {
|
2022-06-20 21:40:31 +00:00
|
|
|
let stream = resp_recv.await?;
|
2022-02-18 19:10:46 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2022-09-01 13:54:11 +00:00
|
|
|
let stream = Box::pin(canceller.for_stream(stream));
|
|
|
|
|
2022-07-22 11:01:52 +00:00
|
|
|
let resp_enc = RespEnc::decode(stream).await?;
|
2022-07-25 13:04:52 +00:00
|
|
|
debug!("client: got response to request {} (path {})", id, path);
|
2022-07-22 10:45:38 +00:00
|
|
|
Resp::from_enc(resp_enc)
|
2020-12-02 12:30:47 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// Empty impl: `ClientConn` overrides nothing, so every `SendLoop` item it uses
// (such as `send_loop`, called from `init`) is the trait's provided default.
impl SendLoop for ClientConn {}
|
|
|
|
|
|
|
|
#[async_trait]
|
|
|
|
impl RecvLoop for ClientConn {
|
2022-07-22 11:01:52 +00:00
|
|
|
fn recv_handler(self: &Arc<Self>, id: RequestID, stream: ByteStream) {
|
2022-06-20 21:40:31 +00:00
|
|
|
trace!("ClientConn recv_handler {}", id);
|
2020-12-07 15:00:12 +00:00
|
|
|
|
2020-12-07 12:35:24 +00:00
|
|
|
let mut inflight = self.inflight.lock().unwrap();
|
|
|
|
if let Some(ch) = inflight.remove(&id) {
|
2022-06-20 21:40:31 +00:00
|
|
|
if ch.send(stream).is_err() {
|
2020-12-07 12:35:24 +00:00
|
|
|
debug!("Could not send request response, probably because request was interrupted. Dropping response.");
|
|
|
|
}
|
2022-09-01 13:54:11 +00:00
|
|
|
} else {
|
|
|
|
debug!("Got unexpected response to request {}, dropping it", id);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// ----
|
|
|
|
|
|
|
|
struct CancelOnDrop {
|
|
|
|
id: RequestID,
|
|
|
|
query_send: mpsc::UnboundedSender<SendItem>,
|
|
|
|
}
|
|
|
|
|
|
|
|
impl CancelOnDrop {
|
|
|
|
fn new(id: RequestID, query_send: mpsc::UnboundedSender<SendItem>) -> Self {
|
|
|
|
Self { id, query_send }
|
|
|
|
}
|
|
|
|
fn for_stream(self, stream: ByteStream) -> CancelOnDropStream {
|
|
|
|
CancelOnDropStream {
|
|
|
|
cancel: Some(self),
|
2023-01-31 22:57:33 +00:00
|
|
|
stream,
|
2022-09-01 13:54:11 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
impl Drop for CancelOnDrop {
|
|
|
|
fn drop(&mut self) {
|
|
|
|
trace!("cancelling request {}", self.id);
|
|
|
|
let _ = self.query_send.send(SendItem::Cancel(self.id));
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
#[pin_project::pin_project]
|
|
|
|
struct CancelOnDropStream {
|
|
|
|
cancel: Option<CancelOnDrop>,
|
|
|
|
#[pin]
|
|
|
|
stream: ByteStream,
|
|
|
|
}
|
|
|
|
|
|
|
|
impl Stream for CancelOnDropStream {
|
|
|
|
type Item = Packet;
|
|
|
|
|
|
|
|
fn poll_next(
|
|
|
|
self: Pin<&mut Self>,
|
|
|
|
cx: &mut std::task::Context<'_>,
|
|
|
|
) -> Poll<Option<Self::Item>> {
|
|
|
|
let this = self.project();
|
|
|
|
let res = this.stream.poll_next(cx);
|
|
|
|
if matches!(res, Poll::Ready(None)) {
|
|
|
|
if let Some(c) = this.cancel.take() {
|
|
|
|
std::mem::forget(c)
|
|
|
|
}
|
2020-12-07 12:35:24 +00:00
|
|
|
}
|
2022-09-01 13:54:11 +00:00
|
|
|
res
|
|
|
|
}
|
|
|
|
|
|
|
|
fn size_hint(&self) -> (usize, Option<usize>) {
|
|
|
|
self.stream.size_hint()
|
2020-12-02 12:30:47 +00:00
|
|
|
}
|
|
|
|
}
|