Only have some nodes respond to latent heartbeats

Also only respond if they're at least 2 blocks behind, to minimize redundant
sending of blocks.
This commit is contained in:
Luke Parker 2024-04-17 21:54:10 -04:00
parent dac46c8d7d
commit 6b4df4f2c0
No known key found for this signature in database
4 changed files with 40 additions and 25 deletions

View file

@ -1292,6 +1292,7 @@ pub async fn run<D: Db, Pro: Processors, P: P2p>(
p2p.clone(), p2p.clone(),
cosign_channel.clone(), cosign_channel.clone(),
tributary_event_listener_4, tributary_event_listener_4,
<Ristretto as Ciphersuite>::generator() * key.deref(),
)); ));
// Handle all messages from processors // Handle all messages from processors

View file

@ -9,6 +9,8 @@ use std::{
use async_trait::async_trait; use async_trait::async_trait;
use rand_core::{RngCore, OsRng}; use rand_core::{RngCore, OsRng};
use ciphersuite::{Ciphersuite, Ristretto};
use scale::Encode; use scale::Encode;
use borsh::{BorshSerialize, BorshDeserialize}; use borsh::{BorshSerialize, BorshDeserialize};
use serai_client::{primitives::NetworkId, validator_sets::primitives::ValidatorSet, Serai}; use serai_client::{primitives::NetworkId, validator_sets::primitives::ValidatorSet, Serai};
@ -612,6 +614,7 @@ pub async fn handle_p2p_task<D: Db, P: P2p>(
p2p: P, p2p: P,
cosign_channel: mpsc::UnboundedSender<CosignedBlock>, cosign_channel: mpsc::UnboundedSender<CosignedBlock>,
mut tributary_event: broadcast::Receiver<TributaryEvent<D, P>>, mut tributary_event: broadcast::Receiver<TributaryEvent<D, P>>,
our_key: <Ristretto as Ciphersuite>::G,
) { ) {
let channels = Arc::new(RwLock::new(HashMap::<_, mpsc::UnboundedSender<Message<P>>>::new())); let channels = Arc::new(RwLock::new(HashMap::<_, mpsc::UnboundedSender<Message<P>>>::new()));
tokio::spawn({ tokio::spawn({
@ -631,6 +634,8 @@ pub async fn handle_p2p_task<D: Db, P: P2p>(
// Subscribe to the topic for this tributary // Subscribe to the topic for this tributary
p2p.subscribe(tributary.spec.set(), genesis).await; p2p.subscribe(tributary.spec.set(), genesis).await;
let spec_set = tributary.spec.set();
// Per-Tributary P2P message handler // Per-Tributary P2P message handler
tokio::spawn({ tokio::spawn({
let p2p = p2p.clone(); let p2p = p2p.clone();
@ -645,7 +650,7 @@ pub async fn handle_p2p_task<D: Db, P: P2p>(
P2pMessageKind::Tributary(msg_genesis) => { P2pMessageKind::Tributary(msg_genesis) => {
assert_eq!(msg_genesis, genesis); assert_eq!(msg_genesis, genesis);
log::trace!("handling message for tributary {:?}", tributary.spec.set()); log::trace!("handling message for tributary {:?}", spec_set);
if tributary.tributary.handle_message(&msg.msg).await { if tributary.tributary.handle_message(&msg.msg).await {
P2p::broadcast(&p2p, msg.kind, msg.msg).await; P2p::broadcast(&p2p, msg.kind, msg.msg).await;
} }
@ -668,18 +673,13 @@ pub async fn handle_p2p_task<D: Db, P: P2p>(
// Spawn a dedicated task as this may require loading large amounts of data // Spawn a dedicated task as this may require loading large amounts of data
// from disk and take a notable amount of time // from disk and take a notable amount of time
tokio::spawn(async move { tokio::spawn(async move {
/*
// Have sqrt(n) nodes reply with the blocks // Have sqrt(n) nodes reply with the blocks
let mut responders = (tributary.spec.n() as f32).sqrt().floor() as u64; #[allow(clippy::cast_possible_truncation, clippy::cast_sign_loss)]
let mut responders = f32::from(spec.n(&[])).sqrt().floor() as u64;
// Try to have at least 3 responders // Try to have at least 3 responders
if responders < 3 { if responders < 3 {
responders = tributary.spec.n().min(3).into(); responders = spec.n(&[]).min(3).into();
} }
*/
/*
// Have up to three nodes respond
let responders = u64::from(spec.n().min(3));
// Decide which nodes will respond by using the latest block's hash as a // Decide which nodes will respond by using the latest block's hash as a
// mutually agreed upon entropy source // mutually agreed upon entropy source
@ -689,7 +689,7 @@ pub async fn handle_p2p_task<D: Db, P: P2p>(
// (so the highest is 7, 8, 9) // (so the highest is 7, 8, 9)
// entropy % (10 + 1) - 3 = entropy % 8 = 0 ..= 7 // entropy % (10 + 1) - 3 = entropy % 8 = 0 ..= 7
let start = let start =
usize::try_from(entropy % (u64::from(spec.n() + 1) - responders)) usize::try_from(entropy % (u64::from(spec.n(&[]) + 1) - responders))
.unwrap(); .unwrap();
let mut selected = false; let mut selected = false;
for validator in &spec.validators() for validator in &spec.validators()
@ -706,21 +706,23 @@ pub async fn handle_p2p_task<D: Db, P: P2p>(
} }
log::debug!("received heartbeat and selected to respond"); log::debug!("received heartbeat and selected to respond");
*/
// Have every node respond // Have the selected nodes respond
// While we could only have a subset respond, LibP2P will sync all messages
// it isn't aware of
// It's cheaper to be aware from our disk than from over the network
// TODO: Spawn a dedicated topic for this heartbeat response? // TODO: Spawn a dedicated topic for this heartbeat response?
let mut latest = msg.msg[.. 32].try_into().unwrap(); let mut latest = msg.msg[.. 32].try_into().unwrap();
let mut to_send = vec![];
while let Some(next) = reader.block_after(&latest) { while let Some(next) = reader.block_after(&latest) {
to_send.push(next);
latest = next;
}
if to_send.len() > 1 {
for next in to_send {
let mut res = reader.block(&next).unwrap().serialize(); let mut res = reader.block(&next).unwrap().serialize();
res.extend(reader.commit(&next).unwrap()); res.extend(reader.commit(&next).unwrap());
// Also include the timestamp used within the Heartbeat // Also include the timestamp used within the Heartbeat
res.extend(&msg.msg[32 .. 40]); res.extend(&msg.msg[32 .. 40]);
p2p.send(msg.sender, P2pMessageKind::Block(spec.genesis()), res).await; p2p.send(msg.sender, P2pMessageKind::Block(spec.genesis()), res).await;
latest = next; }
} }
}); });
} }

View file

@ -3,6 +3,8 @@ use std::sync::Arc;
use rand_core::OsRng; use rand_core::OsRng;
use ciphersuite::{Ciphersuite, Ristretto};
use tokio::{ use tokio::{
sync::{mpsc, broadcast}, sync::{mpsc, broadcast},
time::sleep, time::sleep,
@ -35,12 +37,17 @@ async fn handle_p2p_test() {
let mut tributary_senders = vec![]; let mut tributary_senders = vec![];
let mut tributary_arcs = vec![]; let mut tributary_arcs = vec![];
for (p2p, tributary) in tributaries.drain(..) { for (i, (p2p, tributary)) in tributaries.drain(..).enumerate() {
let tributary = Arc::new(tributary); let tributary = Arc::new(tributary);
tributary_arcs.push(tributary.clone()); tributary_arcs.push(tributary.clone());
let (new_tributary_send, new_tributary_recv) = broadcast::channel(5); let (new_tributary_send, new_tributary_recv) = broadcast::channel(5);
let (cosign_send, _) = mpsc::unbounded_channel(); let (cosign_send, _) = mpsc::unbounded_channel();
tokio::spawn(handle_p2p_task(p2p, cosign_send, new_tributary_recv)); tokio::spawn(handle_p2p_task(
p2p,
cosign_send,
new_tributary_recv,
<Ristretto as Ciphersuite>::generator() * *keys[i],
));
new_tributary_send new_tributary_send
.send(TributaryEvent::NewTributary(ActiveTributary { spec: spec.clone(), tributary })) .send(TributaryEvent::NewTributary(ActiveTributary { spec: spec.clone(), tributary }))
.map_err(|_| "failed to send ActiveTributary") .map_err(|_| "failed to send ActiveTributary")

View file

@ -45,12 +45,17 @@ async fn sync_test() {
let mut tributary_senders = vec![]; let mut tributary_senders = vec![];
let mut tributary_arcs = vec![]; let mut tributary_arcs = vec![];
let mut p2p_threads = vec![]; let mut p2p_threads = vec![];
for (p2p, tributary) in tributaries.drain(..) { for (i, (p2p, tributary)) in tributaries.drain(..).enumerate() {
let tributary = Arc::new(tributary); let tributary = Arc::new(tributary);
tributary_arcs.push(tributary.clone()); tributary_arcs.push(tributary.clone());
let (new_tributary_send, new_tributary_recv) = broadcast::channel(5); let (new_tributary_send, new_tributary_recv) = broadcast::channel(5);
let (cosign_send, _) = mpsc::unbounded_channel(); let (cosign_send, _) = mpsc::unbounded_channel();
let thread = tokio::spawn(handle_p2p_task(p2p, cosign_send, new_tributary_recv)); let thread = tokio::spawn(handle_p2p_task(
p2p,
cosign_send,
new_tributary_recv,
<Ristretto as Ciphersuite>::generator() * *keys[i],
));
new_tributary_send new_tributary_send
.send(TributaryEvent::NewTributary(ActiveTributary { spec: spec.clone(), tributary })) .send(TributaryEvent::NewTributary(ActiveTributary { spec: spec.clone(), tributary }))
.map_err(|_| "failed to send ActiveTributary") .map_err(|_| "failed to send ActiveTributary")
@ -86,7 +91,7 @@ async fn sync_test() {
let syncer_tributary = Arc::new(syncer_tributary); let syncer_tributary = Arc::new(syncer_tributary);
let (syncer_tributary_send, syncer_tributary_recv) = broadcast::channel(5); let (syncer_tributary_send, syncer_tributary_recv) = broadcast::channel(5);
let (cosign_send, _) = mpsc::unbounded_channel(); let (cosign_send, _) = mpsc::unbounded_channel();
tokio::spawn(handle_p2p_task(syncer_p2p.clone(), cosign_send, syncer_tributary_recv)); tokio::spawn(handle_p2p_task(syncer_p2p.clone(), cosign_send, syncer_tributary_recv, syncer_key));
syncer_tributary_send syncer_tributary_send
.send(TributaryEvent::NewTributary(ActiveTributary { .send(TributaryEvent::NewTributary(ActiveTributary {
spec: spec.clone(), spec: spec.clone(),