Use multiple retransmit stage threads/sockets (#6279)
core/src/cluster_info.rs
@@ -31,7 +31,6 @@ use itertools::Itertools;
 use rand::SeedableRng;
 use rand::{thread_rng, Rng};
 use rand_chacha::ChaChaRng;
-use rayon::prelude::*;
 use solana_metrics::{datapoint_debug, inc_new_counter_debug, inc_new_counter_error};
 use solana_netutil::{
     bind_common, bind_common_in_range, bind_in_range, find_available_port_in_range,
@@ -747,7 +746,7 @@ impl ClusterInfo {
     ) -> Result<()> {
         trace!("retransmit orders {}", peers.len());
         let errs: Vec<_> = peers
-            .par_iter()
+            .iter()
             .filter(|v| v.id != slot_leader_pubkey.unwrap_or_default())
             .map(|v| {
                 let dest = if forwarded { &v.tvu_forwards } else { &v.tvu };
@@ -1565,7 +1564,7 @@ pub struct Sockets {
     pub tpu_forwards: Vec<UdpSocket>,
     pub broadcast: UdpSocket,
     pub repair: UdpSocket,
-    pub retransmit: UdpSocket,
+    pub retransmit_sockets: Vec<UdpSocket>,
     pub storage: Option<UdpSocket>,
 }
 
@@ -1613,7 +1612,7 @@ impl Node {
                 tpu_forwards: vec![],
                 broadcast,
                 repair,
-                retransmit,
+                retransmit_sockets: vec![retransmit],
                 storage: Some(storage),
                 ip_echo: None,
             },
@@ -1634,7 +1633,7 @@ impl Node {
             SocketAddr::new(IpAddr::V4(Ipv4Addr::new(127, 0, 0, 1)), rpc_pubsub_port);
 
         let broadcast = UdpSocket::bind("0.0.0.0:0").unwrap();
-        let retransmit = UdpSocket::bind("0.0.0.0:0").unwrap();
+        let retransmit_socket = UdpSocket::bind("0.0.0.0:0").unwrap();
         let storage = UdpSocket::bind("0.0.0.0:0").unwrap();
         let info = ContactInfo::new(
             pubkey,
@@ -1659,7 +1658,7 @@ impl Node {
                 tpu_forwards: vec![tpu_forwards],
                 broadcast,
                 repair,
-                retransmit,
+                retransmit_sockets: vec![retransmit_socket],
                 storage: None,
             },
         }
@@ -1692,16 +1691,18 @@ impl Node {
         let (tvu_port, tvu_sockets) = multi_bind_in_range(port_range, 8).expect("tvu multi_bind");
 
         let (tvu_forwards_port, tvu_forwards_sockets) =
-            multi_bind_in_range(port_range, 8).expect("tpu multi_bind");
+            multi_bind_in_range(port_range, 8).expect("tvu_forwards multi_bind");
 
         let (tpu_port, tpu_sockets) = multi_bind_in_range(port_range, 32).expect("tpu multi_bind");
 
         let (tpu_forwards_port, tpu_forwards_sockets) =
-            multi_bind_in_range(port_range, 8).expect("tpu multi_bind");
+            multi_bind_in_range(port_range, 8).expect("tpu_forwards multi_bind");
 
+        let (_, retransmit_sockets) =
+            multi_bind_in_range(port_range, 8).expect("retransmit multi_bind");
+
         let (_, repair) = Self::bind(port_range);
         let (_, broadcast) = Self::bind(port_range);
-        let (_, retransmit) = Self::bind(port_range);
 
         let info = ContactInfo::new(
             pubkey,
@@ -1727,7 +1728,7 @@ impl Node {
                 tpu_forwards: tpu_forwards_sockets,
                 broadcast,
                 repair,
-                retransmit,
+                retransmit_sockets,
                 storage: None,
                 ip_echo: Some(ip_echo),
             },
@@ -1774,6 +1775,7 @@ mod tests {
     use crate::shred::max_ticks_per_n_shreds;
     use crate::shred::{DataShredHeader, Shred};
     use crate::test_tx::test_tx;
+    use rayon::prelude::*;
     use solana_sdk::hash::Hash;
     use solana_sdk::signature::{Keypair, KeypairUtil};
     use std::collections::HashSet;
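The retransmit sockets above come from multi_bind_in_range, which binds several UDP sockets to the same local port so that each retransmit thread gets its own descriptor while the node still advertises a single retransmit address. A minimal sketch of that technique, assuming the socket2 crate (0.4+) on a Unix target; the actual solana_netutil implementation differs, this only illustrates the SO_REUSEPORT idea:

    use socket2::{Domain, Protocol, Socket, Type};
    use std::net::{SocketAddr, UdpSocket};

    // Bind `num` UDP sockets to one local port via SO_REUSEPORT so several
    // threads can send and receive independently on a single advertised port.
    fn multi_bind(port: u16, num: usize) -> std::io::Result<Vec<UdpSocket>> {
        let addr = SocketAddr::from(([0, 0, 0, 0], port));
        (0..num)
            .map(|_| -> std::io::Result<UdpSocket> {
                let sock = Socket::new(Domain::IPV4, Type::DGRAM, Some(Protocol::UDP))?;
                sock.set_reuse_port(true)?; // must be set before bind()
                sock.bind(&addr.into())?;
                Ok(sock.into()) // socket2::Socket -> std::net::UdpSocket
            })
            .collect()
    }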
core/src/retransmit_stage.rs
@@ -23,27 +23,38 @@ use std::{
     sync::atomic::AtomicBool,
     sync::mpsc::channel,
     sync::mpsc::RecvTimeoutError,
+    sync::Mutex,
     sync::{Arc, RwLock},
     thread::{self, Builder, JoinHandle},
     time::Duration,
 };
 
-pub fn retransmit(
+// Limit a given thread to consume about this many packets so that
+// it doesn't pull up too much work.
+const MAX_PACKET_BATCH_SIZE: usize = 100;
+
+fn retransmit(
     bank_forks: &Arc<RwLock<BankForks>>,
     leader_schedule_cache: &Arc<LeaderScheduleCache>,
     cluster_info: &Arc<RwLock<ClusterInfo>>,
-    r: &PacketReceiver,
+    r: &Arc<Mutex<PacketReceiver>>,
     sock: &UdpSocket,
+    id: u32,
 ) -> Result<()> {
     let timer = Duration::new(1, 0);
-    let packets = r.recv_timeout(timer)?;
+    let r_lock = r.lock().unwrap();
+    let packets = r_lock.recv_timeout(timer)?;
     let mut timer_start = Measure::start("retransmit");
     let mut total_packets = packets.packets.len();
     let mut packet_v = vec![packets];
-    while let Ok(nq) = r.try_recv() {
+    while let Ok(nq) = r_lock.try_recv() {
         total_packets += nq.packets.len();
         packet_v.push(nq);
+        if total_packets >= MAX_PACKET_BATCH_SIZE {
+            break;
+        }
     }
+    drop(r_lock);
 
     let r_bank = bank_forks.read().unwrap().working_bank();
     let bank_epoch = r_bank.get_leader_schedule_epoch(r_bank.slot());
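The Arc<Mutex<PacketReceiver>> plus MAX_PACKET_BATCH_SIZE gives simple work distribution over one channel: a thread holds the lock only while it pulls a capped batch, then releases it so a sibling thread can take the next batch. The same pattern in isolation, as a sketch with a plain mpsc channel of byte buffers standing in for PacketReceiver:

    use std::sync::mpsc::{Receiver, RecvTimeoutError};
    use std::sync::{Arc, Mutex};
    use std::time::Duration;

    const MAX_BATCH: usize = 100;

    // Pull one batch (blocking up to a second), then drain more without
    // blocking until the cap is reached; release the lock before processing.
    fn drain_batch(r: &Arc<Mutex<Receiver<Vec<u8>>>>) -> Result<Vec<Vec<u8>>, RecvTimeoutError> {
        let lock = r.lock().unwrap();
        let first = lock.recv_timeout(Duration::new(1, 0))?;
        let mut total = first.len();
        let mut batch = vec![first];
        while let Ok(next) = lock.try_recv() {
            total += next.len();
            batch.push(next);
            if total >= MAX_BATCH {
                break; // cap what one thread grabs so its siblings get work too
            }
        }
        drop(lock); // lock is released before the caller touches the batch
        Ok(batch)
    }

Without the cap, the first thread to wake could drain the whole backlog and leave the other retransmit threads idle.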
@@ -100,10 +111,11 @@ pub fn retransmit(
     }
     timer_start.stop();
     debug!(
-        "retransmitted {} packets in {}ms retransmit_time: {}ms",
+        "retransmitted {} packets in {}ms retransmit_time: {}ms id: {}",
         total_packets,
         timer_start.as_ms(),
-        retransmit_total
+        retransmit_total,
+        id,
     );
     datapoint_debug!("cluster_info-num_nodes", ("count", peers_len, i64));
     datapoint_debug!(
@@ -124,39 +136,48 @@ pub fn retransmit(
 /// * `cluster_info` - This structure needs to be updated and populated by the bank and via gossip.
 /// * `recycler` - Blob recycler.
 /// * `r` - Receive channel for blobs to be retransmitted to all the layer 1 nodes.
-fn retransmitter(
-    sock: Arc<UdpSocket>,
+pub fn retransmitter(
+    sockets: Arc<Vec<UdpSocket>>,
     bank_forks: Arc<RwLock<BankForks>>,
     leader_schedule_cache: &Arc<LeaderScheduleCache>,
     cluster_info: Arc<RwLock<ClusterInfo>>,
-    r: PacketReceiver,
-) -> JoinHandle<()> {
-    let bank_forks = bank_forks.clone();
-    let leader_schedule_cache = leader_schedule_cache.clone();
-    Builder::new()
-        .name("solana-retransmitter".to_string())
-        .spawn(move || {
-            trace!("retransmitter started");
-            loop {
-                if let Err(e) = retransmit(
-                    &bank_forks,
-                    &leader_schedule_cache,
-                    &cluster_info,
-                    &r,
-                    &sock,
-                ) {
-                    match e {
-                        Error::RecvTimeoutError(RecvTimeoutError::Disconnected) => break,
-                        Error::RecvTimeoutError(RecvTimeoutError::Timeout) => (),
-                        _ => {
-                            inc_new_counter_error!("streamer-retransmit-error", 1, 1);
-                        }
-                    }
-                }
-            }
-            trace!("exiting retransmitter");
-        })
-        .unwrap()
+    r: Arc<Mutex<PacketReceiver>>,
+) -> Vec<JoinHandle<()>> {
+    (0..sockets.len())
+        .map(|s| {
+            let sockets = sockets.clone();
+            let bank_forks = bank_forks.clone();
+            let leader_schedule_cache = leader_schedule_cache.clone();
+            let r = r.clone();
+            let cluster_info = cluster_info.clone();
+
+            Builder::new()
+                .name("solana-retransmitter".to_string())
+                .spawn(move || {
+                    trace!("retransmitter started");
+                    loop {
+                        if let Err(e) = retransmit(
+                            &bank_forks,
+                            &leader_schedule_cache,
+                            &cluster_info,
+                            &r,
+                            &sockets[s],
+                            s as u32,
+                        ) {
+                            match e {
+                                Error::RecvTimeoutError(RecvTimeoutError::Disconnected) => break,
+                                Error::RecvTimeoutError(RecvTimeoutError::Timeout) => (),
+                                _ => {
+                                    inc_new_counter_error!("streamer-retransmit-error", 1, 1);
+                                }
+                            }
+                        }
+                    }
+                    trace!("exiting retransmitter");
+                })
+                .unwrap()
+        })
+        .collect()
 }
 
 pub struct RetransmitStage {
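retransmitter now returns one join handle per socket: each thread owns sockets[s] by index while all of them share the receiver. A sketch of the same fan-out with hypothetical names, showing how the mutex guard is kept out of the send path:

    use std::net::{SocketAddr, UdpSocket};
    use std::sync::mpsc::Receiver;
    use std::sync::{Arc, Mutex};
    use std::thread::{Builder, JoinHandle};

    // Spawn one worker per socket; the workers compete for buffers on a
    // single shared channel but each transmits on its own UDP socket.
    fn spawn_workers(
        sockets: Arc<Vec<UdpSocket>>,
        r: Arc<Mutex<Receiver<Vec<u8>>>>,
        dest: SocketAddr,
    ) -> Vec<JoinHandle<()>> {
        (0..sockets.len())
            .map(|i| {
                let sockets = sockets.clone();
                let r = r.clone();
                Builder::new()
                    .name(format!("worker-{}", i))
                    .spawn(move || loop {
                        // Hold the lock only long enough to receive one buffer.
                        let buf = match r.lock().unwrap().recv() {
                            Ok(buf) => buf,
                            Err(_) => break, // channel closed: sender dropped
                        };
                        // The send happens outside the critical section.
                        let _ = sockets[i].send_to(&buf, dest);
                    })
                    .unwrap()
            })
            .collect()
    }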
@@ -172,7 +193,7 @@ impl RetransmitStage {
         leader_schedule_cache: &Arc<LeaderScheduleCache>,
         blocktree: Arc<Blocktree>,
         cluster_info: &Arc<RwLock<ClusterInfo>>,
-        retransmit_socket: Arc<UdpSocket>,
+        retransmit_sockets: Arc<Vec<UdpSocket>>,
         repair_socket: Arc<UdpSocket>,
         fetch_stage_receiver: PacketReceiver,
         exit: &Arc<AtomicBool>,
@@ -181,8 +202,9 @@ impl RetransmitStage {
     ) -> Self {
         let (retransmit_sender, retransmit_receiver) = channel();
 
+        let retransmit_receiver = Arc::new(Mutex::new(retransmit_receiver));
         let t_retransmit = retransmitter(
-            retransmit_socket,
+            retransmit_sockets,
             bank_forks.clone(),
             leader_schedule_cache,
             cluster_info.clone(),
@@ -215,7 +237,7 @@ impl RetransmitStage {
             },
         );
 
-        let thread_hdls = vec![t_retransmit];
+        let thread_hdls = t_retransmit;
         Self {
             thread_hdls,
             window_service,
@@ -275,7 +297,7 @@ mod tests {
         let mut cluster_info = ClusterInfo::new_with_invalid_keypair(other);
         cluster_info.insert_info(me);
 
-        let retransmit_socket = Arc::new(UdpSocket::bind("0.0.0.0:0").unwrap());
+        let retransmit_socket = Arc::new(vec![UdpSocket::bind("0.0.0.0:0").unwrap()]);
         let cluster_info = Arc::new(RwLock::new(cluster_info));
 
         let (retransmit_sender, retransmit_receiver) = channel();
@@ -284,7 +306,7 @@ mod tests {
             bank_forks,
             &leader_schedule_cache,
             cluster_info,
-            retransmit_receiver,
+            Arc::new(Mutex::new(retransmit_receiver)),
         );
         let _thread_hdls = vec![t_retransmit];
 
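thread_hdls is now the Vec<JoinHandle<()>> returned by retransmitter, so the stage's join presumably just iterates it; a sketch of that usual pattern (not code from this commit):

    use std::thread::JoinHandle;

    // Join every retransmit thread, propagating a panic from any of them.
    fn join_all(thread_hdls: Vec<JoinHandle<()>>) -> std::thread::Result<()> {
        for t in thread_hdls {
            t.join()?;
        }
        Ok(())
    }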
core/src/tvu.rs
@@ -49,7 +49,7 @@ pub struct Tvu {
 pub struct Sockets {
     pub fetch: Vec<UdpSocket>,
     pub repair: UdpSocket,
-    pub retransmit: UdpSocket,
+    pub retransmit: Vec<UdpSocket>,
     pub forwards: Vec<UdpSocket>,
 }
 
@@ -92,7 +92,7 @@ impl Tvu {
         let Sockets {
             repair: repair_socket,
             fetch: fetch_sockets,
-            retransmit: retransmit_socket,
+            retransmit: retransmit_sockets,
             forwards: tvu_forward_sockets,
         } = sockets;
 
@@ -118,7 +118,7 @@ impl Tvu {
             leader_schedule_cache,
             blocktree.clone(),
             &cluster_info,
-            Arc::new(retransmit_socket),
+            Arc::new(retransmit_sockets),
             repair_socket,
             fetch_receiver,
             &exit,
@@ -270,7 +270,7 @@ pub mod tests {
         {
             Sockets {
                 repair: target1.sockets.repair,
-                retransmit: target1.sockets.retransmit,
+                retransmit: target1.sockets.retransmit_sockets,
                 fetch: target1.sockets.tvu,
                 forwards: target1.sockets.tvu_forwards,
             }
core/src/validator.rs
@@ -274,9 +274,10 @@ impl Validator {
                 .expect("Failed to clone repair socket"),
             retransmit: node
                 .sockets
-                .retransmit
-                .try_clone()
-                .expect("Failed to clone retransmit socket"),
+                .retransmit_sockets
+                .iter()
+                .map(|s| s.try_clone().expect("Failed to clone retransmit socket"))
+                .collect(),
             fetch: node
                 .sockets
                 .tvu
@@ -378,7 +379,7 @@ impl Validator {
         );
         info!(
             "local retransmit address: {}",
-            node.sockets.retransmit.local_addr().unwrap()
+            node.sockets.retransmit_sockets[0].local_addr().unwrap()
         );
     }
 }
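UdpSocket does not implement Clone, so the validator duplicates each retransmit socket with try_clone(), which duplicates the underlying OS descriptor; every clone stays bound to the same port. The mapping in the hunk above is essentially this sketch, except that it unwraps with expect instead of returning a Result:

    use std::net::UdpSocket;

    // Duplicate each socket's file descriptor so another owner (here the
    // Tvu) can use the same bound ports.
    fn clone_sockets(sockets: &[UdpSocket]) -> std::io::Result<Vec<UdpSocket>> {
        sockets.iter().map(|s| s.try_clone()).collect()
    }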