3448 lines
		
	
	
		
			126 KiB
		
	
	
	
		
			Rust
		
	
	
	
	
	
			
		
		
	
	
			3448 lines
		
	
	
		
			126 KiB
		
	
	
	
		
			Rust
		
	
	
	
	
	
//! The `cluster_info` module defines a data structure that is shared by all the nodes in the network over
//! a gossip control plane.  The goal is to share small bits of off-chain information and detect and
//! repair partitions.
//!
//! This CRDT only supports a very limited set of types.  A map of Pubkey -> Versioned Struct.
//! The last version is always picked during an update.
//!
//! The network is arranged in layers:
//!
//! * layer 0 - Leader.
//! * layer 1 - As many nodes as we can fit
//! * layer 2 - Everyone else, if layer 1 is `2^10`, layer 2 should be able to fit `2^20` number of nodes.
//!
//! Bank needs to provide an interface for us to query the stake weight
 | |
| use crate::{
 | |
|     contact_info::ContactInfo,
 | |
|     crds_gossip::CrdsGossip,
 | |
|     crds_gossip_error::CrdsGossipError,
 | |
|     crds_gossip_pull::{CrdsFilter, ProcessPullStats, CRDS_GOSSIP_PULL_CRDS_TIMEOUT_MS},
 | |
|     crds_value::{
 | |
|         self, CrdsData, CrdsValue, CrdsValueLabel, EpochSlotsIndex, LowestSlot, SnapshotHash,
 | |
|         Version, Vote, MAX_WALLCLOCK,
 | |
|     },
 | |
|     epoch_slots::EpochSlots,
 | |
|     result::{Error, Result},
 | |
|     weighted_shuffle::weighted_shuffle,
 | |
| };
 | |
| 
 | |
| use rand::distributions::{Distribution, WeightedIndex};
 | |
| use rand::SeedableRng;
 | |
| use rand_chacha::ChaChaRng;
 | |
| use solana_sdk::sanitize::{Sanitize, SanitizeError};
 | |
| 
 | |
| use bincode::{serialize, serialized_size};
 | |
| use core::cmp;
 | |
| use itertools::Itertools;
 | |
| use rayon::iter::IntoParallelIterator;
 | |
| use rayon::iter::ParallelIterator;
 | |
| use rayon::ThreadPool;
 | |
| use solana_ledger::staking_utils;
 | |
| use solana_measure::measure::Measure;
 | |
| use solana_measure::thread_mem_usage;
 | |
| use solana_metrics::{datapoint_debug, inc_new_counter_debug, inc_new_counter_error};
 | |
| use solana_net_utils::{
 | |
|     bind_common, bind_common_in_range, bind_in_range, find_available_port_in_range,
 | |
|     multi_bind_in_range, PortRange,
 | |
| };
 | |
| use solana_perf::packet::{
 | |
|     limited_deserialize, to_packets_with_destination, Packet, Packets, PacketsRecycler,
 | |
|     PACKET_DATA_SIZE,
 | |
| };
 | |
| use solana_rayon_threadlimit::get_thread_count;
 | |
| use solana_runtime::bank_forks::BankForks;
 | |
| use solana_sdk::hash::Hash;
 | |
| use solana_sdk::{
 | |
|     clock::{Slot, DEFAULT_MS_PER_SLOT, DEFAULT_SLOTS_PER_EPOCH},
 | |
|     pubkey::Pubkey,
 | |
|     signature::{Keypair, Signable, Signature, Signer},
 | |
|     timing::timestamp,
 | |
|     transaction::Transaction,
 | |
| };
 | |
| use solana_streamer::sendmmsg::multicast;
 | |
| use solana_streamer::streamer::{PacketReceiver, PacketSender};
 | |
| use std::{
 | |
|     borrow::Cow,
 | |
|     cmp::min,
 | |
|     collections::{HashMap, HashSet},
 | |
|     fmt,
 | |
|     net::{IpAddr, Ipv4Addr, SocketAddr, TcpListener, UdpSocket},
 | |
|     ops::{Deref, DerefMut},
 | |
|     sync::atomic::{AtomicBool, AtomicU64, Ordering},
 | |
|     sync::{Arc, RwLock, RwLockReadGuard, RwLockWriteGuard},
 | |
|     thread::{sleep, Builder, JoinHandle},
 | |
|     time::{Duration, Instant},
 | |
| };
 | |
| 
 | |
| pub const VALIDATOR_PORT_RANGE: PortRange = (8000, 10_000);
 | |
| pub const MINIMUM_VALIDATOR_PORT_RANGE_WIDTH: u16 = 10; // VALIDATOR_PORT_RANGE must be at least this wide
 | |
| 
 | |
| /// The Data plane fanout size, also used as the neighborhood size
 | |
| pub const DATA_PLANE_FANOUT: usize = 200;
 | |
| /// milliseconds we sleep for between gossip requests
 | |
| pub const GOSSIP_SLEEP_MILLIS: u64 = 100;
 | |
| /// The maximum size of a bloom filter
 | |
| pub const MAX_BLOOM_SIZE: usize = MAX_CRDS_OBJECT_SIZE;
 | |
| pub const MAX_CRDS_OBJECT_SIZE: usize = 928;
 | |
| /// The maximum size of a protocol payload
 | |
| const MAX_PROTOCOL_PAYLOAD_SIZE: u64 = PACKET_DATA_SIZE as u64 - MAX_PROTOCOL_HEADER_SIZE;
 | |
| /// The largest protocol header size
 | |
| const MAX_PROTOCOL_HEADER_SIZE: u64 = 214;
 | |
| /// A hard limit on incoming gossip messages
 | |
| /// Chosen to be able to handle 1Gbps of pure gossip traffic
 | |
| /// 128MB/PACKET_DATA_SIZE
 | |
| const MAX_GOSSIP_TRAFFIC: usize = 128_000_000 / PACKET_DATA_SIZE;
 | |
| 
 | |
| /// Keep the number of snapshot hashes a node publishes under MAX_PROTOCOL_PAYLOAD_SIZE
 | |
| pub const MAX_SNAPSHOT_HASHES: usize = 16;
 | |
| 
 | |
/// Error kinds specific to cluster-info operations.
///
/// Variants compare by identity (`PartialEq`/`Eq`) and carry no payload.
#[derive(Debug, Eq, PartialEq)]
pub enum ClusterInfoError {
    NoPeers,
    NoLeader,
    BadContactInfo,
    BadGossipAddress,
}
 | |
/// A byte allowance together with the time it was last increased.
#[derive(Clone)]
pub struct DataBudget {
    /// Amount of bytes we have in the budget to send.
    bytes: usize,
    /// Last time that we upped the bytes count; used to detect when to up
    /// the bytes budget again.
    last_timestamp_ms: u64,
}
 | |
| 
 | |
| struct GossipWriteLock<'a> {
 | |
|     gossip: RwLockWriteGuard<'a, CrdsGossip>,
 | |
|     timer: Measure,
 | |
|     counter: &'a Counter,
 | |
| }
 | |
| 
 | |
| impl<'a> GossipWriteLock<'a> {
 | |
|     fn new(
 | |
|         gossip: RwLockWriteGuard<'a, CrdsGossip>,
 | |
|         label: &'static str,
 | |
|         counter: &'a Counter,
 | |
|     ) -> Self {
 | |
|         Self {
 | |
|             gossip,
 | |
|             timer: Measure::start(label),
 | |
|             counter,
 | |
|         }
 | |
|     }
 | |
| }
 | |
| 
 | |
| impl<'a> Deref for GossipWriteLock<'a> {
 | |
|     type Target = RwLockWriteGuard<'a, CrdsGossip>;
 | |
|     fn deref(&self) -> &Self::Target {
 | |
|         &self.gossip
 | |
|     }
 | |
| }
 | |
| 
 | |
| impl<'a> DerefMut for GossipWriteLock<'a> {
 | |
|     fn deref_mut(&mut self) -> &mut Self::Target {
 | |
|         &mut self.gossip
 | |
|     }
 | |
| }
 | |
| 
 | |
| impl<'a> Drop for GossipWriteLock<'a> {
 | |
|     fn drop(&mut self) {
 | |
|         self.counter.add_measure(&mut self.timer);
 | |
|     }
 | |
| }
 | |
| 
 | |
| struct GossipReadLock<'a> {
 | |
|     gossip: RwLockReadGuard<'a, CrdsGossip>,
 | |
|     timer: Measure,
 | |
|     counter: &'a Counter,
 | |
| }
 | |
| 
 | |
| impl<'a> GossipReadLock<'a> {
 | |
|     fn new(
 | |
|         gossip: RwLockReadGuard<'a, CrdsGossip>,
 | |
|         label: &'static str,
 | |
|         counter: &'a Counter,
 | |
|     ) -> Self {
 | |
|         Self {
 | |
|             gossip,
 | |
|             timer: Measure::start(label),
 | |
|             counter,
 | |
|         }
 | |
|     }
 | |
| }
 | |
| 
 | |
| impl<'a> Deref for GossipReadLock<'a> {
 | |
|     type Target = RwLockReadGuard<'a, CrdsGossip>;
 | |
|     fn deref(&self) -> &Self::Target {
 | |
|         &self.gossip
 | |
|     }
 | |
| }
 | |
| 
 | |
| impl<'a> Drop for GossipReadLock<'a> {
 | |
|     fn drop(&mut self) {
 | |
|         self.counter.add_measure(&mut self.timer);
 | |
|     }
 | |
| }
 | |
| 
 | |
| #[derive(Default)]
 | |
| struct Counter(AtomicU64);
 | |
| 
 | |
| impl Counter {
 | |
|     fn add_measure(&self, x: &mut Measure) {
 | |
|         x.stop();
 | |
|         self.0.fetch_add(x.as_us(), Ordering::Relaxed);
 | |
|     }
 | |
|     fn add_relaxed(&self, x: u64) {
 | |
|         self.0.fetch_add(x, Ordering::Relaxed);
 | |
|     }
 | |
|     fn clear(&self) -> u64 {
 | |
|         self.0.swap(0, Ordering::Relaxed)
 | |
|     }
 | |
| }
 | |
| 
 | |
| #[derive(Default)]
 | |
| struct GossipStats {
 | |
|     entrypoint: Counter,
 | |
|     entrypoint2: Counter,
 | |
|     push_vote_read: Counter,
 | |
|     vote_process_push: Counter,
 | |
|     get_votes: Counter,
 | |
|     get_accounts_hash: Counter,
 | |
|     get_snapshot_hash: Counter,
 | |
|     all_tvu_peers: Counter,
 | |
|     tvu_peers: Counter,
 | |
|     retransmit_peers: Counter,
 | |
|     repair_peers: Counter,
 | |
|     new_push_requests: Counter,
 | |
|     new_push_requests2: Counter,
 | |
|     new_push_requests_num: Counter,
 | |
|     filter_pull_response: Counter,
 | |
|     process_pull_response: Counter,
 | |
|     process_pull_response_count: Counter,
 | |
|     process_pull_response_len: Counter,
 | |
|     process_pull_response_timeout: Counter,
 | |
|     process_pull_response_fail_insert: Counter,
 | |
|     process_pull_response_fail_timeout: Counter,
 | |
|     process_pull_response_success: Counter,
 | |
|     process_pull_requests: Counter,
 | |
|     generate_pull_responses: Counter,
 | |
|     process_prune: Counter,
 | |
|     process_push_message: Counter,
 | |
|     prune_received_cache: Counter,
 | |
|     prune_message_count: Counter,
 | |
|     prune_message_len: Counter,
 | |
|     purge: Counter,
 | |
|     epoch_slots_lookup: Counter,
 | |
|     epoch_slots_push: Counter,
 | |
|     push_message: Counter,
 | |
|     new_pull_requests: Counter,
 | |
|     new_pull_requests_count: Counter,
 | |
|     mark_pull_request: Counter,
 | |
|     skip_pull_response_shred_version: Counter,
 | |
|     skip_pull_shred_version: Counter,
 | |
|     skip_push_message_shred_version: Counter,
 | |
|     push_message_count: Counter,
 | |
|     push_message_value_count: Counter,
 | |
|     push_response_count: Counter,
 | |
|     pull_requests_count: Counter,
 | |
| }
 | |
| 
 | |
| pub struct ClusterInfo {
 | |
|     /// The network
 | |
|     pub gossip: RwLock<CrdsGossip>,
 | |
|     /// set the keypair that will be used to sign crds values generated. It is unset only in tests.
 | |
|     pub(crate) keypair: Arc<Keypair>,
 | |
|     /// The network entrypoint
 | |
|     entrypoint: RwLock<Option<ContactInfo>>,
 | |
|     outbound_budget: RwLock<DataBudget>,
 | |
|     my_contact_info: RwLock<ContactInfo>,
 | |
|     id: Pubkey,
 | |
|     stats: GossipStats,
 | |
|     socket: UdpSocket,
 | |
| }
 | |
| 
 | |
| impl Default for ClusterInfo {
 | |
|     fn default() -> Self {
 | |
|         Self::new_with_invalid_keypair(ContactInfo::default())
 | |
|     }
 | |
| }
 | |
| 
 | |
/// Position of a node within the layered network layout.
#[derive(Clone, Default)]
pub struct Locality {
    /// The bounds of the neighborhood represented by this locality
    pub neighbor_bounds: (usize, usize),
    /// The `turbine` layer this locality is in
    pub layer_ix: usize,
    /// The bounds of the current layer
    pub layer_bounds: (usize, usize),
    /// The bounds of the next layer
    pub next_layer_bounds: Option<(usize, usize)>,
    /// The indices of the nodes that should be contacted in next layer
    pub next_layer_peers: Vec<usize>,
}

impl fmt::Debug for Locality {
    /// Hand-written debug output; `layer_bounds` is intentionally left as in
    /// the original format and is not printed.
    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
        let Self {
            neighbor_bounds,
            layer_ix,
            next_layer_bounds,
            next_layer_peers,
            ..
        } = self;
        f.write_fmt(format_args!(
            "Locality {{ neighborhood_bounds: {:?}, current_layer: {:?}, child_layer_bounds: {:?} child_layer_peers: {:?} }}",
            neighbor_bounds, layer_ix, next_layer_bounds, next_layer_peers
        ))
    }
}
 | |
| 
 | |
| #[derive(Debug, Default, Deserialize, Serialize, AbiExample)]
 | |
| pub struct PruneData {
 | |
|     /// Pubkey of the node that sent this prune data
 | |
|     pub pubkey: Pubkey,
 | |
|     /// Pubkeys of nodes that should be pruned
 | |
|     pub prunes: Vec<Pubkey>,
 | |
|     /// Signature of this Prune Message
 | |
|     pub signature: Signature,
 | |
|     /// The Pubkey of the intended node/destination for this message
 | |
|     pub destination: Pubkey,
 | |
|     /// Wallclock of the node that generated this message
 | |
|     pub wallclock: u64,
 | |
| }
 | |
| 
 | |
| impl Sanitize for PruneData {
 | |
|     fn sanitize(&self) -> std::result::Result<(), SanitizeError> {
 | |
|         if self.wallclock >= MAX_WALLCLOCK {
 | |
|             return Err(SanitizeError::ValueOutOfBounds);
 | |
|         }
 | |
|         Ok(())
 | |
|     }
 | |
| }
 | |
| 
 | |
| impl Signable for PruneData {
 | |
|     fn pubkey(&self) -> Pubkey {
 | |
|         self.pubkey
 | |
|     }
 | |
| 
 | |
|     fn signable_data(&self) -> Cow<[u8]> {
 | |
|         #[derive(Serialize)]
 | |
|         struct SignData {
 | |
|             pubkey: Pubkey,
 | |
|             prunes: Vec<Pubkey>,
 | |
|             destination: Pubkey,
 | |
|             wallclock: u64,
 | |
|         }
 | |
|         let data = SignData {
 | |
|             pubkey: self.pubkey,
 | |
|             prunes: self.prunes.clone(),
 | |
|             destination: self.destination,
 | |
|             wallclock: self.wallclock,
 | |
|         };
 | |
|         Cow::Owned(serialize(&data).expect("serialize PruneData"))
 | |
|     }
 | |
| 
 | |
|     fn get_signature(&self) -> Signature {
 | |
|         self.signature
 | |
|     }
 | |
| 
 | |
|     fn set_signature(&mut self, signature: Signature) {
 | |
|         self.signature = signature
 | |
|     }
 | |
| }
 | |
| 
 | |
| struct PullData {
 | |
|     pub from_addr: SocketAddr,
 | |
|     pub caller: CrdsValue,
 | |
|     pub filter: CrdsFilter,
 | |
| }
 | |
| 
 | |
| pub fn make_accounts_hashes_message(
 | |
|     keypair: &Keypair,
 | |
|     accounts_hashes: Vec<(Slot, Hash)>,
 | |
| ) -> Option<CrdsValue> {
 | |
|     let message = CrdsData::AccountsHashes(SnapshotHash::new(keypair.pubkey(), accounts_hashes));
 | |
|     Some(CrdsValue::new_signed(message, keypair))
 | |
| }
 | |
| 
 | |
| // TODO These messages should go through the gpu pipeline for spam filtering
 | |
| #[frozen_abi(digest = "CnN1gW2K2TRydGc84eYnQJwdTADPjQf6LJLZ4RP1QeoH")]
 | |
| #[derive(Serialize, Deserialize, Debug, AbiEnumVisitor, AbiExample)]
 | |
| #[allow(clippy::large_enum_variant)]
 | |
| enum Protocol {
 | |
|     /// Gossip protocol messages
 | |
|     PullRequest(CrdsFilter, CrdsValue),
 | |
|     PullResponse(Pubkey, Vec<CrdsValue>),
 | |
|     PushMessage(Pubkey, Vec<CrdsValue>),
 | |
|     PruneMessage(Pubkey, PruneData),
 | |
| }
 | |
| 
 | |
| impl Sanitize for Protocol {
 | |
|     fn sanitize(&self) -> std::result::Result<(), SanitizeError> {
 | |
|         match self {
 | |
|             Protocol::PullRequest(filter, val) => {
 | |
|                 filter.sanitize()?;
 | |
|                 val.sanitize()
 | |
|             }
 | |
|             Protocol::PullResponse(_, val) => val.sanitize(),
 | |
|             Protocol::PushMessage(_, val) => val.sanitize(),
 | |
|             Protocol::PruneMessage(_, val) => val.sanitize(),
 | |
|         }
 | |
|     }
 | |
| }
 | |
| 
 | |
/// Rating for pull requests.
///
/// A response table is generated as a 2-d table arranged by target nodes and
/// a list of responses for that node; `to`/`responses_index` is a location in
/// that table.
struct ResponseScore {
    /// Index of who the response is to.
    to: usize,
    /// Index into the list of responses for a given `to`.
    responses_index: usize,
    /// Relative score of the response.
    score: u64,
}
 | |
| 
 | |
| impl ClusterInfo {
 | |
|     /// Without a valid keypair gossip will not function. Only useful for tests.
 | |
|     pub fn new_with_invalid_keypair(contact_info: ContactInfo) -> Self {
 | |
|         Self::new(contact_info, Arc::new(Keypair::new()))
 | |
|     }
 | |
| 
 | |
|     pub fn new(contact_info: ContactInfo, keypair: Arc<Keypair>) -> Self {
 | |
|         let id = contact_info.id;
 | |
|         let me = Self {
 | |
|             gossip: RwLock::new(CrdsGossip::default()),
 | |
|             keypair,
 | |
|             entrypoint: RwLock::new(None),
 | |
|             outbound_budget: RwLock::new(DataBudget {
 | |
|                 bytes: 0,
 | |
|                 last_timestamp_ms: 0,
 | |
|             }),
 | |
|             my_contact_info: RwLock::new(contact_info),
 | |
|             id,
 | |
|             stats: GossipStats::default(),
 | |
|             socket: UdpSocket::bind("0.0.0.0:0").unwrap(),
 | |
|         };
 | |
|         {
 | |
|             let mut gossip = me.gossip.write().unwrap();
 | |
|             gossip.set_self(&id);
 | |
|             gossip.set_shred_version(me.my_shred_version());
 | |
|         }
 | |
|         me.insert_self();
 | |
|         me.push_self(&HashMap::new());
 | |
|         me
 | |
|     }
 | |
| 
 | |
|     // Should only be used by tests and simulations
 | |
|     pub fn clone_with_id(&self, new_id: &Pubkey) -> Self {
 | |
|         let mut gossip = self.gossip.read().unwrap().clone();
 | |
|         gossip.id = *new_id;
 | |
|         let mut my_contact_info = self.my_contact_info.read().unwrap().clone();
 | |
|         my_contact_info.id = *new_id;
 | |
|         ClusterInfo {
 | |
|             gossip: RwLock::new(gossip),
 | |
|             keypair: self.keypair.clone(),
 | |
|             entrypoint: RwLock::new(self.entrypoint.read().unwrap().clone()),
 | |
|             outbound_budget: RwLock::new(self.outbound_budget.read().unwrap().clone()),
 | |
|             my_contact_info: RwLock::new(my_contact_info),
 | |
|             id: *new_id,
 | |
|             stats: GossipStats::default(),
 | |
|             socket: UdpSocket::bind("0.0.0.0:0").unwrap(),
 | |
|         }
 | |
|     }
 | |
| 
 | |
|     pub fn update_contact_info<F>(&self, modify: F)
 | |
|     where
 | |
|         F: FnOnce(&mut ContactInfo),
 | |
|     {
 | |
|         let my_id = self.id();
 | |
|         modify(&mut self.my_contact_info.write().unwrap());
 | |
|         assert_eq!(self.my_contact_info.read().unwrap().id, my_id);
 | |
|         self.insert_self()
 | |
|     }
 | |
| 
 | |
|     fn push_self(&self, stakes: &HashMap<Pubkey, u64>) {
 | |
|         let now = timestamp();
 | |
|         self.my_contact_info.write().unwrap().wallclock = now;
 | |
|         let entry =
 | |
|             CrdsValue::new_signed(CrdsData::ContactInfo(self.my_contact_info()), &self.keypair);
 | |
|         let mut w_gossip = self.gossip.write().unwrap();
 | |
|         w_gossip.refresh_push_active_set(stakes);
 | |
|         w_gossip.process_push_message(&self.id(), vec![entry], now);
 | |
|     }
 | |
| 
 | |
|     // TODO kill insert_info, only used by tests
 | |
|     pub fn insert_info(&self, contact_info: ContactInfo) {
 | |
|         let value = CrdsValue::new_signed(CrdsData::ContactInfo(contact_info), &self.keypair);
 | |
|         let _ = self.gossip.write().unwrap().crds.insert(value, timestamp());
 | |
|     }
 | |
| 
 | |
|     pub fn set_entrypoint(&self, entrypoint: ContactInfo) {
 | |
|         *self.entrypoint.write().unwrap() = Some(entrypoint)
 | |
|     }
 | |
| 
 | |
|     pub fn id(&self) -> Pubkey {
 | |
|         self.id
 | |
|     }
 | |
| 
 | |
|     pub fn lookup_contact_info<F, Y>(&self, id: &Pubkey, map: F) -> Option<Y>
 | |
|     where
 | |
|         F: FnOnce(&ContactInfo) -> Y,
 | |
|     {
 | |
|         let entry = CrdsValueLabel::ContactInfo(*id);
 | |
|         self.gossip
 | |
|             .read()
 | |
|             .unwrap()
 | |
|             .crds
 | |
|             .lookup(&entry)
 | |
|             .and_then(CrdsValue::contact_info)
 | |
|             .map(map)
 | |
|     }
 | |
| 
 | |
|     pub fn lookup_contact_info_by_gossip_addr(
 | |
|         &self,
 | |
|         gossip_addr: &SocketAddr,
 | |
|     ) -> Option<ContactInfo> {
 | |
|         for versioned_value in self.gossip.read().unwrap().crds.table.values() {
 | |
|             if let Some(contact_info) = CrdsValue::contact_info(&versioned_value.value) {
 | |
|                 if contact_info.gossip == *gossip_addr {
 | |
|                     return Some(contact_info.clone());
 | |
|                 }
 | |
|             }
 | |
|         }
 | |
| 
 | |
|         None
 | |
|     }
 | |
| 
 | |
|     pub fn my_contact_info(&self) -> ContactInfo {
 | |
|         self.my_contact_info.read().unwrap().clone()
 | |
|     }
 | |
| 
 | |
|     pub fn my_shred_version(&self) -> u16 {
 | |
|         self.my_contact_info.read().unwrap().shred_version
 | |
|     }
 | |
| 
 | |
|     pub fn lookup_epoch_slots(&self, ix: EpochSlotsIndex) -> EpochSlots {
 | |
|         let entry = CrdsValueLabel::EpochSlots(ix, self.id());
 | |
|         self.gossip
 | |
|             .read()
 | |
|             .unwrap()
 | |
|             .crds
 | |
|             .lookup(&entry)
 | |
|             .and_then(CrdsValue::epoch_slots)
 | |
|             .cloned()
 | |
|             .unwrap_or_else(|| EpochSlots::new(self.id(), timestamp()))
 | |
|     }
 | |
| 
 | |
|     pub fn contact_info_trace(&self) -> String {
 | |
|         let now = timestamp();
 | |
|         let mut spy_nodes = 0;
 | |
|         let mut different_shred_nodes = 0;
 | |
|         let my_pubkey = self.id();
 | |
|         let my_shred_version = self.my_shred_version();
 | |
|         let nodes: Vec<_> = self
 | |
|             .all_peers()
 | |
|             .into_iter()
 | |
|             .filter_map(|(node, last_updated)| {
 | |
|                 if Self::is_spy_node(&node) {
 | |
|                     spy_nodes += 1;
 | |
|                 }
 | |
| 
 | |
|                 let node_version = self.get_node_version(&node.id);
 | |
|                 if my_shred_version != 0 && (node.shred_version != 0 && node.shred_version != my_shred_version) {
 | |
|                     different_shred_nodes += 1;
 | |
|                     None
 | |
|                 } else {
 | |
|                     fn addr_to_string(default_ip: &IpAddr, addr: &SocketAddr) -> String {
 | |
|                         if ContactInfo::is_valid_address(addr) {
 | |
|                             if &addr.ip() == default_ip {
 | |
|                                 addr.port().to_string()
 | |
|                             } else {
 | |
|                                 addr.to_string()
 | |
|                             }
 | |
|                         } else {
 | |
|                             "none".to_string()
 | |
|                         }
 | |
|                     }
 | |
|                     let ip_addr = node.gossip.ip();
 | |
|                     Some(format!(
 | |
|                         "{:15} {:2}| {:5} | {:44} |{:^15}| {:5}| {:5}| {:5}| {:5}| {:5}| {:5}| {:5}| {:5}| {:5}| {:5}| {}\n",
 | |
|                         if ContactInfo::is_valid_address(&node.gossip) {
 | |
|                             ip_addr.to_string()
 | |
|                         } else {
 | |
|                             "none".to_string()
 | |
|                         },
 | |
|                         if node.id == my_pubkey { "me" } else { "" }.to_string(),
 | |
|                         now.saturating_sub(last_updated),
 | |
|                         node.id.to_string(),
 | |
|                         if let Some(node_version) = node_version {
 | |
|                             node_version.to_string()
 | |
|                         } else {
 | |
|                             "-".to_string()
 | |
|                         },
 | |
|                         addr_to_string(&ip_addr, &node.gossip),
 | |
|                         addr_to_string(&ip_addr, &node.tpu),
 | |
|                         addr_to_string(&ip_addr, &node.tpu_forwards),
 | |
|                         addr_to_string(&ip_addr, &node.tvu),
 | |
|                         addr_to_string(&ip_addr, &node.tvu_forwards),
 | |
|                         addr_to_string(&ip_addr, &node.repair),
 | |
|                         addr_to_string(&ip_addr, &node.serve_repair),
 | |
|                         addr_to_string(&ip_addr, &node.rpc),
 | |
|                         addr_to_string(&ip_addr, &node.rpc_pubsub),
 | |
|                         addr_to_string(&ip_addr, &node.rpc_banks),
 | |
|                         node.shred_version,
 | |
|                     ))
 | |
|                 }
 | |
|             })
 | |
|             .collect();
 | |
| 
 | |
|         format!(
 | |
|             "IP Address        |Age(ms)| Node identifier                              \
 | |
|              | Version       |Gossip| TPU  |TPUfwd| TVU  |TVUfwd|Repair|ServeR| RPC  |PubSub|ShredVer\n\
 | |
|              ------------------+-------+----------------------------------------------+---------------+\
 | |
|              ------+------+------+------+------+------+------+------+------+--------\n\
 | |
|              {}\
 | |
|              Nodes: {}{}{}",
 | |
|             nodes.join(""),
 | |
|             nodes.len() - spy_nodes,
 | |
|             if spy_nodes > 0 {
 | |
|                 format!("\nSpies: {}", spy_nodes)
 | |
|             } else {
 | |
|                 "".to_string()
 | |
|             },
 | |
|             if different_shred_nodes > 0 {
 | |
|                 format!(
 | |
|                     "\nNodes with different shred version: {}",
 | |
|                     different_shred_nodes
 | |
|                 )
 | |
|             } else {
 | |
|                 "".to_string()
 | |
|             }
 | |
|         )
 | |
|     }
 | |
| 
 | |
|     pub fn push_lowest_slot(&self, id: Pubkey, min: Slot) {
 | |
|         let now = timestamp();
 | |
|         let last = self
 | |
|             .gossip
 | |
|             .read()
 | |
|             .unwrap()
 | |
|             .crds
 | |
|             .lookup(&CrdsValueLabel::LowestSlot(self.id()))
 | |
|             .and_then(|x| x.lowest_slot())
 | |
|             .map(|x| x.lowest)
 | |
|             .unwrap_or(0);
 | |
|         if min > last {
 | |
|             let entry = CrdsValue::new_signed(
 | |
|                 CrdsData::LowestSlot(0, LowestSlot::new(id, min, now)),
 | |
|                 &self.keypair,
 | |
|             );
 | |
|             self.gossip
 | |
|                 .write()
 | |
|                 .unwrap()
 | |
|                 .process_push_message(&self.id(), vec![entry], now);
 | |
|         }
 | |
|     }
 | |
| 
 | |
|     pub fn push_epoch_slots(&self, update: &[Slot]) {
 | |
|         let mut num = 0;
 | |
|         let mut current_slots: Vec<_> = (0..crds_value::MAX_EPOCH_SLOTS)
 | |
|             .filter_map(|ix| {
 | |
|                 Some((
 | |
|                     self.time_gossip_read_lock(
 | |
|                         "lookup_epoch_slots",
 | |
|                         &self.stats.epoch_slots_lookup,
 | |
|                     )
 | |
|                     .crds
 | |
|                     .lookup(&CrdsValueLabel::EpochSlots(ix, self.id()))
 | |
|                     .and_then(CrdsValue::epoch_slots)
 | |
|                     .and_then(|x| Some((x.wallclock, x.first_slot()?)))?,
 | |
|                     ix,
 | |
|                 ))
 | |
|             })
 | |
|             .collect();
 | |
|         current_slots.sort();
 | |
|         let min_slot: Slot = current_slots
 | |
|             .iter()
 | |
|             .map(|((_, s), _)| *s)
 | |
|             .min()
 | |
|             .unwrap_or(0);
 | |
|         let max_slot: Slot = update.iter().max().cloned().unwrap_or(0);
 | |
|         let total_slots = max_slot as isize - min_slot as isize;
 | |
|         // WARN if CRDS is not storing at least a full epoch worth of slots
 | |
|         if DEFAULT_SLOTS_PER_EPOCH as isize > total_slots
 | |
|             && crds_value::MAX_EPOCH_SLOTS as usize <= current_slots.len()
 | |
|         {
 | |
|             inc_new_counter_warn!("cluster_info-epoch_slots-filled", 1);
 | |
|             warn!(
 | |
|                 "EPOCH_SLOTS are filling up FAST {}/{}",
 | |
|                 total_slots,
 | |
|                 current_slots.len()
 | |
|             );
 | |
|         }
 | |
|         let mut reset = false;
 | |
|         let mut epoch_slot_index = current_slots.last().map(|(_, x)| *x).unwrap_or(0);
 | |
|         while num < update.len() {
 | |
|             let ix = (epoch_slot_index % crds_value::MAX_EPOCH_SLOTS) as u8;
 | |
|             let now = timestamp();
 | |
|             let mut slots = if !reset {
 | |
|                 self.lookup_epoch_slots(ix)
 | |
|             } else {
 | |
|                 EpochSlots::new(self.id(), now)
 | |
|             };
 | |
|             let n = slots.fill(&update[num..], now);
 | |
|             if n > 0 {
 | |
|                 let entry = CrdsValue::new_signed(CrdsData::EpochSlots(ix, slots), &self.keypair);
 | |
|                 self.time_gossip_write_lock("epcoh_slots_push", &self.stats.epoch_slots_push)
 | |
|                     .process_push_message(&self.id(), vec![entry], now);
 | |
|             }
 | |
|             num += n;
 | |
|             if num < update.len() {
 | |
|                 epoch_slot_index += 1;
 | |
|                 reset = true;
 | |
|             }
 | |
|         }
 | |
|     }
 | |
| 
 | |
|     fn time_gossip_read_lock<'a>(
 | |
|         &'a self,
 | |
|         label: &'static str,
 | |
|         counter: &'a Counter,
 | |
|     ) -> GossipReadLock<'a> {
 | |
|         GossipReadLock::new(self.gossip.read().unwrap(), label, counter)
 | |
|     }
 | |
| 
 | |
|     fn time_gossip_write_lock<'a>(
 | |
|         &'a self,
 | |
|         label: &'static str,
 | |
|         counter: &'a Counter,
 | |
|     ) -> GossipWriteLock<'a> {
 | |
|         GossipWriteLock::new(self.gossip.write().unwrap(), label, counter)
 | |
|     }
 | |
| 
 | |
|     pub fn push_message(&self, message: CrdsValue) {
 | |
|         let now = message.wallclock();
 | |
|         let id = message.pubkey();
 | |
|         self.time_gossip_write_lock("process_push_message", &self.stats.push_message)
 | |
|             .process_push_message(&id, vec![message], now);
 | |
|     }
 | |
| 
 | |
|     pub fn push_accounts_hashes(&self, accounts_hashes: Vec<(Slot, Hash)>) {
 | |
|         if accounts_hashes.len() > MAX_SNAPSHOT_HASHES {
 | |
|             warn!(
 | |
|                 "accounts hashes too large, ignored: {}",
 | |
|                 accounts_hashes.len(),
 | |
|             );
 | |
|             return;
 | |
|         }
 | |
| 
 | |
|         let message = CrdsData::AccountsHashes(SnapshotHash::new(self.id(), accounts_hashes));
 | |
|         self.push_message(CrdsValue::new_signed(message, &self.keypair));
 | |
|     }
 | |
| 
 | |
|     pub fn push_snapshot_hashes(&self, snapshot_hashes: Vec<(Slot, Hash)>) {
 | |
|         if snapshot_hashes.len() > MAX_SNAPSHOT_HASHES {
 | |
|             warn!(
 | |
|                 "snapshot hashes too large, ignored: {}",
 | |
|                 snapshot_hashes.len(),
 | |
|             );
 | |
|             return;
 | |
|         }
 | |
| 
 | |
|         let message = CrdsData::SnapshotHashes(SnapshotHash::new(self.id(), snapshot_hashes));
 | |
|         self.push_message(CrdsValue::new_signed(message, &self.keypair));
 | |
|     }
 | |
| 
 | |
|     pub fn push_vote(&self, tower_index: usize, vote: Transaction) {
 | |
|         let now = timestamp();
 | |
|         let vote = Vote::new(&self.id(), vote, now);
 | |
|         let vote_ix = {
 | |
|             let r_gossip =
 | |
|                 self.time_gossip_read_lock("gossip_read_push_vote", &self.stats.push_vote_read);
 | |
|             let current_votes: Vec<_> = (0..crds_value::MAX_VOTES)
 | |
|                 .filter_map(|ix| r_gossip.crds.lookup(&CrdsValueLabel::Vote(ix, self.id())))
 | |
|                 .collect();
 | |
|             CrdsValue::compute_vote_index(tower_index, current_votes)
 | |
|         };
 | |
|         let entry = CrdsValue::new_signed(CrdsData::Vote(vote_ix, vote), &self.keypair);
 | |
|         self.time_gossip_write_lock("push_vote_process_push", &self.stats.vote_process_push)
 | |
|             .process_push_message(&self.id(), vec![entry], now);
 | |
|     }
 | |
| 
 | |
|     pub fn send_vote(&self, vote: &Transaction) -> Result<()> {
 | |
|         let tpu = self.my_contact_info().tpu;
 | |
|         let buf = serialize(vote)?;
 | |
|         self.socket.send_to(&buf, &tpu)?;
 | |
|         Ok(())
 | |
|     }
 | |
| 
 | |
|     /// Get votes in the crds
 | |
|     /// * since - The timestamp of when the vote inserted must be greater than
 | |
|     /// since. This allows the bank to query for new votes only.
 | |
|     ///
 | |
|     /// * return - The votes, and the max timestamp from the new set.
 | |
|     pub fn get_votes(&self, since: u64) -> (Vec<CrdsValueLabel>, Vec<Transaction>, u64) {
 | |
|         let mut max_ts = since;
 | |
|         let (labels, txs): (Vec<CrdsValueLabel>, Vec<Transaction>) = self
 | |
|             .time_gossip_read_lock("get_votes", &self.stats.get_votes)
 | |
|             .crds
 | |
|             .table
 | |
|             .iter()
 | |
|             .filter(|(_, x)| x.insert_timestamp > since)
 | |
|             .filter_map(|(label, x)| {
 | |
|                 max_ts = std::cmp::max(x.insert_timestamp, max_ts);
 | |
|                 x.value
 | |
|                     .vote()
 | |
|                     .map(|v| (label.clone(), v.transaction.clone()))
 | |
|             })
 | |
|             .unzip();
 | |
|         inc_new_counter_info!("cluster_info-get_votes-count", txs.len());
 | |
|         (labels, txs, max_ts)
 | |
|     }
 | |
| 
 | |
|     pub fn get_snapshot_hash(&self, slot: Slot) -> Vec<(Pubkey, Hash)> {
 | |
|         self.time_gossip_read_lock("get_snapshot_hash", &self.stats.get_snapshot_hash)
 | |
|             .crds
 | |
|             .table
 | |
|             .values()
 | |
|             .filter_map(|x| x.value.snapshot_hash())
 | |
|             .filter_map(|x| {
 | |
|                 for (table_slot, hash) in &x.hashes {
 | |
|                     if *table_slot == slot {
 | |
|                         return Some((x.from, *hash));
 | |
|                     }
 | |
|                 }
 | |
|                 None
 | |
|             })
 | |
|             .collect()
 | |
|     }
 | |
| 
 | |
|     pub fn get_accounts_hash_for_node<F, Y>(&self, pubkey: &Pubkey, map: F) -> Option<Y>
 | |
|     where
 | |
|         F: FnOnce(&Vec<(Slot, Hash)>) -> Y,
 | |
|     {
 | |
|         self.time_gossip_read_lock("get_accounts_hash", &self.stats.get_accounts_hash)
 | |
|             .crds
 | |
|             .table
 | |
|             .get(&CrdsValueLabel::AccountsHashes(*pubkey))
 | |
|             .map(|x| &x.value.accounts_hash().unwrap().hashes)
 | |
|             .map(map)
 | |
|     }
 | |
| 
 | |
|     pub fn get_snapshot_hash_for_node<F, Y>(&self, pubkey: &Pubkey, map: F) -> Option<Y>
 | |
|     where
 | |
|         F: FnOnce(&Vec<(Slot, Hash)>) -> Y,
 | |
|     {
 | |
|         self.gossip
 | |
|             .read()
 | |
|             .unwrap()
 | |
|             .crds
 | |
|             .table
 | |
|             .get(&CrdsValueLabel::SnapshotHashes(*pubkey))
 | |
|             .map(|x| &x.value.snapshot_hash().unwrap().hashes)
 | |
|             .map(map)
 | |
|     }
 | |
| 
 | |
|     pub fn get_lowest_slot_for_node<F, Y>(
 | |
|         &self,
 | |
|         pubkey: &Pubkey,
 | |
|         since: Option<u64>,
 | |
|         map: F,
 | |
|     ) -> Option<Y>
 | |
|     where
 | |
|         F: FnOnce(&LowestSlot, u64) -> Y,
 | |
|     {
 | |
|         self.gossip
 | |
|             .read()
 | |
|             .unwrap()
 | |
|             .crds
 | |
|             .table
 | |
|             .get(&CrdsValueLabel::LowestSlot(*pubkey))
 | |
|             .filter(|x| {
 | |
|                 since
 | |
|                     .map(|since| x.insert_timestamp > since)
 | |
|                     .unwrap_or(true)
 | |
|             })
 | |
|             .map(|x| map(x.value.lowest_slot().unwrap(), x.insert_timestamp))
 | |
|     }
 | |
| 
 | |
|     pub fn get_epoch_slots_since(&self, since: Option<u64>) -> (Vec<EpochSlots>, Option<u64>) {
 | |
|         let vals: Vec<_> = self
 | |
|             .gossip
 | |
|             .read()
 | |
|             .unwrap()
 | |
|             .crds
 | |
|             .table
 | |
|             .values()
 | |
|             .filter(|x| {
 | |
|                 since
 | |
|                     .map(|since| x.insert_timestamp > since)
 | |
|                     .unwrap_or(true)
 | |
|             })
 | |
|             .filter_map(|x| Some((x.value.epoch_slots()?.clone(), x.insert_timestamp)))
 | |
|             .collect();
 | |
|         let max = vals.iter().map(|x| x.1).max().or(since);
 | |
|         let vec = vals.into_iter().map(|x| x.0).collect();
 | |
|         (vec, max)
 | |
|     }
 | |
| 
 | |
|     pub fn get_node_version(&self, pubkey: &Pubkey) -> Option<solana_version::Version> {
 | |
|         self.gossip
 | |
|             .read()
 | |
|             .unwrap()
 | |
|             .crds
 | |
|             .table
 | |
|             .get(&CrdsValueLabel::Version(*pubkey))
 | |
|             .map(|x| x.value.version())
 | |
|             .flatten()
 | |
|             .map(|version| version.version.clone())
 | |
|     }
 | |
| 
 | |
|     /// all validators that have a valid rpc port regardless of `shred_version`.
 | |
|     pub fn all_rpc_peers(&self) -> Vec<ContactInfo> {
 | |
|         self.gossip
 | |
|             .read()
 | |
|             .unwrap()
 | |
|             .crds
 | |
|             .table
 | |
|             .values()
 | |
|             .filter_map(|x| x.value.contact_info())
 | |
|             .filter(|x| x.id != self.id() && ContactInfo::is_valid_address(&x.rpc))
 | |
|             .cloned()
 | |
|             .collect()
 | |
|     }
 | |
| 
 | |
|     // All nodes in gossip (including spy nodes) and the last time we heard about them
 | |
|     pub(crate) fn all_peers(&self) -> Vec<(ContactInfo, u64)> {
 | |
|         self.gossip
 | |
|             .read()
 | |
|             .unwrap()
 | |
|             .crds
 | |
|             .table
 | |
|             .values()
 | |
|             .filter_map(|x| {
 | |
|                 x.value
 | |
|                     .contact_info()
 | |
|                     .map(|ci| (ci.clone(), x.local_timestamp))
 | |
|             })
 | |
|             .collect()
 | |
|     }
 | |
| 
 | |
|     pub fn gossip_peers(&self) -> Vec<ContactInfo> {
 | |
|         let me = self.id();
 | |
|         self.gossip
 | |
|             .read()
 | |
|             .unwrap()
 | |
|             .crds
 | |
|             .table
 | |
|             .values()
 | |
|             .filter_map(|x| x.value.contact_info())
 | |
|             // shred_version not considered for gossip peers (ie, spy nodes do not set shred_version)
 | |
|             .filter(|x| x.id != me && ContactInfo::is_valid_address(&x.gossip))
 | |
|             .cloned()
 | |
|             .collect()
 | |
|     }
 | |
| 
 | |
|     /// all validators that have a valid tvu port regardless of `shred_version`.
 | |
|     pub fn all_tvu_peers(&self) -> Vec<ContactInfo> {
 | |
|         self.time_gossip_read_lock("all_tvu_peers", &self.stats.all_tvu_peers)
 | |
|             .crds
 | |
|             .table
 | |
|             .values()
 | |
|             .filter_map(|x| x.value.contact_info())
 | |
|             .filter(|x| ContactInfo::is_valid_address(&x.tvu) && x.id != self.id())
 | |
|             .cloned()
 | |
|             .collect()
 | |
|     }
 | |
| 
 | |
|     /// all validators that have a valid tvu port and are on the same `shred_version`.
 | |
|     pub fn tvu_peers(&self) -> Vec<ContactInfo> {
 | |
|         self.time_gossip_read_lock("tvu_peers", &self.stats.tvu_peers)
 | |
|             .crds
 | |
|             .table
 | |
|             .values()
 | |
|             .filter_map(|x| x.value.contact_info())
 | |
|             .filter(|x| {
 | |
|                 ContactInfo::is_valid_address(&x.tvu)
 | |
|                     && x.id != self.id()
 | |
|                     && x.shred_version == self.my_shred_version()
 | |
|             })
 | |
|             .cloned()
 | |
|             .collect()
 | |
|     }
 | |
| 
 | |
|     /// all peers that have a valid tvu
 | |
|     pub fn retransmit_peers(&self) -> Vec<ContactInfo> {
 | |
|         self.time_gossip_read_lock("retransmit_peers", &self.stats.retransmit_peers)
 | |
|             .crds
 | |
|             .table
 | |
|             .values()
 | |
|             .filter_map(|x| x.value.contact_info())
 | |
|             .filter(|x| {
 | |
|                 x.id != self.id()
 | |
|                     && x.shred_version == self.my_shred_version()
 | |
|                     && ContactInfo::is_valid_address(&x.tvu)
 | |
|                     && ContactInfo::is_valid_address(&x.tvu_forwards)
 | |
|             })
 | |
|             .cloned()
 | |
|             .collect()
 | |
|     }
 | |
| 
 | |
|     /// all tvu peers with valid gossip addrs that likely have the slot being requested
 | |
|     pub fn repair_peers(&self, slot: Slot) -> Vec<ContactInfo> {
 | |
|         let mut time = Measure::start("repair_peers");
 | |
|         let ret = ClusterInfo::tvu_peers(self)
 | |
|             .into_iter()
 | |
|             .filter(|x| {
 | |
|                 x.id != self.id()
 | |
|                     && x.shred_version == self.my_shred_version()
 | |
|                     && ContactInfo::is_valid_address(&x.serve_repair)
 | |
|                     && {
 | |
|                         self.get_lowest_slot_for_node(&x.id, None, |lowest_slot, _| {
 | |
|                             lowest_slot.lowest <= slot
 | |
|                         })
 | |
|                         .unwrap_or_else(|| /* fallback to legacy behavior */ true)
 | |
|                     }
 | |
|             })
 | |
|             .collect();
 | |
|         self.stats.repair_peers.add_measure(&mut time);
 | |
|         ret
 | |
|     }
 | |
| 
 | |
|     fn is_spy_node(contact_info: &ContactInfo) -> bool {
 | |
|         !ContactInfo::is_valid_address(&contact_info.tpu)
 | |
|             || !ContactInfo::is_valid_address(&contact_info.gossip)
 | |
|             || !ContactInfo::is_valid_address(&contact_info.tvu)
 | |
|     }
 | |
| 
 | |
|     fn sorted_stakes_with_index<S: std::hash::BuildHasher>(
 | |
|         peers: &[ContactInfo],
 | |
|         stakes: Option<Arc<HashMap<Pubkey, u64, S>>>,
 | |
|     ) -> Vec<(u64, usize)> {
 | |
|         let stakes_and_index: Vec<_> = peers
 | |
|             .iter()
 | |
|             .enumerate()
 | |
|             .map(|(i, c)| {
 | |
|                 // For stake weighted shuffle a valid weight is atleast 1. Weight 0 is
 | |
|                 // assumed to be missing entry. So let's make sure stake weights are atleast 1
 | |
|                 let stake = 1.max(
 | |
|                     stakes
 | |
|                         .as_ref()
 | |
|                         .map_or(1, |stakes| *stakes.get(&c.id).unwrap_or(&1)),
 | |
|                 );
 | |
|                 (stake, i)
 | |
|             })
 | |
|             .sorted_by(|(l_stake, l_info), (r_stake, r_info)| {
 | |
|                 if r_stake == l_stake {
 | |
|                     peers[*r_info].id.cmp(&peers[*l_info].id)
 | |
|                 } else {
 | |
|                     r_stake.cmp(&l_stake)
 | |
|                 }
 | |
|             })
 | |
|             .collect();
 | |
| 
 | |
|         stakes_and_index
 | |
|     }
 | |
| 
 | |
|     fn stake_weighted_shuffle(
 | |
|         stakes_and_index: &[(u64, usize)],
 | |
|         seed: [u8; 32],
 | |
|     ) -> Vec<(u64, usize)> {
 | |
|         let stake_weights = stakes_and_index.iter().map(|(w, _)| *w).collect();
 | |
| 
 | |
|         let shuffle = weighted_shuffle(stake_weights, seed);
 | |
| 
 | |
|         shuffle.iter().map(|x| stakes_and_index[*x]).collect()
 | |
|     }
 | |
| 
 | |
|     // Return sorted_retransmit_peers(including self) and their stakes
 | |
|     pub fn sorted_retransmit_peers_and_stakes(
 | |
|         &self,
 | |
|         stakes: Option<Arc<HashMap<Pubkey, u64>>>,
 | |
|     ) -> (Vec<ContactInfo>, Vec<(u64, usize)>) {
 | |
|         let mut peers = self.retransmit_peers();
 | |
|         // insert "self" into this list for the layer and neighborhood computation
 | |
|         peers.push(self.my_contact_info());
 | |
|         let stakes_and_index = ClusterInfo::sorted_stakes_with_index(&peers, stakes);
 | |
|         (peers, stakes_and_index)
 | |
|     }
 | |
| 
 | |
|     /// Return sorted Retransmit peers and index of `Self.id()` as if it were in that list
 | |
|     pub fn shuffle_peers_and_index(
 | |
|         id: &Pubkey,
 | |
|         peers: &[ContactInfo],
 | |
|         stakes_and_index: &[(u64, usize)],
 | |
|         seed: [u8; 32],
 | |
|     ) -> (usize, Vec<(u64, usize)>) {
 | |
|         let shuffled_stakes_and_index = ClusterInfo::stake_weighted_shuffle(stakes_and_index, seed);
 | |
|         let mut self_index = 0;
 | |
|         shuffled_stakes_and_index
 | |
|             .iter()
 | |
|             .enumerate()
 | |
|             .for_each(|(i, (_stake, index))| {
 | |
|                 if &peers[*index].id == id {
 | |
|                     self_index = i;
 | |
|                 }
 | |
|             });
 | |
|         (self_index, shuffled_stakes_and_index)
 | |
|     }
 | |
| 
 | |
|     /// compute broadcast table
 | |
|     pub fn tpu_peers(&self) -> Vec<ContactInfo> {
 | |
|         self.gossip
 | |
|             .read()
 | |
|             .unwrap()
 | |
|             .crds
 | |
|             .table
 | |
|             .values()
 | |
|             .filter_map(|x| x.value.contact_info())
 | |
|             .filter(|x| x.id != self.id() && ContactInfo::is_valid_address(&x.tpu))
 | |
|             .cloned()
 | |
|             .collect()
 | |
|     }
 | |
| 
 | |
|     /// Given a node count and fanout, it calculates how many layers are needed and at what index each layer begins.
 | |
|     pub fn describe_data_plane(nodes: usize, fanout: usize) -> (usize, Vec<usize>) {
 | |
|         let mut layer_indices: Vec<usize> = vec![0];
 | |
|         if nodes == 0 {
 | |
|             (0, vec![])
 | |
|         } else if nodes <= fanout {
 | |
|             // single layer data plane
 | |
|             (1, layer_indices)
 | |
|         } else {
 | |
|             //layer 1 is going to be the first num fanout nodes, so exclude those
 | |
|             let mut remaining_nodes = nodes - fanout;
 | |
|             layer_indices.push(fanout);
 | |
|             let mut num_layers = 2;
 | |
|             // fanout * num_nodes in a neighborhood, which is also fanout.
 | |
|             let mut layer_capacity = fanout * fanout;
 | |
|             while remaining_nodes > 0 {
 | |
|                 if remaining_nodes > layer_capacity {
 | |
|                     // Needs more layers.
 | |
|                     num_layers += 1;
 | |
|                     remaining_nodes -= layer_capacity;
 | |
|                     let end = *layer_indices.last().unwrap();
 | |
|                     layer_indices.push(layer_capacity + end);
 | |
| 
 | |
|                     // Next layer's capacity
 | |
|                     layer_capacity *= fanout;
 | |
|                 } else {
 | |
|                     //everything will now fit in the layers we have
 | |
|                     let end = *layer_indices.last().unwrap();
 | |
|                     layer_indices.push(layer_capacity + end);
 | |
|                     break;
 | |
|                 }
 | |
|             }
 | |
|             assert_eq!(num_layers, layer_indices.len() - 1);
 | |
|             (num_layers, layer_indices)
 | |
|         }
 | |
|     }
 | |
| 
 | |
|     fn localize_item(
 | |
|         layer_indices: &[usize],
 | |
|         fanout: usize,
 | |
|         select_index: usize,
 | |
|         curr_index: usize,
 | |
|     ) -> Option<Locality> {
 | |
|         let end = layer_indices.len() - 1;
 | |
|         let next = min(end, curr_index + 1);
 | |
|         let layer_start = layer_indices[curr_index];
 | |
|         // localized if selected index lies within the current layer's bounds
 | |
|         let localized = select_index >= layer_start && select_index < layer_indices[next];
 | |
|         if localized {
 | |
|             let mut locality = Locality::default();
 | |
|             let hood_ix = (select_index - layer_start) / fanout;
 | |
|             match curr_index {
 | |
|                 _ if curr_index == 0 => {
 | |
|                     locality.layer_ix = 0;
 | |
|                     locality.layer_bounds = (0, fanout);
 | |
|                     locality.neighbor_bounds = locality.layer_bounds;
 | |
| 
 | |
|                     if next == end {
 | |
|                         locality.next_layer_bounds = None;
 | |
|                         locality.next_layer_peers = vec![];
 | |
|                     } else {
 | |
|                         locality.next_layer_bounds =
 | |
|                             Some((layer_indices[next], layer_indices[next + 1]));
 | |
|                         locality.next_layer_peers = ClusterInfo::next_layer_peers(
 | |
|                             select_index,
 | |
|                             hood_ix,
 | |
|                             layer_indices[next],
 | |
|                             fanout,
 | |
|                         );
 | |
|                     }
 | |
|                 }
 | |
|                 _ if curr_index == end => {
 | |
|                     locality.layer_ix = end;
 | |
|                     locality.layer_bounds = (end - fanout, end);
 | |
|                     locality.neighbor_bounds = locality.layer_bounds;
 | |
|                     locality.next_layer_bounds = None;
 | |
|                     locality.next_layer_peers = vec![];
 | |
|                 }
 | |
|                 ix => {
 | |
|                     locality.layer_ix = ix;
 | |
|                     locality.layer_bounds = (layer_start, layer_indices[next]);
 | |
|                     locality.neighbor_bounds = (
 | |
|                         ((hood_ix * fanout) + layer_start),
 | |
|                         ((hood_ix + 1) * fanout + layer_start),
 | |
|                     );
 | |
| 
 | |
|                     if next == end {
 | |
|                         locality.next_layer_bounds = None;
 | |
|                         locality.next_layer_peers = vec![];
 | |
|                     } else {
 | |
|                         locality.next_layer_bounds =
 | |
|                             Some((layer_indices[next], layer_indices[next + 1]));
 | |
|                         locality.next_layer_peers = ClusterInfo::next_layer_peers(
 | |
|                             select_index,
 | |
|                             hood_ix,
 | |
|                             layer_indices[next],
 | |
|                             fanout,
 | |
|                         );
 | |
|                     }
 | |
|                 }
 | |
|             }
 | |
|             Some(locality)
 | |
|         } else {
 | |
|             None
 | |
|         }
 | |
|     }
 | |
| 
 | |
|     /// Given a array of layer indices and an index of interest, returns (as a `Locality`) the layer,
 | |
|     /// layer-bounds, and neighborhood-bounds in which the index resides
 | |
|     fn localize(layer_indices: &[usize], fanout: usize, select_index: usize) -> Locality {
 | |
|         (0..layer_indices.len())
 | |
|             .find_map(|i| ClusterInfo::localize_item(layer_indices, fanout, select_index, i))
 | |
|             .or_else(|| Some(Locality::default()))
 | |
|             .unwrap()
 | |
|     }
 | |
| 
 | |
|     /// Selects a range in the next layer and chooses nodes from that range as peers for the given index
 | |
|     fn next_layer_peers(index: usize, hood_ix: usize, start: usize, fanout: usize) -> Vec<usize> {
 | |
|         // Each neighborhood is only tasked with pushing to `fanout` neighborhoods where each neighborhood contains `fanout` nodes.
 | |
|         let fanout_nodes = fanout * fanout;
 | |
|         // Skip first N nodes, where N is hood_ix * (fanout_nodes)
 | |
|         let start = start + (hood_ix * fanout_nodes);
 | |
|         let end = start + fanout_nodes;
 | |
|         (start..end)
 | |
|             .step_by(fanout)
 | |
|             .map(|x| x + index % fanout)
 | |
|             .collect()
 | |
|     }
 | |
| 
 | |
|     /// retransmit messages to a list of nodes
 | |
|     /// # Remarks
 | |
|     /// We need to avoid having obj locked while doing a io, such as the `send_to`
 | |
|     pub fn retransmit_to(
 | |
|         peers: &[&ContactInfo],
 | |
|         packet: &mut Packet,
 | |
|         slot_leader_pubkey: Option<Pubkey>,
 | |
|         s: &UdpSocket,
 | |
|         forwarded: bool,
 | |
|     ) -> Result<()> {
 | |
|         trace!("retransmit orders {}", peers.len());
 | |
|         let dests: Vec<_> = peers
 | |
|             .iter()
 | |
|             .filter(|v| v.id != slot_leader_pubkey.unwrap_or_default())
 | |
|             .map(|v| if forwarded { &v.tvu_forwards } else { &v.tvu })
 | |
|             .collect();
 | |
| 
 | |
|         let mut sent = 0;
 | |
|         while sent < dests.len() {
 | |
|             match multicast(s, &mut packet.data[..packet.meta.size], &dests[sent..]) {
 | |
|                 Ok(n) => sent += n,
 | |
|                 Err(e) => {
 | |
|                     inc_new_counter_error!(
 | |
|                         "cluster_info-retransmit-send_to_error",
 | |
|                         dests.len() - sent,
 | |
|                         1
 | |
|                     );
 | |
|                     error!("retransmit result {:?}", e);
 | |
|                     return Err(Error::IO(e));
 | |
|                 }
 | |
|             }
 | |
|         }
 | |
|         Ok(())
 | |
|     }
 | |
| 
 | |
|     fn insert_self(&self) {
 | |
|         let value =
 | |
|             CrdsValue::new_signed(CrdsData::ContactInfo(self.my_contact_info()), &self.keypair);
 | |
|         let _ = self.gossip.write().unwrap().crds.insert(value, timestamp());
 | |
|     }
 | |
| 
 | |
|     // If the network entrypoint hasn't been discovered yet, add it to the crds table
 | |
|     fn append_entrypoint_to_pulls(
 | |
|         &self,
 | |
|         pulls: &mut Vec<(Pubkey, CrdsFilter, SocketAddr, CrdsValue)>,
 | |
|     ) {
 | |
|         let pull_from_entrypoint = {
 | |
|             let mut w_entrypoint = self.entrypoint.write().unwrap();
 | |
|             if let Some(ref mut entrypoint) = &mut *w_entrypoint {
 | |
|                 if pulls.is_empty() {
 | |
|                     // Nobody else to pull from, try the entrypoint
 | |
|                     true
 | |
|                 } else {
 | |
|                     let now = timestamp();
 | |
|                     // Only consider pulling from the entrypoint periodically to avoid spamming it
 | |
|                     if timestamp() - entrypoint.wallclock <= CRDS_GOSSIP_PULL_CRDS_TIMEOUT_MS / 2 {
 | |
|                         false
 | |
|                     } else {
 | |
|                         entrypoint.wallclock = now;
 | |
|                         let found_entrypoint = self
 | |
|                             .time_gossip_read_lock("entrypoint", &self.stats.entrypoint)
 | |
|                             .crds
 | |
|                             .table
 | |
|                             .iter()
 | |
|                             .any(|(_, v)| {
 | |
|                                 v.value
 | |
|                                     .contact_info()
 | |
|                                     .map(|ci| ci.gossip == entrypoint.gossip)
 | |
|                                     .unwrap_or(false)
 | |
|                             });
 | |
|                         !found_entrypoint
 | |
|                     }
 | |
|                 }
 | |
|             } else {
 | |
|                 false
 | |
|             }
 | |
|         };
 | |
| 
 | |
|         if pull_from_entrypoint {
 | |
|             let id_and_gossip = {
 | |
|                 self.entrypoint
 | |
|                     .read()
 | |
|                     .unwrap()
 | |
|                     .as_ref()
 | |
|                     .map(|e| (e.id, e.gossip))
 | |
|             };
 | |
|             if let Some((id, gossip)) = id_and_gossip {
 | |
|                 let r_gossip = self.time_gossip_read_lock("entrypoint", &self.stats.entrypoint2);
 | |
|                 let self_info = r_gossip
 | |
|                     .crds
 | |
|                     .lookup(&CrdsValueLabel::ContactInfo(self.id()))
 | |
|                     .unwrap_or_else(|| panic!("self_id invalid {}", self.id()));
 | |
|                 r_gossip
 | |
|                     .pull
 | |
|                     .build_crds_filters(&r_gossip.crds, MAX_BLOOM_SIZE)
 | |
|                     .into_iter()
 | |
|                     .for_each(|filter| pulls.push((id, filter, gossip, self_info.clone())));
 | |
|             }
 | |
|         }
 | |
|     }
 | |
| 
 | |
|     /// Splits a Vec of CrdsValues into a nested Vec, trying to make sure that
 | |
|     /// each Vec is no larger than `MAX_PROTOCOL_PAYLOAD_SIZE`
 | |
|     /// Note: some messages cannot be contained within that size so in the worst case this returns
 | |
|     /// N nested Vecs with 1 item each.
 | |
|     fn split_gossip_messages(msgs: Vec<CrdsValue>) -> Vec<Vec<CrdsValue>> {
 | |
|         let mut messages = vec![];
 | |
|         let mut payload = vec![];
 | |
|         let base_size = serialized_size(&payload).expect("Couldn't check size");
 | |
|         let max_payload_size = MAX_PROTOCOL_PAYLOAD_SIZE - base_size;
 | |
|         let mut payload_size = 0;
 | |
|         for msg in msgs {
 | |
|             let msg_size = msg.size();
 | |
|             // If the message is too big to fit in this batch
 | |
|             if payload_size + msg_size > max_payload_size as u64 {
 | |
|                 // See if it can fit in the next batch
 | |
|                 if msg_size <= max_payload_size as u64 {
 | |
|                     if !payload.is_empty() {
 | |
|                         // Flush the  current payload
 | |
|                         messages.push(payload);
 | |
|                         // Init the next payload
 | |
|                         payload = vec![msg];
 | |
|                         payload_size = msg_size;
 | |
|                     }
 | |
|                 } else {
 | |
|                     debug!(
 | |
|                         "dropping message larger than the maximum payload size {:?}",
 | |
|                         msg
 | |
|                     );
 | |
|                 }
 | |
|                 continue;
 | |
|             }
 | |
|             payload_size += msg_size;
 | |
|             payload.push(msg);
 | |
|         }
 | |
|         if !payload.is_empty() {
 | |
|             messages.push(payload);
 | |
|         }
 | |
|         messages
 | |
|     }
 | |
| 
 | |
|     fn new_pull_requests(&self, stakes: &HashMap<Pubkey, u64>) -> Vec<(SocketAddr, Protocol)> {
 | |
|         let now = timestamp();
 | |
|         let mut pulls: Vec<_> = {
 | |
|             let r_gossip =
 | |
|                 self.time_gossip_read_lock("new_pull_reqs", &self.stats.new_pull_requests);
 | |
|             r_gossip
 | |
|                 .new_pull_request(now, stakes, MAX_BLOOM_SIZE)
 | |
|                 .ok()
 | |
|                 .into_iter()
 | |
|                 .filter_map(|(peer, filters, me)| {
 | |
|                     let peer_label = CrdsValueLabel::ContactInfo(peer);
 | |
|                     r_gossip
 | |
|                         .crds
 | |
|                         .lookup(&peer_label)
 | |
|                         .and_then(CrdsValue::contact_info)
 | |
|                         .map(move |peer_info| {
 | |
|                             filters
 | |
|                                 .into_iter()
 | |
|                                 .map(move |f| (peer, f, peer_info.gossip, me.clone()))
 | |
|                         })
 | |
|                 })
 | |
|                 .flatten()
 | |
|                 .collect()
 | |
|         };
 | |
|         self.append_entrypoint_to_pulls(&mut pulls);
 | |
|         self.stats
 | |
|             .new_pull_requests_count
 | |
|             .add_relaxed(pulls.len() as u64);
 | |
|         pulls
 | |
|             .into_iter()
 | |
|             .map(|(peer, filter, gossip, self_info)| {
 | |
|                 self.time_gossip_write_lock("mark_pull", &self.stats.mark_pull_request)
 | |
|                     .mark_pull_request_creation_time(&peer, now);
 | |
|                 (gossip, Protocol::PullRequest(filter, self_info))
 | |
|             })
 | |
|             .collect()
 | |
|     }
 | |
|     fn new_push_requests(&self) -> Vec<(SocketAddr, Protocol)> {
 | |
|         let self_id = self.id();
 | |
|         let (_, push_messages) = self
 | |
|             .time_gossip_write_lock("new_push_requests", &self.stats.new_push_requests)
 | |
|             .new_push_messages(timestamp());
 | |
|         let messages: Vec<_> = push_messages
 | |
|             .into_iter()
 | |
|             .filter_map(|(peer, messages)| {
 | |
|                 let peer_label = CrdsValueLabel::ContactInfo(peer);
 | |
|                 self.time_gossip_read_lock("push_req_lookup", &self.stats.new_push_requests2)
 | |
|                     .crds
 | |
|                     .lookup(&peer_label)
 | |
|                     .and_then(CrdsValue::contact_info)
 | |
|                     .map(|p| (p.gossip, messages))
 | |
|             })
 | |
|             .flat_map(|(peer, msgs)| {
 | |
|                 Self::split_gossip_messages(msgs)
 | |
|                     .into_iter()
 | |
|                     .map(move |payload| (peer, Protocol::PushMessage(self_id, payload)))
 | |
|             })
 | |
|             .collect();
 | |
|         self.stats
 | |
|             .new_push_requests_num
 | |
|             .add_relaxed(messages.len() as u64);
 | |
|         messages
 | |
|     }
 | |
| 
 | |
|     // Generate new push and pull requests
 | |
|     fn generate_new_gossip_requests(
 | |
|         &self,
 | |
|         stakes: &HashMap<Pubkey, u64>,
 | |
|         generate_pull_requests: bool,
 | |
|     ) -> Vec<(SocketAddr, Protocol)> {
 | |
|         let pulls: Vec<_> = if generate_pull_requests {
 | |
|             self.new_pull_requests(stakes)
 | |
|         } else {
 | |
|             vec![]
 | |
|         };
 | |
|         let pushes: Vec<_> = self.new_push_requests();
 | |
|         vec![pulls, pushes].into_iter().flatten().collect()
 | |
|     }
 | |
| 
 | |
|     /// At random pick a node and try to get updated changes from them
 | |
|     fn run_gossip(
 | |
|         &self,
 | |
|         recycler: &PacketsRecycler,
 | |
|         stakes: &HashMap<Pubkey, u64>,
 | |
|         sender: &PacketSender,
 | |
|         generate_pull_requests: bool,
 | |
|     ) -> Result<()> {
 | |
|         let reqs = self.generate_new_gossip_requests(&stakes, generate_pull_requests);
 | |
|         if !reqs.is_empty() {
 | |
|             let packets = to_packets_with_destination(recycler.clone(), &reqs);
 | |
|             sender.send(packets)?;
 | |
|         }
 | |
|         Ok(())
 | |
|     }
 | |
| 
 | |
|     fn handle_adopt_shred_version(self: &Arc<Self>, adopt_shred_version: &mut bool) {
 | |
|         // Adopt the entrypoint's `shred_version` if ours is unset
 | |
|         if *adopt_shred_version {
 | |
|             // If gossip was given an entrypoint, look up the ContactInfo by the given
 | |
|             // entrypoint gossip adddress
 | |
|             let gossip_addr = self.entrypoint.read().unwrap().as_ref().map(|e| e.gossip);
 | |
| 
 | |
|             if let Some(gossip_addr) = gossip_addr {
 | |
|                 // If a pull from the entrypoint was successful, it should exist in the crds table
 | |
|                 let entrypoint = self.lookup_contact_info_by_gossip_addr(&gossip_addr);
 | |
|                 if let Some(entrypoint) = entrypoint {
 | |
|                     if entrypoint.shred_version == 0 {
 | |
|                         info!("Unable to adopt entrypoint's shred version");
 | |
|                     } else {
 | |
|                         info!(
 | |
|                             "Setting shred version to {:?} from entrypoint {:?}",
 | |
|                             entrypoint.shred_version, entrypoint.id
 | |
|                         );
 | |
|                         self.my_contact_info.write().unwrap().shred_version =
 | |
|                             entrypoint.shred_version;
 | |
|                         self.gossip
 | |
|                             .write()
 | |
|                             .unwrap()
 | |
|                             .set_shred_version(entrypoint.shred_version);
 | |
|                         self.insert_self();
 | |
|                         *self.entrypoint.write().unwrap() = Some(entrypoint);
 | |
|                         *adopt_shred_version = false;
 | |
|                     }
 | |
|                 }
 | |
|             }
 | |
|         }
 | |
|     }
 | |
| 
 | |
|     fn handle_purge(
 | |
|         self: &Arc<Self>,
 | |
|         bank_forks: &Option<Arc<RwLock<BankForks>>>,
 | |
|         stakes: &HashMap<Pubkey, u64>,
 | |
|     ) {
 | |
|         let timeout = {
 | |
|             if let Some(ref bank_forks) = bank_forks {
 | |
|                 let bank = bank_forks.read().unwrap().working_bank();
 | |
|                 let epoch = bank.epoch();
 | |
|                 let epoch_schedule = bank.epoch_schedule();
 | |
|                 epoch_schedule.get_slots_in_epoch(epoch) * DEFAULT_MS_PER_SLOT
 | |
|             } else {
 | |
|                 inc_new_counter_info!("cluster_info-purge-no_working_bank", 1);
 | |
|                 CRDS_GOSSIP_PULL_CRDS_TIMEOUT_MS
 | |
|             }
 | |
|         };
 | |
|         let timeouts = self.gossip.read().unwrap().make_timeouts(stakes, timeout);
 | |
|         let num_purged = self
 | |
|             .time_gossip_write_lock("purge", &self.stats.purge)
 | |
|             .purge(timestamp(), &timeouts);
 | |
|         inc_new_counter_info!("cluster_info-purge-count", num_purged);
 | |
|     }
 | |
| 
 | |
|     /// randomly pick a node and ask them for updates asynchronously
 | |
|     pub fn gossip(
 | |
|         self: Arc<Self>,
 | |
|         bank_forks: Option<Arc<RwLock<BankForks>>>,
 | |
|         sender: PacketSender,
 | |
|         exit: &Arc<AtomicBool>,
 | |
|     ) -> JoinHandle<()> {
 | |
|         let exit = exit.clone();
 | |
|         Builder::new()
 | |
|             .name("solana-gossip".to_string())
 | |
|             .spawn(move || {
 | |
|                 let mut last_push = timestamp();
 | |
|                 let mut last_contact_info_trace = timestamp();
 | |
|                 let mut adopt_shred_version = self.my_shred_version() == 0;
 | |
|                 let recycler = PacketsRecycler::default();
 | |
| 
 | |
|                 let message = CrdsData::Version(Version::new(self.id()));
 | |
|                 self.push_message(CrdsValue::new_signed(message, &self.keypair));
 | |
|                 let mut generate_pull_requests = true;
 | |
|                 loop {
 | |
|                     let start = timestamp();
 | |
|                     thread_mem_usage::datapoint("solana-gossip");
 | |
|                     if start - last_contact_info_trace > 10000 {
 | |
|                         // Log contact info every 10 seconds
 | |
|                         info!("\n{}", self.contact_info_trace());
 | |
|                         last_contact_info_trace = start;
 | |
|                     }
 | |
| 
 | |
|                     let stakes: HashMap<_, _> = match bank_forks {
 | |
|                         Some(ref bank_forks) => {
 | |
|                             staking_utils::staked_nodes(&bank_forks.read().unwrap().working_bank())
 | |
|                         }
 | |
|                         None => HashMap::new(),
 | |
|                     };
 | |
| 
 | |
|                     let _ = self.run_gossip(&recycler, &stakes, &sender, generate_pull_requests);
 | |
|                     if exit.load(Ordering::Relaxed) {
 | |
|                         return;
 | |
|                     }
 | |
| 
 | |
|                     self.handle_purge(&bank_forks, &stakes);
 | |
| 
 | |
|                     self.handle_adopt_shred_version(&mut adopt_shred_version);
 | |
| 
 | |
|                     //TODO: possibly tune this parameter
 | |
|                     //we saw a deadlock passing an self.read().unwrap().timeout into sleep
 | |
|                     if start - last_push > CRDS_GOSSIP_PULL_CRDS_TIMEOUT_MS / 2 {
 | |
|                         self.push_self(&stakes);
 | |
|                         last_push = timestamp();
 | |
|                     }
 | |
|                     let elapsed = timestamp() - start;
 | |
|                     if GOSSIP_SLEEP_MILLIS > elapsed {
 | |
|                         let time_left = GOSSIP_SLEEP_MILLIS - elapsed;
 | |
|                         sleep(Duration::from_millis(time_left));
 | |
|                     }
 | |
|                     generate_pull_requests = !generate_pull_requests;
 | |
|                 }
 | |
|             })
 | |
|             .unwrap()
 | |
|     }
 | |
| 
 | |
|     #[allow(clippy::cognitive_complexity)]
 | |
|     fn handle_packets(
 | |
|         &self,
 | |
|         recycler: &PacketsRecycler,
 | |
|         stakes: &HashMap<Pubkey, u64>,
 | |
|         packets: Packets,
 | |
|         response_sender: &PacketSender,
 | |
|         epoch_time_ms: u64,
 | |
|     ) {
 | |
|         // iter over the packets, collect pulls separately and process everything else
 | |
|         let allocated = thread_mem_usage::Allocatedp::default();
 | |
|         let mut gossip_pull_data: Vec<PullData> = vec![];
 | |
|         let timeouts = self
 | |
|             .gossip
 | |
|             .read()
 | |
|             .unwrap()
 | |
|             .make_timeouts(&stakes, epoch_time_ms);
 | |
|         let mut pull_responses = HashMap::new();
 | |
|         packets.packets.iter().for_each(|packet| {
 | |
|             let from_addr = packet.meta.addr();
 | |
|             limited_deserialize(&packet.data[..packet.meta.size])
 | |
|                 .into_iter()
 | |
|                 .filter(|r: &Protocol| r.sanitize().is_ok())
 | |
|                 .for_each(|request| match request {
 | |
|                     Protocol::PullRequest(filter, caller) => {
 | |
|                         let start = allocated.get();
 | |
|                         if !caller.verify() {
 | |
|                             inc_new_counter_info!(
 | |
|                                 "cluster_info-gossip_pull_request_verify_fail",
 | |
|                                 1
 | |
|                             );
 | |
|                         } else if let Some(contact_info) = caller.contact_info() {
 | |
|                             if contact_info.id == self.id() {
 | |
|                                 warn!("PullRequest ignored, I'm talking to myself");
 | |
|                                 inc_new_counter_debug!("cluster_info-window-request-loopback", 1);
 | |
|                             } else if contact_info.shred_version == 0
 | |
|                                 || contact_info.shred_version == self.my_shred_version()
 | |
|                                 || self.my_shred_version() == 0
 | |
|                             {
 | |
|                                 gossip_pull_data.push(PullData {
 | |
|                                     from_addr,
 | |
|                                     caller,
 | |
|                                     filter,
 | |
|                                 });
 | |
|                             } else {
 | |
|                                 self.stats.skip_pull_shred_version.add_relaxed(1);
 | |
|                             }
 | |
|                         }
 | |
|                         datapoint_debug!(
 | |
|                             "solana-gossip-listen-memory",
 | |
|                             ("pull_request", (allocated.get() - start) as i64, i64),
 | |
|                         );
 | |
|                     }
 | |
|                     Protocol::PullResponse(from, mut data) => {
 | |
|                         let start = allocated.get();
 | |
|                         data.retain(|v| {
 | |
|                             let ret = v.verify();
 | |
|                             if !ret {
 | |
|                                 inc_new_counter_info!(
 | |
|                                     "cluster_info-gossip_pull_response_verify_fail",
 | |
|                                     1
 | |
|                                 );
 | |
|                             }
 | |
|                             ret
 | |
|                         });
 | |
|                         let pull_entry = pull_responses.entry(from).or_insert_with(Vec::new);
 | |
|                         pull_entry.extend(data);
 | |
|                         datapoint_debug!(
 | |
|                             "solana-gossip-listen-memory",
 | |
|                             ("pull_response", (allocated.get() - start) as i64, i64),
 | |
|                         );
 | |
|                     }
 | |
|                     Protocol::PushMessage(from, mut data) => {
 | |
|                         let start = allocated.get();
 | |
|                         data.retain(|v| {
 | |
|                             let ret = v.verify();
 | |
|                             if !ret {
 | |
|                                 inc_new_counter_info!(
 | |
|                                     "cluster_info-gossip_push_msg_verify_fail",
 | |
|                                     1
 | |
|                                 );
 | |
|                             }
 | |
|                             ret
 | |
|                         });
 | |
|                         let rsp = self.handle_push_message(recycler, &from, data, stakes);
 | |
|                         if let Some(rsp) = rsp {
 | |
|                             let _ignore_disconnect = response_sender.send(rsp);
 | |
|                         }
 | |
|                         datapoint_debug!(
 | |
|                             "solana-gossip-listen-memory",
 | |
|                             ("push_message", (allocated.get() - start) as i64, i64),
 | |
|                         );
 | |
|                     }
 | |
|                     Protocol::PruneMessage(from, data) => {
 | |
|                         let start = allocated.get();
 | |
|                         if data.verify() {
 | |
|                             self.stats.prune_message_count.add_relaxed(1);
 | |
|                             self.stats
 | |
|                                 .prune_message_len
 | |
|                                 .add_relaxed(data.prunes.len() as u64);
 | |
|                             match self
 | |
|                                 .time_gossip_write_lock("process_prune", &self.stats.process_prune)
 | |
|                                 .process_prune_msg(
 | |
|                                     &from,
 | |
|                                     &data.destination,
 | |
|                                     &data.prunes,
 | |
|                                     data.wallclock,
 | |
|                                     timestamp(),
 | |
|                                 ) {
 | |
|                                 Err(CrdsGossipError::PruneMessageTimeout) => {
 | |
|                                     inc_new_counter_debug!("cluster_info-prune_message_timeout", 1)
 | |
|                                 }
 | |
|                                 Err(CrdsGossipError::BadPruneDestination) => {
 | |
|                                     inc_new_counter_debug!("cluster_info-bad_prune_destination", 1)
 | |
|                                 }
 | |
|                                 _ => (),
 | |
|                             }
 | |
|                         } else {
 | |
|                             inc_new_counter_debug!("cluster_info-gossip_prune_msg_verify_fail", 1);
 | |
|                         }
 | |
|                         datapoint_debug!(
 | |
|                             "solana-gossip-listen-memory",
 | |
|                             ("prune_message", (allocated.get() - start) as i64, i64),
 | |
|                         );
 | |
|                     }
 | |
|                 })
 | |
|         });
 | |
| 
 | |
|         for (from, data) in pull_responses {
 | |
|             self.handle_pull_response(&from, data, &timeouts);
 | |
|         }
 | |
| 
 | |
|         // process the collected pulls together
 | |
|         if !gossip_pull_data.is_empty() {
 | |
|             self.stats
 | |
|                 .pull_requests_count
 | |
|                 .add_relaxed(gossip_pull_data.len() as u64);
 | |
|             let rsp = self.handle_pull_requests(recycler, gossip_pull_data, stakes);
 | |
|             if let Some(rsp) = rsp {
 | |
|                 let _ignore_disconnect = response_sender.send(rsp);
 | |
|             }
 | |
|         }
 | |
|     }
 | |
| 
 | |
|     fn update_data_budget(&self, stakes: &HashMap<Pubkey, u64>) {
 | |
|         let mut w_outbound_budget = self.outbound_budget.write().unwrap();
 | |
| 
 | |
|         let now = timestamp();
 | |
|         const INTERVAL_MS: u64 = 100;
 | |
|         // allow 50kBps per staked validator, epoch slots + votes ~= 1.5kB/slot ~= 4kB/s
 | |
|         const BYTES_PER_INTERVAL: usize = 5000;
 | |
|         const MAX_BUDGET_MULTIPLE: usize = 5; // allow budget build-up to 5x the interval default
 | |
| 
 | |
|         if now - w_outbound_budget.last_timestamp_ms > INTERVAL_MS {
 | |
|             let len = std::cmp::max(stakes.len(), 2);
 | |
|             w_outbound_budget.bytes += len * BYTES_PER_INTERVAL;
 | |
|             w_outbound_budget.bytes = std::cmp::min(
 | |
|                 w_outbound_budget.bytes,
 | |
|                 MAX_BUDGET_MULTIPLE * len * BYTES_PER_INTERVAL,
 | |
|             );
 | |
|             w_outbound_budget.last_timestamp_ms = now;
 | |
|         }
 | |
|     }
 | |
| 
 | |
|     // Pull requests take an incoming bloom filter of contained entries from a node
 | |
|     // and tries to send back to them the values it detects are missing.
 | |
|     fn handle_pull_requests(
 | |
|         &self,
 | |
|         recycler: &PacketsRecycler,
 | |
|         requests: Vec<PullData>,
 | |
|         stakes: &HashMap<Pubkey, u64>,
 | |
|     ) -> Option<Packets> {
 | |
|         // split the requests into addrs and filters
 | |
|         let mut caller_and_filters = vec![];
 | |
|         let mut addrs = vec![];
 | |
|         let mut time = Measure::start("handle_pull_requests");
 | |
|         self.update_data_budget(stakes);
 | |
|         for pull_data in requests {
 | |
|             caller_and_filters.push((pull_data.caller, pull_data.filter));
 | |
|             addrs.push(pull_data.from_addr);
 | |
|         }
 | |
|         let now = timestamp();
 | |
|         let self_id = self.id();
 | |
| 
 | |
|         let pull_responses = self
 | |
|             .time_gossip_read_lock(
 | |
|                 "generate_pull_responses",
 | |
|                 &self.stats.generate_pull_responses,
 | |
|             )
 | |
|             .generate_pull_responses(&caller_and_filters, now);
 | |
| 
 | |
|         self.time_gossip_write_lock("process_pull_reqs", &self.stats.process_pull_requests)
 | |
|             .process_pull_requests(caller_and_filters, now);
 | |
| 
 | |
|         // Filter bad to addresses
 | |
|         let pull_responses: Vec<_> = pull_responses
 | |
|             .into_iter()
 | |
|             .zip(addrs.into_iter())
 | |
|             .filter_map(|(responses, from_addr)| {
 | |
|                 if !from_addr.ip().is_unspecified()
 | |
|                     && from_addr.port() != 0
 | |
|                     && !responses.is_empty()
 | |
|                 {
 | |
|                     Some((responses, from_addr))
 | |
|                 } else {
 | |
|                     None
 | |
|                 }
 | |
|             })
 | |
|             .collect();
 | |
| 
 | |
|         if pull_responses.is_empty() {
 | |
|             return None;
 | |
|         }
 | |
| 
 | |
|         let mut stats: Vec<_> = pull_responses
 | |
|             .iter()
 | |
|             .enumerate()
 | |
|             .map(|(i, (responses, _from_addr))| {
 | |
|                 let score: u64 = if stakes.get(&responses[0].pubkey()).is_some() {
 | |
|                     2
 | |
|                 } else {
 | |
|                     1
 | |
|                 };
 | |
|                 responses
 | |
|                     .iter()
 | |
|                     .enumerate()
 | |
|                     .map(|(j, _response)| ResponseScore {
 | |
|                         to: i,
 | |
|                         responses_index: j,
 | |
|                         score,
 | |
|                     })
 | |
|                     .collect::<Vec<ResponseScore>>()
 | |
|             })
 | |
|             .flatten()
 | |
|             .collect();
 | |
| 
 | |
|         stats.sort_by(|a, b| a.score.cmp(&b.score));
 | |
|         let weights: Vec<_> = stats.iter().map(|stat| stat.score).collect();
 | |
| 
 | |
|         let seed = [48u8; 32];
 | |
|         let rng = &mut ChaChaRng::from_seed(seed);
 | |
|         let weighted_index = WeightedIndex::new(weights).unwrap();
 | |
| 
 | |
|         let mut packets = Packets::new_with_recycler(recycler.clone(), 64, "handle_pull_requests");
 | |
|         let mut total_bytes = 0;
 | |
|         let mut sent = HashSet::new();
 | |
|         while sent.len() < stats.len() {
 | |
|             let index = weighted_index.sample(rng);
 | |
|             if sent.contains(&index) {
 | |
|                 continue;
 | |
|             }
 | |
|             let stat = &stats[index];
 | |
|             let from_addr = pull_responses[stat.to].1;
 | |
|             let response = pull_responses[stat.to].0[stat.responses_index].clone();
 | |
|             let protocol = Protocol::PullResponse(self_id, vec![response]);
 | |
|             let new_packet = Packet::from_data(&from_addr, protocol);
 | |
|             {
 | |
|                 let mut w_outbound_budget = self.outbound_budget.write().unwrap();
 | |
|                 if w_outbound_budget.bytes > new_packet.meta.size {
 | |
|                     sent.insert(index);
 | |
|                     w_outbound_budget.bytes -= new_packet.meta.size;
 | |
|                     total_bytes += new_packet.meta.size;
 | |
|                     packets.packets.push(new_packet)
 | |
|                 } else {
 | |
|                     inc_new_counter_info!("gossip_pull_request-no_budget", 1);
 | |
|                     break;
 | |
|                 }
 | |
|             }
 | |
|         }
 | |
|         time.stop();
 | |
|         inc_new_counter_info!("gossip_pull_request-sent_requests", sent.len());
 | |
|         inc_new_counter_info!(
 | |
|             "gossip_pull_request-dropped_requests",
 | |
|             stats.len() - sent.len()
 | |
|         );
 | |
|         debug!(
 | |
|             "handle_pull_requests: {} sent: {} total: {} total_bytes: {}",
 | |
|             time,
 | |
|             sent.len(),
 | |
|             stats.len(),
 | |
|             total_bytes
 | |
|         );
 | |
|         if packets.is_empty() {
 | |
|             return None;
 | |
|         }
 | |
|         Some(packets)
 | |
|     }
 | |
| 
 | |
|     // Returns (failed, timeout, success)
 | |
|     fn handle_pull_response(
 | |
|         &self,
 | |
|         from: &Pubkey,
 | |
|         mut crds_values: Vec<CrdsValue>,
 | |
|         timeouts: &HashMap<Pubkey, u64>,
 | |
|     ) -> (usize, usize, usize) {
 | |
|         let len = crds_values.len();
 | |
|         trace!("PullResponse me: {} from: {} len={}", self.id, from, len);
 | |
|         let shred_version = self
 | |
|             .lookup_contact_info(from, |ci| ci.shred_version)
 | |
|             .unwrap_or(0);
 | |
|         Self::filter_by_shred_version(
 | |
|             from,
 | |
|             &mut crds_values,
 | |
|             shred_version,
 | |
|             self.my_shred_version(),
 | |
|         );
 | |
|         let filtered_len = crds_values.len();
 | |
| 
 | |
|         let mut pull_stats = ProcessPullStats::default();
 | |
|         let (filtered_pulls, filtered_pulls_expired_timeout) = self
 | |
|             .time_gossip_read_lock("filter_pull_resp", &self.stats.filter_pull_response)
 | |
|             .filter_pull_responses(timeouts, crds_values, timestamp(), &mut pull_stats);
 | |
| 
 | |
|         if !filtered_pulls.is_empty() || !filtered_pulls_expired_timeout.is_empty() {
 | |
|             self.time_gossip_write_lock("process_pull_resp", &self.stats.process_pull_response)
 | |
|                 .process_pull_responses(
 | |
|                     from,
 | |
|                     filtered_pulls,
 | |
|                     filtered_pulls_expired_timeout,
 | |
|                     timestamp(),
 | |
|                     &mut pull_stats,
 | |
|                 );
 | |
|         }
 | |
| 
 | |
|         self.stats
 | |
|             .skip_pull_response_shred_version
 | |
|             .add_relaxed((len - filtered_len) as u64);
 | |
|         self.stats.process_pull_response_count.add_relaxed(1);
 | |
|         self.stats
 | |
|             .process_pull_response_len
 | |
|             .add_relaxed(filtered_len as u64);
 | |
|         self.stats
 | |
|             .process_pull_response_timeout
 | |
|             .add_relaxed(pull_stats.timeout_count as u64);
 | |
|         self.stats
 | |
|             .process_pull_response_fail_insert
 | |
|             .add_relaxed(pull_stats.failed_insert as u64);
 | |
|         self.stats
 | |
|             .process_pull_response_fail_timeout
 | |
|             .add_relaxed(pull_stats.failed_timeout as u64);
 | |
|         self.stats
 | |
|             .process_pull_response_success
 | |
|             .add_relaxed(pull_stats.success as u64);
 | |
| 
 | |
|         (
 | |
|             pull_stats.failed_insert + pull_stats.failed_timeout,
 | |
|             pull_stats.timeout_count,
 | |
|             pull_stats.success,
 | |
|         )
 | |
|     }
 | |
| 
 | |
|     fn filter_by_shred_version(
 | |
|         from: &Pubkey,
 | |
|         crds_values: &mut Vec<CrdsValue>,
 | |
|         shred_version: u16,
 | |
|         my_shred_version: u16,
 | |
|     ) {
 | |
|         // Always run filter on spies
 | |
|         if my_shred_version != 0 && shred_version != my_shred_version {
 | |
|             // Allow someone to update their own ContactInfo so they
 | |
|             // can change shred versions if needed.
 | |
|             crds_values.retain(|crds_value| match &crds_value.data {
 | |
|                 CrdsData::ContactInfo(contact_info) => contact_info.id == *from,
 | |
|                 _ => false,
 | |
|             });
 | |
|         }
 | |
|     }
 | |
| 
 | |
|     fn handle_push_message(
 | |
|         &self,
 | |
|         recycler: &PacketsRecycler,
 | |
|         from: &Pubkey,
 | |
|         mut crds_values: Vec<CrdsValue>,
 | |
|         stakes: &HashMap<Pubkey, u64>,
 | |
|     ) -> Option<Packets> {
 | |
|         let self_id = self.id();
 | |
|         self.stats.push_message_count.add_relaxed(1);
 | |
|         let len = crds_values.len();
 | |
| 
 | |
|         let shred_version = self
 | |
|             .lookup_contact_info(from, |ci| ci.shred_version)
 | |
|             .unwrap_or(0);
 | |
|         Self::filter_by_shred_version(
 | |
|             from,
 | |
|             &mut crds_values,
 | |
|             shred_version,
 | |
|             self.my_shred_version(),
 | |
|         );
 | |
|         let filtered_len = crds_values.len();
 | |
|         self.stats
 | |
|             .push_message_value_count
 | |
|             .add_relaxed(filtered_len as u64);
 | |
|         self.stats
 | |
|             .skip_push_message_shred_version
 | |
|             .add_relaxed((len - filtered_len) as u64);
 | |
| 
 | |
|         let updated: Vec<_> = self
 | |
|             .time_gossip_write_lock("process_push", &self.stats.process_push_message)
 | |
|             .process_push_message(from, crds_values, timestamp());
 | |
| 
 | |
|         let updated_labels: Vec<_> = updated.into_iter().map(|u| u.value.label()).collect();
 | |
|         let prunes_map: HashMap<Pubkey, HashSet<Pubkey>> = self
 | |
|             .time_gossip_write_lock("prune_received_cache", &self.stats.prune_received_cache)
 | |
|             .prune_received_cache(updated_labels, stakes);
 | |
| 
 | |
|         let rsp: Vec<_> = prunes_map
 | |
|             .into_iter()
 | |
|             .filter_map(|(from, prune_set)| {
 | |
|                 inc_new_counter_debug!("cluster_info-push_message-prunes", prune_set.len());
 | |
|                 self.lookup_contact_info(&from, |ci| ci.clone()).map(|ci| {
 | |
|                     let mut prune_msg = PruneData {
 | |
|                         pubkey: self_id,
 | |
|                         prunes: prune_set.into_iter().collect(),
 | |
|                         signature: Signature::default(),
 | |
|                         destination: from,
 | |
|                         wallclock: timestamp(),
 | |
|                     };
 | |
|                     prune_msg.sign(&self.keypair);
 | |
|                     let rsp = Protocol::PruneMessage(self_id, prune_msg);
 | |
|                     (ci.gossip, rsp)
 | |
|                 })
 | |
|             })
 | |
|             .collect();
 | |
|         if rsp.is_empty() {
 | |
|             return None;
 | |
|         }
 | |
|         let mut packets = to_packets_with_destination(recycler.clone(), &rsp);
 | |
|         self.stats
 | |
|             .push_response_count
 | |
|             .add_relaxed(packets.packets.len() as u64);
 | |
|         if !packets.is_empty() {
 | |
|             let pushes: Vec<_> = self.new_push_requests();
 | |
|             inc_new_counter_debug!("cluster_info-push_message-pushes", pushes.len());
 | |
|             pushes.into_iter().for_each(|(remote_gossip_addr, req)| {
 | |
|                 if !remote_gossip_addr.ip().is_unspecified() && remote_gossip_addr.port() != 0 {
 | |
|                     let p = Packet::from_data(&remote_gossip_addr, &req);
 | |
|                     packets.packets.push(p);
 | |
|                 } else {
 | |
|                     trace!("Dropping Gossip push response, as destination is unknown");
 | |
|                 }
 | |
|             });
 | |
|             Some(packets)
 | |
|         } else {
 | |
|             None
 | |
|         }
 | |
|     }
 | |
| 
 | |
|     fn get_stakes_and_epoch_time(
 | |
|         bank_forks: Option<&Arc<RwLock<BankForks>>>,
 | |
|     ) -> (HashMap<Pubkey, u64>, u64) {
 | |
|         let epoch_time_ms;
 | |
|         let stakes: HashMap<_, _> = match bank_forks {
 | |
|             Some(ref bank_forks) => {
 | |
|                 let bank = bank_forks.read().unwrap().working_bank();
 | |
|                 let epoch = bank.epoch();
 | |
|                 let epoch_schedule = bank.epoch_schedule();
 | |
|                 epoch_time_ms = epoch_schedule.get_slots_in_epoch(epoch) * DEFAULT_MS_PER_SLOT;
 | |
|                 staking_utils::staked_nodes(&bank)
 | |
|             }
 | |
|             None => {
 | |
|                 inc_new_counter_info!("cluster_info-purge-no_working_bank", 1);
 | |
|                 epoch_time_ms = CRDS_GOSSIP_PULL_CRDS_TIMEOUT_MS;
 | |
|                 HashMap::new()
 | |
|             }
 | |
|         };
 | |
| 
 | |
|         (stakes, epoch_time_ms)
 | |
|     }
 | |
| 
 | |
|     fn process_packets(
 | |
|         &self,
 | |
|         requests: Vec<Packets>,
 | |
|         thread_pool: &ThreadPool,
 | |
|         recycler: &PacketsRecycler,
 | |
|         response_sender: &PacketSender,
 | |
|         stakes: HashMap<Pubkey, u64>,
 | |
|         epoch_time_ms: u64,
 | |
|     ) {
 | |
|         let sender = response_sender.clone();
 | |
|         thread_pool.install(|| {
 | |
|             requests.into_par_iter().for_each_with(sender, |s, reqs| {
 | |
|                 self.handle_packets(&recycler, &stakes, reqs, s, epoch_time_ms)
 | |
|             });
 | |
|         });
 | |
|     }
 | |
| 
 | |
|     /// Process messages from the network
 | |
|     fn run_listen(
 | |
|         &self,
 | |
|         recycler: &PacketsRecycler,
 | |
|         bank_forks: Option<&Arc<RwLock<BankForks>>>,
 | |
|         requests_receiver: &PacketReceiver,
 | |
|         response_sender: &PacketSender,
 | |
|         thread_pool: &ThreadPool,
 | |
|         last_print: &mut Instant,
 | |
|     ) -> Result<()> {
 | |
|         let timeout = Duration::new(1, 0);
 | |
|         let mut requests = vec![requests_receiver.recv_timeout(timeout)?];
 | |
|         let mut num_requests = requests.last().unwrap().packets.len();
 | |
|         while let Ok(more_reqs) = requests_receiver.try_recv() {
 | |
|             if num_requests >= MAX_GOSSIP_TRAFFIC {
 | |
|                 continue;
 | |
|             }
 | |
|             num_requests += more_reqs.packets.len();
 | |
|             requests.push(more_reqs)
 | |
|         }
 | |
| 
 | |
|         if num_requests >= MAX_GOSSIP_TRAFFIC {
 | |
|             warn!(
 | |
|                 "Too much gossip traffic, ignoring some messages (requests={}, max requests={})",
 | |
|                 num_requests, MAX_GOSSIP_TRAFFIC
 | |
|             );
 | |
|         }
 | |
| 
 | |
|         let (stakes, epoch_time_ms) = Self::get_stakes_and_epoch_time(bank_forks);
 | |
| 
 | |
|         self.process_packets(
 | |
|             requests,
 | |
|             thread_pool,
 | |
|             recycler,
 | |
|             response_sender,
 | |
|             stakes,
 | |
|             epoch_time_ms,
 | |
|         );
 | |
| 
 | |
|         self.print_reset_stats(last_print);
 | |
| 
 | |
|         Ok(())
 | |
|     }
 | |
| 
 | |
|     fn print_reset_stats(&self, last_print: &mut Instant) {
 | |
|         if last_print.elapsed().as_millis() > 2000 {
 | |
|             let (table_size, purged_values_size) = {
 | |
|                 let r_gossip = self.gossip.read().unwrap();
 | |
|                 (r_gossip.crds.table.len(), r_gossip.pull.purged_values.len())
 | |
|             };
 | |
|             datapoint_info!(
 | |
|                 "cluster_info_stats",
 | |
|                 ("entrypoint", self.stats.entrypoint.clear(), i64),
 | |
|                 ("entrypoint2", self.stats.entrypoint2.clear(), i64),
 | |
|                 ("push_vote_read", self.stats.push_vote_read.clear(), i64),
 | |
|                 (
 | |
|                     "vote_process_push",
 | |
|                     self.stats.vote_process_push.clear(),
 | |
|                     i64
 | |
|                 ),
 | |
|                 ("get_votes", self.stats.get_votes.clear(), i64),
 | |
|                 (
 | |
|                     "get_accounts_hash",
 | |
|                     self.stats.get_accounts_hash.clear(),
 | |
|                     i64
 | |
|                 ),
 | |
|                 ("all_tvu_peers", self.stats.all_tvu_peers.clear(), i64),
 | |
|                 ("tvu_peers", self.stats.tvu_peers.clear(), i64),
 | |
|                 (
 | |
|                     "new_push_requests_num",
 | |
|                     self.stats.new_push_requests_num.clear(),
 | |
|                     i64
 | |
|                 ),
 | |
|                 ("table_size", table_size as i64, i64),
 | |
|                 ("purged_values_size", purged_values_size as i64, i64),
 | |
|             );
 | |
|             datapoint_info!(
 | |
|                 "cluster_info_stats2",
 | |
|                 ("retransmit_peers", self.stats.retransmit_peers.clear(), i64),
 | |
|                 ("repair_peers", self.stats.repair_peers.clear(), i64),
 | |
|                 (
 | |
|                     "new_push_requests",
 | |
|                     self.stats.new_push_requests.clear(),
 | |
|                     i64
 | |
|                 ),
 | |
|                 (
 | |
|                     "new_push_requests2",
 | |
|                     self.stats.new_push_requests2.clear(),
 | |
|                     i64
 | |
|                 ),
 | |
|                 ("purge", self.stats.purge.clear(), i64),
 | |
|                 (
 | |
|                     "process_pull_resp",
 | |
|                     self.stats.process_pull_response.clear(),
 | |
|                     i64
 | |
|                 ),
 | |
|                 (
 | |
|                     "filter_pull_resp",
 | |
|                     self.stats.filter_pull_response.clear(),
 | |
|                     i64
 | |
|                 ),
 | |
|                 (
 | |
|                     "process_pull_resp_count",
 | |
|                     self.stats.process_pull_response_count.clear(),
 | |
|                     i64
 | |
|                 ),
 | |
|                 (
 | |
|                     "pull_response_fail_insert",
 | |
|                     self.stats.process_pull_response_fail_insert.clear(),
 | |
|                     i64
 | |
|                 ),
 | |
|                 (
 | |
|                     "pull_response_fail_timeout",
 | |
|                     self.stats.process_pull_response_fail_timeout.clear(),
 | |
|                     i64
 | |
|                 ),
 | |
|                 (
 | |
|                     "pull_response_success",
 | |
|                     self.stats.process_pull_response_success.clear(),
 | |
|                     i64
 | |
|                 ),
 | |
|                 (
 | |
|                     "process_pull_resp_timeout",
 | |
|                     self.stats.process_pull_response_timeout.clear(),
 | |
|                     i64
 | |
|                 ),
 | |
|                 (
 | |
|                     "push_response_count",
 | |
|                     self.stats.push_response_count.clear(),
 | |
|                     i64
 | |
|                 ),
 | |
|             );
 | |
|             datapoint_info!(
 | |
|                 "cluster_info_stats3",
 | |
|                 (
 | |
|                     "process_pull_resp_len",
 | |
|                     self.stats.process_pull_response_len.clear(),
 | |
|                     i64
 | |
|                 ),
 | |
|                 (
 | |
|                     "process_pull_requests",
 | |
|                     self.stats.process_pull_requests.clear(),
 | |
|                     i64
 | |
|                 ),
 | |
|                 (
 | |
|                     "generate_pull_responses",
 | |
|                     self.stats.generate_pull_responses.clear(),
 | |
|                     i64
 | |
|                 ),
 | |
|                 ("process_prune", self.stats.process_prune.clear(), i64),
 | |
|                 (
 | |
|                     "process_push_message",
 | |
|                     self.stats.process_push_message.clear(),
 | |
|                     i64
 | |
|                 ),
 | |
|                 (
 | |
|                     "prune_received_cache",
 | |
|                     self.stats.prune_received_cache.clear(),
 | |
|                     i64
 | |
|                 ),
 | |
|                 (
 | |
|                     "epoch_slots_lookup",
 | |
|                     self.stats.epoch_slots_lookup.clear(),
 | |
|                     i64
 | |
|                 ),
 | |
|                 ("epoch_slots_push", self.stats.epoch_slots_push.clear(), i64),
 | |
|                 ("push_message", self.stats.push_message.clear(), i64),
 | |
|                 (
 | |
|                     "new_pull_requests",
 | |
|                     self.stats.new_pull_requests.clear(),
 | |
|                     i64
 | |
|                 ),
 | |
|                 (
 | |
|                     "mark_pull_request",
 | |
|                     self.stats.mark_pull_request.clear(),
 | |
|                     i64
 | |
|                 ),
 | |
|             );
 | |
|             datapoint_info!(
 | |
|                 "cluster_info_stats4",
 | |
|                 (
 | |
|                     "skip_push_message_shred_version",
 | |
|                     self.stats.skip_push_message_shred_version.clear(),
 | |
|                     i64
 | |
|                 ),
 | |
|                 (
 | |
|                     "skip_pull_response_shred_version",
 | |
|                     self.stats.skip_pull_response_shred_version.clear(),
 | |
|                     i64
 | |
|                 ),
 | |
|                 (
 | |
|                     "skip_pull_shred_version",
 | |
|                     self.stats.skip_pull_shred_version.clear(),
 | |
|                     i64
 | |
|                 ),
 | |
|                 (
 | |
|                     "push_message_count",
 | |
|                     self.stats.push_message_count.clear(),
 | |
|                     i64
 | |
|                 ),
 | |
|                 (
 | |
|                     "push_message_value_count",
 | |
|                     self.stats.push_message_value_count.clear(),
 | |
|                     i64
 | |
|                 ),
 | |
|                 (
 | |
|                     "new_pull_requests_count",
 | |
|                     self.stats.new_pull_requests_count.clear(),
 | |
|                     i64
 | |
|                 ),
 | |
|                 (
 | |
|                     "prune_message_count",
 | |
|                     self.stats.prune_message_count.clear(),
 | |
|                     i64
 | |
|                 ),
 | |
|                 (
 | |
|                     "prune_message_len",
 | |
|                     self.stats.prune_message_len.clear(),
 | |
|                     i64
 | |
|                 ),
 | |
|             );
 | |
|             datapoint_info!(
 | |
|                 "cluster_info_stats5",
 | |
|                 (
 | |
|                     "pull_requests_count",
 | |
|                     self.stats.pull_requests_count.clear(),
 | |
|                     i64
 | |
|                 ),
 | |
|             );
 | |
| 
 | |
|             *last_print = Instant::now();
 | |
|         }
 | |
|     }
 | |
| 
 | |
|     pub fn listen(
 | |
|         self: Arc<Self>,
 | |
|         bank_forks: Option<Arc<RwLock<BankForks>>>,
 | |
|         requests_receiver: PacketReceiver,
 | |
|         response_sender: PacketSender,
 | |
|         exit: &Arc<AtomicBool>,
 | |
|     ) -> JoinHandle<()> {
 | |
|         let exit = exit.clone();
 | |
|         let recycler = PacketsRecycler::default();
 | |
|         Builder::new()
 | |
|             .name("solana-listen".to_string())
 | |
|             .spawn(move || {
 | |
|                 let thread_pool = rayon::ThreadPoolBuilder::new()
 | |
|                     .num_threads(std::cmp::min(get_thread_count(), 8))
 | |
|                     .thread_name(|i| format!("sol-gossip-work-{}", i))
 | |
|                     .build()
 | |
|                     .unwrap();
 | |
|                 let mut last_print = Instant::now();
 | |
|                 loop {
 | |
|                     let e = self.run_listen(
 | |
|                         &recycler,
 | |
|                         bank_forks.as_ref(),
 | |
|                         &requests_receiver,
 | |
|                         &response_sender,
 | |
|                         &thread_pool,
 | |
|                         &mut last_print,
 | |
|                     );
 | |
|                     if exit.load(Ordering::Relaxed) {
 | |
|                         return;
 | |
|                     }
 | |
|                     if e.is_err() {
 | |
|                         let r_gossip = self.gossip.read().unwrap();
 | |
|                         debug!(
 | |
|                             "{}: run_listen timeout, table size: {}",
 | |
|                             self.id(),
 | |
|                             r_gossip.crds.table.len()
 | |
|                         );
 | |
|                     }
 | |
|                     thread_mem_usage::datapoint("solana-listen");
 | |
|                 }
 | |
|             })
 | |
|             .unwrap()
 | |
|     }
 | |
| 
 | |
|     pub fn gossip_contact_info(id: &Pubkey, gossip: SocketAddr, shred_version: u16) -> ContactInfo {
 | |
|         ContactInfo {
 | |
|             id: *id,
 | |
|             gossip,
 | |
|             wallclock: timestamp(),
 | |
|             shred_version,
 | |
|             ..ContactInfo::default()
 | |
|         }
 | |
|     }
 | |
| 
 | |
|     /// An alternative to Spy Node that has a valid gossip address and fully participate in Gossip.
 | |
|     pub fn gossip_node(
 | |
|         id: &Pubkey,
 | |
|         gossip_addr: &SocketAddr,
 | |
|         shred_version: u16,
 | |
|     ) -> (ContactInfo, UdpSocket, Option<TcpListener>) {
 | |
|         let bind_ip_addr = IpAddr::V4(Ipv4Addr::new(0, 0, 0, 0));
 | |
|         let (port, (gossip_socket, ip_echo)) =
 | |
|             Node::get_gossip_port(gossip_addr, VALIDATOR_PORT_RANGE, bind_ip_addr);
 | |
|         let contact_info =
 | |
|             Self::gossip_contact_info(id, SocketAddr::new(gossip_addr.ip(), port), shred_version);
 | |
| 
 | |
|         (contact_info, gossip_socket, Some(ip_echo))
 | |
|     }
 | |
| 
 | |
|     /// A Node with dummy ports to spy on gossip via pull requests
 | |
|     pub fn spy_node(
 | |
|         id: &Pubkey,
 | |
|         shred_version: u16,
 | |
|     ) -> (ContactInfo, UdpSocket, Option<TcpListener>) {
 | |
|         let bind_ip_addr = IpAddr::V4(Ipv4Addr::new(0, 0, 0, 0));
 | |
|         let (_, gossip_socket) = bind_in_range(bind_ip_addr, VALIDATOR_PORT_RANGE).unwrap();
 | |
|         let contact_info = Self::gossip_contact_info(id, socketaddr_any!(), shred_version);
 | |
| 
 | |
|         (contact_info, gossip_socket, None)
 | |
|     }
 | |
| }
 | |
| 
 | |
| /// Turbine logic
 | |
| /// 1 - For the current node find out if it is in layer 1
 | |
| /// 1.1 - If yes, then broadcast to all layer 1 nodes
 | |
| ///      1 - using the layer 1 index, broadcast to all layer 2 nodes assuming you know neighborhood size
 | |
| /// 1.2 - If no, then figure out what layer the node is in and who the neighbors are and only broadcast to them
 | |
| ///      1 - also check if there are nodes in the next layer and repeat the layer 1 to layer 2 logic
 | |
| 
 | |
| /// Returns Neighbor Nodes and Children Nodes `(neighbors, children)` for a given node based on its stake
 | |
| pub fn compute_retransmit_peers(
 | |
|     fanout: usize,
 | |
|     my_index: usize,
 | |
|     stakes_and_index: Vec<usize>,
 | |
| ) -> (Vec<usize>, Vec<usize>) {
 | |
|     //calc num_layers and num_neighborhoods using the total number of nodes
 | |
|     let (num_layers, layer_indices) =
 | |
|         ClusterInfo::describe_data_plane(stakes_and_index.len(), fanout);
 | |
| 
 | |
|     if num_layers <= 1 {
 | |
|         /* single layer data plane */
 | |
|         (stakes_and_index, vec![])
 | |
|     } else {
 | |
|         //find my layer
 | |
|         let locality = ClusterInfo::localize(&layer_indices, fanout, my_index);
 | |
|         let upper_bound = cmp::min(locality.neighbor_bounds.1, stakes_and_index.len());
 | |
|         let neighbors = stakes_and_index[locality.neighbor_bounds.0..upper_bound].to_vec();
 | |
|         let mut children = Vec::new();
 | |
|         for ix in locality.next_layer_peers {
 | |
|             if let Some(peer) = stakes_and_index.get(ix) {
 | |
|                 children.push(*peer);
 | |
|                 continue;
 | |
|             }
 | |
|             break;
 | |
|         }
 | |
|         (neighbors, children)
 | |
|     }
 | |
| }
 | |
| 
 | |
/// The network sockets held by a [`Node`], one field per service.
///
/// The `Vec` fields hold several sockets for the same service:
/// `Node::new_with_external_ip` fills them from `multi_bind_in_range`, while
/// `Node::new_localhost_with_pubkey` stores a single socket in each.
#[derive(Debug)]
pub struct Sockets {
    pub gossip: UdpSocket,
    // TCP listener obtained together with the gossip socket; both `Node`
    // constructors in this file always store `Some`.
    pub ip_echo: Option<TcpListener>,
    pub tvu: Vec<UdpSocket>,
    pub tvu_forwards: Vec<UdpSocket>,
    pub tpu: Vec<UdpSocket>,
    pub tpu_forwards: Vec<UdpSocket>,
    pub broadcast: Vec<UdpSocket>,
    pub repair: UdpSocket,
    pub retransmit_sockets: Vec<UdpSocket>,
    pub serve_repair: UdpSocket,
}
 | |
| 
 | |
/// A node's advertised `ContactInfo` paired with the sockets bound for it.
#[derive(Debug)]
pub struct Node {
    // Addresses advertised for this node.
    pub info: ContactInfo,
    // Sockets bound when the node was constructed.
    pub sockets: Sockets,
}
 | |
| 
 | |
| impl Node {
 | |
|     pub fn new_localhost() -> Self {
 | |
|         let pubkey = Pubkey::new_rand();
 | |
|         Self::new_localhost_with_pubkey(&pubkey)
 | |
|     }
 | |
|     pub fn new_localhost_with_pubkey(pubkey: &Pubkey) -> Self {
 | |
|         let bind_ip_addr = IpAddr::V4(Ipv4Addr::new(0, 0, 0, 0));
 | |
|         let tpu = UdpSocket::bind("127.0.0.1:0").unwrap();
 | |
|         let (gossip_port, (gossip, ip_echo)) =
 | |
|             bind_common_in_range(bind_ip_addr, (1024, 65535)).unwrap();
 | |
|         let gossip_addr = SocketAddr::new(IpAddr::V4(Ipv4Addr::new(127, 0, 0, 1)), gossip_port);
 | |
|         let tvu = UdpSocket::bind("127.0.0.1:0").unwrap();
 | |
|         let tvu_forwards = UdpSocket::bind("127.0.0.1:0").unwrap();
 | |
|         let tpu_forwards = UdpSocket::bind("127.0.0.1:0").unwrap();
 | |
|         let repair = UdpSocket::bind("127.0.0.1:0").unwrap();
 | |
|         let rpc_port = find_available_port_in_range(bind_ip_addr, (1024, 65535)).unwrap();
 | |
|         let rpc_addr = SocketAddr::new(IpAddr::V4(Ipv4Addr::new(127, 0, 0, 1)), rpc_port);
 | |
|         let rpc_pubsub_port = find_available_port_in_range(bind_ip_addr, (1024, 65535)).unwrap();
 | |
|         let rpc_pubsub_addr =
 | |
|             SocketAddr::new(IpAddr::V4(Ipv4Addr::new(127, 0, 0, 1)), rpc_pubsub_port);
 | |
|         let rpc_banks_port = find_available_port_in_range(bind_ip_addr, (1024, 65535)).unwrap();
 | |
|         let rpc_banks_addr =
 | |
|             SocketAddr::new(IpAddr::V4(Ipv4Addr::new(127, 0, 0, 1)), rpc_banks_port);
 | |
| 
 | |
|         let broadcast = vec![UdpSocket::bind("0.0.0.0:0").unwrap()];
 | |
|         let retransmit_socket = UdpSocket::bind("0.0.0.0:0").unwrap();
 | |
|         let serve_repair = UdpSocket::bind("127.0.0.1:0").unwrap();
 | |
|         let info = ContactInfo {
 | |
|             id: *pubkey,
 | |
|             gossip: gossip_addr,
 | |
|             tvu: tvu.local_addr().unwrap(),
 | |
|             tvu_forwards: tvu_forwards.local_addr().unwrap(),
 | |
|             repair: repair.local_addr().unwrap(),
 | |
|             tpu: tpu.local_addr().unwrap(),
 | |
|             tpu_forwards: tpu_forwards.local_addr().unwrap(),
 | |
|             rpc_banks: rpc_banks_addr,
 | |
|             rpc: rpc_addr,
 | |
|             rpc_pubsub: rpc_pubsub_addr,
 | |
|             serve_repair: serve_repair.local_addr().unwrap(),
 | |
|             wallclock: timestamp(),
 | |
|             shred_version: 0,
 | |
|         };
 | |
|         Node {
 | |
|             info,
 | |
|             sockets: Sockets {
 | |
|                 gossip,
 | |
|                 ip_echo: Some(ip_echo),
 | |
|                 tvu: vec![tvu],
 | |
|                 tvu_forwards: vec![tvu_forwards],
 | |
|                 tpu: vec![tpu],
 | |
|                 tpu_forwards: vec![tpu_forwards],
 | |
|                 broadcast,
 | |
|                 repair,
 | |
|                 retransmit_sockets: vec![retransmit_socket],
 | |
|                 serve_repair,
 | |
|             },
 | |
|         }
 | |
|     }
 | |
|     fn get_gossip_port(
 | |
|         gossip_addr: &SocketAddr,
 | |
|         port_range: PortRange,
 | |
|         bind_ip_addr: IpAddr,
 | |
|     ) -> (u16, (UdpSocket, TcpListener)) {
 | |
|         if gossip_addr.port() != 0 {
 | |
|             (
 | |
|                 gossip_addr.port(),
 | |
|                 bind_common(bind_ip_addr, gossip_addr.port(), false).unwrap_or_else(|e| {
 | |
|                     panic!("gossip_addr bind_to port {}: {}", gossip_addr.port(), e)
 | |
|                 }),
 | |
|             )
 | |
|         } else {
 | |
|             bind_common_in_range(bind_ip_addr, port_range).expect("Failed to bind")
 | |
|         }
 | |
|     }
 | |
|     fn bind(bind_ip_addr: IpAddr, port_range: PortRange) -> (u16, UdpSocket) {
 | |
|         bind_in_range(bind_ip_addr, port_range).expect("Failed to bind")
 | |
|     }
 | |
| 
 | |
|     pub fn new_with_external_ip(
 | |
|         pubkey: &Pubkey,
 | |
|         gossip_addr: &SocketAddr,
 | |
|         port_range: PortRange,
 | |
|         bind_ip_addr: IpAddr,
 | |
|     ) -> Node {
 | |
|         let (gossip_port, (gossip, ip_echo)) =
 | |
|             Self::get_gossip_port(gossip_addr, port_range, bind_ip_addr);
 | |
| 
 | |
|         let (tvu_port, tvu_sockets) =
 | |
|             multi_bind_in_range(bind_ip_addr, port_range, 8).expect("tvu multi_bind");
 | |
| 
 | |
|         let (tvu_forwards_port, tvu_forwards_sockets) =
 | |
|             multi_bind_in_range(bind_ip_addr, port_range, 8).expect("tvu_forwards multi_bind");
 | |
| 
 | |
|         let (tpu_port, tpu_sockets) =
 | |
|             multi_bind_in_range(bind_ip_addr, port_range, 32).expect("tpu multi_bind");
 | |
| 
 | |
|         let (tpu_forwards_port, tpu_forwards_sockets) =
 | |
|             multi_bind_in_range(bind_ip_addr, port_range, 8).expect("tpu_forwards multi_bind");
 | |
| 
 | |
|         let (_, retransmit_sockets) =
 | |
|             multi_bind_in_range(bind_ip_addr, port_range, 8).expect("retransmit multi_bind");
 | |
| 
 | |
|         let (repair_port, repair) = Self::bind(bind_ip_addr, port_range);
 | |
|         let (serve_repair_port, serve_repair) = Self::bind(bind_ip_addr, port_range);
 | |
| 
 | |
|         let (_, broadcast) =
 | |
|             multi_bind_in_range(bind_ip_addr, port_range, 4).expect("broadcast multi_bind");
 | |
| 
 | |
|         let info = ContactInfo {
 | |
|             id: *pubkey,
 | |
|             gossip: SocketAddr::new(gossip_addr.ip(), gossip_port),
 | |
|             tvu: SocketAddr::new(gossip_addr.ip(), tvu_port),
 | |
|             tvu_forwards: SocketAddr::new(gossip_addr.ip(), tvu_forwards_port),
 | |
|             repair: SocketAddr::new(gossip_addr.ip(), repair_port),
 | |
|             tpu: SocketAddr::new(gossip_addr.ip(), tpu_port),
 | |
|             tpu_forwards: SocketAddr::new(gossip_addr.ip(), tpu_forwards_port),
 | |
|             rpc_banks: socketaddr_any!(),
 | |
|             rpc: socketaddr_any!(),
 | |
|             rpc_pubsub: socketaddr_any!(),
 | |
|             serve_repair: SocketAddr::new(gossip_addr.ip(), serve_repair_port),
 | |
|             wallclock: 0,
 | |
|             shred_version: 0,
 | |
|         };
 | |
|         trace!("new ContactInfo: {:?}", info);
 | |
| 
 | |
|         Node {
 | |
|             info,
 | |
|             sockets: Sockets {
 | |
|                 gossip,
 | |
|                 tvu: tvu_sockets,
 | |
|                 tvu_forwards: tvu_forwards_sockets,
 | |
|                 tpu: tpu_sockets,
 | |
|                 tpu_forwards: tpu_forwards_sockets,
 | |
|                 broadcast,
 | |
|                 repair,
 | |
|                 retransmit_sockets,
 | |
|                 serve_repair,
 | |
|                 ip_echo: Some(ip_echo),
 | |
|             },
 | |
|         }
 | |
|     }
 | |
| }
 | |
| 
 | |
| pub fn stake_weight_peers<S: std::hash::BuildHasher>(
 | |
|     peers: &mut Vec<ContactInfo>,
 | |
|     stakes: Option<Arc<HashMap<Pubkey, u64, S>>>,
 | |
| ) -> Vec<(u64, usize)> {
 | |
|     peers.dedup();
 | |
|     ClusterInfo::sorted_stakes_with_index(peers, stakes)
 | |
| }
 | |
| 
 | |
| #[cfg(test)]
 | |
| mod tests {
 | |
|     use super::*;
 | |
|     use crate::crds_value::{CrdsValue, CrdsValueLabel, Vote as CrdsVote};
 | |
|     use rayon::prelude::*;
 | |
|     use solana_perf::test_tx::test_tx;
 | |
|     use solana_sdk::signature::{Keypair, Signer};
 | |
|     use solana_vote_program::{vote_instruction, vote_state::Vote};
 | |
|     use std::collections::HashSet;
 | |
|     use std::net::{IpAddr, Ipv4Addr};
 | |
|     use std::sync::Arc;
 | |
| 
 | |
|     #[test]
 | |
|     fn test_gossip_node() {
 | |
|         //check that a gossip nodes always show up as spies
 | |
|         let (node, _, _) = ClusterInfo::spy_node(&Pubkey::new_rand(), 0);
 | |
|         assert!(ClusterInfo::is_spy_node(&node));
 | |
|         let (node, _, _) =
 | |
|             ClusterInfo::gossip_node(&Pubkey::new_rand(), &"1.1.1.1:1111".parse().unwrap(), 0);
 | |
|         assert!(ClusterInfo::is_spy_node(&node));
 | |
|     }
 | |
| 
 | |
|     #[test]
 | |
|     fn test_handle_pull() {
 | |
|         solana_logger::setup();
 | |
|         let node = Node::new_localhost();
 | |
|         let cluster_info = Arc::new(ClusterInfo::new_with_invalid_keypair(node.info));
 | |
| 
 | |
|         let entrypoint_pubkey = Pubkey::new_rand();
 | |
|         let data = test_crds_values(entrypoint_pubkey);
 | |
|         let timeouts = HashMap::new();
 | |
|         assert_eq!(
 | |
|             (0, 0, 1),
 | |
|             ClusterInfo::handle_pull_response(
 | |
|                 &cluster_info,
 | |
|                 &entrypoint_pubkey,
 | |
|                 data.clone(),
 | |
|                 &timeouts
 | |
|             )
 | |
|         );
 | |
| 
 | |
|         let entrypoint_pubkey2 = Pubkey::new_rand();
 | |
|         assert_eq!(
 | |
|             (1, 0, 0),
 | |
|             ClusterInfo::handle_pull_response(&cluster_info, &entrypoint_pubkey2, data, &timeouts)
 | |
|         );
 | |
|     }
 | |
| 
 | |
|     fn test_crds_values(pubkey: Pubkey) -> Vec<CrdsValue> {
 | |
|         let entrypoint = ContactInfo::new_localhost(&pubkey, timestamp());
 | |
|         let entrypoint_crdsvalue = CrdsValue::new_unsigned(CrdsData::ContactInfo(entrypoint));
 | |
|         vec![entrypoint_crdsvalue]
 | |
|     }
 | |
| 
 | |
|     #[test]
 | |
|     fn test_filter_shred_version() {
 | |
|         let from = Pubkey::new_rand();
 | |
|         let my_shred_version = 1;
 | |
|         let other_shred_version = 1;
 | |
| 
 | |
|         // Allow same shred_version
 | |
|         let mut values = test_crds_values(from);
 | |
|         ClusterInfo::filter_by_shred_version(
 | |
|             &from,
 | |
|             &mut values,
 | |
|             other_shred_version,
 | |
|             my_shred_version,
 | |
|         );
 | |
|         assert_eq!(values.len(), 1);
 | |
| 
 | |
|         // Allow shred_version=0.
 | |
|         let other_shred_version = 0;
 | |
|         ClusterInfo::filter_by_shred_version(
 | |
|             &from,
 | |
|             &mut values,
 | |
|             other_shred_version,
 | |
|             my_shred_version,
 | |
|         );
 | |
|         assert_eq!(values.len(), 1);
 | |
| 
 | |
|         // Change to sender's ContactInfo version, allow that.
 | |
|         let other_shred_version = 2;
 | |
|         ClusterInfo::filter_by_shred_version(
 | |
|             &from,
 | |
|             &mut values,
 | |
|             other_shred_version,
 | |
|             my_shred_version,
 | |
|         );
 | |
|         assert_eq!(values.len(), 1);
 | |
| 
 | |
|         let snapshot_hash_data = CrdsValue::new_unsigned(CrdsData::SnapshotHashes(SnapshotHash {
 | |
|             from: Pubkey::new_rand(),
 | |
|             hashes: vec![],
 | |
|             wallclock: 0,
 | |
|         }));
 | |
|         values.push(snapshot_hash_data);
 | |
|         // Change to sender's ContactInfo version, allow that.
 | |
|         let other_shred_version = 2;
 | |
|         ClusterInfo::filter_by_shred_version(
 | |
|             &from,
 | |
|             &mut values,
 | |
|             other_shred_version,
 | |
|             my_shred_version,
 | |
|         );
 | |
|         assert_eq!(values.len(), 1);
 | |
|     }
 | |
| 
 | |
|     #[test]
 | |
|     fn test_cluster_spy_gossip() {
 | |
|         //check that gossip doesn't try to push to invalid addresses
 | |
|         let node = Node::new_localhost();
 | |
|         let (spy, _, _) = ClusterInfo::spy_node(&Pubkey::new_rand(), 0);
 | |
|         let cluster_info = Arc::new(ClusterInfo::new_with_invalid_keypair(node.info));
 | |
|         cluster_info.insert_info(spy);
 | |
|         cluster_info
 | |
|             .gossip
 | |
|             .write()
 | |
|             .unwrap()
 | |
|             .refresh_push_active_set(&HashMap::new());
 | |
|         let reqs = cluster_info.generate_new_gossip_requests(&HashMap::new(), true);
 | |
|         //assert none of the addrs are invalid.
 | |
|         reqs.iter().all(|(addr, _)| {
 | |
|             let res = ContactInfo::is_valid_address(addr);
 | |
|             assert!(res);
 | |
|             res
 | |
|         });
 | |
|     }
 | |
| 
 | |
|     #[test]
 | |
|     fn test_cluster_info_new() {
 | |
|         let d = ContactInfo::new_localhost(&Pubkey::new_rand(), timestamp());
 | |
|         let cluster_info = ClusterInfo::new_with_invalid_keypair(d.clone());
 | |
|         assert_eq!(d.id, cluster_info.id());
 | |
|     }
 | |
| 
 | |
|     #[test]
 | |
|     fn insert_info_test() {
 | |
|         let d = ContactInfo::new_localhost(&Pubkey::new_rand(), timestamp());
 | |
|         let cluster_info = ClusterInfo::new_with_invalid_keypair(d);
 | |
|         let d = ContactInfo::new_localhost(&Pubkey::new_rand(), timestamp());
 | |
|         let label = CrdsValueLabel::ContactInfo(d.id);
 | |
|         cluster_info.insert_info(d);
 | |
|         assert!(cluster_info
 | |
|             .gossip
 | |
|             .read()
 | |
|             .unwrap()
 | |
|             .crds
 | |
|             .lookup(&label)
 | |
|             .is_some());
 | |
|     }
 | |
|     #[test]
 | |
|     #[should_panic]
 | |
|     fn test_update_contact_info() {
 | |
|         let d = ContactInfo::new_localhost(&Pubkey::new_rand(), timestamp());
 | |
|         let cluster_info = ClusterInfo::new_with_invalid_keypair(d);
 | |
|         let entry_label = CrdsValueLabel::ContactInfo(cluster_info.id());
 | |
|         assert!(cluster_info
 | |
|             .gossip
 | |
|             .read()
 | |
|             .unwrap()
 | |
|             .crds
 | |
|             .lookup(&entry_label)
 | |
|             .is_some());
 | |
| 
 | |
|         let now = timestamp();
 | |
|         cluster_info.update_contact_info(|ci| ci.wallclock = now);
 | |
|         assert_eq!(
 | |
|             cluster_info
 | |
|                 .gossip
 | |
|                 .read()
 | |
|                 .unwrap()
 | |
|                 .crds
 | |
|                 .lookup(&entry_label)
 | |
|                 .unwrap()
 | |
|                 .contact_info()
 | |
|                 .unwrap()
 | |
|                 .wallclock,
 | |
|             now
 | |
|         );
 | |
| 
 | |
|         // Inserting Contactinfo with different pubkey should panic,
 | |
|         // and update should fail
 | |
|         cluster_info.update_contact_info(|ci| ci.id = Pubkey::new_rand())
 | |
|     }
 | |
| 
 | |
|     fn assert_in_range(x: u16, range: (u16, u16)) {
 | |
|         assert!(x >= range.0);
 | |
|         assert!(x < range.1);
 | |
|     }
 | |
| 
 | |
|     fn check_sockets(sockets: &[UdpSocket], ip: IpAddr, range: (u16, u16)) {
 | |
|         assert!(sockets.len() > 1);
 | |
|         let port = sockets[0].local_addr().unwrap().port();
 | |
|         for socket in sockets.iter() {
 | |
|             check_socket(socket, ip, range);
 | |
|             assert_eq!(socket.local_addr().unwrap().port(), port);
 | |
|         }
 | |
|     }
 | |
| 
 | |
|     fn check_socket(socket: &UdpSocket, ip: IpAddr, range: (u16, u16)) {
 | |
|         let local_addr = socket.local_addr().unwrap();
 | |
|         assert_eq!(local_addr.ip(), ip);
 | |
|         assert_in_range(local_addr.port(), range);
 | |
|     }
 | |
| 
 | |
|     fn check_node_sockets(node: &Node, ip: IpAddr, range: (u16, u16)) {
 | |
|         check_socket(&node.sockets.gossip, ip, range);
 | |
|         check_socket(&node.sockets.repair, ip, range);
 | |
| 
 | |
|         check_sockets(&node.sockets.tvu, ip, range);
 | |
|         check_sockets(&node.sockets.tpu, ip, range);
 | |
|     }
 | |
| 
 | |
|     #[test]
 | |
|     fn new_with_external_ip_test_random() {
 | |
|         let ip = Ipv4Addr::from(0);
 | |
|         let node = Node::new_with_external_ip(
 | |
|             &Pubkey::new_rand(),
 | |
|             &socketaddr!(ip, 0),
 | |
|             VALIDATOR_PORT_RANGE,
 | |
|             IpAddr::V4(ip),
 | |
|         );
 | |
| 
 | |
|         check_node_sockets(&node, IpAddr::V4(ip), VALIDATOR_PORT_RANGE);
 | |
|     }
 | |
| 
 | |
|     #[test]
 | |
|     fn new_with_external_ip_test_gossip() {
 | |
|         // Can't use VALIDATOR_PORT_RANGE because if this test runs in parallel with others, the
 | |
|         // port returned by `bind_in_range()` might be snatched up before `Node::new_with_external_ip()` runs
 | |
|         let port_range = (VALIDATOR_PORT_RANGE.1 + 10, VALIDATOR_PORT_RANGE.1 + 20);
 | |
| 
 | |
|         let ip = IpAddr::V4(Ipv4Addr::from(0));
 | |
|         let port = bind_in_range(ip, port_range).expect("Failed to bind").0;
 | |
|         let node =
 | |
|             Node::new_with_external_ip(&Pubkey::new_rand(), &socketaddr!(0, port), port_range, ip);
 | |
| 
 | |
|         check_node_sockets(&node, ip, port_range);
 | |
| 
 | |
|         assert_eq!(node.sockets.gossip.local_addr().unwrap().port(), port);
 | |
|     }
 | |
| 
 | |
|     //test that all cluster_info objects only generate signed messages
 | |
|     //when constructed with keypairs
 | |
|     #[test]
 | |
|     fn test_gossip_signature_verification() {
 | |
|         //create new cluster info, leader, and peer
 | |
|         let keypair = Keypair::new();
 | |
|         let peer_keypair = Keypair::new();
 | |
|         let contact_info = ContactInfo::new_localhost(&keypair.pubkey(), 0);
 | |
|         let peer = ContactInfo::new_localhost(&peer_keypair.pubkey(), 0);
 | |
|         let cluster_info = ClusterInfo::new(contact_info, Arc::new(keypair));
 | |
|         cluster_info.insert_info(peer);
 | |
|         cluster_info
 | |
|             .gossip
 | |
|             .write()
 | |
|             .unwrap()
 | |
|             .refresh_push_active_set(&HashMap::new());
 | |
|         //check that all types of gossip messages are signed correctly
 | |
|         let (_, push_messages) = cluster_info
 | |
|             .gossip
 | |
|             .write()
 | |
|             .unwrap()
 | |
|             .new_push_messages(timestamp());
 | |
|         // there should be some pushes ready
 | |
|         assert_eq!(push_messages.is_empty(), false);
 | |
|         push_messages
 | |
|             .values()
 | |
|             .for_each(|v| v.par_iter().for_each(|v| assert!(v.verify())));
 | |
| 
 | |
|         let (_, _, val) = cluster_info
 | |
|             .gossip
 | |
|             .write()
 | |
|             .unwrap()
 | |
|             .new_pull_request(timestamp(), &HashMap::new(), MAX_BLOOM_SIZE)
 | |
|             .ok()
 | |
|             .unwrap();
 | |
|         assert!(val.verify());
 | |
|     }
 | |
| 
 | |
|     fn num_layers(nodes: usize, fanout: usize) -> usize {
 | |
|         ClusterInfo::describe_data_plane(nodes, fanout).0
 | |
|     }
 | |
| 
 | |
/// Checks the layer count and the layer boundaries produced by
/// `ClusterInfo::describe_data_plane` for a range of network sizes and fanouts.
#[test]
fn test_describe_data_plane() {
    // (nodes, fanout, expected number of layers)
    let layer_count_cases = [
        // no nodes
        (0, 200, 0),
        // 1 node
        (1, 200, 1),
        // 10 nodes with fanout of 2
        (10, 2, 3),
        // fanout + 1 nodes with fanout of 2
        (3, 2, 2),
        // A little more realistic
        (100, 10, 2),
        // A little more realistic with odd numbers
        (103, 13, 2),
        // A little more realistic with just enough for 3 layers
        (111, 10, 3),
    ];
    for &(nodes, fanout, expected_layers) in layer_count_cases.iter() {
        assert_eq!(
            num_layers(nodes, fanout),
            expected_layers,
            "nodes = {}, fanout = {}",
            nodes,
            fanout
        );
    }

    // larger
    let (layer_cnt, layer_indices) = ClusterInfo::describe_data_plane(10_000, 10);
    assert_eq!(layer_cnt, 4);
    assert_eq!(layer_indices[1], 10);
    // distances between index values should increase by `fanout` for every layer.
    // `windows(2)` only ever yields slices of exactly two elements, so no length
    // check is needed before indexing the pair.
    let mut capacity = 10 * 10;
    for pair in layer_indices[1..].windows(2) {
        assert_eq!(pair[1] - pair[0], capacity);
        capacity *= 10;
    }

    // massive
    let (layer_cnt, layer_indices) = ClusterInfo::describe_data_plane(500_000, 200);
    assert_eq!(layer_cnt, 3);
    assert_eq!(layer_indices[1], 200);
    // distances between index values should increase by `fanout` for every layer.
    let mut capacity = 200 * 200;
    for pair in layer_indices[1..].windows(2) {
        assert_eq!(pair[1] - pair[0], capacity);
        capacity *= 200;
    }
    // the final boundary must be large enough to hold every requested node
    let total_capacity: usize = *layer_indices.last().unwrap();
    assert!(total_capacity >= 500_000);
}
 | |
| 
 | |
/// Exercises `ClusterInfo::localize` against a 500_000-node, fanout-200 data
/// plane: checks the reported layer for several indices and the bounds of the
/// following layer (or `None` when there is no following layer).
#[test]
fn test_localize() {
    // go for gold
    let (_, layer_indices) = ClusterInfo::describe_data_plane(500_000, 200);

    // index 0 must land in layer 0, with the next layer bounded by entries 1 and 2
    let root = ClusterInfo::localize(&layer_indices, 200, 0);
    assert_eq!(root.layer_ix, 0);
    assert_eq!(
        root.next_layer_bounds,
        Some((layer_indices[1], layer_indices[2]))
    );

    // both of these indices must land in layer 1
    for &(me, layer_ix) in [(201, 1usize), (20_000, 1usize)].iter() {
        let locality = ClusterInfo::localize(&layer_indices, 200, me);
        assert_eq!(
            locality.layer_ix, layer_ix,
            "layer_indices[layer_ix] is actually {}",
            layer_indices[layer_ix]
        );
        assert_eq!(
            locality.next_layer_bounds,
            Some((layer_indices[layer_ix + 1], layer_indices[layer_ix + 2]))
        );
    }

    // test no child layer since last layer should have massive capacity
    let (_, layer_indices) = ClusterInfo::describe_data_plane(500_000, 200);
    let last_layer = ClusterInfo::localize(&layer_indices, 200, 40_201);
    assert_eq!(
        last_layer.layer_ix, 2,
        "layer_indices[layer_ix] is actually {}",
        layer_indices[2]
    );
    assert_eq!(last_layer.next_layer_bounds, None);
}
 | |
| 
 | |
/// For sampled pairs of adjacent indices, checks that both have next-layer
/// peers and that their peer lists differ at every shared position.
#[test]
fn test_localize_child_peer_overlap() {
    let (_, layer_indices) = ClusterInfo::describe_data_plane(500_000, 200);
    let last_ix = layer_indices.len() - 1;
    // only indices below the boundary two entries before the last are sampled
    let upper_bound = *layer_indices.get(last_ix - 2).unwrap();
    // sample every 33 pairs to reduce test time
    for me in (0..upper_bound).step_by(33) {
        let mine = ClusterInfo::localize(&layer_indices, 200, me);
        let buddy = ClusterInfo::localize(&layer_indices, 200, me + 1);
        assert!(!mine.next_layer_peers.is_empty());
        assert!(!buddy.next_layer_peers.is_empty());
        let paired_peers = mine
            .next_layer_peers
            .iter()
            .zip(buddy.next_layer_peers.iter());
        for (my_peer, buddy_peer) in paired_peers {
            assert_ne!(my_peer, buddy_peer);
        }
    }
}
 | |
| 
 | |
/// Pretends to be each node in a scaled down network and makes sure the union
/// of every node's neighbors and next-layer peers includes every node.
#[test]
fn test_network_coverage() {
    let (_, layer_indices) = ClusterInfo::describe_data_plane(25_000, 10);
    let mut broadcast_set = HashSet::new();
    for my_index in 0..25_000 {
        let locality = ClusterInfo::localize(&layer_indices, 10, my_index);
        let (neighbors_start, neighbors_end) = locality.neighbor_bounds;
        broadcast_set.extend(neighbors_start..neighbors_end);
        broadcast_set.extend(locality.next_layer_peers);
    }

    // every real node index must have been reached
    for node in 0..25_000usize {
        assert!(broadcast_set.contains(&node));
    }
    let total_capacity = *layer_indices.last().unwrap();
    assert!(broadcast_set.contains(&(total_capacity - 1)));
    //sanity check for past total capacity.
    assert!(!broadcast_set.contains(&total_capacity));
}
 | |
| 
 | |
/// Pushes a single vote and checks that `get_votes` returns it, labels it with
/// the local pubkey, and filters it out once queried from the returned
/// timestamp.
#[test]
fn test_push_vote() {
    let keys = Keypair::new();
    let cluster_info =
        ClusterInfo::new_with_invalid_keypair(ContactInfo::new_localhost(&keys.pubkey(), 0));

    // make sure empty crds is handled correctly
    let now = timestamp();
    let (_, initial_votes, initial_max_ts) = cluster_info.get_votes(now);
    assert!(initial_votes.is_empty());
    assert_eq!(initial_max_ts, now);

    // add a vote
    let tx = test_tx();
    cluster_info.push_vote(1, tx.clone());

    // -1 to make sure that the clock is strictly lower than when insert occurred
    let (labels, votes, max_ts) = cluster_info.get_votes(now - 1);
    assert_eq!(votes, vec![tx]);
    assert_eq!(labels.len(), 1);
    if let CrdsValueLabel::Vote(_, pubkey) = labels[0] {
        assert_eq!(pubkey, keys.pubkey());
    } else {
        panic!("Bad match");
    }
    assert!(max_ts >= now - 1);

    // make sure timestamp filter works
    let (_, filtered_votes, new_max_ts) = cluster_info.get_votes(max_ts);
    assert!(filtered_votes.is_empty());
    assert_eq!(max_ts, new_max_ts);
}
 | |
| 
 | |
/// Checks `get_epoch_slots_since` before and after a single
/// `push_epoch_slots` call, including the `since` cursor it returns.
#[test]
fn test_push_epoch_slots() {
    let keys = Keypair::new();
    let cluster_info =
        ClusterInfo::new_with_invalid_keypair(ContactInfo::new_localhost(&keys.pubkey(), 0));

    // nothing has been pushed yet
    let (slots, since) = cluster_info.get_epoch_slots_since(None);
    assert!(slots.is_empty());
    assert_eq!(since, None);

    cluster_info.push_epoch_slots(&[0]);

    // a cursor at the maximum value returns nothing and is handed back unchanged
    let max_cursor = Some(std::u64::MAX);
    let (slots, since) = cluster_info.get_epoch_slots_since(max_cursor);
    assert!(slots.is_empty());
    assert_eq!(since, max_cursor);

    // without a cursor the pushed entry is returned along with a new cursor
    let (slots, since) = cluster_info.get_epoch_slots_since(None);
    assert_eq!(slots.len(), 1);
    assert!(since.is_some());

    // querying from that cursor returns nothing new and keeps the cursor
    let (slots, next_since) = cluster_info.get_epoch_slots_since(since);
    assert!(slots.is_empty());
    assert_eq!(next_since, since);
}
 | |
| 
 | |
/// With only an entrypoint configured, checks that the single generated pull
/// request targets the entrypoint's gossip address, and that the same holds
/// after the entrypoint's contact info arrives via a pull response.
#[test]
fn test_append_entrypoint_to_pulls() {
    let node_keypair = Arc::new(Keypair::new());
    let my_info = ContactInfo::new_localhost(&node_keypair.pubkey(), timestamp());
    let cluster_info = ClusterInfo::new(my_info, node_keypair);

    let entrypoint_pubkey = Pubkey::new_rand();
    let entrypoint = ContactInfo::new_localhost(&entrypoint_pubkey, timestamp());
    cluster_info.set_entrypoint(entrypoint.clone());

    let pulls = cluster_info.new_pull_requests(&HashMap::new());
    assert_eq!(pulls.len(), 1);
    let (addr, msg) = pulls
        .get(0)
        .expect("entrypoint should be a pull destination");
    assert_eq!(*addr, entrypoint.gossip);
    if let Protocol::PullRequest(_, value) = msg {
        // the request must carry a verifiable value from this node
        assert!(value.verify());
        assert_eq!(value.pubkey(), cluster_info.id());
    } else {
        panic!("wrong protocol");
    }

    // now add this message back to the table via a pull response; the
    // assertions below require one pull request and the entrypoint still set
    let entrypoint_crdsvalue =
        CrdsValue::new_unsigned(CrdsData::ContactInfo(entrypoint.clone()));
    let cluster_info = Arc::new(cluster_info);
    let timeouts = cluster_info.gossip.read().unwrap().make_timeouts_test();
    ClusterInfo::handle_pull_response(
        &cluster_info,
        &entrypoint_pubkey,
        vec![entrypoint_crdsvalue],
        &timeouts,
    );
    let pulls = cluster_info.new_pull_requests(&HashMap::new());
    assert_eq!(pulls.len(), 1);
    assert_eq!(*cluster_info.entrypoint.read().unwrap(), Some(entrypoint));
}
 | |
| 
 | |
/// Runs the shared `test_split_messages` check with a default `ContactInfo` value.
#[test]
fn test_split_messages_small() {
    let contact_info = CrdsData::ContactInfo(ContactInfo::default());
    test_split_messages(CrdsValue::new_unsigned(contact_info));
}
 | |
| 
 | |
/// Runs the shared `test_split_messages` check with a `LowestSlot` value.
#[test]
fn test_split_messages_large() {
    let lowest_slot = LowestSlot::new(Pubkey::default(), 0, 0);
    let lowest_slot_data = CrdsData::LowestSlot(0, lowest_slot);
    test_split_messages(CrdsValue::new_unsigned(lowest_slot_data));
}
 | |
| 
 | |
/// Test that if a value is smaller than payload size but too large to be
/// wrapped in a vec that it is still dropped.
#[test]
fn test_split_messages_packet_size() {
    // serialized size of an empty vec of values
    let empty_payload: Vec<CrdsValue> = vec![];
    let vec_size = serialized_size(&empty_payload).unwrap();
    let desired_size = MAX_PROTOCOL_PAYLOAD_SIZE - vec_size;

    let mut value = CrdsValue::new_unsigned(CrdsData::SnapshotHashes(SnapshotHash {
        from: Pubkey::default(),
        hashes: vec![],
        wallclock: 0,
    }));

    // grow the hash list one entry at a time until the value no longer fits
    // within `desired_size`
    for num_hashes in 0.. {
        if value.size() > desired_size {
            break;
        }
        value.data = CrdsData::SnapshotHashes(SnapshotHash {
            from: Pubkey::default(),
            hashes: vec![(0, Hash::default()); num_hashes],
            wallclock: 0,
        });
    }

    let split = ClusterInfo::split_gossip_messages(vec![value]);
    assert_eq!(split.len(), 0);
}
 | |
| 
 | |
|     fn test_split_messages(value: CrdsValue) {
 | |
|         const NUM_VALUES: u64 = 30;
 | |
|         let value_size = value.size();
 | |
|         let num_values_per_payload = (MAX_PROTOCOL_PAYLOAD_SIZE / value_size).max(1);
 | |
| 
 | |
|         // Expected len is the ceiling of the division
 | |
|         let expected_len = (NUM_VALUES + num_values_per_payload - 1) / num_values_per_payload;
 | |
|         let msgs = vec![value; NUM_VALUES as usize];
 | |
| 
 | |
|         let split = ClusterInfo::split_gossip_messages(msgs);
 | |
|         assert!(split.len() as u64 <= expected_len);
 | |
|     }
 | |
| 
 | |
/// Sanity test to ensure filter size never exceeds MTU size.
#[test]
fn test_crds_filter_size() {
    // argument pairs handed to `CrdsFilter::new_rand`
    let filter_params = [
        (1000, 10),
        (1000, 1000),
        (100_000, 1000),
        (100_000, MAX_BLOOM_SIZE),
    ];
    for &(first_arg, second_arg) in filter_params.iter() {
        check_pull_request_size(CrdsFilter::new_rand(first_arg, second_arg));
    }
}
 | |
| 
 | |
|     fn check_pull_request_size(filter: CrdsFilter) {
 | |
|         let value = CrdsValue::new_unsigned(CrdsData::ContactInfo(ContactInfo::default()));
 | |
|         let protocol = Protocol::PullRequest(filter, value);
 | |
|         assert!(serialized_size(&protocol).unwrap() <= PACKET_DATA_SIZE as u64);
 | |
|     }
 | |
| 
 | |
/// Inserts an unstaked peer, a staked peer (twice), a peer with an unspecified
/// tvu address and a peer with a different shred version, then checks what
/// `tvu_peers` and `stake_weight_peers` return.
#[test]
fn test_tvu_peers_and_stakes() {
    let my_info = ContactInfo::new_localhost(&Pubkey::new(&[0; 32]), timestamp());
    let cluster_info = ClusterInfo::new_with_invalid_keypair(my_info.clone());

    // no stake
    let id = Pubkey::new(&[1u8; 32]);
    cluster_info.insert_info(ContactInfo::new_localhost(&id, timestamp()));

    // normal
    let id2 = Pubkey::new(&[2u8; 32]);
    let mut staked_peer = ContactInfo::new_localhost(&id2, timestamp());
    cluster_info.insert_info(staked_peer.clone());

    // duplicate
    staked_peer.wallclock = timestamp() + 1;
    cluster_info.insert_info(staked_peer);

    // no tvu
    let id3 = Pubkey::new(&[3u8; 32]);
    let mut no_tvu_peer = ContactInfo::new_localhost(&id3, timestamp());
    no_tvu_peer.tvu = "0.0.0.0:0".parse().unwrap();
    cluster_info.insert_info(no_tvu_peer);

    // normal but with different shred version
    let id4 = Pubkey::new(&[4u8; 32]);
    let mut other_version_peer = ContactInfo::new_localhost(&id4, timestamp());
    other_version_peer.shred_version = 1;
    assert_ne!(other_version_peer.shred_version, my_info.shred_version);
    cluster_info.insert_info(other_version_peer);

    // every peer except the first one is given a stake of 10
    let mut stakes = HashMap::new();
    for staked_id in [id2, id3, id4].iter() {
        stakes.insert(*staked_id, 10);
    }
    let stakes = Arc::new(stakes);

    let mut peers = cluster_info.tvu_peers();
    let peers_and_stakes = stake_weight_peers(&mut peers, Some(stakes));

    let peer_ids: Vec<_> = peers.iter().map(|peer| peer.id).collect();
    assert_eq!(peer_ids, vec![id, id2]);
    let weights: Vec<_> = peers_and_stakes.iter().map(|entry| entry.0).collect();
    assert_eq!(weights, vec![10, 1]);
}
 | |
| 
 | |
/// Checks which gossip addresses `new_pull_requests` targets when one staked
/// peer is known and the entrypoint's wallclock is fresh, reset to zero, and
/// then queried again.
#[test]
fn test_pull_from_entrypoint_if_not_present() {
    let node_keypair = Arc::new(Keypair::new());
    let my_info = ContactInfo::new_localhost(&node_keypair.pubkey(), timestamp());
    let cluster_info = ClusterInfo::new(my_info, node_keypair);

    let entrypoint_pubkey = Pubkey::new_rand();
    let mut entrypoint = ContactInfo::new_localhost(&entrypoint_pubkey, timestamp());
    entrypoint.gossip = socketaddr!("127.0.0.2:1234");
    cluster_info.set_entrypoint(entrypoint.clone());

    let other_node_pubkey = Pubkey::new_rand();
    let other_node = ContactInfo::new_localhost(&other_node_pubkey, timestamp());
    assert_ne!(other_node.gossip, entrypoint.gossip);
    cluster_info.insert_info(other_node.clone());

    let mut stakes = HashMap::new();
    stakes.insert(other_node_pubkey, 10);

    // Pull request 1:  `other_node` is present but `entrypoint` was just added (so it has a
    // fresh timestamp).  There should only be one pull request to `other_node`
    let pulls = cluster_info.new_pull_requests(&stakes);
    let destinations: Vec<_> = pulls.iter().map(|(addr, _)| *addr).collect();
    assert_eq!(destinations, vec![other_node.gossip]);

    // Pull request 2: pretend it's been a while since we've pulled from `entrypoint`.  There should
    // now be two pull requests
    {
        let mut entrypoint_guard = cluster_info.entrypoint.write().unwrap();
        entrypoint_guard.as_mut().unwrap().wallclock = 0;
    }
    let pulls = cluster_info.new_pull_requests(&stakes);
    let destinations: Vec<_> = pulls.iter().map(|(addr, _)| *addr).collect();
    assert_eq!(destinations, vec![other_node.gossip, entrypoint.gossip]);

    // Pull request 3:  `other_node` is present and `entrypoint` was just pulled from.  There should
    // only be one pull request to `other_node`
    let pulls = cluster_info.new_pull_requests(&stakes);
    let destinations: Vec<_> = pulls.iter().map(|(addr, _)| *addr).collect();
    assert_eq!(destinations, vec![other_node.gossip]);
}
 | |
| 
 | |
/// Inserts ten peers, five advertising a lowest slot of 0 and five a lowest
/// slot of 10, and checks that `repair_peers(5)` returns five of them.
#[test]
fn test_repair_peers() {
    let node_keypair = Arc::new(Keypair::new());
    let my_info = ContactInfo::new_localhost(&node_keypair.pubkey(), timestamp());
    let cluster_info = ClusterInfo::new(my_info, node_keypair);

    for i in 0..10 {
        // the second half of the peers advertise a lowest slot of 10, which
        // makes them invalid for the upcoming repair request
        let peer_lowest = match i {
            0..=4 => 0,
            _ => 10,
        };
        let other_node_pubkey = Pubkey::new_rand();
        cluster_info.insert_info(ContactInfo::new_localhost(&other_node_pubkey, timestamp()));

        let lowest_slot = LowestSlot::new(other_node_pubkey, peer_lowest, timestamp());
        let value = CrdsValue::new_unsigned(CrdsData::LowestSlot(0, lowest_slot));
        // the result of the insert is deliberately ignored
        let _ = cluster_info
            .gossip
            .write()
            .unwrap()
            .crds
            .insert(value, timestamp());
    }

    // only half the visible peers should be eligible to serve this repair
    let eligible = cluster_info.repair_peers(5);
    assert_eq!(eligible.len(), 5);
}
 | |
| 
 | |
/// Checks that the `MAX_BLOOM_SIZE` constant fits into the size computed
/// dynamically by `max_bloom_size`.
#[test]
fn test_max_bloom_size() {
    let dynamic_limit = max_bloom_size();
    assert!(MAX_BLOOM_SIZE <= dynamic_limit);
}
 | |
| 
 | |
/// Measures, for each `Protocol` variant, the serialized size left after
/// subtracting its payload, and checks that the largest of these equals
/// `MAX_PROTOCOL_HEADER_SIZE`.
#[test]
fn test_protocol_size() {
    let contact_info = CrdsValue::new_unsigned(CrdsData::ContactInfo(ContactInfo::default()));
    let dummy_vec =
        vec![CrdsValue::new_unsigned(CrdsData::ContactInfo(ContactInfo::default())); 10];
    let dummy_vec_size = serialized_size(&dummy_vec).unwrap();

    // pull request: everything except the filter
    let pull_request = Protocol::PullRequest(CrdsFilter::default(), contact_info);
    let pull_request_overhead = serialized_size(&pull_request).unwrap()
        - serialized_size(&CrdsFilter::default()).unwrap();

    // pull response: everything except the vec of values
    let pull_response = Protocol::PullResponse(Pubkey::default(), dummy_vec.clone());
    let pull_response_overhead = serialized_size(&pull_response).unwrap() - dummy_vec_size;

    // push message: everything except the vec of values
    let push_message = Protocol::PushMessage(Pubkey::default(), dummy_vec);
    let push_message_overhead = serialized_size(&push_message).unwrap() - dummy_vec_size;

    // prune message: everything except the prune data
    let prune_message = Protocol::PruneMessage(Pubkey::default(), PruneData::default());
    let prune_message_overhead = serialized_size(&prune_message).unwrap()
        - serialized_size(&PruneData::default()).unwrap();

    let max_protocol_size = pull_request_overhead
        .max(pull_response_overhead)
        .max(push_message_overhead)
        .max(prune_message_overhead);

    // finally assert the header size estimation is correct
    assert_eq!(MAX_PROTOCOL_HEADER_SIZE, max_protocol_size);
}
 | |
| 
 | |
/// Checks that sanitizing a prune message whose wallclock equals
/// `MAX_WALLCLOCK` fails with `SanitizeError::ValueOutOfBounds`.
#[test]
fn test_protocol_sanitize() {
    let prune_data = PruneData {
        wallclock: MAX_WALLCLOCK,
        ..PruneData::default()
    };
    let msg = Protocol::PruneMessage(Pubkey::default(), prune_data);
    assert_eq!(msg.sanitize(), Err(SanitizeError::ValueOutOfBounds));
}
 | |
| 
 | |
|     // computes the maximum size for pull request blooms
 | |
|     fn max_bloom_size() -> usize {
 | |
|         let filter_size = serialized_size(&CrdsFilter::default())
 | |
|             .expect("unable to serialize default filter") as usize;
 | |
|         let protocol = Protocol::PullRequest(
 | |
|             CrdsFilter::default(),
 | |
|             CrdsValue::new_unsigned(CrdsData::ContactInfo(ContactInfo::default())),
 | |
|         );
 | |
|         let protocol_size =
 | |
|             serialized_size(&protocol).expect("unable to serialize gossip protocol") as usize;
 | |
|         PACKET_DATA_SIZE - (protocol_size - filter_size)
 | |
|     }
 | |
| 
 | |
/// Pushes 32000 randomly spaced, increasing slots in two halves and checks
/// that `get_epoch_slots_since(None)` yields exactly those slots back.
#[test]
fn test_push_epoch_slots_large() {
    use rand::Rng;
    let node_keypair = Arc::new(Keypair::new());
    let my_info = ContactInfo::new_localhost(&node_keypair.pubkey(), timestamp());
    let cluster_info = ClusterInfo::new(my_info, node_keypair);

    //random should be hard to compress
    let mut rng = rand::thread_rng();
    let mut last: Slot = 0;
    let range: Vec<Slot> = (0..32000)
        .map(|_| {
            // each slot is 1..32 above the previous one
            last += rng.gen_range(1, 32);
            last
        })
        .collect();

    let (first_half, second_half) = range.split_at(16000);
    cluster_info.push_epoch_slots(first_half);
    cluster_info.push_epoch_slots(second_half);

    let (epoch_slots, since) = cluster_info.get_epoch_slots_since(None);
    let slots: Vec<_> = epoch_slots
        .iter()
        .flat_map(|entry| entry.to_slots(0))
        .collect();
    assert_eq!(slots, range);
    assert!(since.is_some());
}
 | |
| 
 | |
/// Builds a vote-switch transaction carrying 32 slots, wraps it in a signed
/// CRDS vote value, and checks the serialized value fits within
/// `MAX_PROTOCOL_PAYLOAD_SIZE`.
#[test]
fn test_vote_size() {
    let slots = vec![1; 32];
    let vote = Vote::new(slots, Hash::default());
    let keypair = Arc::new(Keypair::new());

    // Create the biggest possible vote transaction
    let vote_ix = vote_instruction::vote_switch(
        &keypair.pubkey(),
        &keypair.pubkey(),
        vote,
        Hash::default(),
    );
    let mut vote_tx = Transaction::new_with_payer(&[vote_ix], Some(&keypair.pubkey()));

    // Sign once: the original repeated this exact call with the same keypair
    // and blockhash, which added nothing.
    // NOTE(review): the same keypair fills every signer role here; if two
    // distinct signers were intended for the "biggest" transaction, confirm.
    vote_tx.partial_sign(&[keypair.as_ref()], Hash::default());

    let vote = CrdsVote {
        from: keypair.pubkey(),
        transaction: vote_tx,
        wallclock: 0,
    };
    let vote = CrdsValue::new_signed(CrdsData::Vote(1, vote), &Keypair::new());
    assert!(bincode::serialized_size(&vote).unwrap() <= MAX_PROTOCOL_PAYLOAD_SIZE);
}
 | |
| 
 | |
/// Sets an entrypoint known only by gossip address, inserts a gossiped contact
/// info with that address and shred version 1, and checks that
/// `handle_adopt_shred_version` adopts both the contact info and the version.
#[test]
fn test_handle_adopt_shred_version() {
    let node_keypair = Arc::new(Keypair::new());
    let my_info = ContactInfo::new_localhost(&node_keypair.pubkey(), timestamp());
    let cluster_info = Arc::new(ClusterInfo::new(my_info, node_keypair));

    // Simulating starting up with default entrypoint, no known id, only a gossip
    // address
    let entrypoint_gossip_addr = socketaddr!("127.0.0.2:1234");
    let mut placeholder_entrypoint = ContactInfo::new_localhost(&Pubkey::default(), timestamp());
    placeholder_entrypoint.gossip = entrypoint_gossip_addr;
    assert_eq!(placeholder_entrypoint.shred_version, 0);
    cluster_info.set_entrypoint(placeholder_entrypoint);

    // Simulate getting entrypoint ContactInfo from gossip
    let mut gossiped_entrypoint_info =
        ContactInfo::new_localhost(&Pubkey::new_rand(), timestamp());
    gossiped_entrypoint_info.gossip = entrypoint_gossip_addr;
    gossiped_entrypoint_info.shred_version = 1;
    cluster_info.insert_info(gossiped_entrypoint_info.clone());

    // Adopt the entrypoint's gossiped contact info and verify
    ClusterInfo::handle_adopt_shred_version(&cluster_info, &mut true);
    {
        let stored_entrypoint = cluster_info.entrypoint.read().unwrap();
        assert_eq!(stored_entrypoint.as_ref().unwrap(), &gossiped_entrypoint_info);
    }
    assert_eq!(cluster_info.my_shred_version(), 1);
}
 | |
| }
 |