//! The `gossip_service` module implements the network control plane. use crate::cluster_info::{ClusterInfo, VALIDATOR_PORT_RANGE}; use crate::contact_info::ContactInfo; use rand::{thread_rng, Rng}; use solana_client::thin_client::{create_client, ThinClient}; use solana_ledger::bank_forks::BankForks; use solana_perf::recycler::Recycler; use solana_sdk::pubkey::Pubkey; use solana_sdk::signature::{Keypair, Signer}; use solana_streamer::streamer; use std::net::{IpAddr, Ipv4Addr, SocketAddr, TcpListener, UdpSocket}; use std::sync::atomic::{AtomicBool, Ordering}; use std::sync::mpsc::channel; use std::sync::{Arc, RwLock}; use std::thread::{self, sleep, JoinHandle}; use std::time::{Duration, Instant}; pub struct GossipService { thread_hdls: Vec>, } impl GossipService { pub fn new( cluster_info: &Arc, bank_forks: Option>>, gossip_socket: UdpSocket, exit: &Arc, ) -> Self { let (request_sender, request_receiver) = channel(); let gossip_socket = Arc::new(gossip_socket); trace!( "GossipService: id: {}, listening on: {:?}", &cluster_info.id(), gossip_socket.local_addr().unwrap() ); let t_receiver = streamer::receiver( gossip_socket.clone(), &exit, request_sender, Recycler::default(), "gossip_receiver", ); let (response_sender, response_receiver) = channel(); let t_responder = streamer::responder("gossip", gossip_socket, response_receiver); let t_listen = ClusterInfo::listen( cluster_info.clone(), bank_forks.clone(), request_receiver, response_sender.clone(), exit, ); let t_gossip = ClusterInfo::gossip(cluster_info.clone(), bank_forks, response_sender, exit); let thread_hdls = vec![t_receiver, t_responder, t_listen, t_gossip]; Self { thread_hdls } } pub fn join(self) -> thread::Result<()> { for thread_hdl in self.thread_hdls { thread_hdl.join()?; } Ok(()) } } /// Discover Validators in a cluster pub fn discover_cluster( entrypoint: &SocketAddr, num_nodes: usize, ) -> std::io::Result> { discover( Some(entrypoint), Some(num_nodes), Some(30), None, None, None, 0, ) .map(|(_all_peers, validators)| validators) } pub fn discover( entrypoint: Option<&SocketAddr>, num_nodes: Option, // num_nodes only counts validators, excludes spy nodes timeout: Option, find_node_by_pubkey: Option, find_node_by_gossip_addr: Option<&SocketAddr>, my_gossip_addr: Option<&SocketAddr>, my_shred_version: u16, ) -> std::io::Result<(Vec, Vec)> { let exit = Arc::new(AtomicBool::new(false)); let (gossip_service, ip_echo, spy_ref) = make_gossip_node(entrypoint, &exit, my_gossip_addr, my_shred_version); let id = spy_ref.id(); info!("Entrypoint: {:?}", entrypoint); info!("Node Id: {:?}", id); if let Some(my_gossip_addr) = my_gossip_addr { info!("Gossip Address: {:?}", my_gossip_addr); } let _ip_echo_server = ip_echo.map(solana_net_utils::ip_echo_server); let (met_criteria, secs, all_peers, tvu_peers) = spy( spy_ref.clone(), num_nodes, timeout, find_node_by_pubkey, find_node_by_gossip_addr, ); exit.store(true, Ordering::Relaxed); gossip_service.join().unwrap(); if met_criteria { info!( "discover success in {}s...\n{}", secs, spy_ref.contact_info_trace() ); return Ok((all_peers, tvu_peers)); } if !tvu_peers.is_empty() { info!( "discover failed to match criteria by timeout...\n{}", spy_ref.contact_info_trace() ); return Ok((all_peers, tvu_peers)); } info!("discover failed...\n{}", spy_ref.contact_info_trace()); Err(std::io::Error::new( std::io::ErrorKind::Other, "Discover failed", )) } /// Creates a ThinClient per valid node pub fn get_clients(nodes: &[ContactInfo]) -> Vec { nodes .iter() .filter_map(ContactInfo::valid_client_facing_addr) .map(|addrs| create_client(addrs, VALIDATOR_PORT_RANGE)) .collect() } /// Creates a ThinClient by selecting a valid node at random pub fn get_client(nodes: &[ContactInfo]) -> ThinClient { let nodes: Vec<_> = nodes .iter() .filter_map(ContactInfo::valid_client_facing_addr) .collect(); let select = thread_rng().gen_range(0, nodes.len()); create_client(nodes[select], VALIDATOR_PORT_RANGE) } pub fn get_multi_client(nodes: &[ContactInfo]) -> (ThinClient, usize) { let addrs: Vec<_> = nodes .iter() .filter_map(ContactInfo::valid_client_facing_addr) .map(|addrs| addrs) .collect(); let rpc_addrs: Vec<_> = addrs.iter().map(|addr| addr.0).collect(); let tpu_addrs: Vec<_> = addrs.iter().map(|addr| addr.1).collect(); let (_, transactions_socket) = solana_net_utils::bind_in_range( IpAddr::V4(Ipv4Addr::new(0, 0, 0, 0)), VALIDATOR_PORT_RANGE, ) .unwrap(); let num_nodes = tpu_addrs.len(); ( ThinClient::new_from_addrs(rpc_addrs, tpu_addrs, transactions_socket), num_nodes, ) } fn spy( spy_ref: Arc, num_nodes: Option, timeout: Option, find_node_by_pubkey: Option, find_node_by_gossip_addr: Option<&SocketAddr>, ) -> (bool, u64, Vec, Vec) { let now = Instant::now(); let mut met_criteria = false; let mut all_peers: Vec = Vec::new(); let mut tvu_peers: Vec = Vec::new(); let mut i = 1; while !met_criteria { if let Some(secs) = timeout { if now.elapsed() >= Duration::from_secs(secs) { break; } } all_peers = spy_ref .all_peers() .into_iter() .map(|x| x.0) .collect::>(); tvu_peers = spy_ref.all_tvu_peers().into_iter().collect::>(); let found_node_by_pubkey = if let Some(pubkey) = find_node_by_pubkey { all_peers.iter().any(|x| x.id == pubkey) } else { false }; let found_node_by_gossip_addr = if let Some(gossip_addr) = find_node_by_gossip_addr { all_peers.iter().any(|x| x.gossip == *gossip_addr) } else { false }; if let Some(num) = num_nodes { // Only consider validators and archives for `num_nodes` let mut nodes: Vec<_> = tvu_peers.iter().collect(); nodes.sort(); nodes.dedup(); if nodes.len() >= num { if found_node_by_pubkey || found_node_by_gossip_addr { met_criteria = true; } if find_node_by_pubkey.is_none() && find_node_by_gossip_addr.is_none() { met_criteria = true; } } } else if found_node_by_pubkey || found_node_by_gossip_addr { met_criteria = true; } if i % 20 == 0 { info!("discovering...\n{}", spy_ref.contact_info_trace()); } sleep(Duration::from_millis( crate::cluster_info::GOSSIP_SLEEP_MILLIS, )); i += 1; } (met_criteria, now.elapsed().as_secs(), all_peers, tvu_peers) } /// Makes a spy or gossip node based on whether or not a gossip_addr was passed in /// Pass in a gossip addr to fully participate in gossip instead of relying on just pulls fn make_gossip_node( entrypoint: Option<&SocketAddr>, exit: &Arc, gossip_addr: Option<&SocketAddr>, shred_version: u16, ) -> (GossipService, Option, Arc) { let keypair = Arc::new(Keypair::new()); let (node, gossip_socket, ip_echo) = if let Some(gossip_addr) = gossip_addr { ClusterInfo::gossip_node(&keypair.pubkey(), gossip_addr, shred_version) } else { ClusterInfo::spy_node(&keypair.pubkey(), shred_version) }; let cluster_info = ClusterInfo::new(node, keypair); if let Some(entrypoint) = entrypoint { cluster_info.set_entrypoint(ContactInfo::new_gossip_entry_point(entrypoint)); } let cluster_info = Arc::new(cluster_info); let gossip_service = GossipService::new(&cluster_info.clone(), None, gossip_socket, &exit); (gossip_service, ip_echo, cluster_info) } #[cfg(test)] mod tests { use super::*; use crate::cluster_info::{ClusterInfo, Node}; use std::sync::atomic::AtomicBool; use std::sync::Arc; #[test] #[ignore] // test that stage will exit when flag is set fn test_exit() { let exit = Arc::new(AtomicBool::new(false)); let tn = Node::new_localhost(); let cluster_info = ClusterInfo::new_with_invalid_keypair(tn.info.clone()); let c = Arc::new(cluster_info); let d = GossipService::new(&c, None, tn.sockets.gossip, &exit); exit.store(true, Ordering::Relaxed); d.join().unwrap(); } #[test] fn test_gossip_services_spy() { let keypair = Keypair::new(); let peer0 = Pubkey::new_rand(); let peer1 = Pubkey::new_rand(); let contact_info = ContactInfo::new_localhost(&keypair.pubkey(), 0); let peer0_info = ContactInfo::new_localhost(&peer0, 0); let peer1_info = ContactInfo::new_localhost(&peer1, 0); let cluster_info = ClusterInfo::new(contact_info.clone(), Arc::new(keypair)); cluster_info.insert_info(peer0_info.clone()); cluster_info.insert_info(peer1_info); let spy_ref = Arc::new(cluster_info); let (met_criteria, secs, _, tvu_peers) = spy(spy_ref.clone(), None, Some(1), None, None); assert_eq!(met_criteria, false); assert_eq!(secs, 1); assert_eq!(tvu_peers, spy_ref.tvu_peers()); // Find num_nodes let (met_criteria, _, _, _) = spy(spy_ref.clone(), Some(1), None, None, None); assert_eq!(met_criteria, true); let (met_criteria, _, _, _) = spy(spy_ref.clone(), Some(2), None, None, None); assert_eq!(met_criteria, true); // Find specific node by pubkey let (met_criteria, _, _, _) = spy(spy_ref.clone(), None, None, Some(peer0), None); assert_eq!(met_criteria, true); let (met_criteria, _, _, _) = spy( spy_ref.clone(), None, Some(0), Some(Pubkey::new_rand()), None, ); assert_eq!(met_criteria, false); // Find num_nodes *and* specific node by pubkey let (met_criteria, _, _, _) = spy(spy_ref.clone(), Some(1), None, Some(peer0), None); assert_eq!(met_criteria, true); let (met_criteria, _, _, _) = spy(spy_ref.clone(), Some(3), Some(0), Some(peer0), None); assert_eq!(met_criteria, false); let (met_criteria, _, _, _) = spy( spy_ref.clone(), Some(1), Some(0), Some(Pubkey::new_rand()), None, ); assert_eq!(met_criteria, false); // Find specific node by gossip address let (met_criteria, _, _, _) = spy(spy_ref.clone(), None, None, None, Some(&peer0_info.gossip)); assert_eq!(met_criteria, true); let (met_criteria, _, _, _) = spy( spy_ref.clone(), None, Some(0), None, Some(&"1.1.1.1:1234".parse().unwrap()), ); assert_eq!(met_criteria, false); } }