//! The `packet` module defines data structures and methods to pull data from the network. use crate::recvmmsg::{recv_mmsg, NUM_RCVMMSGS}; use crate::result::{Error, Result}; use bincode::{serialize, serialize_into}; use byteorder::{ByteOrder, LittleEndian}; use log::Level; use serde::Serialize; use solana_metrics::counter::Counter; pub use solana_sdk::packet::PACKET_DATA_SIZE; use std::cmp; use std::fmt; use std::io; use std::mem::size_of; use std::net::{IpAddr, Ipv4Addr, Ipv6Addr, SocketAddr, UdpSocket}; use std::sync::{Arc, RwLock}; pub type SharedPackets = Arc>; pub type SharedBlob = Arc>; pub type SharedBlobs = Vec; pub const NUM_PACKETS: usize = 1024 * 8; pub const BLOB_SIZE: usize = (64 * 1024 - 128); // wikipedia says there should be 20b for ipv4 headers pub const BLOB_DATA_SIZE: usize = BLOB_SIZE - (BLOB_HEADER_SIZE * 2); pub const NUM_BLOBS: usize = (NUM_PACKETS * PACKET_DATA_SIZE) / BLOB_SIZE; #[derive(Clone, Default, Debug, PartialEq)] #[repr(C)] pub struct Meta { pub size: usize, pub num_retransmits: u64, pub addr: [u16; 8], pub port: u16, pub v6: bool, } #[derive(Clone)] #[repr(C)] pub struct Packet { pub data: [u8; PACKET_DATA_SIZE], pub meta: Meta, } impl fmt::Debug for Packet { fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result { write!( f, "Packet {{ size: {:?}, addr: {:?} }}", self.meta.size, self.meta.addr() ) } } impl Default for Packet { fn default() -> Packet { Packet { data: [0u8; PACKET_DATA_SIZE], meta: Meta::default(), } } } impl Meta { pub fn addr(&self) -> SocketAddr { if !self.v6 { let addr = [ self.addr[0] as u8, self.addr[1] as u8, self.addr[2] as u8, self.addr[3] as u8, ]; let ipv4: Ipv4Addr = From::<[u8; 4]>::from(addr); SocketAddr::new(IpAddr::V4(ipv4), self.port) } else { let ipv6: Ipv6Addr = From::<[u16; 8]>::from(self.addr); SocketAddr::new(IpAddr::V6(ipv6), self.port) } } pub fn set_addr(&mut self, a: &SocketAddr) { match *a { SocketAddr::V4(v4) => { let ip = v4.ip().octets(); self.addr[0] = u16::from(ip[0]); self.addr[1] = u16::from(ip[1]); self.addr[2] = u16::from(ip[2]); self.addr[3] = u16::from(ip[3]); self.addr[4] = 0; self.addr[5] = 0; self.addr[6] = 0; self.addr[7] = 0; self.v6 = false; } SocketAddr::V6(v6) => { self.addr = v6.ip().segments(); self.v6 = true; } } self.port = a.port(); } } #[derive(Debug)] pub struct Packets { pub packets: Vec, } //auto derive doesn't support large arrays impl Default for Packets { fn default() -> Packets { Packets { packets: vec![Packet::default(); NUM_PACKETS], } } } impl Packets { pub fn set_addr(&mut self, addr: &SocketAddr) { for m in self.packets.iter_mut() { m.meta.set_addr(&addr); } } } #[derive(Clone)] pub struct Blob { pub data: [u8; BLOB_SIZE], pub meta: Meta, } impl PartialEq for Blob { fn eq(&self, other: &Blob) -> bool { self.data.iter().zip(other.data.iter()).all(|(a, b)| a == b) && self.meta == other.meta } } impl fmt::Debug for Blob { fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result { write!( f, "Blob {{ size: {:?}, addr: {:?} }}", self.meta.size, self.meta.addr() ) } } //auto derive doesn't support large arrays impl Default for Blob { fn default() -> Blob { Blob { data: [0u8; BLOB_SIZE], meta: Meta::default(), } } } #[derive(Debug)] pub enum BlobError { /// the Blob's meta and data are not self-consistent BadState, /// Blob verification failed VerificationFailed, } impl Packets { fn run_read_from(&mut self, socket: &UdpSocket) -> Result { self.packets.resize(NUM_PACKETS, Packet::default()); let mut i = 0; //DOCUMENTED SIDE-EFFECT //Performance out of the IO without poll // * block on the socket until it's readable // * set the socket to non blocking // * read until it fails // * set it back to blocking before returning socket.set_nonblocking(false)?; trace!("receiving on {}", socket.local_addr().unwrap()); loop { match recv_mmsg(socket, &mut self.packets[i..]) { Err(_) if i > 0 => { inc_new_counter_info!("packets-recv_count", i); debug!("got {:?} messages on {}", i, socket.local_addr().unwrap()); return Ok(i); } Err(e) => { trace!("recv_from err {:?}", e); return Err(Error::IO(e)); } Ok(npkts) => { if i == 0 { socket.set_nonblocking(true)?; } trace!("got {} packets", npkts); i += npkts; if npkts != NUM_RCVMMSGS || i >= 1024 { inc_new_counter_info!("packets-recv_count", i); return Ok(i); } } } } } pub fn recv_from(&mut self, socket: &UdpSocket) -> Result<()> { let sz = self.run_read_from(socket)?; self.packets.resize(sz, Packet::default()); debug!("recv_from: {}", sz); Ok(()) } pub fn send_to(&self, socket: &UdpSocket) -> Result<()> { for p in &self.packets { let a = p.meta.addr(); socket.send_to(&p.data[..p.meta.size], &a)?; } Ok(()) } } pub fn to_packets_chunked(xs: &[T], chunks: usize) -> Vec { let mut out = vec![]; for x in xs.chunks(chunks) { let p = SharedPackets::default(); p.write() .unwrap() .packets .resize(x.len(), Packet::default()); for (i, o) in x.iter().zip(p.write().unwrap().packets.iter_mut()) { let mut wr = io::Cursor::new(&mut o.data[..]); serialize_into(&mut wr, &i).expect("serialize request"); let len = wr.position() as usize; o.meta.size = len; } out.push(p); } out } pub fn to_packets(xs: &[T]) -> Vec { to_packets_chunked(xs, NUM_PACKETS) } pub fn to_blob(resp: T, rsp_addr: SocketAddr) -> Result { let mut b = Blob::default(); let v = serialize(&resp)?; let len = v.len(); assert!(len <= BLOB_SIZE); b.data[..len].copy_from_slice(&v); b.meta.size = len; b.meta.set_addr(&rsp_addr); Ok(b) } pub fn to_blobs(rsps: Vec<(T, SocketAddr)>) -> Result> { let mut blobs = Vec::new(); for (resp, rsp_addr) in rsps { blobs.push(to_blob(resp, rsp_addr)?); } Ok(blobs) } pub fn to_shared_blob(resp: T, rsp_addr: SocketAddr) -> Result { let blob = Arc::new(RwLock::new(to_blob(resp, rsp_addr)?)); Ok(blob) } pub fn to_shared_blobs(rsps: Vec<(T, SocketAddr)>) -> Result { let mut blobs = Vec::new(); for (resp, rsp_addr) in rsps { blobs.push(to_shared_blob(resp, rsp_addr)?); } Ok(blobs) } macro_rules! range { ($prev:expr, $type:ident) => { $prev..$prev + size_of::<$type>() }; } const PARENT_RANGE: std::ops::Range = range!(0, u64); const SLOT_RANGE: std::ops::Range = range!(PARENT_RANGE.end, u64); const INDEX_RANGE: std::ops::Range = range!(SLOT_RANGE.end, u64); const FORWARD_RANGE: std::ops::Range = range!(INDEX_RANGE.end, bool); const FLAGS_RANGE: std::ops::Range = range!(FORWARD_RANGE.end, u32); const SIZE_RANGE: std::ops::Range = range!(FLAGS_RANGE.end, u64); macro_rules! align { ($x:expr, $align:expr) => { $x + ($align * 8 - 1) & !($align * 8 - 1) }; } pub const BLOB_HEADER_SIZE: usize = align!(SIZE_RANGE.end, 8); pub const BLOB_FLAG_IS_LAST_IN_SLOT: u32 = 0x2; pub const BLOB_FLAG_IS_CODING: u32 = 0x1; impl Blob { pub fn new(data: &[u8]) -> Self { let mut blob = Self::default(); let data_len = cmp::min(data.len(), blob.data.len()); let bytes = &data[..data_len]; blob.data[..data_len].copy_from_slice(bytes); blob.meta.size = blob.data_size() as usize; blob } pub fn parent(&self) -> u64 { LittleEndian::read_u64(&self.data[PARENT_RANGE]) } pub fn set_parent(&mut self, ix: u64) { LittleEndian::write_u64(&mut self.data[PARENT_RANGE], ix); } pub fn slot(&self) -> u64 { LittleEndian::read_u64(&self.data[SLOT_RANGE]) } pub fn set_slot(&mut self, ix: u64) { LittleEndian::write_u64(&mut self.data[SLOT_RANGE], ix); } pub fn index(&self) -> u64 { LittleEndian::read_u64(&self.data[INDEX_RANGE]) } pub fn set_index(&mut self, ix: u64) { LittleEndian::write_u64(&mut self.data[INDEX_RANGE], ix); } /// Used to determine whether or not this blob should be forwarded in retransmit /// A bool is used here instead of a flag because this item is not intended to be signed when /// blob signatures are introduced pub fn should_forward(&self) -> bool { self.data[FORWARD_RANGE][0] & 0x1 == 1 } pub fn forward(&mut self, forward: bool) { self.data[FORWARD_RANGE][0] = u8::from(forward) } pub fn flags(&self) -> u32 { LittleEndian::read_u32(&self.data[FLAGS_RANGE]) } pub fn set_flags(&mut self, ix: u32) { LittleEndian::write_u32(&mut self.data[FLAGS_RANGE], ix); } pub fn is_coding(&self) -> bool { (self.flags() & BLOB_FLAG_IS_CODING) != 0 } pub fn set_coding(&mut self) { let flags = self.flags(); self.set_flags(flags | BLOB_FLAG_IS_CODING); } pub fn set_is_last_in_slot(&mut self) { let flags = self.flags(); self.set_flags(flags | BLOB_FLAG_IS_LAST_IN_SLOT); } pub fn is_last_in_slot(&self) -> bool { (self.flags() & BLOB_FLAG_IS_LAST_IN_SLOT) != 0 } pub fn data_size(&self) -> u64 { LittleEndian::read_u64(&self.data[SIZE_RANGE]) } pub fn set_data_size(&mut self, ix: u64) { LittleEndian::write_u64(&mut self.data[SIZE_RANGE], ix); } pub fn data(&self) -> &[u8] { &self.data[BLOB_HEADER_SIZE..] } pub fn data_mut(&mut self) -> &mut [u8] { &mut self.data[BLOB_HEADER_SIZE..] } pub fn size(&self) -> usize { let size = self.data_size() as usize; if size > BLOB_HEADER_SIZE && size == self.meta.size { size - BLOB_HEADER_SIZE } else { 0 } } pub fn set_size(&mut self, size: usize) { let new_size = size + BLOB_HEADER_SIZE; self.meta.size = new_size; self.set_data_size(new_size as u64); } pub fn recv_blob(socket: &UdpSocket, r: &SharedBlob) -> io::Result<()> { let mut p = r.write().unwrap(); trace!("receiving on {}", socket.local_addr().unwrap()); let (nrecv, from) = socket.recv_from(&mut p.data)?; p.meta.size = nrecv; p.meta.set_addr(&from); trace!("got {} bytes from {}", nrecv, from); Ok(()) } pub fn recv_from(socket: &UdpSocket) -> Result { let mut v = Vec::new(); //DOCUMENTED SIDE-EFFECT //Performance out of the IO without poll // * block on the socket until it's readable // * set the socket to non blocking // * read until it fails // * set it back to blocking before returning socket.set_nonblocking(false)?; for i in 0..NUM_BLOBS { let r = SharedBlob::default(); match Blob::recv_blob(socket, &r) { Err(_) if i > 0 => { trace!("got {:?} messages on {}", i, socket.local_addr().unwrap()); break; } Err(e) => { if e.kind() != io::ErrorKind::WouldBlock { info!("recv_from err {:?}", e); } return Err(Error::IO(e)); } Ok(()) => { if i == 0 { socket.set_nonblocking(true)?; } } } v.push(r); } Ok(v) } pub fn send_to(socket: &UdpSocket, v: SharedBlobs) -> Result<()> { for r in v { { let p = r.read().unwrap(); let a = p.meta.addr(); if let Err(e) = socket.send_to(&p.data[..p.meta.size], &a) { warn!( "error sending {} byte packet to {:?}: {:?}", p.meta.size, a, e ); Err(e)?; } } } Ok(()) } } pub fn index_blobs(blobs: &[SharedBlob], blob_index: &mut u64, slots: &[u64]) { // enumerate all the blobs, those are the indices for (blob, slot) in blobs.iter().zip(slots) { let mut blob = blob.write().unwrap(); blob.set_index(*blob_index); blob.set_slot(*slot); blob.forward(true); *blob_index += 1; } } #[cfg(test)] mod tests { use crate::packet::{ to_packets, Blob, Meta, Packet, Packets, SharedBlob, SharedPackets, NUM_PACKETS, PACKET_DATA_SIZE, }; use solana_sdk::hash::Hash; use solana_sdk::signature::{Keypair, KeypairUtil}; use solana_sdk::system_transaction::SystemTransaction; use std::io; use std::io::Write; use std::net::{Ipv4Addr, SocketAddr, UdpSocket}; #[test] fn test_packets_set_addr() { // test that the address is actually being updated let send_addr = socketaddr!([127, 0, 0, 1], 123); let packets = vec![Packet::default()]; let mut msgs = Packets { packets }; msgs.set_addr(&send_addr); assert_eq!(SocketAddr::from(msgs.packets[0].meta.addr()), send_addr); } #[test] pub fn packet_send_recv() { let reader = UdpSocket::bind("127.0.0.1:0").expect("bind"); let addr = reader.local_addr().unwrap(); let sender = UdpSocket::bind("127.0.0.1:0").expect("bind"); let saddr = sender.local_addr().unwrap(); let p = SharedPackets::default(); p.write().unwrap().packets.resize(10, Packet::default()); for m in p.write().unwrap().packets.iter_mut() { m.meta.set_addr(&addr); m.meta.size = PACKET_DATA_SIZE; } p.read().unwrap().send_to(&sender).unwrap(); p.write().unwrap().recv_from(&reader).unwrap(); for m in p.write().unwrap().packets.iter_mut() { assert_eq!(m.meta.size, PACKET_DATA_SIZE); assert_eq!(m.meta.addr(), saddr); } } #[test] fn test_to_packets() { let keypair = Keypair::new(); let hash = Hash::new(&[1; 32]); let tx = SystemTransaction::new_account(&keypair, keypair.pubkey(), 1, hash, 0); let rv = to_packets(&vec![tx.clone(); 1]); assert_eq!(rv.len(), 1); assert_eq!(rv[0].read().unwrap().packets.len(), 1); let rv = to_packets(&vec![tx.clone(); NUM_PACKETS]); assert_eq!(rv.len(), 1); assert_eq!(rv[0].read().unwrap().packets.len(), NUM_PACKETS); let rv = to_packets(&vec![tx.clone(); NUM_PACKETS + 1]); assert_eq!(rv.len(), 2); assert_eq!(rv[0].read().unwrap().packets.len(), NUM_PACKETS); assert_eq!(rv[1].read().unwrap().packets.len(), 1); } #[test] pub fn blob_send_recv() { trace!("start"); let reader = UdpSocket::bind("127.0.0.1:0").expect("bind"); let addr = reader.local_addr().unwrap(); let sender = UdpSocket::bind("127.0.0.1:0").expect("bind"); let p = SharedBlob::default(); p.write().unwrap().meta.set_addr(&addr); p.write().unwrap().meta.size = 1024; let v = vec![p]; Blob::send_to(&sender, v).unwrap(); trace!("send_to"); let rv = Blob::recv_from(&reader).unwrap(); trace!("recv_from"); assert_eq!(rv.len(), 1); assert_eq!(rv[0].read().unwrap().meta.size, 1024); } #[cfg(all(feature = "ipv6", test))] #[test] pub fn blob_ipv6_send_recv() { let reader = UdpSocket::bind("[::1]:0").expect("bind"); let addr = reader.local_addr().unwrap(); let sender = UdpSocket::bind("[::1]:0").expect("bind"); let p = SharedBlob::default(); p.as_mut().unwrap().meta.set_addr(&addr); p.as_mut().unwrap().meta.size = 1024; let mut v = VecDeque::default(); v.push_back(p); Blob::send_to(&r, &sender, &mut v).unwrap(); let mut rv = Blob::recv_from(&reader).unwrap(); let rp = rv.pop_front().unwrap(); assert_eq!(rp.as_mut().meta.size, 1024); } #[test] pub fn debug_trait() { write!(io::sink(), "{:?}", Packet::default()).unwrap(); write!(io::sink(), "{:?}", Packets::default()).unwrap(); write!(io::sink(), "{:?}", Blob::default()).unwrap(); } #[test] pub fn blob_test() { let mut b = Blob::default(); b.set_index(::max_value()); assert_eq!(b.index(), ::max_value()); b.data_mut()[0] = 1; assert_eq!(b.data()[0], 1); assert_eq!(b.index(), ::max_value()); assert_eq!(b.meta, Meta::default()); } #[test] fn test_blob_forward() { let mut b = Blob::default(); assert!(!b.should_forward()); b.forward(true); assert!(b.should_forward()); } }