Use LRU cache and blake3 hash of shreds to filter duplicates (#13976)
This commit is contained in:
parent
6e9dbb4f6e
commit
f6600810d7
|
@ -40,6 +40,17 @@ version = "0.4.6"
|
||||||
source = "registry+https://github.com/rust-lang/crates.io-index"
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
||||||
checksum = "f6789e291be47ace86a60303502173d84af8327e3627ecf334356ee0f87a164c"
|
checksum = "f6789e291be47ace86a60303502173d84af8327e3627ecf334356ee0f87a164c"
|
||||||
|
|
||||||
|
[[package]]
|
||||||
|
name = "ahash"
|
||||||
|
version = "0.6.1"
|
||||||
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
||||||
|
checksum = "865f8b0b3fced577b7df82e9b0eb7609595d7209c0b39e78d0646672e244b1b1"
|
||||||
|
dependencies = [
|
||||||
|
"getrandom 0.2.0",
|
||||||
|
"lazy_static",
|
||||||
|
"version_check 0.9.2",
|
||||||
|
]
|
||||||
|
|
||||||
[[package]]
|
[[package]]
|
||||||
name = "aho-corasick"
|
name = "aho-corasick"
|
||||||
version = "0.7.10"
|
version = "0.7.10"
|
||||||
|
@ -616,7 +627,7 @@ version = "0.1.8"
|
||||||
source = "registry+https://github.com/rust-lang/crates.io-index"
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
||||||
checksum = "25e4c606eb459dd29f7c57b2e0879f2b6f14ee130918c2b78ccb58a9624e6c7a"
|
checksum = "25e4c606eb459dd29f7c57b2e0879f2b6f14ee130918c2b78ccb58a9624e6c7a"
|
||||||
dependencies = [
|
dependencies = [
|
||||||
"getrandom",
|
"getrandom 0.1.14",
|
||||||
"proc-macro-hack",
|
"proc-macro-hack",
|
||||||
]
|
]
|
||||||
|
|
||||||
|
@ -1302,6 +1313,17 @@ dependencies = [
|
||||||
"wasi",
|
"wasi",
|
||||||
]
|
]
|
||||||
|
|
||||||
|
[[package]]
|
||||||
|
name = "getrandom"
|
||||||
|
version = "0.2.0"
|
||||||
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
||||||
|
checksum = "ee8025cf36f917e6a52cce185b7c7177689b838b7ec138364e50cc2277a56cf4"
|
||||||
|
dependencies = [
|
||||||
|
"cfg-if 0.1.10",
|
||||||
|
"libc",
|
||||||
|
"wasi",
|
||||||
|
]
|
||||||
|
|
||||||
[[package]]
|
[[package]]
|
||||||
name = "gimli"
|
name = "gimli"
|
||||||
version = "0.21.0"
|
version = "0.21.0"
|
||||||
|
@ -2862,7 +2884,7 @@ version = "0.7.3"
|
||||||
source = "registry+https://github.com/rust-lang/crates.io-index"
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
||||||
checksum = "6a6b1679d49b24bbfe0c803429aa1874472f50d9b363131f0e89fc356b544d03"
|
checksum = "6a6b1679d49b24bbfe0c803429aa1874472f50d9b363131f0e89fc356b544d03"
|
||||||
dependencies = [
|
dependencies = [
|
||||||
"getrandom",
|
"getrandom 0.1.14",
|
||||||
"libc",
|
"libc",
|
||||||
"rand_chacha 0.2.2",
|
"rand_chacha 0.2.2",
|
||||||
"rand_core 0.5.1",
|
"rand_core 0.5.1",
|
||||||
|
@ -2911,7 +2933,7 @@ version = "0.5.1"
|
||||||
source = "registry+https://github.com/rust-lang/crates.io-index"
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
||||||
checksum = "90bde5296fc891b0cef12a6d03ddccc162ce7b2aff54160af9338f8d40df6d19"
|
checksum = "90bde5296fc891b0cef12a6d03ddccc162ce7b2aff54160af9338f8d40df6d19"
|
||||||
dependencies = [
|
dependencies = [
|
||||||
"getrandom",
|
"getrandom 0.1.14",
|
||||||
]
|
]
|
||||||
|
|
||||||
[[package]]
|
[[package]]
|
||||||
|
@ -3049,7 +3071,7 @@ version = "0.3.4"
|
||||||
source = "registry+https://github.com/rust-lang/crates.io-index"
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
||||||
checksum = "09b23093265f8d200fa7b4c2c76297f47e681c655f6f1285a8780d6a022f7431"
|
checksum = "09b23093265f8d200fa7b4c2c76297f47e681c655f6f1285a8780d6a022f7431"
|
||||||
dependencies = [
|
dependencies = [
|
||||||
"getrandom",
|
"getrandom 0.1.14",
|
||||||
"redox_syscall",
|
"redox_syscall",
|
||||||
"rust-argon2",
|
"rust-argon2",
|
||||||
]
|
]
|
||||||
|
@ -3941,6 +3963,7 @@ dependencies = [
|
||||||
name = "solana-core"
|
name = "solana-core"
|
||||||
version = "1.5.0"
|
version = "1.5.0"
|
||||||
dependencies = [
|
dependencies = [
|
||||||
|
"ahash 0.6.1",
|
||||||
"base64 0.12.3",
|
"base64 0.12.3",
|
||||||
"bincode",
|
"bincode",
|
||||||
"bs58",
|
"bs58",
|
||||||
|
|
|
@ -14,6 +14,7 @@ edition = "2018"
|
||||||
codecov = { repository = "solana-labs/solana", branch = "master", service = "github" }
|
codecov = { repository = "solana-labs/solana", branch = "master", service = "github" }
|
||||||
|
|
||||||
[dependencies]
|
[dependencies]
|
||||||
|
ahash = "0.6.1"
|
||||||
base64 = "0.12.3"
|
base64 = "0.12.3"
|
||||||
bincode = "1.3.1"
|
bincode = "1.3.1"
|
||||||
bv = { version = "0.11.1", features = ["serde"] }
|
bv = { version = "0.11.1", features = ["serde"] }
|
||||||
|
|
|
@ -1,6 +1,10 @@
|
||||||
//! The `shred_fetch_stage` pulls shreds from UDP sockets and sends it to a channel.
|
//! The `shred_fetch_stage` pulls shreds from UDP sockets and sends it to a channel.
|
||||||
|
|
||||||
use bv::BitVec;
|
use ahash::AHasher;
|
||||||
|
use lru::LruCache;
|
||||||
|
use rand::{thread_rng, Rng};
|
||||||
|
use std::hash::Hasher;
|
||||||
|
|
||||||
use solana_ledger::blockstore::MAX_DATA_SHREDS_PER_SLOT;
|
use solana_ledger::blockstore::MAX_DATA_SHREDS_PER_SLOT;
|
||||||
use solana_ledger::shred::{
|
use solana_ledger::shred::{
|
||||||
CODING_SHRED, DATA_SHRED, OFFSET_OF_SHRED_INDEX, OFFSET_OF_SHRED_SLOT, OFFSET_OF_SHRED_TYPE,
|
CODING_SHRED, DATA_SHRED, OFFSET_OF_SHRED_INDEX, OFFSET_OF_SHRED_SLOT, OFFSET_OF_SHRED_TYPE,
|
||||||
|
@ -10,9 +14,8 @@ use solana_perf::cuda_runtime::PinnedVec;
|
||||||
use solana_perf::packet::{limited_deserialize, Packet, PacketsRecycler};
|
use solana_perf::packet::{limited_deserialize, Packet, PacketsRecycler};
|
||||||
use solana_perf::recycler::Recycler;
|
use solana_perf::recycler::Recycler;
|
||||||
use solana_runtime::bank_forks::BankForks;
|
use solana_runtime::bank_forks::BankForks;
|
||||||
use solana_sdk::clock::Slot;
|
use solana_sdk::clock::{Slot, DEFAULT_MS_PER_SLOT};
|
||||||
use solana_streamer::streamer::{self, PacketReceiver, PacketSender};
|
use solana_streamer::streamer::{self, PacketReceiver, PacketSender};
|
||||||
use std::collections::HashMap;
|
|
||||||
use std::net::UdpSocket;
|
use std::net::UdpSocket;
|
||||||
use std::sync::atomic::AtomicBool;
|
use std::sync::atomic::AtomicBool;
|
||||||
use std::sync::mpsc::channel;
|
use std::sync::mpsc::channel;
|
||||||
|
@ -21,7 +24,8 @@ use std::sync::RwLock;
|
||||||
use std::thread::{self, Builder, JoinHandle};
|
use std::thread::{self, Builder, JoinHandle};
|
||||||
use std::time::Instant;
|
use std::time::Instant;
|
||||||
|
|
||||||
pub type ShredsReceived = HashMap<(Slot, u8), BitVec<u64>>;
|
const DEFAULT_LRU_SIZE: usize = 10_000;
|
||||||
|
pub type ShredsReceived = LruCache<u64, ()>;
|
||||||
|
|
||||||
#[derive(Default)]
|
#[derive(Default)]
|
||||||
struct ShredFetchStats {
|
struct ShredFetchStats {
|
||||||
|
@ -73,11 +77,12 @@ impl ShredFetchStage {
|
||||||
last_slot: Slot,
|
last_slot: Slot,
|
||||||
slots_per_epoch: u64,
|
slots_per_epoch: u64,
|
||||||
modify: &F,
|
modify: &F,
|
||||||
|
seeds: (u128, u128),
|
||||||
) where
|
) where
|
||||||
F: Fn(&mut Packet),
|
F: Fn(&mut Packet),
|
||||||
{
|
{
|
||||||
p.meta.discard = true;
|
p.meta.discard = true;
|
||||||
if let Some((slot, index)) = Self::get_slot_index(p, stats) {
|
if let Some((slot, _index)) = Self::get_slot_index(p, stats) {
|
||||||
// Seems reasonable to limit shreds to 2 epochs away
|
// Seems reasonable to limit shreds to 2 epochs away
|
||||||
if slot > last_root
|
if slot > last_root
|
||||||
&& slot < (last_slot + 2 * slots_per_epoch)
|
&& slot < (last_slot + 2 * slots_per_epoch)
|
||||||
|
@ -86,16 +91,15 @@ impl ShredFetchStage {
|
||||||
let shred_type = p.data[OFFSET_OF_SHRED_TYPE];
|
let shred_type = p.data[OFFSET_OF_SHRED_TYPE];
|
||||||
if shred_type == DATA_SHRED || shred_type == CODING_SHRED {
|
if shred_type == DATA_SHRED || shred_type == CODING_SHRED {
|
||||||
// Shred filter
|
// Shred filter
|
||||||
let slot_received =
|
|
||||||
shreds_received
|
let mut hasher = AHasher::new_with_keys(seeds.0, seeds.1);
|
||||||
.entry((slot, shred_type))
|
hasher.write(&p.data[0..p.meta.size]);
|
||||||
.or_insert_with(|| {
|
let hash = hasher.finish();
|
||||||
BitVec::new_fill(false, MAX_DATA_SHREDS_PER_SLOT as u64)
|
|
||||||
});
|
if shreds_received.get(&hash).is_none() {
|
||||||
if !slot_received.get(index.into()) {
|
shreds_received.put(hash, ());
|
||||||
p.meta.discard = false;
|
p.meta.discard = false;
|
||||||
modify(p);
|
modify(p);
|
||||||
slot_received.set(index.into(), true);
|
|
||||||
} else {
|
} else {
|
||||||
stats.duplicate_shred += 1;
|
stats.duplicate_shred += 1;
|
||||||
}
|
}
|
||||||
|
@ -116,8 +120,8 @@ impl ShredFetchStage {
|
||||||
) where
|
) where
|
||||||
F: Fn(&mut Packet),
|
F: Fn(&mut Packet),
|
||||||
{
|
{
|
||||||
let mut shreds_received = ShredsReceived::default();
|
let mut shreds_received = LruCache::new(DEFAULT_LRU_SIZE);
|
||||||
let mut last_cleared = Instant::now();
|
let mut last_updated = Instant::now();
|
||||||
|
|
||||||
// In the case of bank_forks=None, setup to accept any slot range
|
// In the case of bank_forks=None, setup to accept any slot range
|
||||||
let mut last_root = 0;
|
let mut last_root = 0;
|
||||||
|
@ -126,11 +130,13 @@ impl ShredFetchStage {
|
||||||
|
|
||||||
let mut last_stats = Instant::now();
|
let mut last_stats = Instant::now();
|
||||||
let mut stats = ShredFetchStats::default();
|
let mut stats = ShredFetchStats::default();
|
||||||
|
let mut seeds = (thread_rng().gen::<u128>(), thread_rng().gen::<u128>());
|
||||||
|
|
||||||
while let Some(mut p) = recvr.iter().next() {
|
while let Some(mut p) = recvr.iter().next() {
|
||||||
if last_cleared.elapsed().as_millis() > 200 {
|
if last_updated.elapsed().as_millis() as u64 > DEFAULT_MS_PER_SLOT {
|
||||||
|
last_updated = Instant::now();
|
||||||
|
seeds = (thread_rng().gen::<u128>(), thread_rng().gen::<u128>());
|
||||||
shreds_received.clear();
|
shreds_received.clear();
|
||||||
last_cleared = Instant::now();
|
|
||||||
if let Some(bank_forks) = bank_forks.as_ref() {
|
if let Some(bank_forks) = bank_forks.as_ref() {
|
||||||
let bank_forks_r = bank_forks.read().unwrap();
|
let bank_forks_r = bank_forks.read().unwrap();
|
||||||
last_root = bank_forks_r.root();
|
last_root = bank_forks_r.root();
|
||||||
|
@ -150,6 +156,7 @@ impl ShredFetchStage {
|
||||||
last_slot,
|
last_slot,
|
||||||
slots_per_epoch,
|
slots_per_epoch,
|
||||||
&modify,
|
&modify,
|
||||||
|
seeds,
|
||||||
);
|
);
|
||||||
});
|
});
|
||||||
if last_stats.elapsed().as_millis() > 1000 {
|
if last_stats.elapsed().as_millis() > 1000 {
|
||||||
|
@ -215,15 +222,15 @@ impl ShredFetchStage {
|
||||||
) -> Self {
|
) -> Self {
|
||||||
let recycler: PacketsRecycler = Recycler::warmed(100, 1024);
|
let recycler: PacketsRecycler = Recycler::warmed(100, 1024);
|
||||||
|
|
||||||
let tvu_threads = sockets.into_iter().map(|socket| {
|
let (mut tvu_threads, tvu_filter) = Self::packet_modifier(
|
||||||
streamer::receiver(
|
sockets,
|
||||||
socket,
|
|
||||||
&exit,
|
&exit,
|
||||||
sender.clone(),
|
sender.clone(),
|
||||||
recycler.clone(),
|
recycler.clone(),
|
||||||
"shred_fetch_stage",
|
bank_forks.clone(),
|
||||||
)
|
"shred_fetch",
|
||||||
});
|
|_| {},
|
||||||
|
);
|
||||||
|
|
||||||
let (tvu_forwards_threads, fwd_thread_hdl) = Self::packet_modifier(
|
let (tvu_forwards_threads, fwd_thread_hdl) = Self::packet_modifier(
|
||||||
forward_sockets,
|
forward_sockets,
|
||||||
|
@ -239,20 +246,21 @@ impl ShredFetchStage {
|
||||||
vec![repair_socket],
|
vec![repair_socket],
|
||||||
&exit,
|
&exit,
|
||||||
sender.clone(),
|
sender.clone(),
|
||||||
recycler.clone(),
|
recycler,
|
||||||
bank_forks,
|
bank_forks,
|
||||||
"shred_fetch_repair",
|
"shred_fetch_repair",
|
||||||
|p| p.meta.repair = true,
|
|p| p.meta.repair = true,
|
||||||
);
|
);
|
||||||
|
|
||||||
let mut thread_hdls: Vec<_> = tvu_threads
|
tvu_threads.extend(tvu_forwards_threads.into_iter());
|
||||||
.chain(tvu_forwards_threads.into_iter())
|
tvu_threads.extend(repair_receiver.into_iter());
|
||||||
.collect();
|
tvu_threads.push(tvu_filter);
|
||||||
thread_hdls.extend(repair_receiver.into_iter());
|
tvu_threads.push(fwd_thread_hdl);
|
||||||
thread_hdls.push(fwd_thread_hdl);
|
tvu_threads.push(repair_handler);
|
||||||
thread_hdls.push(repair_handler);
|
|
||||||
|
|
||||||
Self { thread_hdls }
|
Self {
|
||||||
|
thread_hdls: tvu_threads,
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
pub fn join(self) -> thread::Result<()> {
|
pub fn join(self) -> thread::Result<()> {
|
||||||
|
@ -271,7 +279,7 @@ mod tests {
|
||||||
#[test]
|
#[test]
|
||||||
fn test_data_code_same_index() {
|
fn test_data_code_same_index() {
|
||||||
solana_logger::setup();
|
solana_logger::setup();
|
||||||
let mut shreds_received = ShredsReceived::default();
|
let mut shreds_received = LruCache::new(DEFAULT_LRU_SIZE);
|
||||||
let mut packet = Packet::default();
|
let mut packet = Packet::default();
|
||||||
let mut stats = ShredFetchStats::default();
|
let mut stats = ShredFetchStats::default();
|
||||||
|
|
||||||
|
@ -279,6 +287,8 @@ mod tests {
|
||||||
let shred = Shred::new_from_data(slot, 3, 0, None, true, true, 0, 0, 0);
|
let shred = Shred::new_from_data(slot, 3, 0, None, true, true, 0, 0, 0);
|
||||||
shred.copy_to_packet(&mut packet);
|
shred.copy_to_packet(&mut packet);
|
||||||
|
|
||||||
|
let seeds = (thread_rng().gen::<u128>(), thread_rng().gen::<u128>());
|
||||||
|
|
||||||
let last_root = 0;
|
let last_root = 0;
|
||||||
let last_slot = 100;
|
let last_slot = 100;
|
||||||
let slots_per_epoch = 10;
|
let slots_per_epoch = 10;
|
||||||
|
@ -290,6 +300,7 @@ mod tests {
|
||||||
last_slot,
|
last_slot,
|
||||||
slots_per_epoch,
|
slots_per_epoch,
|
||||||
&|_p| {},
|
&|_p| {},
|
||||||
|
seeds,
|
||||||
);
|
);
|
||||||
assert!(!packet.meta.discard);
|
assert!(!packet.meta.discard);
|
||||||
|
|
||||||
|
@ -304,6 +315,7 @@ mod tests {
|
||||||
last_slot,
|
last_slot,
|
||||||
slots_per_epoch,
|
slots_per_epoch,
|
||||||
&|_p| {},
|
&|_p| {},
|
||||||
|
seeds,
|
||||||
);
|
);
|
||||||
assert!(!packet.meta.discard);
|
assert!(!packet.meta.discard);
|
||||||
}
|
}
|
||||||
|
@ -311,12 +323,13 @@ mod tests {
|
||||||
#[test]
|
#[test]
|
||||||
fn test_shred_filter() {
|
fn test_shred_filter() {
|
||||||
solana_logger::setup();
|
solana_logger::setup();
|
||||||
let mut shreds_received = ShredsReceived::default();
|
let mut shreds_received = LruCache::new(DEFAULT_LRU_SIZE);
|
||||||
let mut packet = Packet::default();
|
let mut packet = Packet::default();
|
||||||
let mut stats = ShredFetchStats::default();
|
let mut stats = ShredFetchStats::default();
|
||||||
let last_root = 0;
|
let last_root = 0;
|
||||||
let last_slot = 100;
|
let last_slot = 100;
|
||||||
let slots_per_epoch = 10;
|
let slots_per_epoch = 10;
|
||||||
|
let seeds = (thread_rng().gen::<u128>(), thread_rng().gen::<u128>());
|
||||||
// packet size is 0, so cannot get index
|
// packet size is 0, so cannot get index
|
||||||
ShredFetchStage::process_packet(
|
ShredFetchStage::process_packet(
|
||||||
&mut packet,
|
&mut packet,
|
||||||
|
@ -326,6 +339,7 @@ mod tests {
|
||||||
last_slot,
|
last_slot,
|
||||||
slots_per_epoch,
|
slots_per_epoch,
|
||||||
&|_p| {},
|
&|_p| {},
|
||||||
|
seeds,
|
||||||
);
|
);
|
||||||
assert_eq!(stats.index_overrun, 1);
|
assert_eq!(stats.index_overrun, 1);
|
||||||
assert!(packet.meta.discard);
|
assert!(packet.meta.discard);
|
||||||
|
@ -341,6 +355,7 @@ mod tests {
|
||||||
last_slot,
|
last_slot,
|
||||||
slots_per_epoch,
|
slots_per_epoch,
|
||||||
&|_p| {},
|
&|_p| {},
|
||||||
|
seeds,
|
||||||
);
|
);
|
||||||
assert!(packet.meta.discard);
|
assert!(packet.meta.discard);
|
||||||
|
|
||||||
|
@ -353,6 +368,7 @@ mod tests {
|
||||||
last_slot,
|
last_slot,
|
||||||
slots_per_epoch,
|
slots_per_epoch,
|
||||||
&|_p| {},
|
&|_p| {},
|
||||||
|
seeds,
|
||||||
);
|
);
|
||||||
assert!(!packet.meta.discard);
|
assert!(!packet.meta.discard);
|
||||||
|
|
||||||
|
@ -365,6 +381,7 @@ mod tests {
|
||||||
last_slot,
|
last_slot,
|
||||||
slots_per_epoch,
|
slots_per_epoch,
|
||||||
&|_p| {},
|
&|_p| {},
|
||||||
|
seeds,
|
||||||
);
|
);
|
||||||
assert!(packet.meta.discard);
|
assert!(packet.meta.discard);
|
||||||
|
|
||||||
|
@ -380,6 +397,7 @@ mod tests {
|
||||||
last_slot,
|
last_slot,
|
||||||
slots_per_epoch,
|
slots_per_epoch,
|
||||||
&|_p| {},
|
&|_p| {},
|
||||||
|
seeds,
|
||||||
);
|
);
|
||||||
assert!(packet.meta.discard);
|
assert!(packet.meta.discard);
|
||||||
|
|
||||||
|
@ -394,6 +412,7 @@ mod tests {
|
||||||
last_slot,
|
last_slot,
|
||||||
slots_per_epoch,
|
slots_per_epoch,
|
||||||
&|_p| {},
|
&|_p| {},
|
||||||
|
seeds,
|
||||||
);
|
);
|
||||||
assert!(packet.meta.discard);
|
assert!(packet.meta.discard);
|
||||||
}
|
}
|
||||||
|
|
Loading…
Reference in New Issue