solana/runtime/src/bloom.rs

//! Simple Bloom Filter
use bv::BitVec;
use fnv::FnvHasher;
use rand::{self, Rng};
use serde::{Deserialize, Serialize};
use std::fmt;
use std::{cmp, hash::Hasher, marker::PhantomData};

/// A key type that can be stored in a `Bloom` filter.
///
/// The filter calls `hash_at_index` once for every entry of its `keys`
/// list, passing that entry as `hash_index`, and reduces the returned value
/// to a bit position.
pub trait BloomHashIndex {
    /// Returns a stable hash of `self` for the given `hash_index`.
    ///
    /// The same `(self, hash_index)` pair must always produce the same value.
    /// Implementations should make a best effort to return a distinct hash
    /// for each `hash_index`.
    fn hash_at_index(&self, hash_index: u64) -> u64;
}

/// Bloom filter over keys of type `T`.
///
/// Membership is tracked by setting one bit per entry of `keys` for every
/// added item; an item is reported as present when all of its bits are set.
#[derive(Serialize, Deserialize, Default, Clone, PartialEq, AbiExample)]
pub struct Bloom<T: BloomHashIndex> {
    /// One seed per hash function; each is passed to
    /// `BloomHashIndex::hash_at_index` as the `hash_index`.
    pub keys: Vec<u64>,
    /// The filter's bit array; a hash is reduced modulo `bits.len()` to pick a bit.
    pub bits: BitVec<u64>,
    /// Number of bits currently set: bumped by `add` whenever a bit flips from
    /// unset to set, and reset to zero by `clear`.
    num_bits_set: u64,
    /// Ties the filter to its key type without storing a `T`.
    _phantom: PhantomData<T>,
}

impl<T: BloomHashIndex> fmt::Debug for Bloom<T> {
    /// Prints a compact summary: the number of keys, the number of bits, the
    /// number of set bits, and a preview of at most the first
    /// `MAX_PRINT_BITS` bits (followed by `..` when the filter is longer).
    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
        const MAX_PRINT_BITS: u64 = 10;
        let total_bits = self.bits.len();

        write!(
            f,
            "Bloom {{ keys.len: {} bits.len: {} num_set: {} bits: ",
            self.keys.len(),
            total_bits,
            self.num_bits_set
        )?;

        // Emit the preview one bit at a time so a failing writer stops early.
        let shown = MAX_PRINT_BITS.min(total_bits);
        (0..shown).try_for_each(|i| f.write_str(if self.bits.get(i) { "1" } else { "0" }))?;

        // Mark the preview as truncated when there are more bits than shown.
        if total_bits > MAX_PRINT_BITS {
            f.write_str("..")?;
        }
        f.write_str(" }")
    }
}

/// Opts `Bloom` into the `Sanitize` trait without overriding any of its
/// methods, so whatever defaults the trait provides apply.
///
/// NOTE(review): nothing about the filter is checked here, so a deserialized
/// value may carry an empty `bits` vector, which is not a usable filter.
/// Consider rejecting that case in `sanitize` — confirm against the trait's
/// contract and available error variants.
impl<T> solana_sdk::sanitize::Sanitize for Bloom<T> where T: BloomHashIndex {}

impl<T: BloomHashIndex> Bloom<T> {
    /// Creates an empty filter with `num_bits` bits that uses one hash
    /// function per entry of `keys`.
    ///
    /// A filter with zero bits has no capacity: `add` is a no-op on it and
    /// `contains` reports every key as possibly present.
    pub fn new(num_bits: usize, keys: Vec<u64>) -> Self {
        Bloom {
            keys,
            bits: BitVec::new_fill(false, num_bits as u64),
            num_bits_set: 0,
            _phantom: PhantomData,
        }
    }

    /// Creates a filter sized for `num_items` entries at a target
    /// false-positive rate of `false_rate`.
    ///
    /// The bit count is the optimal size for those parameters, clamped to the
    /// range `1..=max_bits` (at least one bit is always allocated). The number
    /// of hash functions is derived from the clamped bit count, and each one
    /// is seeded with a random `u64` key.
    ///
    /// See https://hur.st/bloomfilter/ for the underlying formulas.
    pub fn random(num_items: usize, false_rate: f64, max_bits: usize) -> Self {
        let m = Self::num_bits(num_items as f64, false_rate);
        let num_bits = cmp::max(1, cmp::min(m as usize, max_bits));
        let num_keys = Self::num_keys(num_bits as f64, num_items as f64) as usize;
        // Fetch the thread-local generator once instead of once per key.
        let mut rng = rand::thread_rng();
        let keys: Vec<u64> = (0..num_keys).map(|_| rng.gen()).collect();
        Self::new(num_bits, keys)
    }

    /// Optimal number of bits `m` for `num_items` entries (`n`) and a
    /// false-positive rate `false_rate` (`p`):
    /// `m = ceil((n * ln p) / ln(1 / 2^(ln 2)))`.
    fn num_bits(num_items: f64, false_rate: f64) -> f64 {
        let n = num_items;
        let p = false_rate;
        ((n * p.ln()) / (1f64 / 2f64.powf(2f64.ln())).ln()).ceil()
    }

    /// Optimal number of hash functions `k` for `num_bits` bits (`m`) and
    /// `num_items` entries (`n`): `k = round((m / n) * ln 2)`, but never less
    /// than one. Returns zero when there are no items.
    fn num_keys(num_bits: f64, num_items: f64) -> f64 {
        let n = num_items;
        let m = num_bits;
        // infinity as usize is zero in rust 1.43 but 2^64-1 in rust 1.45; ensure it's zero here
        if n == 0.0 {
            0.0
        } else {
            1f64.max(((m / n) * 2f64.ln()).round())
        }
    }

    /// Maps `key`, hashed with seed `k`, to a bit index below `bits.len()`.
    ///
    /// Returns 0 instead of dividing by zero when the filter has no bits;
    /// callers must not index `bits` with that value in that case.
    fn pos(&self, key: &T, k: u64) -> u64 {
        key.hash_at_index(k)
            .checked_rem(self.bits.len())
            .unwrap_or(0)
    }

    /// Resets the filter to empty while keeping its size and keys.
    pub fn clear(&mut self) {
        self.bits = BitVec::new_fill(false, self.bits.len());
        self.num_bits_set = 0;
    }

    /// Inserts `key` by setting the bit selected by each hash function.
    ///
    /// Does nothing when the filter has no bits (e.g. a default-constructed
    /// or malformed deserialized filter) rather than panicking.
    pub fn add(&mut self, key: &T) {
        if self.bits.is_empty() {
            return;
        }
        for k in &self.keys {
            let pos = self.pos(key, *k);
            // Only count a bit the first time it flips to set.
            if !self.bits.get(pos) {
                self.num_bits_set += 1;
                self.bits.set(pos, true);
            }
        }
    }

    /// Returns `false` if `key` was definitely never added, `true` if it may
    /// have been (false positives are possible).
    ///
    /// A filter with no keys or no bits cannot rule anything out, so it
    /// reports `true` for every key.
    pub fn contains(&self, key: &T) -> bool {
        if self.bits.is_empty() {
            return true;
        }
        self.keys
            .iter()
            .all(|k| self.bits.get(self.pos(key, *k)))
    }
}

/// Feeds `slice` into an `FnvHasher` created with `hash_index` as its key and
/// returns the resulting 64-bit hash.
fn slice_hash(slice: &[u8], hash_index: u64) -> u64 {
    let mut fnv = FnvHasher::with_key(hash_index);
    Hasher::write(&mut fnv, slice);
    Hasher::finish(&fnv)
}

/// Every type that can be viewed as a byte slice is usable as a filter key:
/// its bytes are hashed with `slice_hash`.
impl<T> BloomHashIndex for T
where
    T: AsRef<[u8]>,
{
    fn hash_at_index(&self, hash_index: u64) -> u64 {
        let bytes: &[u8] = self.as_ref();
        slice_hash(bytes, hash_index)
    }
}

#[cfg(test)]
mod test {
    use super::*;
    use solana_sdk::hash::{hash, Hash};

    /// `random` clamps the bit count and derives the key count from it.
    #[test]
    fn test_bloom_filter() {
        // (num_items, expected number of keys, expected number of bits)
        let cases: [(usize, usize, u64); 3] = [
            // empty
            (0, 0, 1),
            // normal
            (10, 3, 48),
            // saturated
            (100, 1, 100),
        ];
        for &(num_items, expected_keys, expected_bits) in cases.iter() {
            let filter: Bloom<Hash> = Bloom::random(num_items, 0.1, 100);
            assert_eq!(filter.keys.len(), expected_keys);
            assert_eq!(filter.bits.len(), expected_bits);
        }
    }

    /// A key is absent before `add` and present afterwards.
    #[test]
    fn test_add_contains() {
        let mut filter: Bloom<Hash> = Bloom::random(100, 0.1, 100);
        //known keys to avoid false positives in the test
        filter.keys = vec![0, 1, 2, 3];

        for word in &[&b"hello"[..], &b"world"[..]] {
            let key = hash(word);
            assert!(!filter.contains(&key));
            filter.add(&key);
            assert!(filter.contains(&key));
        }
    }

    /// Two independently built filters get different random keys.
    #[test]
    fn test_random() {
        let sorted_keys = || {
            let mut filter: Bloom<Hash> = Bloom::random(10, 0.1, 100);
            filter.keys.sort();
            filter.keys
        };
        let first = sorted_keys();
        let second = sorted_keys();
        assert_ne!(first, second);
    }

    // Bloom filter math in python
    // n number of items
    // p false rate
    // m number of bits
    // k number of keys
    //
    // n = ceil(m / (-k / log(1 - exp(log(p) / k))))
    // p = pow(1 - exp(-k / (m / n)), k)
    // m = ceil((n * log(p)) / log(1 / pow(2, log(2))));
    // k = round((m / n) * log(2));
    #[test]
    fn test_filter_math() {
        // (num_items, false_rate, expected bits)
        let bit_cases = [(100f64, 0.1f64, 480u64), (100f64, 0.01f64, 959u64)];
        for &(items, rate, expected) in bit_cases.iter() {
            assert_eq!(Bloom::<Hash>::num_bits(items, rate) as u64, expected);
        }

        // (num_bits, num_items, expected keys)
        let key_cases = [
            (1000f64, 50f64, 14u64),
            (2000f64, 50f64, 28u64),
            (2000f64, 25f64, 55u64),
            //ensure min keys is 1
            (20f64, 1000f64, 1u64),
        ];
        for &(bits, items, expected) in key_cases.iter() {
            assert_eq!(Bloom::<Hash>::num_keys(bits, items) as u64, expected);
        }
    }

    /// The `Debug` output shows all bits of a short filter and a truncated
    /// preview of a long one.
    #[test]
    fn test_debug() {
        let mut small: Bloom<Hash> = Bloom::new(3, vec![100]);
        small.add(&Hash::default());
        let rendered = format!("{:?}", small);
        assert_eq!(
            rendered,
            "Bloom { keys.len: 1 bits.len: 3 num_set: 1 bits: 001 }"
        );

        let mut large: Bloom<Hash> = Bloom::new(1000, vec![100]);
        large.add(&Hash::default());
        large.add(&hash(&[1, 2]));
        let rendered = format!("{:?}", large);
        assert_eq!(
            rendered,
            "Bloom { keys.len: 1 bits.len: 1000 num_set: 2 bits: 0000000000.. }"
        );
    }
}
Add scalable gossip library (#1546) * Cluster Replicated Data Store Separate the data storage and merge strategy from the network IO boundary. Implement an eager push overlay for transporting recent messages. Simulation shows fast convergence with 20k nodes. 2018-11-15 13:23:26 -08:00			`//! Simple Bloom Filter`
			`use bv::BitVec;`
add bloom benchmarking, perf improvement from Fnv ~= 8X (#2477) * add bloom benchmarking, perf improvement from Fnv ~= 8X * have a look at bits.set() * ignore new benches to pacify CI (solana_upload_perf?) 2019-01-17 18:22:21 -08:00			`use fnv::FnvHasher;`
Add scalable gossip library (#1546) * Cluster Replicated Data Store Separate the data storage and merge strategy from the network IO boundary. Implement an eager push overlay for transporting recent messages. Simulation shows fast convergence with 20k nodes. 2018-11-15 13:23:26 -08:00			`use rand::{self, Rng};`
Move Bank to its own crate Also: * counters.rs to solana_metrics * genesis_block.rs to solana_sdk 2019-02-18 22:26:22 -08:00			`use serde::{Deserialize, Serialize};`
Add custom print for Bloom object (#10971) 2020-07-10 11:53:24 -07:00			`use std::fmt;`
Cleanup runtime use syntax (#8002) 2020-01-28 17:03:20 -08:00			`use std::{cmp, hash::Hasher, marker::PhantomData};`
Add scalable gossip library (#1546) * Cluster Replicated Data Store Separate the data storage and merge strategy from the network IO boundary. Implement an eager push overlay for transporting recent messages. Simulation shows fast convergence with 20k nodes. 2018-11-15 13:23:26 -08:00
bloom for forking (#2431) * bloom for forking * clippy fixes * remove bloom_hash_index 2019-01-15 13:56:54 -08:00			/// Generate a stable hash of `self` for each `hash_index`
			`/// Best effort can be made for uniqueness of each hash.`
			`pub trait BloomHashIndex {`
			`fn hash_at_index(&self, hash_index: u64) -> u64;`
			`}`

Add custom print for Bloom object (#10971) 2020-07-10 11:53:24 -07:00			`#[derive(Serialize, Deserialize, Default, Clone, PartialEq, AbiExample)]`
Add scalable gossip library (#1546) * Cluster Replicated Data Store Separate the data storage and merge strategy from the network IO boundary. Implement an eager push overlay for transporting recent messages. Simulation shows fast convergence with 20k nodes. 2018-11-15 13:23:26 -08:00			`pub struct Bloom<T: BloomHashIndex> {`
			`pub keys: Vec<u64>,`
Create bank snapshots (#4244) * Revert "Revert "Create bank snapshots (#3671)" (#4243)" This reverts commit 81fa69d3471977259d62b88cd5b83b32e9e38219. * keep saved and unsaved copies of status cache * fix format check * bench for status cache serialize * misc cleanup * remove appendvec storage on purge * fix accounts restore * cleanup * Pass snapshot path as args * Fix clippy 2019-05-30 21:31:35 -07:00			`pub bits: BitVec<u64>,`
			`num_bits_set: u64,`
Add scalable gossip library (#1546) * Cluster Replicated Data Store Separate the data storage and merge strategy from the network IO boundary. Implement an eager push overlay for transporting recent messages. Simulation shows fast convergence with 20k nodes. 2018-11-15 13:23:26 -08:00			`_phantom: PhantomData<T>,`
			`}`

Add custom print for Bloom object (#10971) 2020-07-10 11:53:24 -07:00			`impl<T: BloomHashIndex> fmt::Debug for Bloom<T> {`
			`fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {`
			`write!(`
			`f,`
			`"Bloom {{ keys.len: {} bits.len: {} num_set: {} bits: ",`
			`self.keys.len(),`
			`self.bits.len(),`
			`self.num_bits_set`
			`)?;`
			`const MAX_PRINT_BITS: u64 = 10;`
			`for i in 0..std::cmp::min(MAX_PRINT_BITS, self.bits.len()) {`
			`if self.bits.get(i) {`
			`write!(f, "1")?;`
			`} else {`
			`write!(f, "0")?;`
			`}`
			`}`
			`if self.bits.len() > MAX_PRINT_BITS {`
			`write!(f, "..")?;`
			`}`
			`write!(f, " }}")`
			`}`
			`}`

Input values are not sanitized after they are deserialized, making it far too easy for Leo to earn SOL (#9706) * sanitize gossip protocol messages * sanitize transactions * crds protocol sanitize 2020-04-27 11:06:00 -07:00			`impl<T: BloomHashIndex> solana_sdk::sanitize::Sanitize for Bloom<T> {}`

Add scalable gossip library (#1546) * Cluster Replicated Data Store Separate the data storage and merge strategy from the network IO boundary. Implement an eager push overlay for transporting recent messages. Simulation shows fast convergence with 20k nodes. 2018-11-15 13:23:26 -08:00			`impl<T: BloomHashIndex> Bloom<T> {`
bloom for forking (#2431) * bloom for forking * clippy fixes * remove bloom_hash_index 2019-01-15 13:56:54 -08:00			`pub fn new(num_bits: usize, keys: Vec<u64>) -> Self {`
			`let bits = BitVec::new_fill(false, num_bits as u64);`
			`Bloom {`
			`keys,`
			`bits,`
Create bank snapshots (#4244) * Revert "Revert "Create bank snapshots (#3671)" (#4243)" This reverts commit 81fa69d3471977259d62b88cd5b83b32e9e38219. * keep saved and unsaved copies of status cache * fix format check * bench for status cache serialize * misc cleanup * remove appendvec storage on purge * fix accounts restore * cleanup * Pass snapshot path as args * Fix clippy 2019-05-30 21:31:35 -07:00			`num_bits_set: 0,`
Purge Default::default() 2019-02-09 09:20:43 -08:00			`_phantom: PhantomData::default(),`
bloom for forking (#2431) * bloom for forking * clippy fixes * remove bloom_hash_index 2019-01-15 13:56:54 -08:00			`}`
			`}`
Restore blob size fix (#5516) * Revert "Revert "Fix gossip messages growing beyond blob size (#5460)" (#5512)" This reverts commit 97d57d168b12c20c94e6dc8c6b844a06ff97cb06. * Fix Crds filters 2019-08-13 18:04:14 -07:00			/// create filter optimal for num size given the `FALSE_RATE`
Add scalable gossip library (#1546) * Cluster Replicated Data Store Separate the data storage and merge strategy from the network IO boundary. Implement an eager push overlay for transporting recent messages. Simulation shows fast convergence with 20k nodes. 2018-11-15 13:23:26 -08:00			`/// the keys are randomized for picking data out of a collision resistant hash of size`
			/// `keysize` bytes
			`/// https://hur.st/bloomfilter/`
Restore blob size fix (#5516) * Revert "Revert "Fix gossip messages growing beyond blob size (#5460)" (#5512)" This reverts commit 97d57d168b12c20c94e6dc8c6b844a06ff97cb06. * Fix Crds filters 2019-08-13 18:04:14 -07:00			`pub fn random(num_items: usize, false_rate: f64, max_bits: usize) -> Self {`
			`let m = Self::num_bits(num_items as f64, false_rate);`
			`let num_bits = cmp::max(1, cmp::min(m as usize, max_bits));`
			`let num_keys = Self::num_keys(num_bits as f64, num_items as f64) as usize;`
Add scalable gossip library (#1546) * Cluster Replicated Data Store Separate the data storage and merge strategy from the network IO boundary. Implement an eager push overlay for transporting recent messages. Simulation shows fast convergence with 20k nodes. 2018-11-15 13:23:26 -08:00			`let keys: Vec<u64> = (0..num_keys).map(\|_\| rand::thread_rng().gen()).collect();`
bloom for forking (#2431) * bloom for forking * clippy fixes * remove bloom_hash_index 2019-01-15 13:56:54 -08:00			`Self::new(num_bits, keys)`
Add scalable gossip library (#1546) * Cluster Replicated Data Store Separate the data storage and merge strategy from the network IO boundary. Implement an eager push overlay for transporting recent messages. Simulation shows fast convergence with 20k nodes. 2018-11-15 13:23:26 -08:00			`}`
Clippy cleanup for all targets and nighly rust (also support 1.44.0) (#10445) * address warnings from 'rustup run beta cargo clippy --workspace' minor refactoring in: - cli/src/cli.rs - cli/src/offline/blockhash_query.rs - logger/src/lib.rs - runtime/src/accounts_db.rs expect some performance improvement AccountsDB::clean_accounts() * address warnings from 'rustup run beta cargo clippy --workspace --tests' * address warnings from 'rustup run nightly cargo clippy --workspace --all-targets' * rustfmt * fix warning stragglers * properly fix clippy warnings test_vote_subscribe() replace ref-to-arc with ref parameters where arc not cloned * Remove lock around JsonRpcRequestProcessor (#10417) automerge * make ancestors parameter optional to avoid forcing construction of empty hash maps Co-authored-by: Greg Fitzgerald <greg@solana.com> 2020-06-08 17:38:14 -07:00			`fn num_bits(num_items: f64, false_rate: f64) -> f64 {`
Restore blob size fix (#5516) * Revert "Revert "Fix gossip messages growing beyond blob size (#5460)" (#5512)" This reverts commit 97d57d168b12c20c94e6dc8c6b844a06ff97cb06. * Fix Crds filters 2019-08-13 18:04:14 -07:00			`let n = num_items;`
			`let p = false_rate;`
			`((n * p.ln()) / (1f64 / 2f64.powf(2f64.ln())).ln()).ceil()`
			`}`
Clippy cleanup for all targets and nighly rust (also support 1.44.0) (#10445) * address warnings from 'rustup run beta cargo clippy --workspace' minor refactoring in: - cli/src/cli.rs - cli/src/offline/blockhash_query.rs - logger/src/lib.rs - runtime/src/accounts_db.rs expect some performance improvement AccountsDB::clean_accounts() * address warnings from 'rustup run beta cargo clippy --workspace --tests' * address warnings from 'rustup run nightly cargo clippy --workspace --all-targets' * rustfmt * fix warning stragglers * properly fix clippy warnings test_vote_subscribe() replace ref-to-arc with ref parameters where arc not cloned * Remove lock around JsonRpcRequestProcessor (#10417) automerge * make ancestors parameter optional to avoid forcing construction of empty hash maps Co-authored-by: Greg Fitzgerald <greg@solana.com> 2020-06-08 17:38:14 -07:00			`fn num_keys(num_bits: f64, num_items: f64) -> f64 {`
Restore blob size fix (#5516) * Revert "Revert "Fix gossip messages growing beyond blob size (#5460)" (#5512)" This reverts commit 97d57d168b12c20c94e6dc8c6b844a06ff97cb06. * Fix Crds filters 2019-08-13 18:04:14 -07:00			`let n = num_items;`
			`let m = num_bits;`
Clippy cleanup for all targets and nighly rust (also support 1.44.0) (#10445) * address warnings from 'rustup run beta cargo clippy --workspace' minor refactoring in: - cli/src/cli.rs - cli/src/offline/blockhash_query.rs - logger/src/lib.rs - runtime/src/accounts_db.rs expect some performance improvement AccountsDB::clean_accounts() * address warnings from 'rustup run beta cargo clippy --workspace --tests' * address warnings from 'rustup run nightly cargo clippy --workspace --all-targets' * rustfmt * fix warning stragglers * properly fix clippy warnings test_vote_subscribe() replace ref-to-arc with ref parameters where arc not cloned * Remove lock around JsonRpcRequestProcessor (#10417) automerge * make ancestors parameter optional to avoid forcing construction of empty hash maps Co-authored-by: Greg Fitzgerald <greg@solana.com> 2020-06-08 17:38:14 -07:00			`// infinity as usize is zero in rust 1.43 but 2^64-1 in rust 1.45; ensure it's zero here`
			`if n == 0.0 {`
			`0.0`
			`} else {`
			`1f64.max(((m / n) * 2f64.ln()).round())`
			`}`
Restore blob size fix (#5516) * Revert "Revert "Fix gossip messages growing beyond blob size (#5460)" (#5512)" This reverts commit 97d57d168b12c20c94e6dc8c6b844a06ff97cb06. * Fix Crds filters 2019-08-13 18:04:14 -07:00			`}`
Add scalable gossip library (#1546) * Cluster Replicated Data Store Separate the data storage and merge strategy from the network IO boundary. Implement an eager push overlay for transporting recent messages. Simulation shows fast convergence with 20k nodes. 2018-11-15 13:23:26 -08:00			`fn pos(&self, key: &T, k: u64) -> u64 {`
bloom for forking (#2431) * bloom for forking * clippy fixes * remove bloom_hash_index 2019-01-15 13:56:54 -08:00			`key.hash_at_index(k) % self.bits.len()`
			`}`
			`pub fn clear(&mut self) {`
StatusDeque split into separate objects with their own root checkpoint strategy (#2613) Split up StatusDeque into different modules * LastIdQueue tracks last_ids * StatusCache keeps track of signature statuses * StatusCache stores success as a bit in a bloom filter * Overhead for 1m Ok transactions is 4mb in memory * Less concurrency between the objects, last_id and status_cache are read and written to at different points in the pipeline * Each object has its own strategy for merging into the root checkpoint 2019-01-31 06:53:52 -08:00			`self.bits = BitVec::new_fill(false, self.bits.len());`
Create bank snapshots (#4244) * Revert "Revert "Create bank snapshots (#3671)" (#4243)" This reverts commit 81fa69d3471977259d62b88cd5b83b32e9e38219. * keep saved and unsaved copies of status cache * fix format check * bench for status cache serialize * misc cleanup * remove appendvec storage on purge * fix accounts restore * cleanup * Pass snapshot path as args * Fix clippy 2019-05-30 21:31:35 -07:00			`self.num_bits_set = 0;`
Add scalable gossip library (#1546) * Cluster Replicated Data Store Separate the data storage and merge strategy from the network IO boundary. Implement an eager push overlay for transporting recent messages. Simulation shows fast convergence with 20k nodes. 2018-11-15 13:23:26 -08:00			`}`
			`pub fn add(&mut self, key: &T) {`
			`for k in &self.keys {`
			`let pos = self.pos(key, *k);`
Create bank snapshots (#4244) * Revert "Revert "Create bank snapshots (#3671)" (#4243)" This reverts commit 81fa69d3471977259d62b88cd5b83b32e9e38219. * keep saved and unsaved copies of status cache * fix format check * bench for status cache serialize * misc cleanup * remove appendvec storage on purge * fix accounts restore * cleanup * Pass snapshot path as args * Fix clippy 2019-05-30 21:31:35 -07:00			`if !self.bits.get(pos) {`
			`self.num_bits_set += 1;`
			`self.bits.set(pos, true);`
			`}`
Add scalable gossip library (#1546) * Cluster Replicated Data Store Separate the data storage and merge strategy from the network IO boundary. Implement an eager push overlay for transporting recent messages. Simulation shows fast convergence with 20k nodes. 2018-11-15 13:23:26 -08:00			`}`
			`}`
StatusDeque split into separate objects with their own root checkpoint strategy (#2613) Split up StatusDeque into different modules * LastIdQueue tracks last_ids * StatusCache keeps track of signature statuses * StatusCache stores success as a bit in a bloom filter * Overhead for 1m Ok transactions is 4mb in memory * Less concurrency between the objects, last_id and status_cache are read and written to at different points in the pipeline * Each object has its own strategy for merging into the root checkpoint 2019-01-31 06:53:52 -08:00			`pub fn contains(&self, key: &T) -> bool {`
Add scalable gossip library (#1546) * Cluster Replicated Data Store Separate the data storage and merge strategy from the network IO boundary. Implement an eager push overlay for transporting recent messages. Simulation shows fast convergence with 20k nodes. 2018-11-15 13:23:26 -08:00			`for k in &self.keys {`
			`let pos = self.pos(key, *k);`
			`if !self.bits.get(pos) {`
			`return false;`
			`}`
			`}`
			`true`
			`}`
			`}`

bloom for forking (#2431) * bloom for forking * clippy fixes * remove bloom_hash_index 2019-01-15 13:56:54 -08:00			`fn slice_hash(slice: &[u8], hash_index: u64) -> u64 {`
add bloom benchmarking, perf improvement from Fnv ~= 8X (#2477) * add bloom benchmarking, perf improvement from Fnv ~= 8X * have a look at bits.set() * ignore new benches to pacify CI (solana_upload_perf?) 2019-01-17 18:22:21 -08:00			`let mut hasher = FnvHasher::with_key(hash_index);`
			`hasher.write(slice);`
			`hasher.finish()`
bloom for forking (#2431) * bloom for forking * clippy fixes * remove bloom_hash_index 2019-01-15 13:56:54 -08:00			`}`

			`impl<T: AsRef<[u8]>> BloomHashIndex for T {`
			`fn hash_at_index(&self, hash_index: u64) -> u64 {`
			`slice_hash(self.as_ref(), hash_index)`
			`}`
			`}`

Add scalable gossip library (#1546) * Cluster Replicated Data Store Separate the data storage and merge strategy from the network IO boundary. Implement an eager push overlay for transporting recent messages. Simulation shows fast convergence with 20k nodes. 2018-11-15 13:23:26 -08:00			`#[cfg(test)]`
			`mod test {`
			`use super::*;`
Move drone into its own crate 2018-11-16 08:04:46 -08:00			`use solana_sdk::hash::{hash, Hash};`
Add scalable gossip library (#1546) * Cluster Replicated Data Store Separate the data storage and merge strategy from the network IO boundary. Implement an eager push overlay for transporting recent messages. Simulation shows fast convergence with 20k nodes. 2018-11-15 13:23:26 -08:00
			`#[test]`
			`fn test_bloom_filter() {`
			`//empty`
			`let bloom: Bloom<Hash> = Bloom::random(0, 0.1, 100);`
			`assert_eq!(bloom.keys.len(), 0);`
			`assert_eq!(bloom.bits.len(), 1);`

			`//normal`
			`let bloom: Bloom<Hash> = Bloom::random(10, 0.1, 100);`
			`assert_eq!(bloom.keys.len(), 3);`
Restore blob size fix (#5516) * Revert "Revert "Fix gossip messages growing beyond blob size (#5460)" (#5512)" This reverts commit 97d57d168b12c20c94e6dc8c6b844a06ff97cb06. * Fix Crds filters 2019-08-13 18:04:14 -07:00			`assert_eq!(bloom.bits.len(), 48);`
Add scalable gossip library (#1546) * Cluster Replicated Data Store Separate the data storage and merge strategy from the network IO boundary. Implement an eager push overlay for transporting recent messages. Simulation shows fast convergence with 20k nodes. 2018-11-15 13:23:26 -08:00
			`//saturated`
			`let bloom: Bloom<Hash> = Bloom::random(100, 0.1, 100);`
			`assert_eq!(bloom.keys.len(), 1);`
			`assert_eq!(bloom.bits.len(), 100);`
			`}`
			`#[test]`
			`fn test_add_contains() {`
			`let mut bloom: Bloom<Hash> = Bloom::random(100, 0.1, 100);`
Use known keys in the unit test to avoid random false positives. 2018-11-17 20:48:32 -08:00			`//known keys to avoid false positives in the test`
			`bloom.keys = vec![0, 1, 2, 3];`
Add scalable gossip library (#1546) * Cluster Replicated Data Store Separate the data storage and merge strategy from the network IO boundary. Implement an eager push overlay for transporting recent messages. Simulation shows fast convergence with 20k nodes. 2018-11-15 13:23:26 -08:00
			`let key = hash(b"hello");`
			`assert!(!bloom.contains(&key));`
			`bloom.add(&key);`
			`assert!(bloom.contains(&key));`

			`let key = hash(b"world");`
			`assert!(!bloom.contains(&key));`
			`bloom.add(&key);`
			`assert!(bloom.contains(&key));`
			`}`
			`#[test]`
			`fn test_random() {`
			`let mut b1: Bloom<Hash> = Bloom::random(10, 0.1, 100);`
			`let mut b2: Bloom<Hash> = Bloom::random(10, 0.1, 100);`
			`b1.keys.sort();`
			`b2.keys.sort();`
			`assert_ne!(b1.keys, b2.keys);`
			`}`
Restore blob size fix (#5516) * Revert "Revert "Fix gossip messages growing beyond blob size (#5460)" (#5512)" This reverts commit 97d57d168b12c20c94e6dc8c6b844a06ff97cb06. * Fix Crds filters 2019-08-13 18:04:14 -07:00			`// Bloom filter math in python`
			`// n number of items`
			`// p false rate`
			`// m number of bits`
			`// k number of keys`
			`//`
			`// n = ceil(m / (-k / log(1 - exp(log(p) / k))))`
			`// p = pow(1 - exp(-k / (m / n)), k)`
			`// m = ceil((n * log(p)) / log(1 / pow(2, log(2))));`
			`// k = round((m / n) * log(2));`
			`#[test]`
			`fn test_filter_math() {`
			`assert_eq!(Bloom::<Hash>::num_bits(100f64, 0.1f64) as u64, 480u64);`
			`assert_eq!(Bloom::<Hash>::num_bits(100f64, 0.01f64) as u64, 959u64);`
			`assert_eq!(Bloom::<Hash>::num_keys(1000f64, 50f64) as u64, 14u64);`
			`assert_eq!(Bloom::<Hash>::num_keys(2000f64, 50f64) as u64, 28u64);`
			`assert_eq!(Bloom::<Hash>::num_keys(2000f64, 25f64) as u64, 55u64);`
			`//ensure min keys is 1`
			`assert_eq!(Bloom::<Hash>::num_keys(20f64, 1000f64) as u64, 1u64);`
			`}`
Add custom print for Bloom object (#10971) 2020-07-10 11:53:24 -07:00
			`#[test]`
			`fn test_debug() {`
			`let mut b: Bloom<Hash> = Bloom::new(3, vec![100]);`
			`b.add(&Hash::default());`
			`assert_eq!(`
			`format!("{:?}", b),`
			`"Bloom { keys.len: 1 bits.len: 3 num_set: 1 bits: 001 }"`
			`);`

			`let mut b: Bloom<Hash> = Bloom::new(1000, vec![100]);`
			`b.add(&Hash::default());`
			`b.add(&hash(&[1, 2]));`
			`assert_eq!(`
			`format!("{:?}", b),`
			`"Bloom { keys.len: 1 bits.len: 1000 num_set: 2 bits: 0000000000.. }"`
			`);`
			`}`
Add scalable gossip library (#1546) * Cluster Replicated Data Store Separate the data storage and merge strategy from the network IO boundary. Implement an eager push overlay for transporting recent messages. Simulation shows fast convergence with 20k nodes. 2018-11-15 13:23:26 -08:00			`}`