Remove usage of unsafe for Accounts

This commit is contained in:
Sathish Ambley 2019-03-04 22:36:12 -08:00 committed by sakridge
parent fc8489a04d
commit 6e9d803091
4 changed files with 103 additions and 87 deletions

1
Cargo.lock generated
View File

@ -2245,6 +2245,7 @@ version = "0.12.0"
dependencies = [ dependencies = [
"bincode 1.1.2 (registry+https://github.com/rust-lang/crates.io-index)", "bincode 1.1.2 (registry+https://github.com/rust-lang/crates.io-index)",
"bv 0.11.0 (registry+https://github.com/rust-lang/crates.io-index)", "bv 0.11.0 (registry+https://github.com/rust-lang/crates.io-index)",
"byteorder 1.3.1 (registry+https://github.com/rust-lang/crates.io-index)",
"fnv 1.0.6 (registry+https://github.com/rust-lang/crates.io-index)", "fnv 1.0.6 (registry+https://github.com/rust-lang/crates.io-index)",
"hashbrown 0.1.8 (registry+https://github.com/rust-lang/crates.io-index)", "hashbrown 0.1.8 (registry+https://github.com/rust-lang/crates.io-index)",
"libc 0.2.50 (registry+https://github.com/rust-lang/crates.io-index)", "libc 0.2.50 (registry+https://github.com/rust-lang/crates.io-index)",

View File

@ -21,6 +21,12 @@ use test::Bencher;
const START_SIZE: u64 = 4 * 1024 * 1024; const START_SIZE: u64 = 4 * 1024 * 1024;
const INC_SIZE: u64 = 1 * 1024 * 1024; const INC_SIZE: u64 = 1 * 1024 * 1024;
macro_rules! align_up {
($addr: expr, $align: expr) => {
($addr + ($align - 1)) & !($align - 1)
};
}
fn get_append_vec_bench_path(path: &str) -> PathBuf { fn get_append_vec_bench_path(path: &str) -> PathBuf {
let out_dir = env::var("OUT_DIR").unwrap_or_else(|_| "target".to_string()); let out_dir = env::var("OUT_DIR").unwrap_or_else(|_| "target".to_string());
let mut buf = PathBuf::new(); let mut buf = PathBuf::new();
@ -64,19 +70,24 @@ fn append_vec_atomic_random_change(bencher: &mut Bencher) {
let path = get_append_vec_bench_path("bench_rax"); let path = get_append_vec_bench_path("bench_rax");
let mut vec = AppendVec::<AtomicUsize>::new(&path, true, START_SIZE, INC_SIZE); let mut vec = AppendVec::<AtomicUsize>::new(&path, true, START_SIZE, INC_SIZE);
let size = 1_000_000; let size = 1_000_000;
for _ in 0..size { for k in 0..size {
if vec.append(AtomicUsize::new(0)).is_none() { if vec.append(AtomicUsize::new(k)).is_none() {
assert!(vec.grow_file().is_ok()); assert!(vec.grow_file().is_ok());
assert!(vec.append(AtomicUsize::new(0)).is_some()); assert!(vec.append(AtomicUsize::new(k)).is_some());
} }
} }
bencher.iter(|| { bencher.iter(|| {
let index = thread_rng().gen_range(0, size as u64); let index = thread_rng().gen_range(0, size as u64);
let atomic1 = vec.get(index * std::mem::size_of::<AtomicUsize>() as u64); let atomic1 = vec.get(index * std::mem::size_of::<AtomicUsize>() as u64);
let current1 = atomic1.load(Ordering::Relaxed); let current1 = atomic1.load(Ordering::Relaxed);
assert_eq!(current1, index as usize);
let next = current1 + 1; let next = current1 + 1;
atomic1.store(next, Ordering::Relaxed); let mut index = vec.append(AtomicUsize::new(next));
let atomic2 = vec.get(index * std::mem::size_of::<AtomicUsize>() as u64); if index.is_none() {
assert!(vec.grow_file().is_ok());
index = vec.append(AtomicUsize::new(next));
}
let atomic2 = vec.get(index.unwrap());
let current2 = atomic2.load(Ordering::Relaxed); let current2 = atomic2.load(Ordering::Relaxed);
assert_eq!(current2, next); assert_eq!(current2, next);
}); });
@ -191,11 +202,12 @@ fn bench_account_serialize(bencher: &mut Bencher) {
let num: usize = 1000; let num: usize = 1000;
let account = Account::new(2, 100, Keypair::new().pubkey()); let account = Account::new(2, 100, Keypair::new().pubkey());
let len = get_serialized_size(&account); let len = get_serialized_size(&account);
let memory = vec![0; num * len]; let ser_len = align_up!(len + std::mem::size_of::<u64>(), std::mem::size_of::<u64>());
let mut memory = vec![0; num * ser_len];
bencher.iter(|| { bencher.iter(|| {
for i in 0..num { for i in 0..num {
let start = i * len; let start = i * ser_len;
serialize_account(&memory[start..start + len], &account, len); serialize_account(&mut memory[start..start + ser_len], &account, len);
} }
}); });
@ -205,8 +217,8 @@ fn bench_account_serialize(bencher: &mut Bencher) {
println!("memory: {}", memory[index]); println!("memory: {}", memory[index]);
} }
let start = index * len; let start = index * ser_len;
let new_account = deserialize_account(&memory[start..start + len], 0, len + 8).unwrap(); let new_account = deserialize_account(&memory[start..start + ser_len], 0, num * len).unwrap();
assert_eq!(new_account, account); assert_eq!(new_account, account);
} }

View File

@ -11,6 +11,7 @@ edition = "2018"
[dependencies] [dependencies]
bincode = "1.1.2" bincode = "1.1.2"
bv = { version = "0.11.0", features = ["serde"] } bv = { version = "0.11.0", features = ["serde"] }
byteorder = "1.3.1"
fnv = "1.0.6" fnv = "1.0.6"
hashbrown = "0.1.8" hashbrown = "0.1.8"
libc = "0.2.49" libc = "0.2.49"

View File

@ -1,8 +1,9 @@
use memmap::MmapMut; use byteorder::{LittleEndian, ReadBytesExt, WriteBytesExt};
use memmap::{Mmap, MmapMut};
use solana_sdk::account::Account; use solana_sdk::account::Account;
use solana_sdk::pubkey::Pubkey; use solana_sdk::pubkey::Pubkey;
use std::fs::{File, OpenOptions}; use std::fs::{File, OpenOptions};
use std::io::{Error, ErrorKind, Result, Seek, SeekFrom, Write}; use std::io::{Error, ErrorKind, Read, Result, Seek, SeekFrom, Write};
use std::marker::PhantomData; use std::marker::PhantomData;
use std::mem; use std::mem;
use std::path::Path; use std::path::Path;
@ -11,64 +12,62 @@ use std::sync::Mutex;
const SIZEOF_U64: usize = mem::size_of::<u64>(); const SIZEOF_U64: usize = mem::size_of::<u64>();
macro_rules! align_up {
($addr: expr, $align: expr) => {
($addr + ($align - 1)) & !($align - 1)
};
}
pub struct AppendVec<T> { pub struct AppendVec<T> {
data: File, data: File,
map: MmapMut, mmap: Mmap,
current_offset: AtomicUsize, current_offset: AtomicUsize,
append_lock: Mutex<()>, mmap_mut: Mutex<MmapMut>,
file_size: u64, file_size: u64,
inc_size: u64, inc_size: u64,
phantom: PhantomData<T>, phantom: PhantomData<T>,
} }
fn get_account_size_static() -> usize { fn get_account_size_static() -> usize {
mem::size_of::<u64>() mem::size_of::<Account>() - mem::size_of::<Vec<u8>>()
+ mem::size_of::<Pubkey>()
+ mem::size_of::<bool>()
+ mem::size_of::<Pubkey>()
} }
pub fn get_serialized_size(account: &Account) -> usize { pub fn get_serialized_size(account: &Account) -> usize {
get_account_size_static() + account.userdata.len() get_account_size_static() + account.userdata.len()
} }
pub fn serialize_account(dst_slice: &[u8], account: &Account, len: usize) { pub fn serialize_account(dst_slice: &mut [u8], account: &Account, len: usize) {
let mut at = 0; let mut at = 0;
write_object_unaligned(&mut at, dst_slice, len); write_u64(&mut at, dst_slice, len as u64);
write_object_unaligned(&mut at, dst_slice, account.tokens); write_u64(&mut at, dst_slice, account.tokens);
write_bytes(&mut at, dst_slice, &account.userdata);
let data = &dst_slice[at..at + account.userdata.len()]; write_bytes(&mut at, dst_slice, account.owner.as_ref());
let dst = data.as_ptr() as *mut u8; write_bytes(&mut at, dst_slice, &[account.executable as u8]);
let data = &account.userdata[0..account.userdata.len()];
let src = data.as_ptr();
unsafe {
std::ptr::copy_nonoverlapping(src, dst, account.userdata.len());
}
at += account.userdata.len();
write_object(&mut at, dst_slice, account.owner);
write_object(&mut at, dst_slice, account.executable);
} }
fn write_object_unaligned<X: Sized>(at: &mut usize, dst_slice: &[u8], value: X) { fn read_bytes(at: &mut usize, dst_slice: &mut [u8], src_slice: &[u8], len: usize) {
let data = &dst_slice[*at..*at + mem::size_of::<X>()]; let data = &src_slice[*at..*at + len];
#[allow(clippy::cast_ptr_alignment)] (&data[..]).read_exact(&mut dst_slice[..]).unwrap();
let ptr = data.as_ptr() as *mut X; *at += len;
unsafe {
std::ptr::write_unaligned(ptr, value);
}
*at += mem::size_of::<X>();
} }
fn write_object<X: Sized>(at: &mut usize, dst_slice: &[u8], value: X) { fn write_bytes(at: &mut usize, dst_slice: &mut [u8], src_slice: &[u8]) {
let data = &dst_slice[*at..*at + mem::size_of::<X>()]; let data = &mut dst_slice[*at..*at + src_slice.len()];
#[allow(clippy::cast_ptr_alignment)] (&mut data[..]).write_all(&src_slice).unwrap();
let ptr = data.as_ptr() as *mut X; *at += src_slice.len();
unsafe { }
std::ptr::write(ptr, value);
} fn read_u64(at: &mut usize, src_slice: &[u8]) -> u64 {
*at += mem::size_of::<X>(); let data = &src_slice[*at..*at + mem::size_of::<u64>()];
*at += mem::size_of::<u64>();
(&data[..]).read_u64::<LittleEndian>().unwrap()
}
fn write_u64(at: &mut usize, dst_slice: &mut [u8], value: u64) {
let data = &mut dst_slice[*at..*at + mem::size_of::<u64>()];
(&mut data[..]).write_u64::<LittleEndian>(value).unwrap();
*at += mem::size_of::<u64>();
} }
pub fn deserialize_account( pub fn deserialize_account(
@ -77,30 +76,24 @@ pub fn deserialize_account(
current_offset: usize, current_offset: usize,
) -> Result<Account> { ) -> Result<Account> {
let mut at = index; let mut at = index;
let data = &src_slice[at..(at + mem::size_of::<u64>())];
#[allow(clippy::cast_ptr_alignment)]
let size: u64 = unsafe { std::ptr::read_unaligned(data.as_ptr() as *const _) };
let len = size as usize;
at += SIZEOF_U64 as usize;
let size = read_u64(&mut at, &src_slice);
let len = size as usize;
assert!(current_offset >= at + len); assert!(current_offset >= at + len);
let data = &src_slice[at..(at + mem::size_of::<u64>())]; let tokens = read_u64(&mut at, &src_slice);
#[allow(clippy::cast_ptr_alignment)]
let tokens: u64 = unsafe { std::ptr::read_unaligned(data.as_ptr() as *const _) };
at += mem::size_of::<u64>();
let userdata_len = len - get_account_size_static(); let userdata_len = len - get_account_size_static();
let mut userdata = vec![]; let mut userdata = vec![0; userdata_len];
userdata.extend_from_slice(&src_slice[at..at + userdata_len]); read_bytes(&mut at, &mut userdata, &src_slice, userdata_len);
at += userdata_len;
let data = &src_slice[at..(at + mem::size_of::<Pubkey>())]; let mut pubkey = vec![0; mem::size_of::<Pubkey>()];
let owner: Pubkey = unsafe { std::ptr::read(data.as_ptr() as *const _) }; read_bytes(&mut at, &mut pubkey, &src_slice, mem::size_of::<Pubkey>());
at += mem::size_of::<Pubkey>(); let owner = Pubkey::new(&pubkey);
let data = &src_slice[at..(at + mem::size_of::<bool>())]; let mut exec = vec![0; mem::size_of::<bool>()];
let executable: bool = unsafe { std::ptr::read(data.as_ptr() as *const _) }; read_bytes(&mut at, &mut exec, &src_slice, mem::size_of::<bool>());
let executable: bool = exec[0] != 0;
Ok(Account { Ok(Account {
tokens, tokens,
@ -126,13 +119,14 @@ where
data.write_all(&[0]).unwrap(); data.write_all(&[0]).unwrap();
data.seek(SeekFrom::Start(0)).unwrap(); data.seek(SeekFrom::Start(0)).unwrap();
data.flush().unwrap(); data.flush().unwrap();
let map = unsafe { MmapMut::map_mut(&data).expect("failed to map the data file") }; let mmap = unsafe { Mmap::map(&data).expect("failed to map the data file") };
let mmap_mut = unsafe { MmapMut::map_mut(&data).expect("failed to map the data file") };
AppendVec { AppendVec {
data, data,
map, mmap,
current_offset: AtomicUsize::new(0), current_offset: AtomicUsize::new(0),
append_lock: Mutex::new(()), mmap_mut: Mutex::new(mmap_mut),
file_size: size, file_size: size,
inc_size: inc, inc_size: inc,
phantom: PhantomData, phantom: PhantomData,
@ -140,7 +134,7 @@ where
} }
pub fn reset(&mut self) { pub fn reset(&mut self) {
let _append_lock = self.append_lock.lock().unwrap(); let _mmap_mut = self.mmap_mut.lock().unwrap();
self.current_offset.store(0, Ordering::Relaxed); self.current_offset.store(0, Ordering::Relaxed);
} }
@ -149,7 +143,7 @@ where
let offset = self.current_offset.load(Ordering::Relaxed); let offset = self.current_offset.load(Ordering::Relaxed);
let at = index as usize; let at = index as usize;
assert!(offset >= at + mem::size_of::<T>()); assert!(offset >= at + mem::size_of::<T>());
let data = &self.map[at..at + mem::size_of::<T>()]; let data = &self.mmap[at..at + mem::size_of::<T>()];
let ptr = data.as_ptr() as *const T; let ptr = data.as_ptr() as *const T;
let x: Option<&T> = unsafe { ptr.as_ref() }; let x: Option<&T> = unsafe { ptr.as_ref() };
x.unwrap() x.unwrap()
@ -160,33 +154,33 @@ where
if self.inc_size == 0 { if self.inc_size == 0 {
return Err(Error::new(ErrorKind::WriteZero, "Grow not supported")); return Err(Error::new(ErrorKind::WriteZero, "Grow not supported"));
} }
let _append_lock = self.append_lock.lock().unwrap(); let mut mmap_mut = self.mmap_mut.lock().unwrap();
let index = self.current_offset.load(Ordering::Relaxed) + mem::size_of::<T>(); let index = self.current_offset.load(Ordering::Relaxed) + mem::size_of::<T>();
if index as u64 + self.inc_size < self.file_size { if index as u64 + self.inc_size < self.file_size {
// grow was already called // grow was already called
return Ok(()); return Ok(());
} }
let end = self.file_size + self.inc_size; let end = self.file_size + self.inc_size;
drop(self.map.to_owned()); drop(mmap_mut.to_owned());
drop(self.mmap.to_owned());
self.data.seek(SeekFrom::Start(end))?; self.data.seek(SeekFrom::Start(end))?;
self.data.write_all(&[0])?; self.data.write_all(&[0])?;
self.data.seek(SeekFrom::Start(0))?; self.mmap = unsafe { Mmap::map(&self.data)? };
self.data.flush()?; *mmap_mut = unsafe { MmapMut::map_mut(&self.data)? };
self.map = unsafe { MmapMut::map_mut(&self.data)? };
self.file_size = end; self.file_size = end;
Ok(()) Ok(())
} }
#[allow(dead_code)] #[allow(dead_code)]
pub fn append(&self, val: T) -> Option<u64> { pub fn append(&self, val: T) -> Option<u64> {
let _append_lock = self.append_lock.lock().unwrap(); let mmap_mut = self.mmap_mut.lock().unwrap();
let index = self.current_offset.load(Ordering::Relaxed); let index = self.current_offset.load(Ordering::Relaxed);
if (self.file_size as usize) < index + mem::size_of::<T>() { if (self.file_size as usize) < index + mem::size_of::<T>() {
return None; return None;
} }
let data = &self.map[index..(index + mem::size_of::<T>())]; let data = &mmap_mut[index..(index + mem::size_of::<T>())];
unsafe { unsafe {
let ptr = data.as_ptr() as *mut T; let ptr = data.as_ptr() as *mut T;
std::ptr::write(ptr, val) std::ptr::write(ptr, val)
@ -199,25 +193,32 @@ where
pub fn get_account(&self, index: u64) -> Result<Account> { pub fn get_account(&self, index: u64) -> Result<Account> {
let index = index as usize; let index = index as usize;
deserialize_account( deserialize_account(
&self.map[..], &self.mmap[..],
index, index,
self.current_offset.load(Ordering::Relaxed), self.current_offset.load(Ordering::Relaxed),
) )
} }
pub fn append_account(&self, account: &Account) -> Option<u64> { pub fn append_account(&self, account: &Account) -> Option<u64> {
let _append_lock = self.append_lock.lock().unwrap(); let mut mmap_mut = self.mmap_mut.lock().unwrap();
let data_at = self.current_offset.load(Ordering::Relaxed); let data_at = align_up!(
self.current_offset.load(Ordering::Relaxed),
mem::size_of::<u64>()
);
let len = get_serialized_size(account); let len = get_serialized_size(account);
if (self.file_size as usize) < data_at + len + SIZEOF_U64 { if (self.file_size as usize) < data_at + len + SIZEOF_U64 {
return None; return None;
} }
serialize_account(&self.map[data_at..data_at + len], account, len); serialize_account(
&mut mmap_mut[data_at..data_at + len + SIZEOF_U64],
&account,
len,
);
self.current_offset self.current_offset
.fetch_add(len + SIZEOF_U64, Ordering::Relaxed); .store(data_at + len + SIZEOF_U64, Ordering::Relaxed);
Some(data_at as u64) Some(data_at as u64)
} }
} }
@ -337,17 +338,18 @@ pub mod tests {
let path = Path::new("random"); let path = Path::new("random");
let mut vec = AppendVec::<AtomicUsize>::new(path, true, START_SIZE, INC_SIZE); let mut vec = AppendVec::<AtomicUsize>::new(path, true, START_SIZE, INC_SIZE);
let size = 1_000; let size = 1_000;
for _ in 0..size { for k in 0..size {
if vec.append(AtomicUsize::new(0)).is_none() { if vec.append(AtomicUsize::new(k)).is_none() {
assert!(vec.grow_file().is_ok()); assert!(vec.grow_file().is_ok());
assert!(vec.append(AtomicUsize::new(0)).is_some()); assert!(vec.append(AtomicUsize::new(0)).is_some());
} }
} }
let index = thread_rng().gen_range(0, size as u64); let index = thread_rng().gen_range(0, size as u64);
let atomic1 = vec.get(index); let atomic1 = vec.get(index * mem::size_of::<AtomicUsize>() as u64);
let current1 = atomic1.load(Ordering::Relaxed); let current1 = atomic1.load(Ordering::Relaxed);
assert_eq!(current1, index as usize);
let next = current1 + 1; let next = current1 + 1;
atomic1.store(next, Ordering::Relaxed); let index = vec.append(AtomicUsize::new(next)).unwrap();
let atomic2 = vec.get(index); let atomic2 = vec.get(index);
let current2 = atomic2.load(Ordering::Relaxed); let current2 = atomic2.load(Ordering::Relaxed);
assert_eq!(current2, next); assert_eq!(current2, next);