use tempfile::{NamedTempFile, TempDir}; use lmdb::Transaction; use rand::prelude::SliceRandom; use rand::Rng; use std::env::current_dir; use std::fs::OpenOptions; use std::io::{IoSlice, Read, Seek, SeekFrom, Write}; use std::path::Path; use std::time::{Duration, SystemTime}; #[cfg(unix)] use std::{os::unix::io::AsRawFd, ptr, slice}; const ITERATIONS: usize = 3; const KEY_SIZE: usize = 24; const VALUE_SIZE: usize = 2000; const ELEMENTS: usize = 100_000; fn human_readable_bytes(bytes: usize) -> String { if bytes < 1024 { format!("{bytes}B") } else if bytes < 1024 * 1024 { format!("{}KiB", bytes / 1024) } else if bytes < 1024 * 1024 * 1024 { format!("{}MiB", bytes / 1024 / 1024) } else if bytes < 1024 * 1024 * 1024 * 1024 { format!("{}GiB", bytes / 1024 / 1024 / 1024) } else { format!("{}TiB", bytes / 1024 / 1024 / 1024 / 1024) } } fn print_load_time(name: &'static str, duration: Duration) { let throughput = ELEMENTS * (KEY_SIZE + VALUE_SIZE) * 1000 / duration.as_millis() as usize; println!( "{}: Loaded {} items ({}) in {}ms ({}/s)", name, ELEMENTS, human_readable_bytes(ELEMENTS * (KEY_SIZE + VALUE_SIZE)), duration.as_millis(), human_readable_bytes(throughput), ); } /// Returns pairs of key, value fn gen_data(count: usize, key_size: usize, value_size: usize) -> Vec<(Vec, Vec)> { let mut pairs = vec![]; for _ in 0..count { let key: Vec = (0..key_size).map(|_| rand::thread_rng().gen()).collect(); let value: Vec = (0..value_size).map(|_| rand::thread_rng().gen()).collect(); pairs.push((key, value)); } pairs } fn lmdb_bench(path: &Path) { let env = lmdb::Environment::new().open(path).unwrap(); env.set_map_size(4096 * 1024 * 1024).unwrap(); let mut pairs = gen_data(1000, KEY_SIZE, VALUE_SIZE); let pairs_len = pairs.len(); let db = env.open_db(None).unwrap(); { let start = SystemTime::now(); let mut txn = env.begin_rw_txn().unwrap(); { for i in 0..ELEMENTS { let (key, value) = &mut pairs[i % pairs_len]; key[0..8].copy_from_slice(&(i as u64).to_le_bytes()); txn.put(db, &key, &value, lmdb::WriteFlags::empty()) .unwrap(); } } txn.commit().unwrap(); let end = SystemTime::now(); let duration = end.duration_since(start).unwrap(); print_load_time("lmdb-zero", duration); let mut key_order: Vec = (0..ELEMENTS).collect(); key_order.shuffle(&mut rand::thread_rng()); let txn = env.begin_ro_txn().unwrap(); { for _ in 0..ITERATIONS { let start = SystemTime::now(); let mut checksum = 0u64; let mut expected_checksum = 0u64; for &i in &key_order { let (key, value) = &mut pairs[i % pairs_len]; key[0..8].copy_from_slice(&(i as u64).to_le_bytes()); let result: &[u8] = txn.get(db, &key).unwrap(); checksum += result[0] as u64; expected_checksum += value[0] as u64; } assert_eq!(checksum, expected_checksum); let end = SystemTime::now(); let duration = end.duration_since(start).unwrap(); println!( "lmdb: Random read {} items in {}ms", ELEMENTS, duration.as_millis() ); } } } } #[cfg(target_os = "linux")] fn uring_bench(path: &Path) { let mut file = OpenOptions::new() .read(true) .write(true) .create(true) .open(path) .unwrap(); let mut pairs = gen_data(1000, KEY_SIZE, VALUE_SIZE); let pairs_len = pairs.len(); let start = SystemTime::now(); { for i in 0..ELEMENTS { let (key, value) = &mut pairs[i % pairs_len]; key[0..8].copy_from_slice(&(i as u64).to_le_bytes()); let s1 = IoSlice::new(key); let s2 = IoSlice::new(value); assert_eq!( file.write_vectored(&[s1, s2]).unwrap(), key.len() + value.len() ); } } file.sync_all().unwrap(); let end = SystemTime::now(); let duration = end.duration_since(start).unwrap(); print_load_time("uring_read()/write()", duration); let mut key_order: Vec = (0..ELEMENTS).collect(); key_order.shuffle(&mut rand::thread_rng()); { for _ in 0..ITERATIONS { let start = SystemTime::now(); let uring_entries = 10usize; let mut ring = io_uring::IoUring::new(uring_entries as u32).unwrap(); let mut buffers = vec![vec![0u8; VALUE_SIZE]; uring_entries]; let mut checksum = 0u64; let mut expected_checksum = 0u64; for (uring_counter, &i) in key_order.iter().enumerate() { let (key, value) = &mut pairs[i % pairs_len]; key[0..8].copy_from_slice(&(i as u64).to_le_bytes()); let offset = i * (key.len() + value.len()) + key.len(); expected_checksum += value[0] as u64; let buffer_index = uring_counter % uring_entries; let buf = &mut buffers[buffer_index]; let iovec = libc::iovec { iov_base: buf.as_mut_ptr() as *mut libc::c_void, iov_len: buf.len(), }; let read_e = io_uring::opcode::Readv::new(io_uring::types::Fd(file.as_raw_fd()), &iovec, 1) .offset(offset as u64) .build() .user_data(buffer_index as u64); unsafe { ring.submission().push(&read_e).unwrap(); } ring.submit().unwrap(); if uring_counter % uring_entries == (uring_entries - 1) { ring.submit_and_wait(uring_entries).unwrap(); for _ in 0..uring_entries { let cqe = ring.completion().next().unwrap(); checksum += buffers[cqe.user_data() as usize][0] as u64; } } } assert_eq!(checksum, expected_checksum); let end = SystemTime::now(); let duration = end.duration_since(start).unwrap(); println!( "uring_read()/write(): Random read {} items in {}ms", ELEMENTS, duration.as_millis() ); } } } fn readwrite_bench(path: &Path) { let mut file = OpenOptions::new() .read(true) .write(true) .create(true) .open(path) .unwrap(); let mut pairs = gen_data(1000, KEY_SIZE, VALUE_SIZE); let pairs_len = pairs.len(); let start = SystemTime::now(); { for i in 0..ELEMENTS { let (key, value) = &mut pairs[i % pairs_len]; key[0..8].copy_from_slice(&(i as u64).to_le_bytes()); let s1 = IoSlice::new(key); let s2 = IoSlice::new(value); assert_eq!( file.write_vectored(&[s1, s2]).unwrap(), key.len() + value.len() ); } } file.sync_all().unwrap(); let end = SystemTime::now(); let duration = end.duration_since(start).unwrap(); print_load_time("read()/write()", duration); let mut key_order: Vec = (0..ELEMENTS).collect(); key_order.shuffle(&mut rand::thread_rng()); { for _ in 0..ITERATIONS { let start = SystemTime::now(); let mut checksum = 0u64; let mut expected_checksum = 0u64; let mut buffer = vec![0u8; 2000]; for &i in &key_order { let (key, value) = &mut pairs[i % pairs_len]; key[0..8].copy_from_slice(&(i as u64).to_le_bytes()); let offset = i * (key.len() + value.len()) + key.len(); file.seek(SeekFrom::Start(offset as u64)).unwrap(); file.read_exact(&mut buffer).unwrap(); checksum += buffer[0] as u64; expected_checksum += value[0] as u64; } assert_eq!(checksum, expected_checksum); let end = SystemTime::now(); let duration = end.duration_since(start).unwrap(); println!( "read()/write(): Random read {} items in {}ms", ELEMENTS, duration.as_millis() ); } } } #[cfg(unix)] fn mmap_bench(path: &Path) { let file = OpenOptions::new() .read(true) .write(true) .create(true) .open(path) .unwrap(); let len = 4 * 1024 * 1024 * 1024; file.set_len(len).unwrap(); let mmap_raw = unsafe { libc::mmap( ptr::null_mut(), len as libc::size_t, libc::PROT_READ | libc::PROT_WRITE, libc::MAP_SHARED, file.as_raw_fd(), 0, ) }; assert_ne!(mmap_raw, libc::MAP_FAILED); let mmap = unsafe { slice::from_raw_parts_mut(mmap_raw as *mut u8, len as usize) }; let mut pairs = gen_data(1000, KEY_SIZE, VALUE_SIZE); let pairs_len = pairs.len(); let mut write_index = 0; let start = SystemTime::now(); { for i in 0..ELEMENTS { let (key, value) = &mut pairs[i % pairs_len]; key[0..8].copy_from_slice(&(i as u64).to_le_bytes()); mmap[write_index..(write_index + key.len())].copy_from_slice(key); write_index += key.len(); mmap[write_index..(write_index + value.len())].copy_from_slice(value); write_index += value.len(); } } let result = unsafe { libc::msync(mmap_raw, len as libc::size_t, libc::MS_SYNC) }; assert_eq!(result, 0); let end = SystemTime::now(); let duration = end.duration_since(start).unwrap(); print_load_time("mmap()", duration); let mut key_order: Vec = (0..ELEMENTS).collect(); key_order.shuffle(&mut rand::thread_rng()); { for _ in 0..ITERATIONS { let start = SystemTime::now(); let mut checksum = 0u64; let mut expected_checksum = 0u64; for &i in &key_order { let (key, value) = &mut pairs[i % pairs_len]; key[0..8].copy_from_slice(&(i as u64).to_le_bytes()); let offset = i * (key.len() + value.len()) + key.len(); let buffer = &mmap[offset..(offset + value.len())]; checksum += buffer[0] as u64; expected_checksum += value[0] as u64; } assert_eq!(checksum, expected_checksum); let end = SystemTime::now(); let duration = end.duration_since(start).unwrap(); println!( "mmap(): Random read {} items in {}ms", ELEMENTS, duration.as_millis() ); } } } #[cfg(unix)] fn mmap_anon_bench() { let len: usize = 4 * 1024 * 1024 * 1024; let mmap_raw = unsafe { libc::mmap( ptr::null_mut(), len as libc::size_t, libc::PROT_READ | libc::PROT_WRITE, libc::MAP_SHARED | libc::MAP_ANON, 0, 0, ) }; assert_ne!(mmap_raw, libc::MAP_FAILED); let mmap = unsafe { slice::from_raw_parts_mut(mmap_raw as *mut u8, len) }; let mut pairs = gen_data(1000, KEY_SIZE, VALUE_SIZE); let pairs_len = pairs.len(); let mut write_index = 0; let start = SystemTime::now(); { for i in 0..ELEMENTS { let (key, value) = &mut pairs[i % pairs_len]; key[0..8].copy_from_slice(&(i as u64).to_le_bytes()); mmap[write_index..(write_index + key.len())].copy_from_slice(key); write_index += key.len(); mmap[write_index..(write_index + value.len())].copy_from_slice(value); write_index += value.len(); } } let end = SystemTime::now(); let duration = end.duration_since(start).unwrap(); print_load_time("mmap(ANON)", duration); let mut key_order: Vec = (0..ELEMENTS).collect(); key_order.shuffle(&mut rand::thread_rng()); { for _ in 0..ITERATIONS { let start = SystemTime::now(); let mut checksum = 0u64; let mut expected_checksum = 0u64; for &i in &key_order { let (key, value) = &mut pairs[i % pairs_len]; key[0..8].copy_from_slice(&(i as u64).to_le_bytes()); let offset = i * (key.len() + value.len()) + key.len(); let buffer = &mmap[offset..(offset + value.len())]; checksum += buffer[0] as u64; expected_checksum += value[0] as u64; } assert_eq!(checksum, expected_checksum); let end = SystemTime::now(); let duration = end.duration_since(start).unwrap(); println!( "mmap(ANON): Random read {} items in {}ms", ELEMENTS, duration.as_millis() ); } } } fn vec_bench() { let len: usize = 4 * 1024 * 1024 * 1024; let mut mmap = vec![0; len]; let mut pairs = gen_data(1000, KEY_SIZE, VALUE_SIZE); let pairs_len = pairs.len(); let mut write_index = 0; let start = SystemTime::now(); { for i in 0..ELEMENTS { let (key, value) = &mut pairs[i % pairs_len]; key[0..8].copy_from_slice(&(i as u64).to_le_bytes()); mmap[write_index..(write_index + key.len())].copy_from_slice(key); write_index += key.len(); mmap[write_index..(write_index + value.len())].copy_from_slice(value); write_index += value.len(); } } let end = SystemTime::now(); let duration = end.duration_since(start).unwrap(); print_load_time("vec[]", duration); let mut key_order: Vec = (0..ELEMENTS).collect(); key_order.shuffle(&mut rand::thread_rng()); { for _ in 0..ITERATIONS { let start = SystemTime::now(); let mut checksum = 0u64; let mut expected_checksum = 0u64; for &i in &key_order { let (key, value) = &mut pairs[i % pairs_len]; key[0..8].copy_from_slice(&(i as u64).to_le_bytes()); let offset = i * (key.len() + value.len()) + key.len(); let buffer = &mmap[offset..(offset + value.len())]; checksum += buffer[0] as u64; expected_checksum += value[0] as u64; } assert_eq!(checksum, expected_checksum); let end = SystemTime::now(); let duration = end.duration_since(start).unwrap(); println!( "vec[]: Random read {} items in {}ms", ELEMENTS, duration.as_millis() ); } } } fn main() { // Benchmark lmdb against raw read()/write() performance { let tmpfile: TempDir = tempfile::tempdir_in(current_dir().unwrap()).unwrap(); lmdb_bench(tmpfile.path()); } { let tmpfile: NamedTempFile = NamedTempFile::new_in(current_dir().unwrap()).unwrap(); readwrite_bench(tmpfile.path()); } #[cfg(target_os = "linux")] { let tmpfile: NamedTempFile = NamedTempFile::new_in(current_dir().unwrap()).unwrap(); uring_bench(tmpfile.path()); } #[cfg(unix)] { let tmpfile: NamedTempFile = NamedTempFile::new_in(current_dir().unwrap()).unwrap(); mmap_bench(tmpfile.path()); mmap_anon_bench(); } vec_bench(); }