use rand::Rng; use eddie::JaroWinkler; use rand::rngs::ThreadRng; use std::time::Duration; use strsim; use natural; use criterion::{ criterion_group, criterion_main, Criterion, }; pub fn jarwin_benchmark(cr: &mut Criterion) { let jarwin = JaroWinkler::new(); let mut group = cr.benchmark_group("jarwin"); for size in &[3, 6, 9, 12, 15] { group.bench_with_input(format!("eddie size={}", size), size, |bench, _| { let mut gen = Generator::new(*size, 2); bench.iter(|| { let (s1, s2) = &gen.next(); jarwin.similarity(s1, s2) }); } ); group.bench_with_input(format!("strsim size={}", size), size, |bench, _| { let mut gen = Generator::new(*size, 2); bench.iter(|| { let (s1, s2) = &gen.next(); strsim::jaro_winkler(s1, s2) }); } ); if *size == 3 { continue; } group.bench_with_input(format!("natural size={}", size), size, |bench, _| { let mut gen = Generator::new(*size, 2); bench.iter(|| { let (s1, s2) = &gen.next(); natural::distance::jaro_winkler_distance(s1, s2) }); } ); } group.finish(); } criterion_group!{ name = benches; config = Criterion::default() .warm_up_time(Duration::from_millis(50)) .measurement_time(Duration::from_millis(200)); targets = jarwin_benchmark } criterion_main!(benches); const GEN_SAMPLE_SIZE: usize = 1000; struct Generator { pub sample: Vec<(String, String)>, rng: ThreadRng, len: usize, edits: usize, chars: Vec, i: usize, } impl Generator { pub fn new(len: usize, edits: usize) -> Generator { let chars = "abcdefghijklmnopqrstuvwxyz".chars().collect(); let rng = rand::thread_rng(); let sample = Vec::with_capacity(GEN_SAMPLE_SIZE); let i = 0; let mut gen = Generator { rng, len, edits, chars, sample, i }; gen.fill(); gen } #[inline] pub fn next<'a>(&'a mut self) -> &'a (String, String) { let i = self.i; if self.i >= self.sample.len() { self.i = 0; } &self.sample[i] } fn fill(&mut self) -> &mut Self { for _ in 0..GEN_SAMPLE_SIZE { let w1 = self.gen_word(); // let w2 = self.gen_word(); let w2 = self.edit(&w1, self.edits); self.sample.push((w1, w2)); } self } fn gen_word(&mut self) -> String { let Generator { rng, chars, len, .. } = self; let mut word: Vec = Vec::with_capacity(*len); for _ in 0..*len { let c = chars[rng.gen_range(0, chars.len()) as usize]; word.push(c); } word.iter().collect() } fn edit(&mut self, _word: &str, edits: usize) -> String { let Generator { rng, chars, .. } = self; let mut word: Vec = _word.chars().collect(); for _ in 0..edits { if word.len() == 0 { break; } let i = rng.gen_range(0, word.len()) as usize; let c = chars[rng.gen_range(0, chars.len()) as usize]; let case = rng.gen_range(0, 3); match case { 0 => { word.insert(i, c); } 1 => { word.remove(i); } 2 => { word[i] = c; } _ => { panic!("Unreachable"); } } } word.iter().collect() } }