#[cfg(feature = "levenshtein")] use fst::automaton::Levenshtein; use fst::automaton::{Str, Subsequence}; #[cfg(feature = "levenshtein")] use fst::raw::{Builder, Fst}; use fst::set::Set; use fst::{self, Automaton, IntoStreamer, Streamer}; static WORDS: &'static str = include_str!("../data/words-10000"); fn get_set() -> Set> { Set::from_iter(WORDS.lines()).unwrap() } #[cfg(feature = "levenshtein")] fn fst_set(ss: I) -> Fst> where I: IntoIterator, S: AsRef<[u8]>, { let mut bfst = Builder::memory(); let mut ss: Vec> = ss.into_iter().map(|s| s.as_ref().to_vec()).collect(); ss.sort(); for s in ss.iter().into_iter() { bfst.add(s).unwrap(); } let fst = bfst.into_fst(); ss.dedup(); assert_eq!(fst.len(), ss.len()); fst } #[cfg(feature = "levenshtein")] #[test] fn levenshtein_simple() { let set = fst_set(vec!["woof", "wood", "banana"]); let q = Levenshtein::new("woog", 1).unwrap(); let vs = set.search(&q).into_stream().into_byte_keys(); assert_eq!(vs, vec!["wood".as_bytes(), "woof".as_bytes()]); } #[cfg(feature = "levenshtein")] #[test] fn levenshtein_unicode() { let set = fst_set(vec!["woof", "wood", "banana", "☃snowman☃"]); let q = Levenshtein::new("snoman", 3).unwrap(); let vs = set.search(&q).into_stream().into_byte_keys(); assert_eq!(vs, vec!["☃snowman☃".as_bytes()]); } #[cfg(feature = "levenshtein")] #[test] fn complement_small() { let keys = vec!["fa", "fo", "fob", "focus", "foo", "food", "foul"]; let set = Set::from_iter(keys).unwrap(); let lev = Levenshtein::new("foo", 1).unwrap(); let stream = set.search(lev.complement()).into_stream(); let keys = stream.into_strs().unwrap(); assert_eq!(keys, vec!["fa", "focus", "foul"]); } #[cfg(feature = "levenshtein")] #[test] fn startswith_small() { let keys = vec![ "", "cooing", "fa", "fo", "fob", "focus", "foo", "food", "foul", "fritter", "frothing", ]; let set = Set::from_iter(keys).unwrap(); let lev = Levenshtein::new("foo", 1).unwrap(); let stream = set.search(lev.starts_with()).into_stream(); let keys = stream.into_strs().unwrap(); assert_eq!( keys, vec![ "cooing", "fo", "fob", "focus", "foo", "food", "foul", "frothing", ] ); } #[cfg(feature = "levenshtein")] #[test] fn intersection_small() { let keys = vec!["fab", "fo", "fob", "focus", "foo", "food", "foul", "goo"]; let set = Set::from_iter(keys).unwrap(); let lev = Levenshtein::new("foo", 1).unwrap(); let prefix = Str::new("fo").starts_with(); let stream = set.search(lev.intersection(prefix)).into_stream(); let keys = stream.into_strs().unwrap(); assert_eq!(keys, vec!["fo", "fob", "foo", "food"]); } #[cfg(feature = "levenshtein")] #[test] fn union_small() { let keys = vec!["fab", "fob", "focus", "foo", "food", "goo"]; let set = Set::from_iter(keys).unwrap(); let lev = Levenshtein::new("foo", 1).unwrap(); let prefix = Str::new("fo").starts_with(); let stream = set.search(lev.union(prefix)).into_stream(); let keys = stream.into_strs().unwrap(); assert_eq!(keys, vec!["fob", "focus", "foo", "food", "goo"]); } #[cfg(feature = "levenshtein")] #[test] fn intersection_large() { use fst::set::OpBuilder; let set = get_set(); let lev = Levenshtein::new("foo", 3).unwrap(); let prefix = Str::new("fa").starts_with(); let mut stream1 = set.search((&lev).intersection(&prefix)).into_stream(); let mut stream2 = OpBuilder::new() .add(set.search(&lev)) .add(set.search(&prefix)) .intersection(); while let Some(key1) = stream1.next() { assert_eq!(stream2.next(), Some(key1)); } assert_eq!(stream2.next(), None); } #[cfg(feature = "levenshtein")] #[test] fn union_large() { use fst::set::OpBuilder; let set = get_set(); let lev = Levenshtein::new("foo", 3).unwrap(); let prefix = Str::new("fa").starts_with(); let mut stream1 = set.search((&lev).union(&prefix)).into_stream(); let mut stream2 = OpBuilder::new() .add(set.search(&lev)) .add(set.search(&prefix)) .union(); while let Some(key1) = stream1.next() { assert_eq!(stream2.next(), Some(key1)); } assert_eq!(stream2.next(), None); } #[test] fn str() { let set = get_set(); let exact = Str::new("vatican"); let mut stream = set.search(&exact).into_stream(); assert_eq!(stream.next().unwrap(), b"vatican"); assert_eq!(stream.next(), None); let exact_mismatch = Str::new("abracadabra"); let mut stream = set.search(&exact_mismatch).into_stream(); assert_eq!(stream.next(), None); let starts_with = Str::new("vati").starts_with(); let mut stream = set.search(&starts_with).into_stream(); assert_eq!(stream.next().unwrap(), b"vatican"); assert_eq!(stream.next().unwrap(), b"vation"); assert_eq!(stream.next(), None); } #[test] fn subsequence() { let set = get_set(); let subseq = Subsequence::new("nockbunsurrundd"); let mut stream = set.search(&subseq).into_stream(); assert_eq!(stream.next().unwrap(), b"bannockburnsurrounded"); assert_eq!(stream.next(), None); } #[test] fn implements_default() { let map: fst::Map> = Default::default(); assert!(map.is_empty()); let set: fst::Set> = Default::default(); assert!(set.is_empty()); }