aboutsummaryrefslogtreecommitdiff
path: root/src/transducer.rs
blob: 679c7572625a28c4be47b5f7544601c74fffc8e2 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
use fst::Automaton;

use crate::{StateID, DFA};

macro_rules! imp {
    ($ty:ty, $id:ty) => {
        impl<T: AsRef<[$id]>, S: StateID> Automaton for $ty {
            type State = S;

            #[inline]
            fn start(&self) -> S {
                self.start_state()
            }

            #[inline]
            fn is_match(&self, state: &S) -> bool {
                self.is_match_state(*state)
            }

            #[inline]
            fn accept(&self, state: &S, byte: u8) -> S {
                self.next_state(*state, byte)
            }

            #[inline]
            fn can_match(&self, state: &S) -> bool {
                !self.is_dead_state(*state)
            }
        }
    };
}

imp!(crate::dense::DenseDFA<T, S>, S);
imp!(crate::dense::Standard<T, S>, S);
imp!(crate::dense::ByteClass<T, S>, S);
imp!(crate::dense::Premultiplied<T, S>, S);
imp!(crate::dense::PremultipliedByteClass<T, S>, S);
imp!(crate::sparse::SparseDFA<T, S>, u8);
imp!(crate::sparse::Standard<T, S>, u8);
imp!(crate::sparse::ByteClass<T, S>, u8);

#[cfg(test)]
mod tests {
    use bstr::BString;
    use fst::{Automaton, IntoStreamer, Set, Streamer};

    use crate::dense::{self, DenseDFA};
    use crate::sparse::SparseDFA;

    fn search<A: Automaton, D: AsRef<[u8]>>(
        set: &Set<D>,
        aut: A,
    ) -> Vec<BString> {
        let mut stream = set.search(aut).into_stream();

        let mut results = vec![];
        while let Some(key) = stream.next() {
            results.push(BString::from(key));
        }
        results
    }

    #[test]
    fn dense_anywhere() {
        let set =
            Set::from_iter(&["a", "bar", "baz", "wat", "xba", "xbax", "z"])
                .unwrap();
        let dfa = DenseDFA::new("ba.*").unwrap();
        let got = search(&set, &dfa);
        assert_eq!(got, vec!["bar", "baz", "xba", "xbax"]);
    }

    #[test]
    fn dense_anchored() {
        let set =
            Set::from_iter(&["a", "bar", "baz", "wat", "xba", "xbax", "z"])
                .unwrap();
        let dfa = dense::Builder::new().anchored(true).build("ba.*").unwrap();
        let got = search(&set, &dfa);
        assert_eq!(got, vec!["bar", "baz"]);
    }

    #[test]
    fn sparse_anywhere() {
        let set =
            Set::from_iter(&["a", "bar", "baz", "wat", "xba", "xbax", "z"])
                .unwrap();
        let dfa = SparseDFA::new("ba.*").unwrap();
        let got = search(&set, &dfa);
        assert_eq!(got, vec!["bar", "baz", "xba", "xbax"]);
    }

    #[test]
    fn sparse_anchored() {
        let set =
            Set::from_iter(&["a", "bar", "baz", "wat", "xba", "xbax", "z"])
                .unwrap();
        let dfa = dense::Builder::new()
            .anchored(true)
            .build("ba.*")
            .unwrap()
            .to_sparse()
            .unwrap();
        let got = search(&set, &dfa);
        assert_eq!(got, vec!["bar", "baz"]);
    }
}