trie_alg/
lib.rs

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
//! # `trie-alg`
//! Implement a trie space optimized for character set in use
//! ```
//! let mut t = trie!();
//! t.add("abc");           // true
//! t.add("abc");           // false
//! t.contains("abc");      // true
//! t.contains("a");        // false
//! 
//! let mut t = multi_trie!();
//! t.add("abc");           // true
//! t.count("abc")          // 1
//! t.add("abc");           // false
//! t.count("abc")          // 2
//! t.contains("abc")       // true
//! t.contains("a")         // false
//! t.count("a")            // 0
//! 
//! struct LowerCaseWithHash();
//! impl CharSet for LowerCaseWithHash {
//!     const SIZE: usize = 27;
//!     fn map(ch: char) -> usize {
//!         if ch.is_ascii_lowercase() {
//!            ch as usize - 'a' as usize 
//!         } else {
//!             26
//!         }
//!     }
//!
//!     fn unmap(hash: usize) -> char {
//!         if hash < 26 {
//!             (b'a'+hash as u8) as char
//!         }else {
//!             '#'
//!         }
//!     }
//! }
//! 
//! let mut t = multi_trie!(LowerCaseWithHash);
//! ```
//! 
//! ## Todo
//! - [ ] Implement error handling for `CharSet` trait
//! - [ ] Implement iterators to iterate over trie
//! - [ ] Implement `delete` method to remove string from trie
//! - [ ] Implement `TrieMap` to store information at the trie node -> MultiTrie will derive from this
//! - [ ] Implement function to count string with given prefix in the trie

#[macro_use]
pub mod trie;

#[cfg(test)]
mod tests {

    use crate::trie::*;

    #[test]
    fn trie_works() {
        let mut t = trie!();
        t.add("abc");
        assert!(t.contains("abc"));
        assert!(!t.contains("a"));
    }

    #[test]
    fn multi_trie_works() {
        let mut t = multi_trie!();
        t.add("abc");
        assert_eq!(t.count("abc"), 1);
        t.add("abc");
        assert_eq!(t.count("abc"), 2);
        assert!(t.contains("abc"));
        assert!(!t.contains("a"));
        assert_eq!(t.count("a"), 0);
    }

    struct LowerCaseWithHash();
    impl CharSet for LowerCaseWithHash {
        const SIZE: usize = 27;
        fn map(ch: char) -> usize {
            if ch.is_ascii_lowercase() {
               ch as usize - 'a' as usize 
            } else {
                26
            }
        }

        fn unmap(hash: usize) -> char {
            if hash < 26 {
                (b'a'+hash as u8) as char
            }else {
                '#'
            }
        }
    }

    #[test]
    fn custom_charset_works(){
        let mut t = multi_trie!(LowerCaseWithHash);
        t.add("abc");
        assert_eq!(t.count("abc"), 1);
        t.add("abc");
        assert_eq!(t.count("abc"), 2);
        t.add("ab#c");
        t.add("ab#c");
        assert_eq!(t.count("ab#c"), 2);
        assert!(t.contains("abc"));
        assert!(!t.contains("a"));
        assert_eq!(t.count("a"), 0);
    }

    #[test]
    fn multi_trie_works_uppercase() {
        let mut t = multi_trie!(charset::UpperCase);
        t.add("ABC");
        assert_eq!(t.count("ABC"), 1);
        t.add("ABC");
        assert_eq!(t.count("ABC"), 2);
        assert!(t.contains("ABC"));
        assert!(!t.contains("A"));
        assert_eq!(t.count("A"), 0);
    }
}