string_interner/lib.rs
1#![no_std]
2#![doc(html_root_url = "https://docs.rs/crate/string-interner/0.18.0")]
3#![warn(unsafe_op_in_unsafe_fn, clippy::redundant_closure_for_method_calls)]
4
5//! Caches strings efficiently, with minimal memory footprint and associates them with unique symbols.
6//! These symbols allow constant time comparisons and look-ups to the underlying interned strings.
7//!
8//! ### Example: Interning & Symbols
9//!
10//! ```
11//! use string_interner::StringInterner;
12//!
13//! let mut interner = StringInterner::default();
14//! let sym0 = interner.get_or_intern("Elephant");
15//! let sym1 = interner.get_or_intern("Tiger");
16//! let sym2 = interner.get_or_intern("Horse");
17//! let sym3 = interner.get_or_intern("Tiger");
18//! assert_ne!(sym0, sym1);
19//! assert_ne!(sym0, sym2);
20//! assert_ne!(sym1, sym2);
21//! assert_eq!(sym1, sym3); // same!
22//! ```
23//!
24//! ### Example: Creation by `FromIterator`
25//!
26//! ```
27//! # use string_interner::DefaultStringInterner;
28//! let interner = ["Elephant", "Tiger", "Horse", "Tiger"]
29//! .into_iter()
30//! .collect::<DefaultStringInterner>();
31//! ```
32//!
33//! ### Example: Look-up
34//!
35//! ```
36//! # use string_interner::StringInterner;
37//! let mut interner = StringInterner::default();
38//! let sym = interner.get_or_intern("Banana");
39//! assert_eq!(interner.resolve(sym), Some("Banana"));
40//! ```
41//!
42//! ### Example: Iteration
43//!
44//! ```
45//! # use string_interner::{DefaultStringInterner, Symbol};
46//! let interner = <DefaultStringInterner>::from_iter(["Earth", "Water", "Fire", "Air"]);
47//! for (sym, str) in &interner {
48//! println!("{} = {}", sym.to_usize(), str);
49//! }
50//! ```
51//!
52//! ### Example: Use Different Backend
53//!
54//! ```
55//! # use string_interner::StringInterner;
56//! use string_interner::backend::BufferBackend;
57//! type Interner = StringInterner<BufferBackend>;
58//! let mut interner = Interner::new();
59//! let sym1 = interner.get_or_intern("Tiger");
60//! let sym2 = interner.get_or_intern("Horse");
61//! let sym3 = interner.get_or_intern("Tiger");
62//! assert_ne!(sym1, sym2);
63//! assert_eq!(sym1, sym3); // same!
64//! ```
65//!
66//! ### Example: Use Different Backend & Symbol
67//!
68//! ```
69//! # use string_interner::StringInterner;
70//! use string_interner::{backend::BucketBackend, symbol::SymbolU16};
71//! type Interner = StringInterner<BucketBackend<SymbolU16>>;
72//! let mut interner = Interner::new();
73//! let sym1 = interner.get_or_intern("Tiger");
74//! let sym2 = interner.get_or_intern("Horse");
75//! let sym3 = interner.get_or_intern("Tiger");
76//! assert_ne!(sym1, sym2);
77//! assert_eq!(sym1, sym3); // same!
78//! ```
79//!
80//! ## Backends
81//!
82//! The `string_interner` crate provides different backends with different strengths.
83//! The table below compactly shows when to use which backend according to the following
84//! performance characteristics and properties.
85//!
86//! | **Property** | **BucketBackend** | **StringBackend** | **BufferBackend** | | Explanation |
87//! |:-------------|:-----------------:|:-----------------:|:-----------------:|:--|:--|
88//! | Fill | 🤷 | 👍 | ⭐ | | Efficiency of filling an empty string interner. |
89//! | Fill Duplicates | 1) | 1) | 1) | | Efficiency of filling a string interner with strings that are already interned. |
90//! | Resolve | ⭐ | 👍 | 👎 | | Efficiency of resolving a symbol of an interned string. |
91//! | Allocations | 🤷 | 👍 | ⭐ | | The number of allocations performed by the backend. |
92//! | Footprint | 🤷 | 👍 | ⭐ | | The total heap memory consumed by the backend. |
93//! | Iteration | ⭐ | 👍 | 👎 | | Efficiency of iterating over the interned strings. |
94//! | | | | | | |
95//! | Contiguous | ✅ | ✅ | ❌ | | The returned symbols have contiguous values. |
96//! | Stable Refs | ✅ | ❌ | ❌ | | The interned strings have stable references. |
97//! | Static Strings | ✅ | ❌ | ❌ | | Allows to intern `&'static str` without heap allocations. |
98//!
99//! 1. Performance of interning pre-interned string is the same for all backends since
100//! this is implemented in the `StringInterner` front-end via a `HashMap` query for
101//! all `StringInterner` instances.
102//!
103//! ### Legend
104//!
105//! | ⭐ | **best performance** | 👍 | **good performance** | 🤷 | **okay performance** | 👎 | **bad performance** |
106//! |-|-|-|-|-|-|-|-|
107//!
108//! ## When to use which backend?
109//!
110//! ### Bucket Backend
111//!
112//! Given the table above the `BucketBackend` might seem inferior to the other backends.
113//! However, it allows to efficiently intern `&'static str` and avoids deallocations.
114//!
115//! ### String Backend
116//!
117//! Overall the `StringBackend` performs really well and therefore is the backend
118//! that the `StringInterner` uses by default.
119//!
120//! ### Buffer Backend
121//!
122//! The `BufferBackend` is in some sense similar to the `StringBackend` on steroids.
123//! Some operations are even slightly more efficient and it consumes less memory.
124//! However, all this is at the costs of a less efficient resolution of symbols.
125//! Note that the symbols generated by the `BufferBackend` are not contiguous.
126
127extern crate alloc;
128#[cfg(feature = "std")]
129#[macro_use]
130extern crate std;
131
132#[cfg(feature = "serde")]
133mod serde_impl;
134
135pub mod backend;
136mod interner;
137pub mod symbol;
138
139/// A convenience [`StringInterner`] type based on the [`DefaultBackend`].
140#[cfg(feature = "backends")]
141pub type DefaultStringInterner<B = DefaultBackend, H = DefaultHashBuilder> =
142 self::interner::StringInterner<B, H>;
143
144#[cfg(feature = "backends")]
145#[doc(inline)]
146pub use self::backend::DefaultBackend;
147#[doc(inline)]
148pub use self::{
149 interner::StringInterner,
150 symbol::{DefaultSymbol, Symbol},
151};
152
153#[doc(inline)]
154pub use hashbrown::DefaultHashBuilder;