intl_memoizer/lib.rs
1//! This crate contains a memoizer for internationalization formatters. Often it is
2//! expensive (in terms of performance and memory) to construct a formatter, but then
3//! relatively cheap to run the format operation.
4//!
5//! The [IntlMemoizer] is the main struct that creates a per-locale [IntlLangMemoizer].
6
7use std::cell::RefCell;
8use std::collections::hash_map::Entry;
9use std::collections::HashMap;
10use std::hash::Hash;
11use std::rc::{Rc, Weak};
12use unic_langid::LanguageIdentifier;
13
14pub mod concurrent;
15
16/// The trait that needs to be implemented for each intl formatter that needs to be
17/// memoized.
18pub trait Memoizable {
19 /// Type of the arguments that are used to construct the formatter.
20 type Args: 'static + Eq + Hash + Clone;
21
22 /// Type of any errors that can occur during the construction process.
23 type Error;
24
25 /// Construct a formatter. This maps the [`Self::Args`] type to the actual constructor
26 /// for an intl formatter.
27 fn construct(lang: LanguageIdentifier, args: Self::Args) -> Result<Self, Self::Error>
28 where
29 Self: std::marker::Sized;
30}
31
32/// The [`IntlLangMemoizer`] can memoize multiple constructed internationalization
33/// formatters, and their configuration for a single locale. For instance, given "en-US",
34/// a memorizer could retain 3 DateTimeFormat instances, and a PluralRules.
35///
36/// For memoizing with multiple locales, see [`IntlMemoizer`].
37///
38/// # Example
39///
40/// The code example does the following steps:
41///
42/// 1. Create a static counter
43/// 2. Create an `ExampleFormatter`
44/// 3. Implement [`Memoizable`] for `ExampleFormatter`.
45/// 4. Use `IntlLangMemoizer::with_try_get` to run `ExampleFormatter::format`
46/// 5. Demonstrate the memoization using the static counter
47///
48/// ```
49/// use intl_memoizer::{IntlLangMemoizer, Memoizable};
50/// use unic_langid::LanguageIdentifier;
51///
52/// // Create a static counter so that we can demonstrate the side effects of when
53/// // the memoizer re-constructs an API.
54///
55/// static mut INTL_EXAMPLE_CONSTRUCTS: u32 = 0;
56/// fn increment_constructs() {
57/// unsafe {
58/// INTL_EXAMPLE_CONSTRUCTS += 1;
59/// }
60/// }
61///
62/// fn get_constructs_count() -> u32 {
63/// unsafe { INTL_EXAMPLE_CONSTRUCTS }
64/// }
65///
66/// /// Create an example formatter, that doesn't really do anything useful. In a real
67/// /// implementation, this could be a PluralRules or DateTimeFormat struct.
68/// struct ExampleFormatter {
69/// lang: LanguageIdentifier,
70/// /// This is here to show how to initiate the API with an argument.
71/// prefix: String,
72/// }
73///
74/// impl ExampleFormatter {
75/// /// Perform an example format by printing information about the formatter
76/// /// configuration, and the arguments passed into the individual format operation.
77/// fn format(&self, example_string: &str) -> String {
78/// format!(
79/// "{} lang({}) string({})",
80/// self.prefix, self.lang, example_string
81/// )
82/// }
83/// }
84///
85/// /// Multiple classes of structs may be add1ed to the memoizer, with the restriction
86/// /// that they must implement the `Memoizable` trait.
87/// impl Memoizable for ExampleFormatter {
88/// /// The arguments will be passed into the constructor. Here a single `String`
89/// /// will be used as a prefix to the formatting operation.
90/// type Args = (String,);
91///
92/// /// If the constructor is fallible, than errors can be described here.
93/// type Error = ();
94///
95/// /// This function wires together the `Args` and `Error` type to construct
96/// /// the intl API. In our example, there is
97/// fn construct(lang: LanguageIdentifier, args: Self::Args) -> Result<Self, Self::Error> {
98/// // Keep track for example purposes that this was constructed.
99/// increment_constructs();
100///
101/// Ok(Self {
102/// lang,
103/// prefix: args.0,
104/// })
105/// }
106/// }
107///
108/// // The following demonstrates how these structs are actually used with the memoizer.
109///
110/// // Construct a new memoizer.
111/// let lang = "en-US".parse().expect("Failed to parse.");
112/// let memoizer = IntlLangMemoizer::new(lang);
113///
114/// // These arguments are passed into the constructor for `ExampleFormatter`.
115/// let construct_args = (String::from("prefix:"),);
116/// let message1 = "The format operation will run";
117/// let message2 = "ExampleFormatter will be re-used, when a second format is run";
118///
119/// // Run `IntlLangMemoizer::with_try_get`. The name of the method means "with" an
120/// // intl formatter, "try and get" the result. See the method documentation for
121/// // more details.
122///
123/// let result1 = memoizer
124/// .with_try_get::<ExampleFormatter, _, _>(construct_args.clone(), |intl_example| {
125/// intl_example.format(message1)
126/// });
127///
128/// // The memoized instance of `ExampleFormatter` will be re-used.
129/// let result2 = memoizer
130/// .with_try_get::<ExampleFormatter, _, _>(construct_args.clone(), |intl_example| {
131/// intl_example.format(message2)
132/// });
133///
134/// assert_eq!(
135/// result1.unwrap(),
136/// "prefix: lang(en-US) string(The format operation will run)"
137/// );
138/// assert_eq!(
139/// result2.unwrap(),
140/// "prefix: lang(en-US) string(ExampleFormatter will be re-used, when a second format is run)"
141/// );
142/// assert_eq!(
143/// get_constructs_count(),
144/// 1,
145/// "The constructor was only run once."
146/// );
147///
148/// let construct_args = (String::from("re-init:"),);
149///
150/// // Since the constructor args changed, `ExampleFormatter` will be re-constructed.
151/// let result1 = memoizer
152/// .with_try_get::<ExampleFormatter, _, _>(construct_args.clone(), |intl_example| {
153/// intl_example.format(message1)
154/// });
155///
156/// // The memoized instance of `ExampleFormatter` will be re-used.
157/// let result2 = memoizer
158/// .with_try_get::<ExampleFormatter, _, _>(construct_args.clone(), |intl_example| {
159/// intl_example.format(message2)
160/// });
161///
162/// assert_eq!(
163/// result1.unwrap(),
164/// "re-init: lang(en-US) string(The format operation will run)"
165/// );
166/// assert_eq!(
167/// result2.unwrap(),
168/// "re-init: lang(en-US) string(ExampleFormatter will be re-used, when a second format is run)"
169/// );
170/// assert_eq!(
171/// get_constructs_count(),
172/// 2,
173/// "The constructor was invalidated and ran again."
174/// );
175/// ```
176#[derive(Debug)]
177pub struct IntlLangMemoizer {
178 lang: LanguageIdentifier,
179 map: RefCell<type_map::TypeMap>,
180}
181
182impl IntlLangMemoizer {
183 /// Create a new [`IntlLangMemoizer`] that is unique to a specific
184 /// [`LanguageIdentifier`]
185 pub fn new(lang: LanguageIdentifier) -> Self {
186 Self {
187 lang,
188 map: RefCell::new(type_map::TypeMap::new()),
189 }
190 }
191
192 /// `with_try_get` means `with` an internationalization formatter, `try` and `get` a result.
193 /// The (potentially expensive) constructor for the formatter (such as PluralRules or
194 /// DateTimeFormat) will be memoized and only constructed once for a given
195 /// `construct_args`. After that the format operation can be run multiple times
196 /// inexpensively.
197 ///
198 /// The first generic argument `I` must be provided, but the `R` and `U` will be
199 /// deduced by the typing of the `callback` argument that is provided.
200 ///
201 /// I - The memoizable intl object, for instance a `PluralRules` instance. This
202 /// must implement the Memoizable trait.
203 ///
204 /// R - The return result from the callback `U`.
205 ///
206 /// U - The callback function. Takes an instance of `I` as the first parameter and
207 /// returns the R value.
208 pub fn with_try_get<I, R, U>(&self, construct_args: I::Args, callback: U) -> Result<R, I::Error>
209 where
210 Self: Sized,
211 I: Memoizable + 'static,
212 U: FnOnce(&I) -> R,
213 {
214 let mut map = self
215 .map
216 .try_borrow_mut()
217 .expect("Cannot use memoizer reentrantly");
218 let cache = map
219 .entry::<HashMap<I::Args, I>>()
220 .or_insert_with(HashMap::new);
221
222 let e = match cache.entry(construct_args.clone()) {
223 Entry::Occupied(entry) => entry.into_mut(),
224 Entry::Vacant(entry) => {
225 let val = I::construct(self.lang.clone(), construct_args)?;
226 entry.insert(val)
227 }
228 };
229 Ok(callback(e))
230 }
231}
232
233/// [`IntlMemoizer`] is designed to handle lazily-initialized references to
234/// internationalization formatters.
235///
236/// Constructing a new formatter is often expensive in terms of memory and performance,
237/// and the instance is often read-only during its lifetime. The format operations in
238/// comparison are relatively cheap.
239///
240/// Because of this relationship, it can be helpful to memoize the constructors, and
241/// re-use them across multiple format operations. This strategy is used where all
242/// instances of intl APIs such as `PluralRules`, `DateTimeFormat` etc. are memoized
243/// between all `FluentBundle` instances.
244///
245/// # Example
246///
247/// For a more complete example of the memoization, see the [`IntlLangMemoizer`] documentation.
248/// This example provides a higher-level overview.
249///
250/// ```
251/// # use intl_memoizer::{IntlMemoizer, IntlLangMemoizer, Memoizable};
252/// # use unic_langid::LanguageIdentifier;
253/// # use std::rc::Rc;
254/// #
255/// # struct ExampleFormatter {
256/// # lang: LanguageIdentifier,
257/// # prefix: String,
258/// # }
259/// #
260/// # impl ExampleFormatter {
261/// # fn format(&self, example_string: &str) -> String {
262/// # format!(
263/// # "{} lang({}) string({})",
264/// # self.prefix, self.lang, example_string
265/// # )
266/// # }
267/// # }
268/// #
269/// # impl Memoizable for ExampleFormatter {
270/// # type Args = (String,);
271/// # type Error = ();
272/// # fn construct(lang: LanguageIdentifier, args: Self::Args) -> Result<Self, Self::Error> {
273/// # Ok(Self {
274/// # lang,
275/// # prefix: args.0,
276/// # })
277/// # }
278/// # }
279/// #
280/// let mut memoizer = IntlMemoizer::default();
281///
282/// // The memoziation happens per-locale.
283/// let en_us = "en-US".parse().expect("Failed to parse.");
284/// let en_us_memoizer: Rc<IntlLangMemoizer> = memoizer.get_for_lang(en_us);
285///
286/// // These arguments are passed into the constructor for `ExampleFormatter`. The
287/// // construct_args will be used for determining the memoization, but the message
288/// // can be different and re-use the constructed instance.
289/// let construct_args = (String::from("prefix:"),);
290/// let message = "The format operation will run";
291///
292/// // Use the `ExampleFormatter` from the `IntlLangMemoizer` example. It returns a
293/// // string that demonstrates the configuration of the formatter. This step will
294/// // construct a new formatter if needed, and run the format operation.
295/// //
296/// // See `IntlLangMemoizer` for more details on this step.
297/// let en_us_result = en_us_memoizer
298/// .with_try_get::<ExampleFormatter, _, _>(construct_args.clone(), |intl_example| {
299/// intl_example.format(message)
300/// });
301///
302/// // The example formatter constructs a string with diagnostic information about
303/// // the configuration.
304/// assert_eq!(
305/// en_us_result.unwrap(),
306/// "prefix: lang(en-US) string(The format operation will run)"
307/// );
308///
309/// // The process can be repeated for a new locale.
310///
311/// let de_de = "de-DE".parse().expect("Failed to parse.");
312/// let de_de_memoizer: Rc<IntlLangMemoizer> = memoizer.get_for_lang(de_de);
313///
314/// let de_de_result = de_de_memoizer
315/// .with_try_get::<ExampleFormatter, _, _>(construct_args.clone(), |intl_example| {
316/// intl_example.format(message)
317/// });
318///
319/// assert_eq!(
320/// de_de_result.unwrap(),
321/// "prefix: lang(de-DE) string(The format operation will run)"
322/// );
323/// ```
324#[derive(Default)]
325pub struct IntlMemoizer {
326 map: HashMap<LanguageIdentifier, Weak<IntlLangMemoizer>>,
327}
328
329impl IntlMemoizer {
330 /// Get a [`IntlLangMemoizer`] for a given language. If one does not exist for
331 /// a locale, it will be constructed and weakly retained. See [`IntlLangMemoizer`]
332 /// for more detailed documentation how to use it.
333 pub fn get_for_lang(&mut self, lang: LanguageIdentifier) -> Rc<IntlLangMemoizer> {
334 match self.map.entry(lang.clone()) {
335 Entry::Vacant(empty) => {
336 let entry = Rc::new(IntlLangMemoizer::new(lang));
337 empty.insert(Rc::downgrade(&entry));
338 entry
339 }
340 Entry::Occupied(mut entry) => {
341 if let Some(entry) = entry.get().upgrade() {
342 entry
343 } else {
344 let e = Rc::new(IntlLangMemoizer::new(lang));
345 entry.insert(Rc::downgrade(&e));
346 e
347 }
348 }
349 }
350 }
351}
352
353#[cfg(test)]
354mod tests {
355 use super::*;
356 use fluent_langneg::{negotiate_languages, NegotiationStrategy};
357 use intl_pluralrules::{PluralCategory, PluralRuleType, PluralRules as IntlPluralRules};
358 use std::{sync::Arc, thread};
359
360 struct PluralRules(pub IntlPluralRules);
361
362 impl PluralRules {
363 pub fn new(
364 lang: LanguageIdentifier,
365 pr_type: PluralRuleType,
366 ) -> Result<Self, &'static str> {
367 let default_lang: LanguageIdentifier = "en".parse().unwrap();
368 let pr_lang = negotiate_languages(
369 &[lang],
370 &IntlPluralRules::get_locales(pr_type),
371 Some(&default_lang),
372 NegotiationStrategy::Lookup,
373 )[0]
374 .clone();
375
376 Ok(Self(IntlPluralRules::create(pr_lang, pr_type)?))
377 }
378 }
379
380 impl Memoizable for PluralRules {
381 type Args = (PluralRuleType,);
382 type Error = &'static str;
383 fn construct(lang: LanguageIdentifier, args: Self::Args) -> Result<Self, Self::Error> {
384 Self::new(lang, args.0)
385 }
386 }
387
388 #[test]
389 fn test_single_thread() {
390 let lang: LanguageIdentifier = "en".parse().unwrap();
391
392 let mut memoizer = IntlMemoizer::default();
393 {
394 let en_memoizer = memoizer.get_for_lang(lang.clone());
395
396 let result = en_memoizer
397 .with_try_get::<PluralRules, _, _>((PluralRuleType::CARDINAL,), |cb| cb.0.select(5))
398 .unwrap();
399 assert_eq!(result, Ok(PluralCategory::OTHER));
400 }
401
402 {
403 let en_memoizer = memoizer.get_for_lang(lang);
404
405 let result = en_memoizer
406 .with_try_get::<PluralRules, _, _>((PluralRuleType::CARDINAL,), |cb| cb.0.select(5))
407 .unwrap();
408 assert_eq!(result, Ok(PluralCategory::OTHER));
409 }
410 }
411
412 #[test]
413 fn test_concurrent() {
414 let lang: LanguageIdentifier = "en".parse().unwrap();
415 let memoizer = Arc::new(concurrent::IntlLangMemoizer::new(lang));
416 let mut threads = vec![];
417
418 // Spawn four threads that all use the PluralRules.
419 for _ in 0..4 {
420 let memoizer = Arc::clone(&memoizer);
421 threads.push(thread::spawn(move || {
422 memoizer
423 .with_try_get::<PluralRules, _, _>((PluralRuleType::CARDINAL,), |cb| {
424 cb.0.select(5)
425 })
426 .expect("Failed to get a PluralRules result.")
427 }));
428 }
429
430 for thread in threads.drain(..) {
431 let result = thread.join().expect("Failed to join thread.");
432 assert_eq!(result, Ok(PluralCategory::OTHER));
433 }
434 }
435}