unic_ucd_normal/decomposition.rs
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79
// Copyright 2012-2015 The Rust Project Developers.
// Copyright 2017 The UNIC Project Developers.
//
// See the COPYRIGHT file at the top-level directory of this distribution.
//
// Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or
// http://www.apache.org/licenses/LICENSE-2.0> or the MIT license
// <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your
// option. This file may not be copied, modified, or distributed
// except according to those terms.
use core::ops::FnMut;
use crate::composition::{canonical_decomposition, compatibility_decomposition};
use unic_ucd_hangul::{decompose_syllable, is_syllable};
/// Compute canonical Unicode decomposition for character.
///
/// See [Unicode Standard Annex #15](https://www.unicode.org/reports/tr15/) for more information.
pub fn decompose_canonical<F>(ch: char, mut callback: F)
where
F: FnMut(char),
{
d(ch, &mut callback, false);
}
/// Compute canonical or compatible Unicode decomposition for character.
///
/// See [Unicode Standard Annex #15](https://www.unicode.org/reports/tr15/) for more information.
pub fn decompose_compatible<F>(ch: char, mut callback: F)
where
F: FnMut(char),
{
d(ch, &mut callback, true);
}
// FIXME: This is a workaround, we should use `F` instead of `&mut F`
fn d<F>(ch: char, callback: &mut F, k: bool)
where
F: FnMut(char),
{
// 7-bit ASCII never decomposes
if ch <= '\x7f' {
(*callback)(ch);
return;
}
// Perform decomposition for Hangul
if is_syllable(ch) {
decompose_syllable(ch, callback);
return;
}
// First check the canonical decompositions
if let Some(canon) = canonical_decomposition(ch) {
for x in canon {
d(*x, callback, k);
}
return;
}
// Bottom out if we're not doing compat.
if !k {
(*callback)(ch);
return;
}
// Then check the compatibility decompositions
if let Some(compat) = compatibility_decomposition(ch) {
for x in compat {
d(*x, callback, k);
}
return;
}
// Finally bottom out.
(*callback)(ch);
}