ucd_util/
property.rs

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
/// The type of a property name table.
///
/// Each entry pairs a normalized property name (first element) with its
/// canonical property name (second element). Entries are sorted so that the
/// table can be binary searched by normalized name.
pub type PropertyTable = &'static [(&'static str, &'static str)];

/// Look up the canonical name of a property from its normalized name.
///
/// Returns `None` when the table has no entry for the given name.
///
/// The name passed in is expected to already be normalized according to
/// UAX44 LM3; `symbolic_name_normalize` performs that normalization.
pub fn canonical_property_name(
    property_table: PropertyTable,
    normalized_property_name: &str,
) -> Option<&'static str> {
    // Only the first column (the normalized name) takes part in the search.
    let found = property_table
        .binary_search_by(|&(name, _)| name.cmp(normalized_property_name));
    match found {
        Ok(index) => Some(property_table[index].1),
        Err(_) => None,
    }
}

/// Type of a property value table.
///
/// Each entry associates a property name with the mapping of values that
/// property can take. That mapping is itself a sequence of tuples, pairing a
/// normalized property value (first element) with the corresponding
/// canonical property value (second element).
///
/// Only properties that are catalogs, enumerations or binary properties have
/// their values listed here. Properties with string values (such as case or
/// decomposition mappings), numeric values, or miscellaneous properties are
/// not represented in this table.
pub type PropertyValueTable = &'static [(&'static str, PropertyValues)];

/// A mapping of property values for a specific property.
///
/// Every tuple holds a normalized property value followed by the canonical
/// property value it corresponds to.
pub type PropertyValues = &'static [(&'static str, &'static str)];

/// Look up the possible property values of a given property.
///
/// The result is a mapping expressed as a sorted list of tuples, each one
/// holding a normalized property value followed by the corresponding
/// canonical property value.
///
/// Returns `None` when the table has no entry for the given property.
///
/// The property name must be given in its canonical form, which
/// `canonical_property_name` can produce.
pub fn property_values(
    property_value_table: PropertyValueTable,
    canonical_property_name: &str,
) -> Option<PropertyValues> {
    // Search on the property name column only; bail out with `None` on a miss.
    let index = property_value_table
        .binary_search_by(|&(name, _)| name.cmp(canonical_property_name))
        .ok()?;
    Some(property_value_table[index].1)
}

/// Find the canonical property value for the given normalized property
/// value.
///
/// The given property values should correspond to the values for the property
/// under question, which can be found using `property_values`.
///
/// If no such property value exists, then `None` is returned.
///
/// The normalized property value must have been normalized according to
/// UAX44 LM3, which can be done using `symbolic_name_normalize`.
pub fn canonical_property_value(
    property_values: PropertyValues,
    normalized_property_value: &str,
) -> Option<&'static str> {
    // This is cute. The types line up, so why not?
    canonical_property_name(property_values, normalized_property_value)
}

#[cfg(test)]
mod tests {
    use crate::unicode_tables::{
        property_names::PROPERTY_NAMES, property_values::PROPERTY_VALUES,
    };

    use super::{
        canonical_property_name, canonical_property_value, property_values,
    };

    /// Both the abbreviated and the long normalized name resolve to the same
    /// canonical property name, while a name containing a space has no entry.
    #[test]
    fn canonical_property_name_1() {
        let lookup =
            |name: &str| canonical_property_name(PROPERTY_NAMES, name);

        assert_eq!(lookup("gc"), Some("General_Category"));
        assert_eq!(lookup("generalcategory"), Some("General_Category"));
        assert_eq!(lookup("g c"), None);
    }

    /// The `White_Space` property exposes exactly the eight spellings of
    /// its two canonical values.
    #[test]
    fn property_values_1() {
        const EXPECTED: &[(&str, &str)] = &[
            ("f", "No"),
            ("false", "No"),
            ("n", "No"),
            ("no", "No"),
            ("t", "Yes"),
            ("true", "Yes"),
            ("y", "Yes"),
            ("yes", "Yes"),
        ];

        assert_eq!(
            property_values(PROPERTY_VALUES, "White_Space"),
            Some(EXPECTED)
        );
    }

    /// Normalized values map to their canonical form; an upper-case input
    /// has no entry in the mapping.
    #[test]
    fn canonical_property_value_1() {
        let values = property_values(PROPERTY_VALUES, "White_Space").unwrap();

        let cases = [("false", Some("No")), ("t", Some("Yes")), ("F", None)];
        for &(input, expected) in cases.iter() {
            assert_eq!(canonical_property_value(values, input), expected);
        }
    }
}