1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104
|
use std::path::Path;
use crate::{common::UcdFile, error::Error};
/// A single row in the `PropertyAliases.txt` file.
#[derive(Clone, Debug, Default, Eq, PartialEq)]
pub struct PropertyAlias {
/// An abbreviation for this property.
pub abbreviation: String,
/// The "long" name of this property.
pub long: String,
/// Additional aliases (if present).
pub aliases: Vec<String>,
}
impl UcdFile for PropertyAlias {
fn relative_file_path() -> &'static Path {
Path::new("PropertyAliases.txt")
}
}
impl std::str::FromStr for PropertyAlias {
type Err = Error;
fn from_str(line: &str) -> Result<PropertyAlias, Error> {
let re_parts = regex!(
r"(?x)
^
\s*(?P<abbrev>[^\s;]+)\s*;
\s*(?P<long>[^\s;]+)\s*
(?:;(?P<aliases>.*))?
",
);
let re_aliases = regex!(r"\s*(?P<alias>[^\s;]+)\s*;?\s*");
let caps = match re_parts.captures(line.trim()) {
Some(caps) => caps,
None => return err!("invalid PropertyAliases line: '{}'", line),
};
let mut aliases = vec![];
if let Some(m) = caps.name("aliases") {
for acaps in re_aliases.captures_iter(m.as_str()) {
let alias = acaps.name("alias").unwrap().as_str();
aliases.push(alias.to_string());
}
}
Ok(PropertyAlias {
abbreviation: caps.name("abbrev").unwrap().as_str().to_string(),
long: caps.name("long").unwrap().as_str().to_string(),
aliases,
})
}
}
#[cfg(test)]
mod tests {
use super::PropertyAlias;
#[test]
fn parse1() {
let line = "cjkAccountingNumeric ; kAccountingNumeric\n";
let row: PropertyAlias = line.parse().unwrap();
assert_eq!(row.abbreviation, "cjkAccountingNumeric");
assert_eq!(row.long, "kAccountingNumeric");
assert!(row.aliases.is_empty());
}
#[test]
fn parse2() {
let line = "nv ; Numeric_Value\n";
let row: PropertyAlias = line.parse().unwrap();
assert_eq!(row.abbreviation, "nv");
assert_eq!(row.long, "Numeric_Value");
assert!(row.aliases.is_empty());
}
#[test]
fn parse3() {
let line =
"scf ; Simple_Case_Folding ; sfc\n";
let row: PropertyAlias = line.parse().unwrap();
assert_eq!(row.abbreviation, "scf");
assert_eq!(row.long, "Simple_Case_Folding");
assert_eq!(row.aliases, vec!["sfc"]);
}
#[test]
fn parse4() {
let line = "cjkRSUnicode ; kRSUnicode ; Unicode_Radical_Stroke; URS\n";
let row: PropertyAlias = line.parse().unwrap();
assert_eq!(row.abbreviation, "cjkRSUnicode");
assert_eq!(row.long, "kRSUnicode");
assert_eq!(row.aliases, vec!["Unicode_Radical_Stroke", "URS"]);
}
#[test]
fn parse5() {
let line = "isc ; ISO_Comment";
let row: PropertyAlias = line.parse().unwrap();
assert_eq!(row.abbreviation, "isc");
assert_eq!(row.long, "ISO_Comment");
assert!(row.aliases.is_empty());
}
}
|