mirror of
https://github.com/crate-ci/typos.git
synced 2025-01-12 01:31:26 -05:00
112 lines
2.9 KiB
Rust
112 lines
2.9 KiB
Rust
use std::collections::HashMap;
|
|
|
|
/// Raw text of `../assets/words.go`, embedded into the binary at compile time.
///
/// `generate` hands this string to `parse_dict`, which extracts the word tables from it.
pub const DICT: &str = include_str!("../assets/words.go");
|
|
|
|
/// Regenerates the dictionary source in memory and compares it against the
/// checked-in `../src/dict_codegen.rs` snapshot.
#[test]
fn codegen() {
    // Render into an in-memory buffer rather than touching the file system.
    let mut buffer = Vec::new();
    generate(&mut buffer);

    // The generator only emits text, so invalid UTF-8 here is a bug.
    let rendered = String::from_utf8(buffer).unwrap();
    let formatted = codegenrs::rustfmt(&rendered, None).unwrap();

    snapbox::assert_data_eq!(formatted, snapbox::file!["../src/dict_codegen.rs"].raw());
}
|
|
|
|
fn generate<W: std::io::Write>(file: &mut W) {
|
|
writeln!(
|
|
file,
|
|
"// This file is @generated by {}",
|
|
file!().replace('\\', "/")
|
|
)
|
|
.unwrap();
|
|
writeln!(file).unwrap();
|
|
|
|
let Words {
|
|
main,
|
|
american,
|
|
british,
|
|
} = parse_dict(DICT);
|
|
|
|
dictgen::DictGen::new()
|
|
.name("MAIN_DICTIONARY")
|
|
.value_type("&[&str]")
|
|
.ordered_map()
|
|
.write(
|
|
file,
|
|
main.into_iter().map(|kv| (kv.0, format!("&{:?}", kv.1))),
|
|
)
|
|
.unwrap();
|
|
|
|
dictgen::DictGen::new()
|
|
.name("AMERICAN_DICTIONARY")
|
|
.value_type("&[&str]")
|
|
.ordered_map()
|
|
.write(
|
|
file,
|
|
american
|
|
.into_iter()
|
|
.map(|kv| (kv.0, format!("&{:?}", kv.1))),
|
|
)
|
|
.unwrap();
|
|
|
|
dictgen::DictGen::new()
|
|
.name("BRITISH_DICTIONARY")
|
|
.value_type("&[&str]")
|
|
.ordered_map()
|
|
.write(
|
|
file,
|
|
british.into_iter().map(|kv| (kv.0, format!("&{:?}", kv.1))),
|
|
)
|
|
.unwrap();
|
|
}
|
|
|
|
/// Word tables extracted by `parse_dict`, borrowing from the parsed text.
///
/// Each map goes from the first quoted string on an entry line to a
/// one-element list holding the second quoted string (presumably
/// misspelling -> correction; confirm against the upstream word list).
struct Words<'s> {
    /// Entries read while the `DictMain` section was active.
    main: HashMap<&'s str, Vec<&'s str>>,
    /// Entries read while the `DictAmerican` section was active.
    american: HashMap<&'s str, Vec<&'s str>>,
    /// Entries read while the `DictBritish` section was active.
    british: HashMap<&'s str, Vec<&'s str>>,
}
|
|
|
|
fn parse_dict(raw: &str) -> Words<'_> {
|
|
let mut bad = HashMap::new();
|
|
let mut main = HashMap::new();
|
|
let mut american = HashMap::new();
|
|
let mut british = HashMap::new();
|
|
|
|
let mapping = regex::Regex::new(r#"^"(.*)", "(.*)",$"#).unwrap();
|
|
|
|
let mut current = &mut bad;
|
|
for line in raw.lines() {
|
|
let line = line.split_once("//").map(|l| l.0).unwrap_or(line).trim();
|
|
if line.is_empty() || line.starts_with("package") {
|
|
continue;
|
|
} else if line.contains("DictMain") {
|
|
current = &mut main;
|
|
} else if line.contains("DictAmerican") {
|
|
current = &mut american;
|
|
} else if line.contains("DictBritish") {
|
|
current = &mut british;
|
|
} else if line.contains('}') {
|
|
current = &mut bad;
|
|
} else {
|
|
let captures = mapping.captures(line);
|
|
if let Some(captures) = captures {
|
|
current.insert(
|
|
captures.get(1).unwrap().as_str(),
|
|
vec![captures.get(2).unwrap().as_str()],
|
|
);
|
|
} else {
|
|
eprintln!("Unknown line: {line}");
|
|
}
|
|
}
|
|
}
|
|
|
|
if !bad.is_empty() {
|
|
panic!("Failed parsing; found extra words: {bad:#?}");
|
|
}
|
|
|
|
Words {
|
|
main,
|
|
american,
|
|
british,
|
|
}
|
|
}
|