2019-10-28 15:33:48 -04:00
|
|
|
use std::collections::HashMap;
|
|
|
|
|
|
|
|
use structopt::StructOpt;
|
|
|
|
|
|
|
|
/// Raw text of `../../assets/words.go`, embedded into the binary at compile time.
///
/// `generate` passes this to `parse_dict` to obtain the word tables it emits.
pub const DICT: &str = include_str!("../../assets/words.go");
|
|
|
|
|
2019-10-29 09:55:50 -04:00
|
|
|
/// A single word table: each typo maps to the list of corrections recorded for it.
type WordMap<'s> = HashMap<&'s str, Vec<&'s str>>;

/// The three word tables extracted from the embedded dictionary source.
///
/// All strings borrow from the text that was parsed, hence the `'s` lifetime.
struct Words<'s> {
    /// Entries read while inside the `DictMain` section.
    main: WordMap<'s>,
    /// Entries read while inside the `DictAmerican` section.
    american: WordMap<'s>,
    /// Entries read while inside the `DictBritish` section.
    british: WordMap<'s>,
}
|
|
|
|
|
|
|
|
fn parse_dict(raw: &str) -> Words {
|
2019-10-28 15:33:48 -04:00
|
|
|
let mut bad = HashMap::new();
|
|
|
|
let mut main = HashMap::new();
|
|
|
|
let mut american = HashMap::new();
|
|
|
|
let mut british = HashMap::new();
|
|
|
|
|
|
|
|
let mapping = regex::Regex::new(r#"^"(.*)", "(.*)",$"#).unwrap();
|
|
|
|
|
|
|
|
let mut current = &mut bad;
|
|
|
|
for line in raw.lines() {
|
|
|
|
let line = line.splitn(2, "//").next().unwrap().trim();
|
2019-10-29 10:07:27 -04:00
|
|
|
if line.is_empty() || line.starts_with("package") {
|
2019-10-28 15:33:48 -04:00
|
|
|
continue;
|
|
|
|
} else if line.contains("DictMain") {
|
|
|
|
current = &mut main;
|
|
|
|
} else if line.contains("DictAmerican") {
|
|
|
|
current = &mut american;
|
|
|
|
} else if line.contains("DictBritish") {
|
|
|
|
current = &mut british;
|
2019-10-28 18:25:41 -04:00
|
|
|
} else if line.contains('}') {
|
2019-10-28 15:33:48 -04:00
|
|
|
current = &mut bad;
|
|
|
|
} else {
|
|
|
|
let captures = mapping.captures(line);
|
|
|
|
if let Some(captures) = captures {
|
|
|
|
current.insert(
|
|
|
|
captures.get(1).unwrap().as_str(),
|
|
|
|
vec![captures.get(2).unwrap().as_str()],
|
|
|
|
);
|
|
|
|
} else {
|
|
|
|
eprintln!("Unknown line: {}", line);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if !bad.is_empty() {
|
|
|
|
panic!("Failed parsing; found extra words: {:#?}", bad);
|
|
|
|
}
|
2019-10-29 09:55:50 -04:00
|
|
|
|
|
|
|
Words {
|
|
|
|
main,
|
|
|
|
american,
|
|
|
|
british,
|
|
|
|
}
|
2019-10-28 15:33:48 -04:00
|
|
|
}
|
|
|
|
|
|
|
|
fn generate<W: std::io::Write>(file: &mut W) {
|
|
|
|
writeln!(
|
|
|
|
file,
|
|
|
|
"// This file is code-genned by {}",
|
|
|
|
env!("CARGO_PKG_NAME")
|
|
|
|
)
|
|
|
|
.unwrap();
|
2019-10-29 09:53:32 -04:00
|
|
|
writeln!(file, "#![allow(clippy::unreadable_literal)]",).unwrap();
|
2019-10-28 15:33:48 -04:00
|
|
|
writeln!(file).unwrap();
|
|
|
|
|
2019-10-29 09:55:50 -04:00
|
|
|
let Words {
|
|
|
|
main,
|
|
|
|
american,
|
|
|
|
british,
|
|
|
|
} = parse_dict(DICT);
|
2021-06-07 09:22:31 -04:00
|
|
|
let mut main: Vec<_> = main.into_iter().collect();
|
|
|
|
main.sort_unstable_by(|a, b| {
|
|
|
|
unicase::UniCase::new(a.0)
|
|
|
|
.partial_cmp(&unicase::UniCase::new(b.0))
|
|
|
|
.unwrap()
|
|
|
|
});
|
|
|
|
let mut american: Vec<_> = american.into_iter().collect();
|
|
|
|
american.sort_unstable_by(|a, b| {
|
|
|
|
unicase::UniCase::new(a.0)
|
|
|
|
.partial_cmp(&unicase::UniCase::new(b.0))
|
|
|
|
.unwrap()
|
|
|
|
});
|
|
|
|
let mut british: Vec<_> = british.into_iter().collect();
|
|
|
|
british.sort_unstable_by(|a, b| {
|
|
|
|
unicase::UniCase::new(a.0)
|
|
|
|
.partial_cmp(&unicase::UniCase::new(b.0))
|
|
|
|
.unwrap()
|
|
|
|
});
|
|
|
|
|
|
|
|
writeln!(file, "pub static MAIN_DICTIONARY: &[(&str, &[&str])] = &[").unwrap();
|
|
|
|
for (typo, corrections) in main.into_iter() {
|
2019-10-28 15:33:48 -04:00
|
|
|
let value = itertools::join(corrections.iter().map(|s| format!("{:?}", s)), ", ");
|
|
|
|
let value = format!("&[{}]", value);
|
2021-06-07 09:22:31 -04:00
|
|
|
|
|
|
|
let key = format!("{:?}", typo);
|
|
|
|
writeln!(file, " ({}, {}),", key, &value).unwrap();
|
2019-10-28 15:33:48 -04:00
|
|
|
}
|
2021-06-07 09:22:31 -04:00
|
|
|
writeln!(file, "];").unwrap();
|
2019-10-28 18:25:41 -04:00
|
|
|
writeln!(file).unwrap();
|
2019-10-28 15:33:48 -04:00
|
|
|
|
|
|
|
writeln!(
|
|
|
|
file,
|
2021-06-07 09:22:31 -04:00
|
|
|
"pub static AMERICAN_DICTIONARY: &[(&str, &[&str])] = &["
|
2019-10-28 15:33:48 -04:00
|
|
|
)
|
|
|
|
.unwrap();
|
2021-06-07 09:22:31 -04:00
|
|
|
for (typo, corrections) in american.into_iter() {
|
2019-10-28 15:33:48 -04:00
|
|
|
let value = itertools::join(corrections.iter().map(|s| format!("{:?}", s)), ", ");
|
|
|
|
let value = format!("&[{}]", value);
|
2021-06-07 09:22:31 -04:00
|
|
|
|
|
|
|
let key = format!("{:?}", typo);
|
|
|
|
writeln!(file, " ({}, {}),", key, &value).unwrap();
|
2019-10-28 15:33:48 -04:00
|
|
|
}
|
2021-06-07 09:22:31 -04:00
|
|
|
writeln!(file, "];").unwrap();
|
2019-10-28 18:25:41 -04:00
|
|
|
writeln!(file).unwrap();
|
2019-10-28 15:33:48 -04:00
|
|
|
|
|
|
|
writeln!(
|
|
|
|
file,
|
2021-06-07 09:22:31 -04:00
|
|
|
"pub static BRITISH_DICTIONARY: &[(&str, &[&str])] = &["
|
2019-10-28 15:33:48 -04:00
|
|
|
)
|
|
|
|
.unwrap();
|
2021-06-07 09:22:31 -04:00
|
|
|
for (typo, corrections) in british.into_iter() {
|
2019-10-28 15:33:48 -04:00
|
|
|
let value = itertools::join(corrections.iter().map(|s| format!("{:?}", s)), ", ");
|
|
|
|
let value = format!("&[{}]", value);
|
2021-06-07 09:22:31 -04:00
|
|
|
|
|
|
|
let key = format!("{:?}", typo);
|
|
|
|
writeln!(file, " ({}, {}),", key, &value).unwrap();
|
2019-10-28 15:33:48 -04:00
|
|
|
}
|
2021-06-07 09:22:31 -04:00
|
|
|
writeln!(file, "];").unwrap();
|
2019-10-28 15:33:48 -04:00
|
|
|
}
|
|
|
|
|
|
|
|
#[derive(Debug, StructOpt)]
|
|
|
|
#[structopt(rename_all = "kebab-case")]
|
|
|
|
struct Options {
|
|
|
|
#[structopt(flatten)]
|
|
|
|
codegen: codegenrs::CodeGenArgs,
|
|
|
|
#[structopt(flatten)]
|
|
|
|
rustmft: codegenrs::RustfmtArgs,
|
|
|
|
}
|
|
|
|
|
|
|
|
fn run() -> Result<i32, Box<dyn std::error::Error>> {
|
|
|
|
let options = Options::from_args();
|
|
|
|
|
|
|
|
let mut content = vec![];
|
|
|
|
generate(&mut content);
|
|
|
|
|
|
|
|
let content = String::from_utf8(content)?;
|
|
|
|
let content = options.rustmft.reformat(&content)?;
|
|
|
|
options.codegen.write_str(&content)?;
|
|
|
|
|
|
|
|
Ok(0)
|
|
|
|
}
|
|
|
|
|
|
|
|
fn main() {
|
|
|
|
let code = run().unwrap();
|
|
|
|
std::process::exit(code);
|
|
|
|
}
|