2019-01-22 15:01:33 -07:00
|
|
|
#![feature(test)]
|
|
|
|
|
|
|
|
extern crate test;
|
|
|
|
|
|
|
|
mod data;
|
|
|
|
|
2019-10-25 15:48:39 -06:00
|
|
|
use assert_fs::prelude::*;
|
|
|
|
use bstr::ByteSlice;
|
2019-01-22 15:01:33 -07:00
|
|
|
|
2019-10-30 07:26:59 -06:00
|
|
|
fn bench_read(data: &str, b: &mut test::Bencher) {
|
2019-01-22 15:01:33 -07:00
|
|
|
let temp = assert_fs::TempDir::new().unwrap();
|
|
|
|
let sample_path = temp.child("sample");
|
2019-10-30 07:26:59 -06:00
|
|
|
sample_path.write_str(data).unwrap();
|
2019-01-22 15:01:33 -07:00
|
|
|
|
2019-10-30 07:26:59 -06:00
|
|
|
b.iter(|| std::fs::read(sample_path.path()));
|
2019-01-22 15:01:33 -07:00
|
|
|
|
|
|
|
temp.close().unwrap();
|
|
|
|
}
|
|
|
|
|
|
|
|
#[bench]
|
2019-10-30 07:26:59 -06:00
|
|
|
fn read_empty(b: &mut test::Bencher) {
|
|
|
|
bench_read(data::EMPTY, b);
|
2019-01-22 15:01:33 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
#[bench]
|
2019-10-30 07:26:59 -06:00
|
|
|
fn read_no_tokens(b: &mut test::Bencher) {
|
|
|
|
bench_read(data::NO_TOKENS, b);
|
2019-01-22 15:01:33 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
#[bench]
|
2019-10-30 07:26:59 -06:00
|
|
|
fn read_single_token(b: &mut test::Bencher) {
|
|
|
|
bench_read(data::SINGLE_TOKEN, b);
|
2019-01-22 15:01:33 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
#[bench]
|
2019-10-30 07:26:59 -06:00
|
|
|
fn read_sherlock(b: &mut test::Bencher) {
|
|
|
|
bench_read(data::SHERLOCK, b);
|
2019-01-22 15:01:33 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
#[bench]
|
2019-10-30 07:26:59 -06:00
|
|
|
fn read_code(b: &mut test::Bencher) {
|
|
|
|
bench_read(data::CODE, b);
|
2019-01-22 15:01:33 -07:00
|
|
|
}
|
2019-10-25 15:48:39 -06:00
|
|
|
|
|
|
|
#[bench]
|
2019-10-30 07:26:59 -06:00
|
|
|
fn read_corpus(b: &mut test::Bencher) {
|
|
|
|
bench_read(data::CORPUS, b);
|
|
|
|
}
|
2019-10-25 15:48:39 -06:00
|
|
|
|
2019-10-30 07:26:59 -06:00
|
|
|
fn bench_split_lines(data: &str, b: &mut test::Bencher) {
|
|
|
|
b.iter(|| data.as_bytes().lines().enumerate().last());
|
2019-10-25 15:48:39 -06:00
|
|
|
}
|
|
|
|
|
|
|
|
#[bench]
|
2019-11-02 09:38:32 -06:00
|
|
|
fn parse_lines_empty(b: &mut test::Bencher) {
|
2019-10-30 07:26:59 -06:00
|
|
|
bench_split_lines(data::EMPTY, b);
|
2019-10-25 15:48:39 -06:00
|
|
|
}
|
|
|
|
|
|
|
|
#[bench]
|
2019-11-02 09:38:32 -06:00
|
|
|
fn parse_lines_no_tokens(b: &mut test::Bencher) {
|
2019-10-30 07:26:59 -06:00
|
|
|
bench_split_lines(data::NO_TOKENS, b);
|
2019-10-25 15:48:39 -06:00
|
|
|
}
|
|
|
|
|
|
|
|
#[bench]
|
2019-11-02 09:38:32 -06:00
|
|
|
fn parse_lines_single_token(b: &mut test::Bencher) {
|
2019-10-30 07:26:59 -06:00
|
|
|
bench_split_lines(data::SINGLE_TOKEN, b);
|
2019-10-25 15:48:39 -06:00
|
|
|
}
|
|
|
|
|
|
|
|
#[bench]
|
2019-11-02 09:38:32 -06:00
|
|
|
fn parse_lines_sherlock(b: &mut test::Bencher) {
|
2019-10-30 07:26:59 -06:00
|
|
|
bench_split_lines(data::SHERLOCK, b);
|
|
|
|
}
|
2019-10-25 15:48:39 -06:00
|
|
|
|
2019-10-30 07:26:59 -06:00
|
|
|
#[bench]
|
2019-11-02 09:38:32 -06:00
|
|
|
fn parse_lines_code(b: &mut test::Bencher) {
|
2019-10-30 07:26:59 -06:00
|
|
|
bench_split_lines(data::CODE, b);
|
2019-10-25 15:48:39 -06:00
|
|
|
}
|
|
|
|
|
|
|
|
#[bench]
|
2019-11-02 09:38:32 -06:00
|
|
|
fn parse_lines_corpus(b: &mut test::Bencher) {
|
2019-10-30 07:26:59 -06:00
|
|
|
bench_split_lines(data::CORPUS, b);
|
|
|
|
}
|
|
|
|
|
|
|
|
fn bench_parse_ident(data: &str, b: &mut test::Bencher) {
|
2019-10-25 15:48:39 -06:00
|
|
|
let temp = assert_fs::TempDir::new().unwrap();
|
|
|
|
let sample_path = temp.child("sample");
|
2019-10-30 07:26:59 -06:00
|
|
|
sample_path.write_str(data).unwrap();
|
2019-10-25 15:48:39 -06:00
|
|
|
|
2019-10-30 07:26:59 -06:00
|
|
|
let parser = typos::tokens::Parser::new();
|
2019-11-14 20:09:56 -07:00
|
|
|
let checks = typos::checks::TyposSettings::new().build_identifier_parser();
|
|
|
|
b.iter(|| {
|
|
|
|
checks.check_file(
|
|
|
|
sample_path.path(),
|
|
|
|
true,
|
|
|
|
&parser,
|
2020-03-23 18:21:29 -05:00
|
|
|
&typos::report::PrintSilent,
|
2019-11-14 20:09:56 -07:00
|
|
|
)
|
|
|
|
});
|
2019-10-25 15:48:39 -06:00
|
|
|
|
|
|
|
temp.close().unwrap();
|
|
|
|
}
|
|
|
|
|
|
|
|
#[bench]
|
2019-10-30 07:26:59 -06:00
|
|
|
fn parse_idents_empty(b: &mut test::Bencher) {
|
|
|
|
bench_parse_ident(data::EMPTY, b);
|
2019-10-25 15:48:39 -06:00
|
|
|
}
|
|
|
|
|
|
|
|
#[bench]
|
2019-10-30 07:26:59 -06:00
|
|
|
fn parse_idents_no_tokens(b: &mut test::Bencher) {
|
|
|
|
bench_parse_ident(data::NO_TOKENS, b);
|
2019-10-25 15:48:39 -06:00
|
|
|
}
|
|
|
|
|
|
|
|
#[bench]
|
2019-10-30 07:26:59 -06:00
|
|
|
fn parse_idents_single_token(b: &mut test::Bencher) {
|
|
|
|
bench_parse_ident(data::SINGLE_TOKEN, b);
|
2019-10-25 15:48:39 -06:00
|
|
|
}
|
|
|
|
|
|
|
|
#[bench]
|
2019-10-30 07:26:59 -06:00
|
|
|
fn parse_idents_sherlock(b: &mut test::Bencher) {
|
|
|
|
bench_parse_ident(data::SHERLOCK, b);
|
2019-10-25 15:48:39 -06:00
|
|
|
}
|
|
|
|
|
|
|
|
#[bench]
|
2019-10-30 07:26:59 -06:00
|
|
|
fn parse_idents_code(b: &mut test::Bencher) {
|
|
|
|
bench_parse_ident(data::CODE, b);
|
2019-10-25 15:48:39 -06:00
|
|
|
}
|
|
|
|
|
|
|
|
#[bench]
|
2019-10-30 07:26:59 -06:00
|
|
|
fn parse_idents_corpus(b: &mut test::Bencher) {
|
|
|
|
bench_parse_ident(data::CORPUS, b);
|
2019-10-25 15:48:39 -06:00
|
|
|
}
|
|
|
|
|
2019-10-30 07:26:59 -06:00
|
|
|
fn bench_parse_word(data: &str, b: &mut test::Bencher) {
|
|
|
|
let temp = assert_fs::TempDir::new().unwrap();
|
|
|
|
let sample_path = temp.child("sample");
|
|
|
|
sample_path.write_str(data).unwrap();
|
|
|
|
|
2019-10-25 15:48:39 -06:00
|
|
|
let parser = typos::tokens::Parser::new();
|
2019-11-14 20:09:56 -07:00
|
|
|
let checks = typos::checks::TyposSettings::new().build_word_parser();
|
|
|
|
b.iter(|| {
|
|
|
|
checks.check_file(
|
|
|
|
sample_path.path(),
|
|
|
|
true,
|
|
|
|
&parser,
|
2020-03-23 18:21:29 -05:00
|
|
|
&typos::report::PrintSilent,
|
2019-11-14 20:09:56 -07:00
|
|
|
)
|
|
|
|
});
|
2019-10-30 07:26:59 -06:00
|
|
|
|
|
|
|
temp.close().unwrap();
|
2019-10-25 15:48:39 -06:00
|
|
|
}
|
|
|
|
|
|
|
|
#[bench]
|
2019-10-30 07:26:59 -06:00
|
|
|
fn parse_words_empty(b: &mut test::Bencher) {
|
|
|
|
bench_parse_word(data::EMPTY, b);
|
2019-10-25 15:48:39 -06:00
|
|
|
}
|
|
|
|
|
|
|
|
#[bench]
|
2019-10-30 07:26:59 -06:00
|
|
|
fn parse_words_no_tokens(b: &mut test::Bencher) {
|
|
|
|
bench_parse_word(data::NO_TOKENS, b);
|
2019-10-25 15:48:39 -06:00
|
|
|
}
|
|
|
|
|
|
|
|
#[bench]
|
2019-10-30 07:26:59 -06:00
|
|
|
fn parse_words_single_token(b: &mut test::Bencher) {
|
|
|
|
bench_parse_word(data::SINGLE_TOKEN, b);
|
2019-10-25 15:48:39 -06:00
|
|
|
}
|
|
|
|
|
|
|
|
#[bench]
|
2019-10-30 07:26:59 -06:00
|
|
|
fn parse_words_sherlock(b: &mut test::Bencher) {
|
|
|
|
bench_parse_word(data::SHERLOCK, b);
|
2019-10-25 15:48:39 -06:00
|
|
|
}
|
|
|
|
|
|
|
|
#[bench]
|
2019-10-30 07:26:59 -06:00
|
|
|
fn parse_words_code(b: &mut test::Bencher) {
|
|
|
|
bench_parse_word(data::CODE, b);
|
2019-10-25 15:48:39 -06:00
|
|
|
}
|
|
|
|
|
|
|
|
#[bench]
|
2019-10-30 07:26:59 -06:00
|
|
|
fn parse_words_corpus(b: &mut test::Bencher) {
|
|
|
|
bench_parse_word(data::CORPUS, b);
|
|
|
|
}
|
|
|
|
|
|
|
|
fn bench_check_file(data: &str, b: &mut test::Bencher) {
|
|
|
|
let temp = assert_fs::TempDir::new().unwrap();
|
|
|
|
let sample_path = temp.child("sample");
|
|
|
|
sample_path.write_str(data).unwrap();
|
|
|
|
|
2020-05-27 20:46:41 -05:00
|
|
|
let corrections = typos_cli::dict::BuiltIn::new(Default::default());
|
2019-10-25 15:48:39 -06:00
|
|
|
let parser = typos::tokens::Parser::new();
|
2019-11-14 20:09:56 -07:00
|
|
|
let checks = typos::checks::TyposSettings::new().build_checks();
|
|
|
|
b.iter(|| {
|
|
|
|
checks.check_file(
|
|
|
|
sample_path.path(),
|
|
|
|
true,
|
|
|
|
&parser,
|
|
|
|
&corrections,
|
2020-03-23 18:21:29 -05:00
|
|
|
&typos::report::PrintSilent,
|
2019-11-14 20:09:56 -07:00
|
|
|
)
|
|
|
|
});
|
2019-10-30 07:26:59 -06:00
|
|
|
|
|
|
|
temp.close().unwrap();
|
2019-10-25 15:48:39 -06:00
|
|
|
}
|
|
|
|
|
|
|
|
#[bench]
|
2019-10-30 07:26:59 -06:00
|
|
|
fn check_file_empty(b: &mut test::Bencher) {
|
|
|
|
bench_check_file(data::EMPTY, b);
|
2019-10-25 15:48:39 -06:00
|
|
|
}
|
|
|
|
|
|
|
|
#[bench]
|
2019-10-30 07:26:59 -06:00
|
|
|
fn check_file_no_tokens(b: &mut test::Bencher) {
|
|
|
|
bench_check_file(data::NO_TOKENS, b);
|
2019-10-25 15:48:39 -06:00
|
|
|
}
|
|
|
|
|
|
|
|
#[bench]
|
2019-10-30 07:26:59 -06:00
|
|
|
fn check_file_single_token(b: &mut test::Bencher) {
|
|
|
|
bench_check_file(data::SINGLE_TOKEN, b);
|
2019-10-25 15:48:39 -06:00
|
|
|
}
|
|
|
|
|
|
|
|
#[bench]
|
2019-10-30 07:26:59 -06:00
|
|
|
fn check_file_sherlock(b: &mut test::Bencher) {
|
|
|
|
bench_check_file(data::SHERLOCK, b);
|
2019-10-25 15:48:39 -06:00
|
|
|
}
|
|
|
|
|
|
|
|
#[bench]
|
2019-10-30 07:26:59 -06:00
|
|
|
fn check_file_code(b: &mut test::Bencher) {
|
|
|
|
bench_check_file(data::CODE, b);
|
|
|
|
}
|
|
|
|
|
|
|
|
#[bench]
|
|
|
|
fn check_file_corpus(b: &mut test::Bencher) {
|
|
|
|
bench_check_file(data::CORPUS, b);
|
2019-10-25 15:48:39 -06:00
|
|
|
}
|