2019-01-22 15:01:33 -07:00
|
|
|
#![feature(test)]
|
|
|
|
|
|
|
|
extern crate test;
|
|
|
|
|
|
|
|
mod data;
|
|
|
|
|
2019-10-25 15:48:39 -06:00
|
|
|
use assert_fs::prelude::*;
|
|
|
|
use bstr::ByteSlice;
|
2019-01-22 15:01:33 -07:00
|
|
|
|
|
|
|
#[bench]
|
2019-10-25 15:17:24 -06:00
|
|
|
fn check_file_empty(b: &mut test::Bencher) {
|
2019-01-22 15:01:33 -07:00
|
|
|
let temp = assert_fs::TempDir::new().unwrap();
|
|
|
|
let sample_path = temp.child("sample");
|
|
|
|
sample_path.write_str(data::EMPTY).unwrap();
|
|
|
|
|
2019-08-08 10:24:50 -05:00
|
|
|
let corrections = typos_dict::BuiltIn::new();
|
2019-07-25 07:45:16 -06:00
|
|
|
let parser = typos::tokens::Parser::new();
|
2019-07-27 19:20:02 -06:00
|
|
|
let checks = typos::checks::CheckSettings::new().build(&corrections, &parser);
|
2019-07-31 21:01:09 -06:00
|
|
|
b.iter(|| checks.check_file(sample_path.path(), true, typos::report::print_silent));
|
2019-01-22 15:01:33 -07:00
|
|
|
|
|
|
|
temp.close().unwrap();
|
|
|
|
}
|
|
|
|
|
|
|
|
#[bench]
|
2019-10-25 15:17:24 -06:00
|
|
|
fn check_file_no_tokens(b: &mut test::Bencher) {
|
2019-01-22 15:01:33 -07:00
|
|
|
let temp = assert_fs::TempDir::new().unwrap();
|
|
|
|
let sample_path = temp.child("sample");
|
|
|
|
sample_path.write_str(data::NO_TOKENS).unwrap();
|
|
|
|
|
2019-08-08 10:24:50 -05:00
|
|
|
let corrections = typos_dict::BuiltIn::new();
|
2019-07-25 07:45:16 -06:00
|
|
|
let parser = typos::tokens::Parser::new();
|
2019-07-27 19:20:02 -06:00
|
|
|
let checks = typos::checks::CheckSettings::new().build(&corrections, &parser);
|
2019-07-31 21:01:09 -06:00
|
|
|
b.iter(|| checks.check_file(sample_path.path(), true, typos::report::print_silent));
|
2019-01-22 15:01:33 -07:00
|
|
|
|
|
|
|
temp.close().unwrap();
|
|
|
|
}
|
|
|
|
|
|
|
|
#[bench]
|
2019-10-25 15:17:24 -06:00
|
|
|
fn check_file_single_token(b: &mut test::Bencher) {
|
2019-01-22 15:01:33 -07:00
|
|
|
let temp = assert_fs::TempDir::new().unwrap();
|
|
|
|
let sample_path = temp.child("sample");
|
|
|
|
sample_path.write_str(data::SINGLE_TOKEN).unwrap();
|
|
|
|
|
2019-08-08 10:24:50 -05:00
|
|
|
let corrections = typos_dict::BuiltIn::new();
|
2019-07-25 07:45:16 -06:00
|
|
|
let parser = typos::tokens::Parser::new();
|
2019-07-27 19:20:02 -06:00
|
|
|
let checks = typos::checks::CheckSettings::new().build(&corrections, &parser);
|
2019-07-31 21:01:09 -06:00
|
|
|
b.iter(|| checks.check_file(sample_path.path(), true, typos::report::print_silent));
|
2019-01-22 15:01:33 -07:00
|
|
|
|
|
|
|
temp.close().unwrap();
|
|
|
|
}
|
|
|
|
|
|
|
|
#[bench]
|
2019-10-25 15:17:24 -06:00
|
|
|
fn check_file_sherlock(b: &mut test::Bencher) {
|
2019-01-22 15:01:33 -07:00
|
|
|
let temp = assert_fs::TempDir::new().unwrap();
|
|
|
|
let sample_path = temp.child("sample");
|
|
|
|
sample_path.write_str(data::SHERLOCK).unwrap();
|
|
|
|
|
2019-08-08 10:24:50 -05:00
|
|
|
let corrections = typos_dict::BuiltIn::new();
|
2019-07-25 07:45:16 -06:00
|
|
|
let parser = typos::tokens::Parser::new();
|
2019-07-27 19:20:02 -06:00
|
|
|
let checks = typos::checks::CheckSettings::new().build(&corrections, &parser);
|
2019-07-31 21:01:09 -06:00
|
|
|
b.iter(|| checks.check_file(sample_path.path(), true, typos::report::print_silent));
|
2019-01-22 15:01:33 -07:00
|
|
|
|
|
|
|
temp.close().unwrap();
|
|
|
|
}
|
|
|
|
|
|
|
|
#[bench]
|
2019-10-25 15:17:24 -06:00
|
|
|
fn check_file_code(b: &mut test::Bencher) {
|
2019-01-22 15:01:33 -07:00
|
|
|
let temp = assert_fs::TempDir::new().unwrap();
|
|
|
|
let sample_path = temp.child("sample");
|
|
|
|
sample_path.write_str(data::CODE).unwrap();
|
|
|
|
|
2019-08-08 10:24:50 -05:00
|
|
|
let corrections = typos_dict::BuiltIn::new();
|
2019-07-25 07:45:16 -06:00
|
|
|
let parser = typos::tokens::Parser::new();
|
2019-07-27 19:20:02 -06:00
|
|
|
let checks = typos::checks::CheckSettings::new().build(&corrections, &parser);
|
2019-07-31 21:01:09 -06:00
|
|
|
b.iter(|| checks.check_file(sample_path.path(), true, typos::report::print_silent));
|
2019-01-22 15:01:33 -07:00
|
|
|
|
|
|
|
temp.close().unwrap();
|
|
|
|
}
|
|
|
|
|
|
|
|
#[bench]
|
2019-10-25 15:17:24 -06:00
|
|
|
fn check_file_corpus(b: &mut test::Bencher) {
|
2019-01-22 15:01:33 -07:00
|
|
|
let temp = assert_fs::TempDir::new().unwrap();
|
|
|
|
let sample_path = temp.child("sample");
|
|
|
|
sample_path.write_str(data::CORPUS).unwrap();
|
|
|
|
|
2019-08-08 10:24:50 -05:00
|
|
|
let corrections = typos_dict::BuiltIn::new();
|
2019-07-25 07:45:16 -06:00
|
|
|
let parser = typos::tokens::Parser::new();
|
2019-07-27 19:20:02 -06:00
|
|
|
let checks = typos::checks::CheckSettings::new().build(&corrections, &parser);
|
2019-07-31 21:01:09 -06:00
|
|
|
b.iter(|| checks.check_file(sample_path.path(), true, typos::report::print_silent));
|
2019-01-22 15:01:33 -07:00
|
|
|
|
|
|
|
temp.close().unwrap();
|
|
|
|
}
|
2019-10-25 15:48:39 -06:00
|
|
|
|
|
|
|
#[bench]
|
|
|
|
fn read_empty(b: &mut test::Bencher) {
|
|
|
|
let temp = assert_fs::TempDir::new().unwrap();
|
|
|
|
let sample_path = temp.child("sample");
|
|
|
|
sample_path.write_str(data::EMPTY).unwrap();
|
|
|
|
|
|
|
|
b.iter(|| std::fs::read(sample_path.path()));
|
|
|
|
|
|
|
|
temp.close().unwrap();
|
|
|
|
}
|
|
|
|
|
|
|
|
#[bench]
|
|
|
|
fn read_no_tokens(b: &mut test::Bencher) {
|
|
|
|
let temp = assert_fs::TempDir::new().unwrap();
|
|
|
|
let sample_path = temp.child("sample");
|
|
|
|
sample_path.write_str(data::NO_TOKENS).unwrap();
|
|
|
|
|
|
|
|
b.iter(|| std::fs::read(sample_path.path()));
|
|
|
|
|
|
|
|
temp.close().unwrap();
|
|
|
|
}
|
|
|
|
|
|
|
|
#[bench]
|
|
|
|
fn read_single_token(b: &mut test::Bencher) {
|
|
|
|
let temp = assert_fs::TempDir::new().unwrap();
|
|
|
|
let sample_path = temp.child("sample");
|
|
|
|
sample_path.write_str(data::SINGLE_TOKEN).unwrap();
|
|
|
|
|
|
|
|
b.iter(|| std::fs::read(sample_path.path()));
|
|
|
|
|
|
|
|
temp.close().unwrap();
|
|
|
|
}
|
|
|
|
|
|
|
|
#[bench]
|
|
|
|
fn read_sherlock(b: &mut test::Bencher) {
|
|
|
|
let temp = assert_fs::TempDir::new().unwrap();
|
|
|
|
let sample_path = temp.child("sample");
|
|
|
|
sample_path.write_str(data::SHERLOCK).unwrap();
|
|
|
|
|
|
|
|
b.iter(|| std::fs::read(sample_path.path()));
|
|
|
|
|
|
|
|
temp.close().unwrap();
|
|
|
|
}
|
|
|
|
|
|
|
|
#[bench]
|
|
|
|
fn read_code(b: &mut test::Bencher) {
|
|
|
|
let temp = assert_fs::TempDir::new().unwrap();
|
|
|
|
let sample_path = temp.child("sample");
|
|
|
|
sample_path.write_str(data::CODE).unwrap();
|
|
|
|
|
|
|
|
b.iter(|| std::fs::read(sample_path.path()));
|
|
|
|
|
|
|
|
temp.close().unwrap();
|
|
|
|
}
|
|
|
|
|
|
|
|
#[bench]
|
|
|
|
fn read_corpus(b: &mut test::Bencher) {
|
|
|
|
let temp = assert_fs::TempDir::new().unwrap();
|
|
|
|
let sample_path = temp.child("sample");
|
|
|
|
sample_path.write_str(data::CORPUS).unwrap();
|
|
|
|
|
|
|
|
b.iter(|| std::fs::read(sample_path.path()));
|
|
|
|
|
|
|
|
temp.close().unwrap();
|
|
|
|
}
|
|
|
|
|
|
|
|
#[bench]
|
|
|
|
fn split_lines_empty(b: &mut test::Bencher) {
|
|
|
|
b.iter(|| data::EMPTY.as_bytes().lines().enumerate().last());
|
|
|
|
}
|
|
|
|
|
|
|
|
#[bench]
|
|
|
|
fn split_lines_no_tokens(b: &mut test::Bencher) {
|
|
|
|
b.iter(|| data::NO_TOKENS.as_bytes().lines().enumerate().last());
|
|
|
|
}
|
|
|
|
|
|
|
|
#[bench]
|
|
|
|
fn split_lines_single_token(b: &mut test::Bencher) {
|
|
|
|
b.iter(|| data::SINGLE_TOKEN.as_bytes().lines().enumerate().last());
|
|
|
|
}
|
|
|
|
|
|
|
|
#[bench]
|
|
|
|
fn split_lines_sherlock(b: &mut test::Bencher) {
|
|
|
|
b.iter(|| data::SHERLOCK.as_bytes().lines().enumerate().last());
|
|
|
|
}
|
|
|
|
|
|
|
|
#[bench]
|
|
|
|
fn split_lines_code(b: &mut test::Bencher) {
|
|
|
|
b.iter(|| data::CODE.as_bytes().lines().enumerate().last());
|
|
|
|
}
|
|
|
|
|
|
|
|
#[bench]
|
|
|
|
fn split_lines_corpus(b: &mut test::Bencher) {
|
|
|
|
b.iter(|| data::CORPUS.as_bytes().lines().enumerate().last());
|
|
|
|
}
|
|
|
|
|
|
|
|
#[bench]
|
|
|
|
fn parse_empty(b: &mut test::Bencher) {
|
|
|
|
let parser = typos::tokens::Parser::new();
|
|
|
|
b.iter(|| {
|
|
|
|
data::EMPTY
|
|
|
|
.as_bytes()
|
|
|
|
.lines()
|
|
|
|
.enumerate()
|
|
|
|
.for_each(|(_idx, l)| {
|
|
|
|
parser.parse_bytes(l).last();
|
|
|
|
()
|
|
|
|
})
|
|
|
|
});
|
|
|
|
}
|
|
|
|
|
|
|
|
#[bench]
|
|
|
|
fn parse_no_tokens(b: &mut test::Bencher) {
|
|
|
|
let parser = typos::tokens::Parser::new();
|
|
|
|
b.iter(|| {
|
|
|
|
data::NO_TOKENS
|
|
|
|
.as_bytes()
|
|
|
|
.lines()
|
|
|
|
.enumerate()
|
|
|
|
.for_each(|(_idx, l)| {
|
|
|
|
parser.parse_bytes(l).last();
|
|
|
|
()
|
|
|
|
})
|
|
|
|
});
|
|
|
|
}
|
|
|
|
|
|
|
|
#[bench]
|
|
|
|
fn parse_single_token(b: &mut test::Bencher) {
|
|
|
|
let parser = typos::tokens::Parser::new();
|
|
|
|
b.iter(|| {
|
|
|
|
data::SINGLE_TOKEN
|
|
|
|
.as_bytes()
|
|
|
|
.lines()
|
|
|
|
.enumerate()
|
|
|
|
.for_each(|(_idx, l)| {
|
|
|
|
parser.parse_bytes(l).last();
|
|
|
|
()
|
|
|
|
})
|
|
|
|
});
|
|
|
|
}
|
|
|
|
|
|
|
|
#[bench]
|
|
|
|
fn parse_sherlock(b: &mut test::Bencher) {
|
|
|
|
let parser = typos::tokens::Parser::new();
|
|
|
|
b.iter(|| {
|
|
|
|
data::SHERLOCK
|
|
|
|
.as_bytes()
|
|
|
|
.lines()
|
|
|
|
.enumerate()
|
|
|
|
.for_each(|(_idx, l)| {
|
|
|
|
parser.parse_bytes(l).last();
|
|
|
|
()
|
|
|
|
})
|
|
|
|
});
|
|
|
|
}
|
|
|
|
|
|
|
|
#[bench]
|
|
|
|
fn parse_code(b: &mut test::Bencher) {
|
|
|
|
let parser = typos::tokens::Parser::new();
|
|
|
|
b.iter(|| {
|
|
|
|
data::CODE
|
|
|
|
.as_bytes()
|
|
|
|
.lines()
|
|
|
|
.enumerate()
|
|
|
|
.for_each(|(_idx, l)| {
|
|
|
|
parser.parse_bytes(l).last();
|
|
|
|
()
|
|
|
|
})
|
|
|
|
});
|
|
|
|
}
|
|
|
|
|
|
|
|
#[bench]
|
|
|
|
fn parse_corpus(b: &mut test::Bencher) {
|
|
|
|
let parser = typos::tokens::Parser::new();
|
|
|
|
b.iter(|| {
|
|
|
|
data::CORPUS
|
|
|
|
.as_bytes()
|
|
|
|
.lines()
|
|
|
|
.enumerate()
|
|
|
|
.for_each(|(_idx, l)| {
|
|
|
|
parser.parse_bytes(l).last();
|
|
|
|
()
|
|
|
|
})
|
|
|
|
});
|
|
|
|
}
|
|
|
|
|
|
|
|
#[bench]
|
|
|
|
fn split_empty(b: &mut test::Bencher) {
|
|
|
|
let parser = typos::tokens::Parser::new();
|
|
|
|
b.iter(|| {
|
|
|
|
data::EMPTY
|
|
|
|
.as_bytes()
|
|
|
|
.lines()
|
|
|
|
.enumerate()
|
|
|
|
.for_each(|(_idx, l)| {
|
|
|
|
parser.parse_bytes(l).for_each(|l| {
|
|
|
|
l.split().last();
|
|
|
|
()
|
|
|
|
})
|
|
|
|
})
|
|
|
|
});
|
|
|
|
}
|
|
|
|
|
|
|
|
#[bench]
|
|
|
|
fn split_no_tokens(b: &mut test::Bencher) {
|
|
|
|
let parser = typos::tokens::Parser::new();
|
|
|
|
b.iter(|| {
|
|
|
|
data::NO_TOKENS
|
|
|
|
.as_bytes()
|
|
|
|
.lines()
|
|
|
|
.enumerate()
|
|
|
|
.for_each(|(_idx, l)| {
|
|
|
|
parser.parse_bytes(l).for_each(|l| {
|
|
|
|
l.split().last();
|
|
|
|
()
|
|
|
|
})
|
|
|
|
})
|
|
|
|
});
|
|
|
|
}
|
|
|
|
|
|
|
|
#[bench]
|
|
|
|
fn split_single_token(b: &mut test::Bencher) {
|
|
|
|
let parser = typos::tokens::Parser::new();
|
|
|
|
b.iter(|| {
|
|
|
|
data::SINGLE_TOKEN
|
|
|
|
.as_bytes()
|
|
|
|
.lines()
|
|
|
|
.enumerate()
|
|
|
|
.for_each(|(_idx, l)| {
|
|
|
|
parser.parse_bytes(l).for_each(|l| {
|
|
|
|
l.split().last();
|
|
|
|
()
|
|
|
|
})
|
|
|
|
})
|
|
|
|
});
|
|
|
|
}
|
|
|
|
|
|
|
|
#[bench]
|
|
|
|
fn split_sherlock(b: &mut test::Bencher) {
|
|
|
|
let parser = typos::tokens::Parser::new();
|
|
|
|
b.iter(|| {
|
|
|
|
data::SHERLOCK
|
|
|
|
.as_bytes()
|
|
|
|
.lines()
|
|
|
|
.enumerate()
|
|
|
|
.for_each(|(_idx, l)| {
|
|
|
|
parser.parse_bytes(l).for_each(|l| {
|
|
|
|
l.split().last();
|
|
|
|
()
|
|
|
|
})
|
|
|
|
})
|
|
|
|
});
|
|
|
|
}
|
|
|
|
|
|
|
|
#[bench]
|
|
|
|
fn split_code(b: &mut test::Bencher) {
|
|
|
|
let parser = typos::tokens::Parser::new();
|
|
|
|
b.iter(|| {
|
|
|
|
data::CODE
|
|
|
|
.as_bytes()
|
|
|
|
.lines()
|
|
|
|
.enumerate()
|
|
|
|
.for_each(|(_idx, l)| {
|
|
|
|
parser.parse_bytes(l).for_each(|l| {
|
|
|
|
l.split().last();
|
|
|
|
()
|
|
|
|
})
|
|
|
|
})
|
|
|
|
});
|
|
|
|
}
|
|
|
|
|
|
|
|
#[bench]
|
|
|
|
fn split_corpus(b: &mut test::Bencher) {
|
|
|
|
let parser = typos::tokens::Parser::new();
|
|
|
|
b.iter(|| {
|
|
|
|
data::CORPUS
|
|
|
|
.as_bytes()
|
|
|
|
.lines()
|
|
|
|
.enumerate()
|
|
|
|
.for_each(|(_idx, l)| {
|
|
|
|
parser.parse_bytes(l).for_each(|l| {
|
|
|
|
l.split().last();
|
|
|
|
()
|
|
|
|
})
|
|
|
|
})
|
|
|
|
});
|
|
|
|
}
|