mirror of
https://github.com/cargo-bins/cargo-binstall.git
synced 2025-05-16 08:50:02 +00:00
Leon template library (#766)
* leon: first implementation * Update crates/leon/src/values.rs Co-authored-by: Jiahao XU <Jiahao_XU@outlook.com> * Workaround orphan rules to make API more intuitive * Fmt * Clippy * Use CoW * Use cow for items too * Test that const construction works * leon: Initial attempt at O(n) parser * leon: finish parser (except escapes) * leon: Improve ergonomics of compile-time templates * Document helpers * leon: Docs tweaks * leon: Use macro to minimise parser tests * leon: add escapes to parser * leon: test escapes preceding keys * leon: add multibyte tests * leon: test escapes following keys * Format * Debug * leon: Don't actually need to keep track of the key * leon: Parse to vec first * leon: there's actually no need for string cows * leon: reorganise and redo macro now that there's no coww * Well that was silly * leon: Adjust text end when pushing * leon: catch unbalanced keys * Add error tests * leon: Catch unfinished escape * Comment out debugging * leon: fuzz * Clippy * leon: Box parse error * leon: &dyn instead of impl * Can't impl FromStr, so rename to parse * Add Vec<> to values * leon: Add benches for ways to supply values * leon: Add bench comparing to std and tt * Fix fuzz * Fmt * Split ParseError and RenderError * Make miette optional * Remove RenderError lifetime * Simplify ParseError type schema * Write concrete Values types instead of generics * Add license files * Reduce criterion deps * Make default a cow * Add a CLI leon tool * Fix tests * Clippy * Disable cli by default * Avoid failing the build when cli is off * Add to ci * Update crates/leon/src/main.rs Co-authored-by: Jiahao XU <Jiahao_XU@outlook.com> * Update crates/leon/Cargo.toml Co-authored-by: Jiahao XU <Jiahao_XU@outlook.com> * Bump version * Error not transparent * Diagnostic can do forwarding * Simplify error type * Expand doc examples * Generic Values for Hash and BTree maps * One more borrowed * Forward implementations * More generics * Add has_keys * Lock stdout in leon tool * No more debug comments in parser * Even more generics * Macros to reduce bench duplication * Further simplify error * Fix leon main * Stable support * Clippy --------- Co-authored-by: Jiahao XU <Jiahao_XU@outlook.com>
This commit is contained in:
parent
daf8cdd010
commit
2227d363f7
20 changed files with 2382 additions and 162 deletions
crates/leon/src
565
crates/leon/src/parser.rs
Normal file
565
crates/leon/src/parser.rs
Normal file
|
@ -0,0 +1,565 @@
|
|||
use std::mem::replace;
|
||||
|
||||
use crate::{Item, ParseError, Template};
|
||||
|
||||
#[derive(Debug, Clone, Copy)]
|
||||
enum Token {
|
||||
Text {
|
||||
start: usize,
|
||||
end: usize,
|
||||
},
|
||||
BracePair {
|
||||
start: usize,
|
||||
key_seen: bool,
|
||||
end: usize,
|
||||
},
|
||||
Escape {
|
||||
start: usize,
|
||||
end: usize,
|
||||
ch: Option<char>,
|
||||
},
|
||||
}
|
||||
|
||||
impl Token {
|
||||
fn start_text(pos: usize, ch: char) -> Self {
|
||||
Self::Text {
|
||||
start: pos,
|
||||
end: pos + ch.len_utf8(),
|
||||
}
|
||||
}
|
||||
|
||||
fn start_text_single(pos: usize) -> Self {
|
||||
Self::Text {
|
||||
start: pos,
|
||||
end: pos,
|
||||
}
|
||||
}
|
||||
|
||||
fn start_brace_pair(pos: usize, ch: char) -> Self {
|
||||
Self::BracePair {
|
||||
start: pos,
|
||||
key_seen: false,
|
||||
end: pos + ch.len_utf8(),
|
||||
}
|
||||
}
|
||||
|
||||
fn start_escape(pos: usize, ch: char) -> Self {
|
||||
Self::Escape {
|
||||
start: pos,
|
||||
end: pos + ch.len_utf8(),
|
||||
ch: None,
|
||||
}
|
||||
}
|
||||
|
||||
fn is_empty(&self, source_len: usize) -> bool {
|
||||
match self {
|
||||
Self::Text { start, end } => {
|
||||
*start >= source_len || *end >= source_len || *start > *end
|
||||
}
|
||||
Self::BracePair {
|
||||
start,
|
||||
key_seen,
|
||||
end,
|
||||
} => !key_seen || *start >= source_len || *end >= source_len || *start > *end,
|
||||
Self::Escape { start, end, .. } => {
|
||||
*start >= source_len || *end >= source_len || *start > *end
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
fn start(&self) -> usize {
|
||||
match self {
|
||||
Self::Text { start, .. }
|
||||
| Self::BracePair { start, .. }
|
||||
| Self::Escape { start, .. } => *start,
|
||||
}
|
||||
}
|
||||
|
||||
fn end(&self) -> usize {
|
||||
match self {
|
||||
Self::Text { end, .. } | Self::BracePair { end, .. } | Self::Escape { end, .. } => *end,
|
||||
}
|
||||
}
|
||||
|
||||
fn set_end(&mut self, pos: usize) {
|
||||
match self {
|
||||
Self::Text { end, .. } | Self::BracePair { end, .. } | Self::Escape { end, .. } => {
|
||||
*end = pos
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
impl<'s> Template<'s> {
|
||||
pub(crate) fn parse_items(s: &'s str) -> Result<Vec<Item<'s>>, ParseError> {
|
||||
let source_len = s.len();
|
||||
let mut tokens = Vec::new();
|
||||
|
||||
let mut current = Token::start_text(0, '\0');
|
||||
|
||||
for (pos, chara) in s.char_indices() {
|
||||
match (&mut current, chara) {
|
||||
(tok @ (Token::Text { .. } | Token::Escape { ch: Some(_), .. }), ch @ '{') => {
|
||||
if matches!(tok, Token::Text { .. }) && tok.start() == pos {
|
||||
*tok = Token::start_brace_pair(pos, ch);
|
||||
} else {
|
||||
if let Token::Text { end, .. } = tok {
|
||||
*end = pos - 1;
|
||||
}
|
||||
tokens.push(replace(tok, Token::start_brace_pair(pos, ch)));
|
||||
}
|
||||
}
|
||||
(txt @ Token::Text { .. }, ch @ '\\') => {
|
||||
if txt.is_empty(source_len) || txt.start() == pos {
|
||||
*txt = Token::start_escape(pos, ch);
|
||||
} else {
|
||||
if let Token::Text { end, .. } = txt {
|
||||
*end = pos - 1;
|
||||
}
|
||||
tokens.push(replace(txt, Token::start_escape(pos, ch)));
|
||||
}
|
||||
}
|
||||
(bp @ Token::BracePair { .. }, '}') => {
|
||||
if let Token::BracePair { end, .. } = bp {
|
||||
*end = pos;
|
||||
} else {
|
||||
unreachable!("bracepair isn't bracepair");
|
||||
}
|
||||
|
||||
tokens.push(replace(bp, Token::start_text_single(pos + 1)));
|
||||
}
|
||||
(Token::BracePair { start, .. }, '\\') => {
|
||||
return Err(ParseError::key_escape(s, *start, pos));
|
||||
}
|
||||
(Token::BracePair { key_seen, end, .. }, ws) if ws.is_whitespace() => {
|
||||
if *key_seen {
|
||||
*end = pos;
|
||||
} else {
|
||||
// We're in a brace pair, but we're not in the key yet.
|
||||
}
|
||||
}
|
||||
(Token::BracePair { key_seen, end, .. }, _) => {
|
||||
*key_seen = true;
|
||||
*end = pos + 1;
|
||||
}
|
||||
(Token::Text { .. }, '}') => {
|
||||
return Err(ParseError::unbalanced(s, pos, pos));
|
||||
}
|
||||
(Token::Text { end, .. }, _) => {
|
||||
*end = pos;
|
||||
}
|
||||
(esc @ Token::Escape { .. }, es @ ('\\' | '{' | '}')) => {
|
||||
if let Token::Escape { start, end, ch, .. } = esc {
|
||||
if ch.is_none() {
|
||||
*end = pos;
|
||||
*ch = Some(es);
|
||||
} else if es == '\\' {
|
||||
// A new escape right after a completed escape.
|
||||
tokens.push(replace(esc, Token::start_escape(pos, es)));
|
||||
} else if es == '{' {
|
||||
// A new brace pair right after a completed escape, should be handled prior to this.
|
||||
unreachable!("escape followed by brace pair, unhandled");
|
||||
} else {
|
||||
// } right after a completed escape, probably unreachable but just in case:
|
||||
return Err(ParseError::key_escape(s, *start, pos));
|
||||
}
|
||||
} else {
|
||||
unreachable!("escape is not an escape");
|
||||
}
|
||||
}
|
||||
(
|
||||
Token::Escape {
|
||||
start, ch: None, ..
|
||||
},
|
||||
_,
|
||||
) => {
|
||||
return Err(ParseError::escape(s, *start, pos));
|
||||
}
|
||||
(Token::Escape { ch: Some(_), .. }, _) => {
|
||||
tokens.push(replace(&mut current, Token::start_text_single(pos)));
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
if !current.is_empty(source_len) {
|
||||
if current.end() < source_len - 1 {
|
||||
current.set_end(source_len - 1);
|
||||
}
|
||||
|
||||
tokens.push(current);
|
||||
}
|
||||
|
||||
if let Token::BracePair { start, end, .. } = current {
|
||||
return Err(ParseError::unbalanced(s, start, end));
|
||||
}
|
||||
|
||||
if let Token::Escape {
|
||||
start,
|
||||
end,
|
||||
ch: None,
|
||||
} = current
|
||||
{
|
||||
return Err(ParseError::escape(s, start, end));
|
||||
}
|
||||
|
||||
let mut items = Vec::with_capacity(tokens.len());
|
||||
for token in tokens {
|
||||
match token {
|
||||
Token::Text { start, end } => {
|
||||
items.push(Item::Text(&s[start..=end]));
|
||||
}
|
||||
Token::BracePair {
|
||||
start,
|
||||
end,
|
||||
key_seen: false,
|
||||
} => {
|
||||
return Err(ParseError::key_empty(s, start, end));
|
||||
}
|
||||
Token::BracePair {
|
||||
start,
|
||||
end,
|
||||
key_seen: true,
|
||||
} => {
|
||||
let key = s[start..=end]
|
||||
.trim_matches(|c: char| c.is_whitespace() || c == '{' || c == '}');
|
||||
if key.is_empty() {
|
||||
return Err(ParseError::key_empty(s, start, end));
|
||||
} else {
|
||||
items.push(Item::Key(key));
|
||||
}
|
||||
}
|
||||
Token::Escape {
|
||||
ch: Some(_), end, ..
|
||||
} => {
|
||||
items.push(Item::Text(&s[end..=end]));
|
||||
}
|
||||
Token::Escape {
|
||||
ch: None,
|
||||
start,
|
||||
end,
|
||||
} => {
|
||||
return Err(ParseError::escape(s, start, end));
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
Ok(items)
|
||||
}
|
||||
}
|
||||
|
||||
#[cfg(test)]
|
||||
mod test_valid {
|
||||
use crate::{template, Item::*, Template};
|
||||
|
||||
#[test]
|
||||
fn empty() {
|
||||
let template = Template::parse("").unwrap();
|
||||
assert_eq!(template, Template::default());
|
||||
}
|
||||
|
||||
#[test]
|
||||
fn no_keys() {
|
||||
let template = Template::parse("hello world").unwrap();
|
||||
assert_eq!(template, template!(Text("hello world")));
|
||||
}
|
||||
|
||||
#[test]
|
||||
fn leading_key() {
|
||||
let template = Template::parse("{salutation} world").unwrap();
|
||||
assert_eq!(template, template!(Key("salutation"), Text(" world")));
|
||||
}
|
||||
|
||||
#[test]
|
||||
fn trailing_key() {
|
||||
let template = Template::parse("hello {name}").unwrap();
|
||||
assert_eq!(template, template!(Text("hello "), Key("name")));
|
||||
}
|
||||
|
||||
#[test]
|
||||
fn middle_key() {
|
||||
let template = Template::parse("hello {name}!").unwrap();
|
||||
assert_eq!(template, template!(Text("hello "), Key("name"), Text("!")));
|
||||
}
|
||||
|
||||
#[test]
|
||||
fn middle_text() {
|
||||
let template = Template::parse("{salutation} good {title}").unwrap();
|
||||
assert_eq!(
|
||||
template,
|
||||
template!(Key("salutation"), Text(" good "), Key("title"))
|
||||
);
|
||||
}
|
||||
|
||||
#[test]
|
||||
fn multiline() {
|
||||
let template = Template::parse(
|
||||
"
|
||||
And if thy native country was { ancient civilisation },
|
||||
What need to slight thee? Came not {hero} thence,
|
||||
Who gave to { country } her books and art of writing?
|
||||
",
|
||||
)
|
||||
.unwrap();
|
||||
assert_eq!(
|
||||
template,
|
||||
template!(
|
||||
Text("\n And if thy native country was "),
|
||||
Key("ancient civilisation"),
|
||||
Text(",\n What need to slight thee? Came not "),
|
||||
Key("hero"),
|
||||
Text(" thence,\n Who gave to "),
|
||||
Key("country"),
|
||||
Text(" her books and art of writing?\n "),
|
||||
)
|
||||
);
|
||||
}
|
||||
|
||||
#[test]
|
||||
fn key_no_whitespace() {
|
||||
let template = Template::parse("{word}").unwrap();
|
||||
assert_eq!(template, template!(Key("word")));
|
||||
}
|
||||
|
||||
#[test]
|
||||
fn key_leading_whitespace() {
|
||||
let template = Template::parse("{ word}").unwrap();
|
||||
assert_eq!(template, template!(Key("word")));
|
||||
}
|
||||
|
||||
#[test]
|
||||
fn key_trailing_whitespace() {
|
||||
let template = Template::parse("{word\n}").unwrap();
|
||||
assert_eq!(template, template!(Key("word")));
|
||||
}
|
||||
|
||||
#[test]
|
||||
fn key_both_whitespace() {
|
||||
let template = Template::parse(
|
||||
"{
|
||||
\tword
|
||||
}",
|
||||
)
|
||||
.unwrap();
|
||||
assert_eq!(template, template!(Key("word")));
|
||||
}
|
||||
|
||||
#[test]
|
||||
fn key_inner_whitespace() {
|
||||
let template = Template::parse("{ a word }").unwrap();
|
||||
assert_eq!(template, template!(Key("a word")));
|
||||
}
|
||||
|
||||
#[test]
|
||||
fn escape_left() {
|
||||
let template = Template::parse(r"this \{ single left brace").unwrap();
|
||||
assert_eq!(
|
||||
template,
|
||||
template!(Text("this "), Text("{"), Text(" single left brace"))
|
||||
);
|
||||
}
|
||||
|
||||
#[test]
|
||||
fn escape_right() {
|
||||
let template = Template::parse(r"this \} single right brace").unwrap();
|
||||
assert_eq!(
|
||||
template,
|
||||
template!(Text("this "), Text("}"), Text(" single right brace"))
|
||||
);
|
||||
}
|
||||
|
||||
#[test]
|
||||
fn escape_both() {
|
||||
let template = Template::parse(r"these \{ two \} braces").unwrap();
|
||||
assert_eq!(
|
||||
template,
|
||||
template!(
|
||||
Text("these "),
|
||||
Text("{"),
|
||||
Text(" two "),
|
||||
Text("}"),
|
||||
Text(" braces")
|
||||
)
|
||||
);
|
||||
}
|
||||
|
||||
#[test]
|
||||
fn escape_doubled() {
|
||||
let template = Template::parse(r"these \{\{ four \}\} braces").unwrap();
|
||||
assert_eq!(
|
||||
template,
|
||||
template!(
|
||||
Text("these "),
|
||||
Text("{"),
|
||||
Text("{"),
|
||||
Text(" four "),
|
||||
Text("}"),
|
||||
Text("}"),
|
||||
Text(" braces")
|
||||
)
|
||||
);
|
||||
}
|
||||
|
||||
#[test]
|
||||
fn escape_escape() {
|
||||
let template = Template::parse(r"these \\ backslashes \\\\").unwrap();
|
||||
assert_eq!(
|
||||
template,
|
||||
template!(
|
||||
Text("these "),
|
||||
Text(r"\"),
|
||||
Text(" backslashes "),
|
||||
Text(r"\"),
|
||||
Text(r"\"),
|
||||
)
|
||||
);
|
||||
}
|
||||
|
||||
#[test]
|
||||
fn escape_before_key() {
|
||||
let template = Template::parse(r"\\{ a } \{{ b } \}{ c }").unwrap();
|
||||
assert_eq!(
|
||||
template,
|
||||
template!(
|
||||
Text(r"\"),
|
||||
Key("a"),
|
||||
Text(" "),
|
||||
Text(r"{"),
|
||||
Key("b"),
|
||||
Text(" "),
|
||||
Text(r"}"),
|
||||
Key("c"),
|
||||
)
|
||||
);
|
||||
}
|
||||
|
||||
#[test]
|
||||
fn escape_after_key() {
|
||||
let template = Template::parse(r"{ a }\\ { b }\{ { c }\}").unwrap();
|
||||
assert_eq!(
|
||||
template,
|
||||
template!(
|
||||
Key("a"),
|
||||
Text(r"\"),
|
||||
Text(" "),
|
||||
Key("b"),
|
||||
Text(r"{"),
|
||||
Text(" "),
|
||||
Key("c"),
|
||||
Text(r"}"),
|
||||
)
|
||||
);
|
||||
}
|
||||
|
||||
#[test]
|
||||
fn multibyte_texts() {
|
||||
let template = Template::parse("幸徳 {particle} 秋水").unwrap();
|
||||
assert_eq!(
|
||||
template,
|
||||
template!(Text("幸徳 "), Key("particle"), Text(" 秋水"))
|
||||
);
|
||||
}
|
||||
|
||||
#[test]
|
||||
fn multibyte_key() {
|
||||
let template = Template::parse("The { 連盟 }").unwrap();
|
||||
assert_eq!(template, template!(Text("The "), Key("連盟")));
|
||||
}
|
||||
|
||||
#[test]
|
||||
fn multibyte_both() {
|
||||
let template = Template::parse("大杉 {栄}").unwrap();
|
||||
assert_eq!(template, template!(Text("大杉 "), Key("栄")));
|
||||
}
|
||||
|
||||
#[test]
|
||||
fn multibyte_whitespace() {
|
||||
let template = Template::parse("岩佐 作{ 太 }郎").unwrap();
|
||||
assert_eq!(template, template!(Text("岩佐 作"), Key("太"), Text("郎")));
|
||||
}
|
||||
|
||||
#[test]
|
||||
fn multibyte_with_escapes() {
|
||||
let template = Template::parse(r"日本\{アナキスト\}連盟").unwrap();
|
||||
assert_eq!(
|
||||
template,
|
||||
template!(
|
||||
Text("日本"),
|
||||
Text(r"{"),
|
||||
Text("アナキスト"),
|
||||
Text(r"}"),
|
||||
Text("連盟")
|
||||
)
|
||||
);
|
||||
}
|
||||
|
||||
#[test]
|
||||
fn multibyte_rtl_text() {
|
||||
let template = Template::parse("محمد صايل").unwrap();
|
||||
assert_eq!(template, template!(Text("محمد صايل")));
|
||||
}
|
||||
|
||||
#[test]
|
||||
fn multibyte_rtl_key() {
|
||||
let template = Template::parse("محمد {ريشة}").unwrap();
|
||||
assert_eq!(template, template!(Text("محمد "), Key("ريشة")));
|
||||
}
|
||||
}
|
||||
|
||||
#[cfg(test)]
|
||||
mod test_error {
|
||||
use crate::{ParseError, Template};
|
||||
|
||||
#[test]
|
||||
fn key_left_half() {
|
||||
let template = Template::parse("{ open").unwrap_err();
|
||||
assert_eq!(template, ParseError::unbalanced("{ open", 0, 6));
|
||||
}
|
||||
|
||||
#[test]
|
||||
fn key_right_half() {
|
||||
let template = Template::parse("open }").unwrap_err();
|
||||
assert_eq!(template, ParseError::unbalanced("open }", 5, 5));
|
||||
}
|
||||
|
||||
#[test]
|
||||
fn key_with_half_escape() {
|
||||
let template = Template::parse(r"this is { not \ allowed }").unwrap_err();
|
||||
assert_eq!(
|
||||
template,
|
||||
ParseError::key_escape(r"this is { not \ allowed }", 8, 14)
|
||||
);
|
||||
}
|
||||
|
||||
#[test]
|
||||
fn key_with_full_escape() {
|
||||
let template = Template::parse(r"{ not \} allowed }").unwrap_err();
|
||||
assert_eq!(
|
||||
template,
|
||||
ParseError::key_escape(r"{ not \} allowed }", 0, 6)
|
||||
);
|
||||
}
|
||||
|
||||
#[test]
|
||||
fn key_empty() {
|
||||
let template = Template::parse(r"void: {}").unwrap_err();
|
||||
assert_eq!(template, ParseError::key_empty(r"void: {}", 6, 7));
|
||||
}
|
||||
|
||||
#[test]
|
||||
fn key_only_whitespace() {
|
||||
let template = Template::parse(r"nothing: { }").unwrap_err();
|
||||
assert_eq!(template, ParseError::key_empty(r"nothing: { }", 9, 11));
|
||||
}
|
||||
|
||||
#[test]
|
||||
fn bad_escape() {
|
||||
let template = Template::parse(r"not \a thing").unwrap_err();
|
||||
assert_eq!(template, ParseError::escape(r"not \a thing", 4, 5));
|
||||
}
|
||||
|
||||
#[test]
|
||||
fn end_escape() {
|
||||
let template = Template::parse(r"forget me not \").unwrap_err();
|
||||
assert_eq!(template, ParseError::escape(r"forget me not \", 14, 15));
|
||||
}
|
||||
}
|
Loading…
Add table
Add a link
Reference in a new issue