Skip to content

Commit

Permalink
add validation for tags on silent rules (fixes #1035)
Browse files Browse the repository at this point in the history
  • Loading branch information
tomtau committed Sep 4, 2024
1 parent 537660c commit 1d4dc46
Show file tree
Hide file tree
Showing 11 changed files with 156 additions and 38 deletions.
8 changes: 4 additions & 4 deletions debugger/Cargo.toml
Original file line number Diff line number Diff line change
@@ -1,7 +1,7 @@
[package]
name = "pest_debugger"
description = "pest grammar debugger"
version = "2.7.11"
version = "2.7.12"
edition = "2021"
authors = [
"Dragoș Tiselice <[email protected]>",
Expand All @@ -17,9 +17,9 @@ readme = "_README.md"
rust-version = "1.61"

[dependencies]
pest = { path = "../pest", version = "2.7.11" }
pest_meta = { path = "../meta", version = "2.7.11" }
pest_vm = { path = "../vm", version = "2.7.11" }
pest = { path = "../pest", version = "2.7.12" }
pest_meta = { path = "../meta", version = "2.7.12" }
pest_vm = { path = "../vm", version = "2.7.12" }
reqwest = { version = "= 0.11.13", default-features = false, features = [
"blocking",
"json",
Expand Down
6 changes: 3 additions & 3 deletions derive/Cargo.toml
Original file line number Diff line number Diff line change
@@ -1,7 +1,7 @@
[package]
name = "pest_derive"
description = "pest's derive macro"
version = "2.7.11"
version = "2.7.12"
edition = "2021"
authors = ["Dragoș Tiselice <[email protected]>"]
homepage = "https://pest.rs/"
Expand All @@ -25,5 +25,5 @@ grammar-extras = ["pest_generator/grammar-extras"]

[dependencies]
# for tests, included transitively anyway
pest = { path = "../pest", version = "2.7.11", default-features = false }
pest_generator = { path = "../generator", version = "2.7.11", default-features = false }
pest = { path = "../pest", version = "2.7.12", default-features = false }
pest_generator = { path = "../generator", version = "2.7.12", default-features = false }
6 changes: 3 additions & 3 deletions generator/Cargo.toml
Original file line number Diff line number Diff line change
@@ -1,7 +1,7 @@
[package]
name = "pest_generator"
description = "pest code generator"
version = "2.7.11"
version = "2.7.12"
edition = "2021"
authors = ["Dragoș Tiselice <[email protected]>"]
homepage = "https://pest.rs/"
Expand All @@ -22,8 +22,8 @@ grammar-extras = ["pest_meta/grammar-extras"]
export-internal = []

[dependencies]
pest = { path = "../pest", version = "2.7.11", default-features = false }
pest_meta = { path = "../meta", version = "2.7.11" }
pest = { path = "../pest", version = "2.7.12", default-features = false }
pest_meta = { path = "../meta", version = "2.7.12" }
proc-macro2 = "1.0"
quote = "1.0"
syn = "2.0"
6 changes: 3 additions & 3 deletions grammars/Cargo.toml
Original file line number Diff line number Diff line change
@@ -1,7 +1,7 @@
[package]
name = "pest_grammars"
description = "pest popular grammar implementations"
version = "2.7.11"
version = "2.7.12"
edition = "2021"
authors = ["Dragoș Tiselice <[email protected]>"]
homepage = "https://pest.rs/"
Expand All @@ -14,8 +14,8 @@ readme = "_README.md"
rust-version = "1.61"

[dependencies]
pest = { path = "../pest", version = "2.7.11" }
pest_derive = { path = "../derive", version = "2.7.11" }
pest = { path = "../pest", version = "2.7.12" }
pest_derive = { path = "../derive", version = "2.7.12" }

[dev-dependencies]
criterion = "0.5"
Expand Down
4 changes: 2 additions & 2 deletions meta/Cargo.toml
Original file line number Diff line number Diff line change
@@ -1,7 +1,7 @@
[package]
name = "pest_meta"
description = "pest meta language parser and validator"
version = "2.7.11"
version = "2.7.12"
edition = "2021"
authors = ["Dragoș Tiselice <[email protected]>"]
homepage = "https://pest.rs/"
Expand All @@ -22,7 +22,7 @@ include = [
rust-version = "1.61"

[dependencies]
pest = { path = "../pest", version = "2.7.11" }
pest = { path = "../pest", version = "2.7.12" }
once_cell = "1.8.0"

[build-dependencies]
Expand Down
117 changes: 117 additions & 0 deletions meta/src/validator.rs
Original file line number Diff line number Diff line change
Expand Up @@ -226,6 +226,8 @@ pub fn validate_ast<'a, 'i: 'a>(rules: &'a Vec<ParserRule<'i>>) -> Vec<Error<Rul
errors.extend(validate_choices(rules));
errors.extend(validate_whitespace_comment(rules));
errors.extend(validate_left_recursion(rules));
#[cfg(feature = "grammar-extras")]
errors.extend(validate_tag_silent_rules(rules));

errors.sort_by_key(|error| match error.location {
InputLocation::Span(span) => span,
Expand All @@ -235,6 +237,78 @@ pub fn validate_ast<'a, 'i: 'a>(rules: &'a Vec<ParserRule<'i>>) -> Vec<Error<Rul
errors
}

#[cfg(feature = "grammar-extras")]
fn validate_tag_silent_rules<'a, 'i: 'a>(rules: &'a [ParserRule<'i>]) -> Vec<Error<Rule>> {
use crate::ast::RuleType;

fn to_type_hash_map<'a, 'i: 'a>(
rules: &'a [ParserRule<'i>],
) -> HashMap<String, (&'a ParserNode<'i>, RuleType)> {
rules
.iter()
.map(|r| (r.name.clone(), (&r.node, r.ty)))
.collect()
}
let mut result = vec![];

fn check_silent_builtin<'a, 'i: 'a>(
expr: &ParserExpr<'i>,
rules_ref: &HashMap<String, (&'a ParserNode<'i>, RuleType)>,
span: Span<'a>,
) -> Option<Error<Rule>> {
match &expr {
ParserExpr::Ident(rule_name) => {
let rule = rules_ref.get(rule_name);
if matches!(rule, Some((_, RuleType::Silent))) {
return Some(Error::<Rule>::new_from_span(
ErrorVariant::CustomError {
message: "tags on silent rules will not appear in the output"
.to_owned(),
},
span,
));
} else if BUILTINS.contains(rule_name.as_str()) {
return Some(Error::new_from_span(
ErrorVariant::CustomError {
message: "tags on built-in rules will not appear in the output"
.to_owned(),
},
span,
));
}
}
ParserExpr::Rep(node)
| ParserExpr::RepMinMax(node, _, _)
| ParserExpr::RepMax(node, _)
| ParserExpr::RepMin(node, _)
| ParserExpr::RepOnce(node)
| ParserExpr::RepExact(node, _)
| ParserExpr::Opt(node)
| ParserExpr::Push(node)
| ParserExpr::PosPred(node)
| ParserExpr::NegPred(node) => {
return check_silent_builtin(&node.expr, rules_ref, span);
}
_ => {}
};
None
}

let rules_map = to_type_hash_map(rules);
for rule in rules {
let rules_ref = &rules_map;
let mut errors = rule.node.clone().filter_map_top_down(|node1| {
if let ParserExpr::NodeTag(node2, _) = node1.expr {
check_silent_builtin(&node2.expr, rules_ref, node1.span)
} else {
None
}
});
result.append(&mut errors);
}
result
}

/// Checks if `expr` is non-progressing, that is the expression does not
/// consume any input or any stack. This includes expressions matching the empty input,
/// `SOI` and ̀ `EOI`, predicates and repetitions.
Expand Down Expand Up @@ -1796,4 +1870,47 @@ mod tests {
PestParser::parse(Rule::grammar_rules, input).unwrap(),
));
}

#[test]
#[should_panic(expected = "grammar error
--> 1:7
|
1 | a = { #b = b } b = _{ ASCII_DIGIT+ }
| ^----^
|
= tags on silent rules will not appear in the output")]
#[cfg(feature = "grammar-extras")]
fn tag_on_silent_rule() {
let input = "a = { #b = b } b = _{ ASCII_DIGIT+ }";
unwrap_or_report(consume_rules(
PestParser::parse(Rule::grammar_rules, input).unwrap(),
));
}

#[test]
#[should_panic(expected = "grammar error
--> 1:7
|
1 | a = { #b = ASCII_DIGIT+ }
| ^---------------^
|
= tags on built-in rules will not appear in the output")]
#[cfg(feature = "grammar-extras")]
fn tag_on_builtin_rule() {
let input = "a = { #b = ASCII_DIGIT+ }";
unwrap_or_report(consume_rules(
PestParser::parse(Rule::grammar_rules, input).unwrap(),
));
}

#[test]
#[cfg(feature = "grammar-extras")]
fn tag_on_normal_rule() {
let input = "a = { #b = b } b = { ASCII_DIGIT+ }";
unwrap_or_report(consume_rules(
PestParser::parse(Rule::grammar_rules, input).unwrap(),
));
}
}
2 changes: 1 addition & 1 deletion pest/Cargo.toml
Original file line number Diff line number Diff line change
@@ -1,7 +1,7 @@
[package]
name = "pest"
description = "The Elegant Parser"
version = "2.7.11"
version = "2.7.12"
edition = "2021"
authors = ["Dragoș Tiselice <[email protected]>"]
homepage = "https://pest.rs/"
Expand Down
1 change: 1 addition & 0 deletions pest/examples/parens.rs
Original file line number Diff line number Diff line change
Expand Up @@ -48,6 +48,7 @@ impl Parser<Rule> for ParenParser {
}

#[derive(Debug)]
#[allow(dead_code)]
struct Paren(Vec<Paren>);

fn expr(pairs: Pairs<Rule>) -> Vec<Paren> {
Expand Down
37 changes: 18 additions & 19 deletions pest/src/error.rs
Original file line number Diff line number Diff line change
Expand Up @@ -730,14 +730,13 @@ fn visualize_whitespace(input: &str) -> String {

#[cfg(test)]
mod tests {
use super::super::position;
use super::*;
use alloc::vec;

#[test]
fn display_parsing_error_mixed() {
let input = "ab\ncd\nef";
let pos = position::Position::new(input, 4).unwrap();
let pos = Position::new(input, 4).unwrap();
let error: Error<u32> = Error::new_from_pos(
ErrorVariant::ParsingError {
positives: vec![1, 2, 3],
Expand All @@ -763,7 +762,7 @@ mod tests {
#[test]
fn display_parsing_error_positives() {
let input = "ab\ncd\nef";
let pos = position::Position::new(input, 4).unwrap();
let pos = Position::new(input, 4).unwrap();
let error: Error<u32> = Error::new_from_pos(
ErrorVariant::ParsingError {
positives: vec![1, 2],
Expand All @@ -789,7 +788,7 @@ mod tests {
#[test]
fn display_parsing_error_negatives() {
let input = "ab\ncd\nef";
let pos = position::Position::new(input, 4).unwrap();
let pos = Position::new(input, 4).unwrap();
let error: Error<u32> = Error::new_from_pos(
ErrorVariant::ParsingError {
positives: vec![],
Expand All @@ -815,7 +814,7 @@ mod tests {
#[test]
fn display_parsing_error_unknown() {
let input = "ab\ncd\nef";
let pos = position::Position::new(input, 4).unwrap();
let pos = Position::new(input, 4).unwrap();
let error: Error<u32> = Error::new_from_pos(
ErrorVariant::ParsingError {
positives: vec![],
Expand All @@ -841,7 +840,7 @@ mod tests {
#[test]
fn display_custom_pos() {
let input = "ab\ncd\nef";
let pos = position::Position::new(input, 4).unwrap();
let pos = Position::new(input, 4).unwrap();
let error: Error<u32> = Error::new_from_pos(
ErrorVariant::CustomError {
message: "error: big one".to_owned(),
Expand All @@ -866,8 +865,8 @@ mod tests {
#[test]
fn display_custom_span_two_lines() {
let input = "ab\ncd\nefgh";
let start = position::Position::new(input, 4).unwrap();
let end = position::Position::new(input, 9).unwrap();
let start = Position::new(input, 4).unwrap();
let end = Position::new(input, 9).unwrap();
let error: Error<u32> = Error::new_from_span(
ErrorVariant::CustomError {
message: "error: big one".to_owned(),
Expand All @@ -893,8 +892,8 @@ mod tests {
#[test]
fn display_custom_span_three_lines() {
let input = "ab\ncd\nefgh";
let start = position::Position::new(input, 1).unwrap();
let end = position::Position::new(input, 9).unwrap();
let start = Position::new(input, 1).unwrap();
let end = Position::new(input, 9).unwrap();
let error: Error<u32> = Error::new_from_span(
ErrorVariant::CustomError {
message: "error: big one".to_owned(),
Expand All @@ -921,8 +920,8 @@ mod tests {
#[test]
fn display_custom_span_two_lines_inverted_cols() {
let input = "abcdef\ngh";
let start = position::Position::new(input, 5).unwrap();
let end = position::Position::new(input, 8).unwrap();
let start = Position::new(input, 5).unwrap();
let end = Position::new(input, 8).unwrap();
let error: Error<u32> = Error::new_from_span(
ErrorVariant::CustomError {
message: "error: big one".to_owned(),
Expand All @@ -948,8 +947,8 @@ mod tests {
#[test]
fn display_custom_span_end_after_newline() {
let input = "abcdef\n";
let start = position::Position::new(input, 0).unwrap();
let end = position::Position::new(input, 7).unwrap();
let start = Position::new(input, 0).unwrap();
let end = Position::new(input, 7).unwrap();
assert!(start.at_start());
assert!(end.at_end());

Expand Down Expand Up @@ -977,8 +976,8 @@ mod tests {
#[test]
fn display_custom_span_empty() {
let input = "";
let start = position::Position::new(input, 0).unwrap();
let end = position::Position::new(input, 0).unwrap();
let start = Position::new(input, 0).unwrap();
let end = Position::new(input, 0).unwrap();
assert!(start.at_start());
assert!(end.at_end());

Expand Down Expand Up @@ -1006,7 +1005,7 @@ mod tests {
#[test]
fn mapped_parsing_error() {
let input = "ab\ncd\nef";
let pos = position::Position::new(input, 4).unwrap();
let pos = Position::new(input, 4).unwrap();
let error: Error<u32> = Error::new_from_pos(
ErrorVariant::ParsingError {
positives: vec![1, 2, 3],
Expand All @@ -1033,7 +1032,7 @@ mod tests {
#[test]
fn error_with_path() {
let input = "ab\ncd\nef";
let pos = position::Position::new(input, 4).unwrap();
let pos = Position::new(input, 4).unwrap();
let error: Error<u32> = Error::new_from_pos(
ErrorVariant::ParsingError {
positives: vec![1, 2, 3],
Expand All @@ -1060,7 +1059,7 @@ mod tests {
#[test]
fn underline_with_tabs() {
let input = "a\txbc";
let pos = position::Position::new(input, 2).unwrap();
let pos = Position::new(input, 2).unwrap();
let error: Error<u32> = Error::new_from_pos(
ErrorVariant::ParsingError {
positives: vec![1, 2, 3],
Expand Down
1 change: 1 addition & 0 deletions pest/src/parser_state.rs
Original file line number Diff line number Diff line change
Expand Up @@ -438,6 +438,7 @@ pub struct ParserState<'i, R: RuleType> {
/// * CreateUser = { "create" ~ "user" ~ Name }
/// * CreateTable = { "create" ~ "table" ~ Name }
/// * Name = { SOME_DEFINITION }
///
/// While parsing the query we'll update tracker position to the start of "Bobby", because we'd
/// successfully parse "create" + "user" (and not "table").
parse_attempts: ParseAttempts<R>,
Expand Down
Loading

0 comments on commit 1d4dc46

Please sign in to comment.