-
Notifications
You must be signed in to change notification settings - Fork 12.9k
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Rollup merge of #133730 - dtolnay:parentest, r=compiler-errors
Add pretty-printer parenthesis insertion test This test demonstrates numerous bugs in rustc_ast_pretty, including all five of: - Failing to insert parentheses where necessary to preserve the meaning of a syntax tree, producing invalid syntax. - Failing to insert parentheses, producing valid syntax with the wrong meaning. - Inserting too many parentheses. - Inserting parentheses in the wrong place, producing invalid syntax. - Losing syntactically significant parts of the syntax tree. These pretty-printer bugs have consequences for `-Zunpretty=expanded`. The `cargo expand` subcommand cannot work reliably unless rustc can consistently produce valid Rust output. Erroneous syntax cannot be passed through rustfmt, or queried with [syn-select](https://crates.io/crates/syn-select). The test in this PR is a port of a test from Syn that tests the automatic parenthesis insertion performed by Syn's `ToTokens` impls. In Syn we actually run this test over every expression in every Rust source file in the whole rust-lang/rust repo, including rustc and the standard library and tools and test suites. For the test here, I have only used a small selection of interesting expressions. This will serve as an easy spot to accumulate regression tests as the various bugs get fixed. Once rustc's pretty-printer is in better shape, it's possible that the test can be expanded to cover a larger set of expressions collected automatically like in Syn.
- Loading branch information
Showing
1 changed file
with
242 additions
and
0 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,242 @@ | ||
//@ run-pass | ||
//@ ignore-cross-compile | ||
|
||
// This test covers the AST pretty-printer's automatic insertion of parentheses | ||
// into unparenthesized syntax trees according to precedence and various grammar | ||
// restrictions and edge cases. | ||
// | ||
// For example if the following syntax tree represents the expression a*(b+c), | ||
// in which the parenthesis is necessary for precedence: | ||
// | ||
// Binary('*', Path("a"), Paren(Binary('+', Path("b"), Path("c")))) | ||
// | ||
// then the pretty-printer needs to be able to print the following | ||
// unparenthesized syntax tree with an automatically inserted parenthesization. | ||
// | ||
// Binary('*', Path("a"), Binary('+', Path("b"), Path("c"))) | ||
// | ||
// Handling this correctly is relevant in real-world code when pretty-printing | ||
// macro-generated syntax trees, in which expressions can get interpolated into | ||
// one another without any parenthesization being visible in the syntax tree. | ||
// | ||
// macro_rules! repro { | ||
// ($rhs:expr) => { | ||
// a * $rhs | ||
// }; | ||
// } | ||
// | ||
// let _ = repro!(b + c); | ||
|
||
#![feature(rustc_private)] | ||
|
||
extern crate rustc_ast; | ||
extern crate rustc_ast_pretty; | ||
extern crate rustc_driver; | ||
extern crate rustc_errors; | ||
extern crate rustc_parse; | ||
extern crate rustc_session; | ||
extern crate rustc_span; | ||
extern crate smallvec; | ||
|
||
use std::mem; | ||
use std::process::ExitCode; | ||
|
||
use rustc_ast::ast::{DUMMY_NODE_ID, Expr, ExprKind, Stmt}; | ||
use rustc_ast::mut_visit::{self, DummyAstNode as _, MutVisitor}; | ||
use rustc_ast::node_id::NodeId; | ||
use rustc_ast::ptr::P; | ||
use rustc_ast_pretty::pprust; | ||
use rustc_errors::Diag; | ||
use rustc_parse::parser::Recovery; | ||
use rustc_session::parse::ParseSess; | ||
use rustc_span::{DUMMY_SP, FileName, Span}; | ||
use smallvec::SmallVec; | ||
|
||
// Every parenthesis in the following expressions is re-inserted by the | ||
// pretty-printer. | ||
// | ||
// FIXME: Some of them shouldn't be. | ||
static EXPRS: &[&str] = &[ | ||
// Straightforward binary operator precedence. | ||
"2 * 2 + 2", | ||
"2 + 2 * 2", | ||
"(2 + 2) * 2", | ||
"2 * (2 + 2)", | ||
"2 + 2 + 2", | ||
// Return has lower precedence than a binary operator. | ||
"(return 2) + 2", | ||
"2 + (return 2)", // FIXME: no parenthesis needed. | ||
"(return) + 2", // FIXME: no parenthesis needed. | ||
// These mean different things. | ||
"return - 2", | ||
"(return) - 2", | ||
// These mean different things. | ||
"if let _ = true && false {}", | ||
"if let _ = (true && false) {}", | ||
// Conditions end at the first curly brace, so struct expressions need to be | ||
// parenthesized. Except in a match guard, where conditions end at arrow. | ||
"if let _ = (Struct {}) {}", | ||
"match 2 { _ if let _ = Struct {} => {} }", | ||
// Match arms terminate eagerly, so parenthesization is needed around some | ||
// expressions. | ||
"match 2 { _ => 1 - 1 }", | ||
"match 2 { _ => ({ 1 }) - 1 }", | ||
// Grammar restriction: break value starting with a labeled loop is not | ||
// allowed, except if the break is also labeled. | ||
"break 'outer 'inner: loop {} + 2", | ||
"break ('inner: loop {} + 2)", | ||
// Grammar restriction: the value in let-else is not allowed to end in a | ||
// curly brace. | ||
"{ let _ = 1 + 1 else {}; }", | ||
"{ let _ = (loop {}) else {}; }", | ||
"{ let _ = mac!() else {}; }", | ||
"{ let _ = (mac! {}) else {}; }", | ||
// Parentheses are necessary to prevent an eager statement boundary. | ||
"{ 2 - 1 }", | ||
"{ (match 2 {}) - 1 }", | ||
"{ (match 2 {})() - 1 }", | ||
"{ (match 2 {})[0] - 1 }", | ||
"{ (loop {}) - 1 }", | ||
// Angle bracket is eagerly parsed as a path's generic argument list. | ||
"(2 as T) < U", | ||
"(2 as T<U>) < V", // FIXME: no parentheses needed. | ||
/* | ||
// FIXME: pretty-printer produces invalid syntax. `2 + 2 as T < U` | ||
"(2 + 2 as T) < U", | ||
*/ | ||
/* | ||
// FIXME: pretty-printer produces invalid syntax. `if (let _ = () && Struct {}.x) {}` | ||
"if let _ = () && (Struct {}).x {}", | ||
*/ | ||
/* | ||
// FIXME: pretty-printer produces invalid syntax. `(1 < 2 == false) as usize` | ||
"((1 < 2) == false) as usize", | ||
*/ | ||
/* | ||
// FIXME: pretty-printer produces invalid syntax. `for _ in 1..{ 2 } {}` | ||
"for _ in (1..{ 2 }) {}", | ||
*/ | ||
/* | ||
// FIXME: pretty-printer loses the attribute. `{ let Struct { field } = s; }` | ||
"{ let Struct { #[attr] field } = s; }", | ||
*/ | ||
/* | ||
// FIXME: pretty-printer turns this into a range. `0..to_string()` | ||
"(0.).to_string()", | ||
"0. .. 1.", | ||
*/ | ||
/* | ||
// FIXME: pretty-printer loses the dyn*. `i as Trait` | ||
"i as dyn* Trait", | ||
*/ | ||
]; | ||
|
||
// Flatten the content of parenthesis nodes into their parent node. For example | ||
// this syntax tree representing the expression a*(b+c): | ||
// | ||
// Binary('*', Path("a"), Paren(Binary('+', Path("b"), Path("c")))) | ||
// | ||
// would unparenthesize to: | ||
// | ||
// Binary('*', Path("a"), Binary('+', Path("b"), Path("c"))) | ||
struct Unparenthesize; | ||
|
||
impl MutVisitor for Unparenthesize { | ||
fn visit_expr(&mut self, e: &mut P<Expr>) { | ||
while let ExprKind::Paren(paren) = &mut e.kind { | ||
**e = mem::replace(&mut *paren, Expr::dummy()); | ||
} | ||
mut_visit::walk_expr(self, e); | ||
} | ||
} | ||
|
||
// Erase Span information that could distinguish between identical expressions | ||
// parsed from different source strings. | ||
struct Normalize; | ||
|
||
impl MutVisitor for Normalize { | ||
const VISIT_TOKENS: bool = true; | ||
|
||
fn visit_id(&mut self, id: &mut NodeId) { | ||
*id = DUMMY_NODE_ID; | ||
} | ||
|
||
fn visit_span(&mut self, span: &mut Span) { | ||
*span = DUMMY_SP; | ||
} | ||
|
||
fn visit_expr(&mut self, expr: &mut P<Expr>) { | ||
if let ExprKind::Binary(binop, _left, _right) = &mut expr.kind { | ||
self.visit_span(&mut binop.span); | ||
} | ||
mut_visit::walk_expr(self, expr); | ||
} | ||
|
||
fn flat_map_stmt(&mut self, mut stmt: Stmt) -> SmallVec<[Stmt; 1]> { | ||
self.visit_span(&mut stmt.span); | ||
mut_visit::walk_flat_map_stmt(self, stmt) | ||
} | ||
} | ||
|
||
fn parse_expr(psess: &ParseSess, source_code: &str) -> Option<P<Expr>> { | ||
let parser = rustc_parse::unwrap_or_emit_fatal(rustc_parse::new_parser_from_source_str( | ||
psess, | ||
FileName::anon_source_code(source_code), | ||
source_code.to_owned(), | ||
)); | ||
|
||
let mut expr = parser.recovery(Recovery::Forbidden).parse_expr().map_err(Diag::cancel).ok()?; | ||
Normalize.visit_expr(&mut expr); | ||
Some(expr) | ||
} | ||
|
||
fn main() -> ExitCode { | ||
let mut status = ExitCode::SUCCESS; | ||
let mut fail = |description: &str, before: &str, after: &str| { | ||
status = ExitCode::FAILURE; | ||
eprint!( | ||
"{description}\n BEFORE: {before}\n AFTER: {after}\n\n", | ||
before = before.replace('\n', "\n "), | ||
after = after.replace('\n', "\n "), | ||
); | ||
}; | ||
|
||
rustc_span::create_default_session_globals_then(|| { | ||
let psess = &ParseSess::new(vec![rustc_parse::DEFAULT_LOCALE_RESOURCE]); | ||
|
||
for &source_code in EXPRS { | ||
let expr = parse_expr(psess, source_code).unwrap(); | ||
|
||
// Check for FALSE POSITIVE: pretty-printer inserting parentheses where not needed. | ||
// Pseudocode: | ||
// assert(expr == parse(print(expr))) | ||
let printed = &pprust::expr_to_string(&expr); | ||
let Some(expr2) = parse_expr(psess, printed) else { | ||
fail("Pretty-printer produced invalid syntax", source_code, printed); | ||
continue; | ||
}; | ||
if format!("{expr:#?}") != format!("{expr2:#?}") { | ||
fail("Pretty-printer inserted unnecessary parenthesis", source_code, printed); | ||
continue; | ||
} | ||
|
||
// Check for FALSE NEGATIVE: pretty-printer failing to place necessary parentheses. | ||
// Pseudocode: | ||
// assert(unparenthesize(expr) == unparenthesize(parse(print(unparenthesize(expr))))) | ||
let mut expr = expr; | ||
Unparenthesize.visit_expr(&mut expr); | ||
let printed = &pprust::expr_to_string(&expr); | ||
let Some(mut expr2) = parse_expr(psess, printed) else { | ||
fail("Pretty-printer with no parens produced invalid syntax", source_code, printed); | ||
continue; | ||
}; | ||
Unparenthesize.visit_expr(&mut expr2); | ||
if format!("{expr:#?}") != format!("{expr2:#?}") { | ||
fail("Pretty-printer lost necessary parentheses", source_code, printed); | ||
continue; | ||
} | ||
} | ||
}); | ||
|
||
status | ||
} |