Use datatest for parser tests (#21936)

2025-12-12 18:21:46 +01:00 · 2025-12-12 18:21:46 +01:00 · f94ac77e2f
parent f095e19c2c
commit f94ac77e2f
4 changed files with 67 additions and 59 deletions
--- a/Cargo.lock
+++ b/Cargo.lock
@ -1663,7 +1663,6 @@ source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "46fdb647ebde000f43b5b53f773c30cf9b0cb4300453208713fa38b2c70935a0"
 dependencies = [
 "console 0.15.11",
- "globset",
 "once_cell",
 "pest",
 "pest_derive",
@ -1671,7 +1670,6 @@ dependencies = [
 "ron",
 "serde",
 "similar",
- "walkdir",
 ]

 [[package]]
@ -3398,6 +3396,7 @@ dependencies = [
 "bitflags 2.10.0",
 "bstr",
 "compact_str",
+ "datatest-stable",
 "get-size2",
 "insta",
 "itertools 0.14.0",
--- a/crates/ruff_python_formatter/Cargo.toml
+++ b/crates/ruff_python_formatter/Cargo.toml
@ -44,7 +44,7 @@ tracing = { workspace = true }
 ruff_formatter = { workspace = true }

 datatest-stable = { workspace = true }
-insta = { workspace = true, features = ["glob"] }
+insta = { workspace = true }
 regex = { workspace = true }
 serde = { workspace = true }
 serde_json = { workspace = true }
--- a/crates/ruff_python_parser/Cargo.toml
+++ b/crates/ruff_python_parser/Cargo.toml
@ -12,6 +12,10 @@ license = { workspace = true }

 [lib]

+[[test]]
+name = "fixtures"
+harness = false
+
 [dependencies]
 ruff_python_ast = { workspace = true, features = ["get-size"] }
 ruff_python_trivia = { workspace = true }
@ -34,7 +38,8 @@ ruff_python_ast = { workspace = true, features = ["serde"] }
 ruff_source_file = { workspace = true }

 anyhow = { workspace = true }
-insta = { workspace = true, features = ["glob"] }
+datatest-stable = { workspace = true }
+insta = { workspace = true }
 itertools = { workspace = true }
 serde = { workspace = true }
 serde_json = { workspace = true }
--- a/crates/ruff_python_parser/tests/fixtures.rs
+++ b/crates/ruff_python_parser/tests/fixtures.rs
@ -1,9 +1,8 @@
 use std::cell::RefCell;
 use std::cmp::Ordering;
 use std::fmt::{Formatter, Write};
-use std::fs;
-use std::path::Path;

+use datatest_stable::Utf8Path;
 use itertools::Itertools;
 use ruff_annotate_snippets::{Level, Renderer, Snippet};
 use ruff_python_ast::token::{Token, Tokens};
@ -17,38 +16,49 @@ use ruff_python_parser::{Mode, ParseErrorType, ParseOptions, Parsed, parse_unche
 use ruff_source_file::{LineIndex, OneIndexed, SourceCode};
 use ruff_text_size::{Ranged, TextLen, TextRange, TextSize};

-#[test]
-fn valid_syntax() {
-    insta::glob!("../resources", "valid/**/*.py", test_valid_syntax);
+#[expect(clippy::needless_pass_by_value, clippy::unnecessary_wraps)]
+fn valid_syntax(path: &Utf8Path, content: String) -> datatest_stable::Result<()> {
+    test_valid_syntax(path, &content, "./resources/valid");
+    Ok(())
 }

-#[test]
-fn invalid_syntax() {
-    insta::glob!("../resources", "invalid/**/*.py", test_invalid_syntax);
+#[expect(clippy::needless_pass_by_value, clippy::unnecessary_wraps)]
+fn invalid_syntax(path: &Utf8Path, content: String) -> datatest_stable::Result<()> {
+    test_invalid_syntax(path, &content, "./resources/invalid");
+    Ok(())
 }

-#[test]
-fn inline_ok() {
-    insta::glob!("../resources/inline", "ok/**/*.py", test_valid_syntax);
+#[expect(clippy::needless_pass_by_value, clippy::unnecessary_wraps)]
+fn inline_ok(path: &Utf8Path, content: String) -> datatest_stable::Result<()> {
+    test_valid_syntax(path, &content, "./resources/inline/ok");
+    Ok(())
 }

-#[test]
-fn inline_err() {
-    insta::glob!("../resources/inline", "err/**/*.py", test_invalid_syntax);
+#[expect(clippy::needless_pass_by_value, clippy::unnecessary_wraps)]
+fn inline_err(path: &Utf8Path, content: String) -> datatest_stable::Result<()> {
+    test_invalid_syntax(path, &content, "./resources/inline/err");
+    Ok(())
+}
+
+datatest_stable::harness! {
+    { test = valid_syntax, root = "./resources/valid", pattern = r"\.pyi?$" },
+    { test = inline_ok, root = "./resources/inline/ok", pattern = r"\.pyi?$" },
+    { test = invalid_syntax, root = "./resources/invalid", pattern = r"\.pyi?$" },
+    { test = inline_err, root="./resources/inline/err", pattern = r"\.pyi?$" }
 }

 /// Asserts that the parser generates no syntax errors for a valid program.
 /// Snapshots the AST.
-fn test_valid_syntax(input_path: &Path) {
-    let source = fs::read_to_string(input_path).expect("Expected test file to exist");
-    let options = extract_options(&source).unwrap_or_else(|| {
+fn test_valid_syntax(input_path: &Utf8Path, source: &str, root: &str) {
+    let test_name = input_path.strip_prefix(root).unwrap_or(input_path).as_str();
+    let options = extract_options(source).unwrap_or_else(|| {
        ParseOptions::from(Mode::Module).with_target_version(PythonVersion::latest_preview())
    });
-    let parsed = parse_unchecked(&source, options.clone());
+    let parsed = parse_unchecked(source, options.clone());

    if parsed.has_syntax_errors() {
-        let line_index = LineIndex::from_source_text(&source);
-        let source_code = SourceCode::new(&source, &line_index);
+        let line_index = LineIndex::from_source_text(source);
+        let source_code = SourceCode::new(source, &line_index);

        let mut message = "Expected no syntax errors for a valid program but the parser generated the following errors:\n".to_string();

@ -81,8 +91,8 @@ fn test_valid_syntax(input_path: &Path) {
        panic!("{input_path:?}: {message}");
    }

-    validate_tokens(parsed.tokens(), source.text_len(), input_path);
-    validate_ast(&parsed, source.text_len(), input_path);
+    validate_tokens(parsed.tokens(), source.text_len());
+    validate_ast(&parsed, source.text_len());

    let mut output = String::new();
    writeln!(&mut output, "## AST").unwrap();
@ -91,7 +101,7 @@ fn test_valid_syntax(input_path: &Path) {
    let parsed = parsed.try_into_module().expect("Parsed with Mode::Module");

    let mut visitor =
-        SemanticSyntaxCheckerVisitor::new(&source).with_python_version(options.target_version());
+        SemanticSyntaxCheckerVisitor::new(source).with_python_version(options.target_version());

    for stmt in parsed.suite() {
        visitor.visit_stmt(stmt);
@ -102,8 +112,8 @@ fn test_valid_syntax(input_path: &Path) {
    if !semantic_syntax_errors.is_empty() {
        let mut message = "Expected no semantic syntax errors for a valid program:\n".to_string();

-        let line_index = LineIndex::from_source_text(&source);
-        let source_code = SourceCode::new(&source, &line_index);
+        let line_index = LineIndex::from_source_text(source);
+        let source_code = SourceCode::new(source, &line_index);

        for error in semantic_syntax_errors {
            writeln!(
@ -125,6 +135,7 @@ fn test_valid_syntax(input_path: &Path) {
        omit_expression => true,
        input_file => input_path,
        prepend_module_to_snapshot => false,
+        snapshot_suffix => test_name
    }, {
        insta::assert_snapshot!(output);
    });
@ -132,22 +143,23 @@ fn test_valid_syntax(input_path: &Path) {

 /// Assert that the parser generates at least one syntax error for the given input file.
 /// Snapshots the AST and the error messages.
-fn test_invalid_syntax(input_path: &Path) {
-    let source = fs::read_to_string(input_path).expect("Expected test file to exist");
-    let options = extract_options(&source).unwrap_or_else(|| {
+fn test_invalid_syntax(input_path: &Utf8Path, source: &str, root: &str) {
+    let test_name = input_path.strip_prefix(root).unwrap_or(input_path).as_str();
+
+    let options = extract_options(source).unwrap_or_else(|| {
        ParseOptions::from(Mode::Module).with_target_version(PythonVersion::PY314)
    });
-    let parsed = parse_unchecked(&source, options.clone());
+    let parsed = parse_unchecked(source, options.clone());

-    validate_tokens(parsed.tokens(), source.text_len(), input_path);
-    validate_ast(&parsed, source.text_len(), input_path);
+    validate_tokens(parsed.tokens(), source.text_len());
+    validate_ast(&parsed, source.text_len());

    let mut output = String::new();
    writeln!(&mut output, "## AST").unwrap();
    writeln!(&mut output, "\n```\n{:#?}\n```", parsed.syntax()).unwrap();

-    let line_index = LineIndex::from_source_text(&source);
-    let source_code = SourceCode::new(&source, &line_index);
+    let line_index = LineIndex::from_source_text(source);
+    let source_code = SourceCode::new(source, &line_index);

    if !parsed.errors().is_empty() {
        writeln!(&mut output, "## Errors\n").unwrap();
@ -186,7 +198,7 @@ fn test_invalid_syntax(input_path: &Path) {
    let parsed = parsed.try_into_module().expect("Parsed with Mode::Module");

    let mut visitor =
-        SemanticSyntaxCheckerVisitor::new(&source).with_python_version(options.target_version());
+        SemanticSyntaxCheckerVisitor::new(source).with_python_version(options.target_version());

    for stmt in parsed.suite() {
        visitor.visit_stmt(stmt);
@ -196,7 +208,7 @@ fn test_invalid_syntax(input_path: &Path) {

    assert!(
        parsed.has_syntax_errors() || !semantic_syntax_errors.is_empty(),
-        "{input_path:?}: Expected parser to generate at least one syntax error for a program containing syntax errors."
+        "Expected parser to generate at least one syntax error for a program containing syntax errors."
    );

    if !semantic_syntax_errors.is_empty() {
@ -220,6 +232,7 @@ fn test_invalid_syntax(input_path: &Path) {
        omit_expression => true,
        input_file => input_path,
        prepend_module_to_snapshot => false,
+        snapshot_suffix => test_name
    }, {
        insta::assert_snapshot!(output);
    });
@ -372,26 +385,24 @@ impl std::fmt::Display for CodeFrame<'_> {
 /// Verifies that:
 /// * the ranges are strictly increasing when looping over the tokens in insertion order
 /// * all ranges are within the length of the source code
-fn validate_tokens(tokens: &[Token], source_length: TextSize, test_path: &Path) {
+fn validate_tokens(tokens: &[Token], source_length: TextSize) {
    let mut previous: Option<&Token> = None;

    for token in tokens {
        assert!(
            token.end() <= source_length,
-            "{path}: Token range exceeds the source code length. Token: {token:#?}",
-            path = test_path.display()
+            "Token range exceeds the source code length. Token: {token:#?}",
        );

        if let Some(previous) = previous {
            assert_eq!(
                previous.range().ordering(token.range()),
                Ordering::Less,
-                "{path}: Token ranges are not in increasing order
+                "Token ranges are not in increasing order
 Previous token: {previous:#?}
 Current token: {token:#?}
 Tokens: {tokens:#?}
 ",
-                path = test_path.display(),
            );
        }

@ -403,9 +414,9 @@ Tokens: {tokens:#?}
 /// * the range of the parent node fully encloses all its child nodes
 /// * the ranges are strictly increasing when traversing the nodes in pre-order.
 /// * all ranges are within the length of the source code.
-fn validate_ast(parsed: &Parsed<Mod>, source_len: TextSize, test_path: &Path) {
+fn validate_ast(parsed: &Parsed<Mod>, source_len: TextSize) {
    walk_module(
-        &mut ValidateAstVisitor::new(parsed.tokens(), source_len, test_path),
+        &mut ValidateAstVisitor::new(parsed.tokens(), source_len),
        parsed.syntax(),
    );
 }
@ -416,17 +427,15 @@ struct ValidateAstVisitor<'a> {
    parents: Vec<AnyNodeRef<'a>>,
    previous: Option<AnyNodeRef<'a>>,
    source_length: TextSize,
-    test_path: &'a Path,
 }

 impl<'a> ValidateAstVisitor<'a> {
-    fn new(tokens: &'a Tokens, source_length: TextSize, test_path: &'a Path) -> Self {
+    fn new(tokens: &'a Tokens, source_length: TextSize) -> Self {
        Self {
            tokens: tokens.iter().peekable(),
            parents: Vec::new(),
            previous: None,
            source_length,
-            test_path,
        }
    }
 }
@ -444,8 +453,7 @@ impl ValidateAstVisitor<'_> {
            // At this point, next_token.end() > node.start()
            assert!(
                next.start() >= node.start(),
-                "{path}: The start of the node falls within a token.\nNode: {node:#?}\n\nToken: {next:#?}\n\nRoot: {root:#?}",
-                path = self.test_path.display(),
+                "The start of the node falls within a token.\nNode: {node:#?}\n\nToken: {next:#?}\n\nRoot: {root:#?}",
                root = self.parents.first()
            );
        }
@ -464,8 +472,7 @@ impl ValidateAstVisitor<'_> {
            // At this point, `next_token.end() > node.end()`
            assert!(
                next.start() >= node.end(),
-                "{path}: The end of the node falls within a token.\nNode: {node:#?}\n\nToken: {next:#?}\n\nRoot: {root:#?}",
-                path = self.test_path.display(),
+                "The end of the node falls within a token.\nNode: {node:#?}\n\nToken: {next:#?}\n\nRoot: {root:#?}",
                root = self.parents.first()
            );
        }
@ -476,16 +483,14 @@ impl<'ast> SourceOrderVisitor<'ast> for ValidateAstVisitor<'ast> {
    fn enter_node(&mut self, node: AnyNodeRef<'ast>) -> TraversalSignal {
        assert!(
            node.end() <= self.source_length,
-            "{path}: The range of the node exceeds the length of the source code. Node: {node:#?}",
-            path = self.test_path.display()
+            "The range of the node exceeds the length of the source code. Node: {node:#?}",
        );

        if let Some(previous) = self.previous {
            assert_ne!(
                previous.range().ordering(node.range()),
                Ordering::Greater,
-                "{path}: The ranges of the nodes are not strictly increasing when traversing the AST in pre-order.\nPrevious node: {previous:#?}\n\nCurrent node: {node:#?}\n\nRoot: {root:#?}",
-                path = self.test_path.display(),
+                "The ranges of the nodes are not strictly increasing when traversing the AST in pre-order.\nPrevious node: {previous:#?}\n\nCurrent node: {node:#?}\n\nRoot: {root:#?}",
                root = self.parents.first()
            );
        }
@ -493,8 +498,7 @@ impl<'ast> SourceOrderVisitor<'ast> for ValidateAstVisitor<'ast> {
        if let Some(parent) = self.parents.last() {
            assert!(
                parent.range().contains_range(node.range()),
-                "{path}: The range of the parent node does not fully enclose the range of the child node.\nParent node: {parent:#?}\n\nChild node: {node:#?}\n\nRoot: {root:#?}",
-                path = self.test_path.display(),
+                "The range of the parent node does not fully enclose the range of the child node.\nParent node: {parent:#?}\n\nChild node: {node:#?}\n\nRoot: {root:#?}",
                root = self.parents.first()
            );
        }