Extend ruff_dev formatter script to compute statistics and format a project (#5492)

## Summary This extends the `ruff_dev` formatter script util. Instead of only doing stability checks, you can now choose different compatible options on the CLI and get statistics. * It adds an option the formats all files that ruff would check to allow looking at an entire black-formatted repository with `git diff` * It computes the [Jaccard index](https://en.wikipedia.org/wiki/Jaccard_index) as a measure of deviation between input and output, which is useful as single number metric for assessing our current deviations from black. * It adds progress bars to both the single projects as well as the multi-project mode. * It adds an option to write the multi-project output to a file Sample usage: ``` $ cargo run --bin ruff_dev -- format-dev --stability-check crates/ruff/resources/test/cpython $ cargo run --bin ruff_dev -- format-dev --stability-check /home/konsti/projects/django Syntax error in /home/konsti/projects/django/tests/test_runner_apps/tagged/tests_syntax_error.py: source contains syntax errors (parser error): BaseError { error: UnrecognizedToken(Name { name: "syntax_error" }, None), offset: 131, source_path: "<filename>" } Found 0 stability errors in 2755 files (jaccard index 0.911) in 9.75s $ cargo run --bin ruff_dev -- format-dev --write /home/konsti/projects/django ``` Options: ``` Several utils related to the formatter which can be run on one or more repositories. The selected set of files in a repository is the same as for `ruff check`. * Check formatter stability: Format a repository twice and ensure that it looks that the first and second formatting look the same. * Format: Format the files in a repository to be able to check them with `git diff` * Statistics: The subcommand the Jaccard index between the (assumed to be black formatted) input and the ruff formatted output Usage: ruff_dev format-dev [OPTIONS] [FILES]... Arguments: [FILES]... Like `ruff check`'s files. See `--multi-project` if you want to format an ecosystem checkout Options: --stability-check Check stability We want to ensure that once formatted content stays the same when formatted again, which is known as formatter stability or formatter idempotency, and that the formatter prints syntactically valid code. As our test cases cover only a limited amount of code, this allows checking entire repositories. --write Format the files. Without this flag, the python files are not modified --format <FORMAT> Control the verbosity of the output [default: default] Possible values: - minimal: Filenames only - default: Filenames and reduced diff - full: Full diff and invalid code -x, --exit-first-error Print only the first error and exit, `-x` is same as pytest --multi-project Checks each project inside a directory, useful e.g. if you want to check all of the ecosystem checkouts --error-file <ERROR_FILE> Write all errors to this file in addition to stdout. Only used in multi-project mode ``` ## Test Plan I ran this on django (2755 files, jaccard index 0.911) and discovered a magic trailing comma problem and that we really needed to implement import formatting. I ran the script on cpython to identify https://github.com/astral-sh/ruff/pull/5558.
2025-07-24 13:33:50 +00:00 · 2023-07-07 13:30:12 +02:00 · 2023-07-07 13:30:12 +02:00 · b22e6c3d38
commit b22e6c3d38
parent 40ddc1604c
10 changed files with 726 additions and 499 deletions
--- a/Cargo.lock
+++ b/Cargo.lock
@ -404,6 +404,7 @@ dependencies = [
 "encode_unicode",
 "lazy_static",
 "libc",
+ "unicode-width",
 "windows-sys 0.45.0",
 ]

@ -949,6 +950,19 @@ dependencies = [
 "hashbrown 0.14.0",
 ]

+[[package]]
+name = "indicatif"
+version = "0.17.5"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "8ff8cc23a7393a397ed1d7f56e6365cba772aba9f9912ab968b03043c395d057"
+dependencies = [
+ "console",
+ "instant",
+ "number_prefix",
+ "portable-atomic",
+ "unicode-width",
+]
+
 [[package]]
 name = "inotify"
 version = "0.9.6"
@ -1333,6 +1347,12 @@ dependencies = [
 "libc",
 ]

+[[package]]
+name = "number_prefix"
+version = "0.4.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "830b246a0e5f20af87141b25c173cd1b609bd7779a4617d6ec582abaf90870f3"
+
 [[package]]
 name = "once_cell"
 version = "1.18.0"
@ -1557,6 +1577,12 @@ dependencies = [
 "syn 1.0.109",
 ]

+[[package]]
+name = "portable-atomic"
+version = "1.3.3"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "767eb9f07d4a5ebcb39bbf2d452058a93c011373abf6832e24194a1c3f004794"
+
 [[package]]
 name = "predicates"
 version = "3.0.3"
@ -1959,6 +1985,8 @@ version = "0.0.0"
 dependencies = [
 "anyhow",
 "clap",
+ "ignore",
+ "indicatif",
 "itertools",
 "libcst",
 "log",
@ -1969,6 +1997,7 @@ dependencies = [
 "ruff",
 "ruff_cli",
 "ruff_diagnostics",
+ "ruff_formatter",
 "ruff_python_formatter",
 "ruff_python_stdlib",
 "ruff_textwrap",
@ -1979,6 +2008,7 @@ dependencies = [
 "similar",
 "strum",
 "strum_macros",
+ "tempfile",
 ]

 [[package]]
@ -2071,6 +2101,7 @@ dependencies = [
 "serde_json",
 "similar",
 "smallvec",
+ "thiserror",
 ]

 [[package]]
@ -2629,18 +2660,18 @@ dependencies = [

 [[package]]
 name = "thiserror"
-version = "1.0.41"
+version = "1.0.43"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "c16a64ba9387ef3fdae4f9c1a7f07a0997fce91985c0336f1ddc1822b3b37802"
+checksum = "a35fc5b8971143ca348fa6df4f024d4d55264f3468c71ad1c2f365b0a4d58c42"
 dependencies = [
 "thiserror-impl",
 ]

 [[package]]
 name = "thiserror-impl"
-version = "1.0.41"
+version = "1.0.43"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "d14928354b01c4d6a4f0e549069adef399a284e7995c7ccca94e8a07a5346c59"
+checksum = "463fe12d7993d3b327787537ce8dd4dfa058de32fc2b195ef3cde03dc4771e8f"
 dependencies = [
 "proc-macro2",
 "quote",
--- a/Cargo.toml
+++ b/Cargo.toml
@ -45,6 +45,7 @@ strum = { version = "0.24.1", features = ["strum_macros"] }
 strum_macros = { version = "0.24.3" }
 syn = { version = "2.0.15" }
 test-case = { version = "3.0.0" }
+thiserror = { version = "1.0.43" }
 toml = { version = "0.7.2" }

 # v0.0.1
--- a/crates/ruff/Cargo.toml
+++ b/crates/ruff/Cargo.toml
@ -74,7 +74,7 @@ shellexpand = { workspace = true }
 smallvec = { workspace = true }
 strum = { workspace = true }
 strum_macros = { workspace = true }
-thiserror = { version = "1.0.38" }
+thiserror = { version = "1.0.43" }
 toml = { workspace = true }
 typed-arena = { version = "2.0.2" }
 unicode-width = { version = "0.1.10" }
--- a/crates/ruff_cli/src/args.rs
+++ b/crates/ruff_cli/src/args.rs
@ -74,7 +74,8 @@ pub enum Command {
    },
 }

-#[derive(Clone, Debug, clap::Args)]
+// The `Parser` derive is for ruff_dev, for ruff_cli `Args` would be sufficient
+#[derive(Clone, Debug, clap::Parser)]
 #[allow(clippy::struct_excessive_bools, clippy::module_name_repetitions)]
 pub struct CheckArgs {
    /// List of files or directories to check.
--- a/crates/ruff_dev/Cargo.toml
+++ b/crates/ruff_dev/Cargo.toml
@ -14,12 +14,15 @@ license = { workspace = true }
 ruff = { path = "../ruff", features = ["schemars"] }
 ruff_cli = { path = "../ruff_cli" }
 ruff_diagnostics = { path = "../ruff_diagnostics" }
+ruff_formatter = { path = "../ruff_formatter" }
 ruff_python_formatter = { path = "../ruff_python_formatter" }
 ruff_python_stdlib = { path = "../ruff_python_stdlib" }
 ruff_textwrap = { path = "../ruff_textwrap" }

 anyhow = { workspace = true }
 clap = { workspace = true }
+ignore = { workspace = true }
+indicatif = "0.17.5"
 itertools = { workspace = true }
 libcst = { workspace = true }
 log = { workspace = true }
@ -34,3 +37,4 @@ serde_json = { workspace = true }
 similar = { workspace = true }
 strum = { workspace = true }
 strum_macros = { workspace = true }
+tempfile = "3.6.0"
--- a/crates/ruff_dev/src/check_formatter_stability.rs
+++ b/crates/ruff_dev/src/check_formatter_stability.rs
@ -1,472 +0,0 @@
-//! We want to ensure that once formatted content stays the same when formatted again, which is
-//! known as formatter stability or formatter idempotency, and that the formatter prints
-//! syntactically valid code. As our test cases cover only a limited amount of code, this allows
-//! checking entire repositories.
-
-use std::fmt::{Display, Formatter};
-use std::fs::File;
-use std::io::Write;
-use std::io::{stdout, BufWriter};
-use std::panic::catch_unwind;
-use std::path::{Path, PathBuf};
-use std::process::ExitCode;
-use std::sync::mpsc::channel;
-use std::time::{Duration, Instant};
-use std::{fmt, fs, iter};
-
-use anyhow::{bail, Context};
-use clap::Parser;
-use log::debug;
-use similar::{ChangeTag, TextDiff};
-
-use ruff::resolver::python_files_in_path;
-use ruff::settings::types::{FilePattern, FilePatternSet};
-use ruff_cli::args::CheckArgs;
-use ruff_cli::resolve::resolve;
-use ruff_python_formatter::{format_module, PyFormatOptions};
-
-/// Control the verbosity of the output
-#[derive(Copy, Clone, PartialEq, Eq, clap::ValueEnum, Default)]
-pub(crate) enum Format {
-    /// Filenames only
-    Minimal,
-    /// Filenames and reduced diff
-    #[default]
-    Default,
-    /// Full diff and invalid code
-    Full,
-}
-
-#[derive(clap::Args)]
-pub(crate) struct Args {
-    /// Like `ruff check`'s files
-    pub(crate) files: Vec<PathBuf>,
-    /// Control the verbosity of the output
-    #[arg(long, default_value_t, value_enum)]
-    pub(crate) format: Format,
-    /// Print only the first error and exit, `-x` is same as pytest
-    #[arg(long, short = 'x')]
-    pub(crate) exit_first_error: bool,
-    /// Checks each project inside a directory
-    #[arg(long)]
-    pub(crate) multi_project: bool,
-    /// Write all errors to this file in addition to stdout
-    #[arg(long)]
-    pub(crate) error_file: Option<PathBuf>,
-}
-
-/// Generate ourself a `try_parse_from` impl for `CheckArgs`. This is a strange way to use clap but
-/// we want the same behaviour as `ruff_cli` and clap seems to lack a way to parse directly to
-/// `Args` instead of a `Parser`
-#[derive(Debug, clap::Parser)]
-struct WrapperArgs {
-    #[clap(flatten)]
-    check_args: CheckArgs,
-}
-
-pub(crate) fn main(args: &Args) -> anyhow::Result<ExitCode> {
-    let all_success = if args.multi_project {
-        check_multi_project(args)
-    } else {
-        let result = check_repo(args)?;
-
-        #[allow(clippy::print_stdout)]
-        {
-            print!("{}", result.display(args.format));
-            println!(
-                "Found {} stability errors in {} files in {:.2}s",
-                result.diagnostics.len(),
-                result.file_count,
-                result.duration.as_secs_f32(),
-            );
-        }
-
-        result.is_success()
-    };
-    if all_success {
-        Ok(ExitCode::SUCCESS)
-    } else {
-        Ok(ExitCode::FAILURE)
-    }
-}
-
-enum Message {
-    Start {
-        path: PathBuf,
-    },
-    Failed {
-        path: PathBuf,
-        error: anyhow::Error,
-    },
-    Finished {
-        path: PathBuf,
-        result: CheckRepoResult,
-    },
-}
-
-fn check_multi_project(args: &Args) -> bool {
-    let mut all_success = true;
-    let mut total_errors = 0;
-    let mut total_files = 0;
-    let start = Instant::now();
-
-    rayon::scope(|scope| {
-        let (sender, receiver) = channel();
-
-        for base_dir in &args.files {
-            for dir in base_dir.read_dir().unwrap() {
-                let path = dir.unwrap().path().clone();
-
-                let sender = sender.clone();
-
-                scope.spawn(move |_| {
-                    sender.send(Message::Start { path: path.clone() }).unwrap();
-
-                    match check_repo(&Args {
-                        files: vec![path.clone()],
-                        error_file: args.error_file.clone(),
-                        ..*args
-                    }) {
-                        Ok(result) => sender.send(Message::Finished { result, path }),
-                        Err(error) => sender.send(Message::Failed { error, path }),
-                    }
-                    .unwrap();
-                });
-            }
-        }
-
-        scope.spawn(|_| {
-            let mut stdout = stdout().lock();
-            let mut error_file = args.error_file.as_ref().map(|error_file| {
-                BufWriter::new(File::create(error_file).expect("Couldn't open error file"))
-            });
-
-            for message in receiver {
-                match message {
-                    Message::Start { path } => {
-                        writeln!(stdout, "Starting {}", path.display()).unwrap();
-                    }
-                    Message::Finished { path, result } => {
-                        total_errors += result.diagnostics.len();
-                        total_files += result.file_count;
-
-                        writeln!(
-                            stdout,
-                            "Finished {} with {} files in {:.2}s",
-                            path.display(),
-                            result.file_count,
-                            result.duration.as_secs_f32(),
-                        )
-                        .unwrap();
-                        write!(stdout, "{}", result.display(args.format)).unwrap();
-                        if let Some(error_file) = &mut error_file {
-                            write!(error_file, "{}", result.display(args.format)).unwrap();
-                        }
-                        all_success = all_success && result.is_success();
-                    }
-                    Message::Failed { path, error } => {
-                        writeln!(stdout, "Failed {}: {}", path.display(), error).unwrap();
-                        all_success = false;
-                    }
-                }
-            }
-        });
-    });
-
-    let duration = start.elapsed();
-
-    #[allow(clippy::print_stdout)]
-    {
-        println!(
-            "{total_errors} stability errors in {total_files} files in {}s",
-            duration.as_secs_f32()
-        );
-    }
-
-    all_success
-}
-
-/// Returns whether the check was successful
-fn check_repo(args: &Args) -> anyhow::Result<CheckRepoResult> {
-    let start = Instant::now();
-
-    // Find files to check (or in this case, format twice). Adapted from ruff_cli
-    // First argument is ignored
-    let dummy = PathBuf::from("check");
-    let check_args_input = iter::once(&dummy).chain(&args.files);
-    let check_args: CheckArgs = WrapperArgs::try_parse_from(check_args_input)?.check_args;
-    let (cli, overrides) = check_args.partition();
-    let mut pyproject_config = resolve(
-        cli.isolated,
-        cli.config.as_deref(),
-        &overrides,
-        cli.stdin_filename.as_deref(),
-    )?;
-    // We don't want to format pyproject.toml
-    pyproject_config.settings.lib.include = FilePatternSet::try_from_vec(vec![
-        FilePattern::Builtin("*.py"),
-        FilePattern::Builtin("*.pyi"),
-    ])
-    .unwrap();
-    let (paths, _resolver) = python_files_in_path(&cli.files, &pyproject_config, &overrides)?;
-
-    if paths.is_empty() {
-        bail!("no python files in {:?}", cli.files)
-    }
-
-    let mut formatted_counter = 0;
-    let errors: Vec<_> = paths
-        .into_iter()
-        .map(|dir_entry| {
-            // Doesn't make sense to recover here in this test script
-            dir_entry.expect("Iterating the files in the repository failed")
-        })
-        .filter(|dir_entry| {
-            // For some reason it does not filter in the beginning
-            dir_entry.file_name() != "pyproject.toml"
-        })
-        .map(|dir_entry| {
-            let file = dir_entry.path().to_path_buf();
-            formatted_counter += 1;
-            // Handle panics (mostly in `debug_assert!`)
-            let result = match catch_unwind(|| check_file(&file)) {
-                Ok(result) => result,
-                Err(panic) => {
-                    if let Some(message) = panic.downcast_ref::<String>() {
-                        Err(FormatterStabilityError::Panic {
-                            message: message.clone(),
-                        })
-                    } else if let Some(&message) = panic.downcast_ref::<&str>() {
-                        Err(FormatterStabilityError::Panic {
-                            message: message.to_string(),
-                        })
-                    } else {
-                        Err(FormatterStabilityError::Panic {
-                            // This should not happen, but it can
-                            message: "(Panic didn't set a string message)".to_string(),
-                        })
-                    }
-                }
-            };
-            (result, file)
-        })
-        // We only care about the errors
-        .filter_map(|(result, file)| match result {
-            Err(error) => Some(Diagnostic { file, error }),
-            Ok(()) => None,
-        })
-        .collect();
-
-    let duration = start.elapsed();
-
-    Ok(CheckRepoResult {
-        duration,
-        file_count: formatted_counter,
-        diagnostics: errors,
-    })
-}
-
-/// A compact diff that only shows a header and changes, but nothing unchanged. This makes viewing
-/// multiple errors easier.
-fn diff_show_only_changes(
-    writer: &mut Formatter,
-    formatted: &str,
-    reformatted: &str,
-) -> fmt::Result {
-    for changes in TextDiff::from_lines(formatted, reformatted)
-        .unified_diff()
-        .iter_hunks()
-    {
-        for (idx, change) in changes
-            .iter_changes()
-            .filter(|change| change.tag() != ChangeTag::Equal)
-            .enumerate()
-        {
-            if idx == 0 {
-                writeln!(writer, "{}", changes.header())?;
-            }
-            write!(writer, "{}", change.tag())?;
-            writer.write_str(change.value())?;
-        }
-    }
-    Ok(())
-}
-
-struct CheckRepoResult {
-    duration: Duration,
-    file_count: usize,
-    diagnostics: Vec<Diagnostic>,
-}
-
-impl CheckRepoResult {
-    fn display(&self, format: Format) -> DisplayCheckRepoResult {
-        DisplayCheckRepoResult {
-            result: self,
-            format,
-        }
-    }
-
-    fn is_success(&self) -> bool {
-        self.diagnostics.is_empty()
-    }
-}
-
-struct DisplayCheckRepoResult<'a> {
-    result: &'a CheckRepoResult,
-    format: Format,
-}
-
-impl Display for DisplayCheckRepoResult<'_> {
-    fn fmt(&self, f: &mut Formatter<'_>) -> fmt::Result {
-        for diagnostic in &self.result.diagnostics {
-            write!(f, "{}", diagnostic.display(self.format))?;
-        }
-        Ok(())
-    }
-}
-
-#[derive(Debug)]
-struct Diagnostic {
-    file: PathBuf,
-    error: FormatterStabilityError,
-}
-
-impl Diagnostic {
-    fn display(&self, format: Format) -> DisplayDiagnostic {
-        DisplayDiagnostic {
-            diagnostic: self,
-            format,
-        }
-    }
-}
-
-struct DisplayDiagnostic<'a> {
-    format: Format,
-    diagnostic: &'a Diagnostic,
-}
-
-impl Display for DisplayDiagnostic<'_> {
-    fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result {
-        let Diagnostic { file, error } = &self.diagnostic;
-
-        match error {
-            FormatterStabilityError::Unstable {
-                formatted,
-                reformatted,
-            } => {
-                writeln!(f, "Unstable formatting {}", file.display())?;
-                match self.format {
-                    Format::Minimal => {}
-                    Format::Default => {
-                        diff_show_only_changes(f, formatted, reformatted)?;
-                    }
-                    Format::Full => {
-                        let diff = TextDiff::from_lines(formatted.as_str(), reformatted.as_str())
-                            .unified_diff()
-                            .header("Formatted once", "Formatted twice")
-                            .to_string();
-                        writeln!(
-                            f,
-                            r#"Reformatting the formatted code a second time resulted in formatting changes.
---
-{diff}---
-
-Formatted once:
---
-{formatted}---
-
-Formatted twice:
---
-{reformatted}---\n"#,
-                        )?;
-                    }
-                }
-            }
-            FormatterStabilityError::InvalidSyntax { err, formatted } => {
-                writeln!(
-                    f,
-                    "Formatter generated invalid syntax {}: {}",
-                    file.display(),
-                    err
-                )?;
-                if self.format == Format::Full {
-                    writeln!(f, "---\n{formatted}\n---\n")?;
-                }
-            }
-            FormatterStabilityError::Panic { message } => {
-                writeln!(f, "Panic {}: {}", file.display(), message)?;
-            }
-            FormatterStabilityError::Other(err) => {
-                writeln!(f, "Uncategorized error {}: {}", file.display(), err)?;
-            }
-        }
-        Ok(())
-    }
-}
-
-#[derive(Debug)]
-enum FormatterStabilityError {
-    /// First and second pass of the formatter are different
-    Unstable {
-        formatted: String,
-        reformatted: String,
-    },
-    /// The formatter printed invalid code
-    InvalidSyntax {
-        err: anyhow::Error,
-        formatted: String,
-    },
-    /// From `catch_unwind`
-    Panic {
-        message: String,
-    },
-    Other(anyhow::Error),
-}
-
-impl From<anyhow::Error> for FormatterStabilityError {
-    fn from(error: anyhow::Error) -> Self {
-        Self::Other(error)
-    }
-}
-
-/// Run the formatter twice on the given file. Does not write back to the file
-fn check_file(input_path: &Path) -> Result<(), FormatterStabilityError> {
-    let content = fs::read_to_string(input_path).context("Failed to read file")?;
-    let printed = match format_module(&content, PyFormatOptions::default()) {
-        Ok(printed) => printed,
-        Err(err) => {
-            return if err
-                .to_string()
-                .starts_with("Source contains syntax errors ")
-            {
-                debug!(
-                    "Skipping {} with invalid first pass {}",
-                    input_path.display(),
-                    err
-                );
-                Ok(())
-            } else {
-                Err(err.into())
-            };
-        }
-    };
-    let formatted = printed.as_code();
-
-    let reformatted = match format_module(formatted, PyFormatOptions::default()) {
-        Ok(reformatted) => reformatted,
-        Err(err) => {
-            return Err(FormatterStabilityError::InvalidSyntax {
-                err,
-                formatted: formatted.to_string(),
-            });
-        }
-    };
-
-    if reformatted.as_code() != formatted {
-        return Err(FormatterStabilityError::Unstable {
-            formatted: formatted.to_string(),
-            reformatted: reformatted.into_code(),
-        });
-    }
-    Ok(())
-}
--- a/crates/ruff_dev/src/format_dev.rs
+++ b/crates/ruff_dev/src/format_dev.rs
@ -0,0 +1,628 @@
+use anyhow::{bail, Context};
+use clap::{CommandFactory, FromArgMatches};
+use ignore::DirEntry;
+use indicatif::ProgressBar;
+use rayon::iter::{IntoParallelIterator, ParallelIterator};
+use ruff::resolver::python_files_in_path;
+use ruff::settings::types::{FilePattern, FilePatternSet};
+use ruff_cli::args::CheckArgs;
+use ruff_cli::resolve::resolve;
+use ruff_formatter::{FormatError, PrintError};
+use ruff_python_formatter::{format_module, FormatModuleError, PyFormatOptions};
+use similar::{ChangeTag, TextDiff};
+use std::fmt::{Display, Formatter};
+use std::fs::File;
+use std::io::{BufWriter, Write};
+use std::ops::{Add, AddAssign};
+use std::panic::catch_unwind;
+use std::path::{Path, PathBuf};
+use std::process::ExitCode;
+use std::sync::mpsc::channel;
+use std::time::{Duration, Instant};
+use std::{fmt, fs, io};
+use tempfile::NamedTempFile;
+
+/// Find files that ruff would check so we can format them. Adapted from `ruff_cli`.
+fn ruff_check_paths(dirs: &[PathBuf]) -> anyhow::Result<Vec<Result<DirEntry, ignore::Error>>> {
+    let args_matches = CheckArgs::command()
+        .no_binary_name(true)
+        .get_matches_from(dirs);
+    let check_args: CheckArgs = CheckArgs::from_arg_matches(&args_matches)?;
+    let (cli, overrides) = check_args.partition();
+    let mut pyproject_config = resolve(
+        cli.isolated,
+        cli.config.as_deref(),
+        &overrides,
+        cli.stdin_filename.as_deref(),
+    )?;
+    // We don't want to format pyproject.toml
+    pyproject_config.settings.lib.include = FilePatternSet::try_from_vec(vec![
+        FilePattern::Builtin("*.py"),
+        FilePattern::Builtin("*.pyi"),
+    ])
+    .unwrap();
+    let (paths, _resolver) = python_files_in_path(&cli.files, &pyproject_config, &overrides)?;
+    if paths.is_empty() {
+        bail!("no python files in {:?}", dirs)
+    }
+    Ok(paths)
+}
+
+/// Collects statistics over the formatted files, currently only computes the Jaccard index
+///
+/// The [Jaccard index](https://en.wikipedia.org/wiki/Jaccard_index) can be defined as
+/// ```text
+/// J(A, B) = |A∩B| / (|A\B| + |B\A| + |A∩B|)
+/// ```
+/// where in our case `A` is the black formatted input, `B` is the ruff formatted output and the
+/// intersection are the lines in the diff that didn't change. We don't just track intersection and
+/// union so we can make statistics about size changes. If the input is not black formatted, this
+/// only becomes a measure for the changes made to the codebase during the initial formatting.
+#[derive(Default, Debug, Copy, Clone)]
+pub(crate) struct Statistics {
+    /// The size of `A\B`, the number of lines only in the input, which we assume to be black
+    /// formatted
+    black_input: u32,
+    /// The size of `B\A`, the number of lines only in the formatted output
+    ruff_output: u32,
+    /// The number of matching identical lines
+    intersection: u32,
+}
+
+impl Statistics {
+    pub(crate) fn from_versions(black: &str, ruff: &str) -> Self {
+        if black == ruff {
+            let intersection = u32::try_from(black.lines().count()).unwrap();
+            Self {
+                black_input: 0,
+                ruff_output: 0,
+                intersection,
+            }
+        } else {
+            let diff = TextDiff::from_lines(black, ruff);
+            let mut statistics = Self::default();
+            for change in diff.iter_all_changes() {
+                match change.tag() {
+                    ChangeTag::Delete => statistics.black_input += 1,
+                    ChangeTag::Insert => statistics.ruff_output += 1,
+                    ChangeTag::Equal => statistics.intersection += 1,
+                }
+            }
+            statistics
+        }
+    }
+
+    #[allow(clippy::cast_precision_loss)]
+    pub(crate) fn jaccard_index(&self) -> f32 {
+        self.intersection as f32 / (self.black_input + self.ruff_output + self.intersection) as f32
+    }
+}
+
+impl Add<Statistics> for Statistics {
+    type Output = Statistics;
+
+    fn add(self, rhs: Statistics) -> Self::Output {
+        Statistics {
+            black_input: self.black_input + rhs.black_input,
+            ruff_output: self.ruff_output + rhs.ruff_output,
+            intersection: self.intersection + rhs.intersection,
+        }
+    }
+}
+
+impl AddAssign<Statistics> for Statistics {
+    fn add_assign(&mut self, rhs: Statistics) {
+        *self = *self + rhs;
+    }
+}
+
+/// Control the verbosity of the output
+#[derive(Copy, Clone, PartialEq, Eq, clap::ValueEnum, Default)]
+pub(crate) enum Format {
+    /// Filenames only
+    Minimal,
+    /// Filenames and reduced diff
+    #[default]
+    Default,
+    /// Full diff and invalid code
+    Full,
+}
+
+#[allow(clippy::struct_excessive_bools)]
+#[derive(clap::Args)]
+pub(crate) struct Args {
+    /// Like `ruff check`'s files. See `--multi-project` if you want to format an ecosystem
+    /// checkout.
+    pub(crate) files: Vec<PathBuf>,
+    /// Check stability
+    ///
+    /// We want to ensure that once formatted content stays the same when formatted again, which is
+    /// known as formatter stability or formatter idempotency, and that the formatter prints
+    /// syntactically valid code. As our test cases cover only a limited amount of code, this allows
+    /// checking entire repositories.
+    #[arg(long)]
+    pub(crate) stability_check: bool,
+    /// Format the files. Without this flag, the python files are not modified
+    #[arg(long)]
+    pub(crate) write: bool,
+    /// Control the verbosity of the output
+    #[arg(long, default_value_t, value_enum)]
+    pub(crate) format: Format,
+    /// Print only the first error and exit, `-x` is same as pytest
+    #[arg(long, short = 'x')]
+    pub(crate) exit_first_error: bool,
+    /// Checks each project inside a directory, useful e.g. if you want to check all of the
+    /// ecosystem checkouts.
+    #[arg(long)]
+    pub(crate) multi_project: bool,
+    /// Write all errors to this file in addition to stdout. Only used in multi-project mode.
+    #[arg(long)]
+    pub(crate) error_file: Option<PathBuf>,
+}
+
+pub(crate) fn main(args: &Args) -> anyhow::Result<ExitCode> {
+    let all_success = if args.multi_project {
+        format_dev_multi_project(args)
+    } else {
+        let result = format_dev_project(&args.files, args.stability_check, args.write, true)?;
+
+        #[allow(clippy::print_stdout)]
+        {
+            print!("{}", result.display(args.format));
+            println!(
+                "Found {} stability errors in {} files (jaccard index {:.3}) in {:.2}s",
+                result
+                    .diagnostics
+                    .iter()
+                    .filter(|diagnostics| !diagnostics.error.is_success())
+                    .count(),
+                result.file_count,
+                result.statistics.jaccard_index(),
+                result.duration.as_secs_f32(),
+            );
+        }
+
+        !result.is_success()
+    };
+    if all_success {
+        Ok(ExitCode::SUCCESS)
+    } else {
+        Ok(ExitCode::FAILURE)
+    }
+}
+
+/// Each `path` is one of the `files` in `Args`
+enum Message {
+    Start {
+        path: PathBuf,
+    },
+    Failed {
+        path: PathBuf,
+        error: anyhow::Error,
+    },
+    Finished {
+        path: PathBuf,
+        result: CheckRepoResult,
+    },
+}
+
+/// Checks a directory of projects
+fn format_dev_multi_project(args: &Args) -> bool {
+    let mut all_success = true;
+    let mut total_errors = 0;
+    let mut total_files = 0;
+    let start = Instant::now();
+
+    rayon::scope(|scope| {
+        let (sender, receiver) = channel();
+
+        // Workers, to check is subdirectory in parallel
+        for base_dir in &args.files {
+            for dir in base_dir.read_dir().unwrap() {
+                let path = dir.unwrap().path().clone();
+
+                let sender = sender.clone();
+
+                scope.spawn(move |_| {
+                    sender.send(Message::Start { path: path.clone() }).unwrap();
+
+                    match format_dev_project(
+                        &[path.clone()],
+                        args.stability_check,
+                        args.write,
+                        false,
+                    ) {
+                        Ok(result) => sender.send(Message::Finished { result, path }),
+                        Err(error) => sender.send(Message::Failed { error, path }),
+                    }
+                    .unwrap();
+                });
+            }
+        }
+
+        // Main thread, writing to stdout
+        scope.spawn(|_| {
+            let mut error_file = args.error_file.as_ref().map(|error_file| {
+                BufWriter::new(File::create(error_file).expect("Couldn't open error file"))
+            });
+
+            let bar = ProgressBar::new(args.files.len() as u64);
+            for message in receiver {
+                match message {
+                    Message::Start { path } => {
+                        bar.println(path.display().to_string());
+                    }
+                    Message::Finished { path, result } => {
+                        total_errors += result.diagnostics.len();
+                        total_files += result.file_count;
+
+                        bar.println(format!(
+                            "Finished {} with {} files (jaccard index {:.3}) in {:.2}s",
+                            path.display(),
+                            result.file_count,
+                            result.statistics.jaccard_index(),
+                            result.duration.as_secs_f32(),
+                        ));
+                        bar.println(result.display(args.format).to_string().trim_end());
+                        if let Some(error_file) = &mut error_file {
+                            write!(error_file, "{}", result.display(args.format)).unwrap();
+                        }
+                        all_success = all_success && !result.is_success();
+                        bar.inc(1);
+                    }
+                    Message::Failed { path, error } => {
+                        bar.println(format!("Failed {}: {}", path.display(), error));
+                        all_success = false;
+                        bar.inc(1);
+                    }
+                }
+            }
+            bar.finish();
+        });
+    });
+
+    let duration = start.elapsed();
+
+    #[allow(clippy::print_stdout)]
+    {
+        println!(
+            "{total_errors} stability errors in {total_files} files in {}s",
+            duration.as_secs_f32()
+        );
+    }
+
+    all_success
+}
+
+fn format_dev_project(
+    files: &[PathBuf],
+    stability_check: bool,
+    write: bool,
+    progress_bar: bool,
+) -> anyhow::Result<CheckRepoResult> {
+    let start = Instant::now();
+
+    // Find files to check (or in this case, format twice). Adapted from ruff_cli
+    // First argument is ignored
+    let paths = ruff_check_paths(files)?;
+
+    let bar = progress_bar.then(|| ProgressBar::new(paths.len() as u64));
+    let result_iter = paths
+        .into_par_iter()
+        .map(|dir_entry| {
+            let dir_entry = match dir_entry.context("Iterating the files in the repository failed")
+            {
+                Ok(dir_entry) => dir_entry,
+                Err(err) => return Err(err),
+            };
+            let file = dir_entry.path().to_path_buf();
+            // For some reason it does not filter in the beginning
+            if dir_entry.file_name() == "pyproject.toml" {
+                return Ok((Ok(Statistics::default()), file));
+            }
+
+            let file = dir_entry.path().to_path_buf();
+            // Handle panics (mostly in `debug_assert!`)
+            let result = match catch_unwind(|| format_dev_file(&file, stability_check, write)) {
+                Ok(result) => result,
+                Err(panic) => {
+                    if let Some(message) = panic.downcast_ref::<String>() {
+                        Err(CheckFileError::Panic {
+                            message: message.clone(),
+                        })
+                    } else if let Some(&message) = panic.downcast_ref::<&str>() {
+                        Err(CheckFileError::Panic {
+                            message: message.to_string(),
+                        })
+                    } else {
+                        Err(CheckFileError::Panic {
+                            // This should not happen, but it can
+                            message: "(Panic didn't set a string message)".to_string(),
+                        })
+                    }
+                }
+            };
+            if let Some(bar) = &bar {
+                bar.inc(1);
+            }
+            Ok((result, file))
+        })
+        .collect::<anyhow::Result<Vec<_>>>()?;
+    if let Some(bar) = bar {
+        bar.finish();
+    }
+
+    let mut statistics = Statistics::default();
+    let mut formatted_counter = 0;
+    let mut diagnostics = Vec::new();
+    for (result, file) in result_iter {
+        formatted_counter += 1;
+        match result {
+            Ok(statistics_file) => statistics += statistics_file,
+            Err(error) => diagnostics.push(Diagnostic { file, error }),
+        }
+    }
+
+    let duration = start.elapsed();
+
+    Ok(CheckRepoResult {
+        duration,
+        file_count: formatted_counter,
+        diagnostics,
+        statistics,
+    })
+}
+
+/// A compact diff that only shows a header and changes, but nothing unchanged. This makes viewing
+/// multiple errors easier.
+fn diff_show_only_changes(
+    writer: &mut Formatter,
+    formatted: &str,
+    reformatted: &str,
+) -> fmt::Result {
+    for changes in TextDiff::from_lines(formatted, reformatted)
+        .unified_diff()
+        .iter_hunks()
+    {
+        for (idx, change) in changes
+            .iter_changes()
+            .filter(|change| change.tag() != ChangeTag::Equal)
+            .enumerate()
+        {
+            if idx == 0 {
+                writeln!(writer, "{}", changes.header())?;
+            }
+            write!(writer, "{}", change.tag())?;
+            writer.write_str(change.value())?;
+        }
+    }
+    Ok(())
+}
+
+struct CheckRepoResult {
+    duration: Duration,
+    file_count: usize,
+    diagnostics: Vec<Diagnostic>,
+    statistics: Statistics,
+}
+
+impl CheckRepoResult {
+    fn display(&self, format: Format) -> DisplayCheckRepoResult {
+        DisplayCheckRepoResult {
+            result: self,
+            format,
+        }
+    }
+
+    /// We also emit diagnostics if the input file was already invalid or the were io errors. This
+    /// method helps to differentiate
+    fn is_success(&self) -> bool {
+        self.diagnostics
+            .iter()
+            .all(|diagnostic| diagnostic.error.is_success())
+    }
+}
+
+struct DisplayCheckRepoResult<'a> {
+    result: &'a CheckRepoResult,
+    format: Format,
+}
+
+impl Display for DisplayCheckRepoResult<'_> {
+    fn fmt(&self, f: &mut Formatter<'_>) -> fmt::Result {
+        for diagnostic in &self.result.diagnostics {
+            write!(f, "{}", diagnostic.display(self.format))?;
+        }
+        Ok(())
+    }
+}
+
+#[derive(Debug)]
+struct Diagnostic {
+    file: PathBuf,
+    error: CheckFileError,
+}
+
+impl Diagnostic {
+    fn display(&self, format: Format) -> DisplayDiagnostic {
+        DisplayDiagnostic {
+            diagnostic: self,
+            format,
+        }
+    }
+}
+
+struct DisplayDiagnostic<'a> {
+    format: Format,
+    diagnostic: &'a Diagnostic,
+}
+
+impl Display for DisplayDiagnostic<'_> {
+    fn fmt(&self, f: &mut Formatter<'_>) -> fmt::Result {
+        let Diagnostic { file, error } = &self.diagnostic;
+
+        match error {
+            CheckFileError::Unstable {
+                formatted,
+                reformatted,
+            } => {
+                writeln!(f, "Unstable formatting {}", file.display())?;
+                match self.format {
+                    Format::Minimal => {}
+                    Format::Default => {
+                        diff_show_only_changes(f, formatted, reformatted)?;
+                    }
+                    Format::Full => {
+                        let diff = TextDiff::from_lines(formatted.as_str(), reformatted.as_str())
+                            .unified_diff()
+                            .header("Formatted once", "Formatted twice")
+                            .to_string();
+                        writeln!(
+                            f,
+                            r#"Reformatting the formatted code a second time resulted in formatting changes.
+---
+{diff}---
+
+Formatted once:
+---
+{formatted}---
+
+Formatted twice:
+---
+{reformatted}---\n"#,
+                        )?;
+                    }
+                }
+            }
+            CheckFileError::Panic { message } => {
+                writeln!(f, "Panic {}: {}", file.display(), message)?;
+            }
+            CheckFileError::SyntaxErrorInInput(error) => {
+                writeln!(f, "Syntax error in {}: {}", file.display(), error)?;
+            }
+            CheckFileError::SyntaxErrorInOutput { formatted, error } => {
+                writeln!(
+                    f,
+                    "Formatter generated invalid syntax {}: {}",
+                    file.display(),
+                    error
+                )?;
+                if self.format == Format::Full {
+                    writeln!(f, "---\n{formatted}\n---\n")?;
+                }
+            }
+            CheckFileError::FormatError(error) => {
+                writeln!(f, "Formatter error for {}: {}", file.display(), error)?;
+            }
+            CheckFileError::PrintError(error) => {
+                writeln!(f, "Printer error for {}: {}", file.display(), error)?;
+            }
+            CheckFileError::IoError(error) => {
+                writeln!(f, "Error reading {}: {}", file.display(), error)?;
+            }
+        }
+        Ok(())
+    }
+}
+
+#[derive(Debug)]
+enum CheckFileError {
+    /// First and second pass of the formatter are different
+    Unstable {
+        formatted: String,
+        reformatted: String,
+    },
+    /// The input file was already invalid (not a bug)
+    SyntaxErrorInInput(FormatModuleError),
+    /// The formatter introduced a syntax error
+    SyntaxErrorInOutput {
+        formatted: String,
+        error: FormatModuleError,
+    },
+    /// The formatter failed (bug)
+    FormatError(FormatError),
+    /// The printer failed (bug)
+    PrintError(PrintError),
+    /// Failed to read the file, this sometimes happens e.g. with strange filenames (not a bug)
+    IoError(io::Error),
+    /// From `catch_unwind`
+    Panic { message: String },
+}
+
+impl CheckFileError {
+    /// Returns `false` if this is a formatter bug or `true` is if it is something outside of ruff
+    fn is_success(&self) -> bool {
+        match self {
+            CheckFileError::SyntaxErrorInInput(_) | CheckFileError::IoError(_) => true,
+            CheckFileError::Unstable { .. }
+            | CheckFileError::SyntaxErrorInOutput { .. }
+            | CheckFileError::FormatError(_)
+            | CheckFileError::PrintError(_)
+            | CheckFileError::Panic { .. } => false,
+        }
+    }
+}
+
+impl From<io::Error> for CheckFileError {
+    fn from(value: io::Error) -> Self {
+        Self::IoError(value)
+    }
+}
+
+fn format_dev_file(
+    input_path: &Path,
+    stability_check: bool,
+    write: bool,
+) -> Result<Statistics, CheckFileError> {
+    let content = fs::read_to_string(input_path)?;
+    let printed = match format_module(&content, PyFormatOptions::default()) {
+        Ok(printed) => printed,
+        Err(err @ (FormatModuleError::LexError(_) | FormatModuleError::ParseError(_))) => {
+            return Err(CheckFileError::SyntaxErrorInInput(err));
+        }
+        Err(FormatModuleError::FormatError(err)) => {
+            return Err(CheckFileError::FormatError(err));
+        }
+        Err(FormatModuleError::PrintError(err)) => {
+            return Err(CheckFileError::PrintError(err));
+        }
+    };
+    let formatted = printed.as_code();
+
+    if write && content != formatted {
+        // Simple atomic write.
+        // The file is in a directory so it must have a parent. Surprisingly `DirEntry` doesn't
+        // give us access without unwrap
+        let mut file = NamedTempFile::new_in(input_path.parent().unwrap())?;
+        file.write_all(formatted.as_bytes())?;
+        // "If a file exists at the target path, persist will atomically replace it."
+        file.persist(input_path).map_err(|error| error.error)?;
+    }
+
+    if stability_check {
+        let reformatted = match format_module(formatted, PyFormatOptions::default()) {
+            Ok(reformatted) => reformatted,
+            Err(err @ (FormatModuleError::LexError(_) | FormatModuleError::ParseError(_))) => {
+                return Err(CheckFileError::SyntaxErrorInOutput {
+                    formatted: formatted.to_string(),
+                    error: err,
+                });
+            }
+            Err(FormatModuleError::FormatError(err)) => {
+                return Err(CheckFileError::FormatError(err));
+            }
+            Err(FormatModuleError::PrintError(err)) => {
+                return Err(CheckFileError::PrintError(err));
+            }
+        };
+
+        if reformatted.as_code() != formatted {
+            return Err(CheckFileError::Unstable {
+                formatted: formatted.to_string(),
+                reformatted: reformatted.into_code(),
+            });
+        }
+    }
+
+    Ok(Statistics::from_versions(&content, formatted))
+}
--- a/crates/ruff_dev/src/main.rs
+++ b/crates/ruff_dev/src/main.rs
@ -8,7 +8,7 @@ use ruff::logging::{set_up_logging, LogLevel};
 use ruff_cli::check;
 use std::process::ExitCode;

-mod check_formatter_stability;
+mod format_dev;
 mod generate_all;
 mod generate_cli_help;
 mod generate_docs;
@ -63,9 +63,15 @@ enum Command {
        #[clap(long)]
        repeat: usize,
    },
-    /// Format a repository twice and ensure that it looks that the first and second formatting
-    /// look the same. Same arguments as `ruff check`
-    CheckFormatterStability(check_formatter_stability::Args),
+    /// Several utils related to the formatter which can be run on one or more repositories. The
+    /// selected set of files in a repository is the same as for `ruff check`.
+    ///
+    /// * Check formatter stability: Format a repository twice and ensure that it looks that the
+    ///   first and second formatting look the same.
+    /// * Format: Format the files in a repository to be able to check them with `git diff`
+    /// * Statistics: The subcommand the Jaccard index between the (assumed to be black formatted)
+    ///   input and the ruff formatted output
+    FormatDev(format_dev::Args),
 }

 fn main() -> Result<ExitCode> {
@ -93,8 +99,8 @@ fn main() -> Result<ExitCode> {
                check(args.clone(), log_level)?;
            }
        }
-        Command::CheckFormatterStability(args) => {
-            let exit_code = check_formatter_stability::main(&args)?;
+        Command::FormatDev(args) => {
+            let exit_code = format_dev::main(&args)?;
            return Ok(exit_code);
        }
    }
--- a/crates/ruff_python_formatter/Cargo.toml
+++ b/crates/ruff_python_formatter/Cargo.toml
@ -27,6 +27,7 @@ rustc-hash = { workspace = true }
 rustpython-parser = { workspace = true }
 serde = { workspace = true, optional = true }
 smallvec = { workspace = true }
+thiserror = { workspace = true }

 [dev-dependencies]
 ruff_formatter = { path = "../ruff_formatter", features = ["serde"]}
--- a/crates/ruff_python_formatter/src/lib.rs
+++ b/crates/ruff_python_formatter/src/lib.rs
@ -3,17 +3,23 @@ use crate::comments::{
 };
 use crate::context::PyFormatContext;
 pub use crate::options::{MagicTrailingComma, PyFormatOptions, QuoteStyle};
-use anyhow::{anyhow, Context, Result};
-use ruff_formatter::prelude::*;
-use ruff_formatter::{format, write};
+use ruff_formatter::format_element::tag;
+use ruff_formatter::prelude::{
+    dynamic_text, source_position, source_text_slice, text, ContainsNewlines, Formatter, Tag,
+};
+use ruff_formatter::{
+    format, normalize_newlines, write, Buffer, Format, FormatElement, FormatError, FormatResult,
+    PrintError,
+};
 use ruff_formatter::{Formatted, Printed, SourceCode};
 use ruff_python_ast::node::{AnyNodeRef, AstNode, NodeKind};
 use ruff_python_ast::source_code::{CommentRanges, CommentRangesBuilder, Locator};
 use ruff_text_size::{TextLen, TextRange};
 use rustpython_parser::ast::{Mod, Ranged};
-use rustpython_parser::lexer::lex;
-use rustpython_parser::{parse_tokens, Mode};
+use rustpython_parser::lexer::{lex, LexicalError};
+use rustpython_parser::{parse_tokens, Mode, ParseError};
 use std::borrow::Cow;
+use thiserror::Error;

 pub(crate) mod builders;
 pub mod cli;
@ -84,16 +90,40 @@ where
    }
 }

-pub fn format_module(contents: &str, options: PyFormatOptions) -> Result<Printed> {
+#[derive(Error, Debug)]
+pub enum FormatModuleError {
+    #[error("source contains syntax errors (lexer error): {0:?}")]
+    LexError(LexicalError),
+    #[error("source contains syntax errors (parser error): {0:?}")]
+    ParseError(ParseError),
+    #[error(transparent)]
+    FormatError(#[from] FormatError),
+    #[error(transparent)]
+    PrintError(#[from] PrintError),
+}
+
+impl From<LexicalError> for FormatModuleError {
+    fn from(value: LexicalError) -> Self {
+        Self::LexError(value)
+    }
+}
+
+impl From<ParseError> for FormatModuleError {
+    fn from(value: ParseError) -> Self {
+        Self::ParseError(value)
+    }
+}
+
+pub fn format_module(
+    contents: &str,
+    options: PyFormatOptions,
+) -> Result<Printed, FormatModuleError> {
    // Tokenize once
    let mut tokens = Vec::new();
    let mut comment_ranges = CommentRangesBuilder::default();

    for result in lex(contents, Mode::Module) {
-        let (token, range) = match result {
-            Ok((token, range)) => (token, range),
-            Err(err) => return Err(anyhow!("Source contains syntax errors {err:?}")),
-        };
+        let (token, range) = result?;

        comment_ranges.visit_token(&token, range);
        tokens.push(Ok((token, range)));
@ -102,14 +132,11 @@ pub fn format_module(contents: &str, options: PyFormatOptions) -> Result<Printed
    let comment_ranges = comment_ranges.finish();

    // Parse the AST.
-    let python_ast = parse_tokens(tokens, Mode::Module, "<filename>")
-        .with_context(|| "Syntax error in input")?;
+    let python_ast = parse_tokens(tokens, Mode::Module, "<filename>")?;

    let formatted = format_node(&python_ast, &comment_ranges, contents, options)?;

-    formatted
-        .print()
-        .with_context(|| "Failed to print the formatter IR")
+    Ok(formatted.print()?)
 }

 pub fn format_node<'a>(