diff: inline hunk processing in get_diff_stat()

This is simpler and more efficient. If we add word-diff to unified_diff_hunks(), it will do more expensive work that isn't needed here.
2025-02-05 19:14:43 +00:00 · 2024-06-29 00:39:02 +09:00 · 2024-06-29 00:39:02 +09:00 · 0ca8502c5a
commit 0ca8502c5a
parent 1b658ea80e
1 changed files with 11 additions and 7 deletions
--- a/cli/src/diff_util.rs
+++ b/cli/src/diff_util.rs
@ -995,15 +995,19 @@ fn get_diff_stat(
    // TODO: this matches git's behavior, which is to count the number of newlines
    // in the file. but that behavior seems unhelpful; no one really cares how
    // many `0xa0` characters are in an image.
-    let hunks = unified_diff_hunks(&left_content.contents, &right_content.contents, 0);
+    let diff = Diff::for_tokenizer(
+        &[&left_content.contents, &right_content.contents],
+        diff::find_line_ranges,
+    );
    let mut added = 0;
    let mut removed = 0;
-    for hunk in hunks {
-        for (line_type, _content) in hunk.lines {
-            match line_type {
-                DiffLineType::Context => {}
-                DiffLineType::Removed => removed += 1,
-                DiffLineType::Added => added += 1,
+    for hunk in diff.hunks() {
+        match hunk {
+            DiffHunk::Matching(_) => {}
+            DiffHunk::Different(contents) => {
+                let [left, right] = contents.try_into().unwrap();
+                removed += left.split_inclusive(|b| *b == b'\n').count();
+                added += right.split_inclusive(|b| *b == b'\n').count();
            }
        }
    }