Code

diff: fix handling of binary rewrite diffs
authorJeff King <peff@peff.net>
Tue, 9 Dec 2008 08:12:28 +0000 (03:12 -0500)
committerJunio C Hamano <gitster@pobox.com>
Wed, 10 Dec 2008 06:14:25 +0000 (22:14 -0800)
The current emit_rewrite_diff code always writes a text patch without
checking whether the content is binary. This means that if you end up with
a rewrite diff for a binary file, you get lots of raw binary goo in your
patch.

Instead, if we have binary files, then let's just skip emit_rewrite_diff
altogether. We will already have shown the "dissimilarity index" line, so
it is really about the diff contents. If binary diffs are turned off, the
"Binary files a/file and b/file differ" message should be the same in
either case. If we do have binary patches turned on, there isn't much
point in making a less-efficient binary patch that does a total rewrite;
no human is going to read it, and since binary patches don't apply with
any fuzz anyway, the result of application should be the same.

Signed-off-by: Jeff King <peff@peff.net>
Signed-off-by: Junio C Hamano <gitster@pobox.com>
diff.c
t/t4031-diff-rewrite-binary.sh [new file with mode: 0755]

diff --git a/diff.c b/diff.c
index e21af3b7ee0d5a0871f76dcbb1acced2345c6ea8..50277b82b2289395fd11a3d5b4d63cf45f825a51 100644 (file)
--- a/diff.c
+++ b/diff.c
@@ -1376,7 +1376,9 @@ static void builtin_diff(const char *name_a,
                 */
                if ((one->mode ^ two->mode) & S_IFMT)
                        goto free_ab_and_return;
-               if (complete_rewrite) {
+               if (complete_rewrite &&
+                   !diff_filespec_is_binary(one) &&
+                   !diff_filespec_is_binary(two)) {
                        emit_rewrite_diff(name_a, name_b, one, two, o);
                        o->found_changes = 1;
                        goto free_ab_and_return;
diff --git a/t/t4031-diff-rewrite-binary.sh b/t/t4031-diff-rewrite-binary.sh
new file mode 100755 (executable)
index 0000000..e16c355
--- /dev/null
@@ -0,0 +1,45 @@
+#!/bin/sh
+
+test_description='rewrite diff on binary file'
+
+. ./test-lib.sh
+
+# We must be large enough to meet the MINIMUM_BREAK_SIZE
+# requirement.
+make_file() {
+       for i in 1 2 3 4 5 6 7 8 9 10
+       do
+               for j in 1 2 3 4 5 6 7 8 9
+               do
+                       for k in 1 2 3 4 5
+                       do
+                               printf "$1\n"
+                       done
+               done
+       done >file
+}
+
+test_expect_success 'create binary file with changes' '
+       make_file "\\0" &&
+       git add file &&
+       make_file "\\01"
+'
+
+test_expect_success 'vanilla diff is binary' '
+       git diff >diff &&
+       grep "Binary files a/file and b/file differ" diff
+'
+
+test_expect_success 'rewrite diff is binary' '
+       git diff -B >diff &&
+       grep "dissimilarity index" diff &&
+       grep "Binary files a/file and b/file differ" diff
+'
+
+test_expect_success 'rewrite diff can show binary patch' '
+       git diff -B --binary >diff &&
+       grep "dissimilarity index" diff &&
+       grep "GIT binary patch" diff
+'
+
+test_done