Commit 364f51bd by Russell Belfer

Merge pull request #668 from nulltoken/topic/binary-blobs

Enhancing the blob diffing experience
parents 1f796cd1 d1c4312a
......@@ -337,12 +337,21 @@ GIT_EXTERN(int) git_diff_print_patch(
/**
* Directly run a text diff on two blobs.
*
* Compared to a file, a blob lacks some contextual information. As such, the
* `git_diff_file` parameters of the callbacks will be filled in as follows:
* `mode` will be set to 0 and `path` will be set to NULL. When dealing with a
* NULL blob, `oid` will be set to 0.
*
* When at least one of the blobs being dealt with is binary, the `git_diff_delta`
* binary attribute will be set to 1 and neither hunk_cb nor line_cb will be called.
*
* When both blobs have the same oid (including the case where both are NULL),
* the delta status is GIT_DELTA_UNMODIFIED and neither hunk_cb nor line_cb is
* called.
*
* @param old_blob Blob for the old side of the diff, or NULL for no content
* @param new_blob Blob for the new side of the diff, or NULL for no content
* @param options Diff options, or NULL; if GIT_DIFF_REVERSE is set in `flags`,
*                the old and new sides are swapped
* @param cb_data Opaque pointer handed to the callbacks
* @param file_cb Callback invoked once with the delta; may be NULL
* @param hunk_cb Callback for each hunk
* @param line_cb Callback for each line
* @return 0 on success, or a negative value on error (a negative value
*         returned by file_cb is passed back to the caller)
*/
GIT_EXTERN(int) git_diff_blobs(
git_blob *old_blob,
git_blob *new_blob,
git_diff_options *options,
void *cb_data,
git_diff_file_fn file_cb,
git_diff_hunk_fn hunk_cb,
git_diff_data_fn line_cb);
......
......@@ -169,7 +169,6 @@ static int file_is_binary_by_attr(
}
static int file_is_binary_by_content(
git_diff_list *diff,
git_diff_delta *delta,
git_map *old_data,
git_map *new_data)
......@@ -177,8 +176,6 @@ static int file_is_binary_by_content(
git_buf search;
git_text_stats stats;
GIT_UNUSED(diff);
if ((delta->old_file.flags & BINARY_DIFF_FLAGS) == 0) {
search.ptr = old_data->data;
search.size = min(old_data->len, 4000);
......@@ -301,6 +298,16 @@ static void release_content(git_diff_file *file, git_map *map, git_blob *blob)
}
}
/*
 * Make `dst` describe the same buffer as `src`: the data pointer and the
 * length are copied, the bytes themselves are not. On GIT_WIN32 builds the
 * `fmh` member of the map is additionally reset to NULL.
 */
static void fill_map_from_mmfile(git_map *dst, mmfile_t *src)
{
	assert(dst && src);

#ifdef GIT_WIN32
	dst->fmh = NULL;
#endif
	dst->len = src->size;
	dst->data = src->ptr;
}
int git_diff_foreach(
git_diff_list *diff,
void *data,
......@@ -408,7 +415,7 @@ int git_diff_foreach(
*/
if (delta->binary == -1) {
error = file_is_binary_by_content(
diff, delta, &old_data, &new_data);
delta, &old_data, &new_data);
if (error < 0)
goto cleanup;
}
......@@ -689,55 +696,83 @@ int git_diff_print_patch(
return error;
}
int git_diff_blobs(
git_blob *old_blob,
git_blob *new_blob,
git_diff_options *options,
void *cb_data,
git_diff_file_fn file_cb,
git_diff_hunk_fn hunk_cb,
git_diff_data_fn line_cb)
{
diff_output_info info;
git_diff_delta delta;
mmfile_t old_data, new_data;
git_map old_map, new_map;
xpparam_t xdiff_params;
xdemitconf_t xdiff_config;
xdemitcb_t xdiff_callback;
git_blob *new, *old;
memset(&delta, 0, sizeof(delta));
new = new_blob;
old = old_blob;
if (options && (options->flags & GIT_DIFF_REVERSE)) {
git_blob *swap = old_blob;
old_blob = new_blob;
new_blob = swap;
git_blob *swap = old;
old = new;
new = swap;
}
if (old_blob) {
old_data.ptr = (char *)git_blob_rawcontent(old_blob);
old_data.size = git_blob_rawsize(old_blob);
if (old) {
old_data.ptr = (char *)git_blob_rawcontent(old);
old_data.size = git_blob_rawsize(old);
git_oid_cpy(&delta.old_file.oid, git_object_id((const git_object *)old));
} else {
old_data.ptr = "";
old_data.size = 0;
}
if (new_blob) {
new_data.ptr = (char *)git_blob_rawcontent(new_blob);
new_data.size = git_blob_rawsize(new_blob);
if (new) {
new_data.ptr = (char *)git_blob_rawcontent(new);
new_data.size = git_blob_rawsize(new);
git_oid_cpy(&delta.new_file.oid, git_object_id((const git_object *)new));
} else {
new_data.ptr = "";
new_data.size = 0;
}
/* populate a "fake" delta record */
delta.status = old_data.ptr ?
(new_data.ptr ? GIT_DELTA_MODIFIED : GIT_DELTA_DELETED) :
(new_data.ptr ? GIT_DELTA_ADDED : GIT_DELTA_UNTRACKED);
delta.old_file.mode = 0100644; /* can't know the truth from a blob alone */
delta.new_file.mode = 0100644;
git_oid_cpy(&delta.old_file.oid, git_object_id((const git_object *)old_blob));
git_oid_cpy(&delta.new_file.oid, git_object_id((const git_object *)new_blob));
delta.old_file.path = NULL;
delta.new_file.path = NULL;
delta.similarity = 0;
delta.status = new ?
(old ? GIT_DELTA_MODIFIED : GIT_DELTA_ADDED) :
(old ? GIT_DELTA_DELETED : GIT_DELTA_UNTRACKED);
if (git_oid_cmp(&delta.new_file.oid, &delta.old_file.oid) == 0)
delta.status = GIT_DELTA_UNMODIFIED;
delta.old_file.size = old_data.size;
delta.new_file.size = new_data.size;
fill_map_from_mmfile(&old_map, &old_data);
fill_map_from_mmfile(&new_map, &new_data);
if (file_is_binary_by_content(&delta, &old_map, &new_map) < 0)
return -1;
if (file_cb != NULL) {
int error = file_cb(cb_data, &delta, 1);
if (error < 0)
return error;
}
/* don't do hunk and line diffs if the two blobs are identical */
if (delta.status == GIT_DELTA_UNMODIFIED)
return 0;
/* don't do hunk and line diffs if file is binary */
if (delta.binary == 1)
return 0;
info.diff = NULL;
info.delta = &delta;
......
......@@ -2,23 +2,43 @@
#include "diff_helpers.h"
static git_repository *g_repo = NULL;
static diff_expects exp;
static git_diff_options opts;
static git_blob *d, *alien;
/*
 * Fixture setup shared by the blob diff tests (presumably run by the test
 * harness before each test -- confirm against the clar runner).
 *
 * Opens the "attr" sandbox repository, resets the shared `opts` and `exp`
 * globals, and looks up the two blobs (`d` and `alien`) that several tests
 * reuse. Both blobs are released in test_diff_blob__cleanup().
 */
void test_diff_blob__initialize(void)
{
git_oid oid;
g_repo = cl_git_sandbox_init("attr");
/* start from zeroed options, then ask for one line of context around and
 * between hunks */
memset(&opts, 0, sizeof(opts));
opts.context_lines = 1;
opts.interhunk_lines = 1;
/* zero every counter so each test starts with clean expectations */
memset(&exp, 0, sizeof(exp));
/* tests/resources/attr/root_test4.txt */
cl_git_pass(git_oid_fromstrn(&oid, "fe773770c5a6", 12));
cl_git_pass(git_blob_lookup_prefix(&d, g_repo, &oid, 6));
/* alien.png */
cl_git_pass(git_oid_fromstrn(&oid, "edf3dcee", 8));
cl_git_pass(git_blob_lookup_prefix(&alien, g_repo, &oid, 4));
}
/*
 * Fixture teardown: frees the shared `d` and `alien` blobs and then cleans up
 * the sandbox.
 */
void test_diff_blob__cleanup(void)
{
git_blob_free(d);
git_blob_free(alien);
cl_git_sandbox_cleanup();
}
void test_diff_blob__0(void)
void test_diff_blob__can_compare_text_blobs(void)
{
git_blob *a, *b, *c, *d;
git_oid a_oid, b_oid, c_oid, d_oid;
git_diff_options opts = {0};
diff_expects exp;
git_blob *a, *b, *c;
git_oid a_oid, b_oid, c_oid;
/* tests/resources/attr/root_test1 */
cl_git_pass(git_oid_fromstrn(&a_oid, "45141a79", 8));
......@@ -32,18 +52,14 @@ void test_diff_blob__0(void)
cl_git_pass(git_oid_fromstrn(&c_oid, "c96bbb2c2557a832", 16));
cl_git_pass(git_blob_lookup_prefix(&c, g_repo, &c_oid, 8));
/* tests/resources/attr/root_test4.txt */
cl_git_pass(git_oid_fromstrn(&d_oid, "fe773770c5a6", 12));
cl_git_pass(git_blob_lookup_prefix(&d, g_repo, &d_oid, 6));
/* Doing the equivalent of a `git diff -U1` on these files */
opts.context_lines = 1;
opts.interhunk_lines = 1;
memset(&exp, 0, sizeof(exp));
cl_git_pass(git_diff_blobs(
a, b, &opts, &exp, diff_hunk_fn, diff_line_fn));
a, b, &opts, &exp, diff_file_fn, diff_hunk_fn, diff_line_fn));
cl_assert(exp.files == 1);
cl_assert(exp.file_mods == 1);
cl_assert(exp.at_least_one_of_them_is_binary == false);
cl_assert(exp.hunks == 1);
cl_assert(exp.lines == 6);
......@@ -53,7 +69,11 @@ void test_diff_blob__0(void)
memset(&exp, 0, sizeof(exp));
cl_git_pass(git_diff_blobs(
b, c, &opts, &exp, diff_hunk_fn, diff_line_fn));
b, c, &opts, &exp, diff_file_fn, diff_hunk_fn, diff_line_fn));
cl_assert(exp.files == 1);
cl_assert(exp.file_mods == 1);
cl_assert(exp.at_least_one_of_them_is_binary == false);
cl_assert(exp.hunks == 1);
cl_assert(exp.lines == 15);
......@@ -63,7 +83,11 @@ void test_diff_blob__0(void)
memset(&exp, 0, sizeof(exp));
cl_git_pass(git_diff_blobs(
a, c, &opts, &exp, diff_hunk_fn, diff_line_fn));
a, c, &opts, &exp, diff_file_fn, diff_hunk_fn, diff_line_fn));
cl_assert(exp.files == 1);
cl_assert(exp.file_mods == 1);
cl_assert(exp.at_least_one_of_them_is_binary == false);
cl_assert(exp.hunks == 1);
cl_assert(exp.lines == 13);
......@@ -75,7 +99,11 @@ void test_diff_blob__0(void)
memset(&exp, 0, sizeof(exp));
cl_git_pass(git_diff_blobs(
c, d, &opts, &exp, diff_hunk_fn, diff_line_fn));
c, d, &opts, &exp, diff_file_fn, diff_hunk_fn, diff_line_fn));
cl_assert(exp.files == 1);
cl_assert(exp.file_mods == 1);
cl_assert(exp.at_least_one_of_them_is_binary == false);
cl_assert(exp.hunks == 2);
cl_assert(exp.lines == 14);
......@@ -86,6 +114,141 @@ void test_diff_blob__0(void)
git_blob_free(a);
git_blob_free(b);
git_blob_free(c);
git_blob_free(d);
}
/*
 * Diffing a blob against a NULL blob must be reported as a deletion (blob on
 * the old side) or an addition (blob on the new side). Text blobs produce
 * hunks and lines; binary blobs only trigger the file callback.
 *
 * Relies on the shared `opts`, `exp`, `d` and `alien` globals.
 */
void test_diff_blob__can_compare_against_null_blobs(void)
{
	git_blob *e = NULL;

	/* text blob -> nothing: one deleted file, all 14 lines removed */
	cl_git_pass(git_diff_blobs(
		d, e, &opts, &exp, diff_file_fn, diff_hunk_fn, diff_line_fn));

	cl_assert(exp.files == 1);
	cl_assert(exp.file_dels == 1);
	cl_assert(exp.at_least_one_of_them_is_binary == false);

	cl_assert(exp.hunks == 1);
	cl_assert(exp.hunk_old_lines == 14);
	cl_assert(exp.lines == 14);
	cl_assert(exp.line_dels == 14);

	/* same arguments with the sides reversed: reported as an addition */
	opts.flags |= GIT_DIFF_REVERSE;
	memset(&exp, 0, sizeof(exp));

	cl_git_pass(git_diff_blobs(
		d, e, &opts, &exp, diff_file_fn, diff_hunk_fn, diff_line_fn));

	cl_assert(exp.files == 1);
	cl_assert(exp.file_adds == 1);
	cl_assert(exp.at_least_one_of_them_is_binary == false);

	cl_assert(exp.hunks == 1);
	cl_assert(exp.hunk_new_lines == 14);
	cl_assert(exp.lines == 14);
	cl_assert(exp.line_adds == 14);

	/*
	 * Clear (rather than toggle) the reverse flag so the remaining checks
	 * run in the normal direction regardless of the flag's earlier state.
	 */
	opts.flags &= ~GIT_DIFF_REVERSE;
	memset(&exp, 0, sizeof(exp));

	/* binary blob -> nothing: deletion, no hunk or line callbacks */
	cl_git_pass(git_diff_blobs(
		alien, NULL, &opts, &exp, diff_file_fn, diff_hunk_fn, diff_line_fn));

	cl_assert(exp.at_least_one_of_them_is_binary == true);

	cl_assert(exp.files == 1);
	cl_assert(exp.file_dels == 1);
	cl_assert(exp.hunks == 0);
	cl_assert(exp.lines == 0);

	memset(&exp, 0, sizeof(exp));

	/* nothing -> binary blob: addition, no hunk or line callbacks */
	cl_git_pass(git_diff_blobs(
		NULL, alien, &opts, &exp, diff_file_fn, diff_hunk_fn, diff_line_fn));

	cl_assert(exp.at_least_one_of_them_is_binary == true);

	cl_assert(exp.files == 1);
	cl_assert(exp.file_adds == 1);
	cl_assert(exp.hunks == 0);
	cl_assert(exp.lines == 0);
}
/*
 * Shared expectations for a diff of two identical blobs: exactly one file
 * callback, counted as unmodified, and no hunk or line callbacks.
 *
 * @param exp Counters collected by the diff callbacks (passed by value)
 */
void assert_identical_blobs_comparison(diff_expects exp)
{
cl_assert(exp.files == 1);
cl_assert(exp.file_unmodified == 1);
cl_assert(exp.hunks == 0);
cl_assert(exp.lines == 0);
}
/*
 * Diffing a blob against itself must report a single unmodified file with no
 * hunks or lines. Covers a text blob, two NULL blobs, and a binary blob; the
 * binary flag is expected only in the last case.
 */
void test_diff_blob__can_compare_identical_blobs(void)
{
/* text blob against itself */
cl_git_pass(git_diff_blobs(
d, d, &opts, &exp, diff_file_fn, diff_hunk_fn, diff_line_fn));
cl_assert(exp.at_least_one_of_them_is_binary == false);
assert_identical_blobs_comparison(exp);
memset(&exp, 0, sizeof(exp));
/* no blob on either side */
cl_git_pass(git_diff_blobs(
NULL, NULL, &opts, &exp, diff_file_fn, diff_hunk_fn, diff_line_fn));
cl_assert(exp.at_least_one_of_them_is_binary == false);
assert_identical_blobs_comparison(exp);
memset(&exp, 0, sizeof(exp));
/* binary blob against itself */
cl_git_pass(git_diff_blobs(
alien, alien, &opts, &exp, diff_file_fn, diff_hunk_fn, diff_line_fn));
cl_assert(exp.at_least_one_of_them_is_binary == true);
assert_identical_blobs_comparison(exp);
}
/*
 * Shared expectations for a diff where at least one side is binary and the
 * blobs differ: the binary flag is set, exactly one file callback is counted
 * as modified, and no hunk or line callbacks are made.
 *
 * @param exp Counters collected by the diff callbacks (passed by value)
 */
void assert_binary_blobs_comparison(diff_expects exp)
{
cl_assert(exp.at_least_one_of_them_is_binary == true);
cl_assert(exp.files == 1);
cl_assert(exp.file_mods == 1);
cl_assert(exp.hunks == 0);
cl_assert(exp.lines == 0);
}
/*
 * Diffing two different binary blobs, in either order, must yield a modified
 * binary delta without any hunk or line callbacks.
 */
void test_diff_blob__can_compare_two_binary_blobs(void)
{
git_blob *heart;
git_oid h_oid;
/* heart.png */
cl_git_pass(git_oid_fromstrn(&h_oid, "de863bff", 8));
cl_git_pass(git_blob_lookup_prefix(&heart, g_repo, &h_oid, 4));
cl_git_pass(git_diff_blobs(
alien, heart, &opts, &exp, diff_file_fn, diff_hunk_fn, diff_line_fn));
assert_binary_blobs_comparison(exp);
memset(&exp, 0, sizeof(exp));
/* same pair with old and new swapped */
cl_git_pass(git_diff_blobs(
heart, alien, &opts, &exp, diff_file_fn, diff_hunk_fn, diff_line_fn));
assert_binary_blobs_comparison(exp);
/* heart is local to this test; d and alien are freed by the cleanup hook */
git_blob_free(heart);
}
/*
 * A diff between a binary blob and a text blob, in either order, must be
 * treated as binary: a modified delta with no hunk or line callbacks.
 */
void test_diff_blob__can_compare_a_binary_blob_and_a_text_blob(void)
{
cl_git_pass(git_diff_blobs(
alien, d, &opts, &exp, diff_file_fn, diff_hunk_fn, diff_line_fn));
assert_binary_blobs_comparison(exp);
memset(&exp, 0, sizeof(exp));
/* same pair with old and new swapped */
cl_git_pass(git_diff_blobs(
d, alien, &opts, &exp, diff_file_fn, diff_hunk_fn, diff_line_fn));
assert_binary_blobs_comparison(exp);
}
......@@ -30,6 +30,8 @@ int diff_file_fn(
GIT_UNUSED(progress);
e-> at_least_one_of_them_is_binary = delta->binary;
e->files++;
switch (delta->status) {
case GIT_DELTA_ADDED: e->file_adds++; break;
......@@ -37,6 +39,7 @@ int diff_file_fn(
case GIT_DELTA_MODIFIED: e->file_mods++; break;
case GIT_DELTA_IGNORED: e->file_ignored++; break;
case GIT_DELTA_UNTRACKED: e->file_untracked++; break;
case GIT_DELTA_UNMODIFIED: e->file_unmodified++; break;
default: break;
}
return 0;
......
......@@ -11,6 +11,7 @@ typedef struct {
int file_mods;
int file_ignored;
int file_untracked;
int file_unmodified;
int hunks;
int hunk_new_lines;
......@@ -20,6 +21,8 @@ typedef struct {
int line_ctxt;
int line_adds;
int line_dels;
bool at_least_one_of_them_is_binary;
} diff_expects;
extern int diff_file_fn(
......
......@@ -113,16 +113,16 @@ void test_diff_tree__options(void)
*/
diff_expects test_expects[] = {
/* a vs b tests */
{ 5, 3, 0, 2, 0, 0, 4, 0, 0, 51, 2, 46, 3 },
{ 5, 3, 0, 2, 0, 0, 4, 0, 0, 53, 4, 46, 3 },
{ 5, 0, 3, 2, 0, 0, 4, 0, 0, 52, 3, 3, 46 },
{ 5, 3, 0, 2, 0, 0, 5, 0, 0, 54, 3, 48, 3 },
{ 5, 3, 0, 2, 0, 0, 0, 4, 0, 0, 51, 2, 46, 3 },
{ 5, 3, 0, 2, 0, 0, 0, 4, 0, 0, 53, 4, 46, 3 },
{ 5, 0, 3, 2, 0, 0, 0, 4, 0, 0, 52, 3, 3, 46 },
{ 5, 3, 0, 2, 0, 0, 0, 5, 0, 0, 54, 3, 48, 3 },
/* c vs d tests */
{ 1, 0, 0, 1, 0, 0, 1, 0, 0, 22, 9, 10, 3 },
{ 1, 0, 0, 1, 0, 0, 1, 0, 0, 19, 12, 7, 0 },
{ 1, 0, 0, 1, 0, 0, 1, 0, 0, 20, 11, 8, 1 },
{ 1, 0, 0, 1, 0, 0, 1, 0, 0, 20, 11, 8, 1 },
{ 1, 0, 0, 1, 0, 0, 1, 0, 0, 18, 11, 0, 7 },
{ 1, 0, 0, 1, 0, 0, 0, 1, 0, 0, 22, 9, 10, 3 },
{ 1, 0, 0, 1, 0, 0, 0, 1, 0, 0, 19, 12, 7, 0 },
{ 1, 0, 0, 1, 0, 0, 0, 1, 0, 0, 20, 11, 8, 1 },
{ 1, 0, 0, 1, 0, 0, 0, 1, 0, 0, 20, 11, 8, 1 },
{ 1, 0, 0, 1, 0, 0, 0, 1, 0, 0, 18, 11, 0, 7 },
{ 0 },
};
diff_expects *expected;
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment