Commit 368a2b4e by Vicent Martí

Merge pull request #1204 from arrbee/diff-blob-to-buffer

Have diff blob to buffer share code (and add tests)
parents 7dfc5c3c f2b7f7a6
...@@ -91,7 +91,7 @@ GIT_INLINE(const git_oid *) git_blob_id(const git_blob *blob) ...@@ -91,7 +91,7 @@ GIT_INLINE(const git_oid *) git_blob_id(const git_blob *blob)
* @param blob pointer to the blob * @param blob pointer to the blob
* @return the pointer; NULL if the blob has no contents * @return the pointer; NULL if the blob has no contents
*/ */
GIT_EXTERN(const void *) git_blob_rawcontent(git_blob *blob); GIT_EXTERN(const void *) git_blob_rawcontent(const git_blob *blob);
/** /**
* Get the size in bytes of the contents of a blob * Get the size in bytes of the contents of a blob
...@@ -99,7 +99,7 @@ GIT_EXTERN(const void *) git_blob_rawcontent(git_blob *blob); ...@@ -99,7 +99,7 @@ GIT_EXTERN(const void *) git_blob_rawcontent(git_blob *blob);
* @param blob pointer to the blob * @param blob pointer to the blob
* @return size in bytes * @return size in bytes
*/ */
GIT_EXTERN(git_off_t) git_blob_rawsize(git_blob *blob); GIT_EXTERN(git_off_t) git_blob_rawsize(const git_blob *blob);
/** /**
* Read a file from the working folder of a repository * Read a file from the working folder of a repository
......
...@@ -802,28 +802,50 @@ GIT_EXTERN(int) git_diff_patch_to_str( ...@@ -802,28 +802,50 @@ GIT_EXTERN(int) git_diff_patch_to_str(
*/ */
/** /**
* Directly run a text diff on two blobs. * Directly run a diff on two blobs.
* *
* Compared to a file, a blob lacks some contextual information. As such, * Compared to a file, a blob lacks some contextual information. As such,
* the `git_diff_file` parameters of the callbacks will be filled * the `git_diff_file` given to the callback will have some fake data; i.e.
* accordingly to the following: `mode` will be set to 0, `path` will be set * `mode` will be 0 and `path` will be NULL.
* to NULL. When dealing with a NULL blob, `oid` will be set to 0.
* *
* When at least one of the blobs being dealt with is binary, the * NULL is allowed for either `old_blob` or `new_blob` and will be treated
* `git_diff_delta` binary attribute will be set to 1 and no call to the * as an empty blob, with the `oid` set to all zeros in the `git_diff_file` data.
* hunk_cb nor line_cb will be made. *
* We do run a binary content check on the two blobs and if either of the
* blobs looks like binary data, the `git_diff_delta` binary attribute will
* be set to 1 and no call to the hunk_cb nor line_cb will be made (unless
* you pass `GIT_DIFF_FORCE_TEXT` of course).
* *
* @return 0 on success, GIT_EUSER on non-zero callback, or error code * @return 0 on success, GIT_EUSER on non-zero callback, or error code
*/ */
GIT_EXTERN(int) git_diff_blobs( GIT_EXTERN(int) git_diff_blobs(
git_blob *old_blob, const git_blob *old_blob,
git_blob *new_blob, const git_blob *new_blob,
const git_diff_options *options, const git_diff_options *options,
git_diff_file_cb file_cb, git_diff_file_cb file_cb,
git_diff_hunk_cb hunk_cb, git_diff_hunk_cb hunk_cb,
git_diff_data_cb line_cb, git_diff_data_cb line_cb,
void *payload); void *payload);
/**
 * Directly run a diff between a blob and a buffer.
 *
 * As with `git_diff_blobs`, comparing a blob and buffer lacks some context,
 * so the `git_diff_file` parameters to the callbacks will be faked a la the
 * rules for `git_diff_blobs()`.
 *
 * Note that for the buffer side the implementation reports a `mode` of
 * 0644 and, when `buffer` is not NULL, an `oid` computed by hashing the
 * buffer contents as a blob.
 *
 * By default the blob is the old side and the buffer is the new side of
 * the diff; passing `GIT_DIFF_REVERSE` in the options swaps the two.
 *
 * @param old_blob Blob to diff from; may be NULL
 * @param buffer Raw data to diff against; may be NULL, in which case that
 *               side of the diff is flagged as having no data
 * @param buffer_len Length in bytes of `buffer`
 * @param options Options for the diff; may be NULL
 * @param file_cb Callback for the (single, faked) file delta
 * @param hunk_cb Callback for each hunk in the diff
 * @param data_cb Callback for each line in the diff
 * @param payload Opaque pointer forwarded along with the callbacks
 * @return 0 on success, GIT_EUSER on non-zero callback, or error code
 */
GIT_EXTERN(int) git_diff_blob_to_buffer(
	const git_blob *old_blob,
	const char *buffer,
	size_t buffer_len,
	const git_diff_options *options,
	git_diff_file_cb file_cb,
	git_diff_hunk_cb hunk_cb,
	git_diff_data_cb data_cb,
	void *payload);
GIT_END_DECL GIT_END_DECL
/** @} */ /** @} */
......
...@@ -13,13 +13,13 @@ ...@@ -13,13 +13,13 @@
#include "blob.h" #include "blob.h"
#include "filter.h" #include "filter.h"
const void *git_blob_rawcontent(git_blob *blob) const void *git_blob_rawcontent(const git_blob *blob)
{ {
assert(blob); assert(blob);
return blob->odb_object->raw.data; return blob->odb_object->raw.data;
} }
git_off_t git_blob_rawsize(git_blob *blob) git_off_t git_blob_rawsize(const git_blob *blob)
{ {
assert(blob); assert(blob);
return (git_off_t)blob->odb_object->raw.len; return (git_off_t)blob->odb_object->raw.len;
......
...@@ -132,16 +132,16 @@ static int diff_delta_is_binary_by_attr( ...@@ -132,16 +132,16 @@ static int diff_delta_is_binary_by_attr(
} }
static int diff_delta_is_binary_by_content( static int diff_delta_is_binary_by_content(
diff_context *ctxt, git_diff_delta *delta, git_diff_file *file, git_map *map) diff_context *ctxt,
git_diff_delta *delta,
git_diff_file *file,
const git_map *map)
{ {
git_buf search; const git_buf search = { map->data, 0, min(map->len, 4000) };
GIT_UNUSED(ctxt); GIT_UNUSED(ctxt);
if ((file->flags & KNOWN_BINARY_FLAGS) == 0) { if ((file->flags & KNOWN_BINARY_FLAGS) == 0) {
search.ptr = map->data;
search.size = min(map->len, 4000);
if (git_buf_text_is_binary(&search)) if (git_buf_text_is_binary(&search))
file->flags |= GIT_DIFF_FILE_BINARY; file->flags |= GIT_DIFF_FILE_BINARY;
else else
...@@ -1231,9 +1231,8 @@ int git_diff_print_patch( ...@@ -1231,9 +1231,8 @@ int git_diff_print_patch(
return error; return error;
} }
static void set_data_from_blob( static void set_data_from_blob(
git_blob *blob, git_map *map, git_diff_file *file) const git_blob *blob, git_map *map, git_diff_file *file)
{ {
if (blob) { if (blob) {
file->size = git_blob_rawsize(blob); file->size = git_blob_rawsize(blob);
...@@ -1251,83 +1250,152 @@ static void set_data_from_blob( ...@@ -1251,83 +1250,152 @@ static void set_data_from_blob(
} }
} }
int git_diff_blobs( static void set_data_from_buffer(
git_blob *old_blob, const char *buffer, size_t buffer_len, git_map *map, git_diff_file *file)
git_blob *new_blob,
const git_diff_options *options,
git_diff_file_cb file_cb,
git_diff_hunk_cb hunk_cb,
git_diff_data_cb data_cb,
void *payload)
{ {
int error; file->size = (git_off_t)buffer_len;
git_repository *repo; file->mode = 0644;
if (!buffer)
file->flags |= GIT_DIFF_FILE_NO_DATA;
else
git_odb_hash(&file->oid, buffer, buffer_len, GIT_OBJ_BLOB);
map->len = buffer_len;
map->data = (char *)buffer;
}
typedef struct {
diff_context ctxt; diff_context ctxt;
git_diff_delta delta; git_diff_delta delta;
git_diff_patch patch; git_diff_patch patch;
} diff_single_data;
GITERR_CHECK_VERSION(options, GIT_DIFF_OPTIONS_VERSION, "git_diff_options"); static int diff_single_init(
diff_single_data *data,
if (options && (options->flags & GIT_DIFF_REVERSE)) { git_repository *repo,
git_blob *swap = old_blob; const git_diff_options *opts,
old_blob = new_blob; git_diff_file_cb file_cb,
new_blob = swap; git_diff_hunk_cb hunk_cb,
} git_diff_data_cb data_cb,
void *payload)
{
GITERR_CHECK_VERSION(opts, GIT_DIFF_OPTIONS_VERSION, "git_diff_options");
if (new_blob) memset(data, 0, sizeof(*data));
repo = git_object_owner((git_object *)new_blob);
else if (old_blob)
repo = git_object_owner((git_object *)old_blob);
else
repo = NULL;
diff_context_init( diff_context_init(
&ctxt, NULL, repo, options, &data->ctxt, NULL, repo, opts, file_cb, hunk_cb, data_cb, payload);
file_cb, hunk_cb, data_cb, payload);
diff_patch_init(&ctxt, &patch); diff_patch_init(&data->ctxt, &data->patch);
/* create a fake delta record and simulate diff_patch_load */ return 0;
}
memset(&delta, 0, sizeof(delta)); static int diff_single_apply(diff_single_data *data)
delta.binary = -1; {
int error;
git_diff_delta *delta = &data->delta;
bool has_old = ((delta->old_file.flags & GIT_DIFF_FILE_NO_DATA) == 0);
bool has_new = ((delta->new_file.flags & GIT_DIFF_FILE_NO_DATA) == 0);
set_data_from_blob(old_blob, &patch.old_data, &delta.old_file); /* finish setting up fake git_diff_delta record and loaded data */
set_data_from_blob(new_blob, &patch.new_data, &delta.new_file);
delta.status = new_blob ? data->patch.delta = delta;
(old_blob ? GIT_DELTA_MODIFIED : GIT_DELTA_ADDED) : delta->binary = -1;
(old_blob ? GIT_DELTA_DELETED : GIT_DELTA_UNTRACKED);
if (git_oid_cmp(&delta.new_file.oid, &delta.old_file.oid) == 0) delta->status = has_new ?
delta.status = GIT_DELTA_UNMODIFIED; (has_old ? GIT_DELTA_MODIFIED : GIT_DELTA_ADDED) :
(has_old ? GIT_DELTA_DELETED : GIT_DELTA_UNTRACKED);
patch.delta = &delta; if (git_oid_cmp(&delta->new_file.oid, &delta->old_file.oid) == 0)
delta->status = GIT_DELTA_UNMODIFIED;
if ((error = diff_delta_is_binary_by_content( if ((error = diff_delta_is_binary_by_content(
&ctxt, &delta, &delta.old_file, &patch.old_data)) < 0 || &data->ctxt, delta, &delta->old_file, &data->patch.old_data)) < 0 ||
(error = diff_delta_is_binary_by_content( (error = diff_delta_is_binary_by_content(
&ctxt, &delta, &delta.new_file, &patch.new_data)) < 0) &data->ctxt, delta, &delta->new_file, &data->patch.new_data)) < 0)
goto cleanup; goto cleanup;
patch.flags |= GIT_DIFF_PATCH_LOADED; data->patch.flags |= GIT_DIFF_PATCH_LOADED;
if (delta.binary != 1 && delta.status != GIT_DELTA_UNMODIFIED)
patch.flags |= GIT_DIFF_PATCH_DIFFABLE; if (delta->binary != 1 && delta->status != GIT_DELTA_UNMODIFIED)
data->patch.flags |= GIT_DIFF_PATCH_DIFFABLE;
/* do diffs */ /* do diffs */
if (!(error = diff_delta_file_callback(&ctxt, patch.delta, 1))) if (!(error = diff_delta_file_callback(&data->ctxt, delta, 1)))
error = diff_patch_generate(&ctxt, &patch); error = diff_patch_generate(&data->ctxt, &data->patch);
cleanup: cleanup:
diff_patch_unload(&patch);
if (error == GIT_EUSER) if (error == GIT_EUSER)
giterr_clear(); giterr_clear();
diff_patch_unload(&data->patch);
return error; return error;
} }
/*
 * Diff two blobs directly, without a git_diff_list.
 *
 * Either blob may be NULL.  The owning repository is taken from
 * `new_blob` when present, otherwise from `old_blob`, otherwise it is
 * NULL.  When `options` carries GIT_DIFF_REVERSE the two blobs trade
 * places before the fake delta is populated.
 *
 * Returns whatever diff_single_init() reports if it fails (< 0),
 * otherwise the result of diff_single_apply().
 */
int git_diff_blobs(
	const git_blob *old_blob,
	const git_blob *new_blob,
	const git_diff_options *options,
	git_diff_file_cb file_cb,
	git_diff_hunk_cb hunk_cb,
	git_diff_data_cb data_cb,
	void *payload)
{
	diff_single_data single;
	git_repository *owner = NULL;
	const git_blob *old_side = old_blob;
	const git_blob *new_side = new_blob;
	int rc;

	/* the owner is resolved from the blobs as passed in, before any swap */
	if (new_blob)
		owner = git_object_owner((const git_object *)new_blob);
	else if (old_blob)
		owner = git_object_owner((const git_object *)old_blob);

	rc = diff_single_init(
		&single, owner, options, file_cb, hunk_cb, data_cb, payload);
	if (rc < 0)
		return rc;

	/* a reversed diff simply feeds the blobs to the opposite sides */
	if (options != NULL && (options->flags & GIT_DIFF_REVERSE) != 0) {
		old_side = new_blob;
		new_side = old_blob;
	}

	set_data_from_blob(
		old_side, &single.patch.old_data, &single.delta.old_file);
	set_data_from_blob(
		new_side, &single.patch.new_data, &single.delta.new_file);

	return diff_single_apply(&single);
}
/*
 * Diff a blob against a raw in-memory buffer.
 *
 * `old_blob` and `buf` may each be NULL.  The repository is taken from
 * `old_blob` when it is present, otherwise it is NULL.  By default the
 * blob is the old side and the buffer the new side; with
 * GIT_DIFF_REVERSE set in `options` the buffer becomes the old side and
 * the blob the new side.
 *
 * Returns whatever diff_single_init() reports if it fails (< 0),
 * otherwise the result of diff_single_apply().
 */
int git_diff_blob_to_buffer(
	const git_blob *old_blob,
	const char *buf,
	size_t buflen,
	const git_diff_options *options,
	git_diff_file_cb file_cb,
	git_diff_hunk_cb hunk_cb,
	git_diff_data_cb data_cb,
	void *payload)
{
	int error;
	diff_single_data d;
	git_repository *repo =
		old_blob ? git_object_owner((const git_object *)old_blob) : NULL;

	/*
	 * A NULL buffer has no readable bytes.  set_data_from_buffer() copies
	 * the length into the map unconditionally, and the binary content
	 * check scans up to that many bytes from the map's data pointer, so
	 * a NULL pointer must never be paired with a non-zero length.
	 */
	if (buf == NULL)
		buflen = 0;

	if ((error = diff_single_init(
			&d, repo, options, file_cb, hunk_cb, data_cb, payload)) < 0)
		return error;

	if (options && (options->flags & GIT_DIFF_REVERSE) != 0) {
		/* reversed: buffer is the old side, blob is the new side */
		set_data_from_buffer(
			buf, buflen, &d.patch.old_data, &d.delta.old_file);
		set_data_from_blob(
			old_blob, &d.patch.new_data, &d.delta.new_file);
	} else {
		set_data_from_blob(
			old_blob, &d.patch.old_data, &d.delta.old_file);
		set_data_from_buffer(
			buf, buflen, &d.patch.new_data, &d.delta.new_file);
	}

	return diff_single_apply(&d);
}
size_t git_diff_num_deltas(git_diff_list *diff) size_t git_diff_num_deltas(git_diff_list *diff)
{ {
......
...@@ -347,3 +347,81 @@ void test_diff_blob__can_correctly_detect_a_textual_blob_as_non_binary(void) ...@@ -347,3 +347,81 @@ void test_diff_blob__can_correctly_detect_a_textual_blob_as_non_binary(void)
/* tests/resources/attr/root_test4.txt */ /* tests/resources/attr/root_test4.txt */
cl_assert_equal_i(false, git_blob_is_binary(d)); cl_assert_equal_i(false, git_blob_is_binary(d));
} }
/*
* git_diff_blob_to_buffer tests
*/
/*
 * Exercise git_diff_blob_to_buffer() across five scenarios: blob vs.
 * different content, blob vs. matching content, NULL blob vs. content,
 * blob vs. NULL buffer, and blob vs. NULL buffer with GIT_DIFF_REVERSE.
 *
 * NOTE(review): `g_repo`, `opts`, `expected` and the diff_*_cb callbacks
 * are not declared in this function; presumably they are fixture-level
 * state set up by the suite's initialize step -- confirm before relying
 * on their starting values (the first diff below does not reset
 * `expected` itself).
 */
void test_diff_blob__can_compare_blob_to_buffer(void)
{
	git_blob *a;
	git_oid a_oid;
	/* a_content is diffed against blob a below and asserted identical */
	const char *a_content = "Hello from the root\n";
	/* b_content is a_content's line followed by five more lines */
	const char *b_content = "Hello from the root\n\nSome additional lines\n\nDown here below\n\n";

	/* tests/resources/attr/root_test1 */
	cl_git_pass(git_oid_fromstrn(&a_oid, "45141a79", 8));
	cl_git_pass(git_blob_lookup_prefix(&a, g_repo, &a_oid, 4));

	/* diff from blob a to content of b */
	cl_git_pass(git_diff_blob_to_buffer(
		a, b_content, strlen(b_content),
		&opts, diff_file_cb, diff_hunk_cb, diff_line_cb, &expected));

	/* one modified text file: 1 shared context line plus 5 added lines */
	cl_assert_equal_i(1, expected.files);
	cl_assert_equal_i(1, expected.file_status[GIT_DELTA_MODIFIED]);
	cl_assert_equal_i(0, expected.files_binary);
	cl_assert_equal_i(1, expected.hunks);
	cl_assert_equal_i(6, expected.lines);
	cl_assert_equal_i(1, expected.line_ctxt);
	cl_assert_equal_i(5, expected.line_adds);
	cl_assert_equal_i(0, expected.line_dels);

	/* diff from blob a to content of a */
	memset(&expected, 0, sizeof(expected));
	cl_git_pass(git_diff_blob_to_buffer(
		a, a_content, strlen(a_content),
		&opts, diff_file_cb, diff_hunk_cb, diff_line_cb, &expected));

	assert_identical_blobs_comparison(&expected);

	/* diff from NULL blob to content of a */
	memset(&expected, 0, sizeof(expected));
	cl_git_pass(git_diff_blob_to_buffer(
		NULL, a_content, strlen(a_content),
		&opts, diff_file_cb, diff_hunk_cb, diff_line_cb, &expected));

	/* no old side, so the single line of a_content shows up as added */
	cl_assert_equal_i(1, expected.files);
	cl_assert_equal_i(1, expected.file_status[GIT_DELTA_ADDED]);
	cl_assert_equal_i(1, expected.hunks);
	cl_assert_equal_i(1, expected.lines);
	cl_assert_equal_i(1, expected.line_adds);

	/* diff from blob a to NULL buffer */
	memset(&expected, 0, sizeof(expected));
	cl_git_pass(git_diff_blob_to_buffer(
		a, NULL, 0,
		&opts, diff_file_cb, diff_hunk_cb, diff_line_cb, &expected));

	/* no new side, so the blob's single line shows up as deleted */
	cl_assert_equal_i(1, expected.files);
	cl_assert_equal_i(1, expected.file_status[GIT_DELTA_DELETED]);
	cl_assert_equal_i(1, expected.hunks);
	cl_assert_equal_i(1, expected.lines);
	cl_assert_equal_i(1, expected.line_dels);

	/*
	 * diff with reverse: same inputs as the previous case, but the blob
	 * now lands on the new side, so the delete becomes an add.
	 * NOTE(review): `^=` toggles the bit, so this only turns REVERSE on
	 * if it was off in `opts` beforehand; it is also not restored here.
	 */
	opts.flags ^= GIT_DIFF_REVERSE;

	memset(&expected, 0, sizeof(expected));
	cl_git_pass(git_diff_blob_to_buffer(
		a, NULL, 0,
		&opts, diff_file_cb, diff_hunk_cb, diff_line_cb, &expected));

	cl_assert_equal_i(1, expected.files);
	cl_assert_equal_i(1, expected.file_status[GIT_DELTA_ADDED]);
	cl_assert_equal_i(1, expected.hunks);
	cl_assert_equal_i(1, expected.lines);
	cl_assert_equal_i(1, expected.line_adds);

	git_blob_free(a);
}
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment