diff_xdiff.c 6.82 KB
Newer Older
1 2 3 4 5 6
/*
 * Copyright (C) the libgit2 contributors. All rights reserved.
 *
 * This file is part of libgit2, distributed under the GNU GPL v2 with
 * a Linking Exception. For full terms see the included COPYING file.
 */
7 8 9

#include "diff_xdiff.h"

#include <limits.h>

#include "git2/errors.h"
#include "diff.h"
#include "diff_driver.h"
#include "patch_generate.h"
14 15 16 17 18 19 20 21 22 23 24 25 26 27 28

/*
 * Skip forward in `*str` to the next run of decimal digits and parse it.
 *
 * Any non-digit characters before the number are skipped.  On return,
 * `*str` points just past the last digit consumed (or at the terminating
 * NUL when no digit was found) and `*value` holds the parsed number.
 *
 * Returns 0 when at least one digit was parsed and the result fits in an
 * `int`.  Returns -1 when no digit was found or when the number is too
 * large; in the latter case `*value` is clamped to INT_MAX and the rest of
 * the digit run is still consumed.
 */
static int git_xdiff_scan_int(const char **str, int *value)
{
	const char *scan;
	int v = 0, digits = 0, overflow = 0;

	/* find next digit */
	for (scan = *str; *scan && !git__isdigit(*scan); scan++)
		;

	/* parse next number; signed overflow is undefined, so check first */
	for (; git__isdigit(*scan); scan++, digits++) {
		int d = *scan - '0';

		if (overflow)
			continue;

		if (v > (INT_MAX - d) / 10) {
			v = INT_MAX;
			overflow = 1;
		} else {
			v = (v * 10) + d;
		}
	}

	*str = scan;
	*value = v;

	return (digits > 0 && !overflow) ? 0 : -1;
}

29
/*
 * Fill in the start/line-count fields of `hunk` from an xdiff hunk header
 * of the form "@@ -%d[,%d] +%d[,%d] @@".
 *
 * A range without the optional ",count" part gets a line count of 1.
 *
 * Returns 0 on success.  On a malformed header, sets a GITERR_INVALID
 * error and returns -1.
 */
static int git_xdiff_parse_hunk(git_diff_hunk *hunk, const char *header)
{
	if (*header != '@')
		goto malformed;

	/* old side: start, then optional ",count" */
	if (git_xdiff_scan_int(&header, &hunk->old_start) < 0)
		goto malformed;

	if (*header != ',')
		hunk->old_lines = 1;
	else if (git_xdiff_scan_int(&header, &hunk->old_lines) < 0)
		goto malformed;

	/* new side: start, then optional ",count" */
	if (git_xdiff_scan_int(&header, &hunk->new_start) < 0)
		goto malformed;

	if (*header != ',')
		hunk->new_lines = 1;
	else if (git_xdiff_scan_int(&header, &hunk->new_lines) < 0)
		goto malformed;

	if (hunk->old_start >= 0 && hunk->new_start >= 0)
		return 0;

malformed:
	giterr_set(GITERR_INVALID, "malformed hunk header from xdiff");
	return -1;
}

typedef struct {
	git_xdiff_output *xo;
60
	git_patch_generated *patch;
61
	git_diff_hunk hunk;
Russell Belfer committed
62
	int old_lineno, new_lineno;
63
	mmfile_t xd_old_data, xd_new_data;
64 65
} git_xdiff_info;

66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86
/*
 * Populate `line` for a chunk of diff content and advance the running
 * line counters kept in `info`.
 *
 * `line->origin` must already be set by the caller.  The number of '\n'
 * bytes in `content` becomes `line->num_lines`; the side(s) the origin
 * applies to receive the current line number from `info` and that counter
 * is then advanced by `num_lines`.  A side the origin does not apply to
 * gets a line number of -1.
 *
 * Returns 0 on success, or -1 (with a GITERR_INVALID error set) when the
 * origin is not recognised.
 */
static int diff_update_lines(
	git_xdiff_info *info,
	git_diff_line *line,
	const char *content,
	size_t content_len)
{
	const char *p;
	const char *end = content + content_len;
	int on_old, on_new;

	/* count the newlines contained in this chunk */
	line->num_lines = 0;
	for (p = content; p < end; p++) {
		if (*p == '\n')
			line->num_lines++;
	}

	line->content     = content;
	line->content_len = content_len;

	/* work out which side(s) of the diff this origin belongs to */
	switch (line->origin) {
	case GIT_DIFF_LINE_ADDITION:
	case GIT_DIFF_LINE_DEL_EOFNL:
		on_old = 0;
		on_new = 1;
		break;
	case GIT_DIFF_LINE_DELETION:
	case GIT_DIFF_LINE_ADD_EOFNL:
		on_old = 1;
		on_new = 0;
		break;
	case GIT_DIFF_LINE_CONTEXT:
	case GIT_DIFF_LINE_CONTEXT_EOFNL:
		on_old = 1;
		on_new = 1;
		break;
	default:
		giterr_set(GITERR_INVALID, "unknown diff line origin %02x",
			(unsigned int)line->origin);
		return -1;
	}

	/* record the current position, then move past the lines consumed */
	line->old_lineno = on_old ? info->old_lineno : -1;
	line->new_lineno = on_new ? info->new_lineno : -1;

	if (on_old)
		info->old_lineno += (int)line->num_lines;
	if (on_new)
		info->new_lineno += (int)line->num_lines;

	return 0;
}

111 112 113
/*
 * Output callback installed into the xdiff emit structure.
 *
 * `priv` is the git_xdiff_info for the current diff.  The number of
 * buffers selects what is being reported:
 *   - 1 buffer:  a hunk header; it is parsed, copied (truncated if needed)
 *                into info->hunk.header and passed to the hunk callback.
 *   - 2 buffers: an origin marker (" ", "-" or "+") followed by content.
 *   - 3 buffers: as for 2, plus a trailing buffer that is reported as an
 *                additional *_EOFNL line.
 *
 * The result of every step is stored in output->error, which is also the
 * return value.
 */
static int git_xdiff_cb(void *priv, mmbuffer_t *bufs, int len)
{
	git_xdiff_info *info = priv;
	git_patch_generated *patch = info->patch;
	const git_diff_delta *delta = patch->base.delta;
	git_patch_generated_output *output = &info->xo->output;
	git_diff_line line;

	if (len == 1) {
		git_diff_hunk *hunk = &info->hunk;

		output->error = git_xdiff_parse_hunk(hunk, bufs[0].ptr);
		if (output->error < 0)
			return output->error;

		/* keep a NUL-terminated copy of the header, truncating to fit */
		hunk->header_len = bufs[0].size;
		if (hunk->header_len >= sizeof(hunk->header))
			hunk->header_len = sizeof(hunk->header) - 1;
		memcpy(hunk->header, bufs[0].ptr, hunk->header_len);
		hunk->header[hunk->header_len] = '\0';

		if (output->hunk_cb != NULL) {
			output->error = output->hunk_cb(delta, hunk, output->payload);
			if (output->error)
				return output->error;
		}

		/* line numbering restarts at the positions named by the hunk */
		info->old_lineno = hunk->old_start;
		info->new_lineno = hunk->new_start;

		return output->error;
	}

	if (len != 2 && len != 3)
		return output->error;

	/* first buffer is the origin marker, second is the line content */
	switch (*bufs[0].ptr) {
	case '+':
		line.origin = GIT_DIFF_LINE_ADDITION;
		line.content_offset = bufs[1].ptr - info->xd_new_data.ptr;
		break;
	case '-':
		line.origin = GIT_DIFF_LINE_DELETION;
		line.content_offset = bufs[1].ptr - info->xd_old_data.ptr;
		break;
	default:
		line.origin = GIT_DIFF_LINE_CONTEXT;
		line.content_offset = -1;
		break;
	}

	output->error = diff_update_lines(
		info, &line, bufs[1].ptr, bufs[1].size);

	if (!output->error && output->data_cb != NULL)
		output->error = output->data_cb(
			delta, &info->hunk, &line, output->payload);

	if (len == 3 && !output->error) {
		/* A third buffer after '+' means the added line has no trailing
		 * newline while the old content had one, so DEL_EOFNL.  After
		 * '-' it means a line without a newline was removed and a
		 * newline-terminated one added, so ADD_EOFNL.
		 */
		switch (*bufs[0].ptr) {
		case '+':
			line.origin = GIT_DIFF_LINE_DEL_EOFNL;
			break;
		case '-':
			line.origin = GIT_DIFF_LINE_ADD_EOFNL;
			break;
		default:
			line.origin = GIT_DIFF_LINE_CONTEXT_EOFNL;
			break;
		}

		line.content_offset = -1;

		output->error = diff_update_lines(
			info, &line, bufs[2].ptr, bufs[2].size);

		if (!output->error && output->data_cb != NULL)
			output->error = output->data_cb(
				delta, &info->hunk, &line, output->payload);
	}

	return output->error;
}

185
/*
 * Run xdiff over the old and new content of `patch`.
 *
 * `output` must be the git_xdiff_output that was set up by
 * git_xdiff_init(); hunks and lines are reported through its callback
 * (git_xdiff_cb), which receives a stack-allocated git_xdiff_info as its
 * private data.
 *
 * Returns -1 with a GITERR_INVALID error set when either side is larger
 * than GIT_XDIFF_MAX_SIZE; otherwise returns xo->output.error as left by
 * the callbacks.
 */
static int git_xdiff(git_patch_generated_output *output, git_patch_generated *patch)
{
	git_xdiff_output *xo = (git_xdiff_output *)output;
	git_xdiff_info info;
	git_diff_find_context_payload findctxt;

	memset(&info, 0, sizeof(info));
	info.patch = patch;
	info.xo    = xo;

	xo->callback.priv = &info;

	git_diff_find_context_init(
		&xo->config.find_func, &findctxt, git_patch_generated_driver(patch));
	xo->config.find_func_priv = &findctxt;

	/* only ask xdiff for function names when a finder was provided */
	if (xo->config.find_func != NULL)
		xo->config.flags |= XDL_EMIT_FUNCNAMES;
	else
		xo->config.flags &= ~XDL_EMIT_FUNCNAMES;

	/* TODO: check ofile.opts_flags to see if driver-specific per-file
	 * updates are needed to xo->params.flags
	 */

	git_patch_generated_old_data(&info.xd_old_data.ptr, &info.xd_old_data.size, patch);
	git_patch_generated_new_data(&info.xd_new_data.ptr, &info.xd_new_data.size, patch);

	if (info.xd_old_data.size > GIT_XDIFF_MAX_SIZE ||
		info.xd_new_data.size > GIT_XDIFF_MAX_SIZE) {
		/* pair the init above with a clear on this exit path as well */
		git_diff_find_context_clear(&findctxt);
		giterr_set(GITERR_INVALID, "files too large for diff");
		return -1;
	}

	/* NOTE(review): the return value of xdl_diff is not inspected here;
	 * failures are only reported through xo->output.error.
	 */
	xdl_diff(&info.xd_old_data, &info.xd_new_data,
		&xo->params, &xo->config, &xo->callback);

	git_diff_find_context_clear(&findctxt);

	return xo->output.error;
}

/*
 * Prepare `xo` for use as an xdiff-backed patch output.
 *
 * Installs git_xdiff as the diff callback and git_xdiff_cb as the xdiff
 * output function, then translates `opts` into xdiff configuration.  When
 * `opts` is NULL, 3 context lines, 0 inter-hunk lines and no flags are
 * used.  Flag bits are OR-ed into xo->params.flags; existing bits are left
 * as they are.
 */
void git_xdiff_init(git_xdiff_output *xo, const git_diff_options *opts)
{
	uint32_t flags = 0;

	xo->output.diff_cb = git_xdiff;
	xo->callback.outf = git_xdiff_cb;

	if (opts) {
		flags = opts->flags;
		xo->config.ctxlen = opts->context_lines;
		xo->config.interhunkctxlen = opts->interhunk_lines;
	} else {
		xo->config.ctxlen = 3;
		xo->config.interhunkctxlen = 0;
	}

	/* whitespace handling */
	if (flags & GIT_DIFF_IGNORE_WHITESPACE)
		xo->params.flags |= XDF_WHITESPACE_FLAGS;
	if (flags & GIT_DIFF_IGNORE_WHITESPACE_CHANGE)
		xo->params.flags |= XDF_IGNORE_WHITESPACE_CHANGE;
	if (flags & GIT_DIFF_IGNORE_WHITESPACE_EOL)
		xo->params.flags |= XDF_IGNORE_WHITESPACE_AT_EOL;

	/* algorithm selection */
	if (flags & GIT_DIFF_PATIENCE)
		xo->params.flags |= XDF_PATIENCE_DIFF;
	if (flags & GIT_DIFF_MINIMAL)
		xo->params.flags |= XDF_NEED_MINIMAL;
}