diff_xdiff.c 6.77 KB
Newer Older
1 2 3 4 5 6
/*
 * Copyright (C) the libgit2 contributors. All rights reserved.
 *
 * This file is part of libgit2, distributed under the GNU GPL v2 with
 * a Linking Exception. For full terms see the included COPYING file.
 */
7
#include "git2/errors.h"
8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27
#include "common.h"
#include "diff.h"
#include "diff_driver.h"
#include "diff_patch.h"
#include "diff_xdiff.h"

/*
 * Scan forward in `*str` to the next run of decimal digits and parse it.
 *
 * On return `*str` points just past the last digit consumed (or at the
 * terminating NUL if no digit was found) and `*value` holds the parsed
 * number (0 when no digit was found).  Both outputs are written even on
 * failure.
 *
 * Returns 0 if at least one digit was read, -1 otherwise.
 */
static int git_xdiff_scan_int(const char **str, int *value)
{
	const char *cursor = *str;
	const char *first_digit;
	int number = 0;

	/* skip everything up to the next digit (or the end of the string) */
	while (*cursor != '\0' && !git__isdigit(*cursor))
		cursor++;

	/* accumulate the decimal value of the digit run */
	first_digit = cursor;
	while (git__isdigit(*cursor)) {
		number = (number * 10) + (*cursor - '0');
		cursor++;
	}

	*str = cursor;
	*value = number;

	return (cursor == first_digit) ? -1 : 0;
}

28
/*
 * Parse one "%d[,%d]" range: a start line optionally followed by a comma
 * and a line count.  When the count is absent it is taken to be 1.
 *
 * Returns 0 on success, -1 if a required number could not be read.
 */
static int git_xdiff_scan_range(const char **str, int *start, int *lines)
{
	if (git_xdiff_scan_int(str, start) < 0)
		return -1;

	if (**str != ',') {
		*lines = 1;
		return 0;
	}

	return git_xdiff_scan_int(str, lines);
}

/*
 * Fill in the old/new start and line-count fields of `hunk` from a hunk
 * header of the form "@@ -%d[,%d] +%d[,%d] @@".
 *
 * Returns 0 on success.  If the header does not start with '@', a number
 * is missing, or a start line is negative, sets a GITERR_INVALID error
 * and returns -1.
 */
static int git_xdiff_parse_hunk(git_diff_hunk *hunk, const char *header)
{
	const char *pos = header;

	if (*pos != '@' ||
		git_xdiff_scan_range(&pos, &hunk->old_start, &hunk->old_lines) < 0 ||
		git_xdiff_scan_range(&pos, &hunk->new_start, &hunk->new_lines) < 0 ||
		hunk->old_start < 0 ||
		hunk->new_start < 0)
	{
		giterr_set(GITERR_INVALID, "Malformed hunk header from xdiff");
		return -1;
	}

	return 0;
}

typedef struct {
	git_xdiff_output *xo;
59 60
	git_patch *patch;
	git_diff_hunk hunk;
Russell Belfer committed
61
	int old_lineno, new_lineno;
62
	mmfile_t xd_old_data, xd_new_data;
63 64
} git_xdiff_info;

65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85
/*
 * Finish filling in `line` for the given content and advance the running
 * line counters kept in `info`.
 *
 * `line->origin` must already be set by the caller.  This records the
 * content pointer and length, counts the '\n' bytes in the content into
 * `line->num_lines`, and assigns old/new line numbers depending on which
 * side(s) of the diff the origin belongs to (-1 for a side the line is
 * not part of).
 *
 * Returns 0 on success; for an unrecognised origin sets a GITERR_INVALID
 * error and returns -1 without touching the line numbers.
 */
static int diff_update_lines(
	git_xdiff_info *info,
	git_diff_line *line,
	const char *content,
	size_t content_len)
{
	const char *pos = content;
	const char *end = content + content_len;
	int in_old = 0, in_new = 0;

	line->num_lines = 0;
	while (pos < end) {
		if (*pos == '\n')
			++line->num_lines;
		++pos;
	}

	line->content     = content;
	line->content_len = content_len;

	/* work out which side(s) of the diff this line is counted against */
	switch (line->origin) {
	case GIT_DIFF_LINE_ADDITION:
	case GIT_DIFF_LINE_DEL_EOFNL:
		in_new = 1;
		break;
	case GIT_DIFF_LINE_DELETION:
	case GIT_DIFF_LINE_ADD_EOFNL:
		in_old = 1;
		break;
	case GIT_DIFF_LINE_CONTEXT:
	case GIT_DIFF_LINE_CONTEXT_EOFNL:
		in_old = 1;
		in_new = 1;
		break;
	default:
		giterr_set(GITERR_INVALID, "Unknown diff line origin %02x",
			(unsigned int)line->origin);
		return -1;
	}

	line->old_lineno = in_old ? info->old_lineno : -1;
	line->new_lineno = in_new ? info->new_lineno : -1;

	if (in_old)
		info->old_lineno += (int)line->num_lines;
	if (in_new)
		info->new_lineno += (int)line->num_lines;

	return 0;
}

110 111 112
/*
 * Output callback invoked by xdiff; `priv` is the git_xdiff_info for the
 * patch being generated.
 *
 * The number of buffers tells us what is being reported:
 *   len == 1   bufs[0] is a hunk header
 *   len == 2   bufs[0] starts with " "/"-"/"+", bufs[1] is the line data
 *   len == 3   as for 2, plus bufs[2] describing an end-of-file newline
 *              change
 * Any other value of `len` is ignored.
 *
 * The outcome of each step is stored in output->error, which is also the
 * value returned.
 */
static int git_xdiff_cb(void *priv, mmbuffer_t *bufs, int len)
{
	git_xdiff_info *info = priv;
	git_diff_output *output = &info->xo->output;
	const git_diff_delta *delta = git_patch_get_delta(info->patch);
	git_diff_hunk *hunk = &info->hunk;
	git_diff_line line;
	size_t header_len;

	switch (len) {
	case 1:
		output->error = git_xdiff_parse_hunk(hunk, bufs[0].ptr);
		if (output->error < 0)
			break;

		/* keep a NUL-terminated copy of the header, truncated to fit */
		header_len = bufs[0].size;
		if (header_len >= sizeof(hunk->header))
			header_len = sizeof(hunk->header) - 1;
		memcpy(hunk->header, bufs[0].ptr, header_len);
		hunk->header[header_len] = '\0';
		hunk->header_len = header_len;

		if (output->hunk_cb != NULL) {
			output->error = output->hunk_cb(delta, hunk, output->payload);
			if (output->error)
				break;
		}

		/* line numbering restarts at the beginning of every hunk */
		info->old_lineno = hunk->old_start;
		info->new_lineno = hunk->new_start;
		break;

	case 2:
	case 3:
		/* expect " "/"-"/"+", then data */
		switch (*bufs[0].ptr) {
		case '+':
			line.origin = GIT_DIFF_LINE_ADDITION;
			line.content_offset = bufs[1].ptr - info->xd_new_data.ptr;
			break;
		case '-':
			line.origin = GIT_DIFF_LINE_DELETION;
			line.content_offset = bufs[1].ptr - info->xd_old_data.ptr;
			break;
		default:
			line.origin = GIT_DIFF_LINE_CONTEXT;
			line.content_offset = -1;
			break;
		}

		output->error = diff_update_lines(
			info, &line, bufs[1].ptr, bufs[1].size);

		if (!output->error && output->data_cb != NULL)
			output->error = output->data_cb(
				delta, hunk, &line, output->payload);

		if (len != 3 || output->error)
			break;

		/* If we have a '+' and a third buf, then we have added a line
		 * without a newline and the old code had one, so DEL_EOFNL.
		 * If we have a '-' and a third buf, then we have removed a line
		 * without a newline but added a blank line, so ADD_EOFNL.
		 */
		switch (*bufs[0].ptr) {
		case '+':
			line.origin = GIT_DIFF_LINE_DEL_EOFNL;
			break;
		case '-':
			line.origin = GIT_DIFF_LINE_ADD_EOFNL;
			break;
		default:
			line.origin = GIT_DIFF_LINE_CONTEXT_EOFNL;
			break;
		}
		line.content_offset = -1;

		output->error = diff_update_lines(
			info, &line, bufs[2].ptr, bufs[2].size);

		if (!output->error && output->data_cb != NULL)
			output->error = output->data_cb(
				delta, hunk, &line, output->payload);
		break;

	default:
		break;
	}

	return output->error;
}

184
/*
 * Run xdiff over the old and new content of `patch`, reporting hunks and
 * lines through the callbacks stored in `output` (which must be the
 * `output` member of a git_xdiff_output, since it is cast back to one).
 *
 * Returns -1 with a GITERR_INVALID error if either side is larger than
 * GIT_XDIFF_MAX_SIZE; otherwise returns the error value left in
 * xo->output.error by the output callback.
 */
static int git_xdiff(git_diff_output *output, git_patch *patch)
{
	git_xdiff_output *xo = (git_xdiff_output *)output;
	git_xdiff_info info;
	git_diff_find_context_payload findctxt;

	memset(&info, 0, sizeof(info));
	info.patch = patch;
	info.xo    = xo;

	/* `info` lives on this stack frame; it is only valid during xdl_diff */
	xo->callback.priv = &info;

	git_diff_find_context_init(
		&xo->config.find_func, &findctxt, git_patch__driver(patch));
	xo->config.find_func_priv = &findctxt;

	/* only ask xdiff for function names when there is a finder to call */
	if (xo->config.find_func != NULL)
		xo->config.flags |= XDL_EMIT_FUNCNAMES;
	else
		xo->config.flags &= ~XDL_EMIT_FUNCNAMES;

	/* TODO: check ofile.opts_flags to see if driver-specific per-file
	 * updates are needed to xo->params.flags
	 */

	git_patch__old_data(&info.xd_old_data.ptr, &info.xd_old_data.size, patch);
	git_patch__new_data(&info.xd_new_data.ptr, &info.xd_new_data.size, patch);

	if (info.xd_old_data.size > GIT_XDIFF_MAX_SIZE ||
		info.xd_new_data.size > GIT_XDIFF_MAX_SIZE) {
		/* the find-context payload was initialized above, so it has to
		 * be released on this early exit just as on the normal path
		 */
		git_diff_find_context_clear(&findctxt);
		giterr_set(GITERR_INVALID, "files too large for diff");
		return -1;
	}

	/* NOTE(review): the return value of xdl_diff() is not inspected; only
	 * errors recorded by the output callback are reported to the caller.
	 */
	xdl_diff(&info.xd_old_data, &info.xd_new_data,
		&xo->params, &xo->config, &xo->callback);

	git_diff_find_context_clear(&findctxt);

	return xo->output.error;
}

/*
 * Set up `xo` so that it diffs with xdiff: installs git_xdiff() as the
 * diff function and git_xdiff_cb() as xdiff's output callback, and
 * translates the diff options into xdiff configuration.
 *
 * `opts` may be NULL, in which case 3 context lines, 0 inter-hunk lines
 * and no flags are used.  xdiff parameter flags are OR-ed into whatever
 * `xo->params.flags` already holds; the field is not reset here.
 */
void git_xdiff_init(git_xdiff_output *xo, const git_diff_options *opts)
{
	/* git diff option flag -> xdiff parameter flag(s) it switches on */
	static const struct {
		uint32_t git_flag;
		unsigned long xdf_flags;
	} flag_map[] = {
		{ GIT_DIFF_IGNORE_WHITESPACE,        XDF_WHITESPACE_FLAGS },
		{ GIT_DIFF_IGNORE_WHITESPACE_CHANGE, XDF_IGNORE_WHITESPACE_CHANGE },
		{ GIT_DIFF_IGNORE_WHITESPACE_EOL,    XDF_IGNORE_WHITESPACE_AT_EOL },
		{ GIT_DIFF_PATIENCE,                 XDF_PATIENCE_DIFF },
		{ GIT_DIFF_MINIMAL,                  XDF_NEED_MINIMAL },
	};
	uint32_t flags = 0;
	size_t i;

	xo->output.diff_cb = git_xdiff;
	xo->callback.outf = git_xdiff_cb;

	if (opts != NULL) {
		flags = opts->flags;
		xo->config.ctxlen = opts->context_lines;
		xo->config.interhunkctxlen = opts->interhunk_lines;
	} else {
		xo->config.ctxlen = 3;
		xo->config.interhunkctxlen = 0;
	}

	for (i = 0; i < sizeof(flag_map) / sizeof(flag_map[0]); i++) {
		if (flags & flag_map[i].git_flag)
			xo->params.flags |= flag_map[i].xdf_flags;
	}
}