attr.c 15.6 KB
Newer Older
1
#include "repository.h"
2 3
#include "fileops.h"
#include "config.h"
4
#include "git2/oid.h"
5 6
#include <ctype.h>

7
GIT__USE_STRMAP;
8

9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27
/* Sentinel attribute values.  git_attr_value() recognizes them by comparing
 * pointer addresses, not string contents, so callers must pass these exact
 * pointers rather than copies of the text.
 */
const char *git_attr__true  = "[internal]__TRUE__";
const char *git_attr__false = "[internal]__FALSE__";
const char *git_attr__unset = "[internal]__UNSET__";

/* Classify an attribute value pointer.
 *
 * The sentinel pointers git_attr__true / git_attr__false / git_attr__unset
 * are matched by address.  NULL is treated like the "unset" sentinel.  Any
 * other pointer is reported as an attribute carrying an explicit value.
 */
git_attr_t git_attr_value(const char *attr)
{
	if (attr == git_attr__true)
		return GIT_ATTR_TRUE_T;

	if (attr == git_attr__false)
		return GIT_ATTR_FALSE_T;

	if (!attr || attr == git_attr__unset)
		return GIT_ATTR_UNSPECIFIED_T;

	return GIT_ATTR_VALUE_T;
}


28
static int collect_attr_files(
29 30 31 32
	git_repository *repo,
	uint32_t flags,
	const char *path,
	git_vector *files);
33 34 35


int git_attr_get(
36
	const char **value,
37 38 39
    git_repository *repo,
	uint32_t flags,
	const char *pathname,
40
	const char *name)
41 42 43 44
{
	int error;
	git_attr_path path;
	git_vector files = GIT_VECTOR_INIT;
45
	size_t i, j;
46 47 48 49 50 51
	git_attr_file *file;
	git_attr_name attr;
	git_attr_rule *rule;

	*value = NULL;

52 53 54
	if (git_attr_path__init(&path, pathname, git_repository_workdir(repo)) < 0)
		return -1;

55
	if ((error = collect_attr_files(repo, flags, pathname, &files)) < 0)
56
		goto cleanup;
57 58 59 60 61 62 63 64 65 66 67

	attr.name = name;
	attr.name_hash = git_attr_file__name_hash(name);

	git_vector_foreach(&files, i, file) {

		git_attr_file__foreach_matching_rule(file, &path, j, rule) {
			int pos = git_vector_bsearch(&rule->assigns, &attr);
			if (pos >= 0) {
				*value = ((git_attr_assignment *)git_vector_get(
							  &rule->assigns, pos))->value;
68
				goto cleanup;
69 70 71 72
			}
		}
	}

73
cleanup:
74
	git_vector_free(&files);
75
	git_attr_path__free(&path);
76 77 78 79 80 81 82 83 84 85 86

	return error;
}


/* Per-attribute bookkeeping used by git_attr_get_many(). */
typedef struct {
	/* search key (name + hash); filled in lazily on first use */
	git_attr_name name;
	/* first matching assignment, or NULL while none has been found */
	git_attr_assignment *found;
} attr_get_many_info;

int git_attr_get_many(
87
	const char **values,
88 89 90 91
    git_repository *repo,
	uint32_t flags,
	const char *pathname,
    size_t num_attr,
92
	const char **names)
93 94 95 96
{
	int error;
	git_attr_path path;
	git_vector files = GIT_VECTOR_INIT;
97
	size_t i, j, k;
98 99 100 101 102
	git_attr_file *file;
	git_attr_rule *rule;
	attr_get_many_info *info = NULL;
	size_t num_found = 0;

103
	memset((void *)values, 0, sizeof(const char *) * num_attr);
104

105 106 107
	if (git_attr_path__init(&path, pathname, git_repository_workdir(repo)) < 0)
		return -1;

108
	if ((error = collect_attr_files(repo, flags, pathname, &files)) < 0)
109
		goto cleanup;
110

111 112
	info = git__calloc(num_attr, sizeof(attr_get_many_info));
	GITERR_CHECK_ALLOC(info);
113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143

	git_vector_foreach(&files, i, file) {

		git_attr_file__foreach_matching_rule(file, &path, j, rule) {

			for (k = 0; k < num_attr; k++) {
				int pos;

				if (info[k].found != NULL) /* already found assignment */
					continue;

				if (!info[k].name.name) {
					info[k].name.name = names[k];
					info[k].name.name_hash = git_attr_file__name_hash(names[k]);
				}

				pos = git_vector_bsearch(&rule->assigns, &info[k].name);
				if (pos >= 0) {
					info[k].found = (git_attr_assignment *)
						git_vector_get(&rule->assigns, pos);
					values[k] = info[k].found->value;

					if (++num_found == num_attr)
						goto cleanup;
				}
			}
		}
	}

cleanup:
	git_vector_free(&files);
144
	git_attr_path__free(&path);
145 146 147 148 149 150 151
	git__free(info);

	return error;
}


int git_attr_foreach(
152 153 154
    git_repository *repo,
	uint32_t flags,
	const char *pathname,
155 156 157 158 159 160
	int (*callback)(const char *name, const char *value, void *payload),
	void *payload)
{
	int error;
	git_attr_path path;
	git_vector files = GIT_VECTOR_INIT;
161
	size_t i, j, k;
162 163 164
	git_attr_file *file;
	git_attr_rule *rule;
	git_attr_assignment *assign;
165
	git_strmap *seen = NULL;
166

167 168 169
	if (git_attr_path__init(&path, pathname, git_repository_workdir(repo)) < 0)
		return -1;

170
	if ((error = collect_attr_files(repo, flags, pathname, &files)) < 0)
171
		goto cleanup;
172

173
	seen = git_strmap_alloc();
174
	GITERR_CHECK_ALLOC(seen);
175 176 177 178 179 180 181

	git_vector_foreach(&files, i, file) {

		git_attr_file__foreach_matching_rule(file, &path, j, rule) {

			git_vector_foreach(&rule->assigns, k, assign) {
				/* skip if higher priority assignment was already seen */
182
				if (git_strmap_exists(seen, assign->name))
183 184
					continue;

185
				git_strmap_insert(seen, assign->name, assign, error);
186 187
				if (error < 0)
					goto cleanup;
188

189 190
				error = callback(assign->name, assign->value, payload);
				if (error) {
Russell Belfer committed
191
					giterr_clear();
192
					error = GIT_EUSER;
193
					goto cleanup;
194
				}
195 196 197 198 199
			}
		}
	}

cleanup:
200
	git_strmap_free(seen);
201
	git_vector_free(&files);
202
	git_attr_path__free(&path);
203 204 205 206 207

	return error;
}


208 209 210 211 212 213 214
/* Define an attribute macro.
 *
 * repo   - repository whose attribute cache receives the macro
 * name   - macro name (copied into the cache's string pool)
 * values - assignment text parsed by git_attr_assignment__parse()
 *
 * Returns -1 if the cache cannot be initialized or an allocation fails,
 * otherwise the result of parsing / inserting the macro.  The rule is
 * freed here whenever that result is negative.
 */
int git_attr_add_macro(
	git_repository *repo,
	const char *name,
	const char *values)
{
	int error;
	git_attr_rule *macro = NULL;
	git_pool *pool;

	if (git_attr_cache__init(repo) < 0)
		return -1;

	macro = git__calloc(1, sizeof(git_attr_rule));
	GITERR_CHECK_ALLOC(macro);

	pool = &git_repository_attr_cache(repo)->pool;

	macro->match.pattern = git_pool_strdup(pool, name);
	if (macro->match.pattern == NULL) {
		/* only the zeroed rule struct has been allocated so far; release
		 * it instead of leaking it on this failure path
		 */
		git__free(macro);
		return -1;
	}

	macro->match.length = strlen(macro->match.pattern);
	macro->match.flags = GIT_ATTR_FNMATCH_MACRO;

	error = git_attr_assignment__parse(repo, pool, &macro->assigns, &values);

	if (!error)
		error = git_attr_cache__insert_macro(repo, macro);

	if (error < 0)
		git_attr_rule__free(macro);

	return error;
}

242 243
/* Report whether an attribute file is present in the repository's cache.
 *
 * repo   - repository whose attribute cache is checked
 * source - file source; becomes the numeric prefix of the cache key
 * path   - file path; a leading workdir prefix is stripped before lookup
 *
 * The cache key has the form "<source>#<path>".  Returns false when the
 * cache map has not been allocated or the key cannot be built.
 */
bool git_attr_cache__is_cached(
	git_repository *repo, git_attr_file_source source, const char *path)
{
	git_buf cache_key = GIT_BUF_INIT;
	git_strmap *files = git_repository_attr_cache(repo)->files;
	const char *workdir = git_repository_workdir(repo);
	bool rval;

	/* nothing can be cached before the map exists (same guard as
	 * load_attr_from_cache)
	 */
	if (files == NULL)
		return false;

	if (workdir && git__prefixcmp(path, workdir) == 0)
		path += strlen(workdir);

	if (git_buf_printf(&cache_key, "%d#%s", (int)source, path) < 0) {
		git_buf_free(&cache_key);
		return false;
	}

	rval = git_strmap_exists(files, git_buf_cstr(&cache_key));

	git_buf_free(&cache_key);

	return rval;
}

262 263
static int load_attr_file(
	const char **data,
Vicent Marti committed
264
	git_futils_filestamp *stamp,
265
	const char *filename)
266 267 268 269
{
	int error;
	git_buf content = GIT_BUF_INIT;

Vicent Marti committed
270
	error = git_futils_filestamp_check(stamp, filename);
271 272
	if (error < 0)
		return error;
273

274 275 276 277
	/* if error == 0, then file is up to date. By returning GIT_ENOTFOUND,
	 * we tell the caller not to reparse this file...
	 */
	if (!error)
278
		return GIT_ENOTFOUND;
279

280
	error = git_futils_readbuffer(&content, filename);
281 282 283 284 285 286
	if (error < 0)
		return error;

	*data = git_buf_detach(&content);

	return 0;
287
}
288

289
/* Load an attribute file's contents from the blob recorded in the index.
 *
 * content - out: raw content pointer of the looked-up blob
 * blob    - out: the blob object backing `content`
 * repo    - repository providing the index and object lookup
 * old_oid - optional id of the previously loaded blob
 * relfile - path looked up in the index
 *
 * Returns 0 on success, GIT_ENOTFOUND when `old_oid` equals the index
 * entry's id, or the negative error from the index / blob lookups.
 */
static int load_attr_blob_from_index(
	const char **content,
	git_blob **blob,
	git_repository *repo,
	const git_oid *old_oid,
	const char *relfile)
{
	git_index *index;
	git_index_entry *entry;
	int pos, error;

	error = git_repository_index__weakptr(&index, repo);
	if (error < 0)
		return error;

	/* a non-negative result is the entry's position in the index */
	pos = git_index_find(index, relfile);
	if (pos < 0)
		return pos;

	entry = git_index_get_byindex(index, pos);

	/* same blob as last time: nothing new to load */
	if (old_oid != NULL && git_oid_cmp(old_oid, &entry->oid) == 0)
		return GIT_ENOTFOUND;

	error = git_blob_lookup(blob, repo, &entry->oid);
	if (error < 0)
		return error;

	*content = git_blob_rawcontent(*blob);
	return 0;
}

/* Fetch a previously cached attribute file, if there is one.
 *
 * file          - out: the cached file, or NULL when nothing is cached
 * cache         - attribute cache to search (may be NULL / unallocated)
 * source        - file source; becomes the numeric prefix of the cache key
 * relative_path - path portion of the cache key
 *
 * Returns 0 whether or not an entry was found, -1 if the "<source>#<path>"
 * key cannot be built.
 */
static int load_attr_from_cache(
	git_attr_file **file,
	git_attr_cache *cache,
	git_attr_file_source source,
	const char *relative_path)
{
	git_buf key = GIT_BUF_INIT;
	khiter_t idx;

	*file = NULL;

	if (cache == NULL || cache->files == NULL)
		return 0;

	if (git_buf_printf(&key, "%d#%s", (int)source, relative_path) < 0)
		return -1;

	idx = git_strmap_lookup_index(cache->files, key.ptr);
	git_buf_free(&key);

	if (!git_strmap_valid_index(cache->files, idx))
		return 0;

	*file = git_strmap_value_at(cache->files, idx);
	return 0;
}
342

343
int git_attr_cache__internal_file(
344 345
	git_repository *repo,
	const char *filename,
346
	git_attr_file **file)
347
{
348
	int error = 0;
349
	git_attr_cache *cache = git_repository_attr_cache(repo);
350
	khiter_t cache_pos = git_strmap_lookup_index(cache->files, filename);
351

352 353
	if (git_strmap_valid_index(cache->files, cache_pos)) {
		*file = git_strmap_value_at(cache->files, cache_pos);
354
		return 0;
355 356
	}

357
	if (git_attr_file__new(file, 0, filename, &cache->pool) < 0)
358
		return -1;
359

360 361 362
	git_strmap_insert(cache->files, (*file)->key + 2, *file, error);
	if (error > 0)
		error = 0;
363 364 365 366

	return error;
}

367
int git_attr_cache__push_file(
368
	git_repository *repo,
369 370 371 372
	const char *base,
	const char *filename,
	git_attr_file_source source,
	git_attr_file_parser parse,
373
	void* parsedata,
374
	git_vector *stack)
375
{
376
	int error = 0;
377
	git_buf path = GIT_BUF_INIT;
378 379 380
	const char *workdir = git_repository_workdir(repo);
	const char *relfile, *content = NULL;
	git_attr_cache *cache = git_repository_attr_cache(repo);
381
	git_attr_file *file = NULL;
382
	git_blob *blob = NULL;
Vicent Marti committed
383
	git_futils_filestamp stamp;
384 385

	assert(filename && stack);
386

387 388
	/* join base and path as needed */
	if (base != NULL && git_path_root(filename) < 0) {
389 390
		if (git_buf_joinpath(&path, base, filename) < 0)
			return -1;
391 392
		filename = path.ptr;
	}
393

394 395 396
	relfile = filename;
	if (workdir && git__prefixcmp(relfile, workdir) == 0)
		relfile += strlen(workdir);
397

398
	/* check cache */
399 400
	if (load_attr_from_cache(&file, cache, source, relfile) < 0)
		return -1;
401

402
	/* if not in cache, load data, parse, and cache */
403

404
	if (source == GIT_ATTR_FILE_FROM_FILE) {
Vicent Marti committed
405
		git_futils_filestamp_set(
406
			&stamp, file ? &file->cache_data.stamp : NULL);
407

408
		error = load_attr_file(&content, &stamp, filename);
409 410 411
	} else {
		error = load_attr_blob_from_index(&content, &blob,
			repo, file ? &file->cache_data.oid : NULL, relfile);
412 413 414 415
	}

	if (error) {
		/* not finding a file is not an error for this function */
416
		if (error == GIT_ENOTFOUND) {
417 418 419 420 421 422
			giterr_clear();
			error = 0;
		}
		goto finish;
	}

423 424 425 426 427 428 429 430
	/* if we got here, we have to parse and/or reparse the file */
	if (file)
		git_attr_file__clear_rules(file);
	else {
		error = git_attr_file__new(&file, source, relfile, &cache->pool);
		if (error < 0)
			goto finish;
	}
431

432
	if (parse && (error = parse(repo, parsedata, content, file)) < 0)
433 434
		goto finish;

435
	git_strmap_insert(cache->files, file->key, file, error); //-V595
436 437 438
	if (error > 0)
		error = 0;

439 440 441 442
	/* remember "cache buster" file signature */
	if (blob)
		git_oid_cpy(&file->cache_data.oid, git_object_id((git_object *)blob));
	else
Vicent Marti committed
443
		git_futils_filestamp_set(&file->cache_data.stamp, &stamp);
444

445 446
finish:
	/* push file onto vector if we found one*/
447
	if (!error && file != NULL)
448
		error = git_vector_insert(stack, file);
449

450 451 452 453 454 455 456 457
	if (error != 0)
		git_attr_file__free(file);

	if (blob)
		git_blob_free(blob);
	else
		git__free((void *)content);

458
	git_buf_free(&path);
459

460 461 462
	return error;
}

463
/* Convenience wrapper around git_attr_cache__push_file(): load file F
 * (joined with base B as needed) from disk for repo R, parse it with the
 * buffer parser, and push it onto stack S.
 */
#define push_attr_file(R, S, B, F) \
	git_attr_cache__push_file( \
		(R), (B), (F), GIT_ATTR_FILE_FROM_FILE, \
		git_attr_file__parse_buffer, NULL, (S))
465

466 467
typedef struct {
	git_repository *repo;
468 469 470
	uint32_t flags;
	const char *workdir;
	git_index *index;
471 472 473
	git_vector *files;
} attr_walk_up_info;

474 475 476 477 478 479 480 481 482 483 484 485 486 487 488 489 490 491 492 493 494 495 496 497 498 499 500
/* Work out which sources to consult, and in which order.
 *
 * flags     - lookup flags; only the low two bits are examined
 * has_wd    - whether a working directory is available
 * has_index - whether an index is available
 * srcs      - out: filled with up to two sources, in lookup order
 *
 * Returns the number of entries written to `srcs`.
 */
int git_attr_cache__decide_sources(
	uint32_t flags, bool has_wd, bool has_index, git_attr_file_source *srcs)
{
	const uint32_t order = flags & 0x03;
	int n = 0;

	if (order == GIT_ATTR_CHECK_FILE_THEN_INDEX) {
		if (has_wd)
			srcs[n++] = GIT_ATTR_FILE_FROM_FILE;
		if (has_index)
			srcs[n++] = GIT_ATTR_FILE_FROM_INDEX;
	} else if (order == GIT_ATTR_CHECK_INDEX_THEN_FILE) {
		if (has_index)
			srcs[n++] = GIT_ATTR_FILE_FROM_INDEX;
		if (has_wd)
			srcs[n++] = GIT_ATTR_FILE_FROM_FILE;
	} else if (order == GIT_ATTR_CHECK_INDEX_ONLY) {
		if (has_index)
			srcs[n++] = GIT_ATTR_FILE_FROM_INDEX;
	}

	return n;
}

501 502
/* Directory-walk callback: push the GIT_ATTR_FILE found in directory `path`
 * from every source selected by the walk's flags.
 *
 * ref  - the attr_walk_up_info for this walk
 * path - directory currently being visited
 *
 * Stops at, and returns, the first non-zero result from
 * git_attr_cache__push_file(); returns 0 otherwise.
 */
static int push_one_attr(void *ref, git_buf *path)
{
	attr_walk_up_info *walk = (attr_walk_up_info *)ref;
	git_attr_file_source sources[2];
	int count, idx;

	count = git_attr_cache__decide_sources(
		walk->flags, walk->workdir != NULL, walk->index != NULL, sources);

	for (idx = 0; idx < count; ++idx) {
		int status = git_attr_cache__push_file(
			walk->repo, path->ptr, GIT_ATTR_FILE, sources[idx],
			git_attr_file__parse_buffer, NULL, walk->files);

		if (status)
			return status;
	}

	return 0;
}

518
static int collect_attr_files(
519 520 521 522
	git_repository *repo,
	uint32_t flags,
	const char *path,
	git_vector *files)
523
{
524
	int error;
525 526
	git_buf dir = GIT_BUF_INIT;
	const char *workdir = git_repository_workdir(repo);
527
	attr_walk_up_info info;
528

529 530 531
	if (git_attr_cache__init(repo) < 0 ||
		git_vector_init(files, 4, NULL) < 0)
		return -1;
532

533 534
	/* Resolve path in a non-bare repo */
	if (workdir != NULL)
535 536
		error = git_path_find_dir(&dir, path, workdir);
	else
537
		error = git_path_dirname_r(&dir, path);
538
	if (error < 0)
539 540 541 542 543 544 545 546 547
		goto cleanup;

	/* in precendence order highest to lowest:
	 * - $GIT_DIR/info/attributes
	 * - path components with .gitattributes
	 * - config core.attributesfile
	 * - $GIT_PREFIX/etc/gitattributes
	 */

548
	error = push_attr_file(
549
		repo, files, git_repository_path(repo), GIT_ATTR_FILE_INREPO);
550
	if (error < 0)
551 552
		goto cleanup;

553 554 555 556 557
	info.repo  = repo;
	info.flags = flags;
	info.workdir = workdir;
	if (git_repository_index__weakptr(&info.index, repo) < 0)
		giterr_clear(); /* no error even if there is no index */
558
	info.files = files;
559

560
	error = git_path_walk_up(&dir, workdir, push_one_attr, &info);
561
	if (error < 0)
562 563
		goto cleanup;

564
	if (git_repository_attr_cache(repo)->cfg_attr_file != NULL) {
565
		error = push_attr_file(
566 567 568
			repo, files, NULL, git_repository_attr_cache(repo)->cfg_attr_file);
		if (error < 0)
			goto cleanup;
569 570
	}

571 572 573 574
	if ((flags & GIT_ATTR_CHECK_NO_SYSTEM) == 0) {
		error = git_futils_find_system_file(&dir, GIT_ATTR_FILE_SYSTEM);
		if (!error)
			error = push_attr_file(repo, files, NULL, dir.ptr);
575
		else if (error == GIT_ENOTFOUND)
576 577
			error = 0;
	}
578 579

 cleanup:
580
	if (error < 0)
581 582 583 584 585 586
		git_vector_free(files);
	git_buf_free(&dir);

	return error;
}

587 588 589 590 591 592 593 594 595 596 597 598
/* Look for `relpath` via git_futils_find_global_file().
 *
 * Returns the detached path buffer when the lookup reports success (0),
 * or NULL otherwise.
 */
static char *try_global_default(const char *relpath)
{
	git_buf found = GIT_BUF_INIT;
	char *result;

	if (git_futils_find_global_file(&found, relpath) == 0)
		result = git_buf_detach(&found);
	else
		result = NULL;

	git_buf_free(&found);
	return result;
}
599

600
/* Prepare the repository's attribute cache on first use.
 *
 * Reads the attribute and ignore file settings from config (falling back
 * to the global default locations when a setting is not found), allocates
 * the file and macro maps and the string pool, marks the cache as
 * initialized, and registers the built-in "binary" macro.
 *
 * Returns 0 right away if the cache is already initialized, a negative
 * value on failure, otherwise the result of adding the "binary" macro.
 */
int git_attr_cache__init(git_repository *repo)
{
	git_attr_cache *cache = git_repository_attr_cache(repo);
	git_config *cfg;
	int rc;

	if (cache->initialized)
		return 0;

	/* cache config settings for attributes and ignores */
	if (git_repository_config__weakptr(&cfg, repo) < 0)
		return -1;

	rc = git_config_get_string(&cache->cfg_attr_file, cfg, GIT_ATTR_CONFIG);
	if (rc == GIT_ENOTFOUND)
		cache->cfg_attr_file = try_global_default(GIT_ATTR_CONFIG_DEFAULT);
	else if (rc < 0)
		return rc;

	rc = git_config_get_string(&cache->cfg_excl_file, cfg, GIT_IGNORE_CONFIG);
	if (rc == GIT_ENOTFOUND)
		cache->cfg_excl_file = try_global_default(GIT_IGNORE_CONFIG_DEFAULT);
	else if (rc < 0)
		return rc;

	giterr_clear();

	/* allocate hashtable for attribute and ignore file contents */
	if (!cache->files) {
		cache->files = git_strmap_alloc();
		GITERR_CHECK_ALLOC(cache->files);
	}

	/* allocate hashtable for attribute macros */
	if (!cache->macros) {
		cache->macros = git_strmap_alloc();
		GITERR_CHECK_ALLOC(cache->macros);
	}

	/* allocate string pool */
	if (git_pool_init(&cache->pool, 1, 0) < 0)
		return -1;

	/* flag is set before adding the macro: git_attr_add_macro() calls
	 * back into this function
	 */
	cache->initialized = 1;

	/* insert default macros */
	return git_attr_add_macro(repo, "binary", "-diff -crlf -text");
}

/* Release everything held by the repository's attribute cache: every
 * cached attribute file, every macro rule, both maps, and the string pool.
 * Afterwards the cache is marked uninitialized.  A NULL `repo` is ignored.
 */
void git_attr_cache_flush(
	git_repository *repo)
{
	git_attr_cache *cache;

	if (repo == NULL)
		return;

	cache = git_repository_attr_cache(repo);

	if (cache->files) {
		git_attr_file *cached_file;

		git_strmap_foreach_value(cache->files, cached_file, {
			git_attr_file__free(cached_file);
		});

		git_strmap_free(cache->files);
	}

	if (cache->macros) {
		git_attr_rule *macro_rule;

		git_strmap_foreach_value(cache->macros, macro_rule, {
			git_attr_rule__free(macro_rule);
		});

		git_strmap_free(cache->macros);
	}

	git_pool_clear(&cache->pool);

	cache->initialized = 0;
}
683 684 685

/* Register a macro rule in the cache's macro map, keyed by its pattern.
 *
 * A macro with no assignments is not inserted and 0 is returned.
 * Returns 0 on success and -1 if the map insertion reports a negative
 * status.
 */
int git_attr_cache__insert_macro(git_repository *repo, git_attr_rule *macro)
{
	git_strmap *macros = git_repository_attr_cache(repo)->macros;
	int status;

	/* TODO: generate warning log if (macro->assigns.length == 0) */
	if (macro->assigns.length == 0)
		return 0;

	git_strmap_insert(macros, macro->match.pattern, macro, status);

	if (status < 0)
		return -1;

	return 0;
}
696 697 698 699

/* Find a macro rule by name in the cache's macro map.
 *
 * Returns the stored rule, or NULL when no entry exists for `name`.
 */
git_attr_rule *git_attr_cache__lookup_macro(
	git_repository *repo, const char *name)
{
	git_strmap *macros = git_repository_attr_cache(repo)->macros;
	khiter_t idx = git_strmap_lookup_index(macros, name);

	if (git_strmap_valid_index(macros, idx))
		return (git_attr_rule *)git_strmap_value_at(macros, idx);

	return NULL;
}