Commit 0e0589fc by Edward Thomson

iterator: combine fs+workdir iterators more completely

Drop some of the layers of indirection between the workdir and the
filesystem iterators.  This makes the code a little bit easier to
follow, and reduces the number of unnecessary allocations a bit as
well.  (Prior to this, when we filter entries, we would allocate them,
filter them and then free them; now we do the filtering before
allocation.)

Also, rename `git_iterator_advance_over_with_status` to just
`git_iterator_advance_over`.  Mostly because it's a fucking long-ass
function name otherwise.
parent d051de24
...@@ -394,7 +394,7 @@ static int checkout_action_wd_only( ...@@ -394,7 +394,7 @@ static int checkout_action_wd_only(
git_buf_sets(&data->tmp, wd->path); git_buf_sets(&data->tmp, wd->path);
saved_wd.path = data->tmp.ptr; saved_wd.path = data->tmp.ptr;
error = git_iterator_advance_over_with_status( error = git_iterator_advance_over(
wditem, &untracked_state, workdir); wditem, &untracked_state, workdir);
if (error == GIT_ITEROVER) if (error == GIT_ITEROVER)
over = true; over = true;
...@@ -930,7 +930,7 @@ static int checkout_conflicts_load(checkout_data *data, git_iterator *workdir, g ...@@ -930,7 +930,7 @@ static int checkout_conflicts_load(checkout_data *data, git_iterator *workdir, g
git_index *index; git_index *index;
/* Only write conficts from sources that have them: indexes. */ /* Only write conficts from sources that have them: indexes. */
if ((index = git_iterator_get_index(data->target)) == NULL) if ((index = git_iterator_index(data->target)) == NULL)
return 0; return 0;
data->update_conflicts._cmp = checkout_conflictdata_cmp; data->update_conflicts._cmp = checkout_conflictdata_cmp;
...@@ -1080,7 +1080,7 @@ static int checkout_conflicts_coalesce_renames( ...@@ -1080,7 +1080,7 @@ static int checkout_conflicts_coalesce_renames(
size_t i, names; size_t i, names;
int error = 0; int error = 0;
if ((index = git_iterator_get_index(data->target)) == NULL) if ((index = git_iterator_index(data->target)) == NULL)
return 0; return 0;
/* Juggle entries based on renames */ /* Juggle entries based on renames */
...@@ -1138,7 +1138,7 @@ static int checkout_conflicts_mark_directoryfile( ...@@ -1138,7 +1138,7 @@ static int checkout_conflicts_mark_directoryfile(
const char *path; const char *path;
int prefixed, error = 0; int prefixed, error = 0;
if ((index = git_iterator_get_index(data->target)) == NULL) if ((index = git_iterator_index(data->target)) == NULL)
return 0; return 0;
len = git_index_entrycount(index); len = git_index_entrycount(index);
...@@ -2378,7 +2378,7 @@ static int checkout_data_init( ...@@ -2378,7 +2378,7 @@ static int checkout_data_init(
if ((error = git_repository_index(&data->index, data->repo)) < 0) if ((error = git_repository_index(&data->index, data->repo)) < 0)
goto cleanup; goto cleanup;
if (data->index != git_iterator_get_index(target)) { if (data->index != git_iterator_index(target)) {
if ((error = git_index_read(data->index, true)) < 0) if ((error = git_index_read(data->index, true)) < 0)
goto cleanup; goto cleanup;
...@@ -2600,7 +2600,7 @@ int git_checkout_iterator( ...@@ -2600,7 +2600,7 @@ int git_checkout_iterator(
(error = checkout_create_conflicts(&data)) < 0) (error = checkout_create_conflicts(&data)) < 0)
goto cleanup; goto cleanup;
if (data.index != git_iterator_get_index(target) && if (data.index != git_iterator_index(target) &&
(error = checkout_extensions_update_index(&data)) < 0) (error = checkout_extensions_update_index(&data)) < 0)
goto cleanup; goto cleanup;
......
...@@ -826,8 +826,7 @@ static int maybe_modified( ...@@ -826,8 +826,7 @@ static int maybe_modified(
*/ */
} else if (git_oid_iszero(&nitem->id) && new_is_workdir) { } else if (git_oid_iszero(&nitem->id) && new_is_workdir) {
bool use_ctime = ((diff->diffcaps & GIT_DIFFCAPS_TRUST_CTIME) != 0); bool use_ctime = ((diff->diffcaps & GIT_DIFFCAPS_TRUST_CTIME) != 0);
git_index *index; git_index *index = git_iterator_index(info->new_iter);
git_iterator_index(&index, info->new_iter);
status = GIT_DELTA_UNMODIFIED; status = GIT_DELTA_UNMODIFIED;
...@@ -980,15 +979,14 @@ static int iterator_advance_into( ...@@ -980,15 +979,14 @@ static int iterator_advance_into(
return error; return error;
} }
static int iterator_advance_over_with_status( static int iterator_advance_over(
const git_index_entry **entry, const git_index_entry **entry,
git_iterator_status_t *status, git_iterator_status_t *status,
git_iterator *iterator) git_iterator *iterator)
{ {
int error; int error = git_iterator_advance_over(entry, status, iterator);
if ((error = git_iterator_advance_over_with_status( if (error == GIT_ITEROVER) {
entry, status, iterator)) == GIT_ITEROVER) {
*entry = NULL; *entry = NULL;
error = 0; error = 0;
} }
...@@ -1056,7 +1054,7 @@ static int handle_unmatched_new_item( ...@@ -1056,7 +1054,7 @@ static int handle_unmatched_new_item(
return iterator_advance(&info->nitem, info->new_iter); return iterator_advance(&info->nitem, info->new_iter);
/* iterate into dir looking for an actual untracked file */ /* iterate into dir looking for an actual untracked file */
if ((error = iterator_advance_over_with_status( if ((error = iterator_advance_over(
&info->nitem, &untracked_state, info->new_iter)) < 0) &info->nitem, &untracked_state, info->new_iter)) < 0)
return error; return error;
......
...@@ -49,15 +49,19 @@ ...@@ -49,15 +49,19 @@
git__free(P); return -1; } \ git__free(P); return -1; } \
} while (0) } while (0)
#define GIT_ITERATOR_FIRST_ACCESS (1 << 15)
#define GIT_ITERATOR_HONOR_IGNORES (1 << 16)
#define GIT_ITERATOR_IGNORE_DOT_GIT (1 << 17)
#define iterator__flag(I,F) ((((git_iterator *)(I))->flags & GIT_ITERATOR_ ## F) != 0) #define iterator__flag(I,F) ((((git_iterator *)(I))->flags & GIT_ITERATOR_ ## F) != 0)
#define iterator__ignore_case(I) iterator__flag(I,IGNORE_CASE) #define iterator__ignore_case(I) iterator__flag(I,IGNORE_CASE)
#define iterator__include_trees(I) iterator__flag(I,INCLUDE_TREES) #define iterator__include_trees(I) iterator__flag(I,INCLUDE_TREES)
#define iterator__dont_autoexpand(I) iterator__flag(I,DONT_AUTOEXPAND) #define iterator__dont_autoexpand(I) iterator__flag(I,DONT_AUTOEXPAND)
#define iterator__do_autoexpand(I) !iterator__flag(I,DONT_AUTOEXPAND) #define iterator__do_autoexpand(I) !iterator__flag(I,DONT_AUTOEXPAND)
#define iterator__include_conflicts(I) iterator__flag(I, INCLUDE_CONFLICTS) #define iterator__include_conflicts(I) iterator__flag(I,INCLUDE_CONFLICTS)
#define GIT_ITERATOR_FIRST_ACCESS (1 << 15)
#define iterator__has_been_accessed(I) iterator__flag(I,FIRST_ACCESS) #define iterator__has_been_accessed(I) iterator__flag(I,FIRST_ACCESS)
#define iterator__honor_ignores(I) iterator__flag(I,HONOR_IGNORES)
#define iterator__ignore_dot_git(I) iterator__flag(I,IGNORE_DOT_GIT)
#define iterator__end(I) ((git_iterator *)(I))->end #define iterator__end(I) ((git_iterator *)(I))->end
#define iterator__past_end(I,PATH) \ #define iterator__past_end(I,PATH) \
...@@ -221,6 +225,29 @@ static int iterator__reset_range( ...@@ -221,6 +225,29 @@ static int iterator__reset_range(
return 0; return 0;
} }
int git_iterator_set_ignore_case(git_iterator *iter, bool ignore_case)
{
if (ignore_case) {
iter->flags = (iter->flags | GIT_ITERATOR_IGNORE_CASE);
iter->strcomp = git__strcasecmp;
iter->strncomp = git__strncasecmp;
iter->prefixcomp = git__prefixcmp_icase;
iter->entry_srch = git_index_entry_isrch;
} else {
iter->flags = (iter->flags & ~GIT_ITERATOR_IGNORE_CASE);
iter->strcomp = git__strcmp;
iter->strncomp = git__strncmp;
iter->prefixcomp = git__prefixcmp;
iter->entry_srch = git_index_entry_srch;
}
iterator_pathlist__update_ignore_case(iter);
return 0;
}
static int iterator__update_ignore_case( static int iterator__update_ignore_case(
git_iterator *iter, git_iterator *iter,
git_iterator_flag_t flags) git_iterator_flag_t flags)
...@@ -241,23 +268,7 @@ static int iterator__update_ignore_case( ...@@ -241,23 +268,7 @@ static int iterator__update_ignore_case(
ignore_case = (index->ignore_case == 1); ignore_case = (index->ignore_case == 1);
} }
if (ignore_case) { return git_iterator_set_ignore_case(iter, ignore_case);
iter->flags = (iter->flags | GIT_ITERATOR_IGNORE_CASE);
iter->strcomp = git__strcasecmp;
iter->strncomp = git__strncasecmp;
iter->prefixcomp = git__prefixcmp_icase;
} else {
iter->flags = (iter->flags & ~GIT_ITERATOR_IGNORE_CASE);
iter->strcomp = git__strcmp;
iter->strncomp = git__strncmp;
iter->prefixcomp = git__prefixcmp;
}
iterator_pathlist__update_ignore_case(iter);
return 0;
} }
GIT_INLINE(void) iterator__clear_entry(const git_index_entry **entry) GIT_INLINE(void) iterator__clear_entry(const git_index_entry **entry)
...@@ -269,14 +280,18 @@ GIT_INLINE(void) iterator__clear_entry(const git_index_entry **entry) ...@@ -269,14 +280,18 @@ GIT_INLINE(void) iterator__clear_entry(const git_index_entry **entry)
static int iterator_range_init( static int iterator_range_init(
git_iterator *iter, const char *start, const char *end) git_iterator *iter, const char *start, const char *end)
{ {
if (start) { if (start && *start) {
iter->start = git__strdup(start); iter->start = git__strdup(start);
GITERR_CHECK_ALLOC(iter->start); GITERR_CHECK_ALLOC(iter->start);
iter->start_len = strlen(iter->start);
} }
if (end) { if (end && *end) {
iter->end = git__strdup(end); iter->end = git__strdup(end);
GITERR_CHECK_ALLOC(iter->end); GITERR_CHECK_ALLOC(iter->end);
iter->end_len = strlen(iter->end);
} }
iter->started = (iter->start == NULL); iter->started = (iter->start == NULL);
...@@ -290,11 +305,13 @@ static void iterator_range_free(git_iterator *iter) ...@@ -290,11 +305,13 @@ static void iterator_range_free(git_iterator *iter)
if (iter->start) { if (iter->start) {
git__free(iter->start); git__free(iter->start);
iter->start = NULL; iter->start = NULL;
iter->start_len = 0;
} }
if (iter->end) { if (iter->end) {
git__free(iter->end); git__free(iter->end);
iter->end = NULL; iter->end = NULL;
iter->end_len = 0;
} }
} }
...@@ -333,10 +350,9 @@ static int iterator_init_common( ...@@ -333,10 +350,9 @@ static int iterator_init_common(
static git_iterator_options default_opts = GIT_ITERATOR_OPTIONS_INIT; static git_iterator_options default_opts = GIT_ITERATOR_OPTIONS_INIT;
git_iterator_options *options = given_opts ? given_opts : &default_opts; git_iterator_options *options = given_opts ? given_opts : &default_opts;
bool ignore_case; bool ignore_case;
int precompose;
int error; int error;
assert(repo);
iter->repo = repo; iter->repo = repo;
iter->flags = options->flags; iter->flags = options->flags;
...@@ -344,7 +360,7 @@ static int iterator_init_common( ...@@ -344,7 +360,7 @@ static int iterator_init_common(
ignore_case = true; ignore_case = true;
} else if ((iter->flags & GIT_ITERATOR_DONT_IGNORE_CASE) != 0) { } else if ((iter->flags & GIT_ITERATOR_DONT_IGNORE_CASE) != 0) {
ignore_case = false; ignore_case = false;
} else { } else if (repo) {
git_index *index; git_index *index;
if ((error = git_repository_index__weakptr(&index, iter->repo)) < 0) if ((error = git_repository_index__weakptr(&index, iter->repo)) < 0)
...@@ -356,6 +372,19 @@ static int iterator_init_common( ...@@ -356,6 +372,19 @@ static int iterator_init_common(
iter->flags |= GIT_ITERATOR_IGNORE_CASE; iter->flags |= GIT_ITERATOR_IGNORE_CASE;
else else
iter->flags |= GIT_ITERATOR_DONT_IGNORE_CASE; iter->flags |= GIT_ITERATOR_DONT_IGNORE_CASE;
} else {
ignore_case = false;
}
/* try to look up precompose and set flag if appropriate */
if (repo &&
(iter->flags & GIT_ITERATOR_PRECOMPOSE_UNICODE) == 0 &&
(iter->flags & GIT_ITERATOR_DONT_PRECOMPOSE_UNICODE) == 0) {
if (git_repository__cvar(&precompose, repo, GIT_CVAR_PRECOMPOSE) < 0)
giterr_clear();
else if (precompose)
iter->flags |= GIT_ITERATOR_PRECOMPOSE_UNICODE;
} }
if ((iter->flags & GIT_ITERATOR_DONT_AUTOEXPAND)) if ((iter->flags & GIT_ITERATOR_DONT_AUTOEXPAND))
...@@ -364,6 +393,7 @@ static int iterator_init_common( ...@@ -364,6 +393,7 @@ static int iterator_init_common(
iter->strcomp = ignore_case ? git__strcasecmp : git__strcmp; iter->strcomp = ignore_case ? git__strcasecmp : git__strcmp;
iter->strncomp = ignore_case ? git__strncasecmp : git__strncmp; iter->strncomp = ignore_case ? git__strncasecmp : git__strncmp;
iter->prefixcomp = ignore_case ? git__prefixcmp_icase : git__prefixcmp; iter->prefixcomp = ignore_case ? git__prefixcmp_icase : git__prefixcmp;
iter->entry_srch = ignore_case ? git_index_entry_srch : git_index_entry_isrch;
if ((error = iterator_range_init(iter, options->start, options->end)) < 0 || if ((error = iterator_range_init(iter, options->start, options->end)) < 0 ||
(error = iterator_pathlist_init(iter, &options->pathlist)) < 0) (error = iterator_pathlist_init(iter, &options->pathlist)) < 0)
...@@ -376,6 +406,7 @@ static void iterator_clear(git_iterator *iter) ...@@ -376,6 +406,7 @@ static void iterator_clear(git_iterator *iter)
{ {
iter->started = false; iter->started = false;
iter->ended = false; iter->ended = false;
iter->stat_calls = 0;
iter->pathlist_walk_idx = 0; iter->pathlist_walk_idx = 0;
iter->flags &= ~GIT_ITERATOR_FIRST_ACCESS; iter->flags &= ~GIT_ITERATOR_FIRST_ACCESS;
} }
...@@ -416,7 +447,7 @@ GIT_INLINE(bool) iterator_has_ended(git_iterator *iter, const char *path) ...@@ -416,7 +447,7 @@ GIT_INLINE(bool) iterator_has_ended(git_iterator *iter, const char *path)
/* walker for the index iterator that allows it to walk the sorted pathlist /* walker for the index iterator that allows it to walk the sorted pathlist
* entries alongside sorted iterator entries. * entries alongside sorted iterator entries.
*/ */
static bool iterator_pathlist_contains(git_iterator *iter, const char *path) static bool iterator_pathlist_next_is(git_iterator *iter, const char *path)
{ {
char *p; char *p;
size_t path_len, p_len, cmp_len, i; size_t path_len, p_len, cmp_len, i;
...@@ -483,6 +514,62 @@ static bool iterator_pathlist_contains(git_iterator *iter, const char *path) ...@@ -483,6 +514,62 @@ static bool iterator_pathlist_contains(git_iterator *iter, const char *path)
return false; return false;
} }
typedef enum {
ITERATOR_PATHLIST_NOT_FOUND = 0,
ITERATOR_PATHLIST_IS_FILE = 1,
ITERATOR_PATHLIST_IS_DIR = 2,
ITERATOR_PATHLIST_IS_PARENT = 3,
ITERATOR_PATHLIST_FULL = 4,
} iterator_pathlist_search_t;
static iterator_pathlist_search_t iterator_pathlist_search(
git_iterator *iter, const char *path, size_t path_len)
{
const char *p;
size_t idx;
int error;
error = git_vector_bsearch2(&idx, &iter->pathlist,
(git_vector_cmp)iter->strcomp, path);
/* the given path was found in the pathlist. since the pathlist only
* matches directories when they're suffixed with a '/', analyze the
* path string to determine whether it's a directory or not.
*/
if (error == 0) {
if (path_len && path[path_len-1] == '/')
return ITERATOR_PATHLIST_IS_DIR;
return ITERATOR_PATHLIST_IS_FILE;
}
/* at this point, the path we're examining may be a directory (though we
* don't know that yet, since we're avoiding a stat unless it's necessary)
* so walk the pathlist looking for the given path with a '/' after it,
*/
while ((p = git_vector_get(&iter->pathlist, idx)) != NULL) {
if (iter->prefixcomp(p, path) != 0)
break;
/* an exact match would have been matched by the bsearch above */
assert(p[path_len]);
/* is this a literal directory entry (eg `foo/`) or a file beneath */
if (p[path_len] == '/') {
return (p[path_len+1] == '\0') ?
ITERATOR_PATHLIST_IS_DIR :
ITERATOR_PATHLIST_IS_PARENT;
}
if (p[path_len] > '/')
break;
idx++;
}
return ITERATOR_PATHLIST_NOT_FOUND;
}
/* Empty iterator */ /* Empty iterator */
static int empty_iterator__noop(const git_index_entry **e, git_iterator *i) static int empty_iterator__noop(const git_index_entry **e, git_iterator *i)
...@@ -684,8 +771,6 @@ static int tree_iterator_frame_init( ...@@ -684,8 +771,6 @@ static int tree_iterator_frame_init(
memset(new_frame, 0x0, sizeof(tree_iterator_frame)); memset(new_frame, 0x0, sizeof(tree_iterator_frame));
new_frame->tree = dup; new_frame->tree = dup;
if (frame_entry && if (frame_entry &&
(error = tree_iterator_compute_path(&new_frame->path, frame_entry)) < 0) (error = tree_iterator_compute_path(&new_frame->path, frame_entry)) < 0)
goto done; goto done;
...@@ -911,7 +996,7 @@ static int tree_iterator_advance(const git_index_entry **out, git_iterator *i) ...@@ -911,7 +996,7 @@ static int tree_iterator_advance(const git_index_entry **out, git_iterator *i)
} }
/* if we have a list of paths we're interested in, examine it */ /* if we have a list of paths we're interested in, examine it */
if (!iterator_pathlist_contains(&iter->base, iter->entry_path.ptr)) if (!iterator_pathlist_next_is(&iter->base, iter->entry_path.ptr))
continue; continue;
is_tree = git_tree_entry__is_tree(entry->tree_entry); is_tree = git_tree_entry__is_tree(entry->tree_entry);
...@@ -1058,6 +1143,7 @@ int git_iterator_for_tree( ...@@ -1058,6 +1143,7 @@ int git_iterator_for_tree(
tree_iterator_current, tree_iterator_current,
tree_iterator_advance, tree_iterator_advance,
tree_iterator_advance_into, tree_iterator_advance_into,
NULL, /* advance_over */
tree_iterator_reset, tree_iterator_reset,
tree_iterator_reset_range, tree_iterator_reset_range,
tree_iterator_at_end, tree_iterator_at_end,
...@@ -1124,975 +1210,913 @@ int git_iterator_current_parent_tree( ...@@ -1124,975 +1210,913 @@ int git_iterator_current_parent_tree(
return 0; return 0;
} }
/* Index iterator */ /* Filesystem iterator */
typedef struct {
struct stat st;
size_t path_len;
iterator_pathlist_search_t match;
char path[GIT_FLEX_ARRAY];
} filesystem_iterator_entry;
typedef struct {
git_vector entries;
git_pool entry_pool;
size_t next_idx;
size_t path_len;
int is_ignored;
} filesystem_iterator_frame;
typedef struct { typedef struct {
git_iterator base; git_iterator base;
git_iterator_callbacks cb; char *root;
size_t root_len;
unsigned int dirload_flags;
git_tree *tree;
git_index *index; git_index *index;
git_vector entries; git_vector index_snapshot;
git_vector_cmp entry_srch;
size_t current;
/* when limiting with a pathlist, this is the current index into it */
size_t pathlist_idx;
/* when not in autoexpand mode, use these to represent "tree" state */
git_buf partial;
size_t partial_pos;
char restore_terminator;
git_index_entry tree_entry;
} index_iterator;
static const git_index_entry *index_iterator__index_entry(index_iterator *ii) git_array_t(filesystem_iterator_frame) frames;
{ git_ignores ignores;
const git_index_entry *ie = git_vector_get(&ii->entries, ii->current);
if (ie != NULL && iterator__past_end(ii, ie->path)) { /* info about the current entry */
ii->current = git_vector_length(&ii->entries); git_index_entry entry;
ie = NULL; git_buf current_path;
} int current_is_ignored;
return ie; /* temporary buffer for advance_over */
git_buf tmp_buf;
} filesystem_iterator;
GIT_INLINE(filesystem_iterator_frame *) filesystem_iterator_parent_frame(
filesystem_iterator *iter)
{
return iter->frames.size > 1 ?
&iter->frames.ptr[iter->frames.size-2] : NULL;
} }
static const git_index_entry *index_iterator__advance_over_unwanted( GIT_INLINE(filesystem_iterator_frame *) filesystem_iterator_current_frame(
index_iterator *ii) filesystem_iterator *iter)
{ {
const git_index_entry *ie = index_iterator__index_entry(ii); return iter->frames.size ? &iter->frames.ptr[iter->frames.size-1] : NULL;
bool match; }
while (ie) { GIT_INLINE(filesystem_iterator_entry *) filesystem_iterator_current_entry(
if (!iterator__include_conflicts(ii) && filesystem_iterator_frame *frame)
git_index_entry_is_conflict(ie)) { {
ii->current++; return frame->next_idx == 0 ?
ie = index_iterator__index_entry(ii); NULL : frame->entries.contents[frame->next_idx-1];
continue; }
}
/* if we have a pathlist, this entry's path must be in it to be static int filesystem_iterator_entry_cmp(const void *_a, const void *_b)
* returned. walk the pathlist in unison with the index to {
* compare paths. const filesystem_iterator_entry *a = (const filesystem_iterator_entry *)_a;
*/ const filesystem_iterator_entry *b = (const filesystem_iterator_entry *)_b;
if (ii->base.pathlist.length) {
match = iterator_pathlist_walk__contains(&ii->base, ie->path);
if (!match) { return git__strcmp(a->path, b->path);
ii->current++; }
ie = index_iterator__index_entry(ii);
continue;
}
}
break; static int filesystem_iterator_entry_cmp_icase(const void *_a, const void *_b)
} {
const filesystem_iterator_entry *a = (const filesystem_iterator_entry *)_a;
const filesystem_iterator_entry *b = (const filesystem_iterator_entry *)_b;
return ie; return git__strcasecmp(a->path, b->path);
} }
static void index_iterator__next_prefix_tree(index_iterator *ii) #define FILESYSTEM_MAX_DEPTH 100
/**
* Figure out if an entry is a submodule.
*
* We consider it a submodule if the path is listed as a submodule in
* either the tree or the index.
*/
static int is_submodule(
bool *out, filesystem_iterator *iter, const char *path, size_t path_len)
{ {
const char *slash; bool is_submodule = false;
int error;
if (!iterator__include_trees(ii)) *out = false;
return;
slash = strchr(&ii->partial.ptr[ii->partial_pos], '/'); /* first see if this path is a submodule in HEAD */
if (iter->tree) {
git_tree_entry *entry;
if (slash != NULL) { error = git_tree_entry_bypath(&entry, iter->tree, path);
ii->partial_pos = (slash - ii->partial.ptr) + 1;
ii->restore_terminator = ii->partial.ptr[ii->partial_pos];
ii->partial.ptr[ii->partial_pos] = '\0';
} else {
ii->partial_pos = ii->partial.size;
}
if (index_iterator__index_entry(ii) == NULL) if (error < 0 && error != GIT_ENOTFOUND)
ii->partial_pos = ii->partial.size; return error;
}
static int index_iterator__first_prefix_tree(index_iterator *ii) if (!error) {
{ is_submodule = (entry->attr == GIT_FILEMODE_COMMIT);
const git_index_entry *ie = index_iterator__advance_over_unwanted(ii); git_tree_entry_free(entry);
const char *scan, *prior, *slash; }
}
if (!ie || !iterator__include_trees(ii)) if (!is_submodule && iter->index) {
return 0; size_t pos;
/* find longest common prefix with prior index entry */ error = git_index_snapshot_find(&pos,
for (scan = slash = ie->path, prior = ii->partial.ptr; &iter->index_snapshot, iter->base.entry_srch, path, path_len, 0);
*scan && *scan == *prior; ++scan, ++prior)
if (*scan == '/')
slash = scan;
if (git_buf_sets(&ii->partial, ie->path) < 0) if (error < 0 && error != GIT_ENOTFOUND)
return -1; return error;
ii->partial_pos = (slash - ie->path) + 1; if (!error) {
index_iterator__next_prefix_tree(ii); git_index_entry *e = git_vector_get(&iter->index_snapshot, pos);
is_submodule = (e->mode == GIT_FILEMODE_COMMIT);
}
}
*out = is_submodule;
return 0; return 0;
} }
#define index_iterator__at_tree(I) \ GIT_INLINE(git_dir_flag) filesystem_iterator_dir_flag(git_index_entry *entry)
(iterator__include_trees(I) && (I)->partial_pos < (I)->partial.size) {
#if defined(GIT_WIN32) && !defined(__MINGW32__)
return (entry && entry->mode) ?
(S_ISDIR(entry->mode) ? GIT_DIR_FLAG_TRUE : GIT_DIR_FLAG_FALSE) :
GIT_DIR_FLAG_UNKNOWN;
#else
GIT_UNUSED(entry);
return GIT_DIR_FLAG_UNKNOWN;
#endif
}
static int index_iterator__current( static void filesystem_iterator_frame_push_ignores(
const git_index_entry **entry, git_iterator *self) filesystem_iterator *iter,
filesystem_iterator_entry *frame_entry,
filesystem_iterator_frame *new_frame)
{ {
index_iterator *ii = (index_iterator *)self; filesystem_iterator_frame *previous_frame;
const git_index_entry *ie = git_vector_get(&ii->entries, ii->current); const char *path = frame_entry ? frame_entry->path : "";
if (ie != NULL && index_iterator__at_tree(ii)) { if (!iterator__honor_ignores(&iter->base))
ii->tree_entry.path = ii->partial.ptr; return;
ie = &ii->tree_entry;
if (git_ignore__lookup(&new_frame->is_ignored,
&iter->ignores, path, GIT_DIR_FLAG_TRUE) < 0) {
giterr_clear();
new_frame->is_ignored = GIT_IGNORE_NOTFOUND;
} }
if (entry) /* if this is not the top level directory... */
*entry = ie; if (frame_entry) {
const char *relative_path;
ii->base.flags |= GIT_ITERATOR_FIRST_ACCESS; previous_frame = filesystem_iterator_parent_frame(iter);
return (ie != NULL) ? 0 : GIT_ITEROVER; /* push new ignores for files in this directory */
relative_path = frame_entry->path + previous_frame->path_len;
/* inherit ignored from parent if no rule specified */
if (new_frame->is_ignored <= GIT_IGNORE_NOTFOUND)
new_frame->is_ignored = previous_frame->is_ignored;
git_ignore__push_dir(&iter->ignores, relative_path);
}
} }
static int index_iterator__at_end(git_iterator *self) static void filesystem_iterator_frame_pop_ignores(
filesystem_iterator *iter)
{ {
index_iterator *ii = (index_iterator *)self; if (iterator__honor_ignores(&iter->base))
return (ii->current >= git_vector_length(&ii->entries)); git_ignore__pop_dir(&iter->ignores);
} }
static int index_iterator__advance( GIT_INLINE(bool) filesystem_iterator_examine_path(
const git_index_entry **entry, git_iterator *self) bool *is_dir_out,
iterator_pathlist_search_t *match_out,
filesystem_iterator *iter,
filesystem_iterator_entry *frame_entry,
const char *path,
size_t path_len)
{ {
index_iterator *ii = (index_iterator *)self; bool is_dir = 0;
size_t entrycount = git_vector_length(&ii->entries); iterator_pathlist_search_t match = ITERATOR_PATHLIST_FULL;
const git_index_entry *ie;
if (!iterator__has_been_accessed(ii)) *is_dir_out = false;
return index_iterator__current(entry, self); *match_out = ITERATOR_PATHLIST_NOT_FOUND;
if (index_iterator__at_tree(ii)) { if (iter->base.start_len) {
if (iterator__do_autoexpand(ii)) { int cmp = iter->base.strncomp(path, iter->base.start, path_len);
ii->partial.ptr[ii->partial_pos] = ii->restore_terminator;
index_iterator__next_prefix_tree(ii);
} else {
/* advance to sibling tree (i.e. find entry with new prefix) */
while (ii->current < entrycount) {
ii->current++;
if (!(ie = git_vector_get(&ii->entries, ii->current)) || /* we haven't stat'ed `path` yet, so we don't yet know if it's a
ii->base.prefixcomp(ie->path, ii->partial.ptr) != 0) * directory or not. special case if the current path may be a
break; * directory that matches the start prefix.
} */
if (cmp == 0) {
if (iter->base.start[path_len] == '/')
is_dir = true;
if (index_iterator__first_prefix_tree(ii) < 0) else if (iter->base.start[path_len] != '\0')
return -1; cmp = -1;
} }
} else {
if (ii->current < entrycount)
ii->current++;
if (index_iterator__first_prefix_tree(ii) < 0) if (cmp < 0)
return -1; return false;
} }
return index_iterator__current(entry, self); if (iter->base.end_len) {
} int cmp = iter->base.strncomp(path, iter->base.end, iter->base.end_len);
static int index_iterator__advance_into(
const git_index_entry **entry, git_iterator *self)
{
index_iterator *ii = (index_iterator *)self;
const git_index_entry *ie = git_vector_get(&ii->entries, ii->current);
if (ie != NULL && index_iterator__at_tree(ii)) { if (cmp > 0)
if (ii->restore_terminator) return false;
ii->partial.ptr[ii->partial_pos] = ii->restore_terminator;
index_iterator__next_prefix_tree(ii);
} }
return index_iterator__current(entry, self); /* if we have a pathlist that we're limiting to, examine this path now
} * to avoid a `stat` if we're not interested in the path.
static int index_iterator__reset(git_iterator *self)
{
index_iterator *ii = (index_iterator *)self;
const git_index_entry *ie;
ii->current = 0;
ii->base.flags &= ~GIT_ITERATOR_FIRST_ACCESS;
iterator_pathlist_walk__reset(self);
/* if we're given a start prefix, find it; if we're given a pathlist, find
* the first of those. start at the later of the two.
*/ */
if (ii->base.start) if (iter->base.pathlist.length) {
git_index_snapshot_find( /* if our parent was explicitly included, so too are we */
&ii->current, &ii->entries, ii->entry_srch, ii->base.start, 0, 0); if (frame_entry && frame_entry->match != ITERATOR_PATHLIST_IS_PARENT)
match = ITERATOR_PATHLIST_FULL;
if ((ie = index_iterator__advance_over_unwanted(ii)) == NULL) else
return 0; match = iterator_pathlist_search(&iter->base, path, path_len);
if (git_buf_sets(&ii->partial, ie->path) < 0)
return -1;
ii->partial_pos = 0;
if (ii->base.start) { if (match == ITERATOR_PATHLIST_NOT_FOUND)
size_t startlen = strlen(ii->base.start); return false;
ii->partial_pos = (startlen > ii->partial.size) ? /* Ensure that the pathlist entry lines up with what we expected */
ii->partial.size : startlen; if (match == ITERATOR_PATHLIST_IS_DIR ||
match == ITERATOR_PATHLIST_IS_PARENT)
is_dir = true;
} }
index_iterator__next_prefix_tree(ii); *is_dir_out = is_dir;
*match_out = match;
return 0; return true;
}
static int index_iterator__reset_range(
git_iterator *self, const char *start, const char *end)
{
if (iterator__reset_range(self, start, end) < 0)
return -1;
return index_iterator__reset(self);
}
static void index_iterator__free(git_iterator *self)
{
index_iterator *ii = (index_iterator *)self;
git_index_snapshot_release(&ii->entries, ii->index);
ii->index = NULL;
git_buf_free(&ii->partial);
} }
int git_iterator_for_index( GIT_INLINE(bool) filesystem_iterator_is_dot_git(
git_iterator **iter, filesystem_iterator *iter, const char *path, size_t path_len)
git_repository *repo,
git_index *index,
git_iterator_options *options)
{ {
int error = 0; size_t len;
index_iterator *ii = git__calloc(1, sizeof(index_iterator));
GITERR_CHECK_ALLOC(ii);
if ((error = git_index_snapshot_new(&ii->entries, index)) < 0) {
git__free(ii);
return error;
}
ii->index = index;
ITERATOR_BASE_INIT(ii, index, INDEX, repo);
if ((error = iterator__update_ignore_case((git_iterator *)ii, options ? options->flags : 0)) < 0) {
git_iterator_free((git_iterator *)ii);
return error;
}
ii->entry_srch = iterator__ignore_case(ii) ? if (!iterator__ignore_dot_git(&iter->base))
git_index_entry_isrch : git_index_entry_srch; return false;
git_vector_set_cmp(&ii->entries, iterator__ignore_case(ii) ? if ((len = path_len) < 4)
git_index_entry_icmp : git_index_entry_cmp); return false;
git_vector_sort(&ii->entries);
git_buf_init(&ii->partial, 0); if (path[len - 1] == '/')
ii->tree_entry.mode = GIT_FILEMODE_TREE; len--;
index_iterator__reset((git_iterator *)ii); if (git__tolower(path[len - 1]) != 't' ||
git__tolower(path[len - 2]) != 'i' ||
git__tolower(path[len - 3]) != 'g' ||
git__tolower(path[len - 4]) != '.')
return false;
*iter = (git_iterator *)ii; return (len == 4 || path[len - 5] == '/');
return 0;
} }
static filesystem_iterator_entry *filesystem_iterator_entry_init(
typedef struct fs_iterator_frame fs_iterator_frame; filesystem_iterator_frame *frame,
struct fs_iterator_frame { const char *path,
fs_iterator_frame *next; size_t path_len,
git_vector entries; struct stat *statbuf,
size_t index; iterator_pathlist_search_t pathlist_match)
int is_ignored;
};
typedef struct fs_iterator fs_iterator;
struct fs_iterator {
git_iterator base;
git_iterator_callbacks cb;
fs_iterator_frame *stack;
git_index_entry entry;
git_buf path;
size_t root_len;
uint32_t dirload_flags;
int depth;
iterator_pathlist__match_t pathlist_match;
int (*enter_dir_cb)(fs_iterator *self);
int (*leave_dir_cb)(fs_iterator *self);
int (*update_entry_cb)(fs_iterator *self);
};
#define FS_MAX_DEPTH 100
typedef struct {
struct stat st;
iterator_pathlist__match_t pathlist_match;
size_t path_len;
char path[GIT_FLEX_ARRAY];
} fs_iterator_path_with_stat;
static int fs_iterator_path_with_stat_cmp(const void *a, const void *b)
{ {
const fs_iterator_path_with_stat *psa = a, *psb = b; filesystem_iterator_entry *entry;
return strcmp(psa->path, psb->path); size_t entry_size;
}
static int fs_iterator_path_with_stat_cmp_icase(const void *a, const void *b) /* Make sure to append two bytes, one for the path's null
{ * termination, one for a possible trailing '/' for folders.
const fs_iterator_path_with_stat *psa = a, *psb = b; */
return strcasecmp(psa->path, psb->path); if (GIT_ADD_SIZET_OVERFLOW(&entry_size,
} sizeof(filesystem_iterator_entry), path_len) ||
GIT_ADD_SIZET_OVERFLOW(&entry_size, entry_size, 2) ||
(entry = git_pool_malloc(&frame->entry_pool, entry_size)) == NULL)
return NULL;
static fs_iterator_frame *fs_iterator__alloc_frame(fs_iterator *fi) entry->path_len = path_len;
{ entry->match = pathlist_match;
fs_iterator_frame *ff = git__calloc(1, sizeof(fs_iterator_frame)); memcpy(entry->path, path, path_len);
git_vector_cmp entry_compare = CASESELECT( memcpy(&entry->st, statbuf, sizeof(struct stat));
iterator__ignore_case(fi),
fs_iterator_path_with_stat_cmp_icase,
fs_iterator_path_with_stat_cmp);
if (ff && git_vector_init(&ff->entries, 0, entry_compare) < 0) { /* Suffix directory paths with a '/' */
git__free(ff); if (S_ISDIR(entry->st.st_mode))
ff = NULL; entry->path[entry->path_len++] = '/';
}
return ff; entry->path[entry->path_len] = '\0';
}
static void fs_iterator__free_frame(fs_iterator_frame *ff) return entry;
{
git_vector_free_deep(&ff->entries);
git__free(ff);
} }
static void fs_iterator__pop_frame( static int filesystem_iterator_frame_push(
fs_iterator *fi, fs_iterator_frame *ff, bool pop_last) filesystem_iterator *iter,
filesystem_iterator_entry *frame_entry)
{ {
if (fi && fi->stack == ff) { filesystem_iterator_frame *new_frame = NULL;
if (!ff->next && !pop_last) { git_path_diriter diriter = GIT_PATH_DIRITER_INIT;
memset(&fi->entry, 0, sizeof(fi->entry)); git_buf root = GIT_BUF_INIT;
return; const char *path;
} filesystem_iterator_entry *entry;
struct stat statbuf;
if (fi->leave_dir_cb) size_t path_len;
(void)fi->leave_dir_cb(fi); int error;
fi->stack = ff->next; if (iter->frames.size == FILESYSTEM_MAX_DEPTH) {
fi->depth--; giterr_set(GITERR_REPOSITORY,
"directory nesting too deep (%d)", iter->frames.size);
return -1;
} }
fs_iterator__free_frame(ff); new_frame = git_array_alloc(iter->frames);
} GITERR_CHECK_ALLOC(new_frame);
static int fs_iterator__update_entry(fs_iterator *fi);
static int fs_iterator__advance_over(
const git_index_entry **entry, git_iterator *self);
static int fs_iterator__entry_cmp(const void *i, const void *item)
{
const fs_iterator *fi = (const fs_iterator *)i;
const fs_iterator_path_with_stat *ps = item;
return fi->base.prefixcomp(fi->base.start, ps->path);
}
static void fs_iterator__seek_frame_start( memset(new_frame, 0, sizeof(filesystem_iterator_frame));
fs_iterator *fi, fs_iterator_frame *ff)
{
if (!ff)
return;
if (fi->base.start) if (frame_entry)
git_vector_bsearch2( git_buf_joinpath(&root, iter->root, frame_entry->path);
&ff->index, &ff->entries, fs_iterator__entry_cmp, fi);
else else
ff->index = 0; git_buf_puts(&root, iter->root);
}
static int dirload_with_stat(git_vector *contents, fs_iterator *fi) if (git_buf_oom(&root)) {
{ error = -1;
git_path_diriter diriter = GIT_PATH_DIRITER_INIT; goto done;
const char *path; }
size_t start_len = fi->base.start ? strlen(fi->base.start) : 0;
size_t end_len = fi->base.end ? strlen(fi->base.end) : 0; new_frame->path_len = frame_entry ? frame_entry->path_len : 0;
fs_iterator_path_with_stat *ps;
size_t path_len, cmp_len, ps_size;
iterator_pathlist__match_t pathlist_match = ITERATOR_PATHLIST_MATCH;
int error;
/* Any error here is equivalent to the dir not existing, skip over it */ /* Any error here is equivalent to the dir not existing, skip over it */
if ((error = git_path_diriter_init( if ((error = git_path_diriter_init(
&diriter, fi->path.ptr, fi->dirload_flags)) < 0) { &diriter, root.ptr, iter->dirload_flags)) < 0) {
error = GIT_ENOTFOUND; error = GIT_ENOTFOUND;
goto done; goto done;
} }
if ((error = git_vector_init(&new_frame->entries, 64,
iterator__ignore_case(&iter->base) ?
filesystem_iterator_entry_cmp_icase :
filesystem_iterator_entry_cmp)) < 0)
goto done;
git_pool_init(&new_frame->entry_pool, 1);
/* check if this directory is ignored */
filesystem_iterator_frame_push_ignores(iter, frame_entry, new_frame);
while ((error = git_path_diriter_next(&diriter)) == 0) { while ((error = git_path_diriter_next(&diriter)) == 0) {
iterator_pathlist_search_t pathlist_match = ITERATOR_PATHLIST_FULL;
bool dir_expected = false;
if ((error = git_path_diriter_fullpath(&path, &path_len, &diriter)) < 0) if ((error = git_path_diriter_fullpath(&path, &path_len, &diriter)) < 0)
goto done; goto done;
assert(path_len > fi->root_len); assert(path_len > iter->root_len);
/* remove the prefix if requested */ /* remove the prefix if requested */
path += fi->root_len; path += iter->root_len;
path_len -= fi->root_len; path_len -= iter->root_len;
/* skip if before start_stat or after end_stat */
cmp_len = min(start_len, path_len);
if (cmp_len && fi->base.strncomp(path, fi->base.start, cmp_len) < 0)
continue;
/* skip if after end_stat */
cmp_len = min(end_len, path_len);
if (cmp_len && fi->base.strncomp(path, fi->base.end, cmp_len) > 0)
continue;
/* if we have a pathlist that we're limiting to, examine this path. /* examine start / end and the pathlist to see if this path is in it.
* if the frame has already deemed us inside the path (eg, we're in * note that since we haven't yet stat'ed the path, we cannot know
* `foo/bar` and the pathlist previously was detected to say `foo/`) * whether it's a directory yet or not, so this can give us an
* then simply continue. otherwise, examine the pathlist looking for * expected type (S_IFDIR or S_IFREG) that we should examine)
* this path or children of this path.
*/ */
if (fi->base.pathlist.length && if (!filesystem_iterator_examine_path(&dir_expected, &pathlist_match,
fi->pathlist_match != ITERATOR_PATHLIST_MATCH && iter, frame_entry, path, path_len))
fi->pathlist_match != ITERATOR_PATHLIST_MATCH_DIRECTORY &&
!(pathlist_match = iterator_pathlist__match(&fi->base, path, path_len)))
continue; continue;
/* Make sure to append two bytes, one for the path's null /* TODO: don't need to stat if assume unchanged for this path and
* termination, one for a possible trailing '/' for folders. * we have an index, we can just copy the data out of it.
*/ */
GITERR_CHECK_ALLOC_ADD(&ps_size, sizeof(fs_iterator_path_with_stat), path_len);
GITERR_CHECK_ALLOC_ADD(&ps_size, ps_size, 2);
ps = git__calloc(1, ps_size);
ps->path_len = path_len;
memcpy(ps->path, path, path_len);
/* TODO: don't stat if assume unchanged for this path */ if ((error = git_path_diriter_stat(&statbuf, &diriter)) < 0) {
if ((error = git_path_diriter_stat(&ps->st, &diriter)) < 0) {
if (error == GIT_ENOTFOUND) {
/* file was removed between readdir and lstat */ /* file was removed between readdir and lstat */
git__free(ps); if (error == GIT_ENOTFOUND)
continue; continue;
}
if (pathlist_match == ITERATOR_PATHLIST_MATCH_DIRECTORY) { /* treat the file as unreadable */
/* were looking for a directory, but this is a file */ memset(&statbuf, 0, sizeof(statbuf));
git__free(ps); statbuf.st_mode = GIT_FILEMODE_UNREADABLE;
continue;
error = 0;
} }
/* Treat the file as unreadable if we get any other error */ iter->base.stat_calls++;
memset(&ps->st, 0, sizeof(ps->st));
ps->st.st_mode = GIT_FILEMODE_UNREADABLE;
giterr_clear();
error = 0;
} else if (S_ISDIR(ps->st.st_mode)) {
/* Suffix directory paths with a '/' */
ps->path[ps->path_len++] = '/';
ps->path[ps->path_len] = '\0';
} else if(!S_ISREG(ps->st.st_mode) && !S_ISLNK(ps->st.st_mode)) {
/* Ignore wacky things in the filesystem */ /* Ignore wacky things in the filesystem */
git__free(ps); if (!S_ISDIR(statbuf.st_mode) &&
!S_ISREG(statbuf.st_mode) &&
!S_ISLNK(statbuf.st_mode) &&
statbuf.st_mode != GIT_FILEMODE_UNREADABLE)
continue; continue;
if (filesystem_iterator_is_dot_git(iter, path, path_len))
continue;
/* convert submodules to GITLINK and remove trailing slashes */
if (S_ISDIR(statbuf.st_mode)) {
bool submodule = false;
if ((error = is_submodule(&submodule, iter, path, path_len)) < 0)
goto done;
if (submodule)
statbuf.st_mode = GIT_FILEMODE_COMMIT;
} }
/* record whether this path was explicitly found in the path list /* Ensure that the pathlist entry lines up with what we expected */
* or whether we're only examining it because something beneath it if (dir_expected && !S_ISDIR(statbuf.st_mode))
* is in the path list. continue;
*/
ps->pathlist_match = pathlist_match; entry = filesystem_iterator_entry_init(new_frame,
git_vector_insert(contents, ps); path, path_len, &statbuf, pathlist_match);
GITERR_CHECK_ALLOC(entry);
git_vector_insert(&new_frame->entries, entry);
} }
if (error == GIT_ITEROVER) if (error == GIT_ITEROVER)
error = 0; error = 0;
/* sort now that directory suffix is added */ /* sort now that directory suffix is added */
git_vector_sort(contents); git_vector_sort(&new_frame->entries);
done: done:
if (error < 0)
git_array_pop(iter->frames);
git_buf_free(&root);
git_path_diriter_free(&diriter); git_path_diriter_free(&diriter);
return error; return error;
} }
GIT_INLINE(void) filesystem_iterator_frame_pop(filesystem_iterator *iter)
static int fs_iterator__expand_dir(fs_iterator *fi)
{ {
int error; filesystem_iterator_frame *frame;
fs_iterator_frame *ff;
if (fi->depth > FS_MAX_DEPTH) {
giterr_set(GITERR_REPOSITORY,
"Directory nesting is too deep (%d)", fi->depth);
return -1;
}
ff = fs_iterator__alloc_frame(fi);
GITERR_CHECK_ALLOC(ff);
error = dirload_with_stat(&ff->entries, fi); assert(iter->frames.size);
if (error < 0) {
git_error_state last_error = { 0 };
giterr_state_capture(&last_error, error);
/* these callbacks may clear the error message */ frame = git_array_pop(iter->frames);
fs_iterator__free_frame(ff); filesystem_iterator_frame_pop_ignores(iter);
fs_iterator__advance_over(NULL, (git_iterator *)fi);
/* next time return value we skipped to */
fi->base.flags &= ~GIT_ITERATOR_FIRST_ACCESS;
return giterr_state_restore(&last_error); git_pool_clear(&frame->entry_pool);
} git_vector_free(&frame->entries);
}
if (ff->entries.length == 0) { static void filesystem_iterator_set_current(
fs_iterator__free_frame(ff); filesystem_iterator *iter,
return GIT_ENOTFOUND; filesystem_iterator_entry *entry)
} {
fi->base.stat_calls += ff->entries.length; iter->entry.ctime.seconds = entry->st.st_ctime;
iter->entry.ctime.nanoseconds = entry->st.st_ctime_nsec;
fs_iterator__seek_frame_start(fi, ff); iter->entry.mtime.seconds = entry->st.st_mtime;
iter->entry.mtime.nanoseconds = entry->st.st_mtime_nsec;
ff->next = fi->stack; iter->entry.dev = entry->st.st_dev;
fi->stack = ff; iter->entry.ino = entry->st.st_ino;
fi->depth++; iter->entry.mode = git_futils_canonical_mode(entry->st.st_mode);
iter->entry.uid = entry->st.st_uid;
iter->entry.gid = entry->st.st_gid;
iter->entry.file_size = entry->st.st_size;
if (fi->enter_dir_cb && (error = fi->enter_dir_cb(fi)) < 0) iter->entry.path = entry->path;
return error;
return fs_iterator__update_entry(fi); iter->current_is_ignored = GIT_IGNORE_UNCHECKED;
} }
static int fs_iterator__current( static int filesystem_iterator_current(
const git_index_entry **entry, git_iterator *self) const git_index_entry **out, git_iterator *i)
{ {
fs_iterator *fi = (fs_iterator *)self; filesystem_iterator *iter = (filesystem_iterator *)i;
const git_index_entry *fe = (fi->entry.path == NULL) ? NULL : &fi->entry;
if (entry) if (!iterator__has_been_accessed(i))
*entry = fe; return iter->base.cb->advance(out, i);
fi->base.flags |= GIT_ITERATOR_FIRST_ACCESS;
return (fe != NULL) ? 0 : GIT_ITEROVER; if (!iter->frames.size) {
} *out = NULL;
return GIT_ITEROVER;
}
static int fs_iterator__at_end(git_iterator *self) *out = &iter->entry;
{ return 0;
return (((fs_iterator *)self)->entry.path == NULL);
} }
static int fs_iterator__advance_into( static int filesystem_iterator_advance(
const git_index_entry **entry, git_iterator *iter) const git_index_entry **out, git_iterator *i)
{ {
filesystem_iterator *iter = (filesystem_iterator *)i;
int error = 0; int error = 0;
fs_iterator *fi = (fs_iterator *)iter;
iterator__clear_entry(entry); iter->base.flags |= GIT_ITERATOR_FIRST_ACCESS;
/* Allow you to explicitly advance into a commit/submodule (as well as a /* examine filesystem entries until we find the next one to return */
* tree) to avoid cases where an entry is mislabeled as a submodule in while (true) {
* the working directory. The fs iterator will never have COMMMIT filesystem_iterator_frame *frame;
* entries on it's own, but a wrapper might add them. filesystem_iterator_entry *entry;
*/
if (fi->entry.path != NULL &&
(fi->entry.mode == GIT_FILEMODE_TREE ||
fi->entry.mode == GIT_FILEMODE_COMMIT))
/* returns GIT_ENOTFOUND if the directory is empty */
error = fs_iterator__expand_dir(fi);
if (!error && entry) if ((frame = filesystem_iterator_current_frame(iter)) == NULL) {
error = fs_iterator__current(entry, iter);
if (!error && !fi->entry.path)
error = GIT_ITEROVER; error = GIT_ITEROVER;
break;
}
return error; /* no more entries in this frame. pop the frame out */
} if (frame->next_idx == frame->entries.length) {
filesystem_iterator_frame_pop(iter);
continue;
}
static void fs_iterator__advance_over_internal(git_iterator *self) /* we have more entries in the current frame, that's our next entry */
{ entry = frame->entries.contents[frame->next_idx];
fs_iterator *fi = (fs_iterator *)self; frame->next_idx++;
fs_iterator_frame *ff;
fs_iterator_path_with_stat *next;
while (fi->entry.path != NULL) { if (S_ISDIR(entry->st.st_mode)) {
ff = fi->stack; if (iterator__do_autoexpand(iter)) {
next = git_vector_get(&ff->entries, ++ff->index); error = filesystem_iterator_frame_push(iter, entry);
if (next != NULL) /* may get GIT_ENOTFOUND due to races or permission problems
* that we want to quietly swallow
*/
if (error == GIT_ENOTFOUND)
continue;
else if (error < 0)
break; break;
}
if (!iterator__include_trees(iter))
continue;
}
fs_iterator__pop_frame(fi, ff, false); filesystem_iterator_set_current(iter, entry);
break;
} }
if (out)
*out = (error == 0) ? &iter->entry : NULL;
return error;
} }
static int fs_iterator__advance_over( static int filesystem_iterator_advance_into(
const git_index_entry **entry, git_iterator *self) const git_index_entry **out, git_iterator *i)
{ {
filesystem_iterator *iter = (filesystem_iterator *)i;
filesystem_iterator_frame *frame;
filesystem_iterator_entry *prev_entry;
int error; int error;
if (entry != NULL) if (out)
*entry = NULL; *out = NULL;
fs_iterator__advance_over_internal(self);
error = fs_iterator__update_entry((fs_iterator *)self);
if (!error && entry != NULL) if ((frame = filesystem_iterator_current_frame(iter)) == NULL)
error = fs_iterator__current(entry, self); return GIT_ITEROVER;
return error; /* get the last seen entry */
} prev_entry = filesystem_iterator_current_entry(frame);
static int fs_iterator__advance( /* it's legal to call advance_into when auto-expand is on. in this case,
const git_index_entry **entry, git_iterator *self) * we will have pushed a new (empty) frame on to the stack for this
{ * new directory. since it's empty, its current_entry should be null.
fs_iterator *fi = (fs_iterator *)self; */
assert(iterator__do_autoexpand(i) ^ (prev_entry != NULL));
if (!iterator__has_been_accessed(fi)) if (prev_entry) {
return fs_iterator__current(entry, self); if (prev_entry->st.st_mode != GIT_FILEMODE_COMMIT &&
!S_ISDIR(prev_entry->st.st_mode))
return 0;
/* given include_trees & autoexpand, we might have to go into a tree */ if ((error = filesystem_iterator_frame_push(iter, prev_entry)) < 0)
if (iterator__do_autoexpand(fi) &&
fi->entry.path != NULL &&
fi->entry.mode == GIT_FILEMODE_TREE)
{
int error = fs_iterator__advance_into(entry, self);
if (error != GIT_ENOTFOUND)
return error; return error;
/* continue silently past empty directories if autoexpanding */
giterr_clear();
} }
return fs_iterator__advance_over(entry, self); /* we've advanced into the directory in question, let advance
* find the first entry
*/
return filesystem_iterator_advance(out, i);
} }
static int fs_iterator__reset(git_iterator *self) int git_iterator_current_workdir_path(git_buf **out, git_iterator *i)
{ {
int error; filesystem_iterator *iter = (filesystem_iterator *)i;
fs_iterator *fi = (fs_iterator *)self; const git_index_entry *entry;
fi->base.flags &= ~GIT_ITERATOR_FIRST_ACCESS; if (i->type != GIT_ITERATOR_TYPE_FS &&
i->type != GIT_ITERATOR_TYPE_WORKDIR) {
*out = NULL;
return 0;
}
while (fi->stack != NULL && fi->stack->next != NULL) git_buf_truncate(&iter->current_path, iter->root_len);
fs_iterator__pop_frame(fi, fi->stack, false);
fi->depth = 0;
fs_iterator__seek_frame_start(fi, fi->stack); if (git_iterator_current(&entry, i) < 0 ||
git_buf_puts(&iter->current_path, entry->path) < 0)
return -1;
error = fs_iterator__update_entry(fi); *out = &iter->current_path;
if (error == GIT_ITEROVER) return 0;
error = 0; }
return error; GIT_INLINE(git_dir_flag) entry_dir_flag(git_index_entry *entry)
{
#if defined(GIT_WIN32) && !defined(__MINGW32__)
return (entry && entry->mode) ?
(S_ISDIR(entry->mode) ? GIT_DIR_FLAG_TRUE : GIT_DIR_FLAG_FALSE) :
GIT_DIR_FLAG_UNKNOWN;
#else
GIT_UNUSED(entry);
return GIT_DIR_FLAG_UNKNOWN;
#endif
} }
static int fs_iterator__reset_range( static void filesystem_iterator_update_ignored(filesystem_iterator *iter)
git_iterator *self, const char *start, const char *end)
{ {
int error; filesystem_iterator_frame *frame;
git_dir_flag dir_flag = entry_dir_flag(&iter->entry);
if ((error = iterator__reset_range(self, start, end)) < 0) if (git_ignore__lookup(&iter->current_is_ignored,
return error; &iter->ignores, iter->entry.path, dir_flag) < 0) {
giterr_clear();
iter->current_is_ignored = GIT_IGNORE_NOTFOUND;
}
return fs_iterator__reset(self); /* use ignore from containing frame stack */
if (iter->current_is_ignored <= GIT_IGNORE_NOTFOUND) {
frame = filesystem_iterator_current_frame(iter);
iter->current_is_ignored = frame->is_ignored;
}
} }
static void fs_iterator__free(git_iterator *self) GIT_INLINE(bool) filesystem_iterator_current_is_ignored(
filesystem_iterator *iter)
{ {
fs_iterator *fi = (fs_iterator *)self; if (iter->current_is_ignored == GIT_IGNORE_UNCHECKED)
filesystem_iterator_update_ignored(iter);
while (fi->stack != NULL)
fs_iterator__pop_frame(fi, fi->stack, true);
git_buf_free(&fi->path); return (iter->current_is_ignored == GIT_IGNORE_TRUE);
} }
static int fs_iterator__update_entry(fs_iterator *fi) bool git_iterator_current_is_ignored(git_iterator *i)
{ {
fs_iterator_path_with_stat *ps; if (i->type != GIT_ITERATOR_TYPE_WORKDIR)
return false;
while (true) {
memset(&fi->entry, 0, sizeof(fi->entry));
if (!fi->stack) return filesystem_iterator_current_is_ignored((filesystem_iterator *)i);
return GIT_ITEROVER; }
ps = git_vector_get(&fi->stack->entries, fi->stack->index); bool git_iterator_current_tree_is_ignored(git_iterator *i)
if (!ps) {
return GIT_ITEROVER; filesystem_iterator *iter = (filesystem_iterator *)i;
filesystem_iterator_frame *frame;
git_buf_truncate(&fi->path, fi->root_len); if (i->type != GIT_ITERATOR_TYPE_WORKDIR)
if (git_buf_put(&fi->path, ps->path, ps->path_len) < 0) return false;
return -1;
if (iterator__past_end(fi, fi->path.ptr + fi->root_len)) frame = filesystem_iterator_current_frame(iter);
return GIT_ITEROVER; return (frame->is_ignored == GIT_IGNORE_TRUE);
}
fi->entry.path = ps->path; static int filesystem_iterator_advance_over(
fi->pathlist_match = ps->pathlist_match; const git_index_entry **out,
git_index_entry__init_from_stat(&fi->entry, &ps->st, true); git_iterator_status_t *status,
git_iterator *i)
{
filesystem_iterator *iter = (filesystem_iterator *)i;
filesystem_iterator_frame *current_frame;
filesystem_iterator_entry *current_entry;
const git_index_entry *entry = NULL;
const char *base;
int error = 0;
/* need different mode here to keep directories during iteration */ *out = NULL;
fi->entry.mode = git_futils_canonical_mode(ps->st.st_mode); *status = GIT_ITERATOR_STATUS_NORMAL;
/* allow wrapper to check/update the entry (can force skip) */ assert(iterator__has_been_accessed(i));
if (fi->update_entry_cb &&
fi->update_entry_cb(fi) == GIT_ENOTFOUND) {
fs_iterator__advance_over_internal(&fi->base);
continue;
}
/* if this is a tree and trees aren't included, then skip */ current_frame = filesystem_iterator_current_frame(iter);
if (fi->entry.mode == GIT_FILEMODE_TREE && !iterator__include_trees(fi)) { assert(current_frame);
int error = fs_iterator__advance_into(NULL, &fi->base); current_entry = filesystem_iterator_current_entry(current_frame);
assert(current_entry);
if (error != GIT_ENOTFOUND) if ((error = git_iterator_current(&entry, i)) < 0)
return error; return error;
giterr_clear(); if (!S_ISDIR(entry->mode)) {
fs_iterator__advance_over_internal(&fi->base); if (filesystem_iterator_current_is_ignored(iter))
continue; *status = GIT_ITERATOR_STATUS_IGNORED;
}
break; return filesystem_iterator_advance(out, i);
} }
return 0; git_buf_clear(&iter->tmp_buf);
} if ((error = git_buf_puts(&iter->tmp_buf, entry->path)) < 0)
return error;
static int fs_iterator__initialize( base = iter->tmp_buf.ptr;
git_iterator **out, fs_iterator *fi, const char *root)
{
int error;
if (git_buf_sets(&fi->path, root) < 0 || git_path_to_dir(&fi->path) < 0) { /* scan inside the directory looking for files. if we find nothing,
git__free(fi); * we will remain EMPTY. if we find any ignored item, upgrade EMPTY to
return -1; * IGNORED. if we find a real actual item, upgrade all the way to NORMAL
} * and then stop.
fi->root_len = fi->path.size; *
fi->pathlist_match = ITERATOR_PATHLIST_MATCH_CHILD; * however, if we're here looking for a pathlist item (but are not
* actually in the pathlist ourselves) then start at FILTERED instead of
* EMPTY. callers then know that this path was not something they asked
* about.
*/
*status = current_entry->match == ITERATOR_PATHLIST_IS_PARENT ?
GIT_ITERATOR_STATUS_FILTERED : GIT_ITERATOR_STATUS_EMPTY;
fi->dirload_flags = while (entry && !iter->base.prefixcomp(entry->path, base)) {
(iterator__ignore_case(fi) ? GIT_PATH_DIR_IGNORE_CASE : 0) | if (filesystem_iterator_current_is_ignored(iter)) {
(iterator__flag(fi, PRECOMPOSE_UNICODE) ? /* if we found an explicitly ignored item, then update from
GIT_PATH_DIR_PRECOMPOSE_UNICODE : 0); * EMPTY to IGNORED
*/
*status = GIT_ITERATOR_STATUS_IGNORED;
} else if (S_ISDIR(entry->mode)) {
error = filesystem_iterator_advance_into(&entry, i);
if ((error = fs_iterator__expand_dir(fi)) < 0) { if (!error)
if (error == GIT_ENOTFOUND || error == GIT_ITEROVER) { continue;
giterr_clear();
/* this directory disappeared, ignore it */
else if (error == GIT_ENOTFOUND)
error = 0; error = 0;
/* a real error occurred */
else
break;
} else { } else {
git_iterator_free((git_iterator *)fi); /* we found a non-ignored item, treat parent as untracked */
fi = NULL; *status = GIT_ITERATOR_STATUS_NORMAL;
break;
}
if ((error = git_iterator_advance(&entry, i)) < 0)
break;
} }
/* wrap up scan back to base directory */
while (entry && !iter->base.prefixcomp(entry->path, base)) {
if ((error = git_iterator_advance(&entry, i)) < 0)
break;
} }
*out = (git_iterator *)fi; if (!error)
*out = entry;
return error; return error;
} }
int git_iterator_for_filesystem( static void filesystem_iterator_clear(filesystem_iterator *iter)
git_iterator **out,
const char *root,
git_iterator_options *options)
{ {
fs_iterator *fi = git__calloc(1, sizeof(fs_iterator)); while (iter->frames.size)
GITERR_CHECK_ALLOC(fi); filesystem_iterator_frame_pop(iter);
ITERATOR_BASE_INIT(fi, fs, FS, NULL); git_array_clear(iter->frames);
git_ignore__free(&iter->ignores);
if (options && (options->flags & GIT_ITERATOR_IGNORE_CASE) != 0) git_buf_free(&iter->tmp_buf);
fi->base.flags |= GIT_ITERATOR_IGNORE_CASE;
return fs_iterator__initialize(out, fi, root); iterator_clear(&iter->base);
} }
static int filesystem_iterator_init(filesystem_iterator *iter)
typedef struct {
fs_iterator fi;
git_ignores ignores;
int is_ignored;
/*
* We may have a tree or the index+snapshot to compare against
* when checking for submodules.
*/
git_tree *tree;
git_index *index;
git_vector index_snapshot;
git_vector_cmp entry_srch;
} workdir_iterator;
GIT_INLINE(bool) workdir_path_is_dotgit(const git_buf *path)
{ {
size_t len; int error;
if (!path || (len = path->size) < 4) if (iterator__honor_ignores(&iter->base) &&
return false; (error = git_ignore__for_path(iter->base.repo,
".gitignore", &iter->ignores)) < 0)
return error;
if (path->ptr[len - 1] == '/') if ((error = filesystem_iterator_frame_push(iter, NULL)) < 0)
len--; return error;
if (git__tolower(path->ptr[len - 1]) != 't' || iter->base.flags &= ~GIT_ITERATOR_FIRST_ACCESS;
git__tolower(path->ptr[len - 2]) != 'i' ||
git__tolower(path->ptr[len - 3]) != 'g' ||
git__tolower(path->ptr[len - 4]) != '.')
return false;
return (len == 4 || path->ptr[len - 5] == '/'); return 0;
} }
/** static int filesystem_iterator_reset(git_iterator *i)
* Figure out if an entry is a submodule.
*
* We consider it a submodule if the path is listed as a submodule in
* either the tree or the index.
*/
static int is_submodule(workdir_iterator *wi, fs_iterator_path_with_stat *ie)
{ {
int error, is_submodule = 0; filesystem_iterator *iter = (filesystem_iterator *)i;
if (wi->tree) {
git_tree_entry *e;
/* remove the trailing slash for finding */
ie->path[ie->path_len-1] = '\0';
error = git_tree_entry_bypath(&e, wi->tree, ie->path);
ie->path[ie->path_len-1] = '/';
if (error < 0 && error != GIT_ENOTFOUND)
return 0;
if (!error) {
is_submodule = e->attr == GIT_FILEMODE_COMMIT;
git_tree_entry_free(e);
}
}
if (!is_submodule && wi->index) { filesystem_iterator_clear(iter);
git_index_entry *e; return filesystem_iterator_init(iter);
size_t pos; }
error = git_index_snapshot_find(&pos, &wi->index_snapshot, wi->entry_srch, ie->path, ie->path_len-1, 0); static int filesystem_iterator_reset_range(
if (error < 0 && error != GIT_ENOTFOUND) git_iterator *i, const char *start, const char *end)
return 0; {
if (iterator_range_reset(i, start, end) < 0)
return -1;
if (!error) { return filesystem_iterator_reset(i);
e = git_vector_get(&wi->index_snapshot, pos); }
is_submodule = e->mode == GIT_FILEMODE_COMMIT; static int filesystem_iterator_at_end(git_iterator *i)
} {
} filesystem_iterator *iter = (filesystem_iterator *)i;
return is_submodule; return (iter->frames.size == 0);
} }
GIT_INLINE(git_dir_flag) git_entry__dir_flag(git_index_entry *entry) { static void filesystem_iterator_free(git_iterator *i)
#if defined(GIT_WIN32) && !defined(__MINGW32__) {
return (entry && entry->mode) filesystem_iterator *iter = (filesystem_iterator *)i;
? S_ISDIR(entry->mode) ? GIT_DIR_FLAG_TRUE : GIT_DIR_FLAG_FALSE filesystem_iterator_clear(iter);
: GIT_DIR_FLAG_UNKNOWN;
#else
GIT_UNUSED(entry);
return GIT_DIR_FLAG_UNKNOWN;
#endif
} }
static int workdir_iterator__enter_dir(fs_iterator *fi) static int iterator_for_filesystem(
git_iterator **out,
git_repository *repo,
const char *root,
git_index *index,
git_tree *tree,
git_iterator_type_t type,
git_iterator_options *options)
{ {
workdir_iterator *wi = (workdir_iterator *)fi; filesystem_iterator *iter;
fs_iterator_frame *ff = fi->stack; size_t root_len;
size_t pos; int error;
fs_iterator_path_with_stat *entry;
bool found_submodules = false;
git_dir_flag dir_flag = git_entry__dir_flag(&fi->entry); static git_iterator_callbacks callbacks = {
filesystem_iterator_current,
filesystem_iterator_advance,
filesystem_iterator_advance_into,
filesystem_iterator_advance_over,
filesystem_iterator_reset,
filesystem_iterator_reset_range,
filesystem_iterator_at_end,
filesystem_iterator_free
};
/* check if this directory is ignored */ *out = NULL;
if (git_ignore__lookup(&ff->is_ignored, &wi->ignores, fi->path.ptr + fi->root_len, dir_flag) < 0) {
giterr_clear();
ff->is_ignored = GIT_IGNORE_NOTFOUND;
}
/* if this is not the top level directory... */ if (root == NULL)
if (ff->next != NULL) { return git_iterator_for_nothing(out, options);
ssize_t slash_pos = git_buf_rfind_next(&fi->path, '/');
/* inherit ignored from parent if no rule specified */ iter = git__calloc(1, sizeof(filesystem_iterator));
if (ff->is_ignored <= GIT_IGNORE_NOTFOUND) GITERR_CHECK_ALLOC(iter);
ff->is_ignored = ff->next->is_ignored;
/* push new ignores for files in this directory */ root_len = strlen(root);
(void)git_ignore__push_dir(&wi->ignores, &fi->path.ptr[slash_pos + 1]);
}
/* convert submodules to GITLINK and remove trailing slashes */ iter->root = git__malloc(root_len+2);
git_vector_foreach(&ff->entries, pos, entry) { GITERR_CHECK_ALLOC(iter->root);
if (!S_ISDIR(entry->st.st_mode) || !strcmp(GIT_DIR, entry->path))
continue;
if (is_submodule(wi, entry)) { memcpy(iter->root, root, root_len);
entry->st.st_mode = GIT_FILEMODE_COMMIT;
entry->path_len--;
entry->path[entry->path_len] = '\0';
found_submodules = true;
}
}
/* if we renamed submodules, re-sort and re-seek to start */ if (root_len == 0 || root[root_len-1] != '/') {
if (found_submodules) { iter->root[root_len] = '/';
git_vector_set_sorted(&ff->entries, 0); root_len++;
git_vector_sort(&ff->entries);
fs_iterator__seek_frame_start(fi, ff);
} }
iter->root[root_len] = '\0';
iter->root_len = root_len;
return 0; if ((error = git_buf_puts(&iter->current_path, iter->root)) < 0)
} goto on_error;
static int workdir_iterator__leave_dir(fs_iterator *fi) iter->base.type = type;
{ iter->base.cb = &callbacks;
workdir_iterator *wi = (workdir_iterator *)fi;
git_ignore__pop_dir(&wi->ignores);
return 0;
}
static int workdir_iterator__update_entry(fs_iterator *fi)
{
workdir_iterator *wi = (workdir_iterator *)fi;
/* skip over .git entries */ if ((error = iterator_init_common(&iter->base, repo, options)) < 0)
if (workdir_path_is_dotgit(&fi->path)) goto on_error;
return GIT_ENOTFOUND;
if (tree && (error = git_tree_dup(&iter->tree, tree)) < 0)
goto on_error;
if ((iter->index = index) != NULL &&
(error = git_index_snapshot_new(&iter->index_snapshot, index)) < 0)
goto on_error;
iter->dirload_flags =
(iterator__ignore_case(&iter->base) ? GIT_PATH_DIR_IGNORE_CASE : 0) |
(iterator__flag(&iter->base, PRECOMPOSE_UNICODE) ?
GIT_PATH_DIR_PRECOMPOSE_UNICODE : 0);
/* reset is_ignored since we haven't checked yet */ if ((error = filesystem_iterator_init(iter)) < 0)
wi->is_ignored = GIT_IGNORE_UNCHECKED; goto on_error;
*out = &iter->base;
return 0; return 0;
on_error:
git__free(iter->root);
git_buf_free(&iter->current_path);
git_iterator_free(&iter->base);
return error;
} }
static void workdir_iterator__free(git_iterator *self) int git_iterator_for_filesystem(
git_iterator **out,
const char *root,
git_iterator_options *options)
{ {
workdir_iterator *wi = (workdir_iterator *)self; return iterator_for_filesystem(out,
if (wi->index) NULL, root, NULL, NULL, GIT_ITERATOR_TYPE_FS, options);
git_index_snapshot_release(&wi->index_snapshot, wi->index);
git_tree_free(wi->tree);
fs_iterator__free(self);
git_ignore__free(&wi->ignores);
} }
int git_iterator_for_workdir_ext( int git_iterator_for_workdir_ext(
...@@ -2101,254 +2125,354 @@ int git_iterator_for_workdir_ext( ...@@ -2101,254 +2125,354 @@ int git_iterator_for_workdir_ext(
const char *repo_workdir, const char *repo_workdir,
git_index *index, git_index *index,
git_tree *tree, git_tree *tree,
git_iterator_options *options) git_iterator_options *given_opts)
{ {
int error, precompose = 0; git_iterator_options options = GIT_ITERATOR_OPTIONS_INIT;
workdir_iterator *wi;
if (!repo_workdir) { if (!repo_workdir) {
if (git_repository__ensure_not_bare(repo, "scan working directory") < 0) if (git_repository__ensure_not_bare(repo, "scan working directory") < 0)
return GIT_EBAREREPO; return GIT_EBAREREPO;
repo_workdir = git_repository_workdir(repo); repo_workdir = git_repository_workdir(repo);
} }
/* initialize as an fs iterator then do overrides */ /* upgrade to a workdir iterator, adding necessary internal flags */
wi = git__calloc(1, sizeof(workdir_iterator)); if (given_opts)
GITERR_CHECK_ALLOC(wi); memcpy(&options, given_opts, sizeof(git_iterator_options));
ITERATOR_BASE_INIT((&wi->fi), fs, FS, repo);
wi->fi.base.type = GIT_ITERATOR_TYPE_WORKDIR; options.flags |= GIT_ITERATOR_HONOR_IGNORES |
wi->fi.cb.free = workdir_iterator__free; GIT_ITERATOR_IGNORE_DOT_GIT;
wi->fi.enter_dir_cb = workdir_iterator__enter_dir;
wi->fi.leave_dir_cb = workdir_iterator__leave_dir;
wi->fi.update_entry_cb = workdir_iterator__update_entry;
if ((error = iterator__update_ignore_case((git_iterator *)wi, options ? options->flags : 0)) < 0 || return iterator_for_filesystem(out,
(error = git_ignore__for_path(repo, ".gitignore", &wi->ignores)) < 0) repo, repo_workdir, index, tree, GIT_ITERATOR_TYPE_WORKDIR, &options);
{ }
git_iterator_free((git_iterator *)wi);
return error;
}
if (tree && (error = git_tree_dup(&wi->tree, tree)) < 0)
return error;
wi->index = index; /* Index iterator */
if (index && (error = git_index_snapshot_new(&wi->index_snapshot, index)) < 0) {
git_iterator_free((git_iterator *)wi);
return error;
}
wi->entry_srch = iterator__ignore_case(wi) ?
git_index_entry_isrch : git_index_entry_srch;
/* try to look up precompose and set flag if appropriate */ typedef struct {
if (git_repository__cvar(&precompose, repo, GIT_CVAR_PRECOMPOSE) < 0) git_iterator base;
giterr_clear(); git_iterator_callbacks cb;
else if (precompose) git_index *index;
wi->fi.base.flags |= GIT_ITERATOR_PRECOMPOSE_UNICODE; git_vector entries;
git_vector_cmp entry_srch;
size_t current;
/* when limiting with a pathlist, this is the current index into it */
size_t pathlist_idx;
/* when not in autoexpand mode, use these to represent "tree" state */
git_buf partial;
size_t partial_pos;
char restore_terminator;
git_index_entry tree_entry;
} index_iterator;
return fs_iterator__initialize(out, &wi->fi, repo_workdir); static const git_index_entry *index_iterator__index_entry(index_iterator *ii)
{
const git_index_entry *ie = git_vector_get(&ii->entries, ii->current);
if (ie != NULL && iterator__past_end(ii, ie->path)) {
ii->current = git_vector_length(&ii->entries);
ie = NULL;
}
return ie;
} }
void git_iterator_free(git_iterator *iter) static const git_index_entry *index_iterator__advance_over_unwanted(
index_iterator *ii)
{ {
if (iter == NULL) const git_index_entry *ie = index_iterator__index_entry(ii);
return; bool match;
iter->cb->free(iter); while (ie) {
if (!iterator__include_conflicts(ii) &&
git_index_entry_is_conflict(ie)) {
ii->current++;
ie = index_iterator__index_entry(ii);
continue;
}
git_vector_free(&iter->pathlist); /* if we have a pathlist, this entry's path must be in it to be
git__free(iter->start); * returned. walk the pathlist in unison with the index to
git__free(iter->end); * compare paths.
*/
if (ii->base.pathlist.length) {
match = iterator_pathlist_walk__contains(&ii->base, ie->path);
memset(iter, 0, sizeof(*iter)); if (!match) {
ii->current++;
ie = index_iterator__index_entry(ii);
continue;
}
}
git__free(iter); break;
}
return ie;
} }
int git_iterator_set_ignore_case(git_iterator *iter, bool ignore_case) static void index_iterator__next_prefix_tree(index_iterator *ii)
{ {
bool desire_ignore_case = (ignore_case != 0); const char *slash;
if (iterator__ignore_case(iter) == desire_ignore_case) if (!iterator__include_trees(ii))
return 0; return;
if (iter->type == GIT_ITERATOR_TYPE_EMPTY) { slash = strchr(&ii->partial.ptr[ii->partial_pos], '/');
if (desire_ignore_case)
iter->flags |= GIT_ITERATOR_IGNORE_CASE; if (slash != NULL) {
else ii->partial_pos = (slash - ii->partial.ptr) + 1;
iter->flags &= ~GIT_ITERATOR_IGNORE_CASE; ii->restore_terminator = ii->partial.ptr[ii->partial_pos];
ii->partial.ptr[ii->partial_pos] = '\0';
} else { } else {
giterr_set(GITERR_INVALID, ii->partial_pos = ii->partial.size;
"Cannot currently set ignore case on non-empty iterators");
return -1;
} }
return 0; if (index_iterator__index_entry(ii) == NULL)
ii->partial_pos = ii->partial.size;
} }
git_index *git_iterator_get_index(git_iterator *iter) static int index_iterator__first_prefix_tree(index_iterator *ii)
{ {
if (iter->type == GIT_ITERATOR_TYPE_INDEX) const git_index_entry *ie = index_iterator__advance_over_unwanted(ii);
return ((index_iterator *)iter)->index; const char *scan, *prior, *slash;
return NULL;
if (!ie || !iterator__include_trees(ii))
return 0;
/* find longest common prefix with prior index entry */
for (scan = slash = ie->path, prior = ii->partial.ptr;
*scan && *scan == *prior; ++scan, ++prior)
if (*scan == '/')
slash = scan;
if (git_buf_sets(&ii->partial, ie->path) < 0)
return -1;
ii->partial_pos = (slash - ie->path) + 1;
index_iterator__next_prefix_tree(ii);
return 0;
} }
static void workdir_iterator_update_is_ignored(workdir_iterator *wi) #define index_iterator__at_tree(I) \
(iterator__include_trees(I) && (I)->partial_pos < (I)->partial.size)
static int index_iterator__current(
const git_index_entry **entry, git_iterator *self)
{ {
git_dir_flag dir_flag = git_entry__dir_flag(&wi->fi.entry); index_iterator *ii = (index_iterator *)self;
const git_index_entry *ie = git_vector_get(&ii->entries, ii->current);
if (git_ignore__lookup(&wi->is_ignored, &wi->ignores, wi->fi.entry.path, dir_flag) < 0) { if (ie != NULL && index_iterator__at_tree(ii)) {
giterr_clear(); ii->tree_entry.path = ii->partial.ptr;
wi->is_ignored = GIT_IGNORE_NOTFOUND; ie = &ii->tree_entry;
} }
/* use ignore from containing frame stack */ if (entry)
if (wi->is_ignored <= GIT_IGNORE_NOTFOUND) *entry = ie;
wi->is_ignored = wi->fi.stack->is_ignored;
ii->base.flags |= GIT_ITERATOR_FIRST_ACCESS;
return (ie != NULL) ? 0 : GIT_ITEROVER;
} }
bool git_iterator_current_is_ignored(git_iterator *iter) static int index_iterator__at_end(git_iterator *self)
{ {
workdir_iterator *wi = (workdir_iterator *)iter; index_iterator *ii = (index_iterator *)self;
return (ii->current >= git_vector_length(&ii->entries));
}
if (iter->type != GIT_ITERATOR_TYPE_WORKDIR) static int index_iterator__advance(
return false; const git_index_entry **entry, git_iterator *self)
{
index_iterator *ii = (index_iterator *)self;
size_t entrycount = git_vector_length(&ii->entries);
const git_index_entry *ie;
if (!iterator__has_been_accessed(ii))
return index_iterator__current(entry, self);
if (wi->is_ignored != GIT_IGNORE_UNCHECKED) if (index_iterator__at_tree(ii)) {
return (bool)(wi->is_ignored == GIT_IGNORE_TRUE); if (iterator__do_autoexpand(ii)) {
ii->partial.ptr[ii->partial_pos] = ii->restore_terminator;
index_iterator__next_prefix_tree(ii);
} else {
/* advance to sibling tree (i.e. find entry with new prefix) */
while (ii->current < entrycount) {
ii->current++;
workdir_iterator_update_is_ignored(wi); if (!(ie = git_vector_get(&ii->entries, ii->current)) ||
ii->base.prefixcomp(ie->path, ii->partial.ptr) != 0)
break;
}
return (bool)(wi->is_ignored == GIT_IGNORE_TRUE); if (index_iterator__first_prefix_tree(ii) < 0)
return -1;
}
} else {
if (ii->current < entrycount)
ii->current++;
if (index_iterator__first_prefix_tree(ii) < 0)
return -1;
}
return index_iterator__current(entry, self);
} }
bool git_iterator_current_tree_is_ignored(git_iterator *iter) static int index_iterator__advance_into(
const git_index_entry **entry, git_iterator *self)
{ {
workdir_iterator *wi = (workdir_iterator *)iter; index_iterator *ii = (index_iterator *)self;
const git_index_entry *ie = git_vector_get(&ii->entries, ii->current);
if (iter->type != GIT_ITERATOR_TYPE_WORKDIR) if (ie != NULL && index_iterator__at_tree(ii)) {
return false; if (ii->restore_terminator)
ii->partial.ptr[ii->partial_pos] = ii->restore_terminator;
index_iterator__next_prefix_tree(ii);
}
return (bool)(wi->fi.stack->is_ignored == GIT_IGNORE_TRUE); return index_iterator__current(entry, self);
} }
int git_iterator_cmp(git_iterator *iter, const char *path_prefix) static int index_iterator__reset(git_iterator *self)
{ {
const git_index_entry *entry; index_iterator *ii = (index_iterator *)self;
const git_index_entry *ie;
/* a "done" iterator is after every prefix */ ii->current = 0;
if (git_iterator_current(&entry, iter) < 0 || entry == NULL) ii->base.flags &= ~GIT_ITERATOR_FIRST_ACCESS;
return 1;
/* a NULL prefix is after any valid iterator */ iterator_pathlist_walk__reset(self);
if (!path_prefix)
/* if we're given a start prefix, find it; if we're given a pathlist, find
* the first of those. start at the later of the two.
*/
if (ii->base.start)
git_index_snapshot_find(
&ii->current, &ii->entries, ii->entry_srch, ii->base.start, 0, 0);
if ((ie = index_iterator__advance_over_unwanted(ii)) == NULL)
return 0;
if (git_buf_sets(&ii->partial, ie->path) < 0)
return -1; return -1;
return iter->prefixcomp(entry->path, path_prefix); ii->partial_pos = 0;
}
int git_iterator_current_workdir_path(git_buf **path, git_iterator *iter) if (ii->base.start) {
{ size_t startlen = strlen(ii->base.start);
workdir_iterator *wi = (workdir_iterator *)iter;
if (iter->type != GIT_ITERATOR_TYPE_WORKDIR || !wi->fi.entry.path) ii->partial_pos = (startlen > ii->partial.size) ?
*path = NULL; ii->partial.size : startlen;
else }
*path = &wi->fi.path;
index_iterator__next_prefix_tree(ii);
return 0; return 0;
} }
int git_iterator_index(git_index **out, git_iterator *iter) static int index_iterator__reset_range(
git_iterator *self, const char *start, const char *end)
{ {
workdir_iterator *wi = (workdir_iterator *)iter; if (iterator__reset_range(self, start, end) < 0)
return -1;
if (iter->type != GIT_ITERATOR_TYPE_WORKDIR)
*out = NULL;
*out = wi->index; return index_iterator__reset(self);
}
return 0; static void index_iterator__free(git_iterator *self)
{
index_iterator *ii = (index_iterator *)self;
git_index_snapshot_release(&ii->entries, ii->index);
ii->index = NULL;
git_buf_free(&ii->partial);
} }
int git_iterator_advance_over_with_status( int git_iterator_for_index(
const git_index_entry **entryptr, git_iterator **iter,
git_iterator_status_t *status, git_repository *repo,
git_iterator *iter) git_index *index,
git_iterator_options *options)
{ {
int error = 0; int error = 0;
workdir_iterator *wi = (workdir_iterator *)iter; index_iterator *ii = git__calloc(1, sizeof(index_iterator));
char *base = NULL; GITERR_CHECK_ALLOC(ii);
const git_index_entry *entry;
*status = GIT_ITERATOR_STATUS_NORMAL;
if (iter->type != GIT_ITERATOR_TYPE_WORKDIR) if ((error = git_index_snapshot_new(&ii->entries, index)) < 0) {
return git_iterator_advance(entryptr, iter); git__free(ii);
if ((error = git_iterator_current(&entry, iter)) < 0)
return error; return error;
}
ii->index = index;
if (!S_ISDIR(entry->mode)) { ITERATOR_BASE_INIT(ii, index, INDEX, repo);
workdir_iterator_update_is_ignored(wi);
if (wi->is_ignored == GIT_IGNORE_TRUE) if ((error = iterator__update_ignore_case((git_iterator *)ii, options ? options->flags : 0)) < 0) {
*status = GIT_ITERATOR_STATUS_IGNORED; git_iterator_free((git_iterator *)ii);
return git_iterator_advance(entryptr, iter); return error;
} }
*status = GIT_ITERATOR_STATUS_EMPTY; ii->entry_srch = iterator__ignore_case(ii) ?
git_index_entry_isrch : git_index_entry_srch;
base = git__strdup(entry->path); git_vector_set_cmp(&ii->entries, iterator__ignore_case(ii) ?
GITERR_CHECK_ALLOC(base); git_index_entry_icmp : git_index_entry_cmp);
git_vector_sort(&ii->entries);
/* scan inside directory looking for a non-ignored item */ git_buf_init(&ii->partial, 0);
while (entry && !iter->prefixcomp(entry->path, base)) { ii->tree_entry.mode = GIT_FILEMODE_TREE;
workdir_iterator_update_is_ignored(wi);
/* if we found an explicitly ignored item, then update from index_iterator__reset((git_iterator *)ii);
* EMPTY to IGNORED
*/
if (wi->is_ignored == GIT_IGNORE_TRUE)
*status = GIT_ITERATOR_STATUS_IGNORED;
else if (S_ISDIR(entry->mode)) {
error = git_iterator_advance_into(&entry, iter);
if (!error) *iter = (git_iterator *)ii;
continue; return 0;
}
else if (error == GIT_ENOTFOUND) {
/* we entered this directory only hoping to find child matches to
* our pathlist (eg, this is `foo` and we had a pathlist entry for
* `foo/bar`). it should not be ignored, it should be excluded.
*/
if (wi->fi.pathlist_match == ITERATOR_PATHLIST_MATCH_CHILD)
*status = GIT_ITERATOR_STATUS_FILTERED;
else
wi->is_ignored = GIT_IGNORE_TRUE; /* mark empty dirs ignored */
error = 0; void git_iterator_free(git_iterator *iter)
} else {
break; /* real error, stop here */ if (iter == NULL)
} else { return;
/* we found a non-ignored item, treat parent as untracked */
*status = GIT_ITERATOR_STATUS_NORMAL;
break;
}
if ((error = git_iterator_advance(&entry, iter)) < 0) iter->cb->free(iter);
break;
}
/* wrap up scan back to base directory */ git_vector_free(&iter->pathlist);
while (entry && !iter->prefixcomp(entry->path, base)) git__free(iter->start);
if ((error = git_iterator_advance(&entry, iter)) < 0) git__free(iter->end);
break;
*entryptr = entry; memset(iter, 0, sizeof(*iter));
git__free(base);
return error; git__free(iter);
}
int git_iterator_cmp(git_iterator *iter, const char *path_prefix)
{
const git_index_entry *entry;
/* a "done" iterator is after every prefix */
if (git_iterator_current(&entry, iter) < 0 || entry == NULL)
return 1;
/* a NULL prefix is after any valid iterator */
if (!path_prefix)
return -1;
return iter->prefixcomp(entry->path, path_prefix);
}
git_index *git_iterator_index(git_iterator *iter)
{
if (iter->type == GIT_ITERATOR_TYPE_INDEX)
return ((index_iterator *)iter)->index;
if (iter->type == GIT_ITERATOR_TYPE_FS ||
iter->type == GIT_ITERATOR_TYPE_WORKDIR)
return ((filesystem_iterator *)iter)->index;
return NULL;
} }
int git_iterator_walk( int git_iterator_walk(
......
...@@ -34,10 +34,19 @@ typedef enum { ...@@ -34,10 +34,19 @@ typedef enum {
GIT_ITERATOR_DONT_AUTOEXPAND = (1u << 3), GIT_ITERATOR_DONT_AUTOEXPAND = (1u << 3),
/** convert precomposed unicode to decomposed unicode */ /** convert precomposed unicode to decomposed unicode */
GIT_ITERATOR_PRECOMPOSE_UNICODE = (1u << 4), GIT_ITERATOR_PRECOMPOSE_UNICODE = (1u << 4),
/** never convert precomposed unicode to decomposed unicode */
GIT_ITERATOR_DONT_PRECOMPOSE_UNICODE = (1u << 5),
/** include conflicts */ /** include conflicts */
GIT_ITERATOR_INCLUDE_CONFLICTS = (1u << 5), GIT_ITERATOR_INCLUDE_CONFLICTS = (1u << 6),
} git_iterator_flag_t; } git_iterator_flag_t;
typedef enum {
GIT_ITERATOR_STATUS_NORMAL = 0,
GIT_ITERATOR_STATUS_IGNORED = 1,
GIT_ITERATOR_STATUS_EMPTY = 2,
GIT_ITERATOR_STATUS_FILTERED = 3
} git_iterator_status_t;
typedef struct { typedef struct {
const char *start; const char *start;
const char *end; const char *end;
...@@ -57,6 +66,8 @@ typedef struct { ...@@ -57,6 +66,8 @@ typedef struct {
int (*current)(const git_index_entry **, git_iterator *); int (*current)(const git_index_entry **, git_iterator *);
int (*advance)(const git_index_entry **, git_iterator *); int (*advance)(const git_index_entry **, git_iterator *);
int (*advance_into)(const git_index_entry **, git_iterator *); int (*advance_into)(const git_index_entry **, git_iterator *);
int (*advance_over)(
const git_index_entry **, git_iterator_status_t *, git_iterator *);
int (*reset)(git_iterator *); int (*reset)(git_iterator *);
int (*reset_range)(git_iterator *, const char *start, const char *end); int (*reset_range)(git_iterator *, const char *start, const char *end);
int (*at_end)(git_iterator *); int (*at_end)(git_iterator *);
...@@ -67,8 +78,13 @@ struct git_iterator { ...@@ -67,8 +78,13 @@ struct git_iterator {
git_iterator_type_t type; git_iterator_type_t type;
git_iterator_callbacks *cb; git_iterator_callbacks *cb;
git_repository *repo; git_repository *repo;
char *start; char *start;
size_t start_len;
char *end; char *end;
size_t end_len;
bool started; bool started;
bool ended; bool ended;
git_vector pathlist; git_vector pathlist;
...@@ -76,6 +92,7 @@ struct git_iterator { ...@@ -76,6 +92,7 @@ struct git_iterator {
int (*strcomp)(const char *a, const char *b); int (*strcomp)(const char *a, const char *b);
int (*strncomp)(const char *a, const char *b, size_t n); int (*strncomp)(const char *a, const char *b, size_t n);
int (*prefixcomp)(const char *str, const char *prefix); int (*prefixcomp)(const char *str, const char *prefix);
int (*entry_srch)(const void *key, const void *array_member);
size_t stat_calls; size_t stat_calls;
unsigned int flags; unsigned int flags;
}; };
...@@ -183,6 +200,28 @@ GIT_INLINE(int) git_iterator_advance_into( ...@@ -183,6 +200,28 @@ GIT_INLINE(int) git_iterator_advance_into(
return iter->cb->advance_into(entry, iter); return iter->cb->advance_into(entry, iter);
} }
/* Advance over a directory and check if it contains no files or just
* ignored files.
*
* In a tree or the index, all directories will contain files, but in the
* working directory it is possible to have an empty directory tree or a
* tree that only contains ignored files. Many Git operations treat these
* cases specially. This advances over a directory (presumably an
* untracked directory) but checks during the scan if there are any files
* and any non-ignored files.
*/
GIT_INLINE(int) git_iterator_advance_over(
const git_index_entry **entry,
git_iterator_status_t *status,
git_iterator *iter)
{
if (iter->cb->advance_over)
return iter->cb->advance_over(entry, status, iter);
*status = GIT_ITERATOR_STATUS_NORMAL;
return git_iterator_advance(entry, iter);
}
/** /**
* Advance into a tree or skip over it if it is empty. * Advance into a tree or skip over it if it is empty.
* *
...@@ -273,35 +312,12 @@ extern int git_iterator_cmp( ...@@ -273,35 +312,12 @@ extern int git_iterator_cmp(
extern int git_iterator_current_workdir_path( extern int git_iterator_current_workdir_path(
git_buf **path, git_iterator *iter); git_buf **path, git_iterator *iter);
/* Return index pointer if index iterator, else NULL */
extern git_index *git_iterator_get_index(git_iterator *iter);
typedef enum {
GIT_ITERATOR_STATUS_NORMAL = 0,
GIT_ITERATOR_STATUS_IGNORED = 1,
GIT_ITERATOR_STATUS_EMPTY = 2,
GIT_ITERATOR_STATUS_FILTERED = 3
} git_iterator_status_t;
/* Advance over a directory and check if it contains no files or just
* ignored files.
*
* In a tree or the index, all directories will contain files, but in the
* working directory it is possible to have an empty directory tree or a
* tree that only contains ignored files. Many Git operations treat these
* cases specially. This advances over a directory (presumably an
* untracked directory) but checks during the scan if there are any files
* and any non-ignored files.
*/
extern int git_iterator_advance_over_with_status(
const git_index_entry **entry, git_iterator_status_t *status, git_iterator *iter);
/** /**
* Retrieve the index stored in the iterator. * Retrieve the index stored in the iterator.
* *
* Only implemented for the workdir iterator * Only implemented for the workdir and index iterators.
*/ */
extern int git_iterator_index(git_index **out, git_iterator *iter); extern git_index *git_iterator_index(git_iterator *iter);
typedef int (*git_iterator_walk_cb)( typedef int (*git_iterator_walk_cb)(
const git_index_entry **entries, const git_index_entry **entries,
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment