/* * Copyright (C) the libgit2 contributors. All rights reserved. * * This file is part of libgit2, distributed under the GNU GPL v2 with * a Linking Exception. For full terms see the included COPYING file. */ #ifndef INCLUDE_fs_path_h__ #define INCLUDE_fs_path_h__ #include "common.h" #include "posix.h" #include "str.h" #include "vector.h" #include "utf8.h" /** * Path manipulation utils * * These are path utilities that munge paths without actually * looking at the real filesystem. */ /* * The dirname() function shall take a pointer to a character string * that contains a pathname, and return a pointer to a string that is a * pathname of the parent directory of that file. Trailing '/' characters * in the path are not counted as part of the path. * * If path does not contain a '/', then dirname() shall return a pointer to * the string ".". If path is a null pointer or points to an empty string, * dirname() shall return a pointer to the string "." . * * The `git_fs_path_dirname` implementation is thread safe. The returned * string must be manually free'd. * * The `git_fs_path_dirname_r` implementation writes the dirname to a `git_str` * if the buffer pointer is not NULL. * It returns an error code < 0 if there is an allocation error, otherwise * the length of the dirname (which will be > 0). */ extern char *git_fs_path_dirname(const char *path); extern int git_fs_path_dirname_r(git_str *buffer, const char *path); /* * This function returns the basename of the file, which is the last * part of its full name given by fname, with the drive letter and * leading directories stripped off. For example, the basename of * c:/foo/bar/file.ext is file.ext, and the basename of a:foo is foo. * * Trailing slashes and backslashes are significant: the basename of * c:/foo/bar/ is an empty string after the rightmost slash. * * The `git_fs_path_basename` implementation is thread safe. The returned * string must be manually free'd. * * The `git_fs_path_basename_r` implementation writes the basename to a `git_str`. * It returns an error code < 0 if there is an allocation error, otherwise * the length of the basename (which will be >= 0). */ extern char *git_fs_path_basename(const char *path); extern int git_fs_path_basename_r(git_str *buffer, const char *path); /* Return the offset of the start of the basename. Unlike the other * basename functions, this returns 0 if the path is empty. */ extern size_t git_fs_path_basename_offset(git_str *buffer); /** * Find offset to root of path if path has one. * * This will return a number >= 0 which is the offset to the start of the * path, if the path is rooted (i.e. "/rooted/path" returns 0 and * "c:/windows/rooted/path" returns 2). If the path is not rooted, this * returns -1. */ extern int git_fs_path_root(const char *path); /** * Ensure path has a trailing '/'. */ extern int git_fs_path_to_dir(git_str *path); /** * Ensure string has a trailing '/' if there is space for it. */ extern void git_fs_path_string_to_dir(char *path, size_t size); /** * Taken from git.git; returns nonzero if the given path is "." or "..". */ GIT_INLINE(int) git_fs_path_is_dot_or_dotdot(const char *name) { return (name[0] == '.' && (name[1] == '\0' || (name[1] == '.' && name[2] == '\0'))); } #ifdef GIT_WIN32 GIT_INLINE(int) git_fs_path_is_dot_or_dotdotW(const wchar_t *name) { return (name[0] == L'.' && (name[1] == L'\0' || (name[1] == L'.' && name[2] == L'\0'))); } #define git_fs_path_is_absolute(p) \ (git__isalpha((p)[0]) && (p)[1] == ':' && ((p)[2] == '\\' || (p)[2] == '/')) #define git_fs_path_is_dirsep(p) \ ((p) == '/' || (p) == '\\') /** * Convert backslashes in path to forward slashes. */ GIT_INLINE(void) git_fs_path_mkposix(char *path) { while (*path) { if (*path == '\\') *path = '/'; path++; } } #else # define git_fs_path_mkposix(p) /* blank */ #define git_fs_path_is_absolute(p) \ ((p)[0] == '/') #define git_fs_path_is_dirsep(p) \ ((p) == '/') #endif /** * Check if string is a relative path (i.e. starts with "./" or "../") */ GIT_INLINE(int) git_fs_path_is_relative(const char *p) { return (p[0] == '.' && (p[1] == '/' || (p[1] == '.' && p[2] == '/'))); } /** * Check if string is at end of path segment (i.e. looking at '/' or '\0') */ GIT_INLINE(int) git_fs_path_at_end_of_segment(const char *p) { return !*p || *p == '/'; } extern int git__percent_decode(git_str *decoded_out, const char *input); /** * Extract path from file:// URL. */ extern int git_fs_path_fromurl(git_str *local_path_out, const char *file_url); /** * Path filesystem utils * * These are path utilities that actually access the filesystem. */ /** * Check if a file exists and can be accessed. * @return true or false */ extern bool git_fs_path_exists(const char *path); /** * Check if the given path points to a directory. * @return true or false */ extern bool git_fs_path_isdir(const char *path); /** * Check if the given path points to a regular file. * @return true or false */ extern bool git_fs_path_isfile(const char *path); /** * Check if the given path points to a symbolic link. * @return true or false */ extern bool git_fs_path_islink(const char *path); /** * Check if the given path is a directory, and is empty. */ extern bool git_fs_path_is_empty_dir(const char *path); /** * Stat a file and/or link and set error if needed. */ extern int git_fs_path_lstat(const char *path, struct stat *st); /** * Check if the parent directory contains the item. * * @param dir Directory to check. * @param item Item that might be in the directory. * @return 0 if item exists in directory, <0 otherwise. */ extern bool git_fs_path_contains(git_str *dir, const char *item); /** * Check if the given path contains the given subdirectory. * * @param parent Directory path that might contain subdir * @param subdir Subdirectory name to look for in parent * @return true if subdirectory exists, false otherwise. */ extern bool git_fs_path_contains_dir(git_str *parent, const char *subdir); /** * Determine the common directory length between two paths, including * the final path separator. For example, given paths 'a/b/c/1.txt * and 'a/b/c/d/2.txt', the common directory is 'a/b/c/', and this * will return the length of the string 'a/b/c/', which is 6. * * @param one The first path * @param two The second path * @return The length of the common directory */ extern size_t git_fs_path_common_dirlen(const char *one, const char *two); /** * Make the path relative to the given parent path. * * @param path The path to make relative * @param parent The parent path to make path relative to * @return 0 if path was made relative, GIT_ENOTFOUND * if there was not common root between the paths, * or <0. */ extern int git_fs_path_make_relative(git_str *path, const char *parent); /** * Check if the given path contains the given file. * * @param dir Directory path that might contain file * @param file File name to look for in parent * @return true if file exists, false otherwise. */ extern bool git_fs_path_contains_file(git_str *dir, const char *file); /** * Prepend base to unrooted path or just copy path over. * * This will optionally return the index into the path where the "root" * is, either the end of the base directory prefix or the path root. */ extern int git_fs_path_join_unrooted( git_str *path_out, const char *path, const char *base, ssize_t *root_at); /** * Removes multiple occurrences of '/' in a row, squashing them into a * single '/'. */ extern void git_fs_path_squash_slashes(git_str *path); /** * Clean up path, prepending base if it is not already rooted. */ extern int git_fs_path_prettify(git_str *path_out, const char *path, const char *base); /** * Clean up path, prepending base if it is not already rooted and * appending a slash. */ extern int git_fs_path_prettify_dir(git_str *path_out, const char *path, const char *base); /** * Get a directory from a path. * * If path is a directory, this acts like `git_fs_path_prettify_dir` * (cleaning up path and appending a '/'). If path is a normal file, * this prettifies it, then removed the filename a la dirname and * appends the trailing '/'. If the path does not exist, it is * treated like a regular filename. */ extern int git_fs_path_find_dir(git_str *dir); /** * Resolve relative references within a path. * * This eliminates "./" and "../" relative references inside a path, * as well as condensing multiple slashes into single ones. It will * not touch the path before the "ceiling" length. * * Additionally, this will recognize an "c:/" drive prefix or a "xyz://" URL * prefix and not touch that part of the path. */ extern int git_fs_path_resolve_relative(git_str *path, size_t ceiling); /** * Apply a relative path to base path. * * Note that the base path could be a filename or a URL and this * should still work. The relative path is walked segment by segment * with three rules: series of slashes will be condensed to a single * slash, "." will be eaten with no change, and ".." will remove a * segment from the base path. */ extern int git_fs_path_apply_relative(git_str *target, const char *relpath); enum { GIT_FS_PATH_DIR_IGNORE_CASE = (1u << 0), GIT_FS_PATH_DIR_PRECOMPOSE_UNICODE = (1u << 1), GIT_FS_PATH_DIR_INCLUDE_DOT_AND_DOTDOT = (1u << 2), }; /** * Walk each directory entry, except '.' and '..', calling fn(state). * * @param pathbuf Buffer the function reads the initial directory * path from, and updates with each successive entry's name. * @param flags Combination of GIT_FS_PATH_DIR flags. * @param callback Callback for each entry. Passed the `payload` and each * successive path inside the directory as a full path. This may * safely append text to the pathbuf if needed. Return non-zero to * cancel iteration (and return value will be propagated back). * @param payload Passed to callback as first argument. * @return 0 on success or error code from OS error or from callback */ extern int git_fs_path_direach( git_str *pathbuf, uint32_t flags, int (*callback)(void *payload, git_str *path), void *payload); /** * Sort function to order two paths */ extern int git_fs_path_cmp( const char *name1, size_t len1, int isdir1, const char *name2, size_t len2, int isdir2, int (*compare)(const char *, const char *, size_t)); /** * Invoke callback up path directory by directory until the ceiling is * reached (inclusive of a final call at the root_path). * * Returning anything other than 0 from the callback function * will stop the iteration and propagate the error to the caller. * * @param pathbuf Buffer the function reads the directory from and * and updates with each successive name. * @param ceiling Prefix of path at which to stop walking up. If NULL, * this will walk all the way up to the root. If not a prefix of * pathbuf, the callback will be invoked a single time on the * original input path. * @param callback Function to invoke on each path. Passed the `payload` * and the buffer containing the current path. The path should not * be modified in any way. Return non-zero to stop iteration. * @param payload Passed to fn as the first ath. */ extern int git_fs_path_walk_up( git_str *pathbuf, const char *ceiling, int (*callback)(void *payload, const char *path), void *payload); enum { GIT_FS_PATH_NOTEQUAL = 0, GIT_FS_PATH_EQUAL = 1, GIT_FS_PATH_PREFIX = 2 }; /* * Determines if a path is equal to or potentially a child of another. * @param parent The possible parent * @param child The possible child */ GIT_INLINE(int) git_fs_path_equal_or_prefixed( const char *parent, const char *child, ssize_t *prefixlen) { const char *p = parent, *c = child; int lastslash = 0; while (*p && *c) { lastslash = (*p == '/'); if (*p++ != *c++) return GIT_FS_PATH_NOTEQUAL; } if (*p != '\0') return GIT_FS_PATH_NOTEQUAL; if (*c == '\0') { if (prefixlen) *prefixlen = p - parent; return GIT_FS_PATH_EQUAL; } if (*c == '/' || lastslash) { if (prefixlen) *prefixlen = (p - parent) - lastslash; return GIT_FS_PATH_PREFIX; } return GIT_FS_PATH_NOTEQUAL; } /* translate errno to libgit2 error code and set error message */ extern int git_fs_path_set_error( int errno_value, const char *path, const char *action); /* check if non-ascii characters are present in filename */ extern bool git_fs_path_has_non_ascii(const char *path, size_t pathlen); #define GIT_PATH_REPO_ENCODING "UTF-8" #ifdef __APPLE__ #define GIT_PATH_NATIVE_ENCODING "UTF-8-MAC" #else #define GIT_PATH_NATIVE_ENCODING "UTF-8" #endif #ifdef GIT_USE_ICONV #include <iconv.h> typedef struct { iconv_t map; git_str buf; } git_fs_path_iconv_t; #define GIT_PATH_ICONV_INIT { (iconv_t)-1, GIT_STR_INIT } /* Init iconv data for converting decomposed UTF-8 to precomposed */ extern int git_fs_path_iconv_init_precompose(git_fs_path_iconv_t *ic); /* Clear allocated iconv data */ extern void git_fs_path_iconv_clear(git_fs_path_iconv_t *ic); /* * Rewrite `in` buffer using iconv map if necessary, replacing `in` * pointer internal iconv buffer if rewrite happened. The `in` pointer * will be left unchanged if no rewrite was needed. */ extern int git_fs_path_iconv(git_fs_path_iconv_t *ic, const char **in, size_t *inlen); #endif /* GIT_USE_ICONV */ extern bool git_fs_path_does_decompose_unicode(const char *root); typedef struct git_fs_path_diriter git_fs_path_diriter; #if defined(GIT_WIN32) && !defined(__MINGW32__) struct git_fs_path_diriter { git_win32_path path; size_t parent_len; git_str path_utf8; size_t parent_utf8_len; HANDLE handle; unsigned int flags; WIN32_FIND_DATAW current; unsigned int needs_next; }; #define GIT_FS_PATH_DIRITER_INIT { {0}, 0, GIT_STR_INIT, 0, INVALID_HANDLE_VALUE } #else struct git_fs_path_diriter { git_str path; size_t parent_len; unsigned int flags; DIR *dir; #ifdef GIT_USE_ICONV git_fs_path_iconv_t ic; #endif }; #define GIT_FS_PATH_DIRITER_INIT { GIT_STR_INIT } #endif /** * Initialize a directory iterator. * * @param diriter Pointer to a diriter structure that will be setup. * @param path The path that will be iterated over * @param flags Directory reader flags * @return 0 or an error code */ extern int git_fs_path_diriter_init( git_fs_path_diriter *diriter, const char *path, unsigned int flags); /** * Advance the directory iterator. Will return GIT_ITEROVER when * the iteration has completed successfully. * * @param diriter The directory iterator * @return 0, GIT_ITEROVER, or an error code */ extern int git_fs_path_diriter_next(git_fs_path_diriter *diriter); /** * Returns the file name of the current item in the iterator. * * @param out Pointer to store the path in * @param out_len Pointer to store the length of the path in * @param diriter The directory iterator * @return 0 or an error code */ extern int git_fs_path_diriter_filename( const char **out, size_t *out_len, git_fs_path_diriter *diriter); /** * Returns the full path of the current item in the iterator; that * is the current filename plus the path of the directory that the * iterator was constructed with. * * @param out Pointer to store the path in * @param out_len Pointer to store the length of the path in * @param diriter The directory iterator * @return 0 or an error code */ extern int git_fs_path_diriter_fullpath( const char **out, size_t *out_len, git_fs_path_diriter *diriter); /** * Performs an `lstat` on the current item in the iterator. * * @param out Pointer to store the stat data in * @param diriter The directory iterator * @return 0 or an error code */ extern int git_fs_path_diriter_stat(struct stat *out, git_fs_path_diriter *diriter); /** * Closes the directory iterator. * * @param diriter The directory iterator */ extern void git_fs_path_diriter_free(git_fs_path_diriter *diriter); /** * Load all directory entries (except '.' and '..') into a vector. * * For cases where `git_fs_path_direach()` is not appropriate, this * allows you to load the filenames in a directory into a vector * of strings. That vector can then be sorted, iterated, or whatever. * Remember to free alloc of the allocated strings when you are done. * * @param contents Vector to fill with directory entry names. * @param path The directory to read from. * @param prefix_len When inserting entries, the trailing part of path * will be prefixed after this length. I.e. given path "/a/b" and * prefix_len 3, the entries will look like "b/e1", "b/e2", etc. * @param flags Combination of GIT_FS_PATH_DIR flags. */ extern int git_fs_path_dirload( git_vector *contents, const char *path, size_t prefix_len, uint32_t flags); /* Used for paths to repositories on the filesystem */ extern bool git_fs_path_is_local_file_url(const char *file_url); extern int git_fs_path_from_url_or_path(git_str *local_path_out, const char *url_or_path); /* Flags to determine path validity in `git_fs_path_isvalid` */ #define GIT_FS_PATH_REJECT_EMPTY_COMPONENT (1 << 0) #define GIT_FS_PATH_REJECT_TRAVERSAL (1 << 1) #define GIT_FS_PATH_REJECT_SLASH (1 << 2) #define GIT_FS_PATH_REJECT_BACKSLASH (1 << 3) #define GIT_FS_PATH_REJECT_TRAILING_DOT (1 << 4) #define GIT_FS_PATH_REJECT_TRAILING_SPACE (1 << 5) #define GIT_FS_PATH_REJECT_TRAILING_COLON (1 << 6) #define GIT_FS_PATH_REJECT_DOS_PATHS (1 << 7) #define GIT_FS_PATH_REJECT_NT_CHARS (1 << 8) #define GIT_FS_PATH_REJECT_LONG_PATHS (1 << 9) #define GIT_FS_PATH_REJECT_MAX (1 << 9) /* Default path safety for writing files to disk: since we use the * Win32 "File Namespace" APIs ("\\?\") we need to protect from * paths that the normal Win32 APIs would not write. */ #ifdef GIT_WIN32 # define GIT_FS_PATH_REJECT_FILESYSTEM_DEFAULTS \ GIT_FS_PATH_REJECT_EMPTY_COMPONENT | \ GIT_FS_PATH_REJECT_TRAVERSAL | \ GIT_FS_PATH_REJECT_BACKSLASH | \ GIT_FS_PATH_REJECT_TRAILING_DOT | \ GIT_FS_PATH_REJECT_TRAILING_SPACE | \ GIT_FS_PATH_REJECT_TRAILING_COLON | \ GIT_FS_PATH_REJECT_DOS_PATHS | \ GIT_FS_PATH_REJECT_NT_CHARS #else # define GIT_FS_PATH_REJECT_FILESYSTEM_DEFAULTS \ GIT_FS_PATH_REJECT_EMPTY_COMPONENT | \ GIT_FS_PATH_REJECT_TRAVERSAL #endif /** * Validate a filesystem path; with custom callbacks per-character and * per-path component. */ extern bool git_fs_path_str_is_valid_ext( const git_str *path, unsigned int flags, bool (*validate_char_cb)(char ch, void *payload), bool (*validate_component_cb)(const char *component, size_t len, void *payload), bool (*validate_length_cb)(const char *component, size_t len, size_t utf8_char_len), void *payload); GIT_INLINE(bool) git_fs_path_is_valid_ext( const char *path, unsigned int flags, bool (*validate_char_cb)(char ch, void *payload), bool (*validate_component_cb)(const char *component, size_t len, void *payload), bool (*validate_length_cb)(const char *component, size_t len, size_t utf8_char_len), void *payload) { const git_str str = GIT_STR_INIT_CONST(path, SIZE_MAX); return git_fs_path_str_is_valid_ext( &str, flags, validate_char_cb, validate_component_cb, validate_length_cb, payload); } /** * Validate a filesystem path. This ensures that the given path is legal * and does not contain any "unsafe" components like path traversal ('.' * or '..'), characters that are inappropriate for lesser filesystems * (trailing ' ' or ':' characters), or filenames ("component names") * that are not supported ('AUX', 'COM1"). */ GIT_INLINE(bool) git_fs_path_is_valid( const char *path, unsigned int flags) { const git_str str = GIT_STR_INIT_CONST(path, SIZE_MAX); return git_fs_path_str_is_valid_ext(&str, flags, NULL, NULL, NULL, NULL); } /** Validate a filesystem path in a `git_str`. */ GIT_INLINE(bool) git_fs_path_str_is_valid( const git_str *path, unsigned int flags) { return git_fs_path_str_is_valid_ext(path, flags, NULL, NULL, NULL, NULL); } extern int git_fs_path_validate_str_length_with_suffix( git_str *path, size_t suffix_len); /** * Validate an on-disk path, taking into account that it will have a * suffix appended (eg, `.lock`). */ GIT_INLINE(int) git_fs_path_validate_filesystem_with_suffix( const char *path, size_t path_len, size_t suffix_len) { #ifdef GIT_WIN32 size_t path_chars, total_chars; path_chars = git_utf8_char_length(path, path_len); if (GIT_ADD_SIZET_OVERFLOW(&total_chars, path_chars, suffix_len) || total_chars > MAX_PATH) { git_error_set(GIT_ERROR_FILESYSTEM, "path too long: '%s'", path); return -1; } return 0; #else GIT_UNUSED(path); GIT_UNUSED(path_len); GIT_UNUSED(suffix_len); return 0; #endif } /** * Validate an path on the filesystem. This ensures that the given * path is valid for the operating system/platform; for example, this * will ensure that the given absolute path is smaller than MAX_PATH on * Windows. * * For paths within the working directory, you should use ensure that * `core.longpaths` is obeyed. Use `git_fs_path_validate_workdir`. */ GIT_INLINE(int) git_fs_path_validate_filesystem( const char *path, size_t path_len) { return git_fs_path_validate_filesystem_with_suffix(path, path_len, 0); } /** * Convert any backslashes into slashes */ int git_fs_path_normalize_slashes(git_str *out, const char *path); bool git_fs_path_supports_symlinks(const char *dir); /** * Validate a system file's ownership * * Verify that the file in question is owned by an administrator or system * account, or at least by the current user. * * This function returns 0 if successful. If the file is not owned by any of * these, or any other if there have been problems determining the file * ownership, it returns -1. */ int git_fs_path_validate_system_file_ownership(const char *path); /** * Search the current PATH for the given executable, returning the full * path if it is found. */ int git_fs_path_find_executable(git_str *fullpath, const char *executable); #endif