/*
 * Copyright (C) the libgit2 contributors. All rights reserved.
 *
 * This file is part of libgit2, distributed under the GNU GPL v2 with
 * a Linking Exception. For full terms see the included COPYING file.
 */
#ifndef INCLUDE_str_h__
#define INCLUDE_str_h__

#include "common.h"

struct git_str {
	char *ptr;
	size_t asize;
	size_t size;
};

typedef enum {
	GIT_STR_BOM_NONE = 0,
	GIT_STR_BOM_UTF8 = 1,
	GIT_STR_BOM_UTF16_LE = 2,
	GIT_STR_BOM_UTF16_BE = 3,
	GIT_STR_BOM_UTF32_LE = 4,
	GIT_STR_BOM_UTF32_BE = 5
} git_str_bom_t;

typedef struct {
	git_str_bom_t bom; /* BOM found at head of text */
	unsigned int nul, cr, lf, crlf; /* NUL, CR, LF and CRLF counts */
	unsigned int printable, nonprintable; /* These are just approximations! */
} git_str_text_stats;

extern char git_str__initstr[];
extern char git_str__oom[];

/* Use to initialize string buffer structure when git_str is on stack */
#define GIT_STR_INIT { git_str__initstr, 0, 0 }

/**
 * Static initializer for git_str from static string buffer
 */
#define GIT_STR_INIT_CONST(str, len) { (char *)(str), 0, (size_t)(len) }

GIT_INLINE(bool) git_str_is_allocated(const git_str *str)
{
	return (str->ptr != NULL && str->asize > 0);
}

/**
 * Initialize a git_str structure.
 *
 * For the cases where GIT_STR_INIT cannot be used to do static
 * initialization.
 */
extern int git_str_init(git_str *str, size_t initial_size);

extern void git_str_dispose(git_str *str);

/**
 * Resize the string buffer allocation to make more space.
 *
 * This will attempt to grow the string buffer to accommodate the target
 * size.  The bstring buffer's `ptr` will be replaced with a newly
 * allocated block of data.  Be careful so that memory allocated by the
 * caller is not lost.  As a special variant, if you pass `target_size` as
 * 0 and the memory is not allocated by libgit2, this will allocate a new
 * buffer of size `size` and copy the external data into it.
 *
 * Currently, this will never shrink a buffer, only expand it.
 *
 * If the allocation fails, this will return an error and the buffer will be
 * marked as invalid for future operations, invaliding the contents.
 *
 * @param str The buffer to be resized; may or may not be allocated yet
 * @param target_size The desired available size
 * @return 0 on success, -1 on allocation failure
 */
int git_str_grow(git_str *str, size_t target_size);

/**
 * Resize the buffer allocation to make more space.
 *
 * This will attempt to grow the string buffer to accommodate the
 * additional size.  It is similar to `git_str_grow`, but performs the
 * new size calculation, checking for overflow.
 *
 * Like `git_str_grow`, if this is a user-supplied string buffer,
 * this will allocate a new string uffer.
 */
extern int git_str_grow_by(git_str *str, size_t additional_size);

/**
 * Attempt to grow the buffer to hold at least `target_size` bytes.
 *
 * If the allocation fails, this will return an error.  If `mark_oom` is
 * true, this will mark the string buffer as invalid for future
 * operations; if false, existing string buffer content will be preserved,
 * but calling code must handle that string buffer was not expanded.  If
 * `preserve_external` is true, then any existing data pointed to be
 * `ptr` even if `asize` is zero will be copied into the newly allocated
 * string buffer.
 */
extern int git_str_try_grow(
	git_str *str, size_t target_size, bool mark_oom);

extern void git_str_swap(git_str *str_a, git_str *str_b);
extern char *git_str_detach(git_str *str);
extern int git_str_attach(git_str *str, char *ptr, size_t asize);

/* Populates a `git_str` where the contents are not "owned" by the string
 * buffer, and calls to `git_str_dispose` will not free the given str.
 */
extern void git_str_attach_notowned(
	git_str *str, const char *ptr, size_t size);

/**
 * Test if there have been any reallocation failures with this git_str.
 *
 * Any function that writes to a git_str can fail due to memory allocation
 * issues.  If one fails, the git_str will be marked with an OOM error and
 * further calls to modify the string buffer will fail.  Check
 * git_str_oom() at the end of your sequence and it will be true if you
 * ran out of memory at any point with that string buffer.
 *
 * @return false if no error, true if allocation error
 */
GIT_INLINE(bool) git_str_oom(const git_str *str)
{
	return (str->ptr == git_str__oom);
}

/*
 * Functions below that return int value error codes will return 0 on
 * success or -1 on failure (which generally means an allocation failed).
 * Using a git_str where the allocation has failed with result in -1 from
 * all further calls using that string buffer.  As a result, you can
 * ignore the return code of these functions and call them in a series
 * then just call git_str_oom at the end.
 */

int git_str_set(git_str *str, const void *data, size_t datalen);

int git_str_sets(git_str *str, const char *string);
int git_str_putc(git_str *str, char c);
int git_str_putcn(git_str *str, char c, size_t len);
int git_str_put(git_str *str, const char *data, size_t len);
int git_str_puts(git_str *str, const char *string);
int git_str_printf(git_str *str, const char *format, ...) GIT_FORMAT_PRINTF(2, 3);
int git_str_vprintf(git_str *str, const char *format, va_list ap);
void git_str_clear(git_str *str);
void git_str_consume_bytes(git_str *str, size_t len);
void git_str_consume(git_str *str, const char *end);
void git_str_truncate(git_str *str, size_t len);
void git_str_shorten(git_str *str, size_t amount);
void git_str_truncate_at_char(git_str *path, char separator);
void git_str_rtruncate_at_char(git_str *path, char separator);

/** General join with separator */
int git_str_join_n(git_str *str, char separator, int len, ...);
/** Fast join of two strings - first may legally point into `str` data */
int git_str_join(git_str *str, char separator, const char *str_a, const char *str_b);
/** Fast join of three strings - cannot reference `str` data */
int git_str_join3(git_str *str, char separator, const char *str_a, const char *str_b, const char *str_c);

/**
 * Join two strings as paths, inserting a slash between as needed.
 * @return 0 on success, -1 on failure
 */
GIT_INLINE(int) git_str_joinpath(git_str *str, const char *a, const char *b)
{
	return git_str_join(str, '/', a, b);
}

GIT_INLINE(const char *) git_str_cstr(const git_str *str)
{
	return str->ptr;
}

GIT_INLINE(size_t) git_str_len(const git_str *str)
{
	return str->size;
}

int git_str_copy_cstr(char *data, size_t datasize, const git_str *str);

#define git_str_PUTS(str, cstr) git_str_put(str, cstr, sizeof(cstr) - 1)

GIT_INLINE(ssize_t) git_str_rfind_next(const git_str *str, char ch)
{
	ssize_t idx = (ssize_t)str->size - 1;
	while (idx >= 0 && str->ptr[idx] == ch) idx--;
	while (idx >= 0 && str->ptr[idx] != ch) idx--;
	return idx;
}

GIT_INLINE(ssize_t) git_str_rfind(const git_str *str, char ch)
{
	ssize_t idx = (ssize_t)str->size - 1;
	while (idx >= 0 && str->ptr[idx] != ch) idx--;
	return idx;
}

GIT_INLINE(ssize_t) git_str_find(const git_str *str, char ch)
{
	void *found = memchr(str->ptr, ch, str->size);
	return found ? (ssize_t)((const char *)found - str->ptr) : -1;
}

/* Remove whitespace from the end of the string buffer */
void git_str_rtrim(git_str *str);

int git_str_cmp(const git_str *a, const git_str *b);

/* Quote and unquote a string buffer as specified in
 * http://marc.info/?l=git&m=112927316408690&w=2
 */
int git_str_quote(git_str *str);
int git_str_unquote(git_str *str);

/* Write data as base64 encoded in string buffer */
int git_str_encode_base64(git_str *str, const char *data, size_t len);
/* Decode the given bas64 and write the result to the string buffer */
int git_str_decode_base64(git_str *str, const char *base64, size_t len);

/* Write data as "base85" encoded in string buffer */
int git_str_encode_base85(git_str *str, const char *data, size_t len);
/* Decode the given "base85" and write the result to the string buffer */
int git_str_decode_base85(git_str *str, const char *base64, size_t len, size_t output_len);

/*
 * Decode the given percent-encoded string and write the result to the
 * string buffer.
 */
int git_str_decode_percent(git_str *str, const char *encoded, size_t len);

/*
 * Insert, remove or replace a portion of the string buffer.
 *
 * @param str The string buffer to work with
 *
 * @param where The location in the string buffer where the transformation
 * should be applied.
 *
 * @param nb_to_remove The number of chars to be removed. 0 to not
 * remove any character in the string buffer.
 *
 * @param data A pointer to the data which should be inserted.
 *
 * @param nb_to_insert The number of chars to be inserted. 0 to not
 * insert any character from the string buffer.
 *
 * @return 0 or an error code.
 */
int git_str_splice(
	git_str *str,
	size_t where,
	size_t nb_to_remove,
	const char *data,
	size_t nb_to_insert);

/**
 * Append string to string buffer, prefixing each character from
 * `esc_chars` with `esc_with` string.
 *
 * @param str String buffer to append data to
 * @param string String to escape and append
 * @param esc_chars Characters to be escaped
 * @param esc_with String to insert in from of each found character
 * @return 0 on success, <0 on failure (probably allocation problem)
 */
extern int git_str_puts_escaped(
	git_str *str,
	const char *string,
	const char *esc_chars,
	const char *esc_with);

/**
 * Append string escaping characters that are regex special
 */
GIT_INLINE(int) git_str_puts_escape_regex(git_str *str, const char *string)
{
	return git_str_puts_escaped(str, string, "^.[]$()|*+?{}\\", "\\");
}

/**
 * Unescape all characters in a string buffer in place
 *
 * I.e. remove backslashes
 */
extern void git_str_unescape(git_str *str);

/**
 * Replace all \r\n with \n.
 *
 * @return 0 on success, -1 on memory error
 */
extern int git_str_crlf_to_lf(git_str *tgt, const git_str *src);

/**
 * Replace all \n with \r\n. Does not modify existing \r\n.
 *
 * @return 0 on success, -1 on memory error
 */
extern int git_str_lf_to_crlf(git_str *tgt, const git_str *src);

/**
 * Fill string buffer with the common prefix of a array of strings
 *
 * String buffer will be set to empty if there is no common prefix
 */
extern int git_str_common_prefix(git_str *buf, char *const *const strings, size_t count);

/**
 * Check if a string buffer begins with a UTF BOM
 *
 * @param bom Set to the type of BOM detected or GIT_BOM_NONE
 * @param str String buffer in which to check the first bytes for a BOM
 * @return Number of bytes of BOM data (or 0 if no BOM found)
 */
extern int git_str_detect_bom(git_str_bom_t *bom, const git_str *str);

/**
 * Gather stats for a piece of text
 *
 * Fill the `stats` structure with counts of unreadable characters, carriage
 * returns, etc, so it can be used in heuristics.  This automatically skips
 * a trailing EOF (\032 character).  Also it will look for a BOM at the
 * start of the text and can be told to skip that as well.
 *
 * @param stats Structure to be filled in
 * @param str Text to process
 * @param skip_bom Exclude leading BOM from stats if true
 * @return Does the string buffer heuristically look like binary data
 */
extern bool git_str_gather_text_stats(
	git_str_text_stats *stats, const git_str *str, bool skip_bom);

/**
* Check quickly if string buffer looks like it contains binary data
*
* @param str string buffer to check
* @return 1 if string buffer looks like non-text data
*/
int git_str_is_binary(const git_str *str);

/**
* Check quickly if buffer contains a NUL byte
*
* @param str string buffer to check
* @return 1 if string buffer contains a NUL byte
*/
int git_str_contains_nul(const git_str *str);

#endif