Hash :
f0e693b1
Author :
Date :
2021-09-07T17:53:49
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326 327 328 329 330 331 332 333 334 335 336 337 338 339 340 341 342 343 344 345 346 347 348 349 350 351 352 353 354
/*
* Copyright (C) the libgit2 contributors. All rights reserved.
*
* This file is part of libgit2, distributed under the GNU GPL v2 with
* a Linking Exception. For full terms see the included COPYING file.
*/
#ifndef INCLUDE_str_h__
#define INCLUDE_str_h__
#include "common.h"
/*
* String buffer structure used by every git_str_* function in this header.
*
* NOTE(review): the field notes below are derived from the initializers
* and inline helpers in this header only; confirm the finer points
* against the implementation.
*/
struct git_str {
/* String data; git_str_oom() compares this against git_str__oom */
char *ptr;
/*
* Zero in GIT_STR_INIT and GIT_STR_INIT_CONST; git_str_is_allocated()
* requires it to be > 0 (presumably the allocated capacity in bytes)
*/
size_t asize;
/* Length of the contents, as returned by git_str_len() */
size_t size;
};
/*
* Kinds of byte-order mark; this is the type reported through the `bom`
* output parameter of git_str_detect_bom() and stored in
* git_str_text_stats.
*/
typedef enum {
GIT_STR_BOM_NONE = 0,
GIT_STR_BOM_UTF8 = 1,
GIT_STR_BOM_UTF16_LE = 2,
GIT_STR_BOM_UTF16_BE = 3,
GIT_STR_BOM_UTF32_LE = 4,
GIT_STR_BOM_UTF32_BE = 5
} git_str_bom_t;
/*
* Text statistics filled in by git_str_gather_text_stats(), intended
* for use in heuristics.
*/
typedef struct {
git_str_bom_t bom; /* BOM found at head of text */
unsigned int nul, cr, lf, crlf; /* NUL, CR, LF and CRLF counts */
unsigned int printable, nonprintable; /* These are just approximations! */
} git_str_text_stats;
/*
* Sentinel buffers defined outside this header. GIT_STR_INIT points `ptr`
* at git_str__initstr, and git_str_oom() reports an allocation failure
* when `ptr` equals git_str__oom.
*/
extern char git_str__initstr[];
extern char git_str__oom[];
/*
* Use to initialize string buffer structure when git_str is on stack.
* Sets `ptr` to git_str__initstr and both `asize` and `size` to 0.
*/
#define GIT_STR_INIT { git_str__initstr, 0, 0 }
/**
* Static initializer for git_str from static string buffer
*
* Sets `ptr` to `str` (cast to `char *`), `asize` to 0 and `size` to
* `len`. Because `asize` is 0, git_str_is_allocated() returns false for
* a buffer initialized this way.
*/
#define GIT_STR_INIT_CONST(str, len) { (char *)(str), 0, (size_t)(len) }
/**
* Test whether a string buffer counts as allocated.
*
* @param str The string buffer to inspect
* @return true when `ptr` is non-NULL and `asize` is greater than zero,
*         false otherwise
*/
GIT_INLINE(bool) git_str_is_allocated(const git_str *str)
{
	/* A NULL data pointer can never count as allocated. */
	if (str->ptr == NULL)
		return false;

	return str->asize > 0;
}
/**
* Initialize a git_str structure.
*
* For the cases where GIT_STR_INIT cannot be used to do static
* initialization.
*
* @param str The string buffer to initialize
* @param initial_size NOTE(review): presumably the number of bytes to
*        allocate up front -- confirm against the implementation
*/
extern int git_str_init(git_str *str, size_t initial_size);
/*
* NOTE(review): undocumented here. The comment on
* git_str_attach_notowned() implies this frees data owned by the string
* buffer but not data attached as "not owned" -- confirm.
*/
extern void git_str_dispose(git_str *str);
/**
* Resize the string buffer allocation to make more space.
*
* This will attempt to grow the string buffer to accommodate the target
* size. The string buffer's `ptr` will be replaced with a newly
* allocated block of data. Be careful so that memory allocated by the
* caller is not lost. As a special variant, if you pass `target_size` as
* 0 and the memory is not allocated by libgit2, this will allocate a new
* buffer of size `size` and copy the external data into it.
*
* Currently, this will never shrink a buffer, only expand it.
*
* If the allocation fails, this will return an error and the buffer will be
* marked as invalid for future operations, invalidating the contents.
*
* @param str The buffer to be resized; may or may not be allocated yet
* @param target_size The desired available size
* @return 0 on success, -1 on allocation failure
*/
int git_str_grow(git_str *str, size_t target_size);
/**
* Resize the buffer allocation to make more space.
*
* This will attempt to grow the string buffer to accommodate the
* additional size. It is similar to `git_str_grow`, but performs the
* new size calculation, checking for overflow.
*
* Like `git_str_grow`, if this is a user-supplied string buffer,
* this will allocate a new string buffer.
*
* @param str The string buffer to be resized
* @param additional_size The number of extra bytes to make room for
*/
extern int git_str_grow_by(git_str *str, size_t additional_size);
/**
* Attempt to grow the buffer to hold at least `target_size` bytes.
*
* If the allocation fails, this will return an error. If `mark_oom` is
* true, this will mark the string buffer as invalid for future
* operations; if false, existing string buffer content will be preserved,
* but calling code must handle that string buffer was not expanded.
*
* NOTE(review): this comment previously stated that, if a
* `preserve_external` flag is true, any existing data pointed to by
* `ptr` (even if `asize` is zero) will be copied into the newly
* allocated string buffer. The prototype below has no such parameter,
* so whether external data is copied must be confirmed against the
* implementation.
*
* @param str The string buffer to grow
* @param target_size The minimum number of bytes the buffer should hold
* @param mark_oom Whether an allocation failure marks the buffer invalid
*/
extern int git_str_try_grow(
git_str *str, size_t target_size, bool mark_oom);
/*
* NOTE(review): the next three functions are undocumented in this header.
* From the signatures: swap takes two buffers, detach returns a `char *`
* taken from a buffer, and attach hands a `char *` plus an `asize` to a
* buffer. Who owns and frees the memory afterwards must be confirmed
* against the implementation.
*/
extern void git_str_swap(git_str *str_a, git_str *str_b);
extern char *git_str_detach(git_str *str);
extern int git_str_attach(git_str *str, char *ptr, size_t asize);
/* Populates a `git_str` where the contents are not "owned" by the string
* buffer, and calls to `git_str_dispose` will not free the given string
* data.
*/
extern void git_str_attach_notowned(
git_str *str, const char *ptr, size_t size);
/**
* Report whether this git_str has suffered a reallocation failure.
*
* Every function that writes to a git_str may fail to allocate memory.
* When that happens the git_str is marked with an OOM error, and later
* calls that try to modify the string buffer fail as well. That lets a
* caller run a whole sequence of writes and check git_str_oom() once at
* the end: it is true if memory ran out at any point for that string
* buffer.
*
* @return false if no error, true if allocation error
*/
GIT_INLINE(bool) git_str_oom(const git_str *str)
{
	const char *current = str->ptr;

	/* The OOM mark is `ptr` pointing at the shared git_str__oom buffer. */
	return current == git_str__oom;
}
/*
* Functions below that return int value error codes will return 0 on
* success or -1 on failure (which generally means an allocation failed).
* Using a git_str where the allocation has failed will result in -1 from
* all further calls using that string buffer. As a result, you can
* ignore the return code of these functions and call them in a series
* then just call git_str_oom at the end.
*/
int git_str_set(git_str *str, const void *data, size_t datalen);
int git_str_sets(git_str *str, const char *string);
int git_str_putc(git_str *str, char c);
int git_str_putcn(git_str *str, char c, size_t len);
int git_str_put(git_str *str, const char *data, size_t len);
int git_str_puts(git_str *str, const char *string);
int git_str_printf(git_str *str, const char *format, ...) GIT_FORMAT_PRINTF(2, 3);
int git_str_vprintf(git_str *str, const char *format, va_list ap);
/*
* The functions below return void, so they report no error code.
*
* NOTE(review): their exact semantics (e.g. whether `len` in
* git_str_truncate is the new length, and which occurrence of
* `separator` the two *_at_char variants cut at) are not documented in
* this header -- confirm against the implementation.
*/
void git_str_clear(git_str *str);
void git_str_consume_bytes(git_str *str, size_t len);
void git_str_consume(git_str *str, const char *end);
void git_str_truncate(git_str *str, size_t len);
void git_str_shorten(git_str *str, size_t amount);
void git_str_truncate_at_char(git_str *path, char separator);
void git_str_rtruncate_at_char(git_str *path, char separator);
/**
* General join with separator
*
* NOTE(review): `len` is presumably the number of variadic string
* arguments that follow -- confirm against the implementation.
*/
int git_str_join_n(git_str *str, char separator, int len, ...);
/** Fast join of two strings - first may legally point into `str` data */
int git_str_join(git_str *str, char separator, const char *str_a, const char *str_b);
/** Fast join of three strings - cannot reference `str` data */
int git_str_join3(git_str *str, char separator, const char *str_a, const char *str_b, const char *str_c);
/**
* Join two strings as paths, with a slash inserted between them as
* needed. This is git_str_join() called with '/' as the separator.
*
* @param str String buffer that receives the joined path
* @param a First path component
* @param b Second path component
* @return 0 on success, -1 on failure
*/
GIT_INLINE(int) git_str_joinpath(git_str *str, const char *a, const char *b)
{
	const char path_separator = '/';

	return git_str_join(str, path_separator, a, b);
}
/**
* Get read-only access to the string buffer's data.
*
* @param str The string buffer to read
* @return The buffer's `ptr` field, unchanged
*/
GIT_INLINE(const char *) git_str_cstr(const git_str *str)
{
	const char *contents = str->ptr;

	return contents;
}
/**
* Get the length recorded for the string buffer.
*
* @param str The string buffer to read
* @return The buffer's `size` field
*/
GIT_INLINE(size_t) git_str_len(const git_str *str)
{
	size_t length = str->size;

	return length;
}
/*
* NOTE(review): undocumented here; from the signature this takes a
* caller-provided `data` buffer of `datasize` bytes and a source `str` --
* presumably copying the string into `data`. Confirm truncation and
* NUL-termination behavior against the implementation.
*/
int git_str_copy_cstr(char *data, size_t datasize, const git_str *str);
/*
* Call git_str_put() with the length computed at compile time as
* `sizeof(cstr) - 1`. `cstr` must therefore be a string literal or a
* char array: for a `char *`, sizeof yields the pointer size rather than
* the string length.
*/
#define git_str_PUTS(str, cstr) git_str_put(str, cstr, sizeof(cstr) - 1)
/**
* Search backwards for `ch`, ignoring any run of `ch` that ends the
* string buffer.
*
* @param str The string buffer to search
* @param ch The character to look for
* @return Index of the last `ch` that precedes the trailing run of `ch`
*         (if any), or -1 when there is none
*/
GIT_INLINE(ssize_t) git_str_rfind_next(const git_str *str, char ch)
{
	const char *data = str->ptr;
	ssize_t pos;

	/* Step backwards over any run of `ch` at the very end. */
	for (pos = (ssize_t)str->size - 1; pos >= 0; pos--) {
		if (data[pos] != ch)
			break;
	}

	/* Keep stepping back until an earlier `ch`, or run off the front. */
	for (; pos >= 0; pos--) {
		if (data[pos] == ch)
			break;
	}

	return pos;
}
/**
* Find the last occurrence of `ch` in the string buffer.
*
* @param str The string buffer to search
* @param ch The character to look for
* @return Index of the last `ch`, or -1 when `ch` does not occur
*/
GIT_INLINE(ssize_t) git_str_rfind(const git_str *str, char ch)
{
	ssize_t pos = (ssize_t)str->size;

	/* Walk from the final byte towards the front; -1 means no match. */
	while (--pos >= 0) {
		if (str->ptr[pos] == ch)
			break;
	}

	return pos;
}
/**
* Find the first occurrence of `ch` within the first `size` bytes of
* the string buffer.
*
* @param str The string buffer to search
* @param ch The character to look for
* @return Index of the first `ch`, or -1 when `ch` does not occur
*/
GIT_INLINE(ssize_t) git_str_find(const git_str *str, char ch)
{
	const char *hit = memchr(str->ptr, ch, str->size);

	if (hit == NULL)
		return -1;

	/* Convert the match address back into an offset from the start. */
	return (ssize_t)(hit - str->ptr);
}
/* Remove whitespace from the end of the string buffer */
void git_str_rtrim(git_str *str);
/*
* Compare two string buffers.
*
* NOTE(review): the ordering and return convention are not documented
* here; presumably memcmp/strcmp-like (<0, 0, >0) -- confirm.
*/
int git_str_cmp(const git_str *a, const git_str *b);
/* Quote and unquote a string buffer as specified in
* http://marc.info/?l=git&m=112927316408690&w=2
*
* Both take only `str`, so the result replaces the buffer's own contents.
*/
int git_str_quote(git_str *str);
int git_str_unquote(git_str *str);
/* Write data as base64 encoded in string buffer */
int git_str_encode_base64(git_str *str, const char *data, size_t len);
/* Decode the given base64 and write the result to the string buffer */
int git_str_decode_base64(git_str *str, const char *base64, size_t len);
/* Write data as "base85" encoded in string buffer */
int git_str_encode_base85(git_str *str, const char *data, size_t len);
/*
* Decode the given "base85" and write the result to the string buffer.
*
* NOTE(review): the input parameter is named `base64` although it
* carries base85 text; `output_len` is presumably the expected decoded
* length -- confirm against the implementation.
*/
int git_str_decode_base85(git_str *str, const char *base64, size_t len, size_t output_len);
/*
* Decode the given percent-encoded string and write the result to the
* string buffer.
*/
int git_str_decode_percent(git_str *str, const char *encoded, size_t len);
/*
* Insert, remove or replace a portion of the string buffer.
*
* @param str The string buffer to work with
*
* @param where The location in the string buffer where the transformation
* should be applied.
*
* @param nb_to_remove The number of chars to be removed. 0 to not
* remove any character in the string buffer.
*
* @param data A pointer to the data which should be inserted.
*
* @param nb_to_insert The number of chars to be inserted. 0 to not
* insert any character into the string buffer.
*
* @return 0 or an error code.
*/
int git_str_splice(
git_str *str,
size_t where,
size_t nb_to_remove,
const char *data,
size_t nb_to_insert);
/**
* Append string to string buffer, prefixing each character from
* `esc_chars` with `esc_with` string.
*
* @param str String buffer to append data to
* @param string String to escape and append
* @param esc_chars Characters to be escaped
* @param esc_with String to insert in front of each found character
* @return 0 on success, <0 on failure (probably allocation problem)
*/
extern int git_str_puts_escaped(
git_str *str,
const char *string,
const char *esc_chars,
const char *esc_with);
/**
* Append a string, backslash-escaping every character that is special
* in a regular expression.
*
* @param str String buffer to append data to
* @param string String to escape and append
* @return The result of git_str_puts_escaped()
*/
GIT_INLINE(int) git_str_puts_escape_regex(git_str *str, const char *string)
{
	/* Characters treated as regex-special, and the prefix put before each. */
	const char *regex_specials = "^.[]$()|*+?{}\\";
	const char *escape_prefix = "\\";

	return git_str_puts_escaped(str, string, regex_specials, escape_prefix);
}
/**
* Unescape all characters in a string buffer in place
*
* I.e. remove backslashes
*
* @param str String buffer to unescape
*/
extern void git_str_unescape(git_str *str);
/**
* Replace all \r\n with \n.
*
* @param tgt String buffer that receives the converted text
* @param src String buffer to read from (const, so not modified)
* @return 0 on success, -1 on memory error
*/
extern int git_str_crlf_to_lf(git_str *tgt, const git_str *src);
/**
* Replace all \n with \r\n. Does not modify existing \r\n.
*
* @param tgt String buffer that receives the converted text
* @param src String buffer to read from (const, so not modified)
* @return 0 on success, -1 on memory error
*/
extern int git_str_lf_to_crlf(git_str *tgt, const git_str *src);
/**
* Fill string buffer with the common prefix of an array of strings
*
* String buffer will be set to empty if there is no common prefix
*
* @param buf String buffer that receives the common prefix
* @param strings Array of strings to compare
* @param count Number of entries in `strings`
*/
extern int git_str_common_prefix(git_str *buf, char *const *const strings, size_t count);
/**
* Check if a string buffer begins with a UTF BOM
*
* @param bom Set to the type of BOM detected or GIT_STR_BOM_NONE
* @param str String buffer in which to check the first bytes for a BOM
* @return Number of bytes of BOM data (or 0 if no BOM found)
*/
extern int git_str_detect_bom(git_str_bom_t *bom, const git_str *str);
/**
* Gather stats for a piece of text
*
* Fill the `stats` structure with counts of unreadable characters, carriage
* returns, etc., so it can be used in heuristics. This automatically skips
* a trailing EOF (\032 character). Also it will look for a BOM at the
* start of the text and can be told to skip that as well.
*
* @param stats Structure to be filled in
* @param str Text to process
* @param skip_bom Exclude leading BOM from stats if true
* @return true if the string buffer heuristically looks like binary data
*/
extern bool git_str_gather_text_stats(
git_str_text_stats *stats, const git_str *str, bool skip_bom);
/**
* Check quickly if string buffer looks like it contains binary data
*
* @param str string buffer to check
* @return 1 if string buffer looks like non-text data
*         (NOTE(review): presumably 0 otherwise -- confirm)
*/
int git_str_is_binary(const git_str *str);
/**
* Check quickly if string buffer contains a NUL byte
*
* @param str string buffer to check
* @return 1 if string buffer contains a NUL byte
*         (NOTE(review): presumably 0 otherwise -- confirm)
*/
int git_str_contains_nul(const git_str *str);
#endif