1 /*
2  * Copyright (C) the libgit2 contributors. All rights reserved.
3  *
4  * This file is part of libgit2, distributed under the GNU GPL v2 with
5  * a Linking Exception. For full terms see the included COPYING file.
6  */
7 #ifndef INCLUDE_buffer_h__
8 #define INCLUDE_buffer_h__
9 
10 #include "common.h"
11 #include "git2/strarray.h"
12 #include "git2/buffer.h"
13 
14 /* typedef struct {
15  *  	char   *ptr;
16  *  	size_t asize, size;
17  * } git_buf;
18  */
19 
/**
 * Kind of byte order mark (BOM) found at the head of a piece of text.
 *
 * The numeric values are spelled out explicitly so that they stay stable
 * if enumerators are ever reordered.
 */
typedef enum {
	/** No BOM */
	GIT_BUF_BOM_NONE     = 0,
	/** UTF-8 BOM */
	GIT_BUF_BOM_UTF8     = 1,
	/** UTF-16, little-endian BOM */
	GIT_BUF_BOM_UTF16_LE = 2,
	/** UTF-16, big-endian BOM */
	GIT_BUF_BOM_UTF16_BE = 3,
	/** UTF-32, little-endian BOM */
	GIT_BUF_BOM_UTF32_LE = 4,
	/** UTF-32, big-endian BOM */
	GIT_BUF_BOM_UTF32_BE = 5
} git_buf_bom_t;
28 
29 typedef struct {
30 	git_buf_bom_t bom; /* BOM found at head of text */
31 	unsigned int nul, cr, lf, crlf; /* NUL, CR, LF and CRLF counts */
32 	unsigned int printable, nonprintable; /* These are just approximations! */
33 } git_buf_text_stats;
34 
35 extern char git_buf__initbuf[];
36 extern char git_buf__oom[];
37 
38 /* Use to initialize buffer structure when git_buf is on stack */
39 #define GIT_BUF_INIT { git_buf__initbuf, 0, 0 }
40 
41 /**
42  * Static initializer for git_buf from static buffer
43  */
44 #ifdef GIT_DEPRECATE_HARD
45 # define GIT_BUF_INIT_CONST(STR,LEN) { (char *)(STR), 0, (size_t)(LEN) }
46 #endif
47 
git_buf_is_allocated(const git_buf * buf)48 GIT_INLINE(bool) git_buf_is_allocated(const git_buf *buf)
49 {
50 	return (buf->ptr != NULL && buf->asize > 0);
51 }
52 
53 /**
54  * Initialize a git_buf structure.
55  *
56  * For the cases where GIT_BUF_INIT cannot be used to do static
57  * initialization.
58  */
59 extern int git_buf_init(git_buf *buf, size_t initial_size);
60 
61 #ifdef GIT_DEPRECATE_HARD
62 
63 /**
64  * Resize the buffer allocation to make more space.
65  *
66  * This will attempt to grow the buffer to accommodate the target size.
67  *
68  * If the buffer refers to memory that was not allocated by libgit2 (i.e.
69  * the `asize` field is zero), then `ptr` will be replaced with a newly
70  * allocated block of data.  Be careful so that memory allocated by the
71  * caller is not lost.  As a special variant, if you pass `target_size` as
72  * 0 and the memory is not allocated by libgit2, this will allocate a new
73  * buffer of size `size` and copy the external data into it.
74  *
75  * Currently, this will never shrink a buffer, only expand it.
76  *
77  * If the allocation fails, this will return an error and the buffer will be
 * marked as invalid for future operations, invalidating the contents.
79  *
80  * @param buffer The buffer to be resized; may or may not be allocated yet
81  * @param target_size The desired available size
82  * @return 0 on success, -1 on allocation failure
83  */
84 int git_buf_grow(git_buf *buffer, size_t target_size);
85 
86 #endif
87 
88 /**
89  * Resize the buffer allocation to make more space.
90  *
91  * This will attempt to grow the buffer to accommodate the additional size.
92  * It is similar to `git_buf_grow`, but performs the new size calculation,
93  * checking for overflow.
94  *
95  * Like `git_buf_grow`, if this is a user-supplied buffer, this will allocate
96  * a new buffer.
97  */
98 extern int git_buf_grow_by(git_buf *buffer, size_t additional_size);
99 
/**
 * Attempt to grow the buffer to hold at least `target_size` bytes.
 *
 * If the allocation fails, this will return an error.  If `mark_oom` is true,
 * this will mark the buffer as invalid for future operations; if false,
 * existing buffer content will be preserved, but calling code must handle
 * that the buffer was not expanded.
 *
 * NOTE: this comment previously described a `preserve_external` flag (when
 * true, any existing data pointed to by `ptr`, even if `asize` is zero, is
 * copied into the newly allocated buffer).  The declaration that follows
 * takes no such parameter, so that description appears to be stale; check
 * the implementation for how externally-owned data is handled.
 */
110 extern int git_buf_try_grow(
111 	git_buf *buf, size_t target_size, bool mark_oom);
112 
113 /**
114  * Sanitizes git_buf structures provided from user input.  Users of the
115  * library, when providing git_buf's, may wish to provide a NULL ptr for
116  * ease of handling.  The buffer routines, however, expect a non-NULL ptr
117  * always.  This helper method simply handles NULL input, converting to a
118  * git_buf__initbuf. If a buffer with a non-NULL ptr is passed in, this method
119  * assures that the buffer is '\0'-terminated.
120  */
121 extern int git_buf_sanitize(git_buf *buf);
122 
123 extern void git_buf_swap(git_buf *buf_a, git_buf *buf_b);
124 extern char *git_buf_detach(git_buf *buf);
125 extern int git_buf_attach(git_buf *buf, char *ptr, size_t asize);
126 
127 /* Populates a `git_buf` where the contents are not "owned" by the
128  * buffer, and calls to `git_buf_dispose` will not free the given buf.
129  */
130 extern void git_buf_attach_notowned(
131 	git_buf *buf, const char *ptr, size_t size);
132 
133 /**
134  * Test if there have been any reallocation failures with this git_buf.
135  *
136  * Any function that writes to a git_buf can fail due to memory allocation
137  * issues.  If one fails, the git_buf will be marked with an OOM error and
138  * further calls to modify the buffer will fail.  Check git_buf_oom() at the
139  * end of your sequence and it will be true if you ran out of memory at any
140  * point with that buffer.
141  *
142  * @return false if no error, true if allocation error
143  */
git_buf_oom(const git_buf * buf)144 GIT_INLINE(bool) git_buf_oom(const git_buf *buf)
145 {
146 	return (buf->ptr == git_buf__oom);
147 }
148 
149 /*
150  * Functions below that return int value error codes will return 0 on
151  * success or -1 on failure (which generally means an allocation failed).
 * Using a git_buf where the allocation has failed will result in -1 from
153  * all further calls using that buffer.  As a result, you can ignore the
154  * return code of these functions and call them in a series then just call
155  * git_buf_oom at the end.
156  */
157 
158 #ifdef GIT_DEPRECATE_HARD
159 int git_buf_set(git_buf *buffer, const void *data, size_t datalen);
160 #endif
161 
162 int git_buf_sets(git_buf *buf, const char *string);
163 int git_buf_putc(git_buf *buf, char c);
164 int git_buf_putcn(git_buf *buf, char c, size_t len);
165 int git_buf_put(git_buf *buf, const char *data, size_t len);
166 int git_buf_puts(git_buf *buf, const char *string);
167 int git_buf_printf(git_buf *buf, const char *format, ...) GIT_FORMAT_PRINTF(2, 3);
168 int git_buf_vprintf(git_buf *buf, const char *format, va_list ap);
169 void git_buf_clear(git_buf *buf);
170 void git_buf_consume_bytes(git_buf *buf, size_t len);
171 void git_buf_consume(git_buf *buf, const char *end);
172 void git_buf_truncate(git_buf *buf, size_t len);
173 void git_buf_shorten(git_buf *buf, size_t amount);
174 void git_buf_truncate_at_char(git_buf *buf, char separator);
175 void git_buf_rtruncate_at_char(git_buf *path, char separator);
176 
177 /** General join with separator */
178 int git_buf_join_n(git_buf *buf, char separator, int nbuf, ...);
179 /** Fast join of two strings - first may legally point into `buf` data */
180 int git_buf_join(git_buf *buf, char separator, const char *str_a, const char *str_b);
181 /** Fast join of three strings - cannot reference `buf` data */
182 int git_buf_join3(git_buf *buf, char separator, const char *str_a, const char *str_b, const char *str_c);
183 
184 /**
185  * Join two strings as paths, inserting a slash between as needed.
186  * @return 0 on success, -1 on failure
187  */
git_buf_joinpath(git_buf * buf,const char * a,const char * b)188 GIT_INLINE(int) git_buf_joinpath(git_buf *buf, const char *a, const char *b)
189 {
190 	return git_buf_join(buf, '/', a, b);
191 }
192 
git_buf_cstr(const git_buf * buf)193 GIT_INLINE(const char *) git_buf_cstr(const git_buf *buf)
194 {
195 	return buf->ptr;
196 }
197 
git_buf_len(const git_buf * buf)198 GIT_INLINE(size_t) git_buf_len(const git_buf *buf)
199 {
200 	return buf->size;
201 }
202 
203 int git_buf_copy_cstr(char *data, size_t datasize, const git_buf *buf);
204 
/*
 * Pass `str` to git_buf_put() with a length of `sizeof(str) - 1`.
 *
 * Because the length comes from `sizeof`, `str` must be a string literal
 * or a char array; with a `char *` the length would be the pointer size
 * minus one rather than the string length.
 */
#define git_buf_PUTS(buf, str) \
	git_buf_put((buf), (str), sizeof(str) - 1)
206 
git_buf_rfind_next(const git_buf * buf,char ch)207 GIT_INLINE(ssize_t) git_buf_rfind_next(const git_buf *buf, char ch)
208 {
209 	ssize_t idx = (ssize_t)buf->size - 1;
210 	while (idx >= 0 && buf->ptr[idx] == ch) idx--;
211 	while (idx >= 0 && buf->ptr[idx] != ch) idx--;
212 	return idx;
213 }
214 
git_buf_rfind(const git_buf * buf,char ch)215 GIT_INLINE(ssize_t) git_buf_rfind(const git_buf *buf, char ch)
216 {
217 	ssize_t idx = (ssize_t)buf->size - 1;
218 	while (idx >= 0 && buf->ptr[idx] != ch) idx--;
219 	return idx;
220 }
221 
git_buf_find(const git_buf * buf,char ch)222 GIT_INLINE(ssize_t) git_buf_find(const git_buf *buf, char ch)
223 {
224 	void *found = memchr(buf->ptr, ch, buf->size);
225 	return found ? (ssize_t)((const char *)found - buf->ptr) : -1;
226 }
227 
228 /* Remove whitespace from the end of the buffer */
229 void git_buf_rtrim(git_buf *buf);
230 
231 int git_buf_cmp(const git_buf *a, const git_buf *b);
232 
233 /* Quote and unquote a buffer as specified in
234  * http://marc.info/?l=git&m=112927316408690&w=2
235  */
236 int git_buf_quote(git_buf *buf);
237 int git_buf_unquote(git_buf *buf);
238 
239 /* Write data as base64 encoded in buffer */
240 int git_buf_encode_base64(git_buf *buf, const char *data, size_t len);
/* Decode the given base64 and write the result to the buffer */
242 int git_buf_decode_base64(git_buf *buf, const char *base64, size_t len);
243 
244 /* Write data as "base85" encoded in buffer */
245 int git_buf_encode_base85(git_buf *buf, const char *data, size_t len);
246 /* Decode the given "base85" and write the result to the buffer */
247 int git_buf_decode_base85(git_buf *buf, const char *base64, size_t len, size_t output_len);
248 
249 /* Decode the given percent-encoded string and write the result to the buffer */
250 int git_buf_decode_percent(git_buf *buf, const char *str, size_t len);
251 
252 /*
253  * Insert, remove or replace a portion of the buffer.
254  *
255  * @param buf The buffer to work with
256  *
257  * @param where The location in the buffer where the transformation
258  * should be applied.
259  *
260  * @param nb_to_remove The number of chars to be removed. 0 to not
261  * remove any character in the buffer.
262  *
263  * @param data A pointer to the data which should be inserted.
264  *
265  * @param nb_to_insert The number of chars to be inserted. 0 to not
 * insert any character into the buffer.
267  *
268  * @return 0 or an error code.
269  */
270 int git_buf_splice(
271 	git_buf *buf,
272 	size_t where,
273 	size_t nb_to_remove,
274 	const char *data,
275 	size_t nb_to_insert);
276 
277 /**
278  * Append string to buffer, prefixing each character from `esc_chars` with
279  * `esc_with` string.
280  *
281  * @param buf Buffer to append data to
282  * @param string String to escape and append
283  * @param esc_chars Characters to be escaped
 * @param esc_with String to insert in front of each found character
285  * @return 0 on success, <0 on failure (probably allocation problem)
286  */
287 extern int git_buf_puts_escaped(
288 	git_buf *buf,
289 	const char *string,
290 	const char *esc_chars,
291 	const char *esc_with);
292 
293 /**
294  * Append string escaping characters that are regex special
295  */
git_buf_puts_escape_regex(git_buf * buf,const char * string)296 GIT_INLINE(int) git_buf_puts_escape_regex(git_buf *buf, const char *string)
297 {
298 	return git_buf_puts_escaped(buf, string, "^.[]$()|*+?{}\\", "\\");
299 }
300 
301 /**
302  * Unescape all characters in a buffer in place
303  *
304  * I.e. remove backslashes
305  */
306 extern void git_buf_unescape(git_buf *buf);
307 
308 /**
309  * Replace all \r\n with \n.
310  *
311  * @return 0 on success, -1 on memory error
312  */
313 extern int git_buf_crlf_to_lf(git_buf *tgt, const git_buf *src);
314 
315 /**
316  * Replace all \n with \r\n. Does not modify existing \r\n.
317  *
318  * @return 0 on success, -1 on memory error
319  */
320 extern int git_buf_lf_to_crlf(git_buf *tgt, const git_buf *src);
321 
322 /**
 * Fill buffer with the common prefix of an array of strings
324  *
325  * Buffer will be set to empty if there is no common prefix
326  */
327 extern int git_buf_common_prefix(git_buf *buf, char *const *const strings, size_t count);
328 
329 /**
330  * Check if a buffer begins with a UTF BOM
331  *
 * @param bom Set to the type of BOM detected or GIT_BUF_BOM_NONE
333  * @param buf Buffer in which to check the first bytes for a BOM
334  * @return Number of bytes of BOM data (or 0 if no BOM found)
335  */
336 extern int git_buf_detect_bom(git_buf_bom_t *bom, const git_buf *buf);
337 
338 /**
339  * Gather stats for a piece of text
340  *
341  * Fill the `stats` structure with counts of unreadable characters, carriage
342  * returns, etc, so it can be used in heuristics.  This automatically skips
343  * a trailing EOF (\032 character).  Also it will look for a BOM at the
344  * start of the text and can be told to skip that as well.
345  *
346  * @param stats Structure to be filled in
347  * @param buf Text to process
348  * @param skip_bom Exclude leading BOM from stats if true
349  * @return Does the buffer heuristically look like binary data
350  */
351 extern bool git_buf_gather_text_stats(
352 	git_buf_text_stats *stats, const git_buf *buf, bool skip_bom);
353 
354 #ifdef GIT_DEPRECATE_HARD
355 
356 /**
357 * Check quickly if buffer looks like it contains binary data
358 *
359 * @param buf Buffer to check
360 * @return 1 if buffer looks like non-text data
361 */
362 int git_buf_is_binary(const git_buf *buf);
363 
364 /**
365 * Check quickly if buffer contains a NUL byte
366 *
367 * @param buf Buffer to check
368 * @return 1 if buffer contains a NUL byte
369 */
370 int git_buf_contains_nul(const git_buf *buf);
371 
372 #endif
373 
374 #endif
375