1 /*
2  * Copyright (C) the libgit2 contributors. All rights reserved.
3  *
4  * This file is part of libgit2, distributed under the GNU GPL v2 with
5  * a Linking Exception. For full terms see the included COPYING file.
6  */
7 
8 #include "index.h"
9 
10 #include <stddef.h>
11 
12 #include "repository.h"
13 #include "tree.h"
14 #include "tree-cache.h"
15 #include "hash.h"
16 #include "iterator.h"
17 #include "pathspec.h"
18 #include "ignore.h"
19 #include "blob.h"
20 #include "idxmap.h"
21 #include "diff.h"
22 #include "varint.h"
23 
24 #include "git2/odb.h"
25 #include "git2/oid.h"
26 #include "git2/blob.h"
27 #include "git2/config.h"
28 #include "git2/sys/index.h"
29 
/* Forward declaration; the definition lies outside this part of the file. */
static int index_apply_to_wd_diff(git_index *index, int action, const git_strarray *paths,
				  unsigned int flags,
				  git_index_matched_path_cb cb, void *payload);

/* Byte offset of `path` within a short entry, i.e. the size of its fixed-width fields. */
#define minimal_entry_size (offsetof(struct entry_short, path))

/*
 * The footer is the size of one raw object id; the header size equals the
 * three uint32_t fields of struct index_header.
 */
static const size_t INDEX_FOOTER_SIZE = GIT_OID_RAWSZ;
static const size_t INDEX_HEADER_SIZE = 12;

/*
 * Index format version numbers.  LB and UB are the inclusive bounds that
 * git_index_set_version() accepts; DEFAULT is what git_index_open() assigns.
 * NOTE(review): EXT and COMP presumably name the versions introducing
 * extended flags and compressed paths -- confirm against the format spec.
 */
static const unsigned int INDEX_VERSION_NUMBER_DEFAULT = 2;
static const unsigned int INDEX_VERSION_NUMBER_LB = 2;
static const unsigned int INDEX_VERSION_NUMBER_EXT = 3;
static const unsigned int INDEX_VERSION_NUMBER_COMP = 4;
static const unsigned int INDEX_VERSION_NUMBER_UB = 4;

/* 0x44495243 spells 'D' 'I' 'R' 'C' in ASCII. */
static const unsigned int INDEX_HEADER_SIG = 0x44495243;
/* Four-character extension signatures; the arrays are not NUL-terminated. */
static const char INDEX_EXT_TREECACHE_SIG[] = {'T', 'R', 'E', 'E'};
static const char INDEX_EXT_UNMERGED_SIG[] = {'R', 'E', 'U', 'C'};
static const char INDEX_EXT_CONFLICT_NAME_SIG[] = {'N', 'A', 'M', 'E'};

/* The refcount owner of `idx`, viewed as a repository (may be NULL). */
#define INDEX_OWNER(idx) ((git_repository *)(GIT_REFCOUNT_OWNER(idx)))
51 
/*
 * Index header: three 32-bit fields, 12 bytes in total.
 * NOTE(review): presumably filled in by read_header() from the start of the
 * index file -- confirm against its definition.
 */
struct index_header {
	uint32_t signature;
	uint32_t version;
	uint32_t entry_count;
};
57 
/* Extension header: a four-byte signature followed by a 32-bit size. */
struct index_extension {
	char signature[4];
	uint32_t extension_size;
};
62 
/* A timestamp split into 32-bit seconds and nanoseconds parts. */
struct entry_time {
	uint32_t seconds;
	uint32_t nanoseconds;
};
67 
/*
 * Entry layout without extended flags.  `minimal_entry_size` is derived from
 * the offset of `path` in this struct.
 * NOTE(review): presumably mirrors the on-disk entry format -- confirm.
 */
struct entry_short {
	struct entry_time ctime;
	struct entry_time mtime;
	uint32_t dev;
	uint32_t ino;
	uint32_t mode;
	uint32_t uid;
	uint32_t gid;
	uint32_t file_size;
	git_oid oid;
	uint16_t flags;
	char path[1]; /* arbitrary length */
};
81 
/*
 * Same fields as struct entry_short, with an additional 16-bit
 * `flags_extended` placed between `flags` and `path`.
 */
struct entry_long {
	struct entry_time ctime;
	struct entry_time mtime;
	uint32_t dev;
	uint32_t ino;
	uint32_t mode;
	uint32_t uid;
	uint32_t gid;
	uint32_t file_size;
	git_oid oid;
	uint16_t flags;
	uint16_t flags_extended;
	char path[1]; /* arbitrary length */
};
96 
/*
 * Search key handed to git_index_entry_srch() / git_index_entry_isrch().
 * `stage` may be GIT_INDEX_STAGE_ANY, in which case the stage is not compared.
 */
struct entry_srch_key {
	const char *path;
	size_t pathlen;
	int stage;
};
102 
/*
 * An index entry allocated together with its path.  index_entry_create()
 * copies the path into `path`, points `entry.path` at it and stores the
 * path's strlen() in `pathlen`.
 */
struct entry_internal {
	git_index_entry entry;
	size_t pathlen;
	char path[GIT_FLEX_ARRAY];
};
108 
/*
 * A REUC entry allocated together with its path; reuc_entry_alloc() fills it
 * the same way index_entry_create() fills struct entry_internal.
 */
struct reuc_entry_internal {
	git_index_reuc_entry entry;
	size_t pathlen;
	char path[GIT_FLEX_ARRAY];
};
114 
/*
 * When true, git_index_read_safely() refuses to reload an index that has
 * unsaved (dirty) changes.
 */
bool git_index__enforce_unsaved_safety = false;

/* local declarations */
static int read_extension(size_t *read_len, git_index *index, const char *buffer, size_t buffer_size);
static int read_header(struct index_header *dest, const void *buffer);

static int parse_index(git_index *index, const char *buffer, size_t buffer_size);
static bool is_index_extended(git_index *index);
static int write_index(git_oid *checksum, git_index *index, git_filebuf *file);

static void index_entry_free(git_index_entry *entry);
static void index_entry_reuc_free(git_index_reuc_entry *reuc);
127 
index_map_set(git_idxmap * map,git_index_entry * e,bool ignore_case)128 GIT_INLINE(int) index_map_set(git_idxmap *map, git_index_entry *e, bool ignore_case)
129 {
130 	if (ignore_case)
131 		return git_idxmap_icase_set((git_idxmap_icase *) map, e, e);
132 	else
133 		return git_idxmap_set(map, e, e);
134 }
135 
index_map_delete(git_idxmap * map,git_index_entry * e,bool ignore_case)136 GIT_INLINE(int) index_map_delete(git_idxmap *map, git_index_entry *e, bool ignore_case)
137 {
138 	if (ignore_case)
139 		return git_idxmap_icase_delete((git_idxmap_icase *) map, e);
140 	else
141 		return git_idxmap_delete(map, e);
142 }
143 
index_map_resize(git_idxmap * map,size_t count,bool ignore_case)144 GIT_INLINE(int) index_map_resize(git_idxmap *map, size_t count, bool ignore_case)
145 {
146 	if (ignore_case)
147 		return git_idxmap_icase_resize((git_idxmap_icase *) map, count);
148 	else
149 		return git_idxmap_resize(map, count);
150 }
151 
git_index_entry_srch(const void * key,const void * array_member)152 int git_index_entry_srch(const void *key, const void *array_member)
153 {
154 	const struct entry_srch_key *srch_key = key;
155 	const struct entry_internal *entry = array_member;
156 	int cmp;
157 	size_t len1, len2, len;
158 
159 	len1 = srch_key->pathlen;
160 	len2 = entry->pathlen;
161 	len = len1 < len2 ? len1 : len2;
162 
163 	cmp = memcmp(srch_key->path, entry->path, len);
164 	if (cmp)
165 		return cmp;
166 	if (len1 < len2)
167 		return -1;
168 	if (len1 > len2)
169 		return 1;
170 
171 	if (srch_key->stage != GIT_INDEX_STAGE_ANY)
172 		return srch_key->stage - GIT_INDEX_ENTRY_STAGE(&entry->entry);
173 
174 	return 0;
175 }
176 
git_index_entry_isrch(const void * key,const void * array_member)177 int git_index_entry_isrch(const void *key, const void *array_member)
178 {
179 	const struct entry_srch_key *srch_key = key;
180 	const struct entry_internal *entry = array_member;
181 	int cmp;
182 	size_t len1, len2, len;
183 
184 	len1 = srch_key->pathlen;
185 	len2 = entry->pathlen;
186 	len = len1 < len2 ? len1 : len2;
187 
188 	cmp = strncasecmp(srch_key->path, entry->path, len);
189 
190 	if (cmp)
191 		return cmp;
192 	if (len1 < len2)
193 		return -1;
194 	if (len1 > len2)
195 		return 1;
196 
197 	if (srch_key->stage != GIT_INDEX_STAGE_ANY)
198 		return srch_key->stage - GIT_INDEX_ENTRY_STAGE(&entry->entry);
199 
200 	return 0;
201 }
202 
index_entry_srch_path(const void * path,const void * array_member)203 static int index_entry_srch_path(const void *path, const void *array_member)
204 {
205 	const git_index_entry *entry = array_member;
206 
207 	return strcmp((const char *)path, entry->path);
208 }
209 
index_entry_isrch_path(const void * path,const void * array_member)210 static int index_entry_isrch_path(const void *path, const void *array_member)
211 {
212 	const git_index_entry *entry = array_member;
213 
214 	return strcasecmp((const char *)path, entry->path);
215 }
216 
git_index_entry_cmp(const void * a,const void * b)217 int git_index_entry_cmp(const void *a, const void *b)
218 {
219 	int diff;
220 	const git_index_entry *entry_a = a;
221 	const git_index_entry *entry_b = b;
222 
223 	diff = strcmp(entry_a->path, entry_b->path);
224 
225 	if (diff == 0)
226 		diff = (GIT_INDEX_ENTRY_STAGE(entry_a) - GIT_INDEX_ENTRY_STAGE(entry_b));
227 
228 	return diff;
229 }
230 
git_index_entry_icmp(const void * a,const void * b)231 int git_index_entry_icmp(const void *a, const void *b)
232 {
233 	int diff;
234 	const git_index_entry *entry_a = a;
235 	const git_index_entry *entry_b = b;
236 
237 	diff = strcasecmp(entry_a->path, entry_b->path);
238 
239 	if (diff == 0)
240 		diff = (GIT_INDEX_ENTRY_STAGE(entry_a) - GIT_INDEX_ENTRY_STAGE(entry_b));
241 
242 	return diff;
243 }
244 
conflict_name_cmp(const void * a,const void * b)245 static int conflict_name_cmp(const void *a, const void *b)
246 {
247 	const git_index_name_entry *name_a = a;
248 	const git_index_name_entry *name_b = b;
249 
250 	if (name_a->ancestor && !name_b->ancestor)
251 		return 1;
252 
253 	if (!name_a->ancestor && name_b->ancestor)
254 		return -1;
255 
256 	if (name_a->ancestor)
257 		return strcmp(name_a->ancestor, name_b->ancestor);
258 
259 	if (!name_a->ours || !name_b->ours)
260 		return 0;
261 
262 	return strcmp(name_a->ours, name_b->ours);
263 }
264 
/**
 * Case-insensitive counterpart of conflict_name_cmp(); it differs only in
 * using strcasecmp().  Compiled out for now.
 *
 * TODO: enable this when resolving case insensitive conflicts
 */
#if 0
static int conflict_name_icmp(const void *a, const void *b)
{
	const git_index_name_entry *name_a = a;
	const git_index_name_entry *name_b = b;

	if (name_a->ancestor && !name_b->ancestor)
		return 1;

	if (!name_a->ancestor && name_b->ancestor)
		return -1;

	if (name_a->ancestor)
		return strcasecmp(name_a->ancestor, name_b->ancestor);

	if (!name_a->ours || !name_b->ours)
		return 0;

	return strcasecmp(name_a->ours, name_b->ours);
}
#endif
289 
reuc_srch(const void * key,const void * array_member)290 static int reuc_srch(const void *key, const void *array_member)
291 {
292 	const git_index_reuc_entry *reuc = array_member;
293 
294 	return strcmp(key, reuc->path);
295 }
296 
reuc_isrch(const void * key,const void * array_member)297 static int reuc_isrch(const void *key, const void *array_member)
298 {
299 	const git_index_reuc_entry *reuc = array_member;
300 
301 	return strcasecmp(key, reuc->path);
302 }
303 
reuc_cmp(const void * a,const void * b)304 static int reuc_cmp(const void *a, const void *b)
305 {
306 	const git_index_reuc_entry *info_a = a;
307 	const git_index_reuc_entry *info_b = b;
308 
309 	return strcmp(info_a->path, info_b->path);
310 }
311 
reuc_icmp(const void * a,const void * b)312 static int reuc_icmp(const void *a, const void *b)
313 {
314 	const git_index_reuc_entry *info_a = a;
315 	const git_index_reuc_entry *info_b = b;
316 
317 	return strcasecmp(info_a->path, info_b->path);
318 }
319 
/*
 * Release a REUC entry.  The path lives in the same allocation (see
 * reuc_entry_alloc()), so a single free is all that is needed.
 */
static void index_entry_reuc_free(git_index_reuc_entry *reuc)
{
	git__free(reuc);
}
324 
/*
 * Release an index entry; NULL is accepted and ignored.
 *
 * The object id is wiped before the memory is handed back.  git__memzero()
 * is used (as index_free() does) rather than memset(): a plain memset() on
 * memory that is freed immediately afterwards is a dead store the compiler
 * is allowed to remove.
 */
static void index_entry_free(git_index_entry *entry)
{
	if (!entry)
		return;

	git__memzero(&entry->id, sizeof(entry->id));
	git__free(entry);
}
333 
git_index__create_mode(unsigned int mode)334 unsigned int git_index__create_mode(unsigned int mode)
335 {
336 	if (S_ISLNK(mode))
337 		return S_IFLNK;
338 
339 	if (S_ISDIR(mode) || (mode & S_IFMT) == (S_IFLNK | S_IFDIR))
340 		return (S_IFLNK | S_IFDIR);
341 
342 	return S_IFREG | GIT_PERMS_CANONICAL(mode);
343 }
344 
/*
 * Pick the mode to record for an entry, given the mode reported for the
 * file and the entry (if any) already in the index.
 *
 * For regular files only:
 *  - if the index has `no_symlinks` set and the existing entry is a symlink,
 *    the existing mode is kept;
 *  - if the index has `distrust_filemode` set, an existing regular-file mode
 *    is kept, otherwise the canonical form of 0666 is used.
 * In every other case the canonical form of `mode` is returned.
 */
static unsigned int index_merge_mode(
	git_index *index, git_index_entry *existing, unsigned int mode)
{
	if (!S_ISREG(mode))
		return git_index__create_mode(mode);

	if (index->no_symlinks && existing && S_ISLNK(existing->mode))
		return existing->mode;

	if (!index->distrust_filemode)
		return git_index__create_mode(mode);

	if (existing && S_ISREG(existing->mode))
		return existing->mode;

	return git_index__create_mode(0666);
}
358 
index_find_in_entries(size_t * out,git_vector * entries,git_vector_cmp entry_srch,const char * path,size_t path_len,int stage)359 GIT_INLINE(int) index_find_in_entries(
360 	size_t *out, git_vector *entries, git_vector_cmp entry_srch,
361 	const char *path, size_t path_len, int stage)
362 {
363 	struct entry_srch_key srch_key;
364 	srch_key.path = path;
365 	srch_key.pathlen = !path_len ? strlen(path) : path_len;
366 	srch_key.stage = stage;
367 	return git_vector_bsearch2(out, entries, entry_srch, &srch_key);
368 }
369 
index_find(size_t * out,git_index * index,const char * path,size_t path_len,int stage)370 GIT_INLINE(int) index_find(
371 	size_t *out, git_index *index,
372 	const char *path, size_t path_len, int stage)
373 {
374 	git_vector_sort(&index->entries);
375 
376 	return index_find_in_entries(
377 		out, &index->entries, index->entries_search, path, path_len, stage);
378 }
379 
/*
 * Switch the index between case-sensitive and case-insensitive operation:
 * record the flag, install the matching search/compare callbacks, and
 * re-sort the entry and REUC vectors under the new comparators.
 */
void git_index__set_ignore_case(git_index *index, bool ignore_case)
{
	git_vector_cmp entries_order, reuc_order;

	index->ignore_case = ignore_case;

	if (ignore_case) {
		index->entries_cmp_path    = git__strcasecmp_cb;
		index->entries_search      = git_index_entry_isrch;
		index->entries_search_path = index_entry_isrch_path;
		index->reuc_search         = reuc_isrch;

		entries_order = git_index_entry_icmp;
		reuc_order    = reuc_icmp;
	} else {
		index->entries_cmp_path    = git__strcmp_cb;
		index->entries_search      = git_index_entry_srch;
		index->entries_search_path = index_entry_srch_path;
		index->reuc_search         = reuc_srch;

		entries_order = git_index_entry_cmp;
		reuc_order    = reuc_cmp;
	}

	git_vector_set_cmp(&index->entries, entries_order);
	git_vector_sort(&index->entries);

	git_vector_set_cmp(&index->reuc, reuc_order);
	git_vector_sort(&index->reuc);
}
403 
/*
 * Allocate a new index object.
 *
 * When `index_path` is non-NULL it is duplicated into the index and the
 * file is read with force; when it is NULL the index has no backing path.
 * On success `*index_out` receives the index with its refcount incremented
 * and 0 is returned.  On failure the partially built index is released and
 * a negative value is returned.
 */
int git_index_open(git_index **index_out, const char *index_path)
{
	git_index *idx;
	int error = -1;

	GIT_ASSERT_ARG(index_out);

	idx = git__calloc(1, sizeof(*idx));
	GIT_ERROR_CHECK_ALLOC(idx);

	if (git_pool_init(&idx->tree_pool, 1) < 0)
		goto fail;

	if (index_path != NULL) {
		if ((idx->index_file_path = git__strdup(index_path)) == NULL)
			goto fail;

		/* Check if index file is stored on disk already */
		if (git_path_exists(idx->index_file_path))
			idx->on_disk = 1;
	}

	if (git_vector_init(&idx->entries, 32, git_index_entry_cmp) < 0)
		goto fail;
	if (git_idxmap_new(&idx->entries_map) < 0)
		goto fail;
	if (git_vector_init(&idx->names, 8, conflict_name_cmp) < 0)
		goto fail;
	if (git_vector_init(&idx->reuc, 8, reuc_cmp) < 0)
		goto fail;
	if (git_vector_init(&idx->deleted, 8, git_index_entry_cmp) < 0)
		goto fail;

	/* a fresh index starts out case-sensitive */
	idx->entries_cmp_path = git__strcmp_cb;
	idx->entries_search = git_index_entry_srch;
	idx->entries_search_path = index_entry_srch_path;
	idx->reuc_search = reuc_srch;
	idx->version = INDEX_VERSION_NUMBER_DEFAULT;

	if (index_path != NULL) {
		error = git_index_read(idx, true);
		if (error < 0)
			goto fail;
	}

	*index_out = idx;
	GIT_REFCOUNT_INC(idx);

	return 0;

fail:
	git_pool_clear(&idx->tree_pool);
	git_index_free(idx);
	return error;
}
453 
/* Create an index with no backing file: git_index_open() with a NULL path. */
int git_index_new(git_index **out)
{
	const char *no_path = NULL;

	return git_index_open(out, no_path);
}
458 
/*
 * Destroy an index: clear its contents, release the map, the vectors and
 * the path string, then wipe and free the object itself.
 */
static void index_free(git_index *index)
{
	/* index iterators increment the refcount of the index, so if we
	 * get here then there should be no outstanding iterators.
	 */
	if (git_atomic32_get(&index->readers) != 0)
		return;

	git_index_clear(index);

	git_idxmap_free(index->entries_map);

	git_vector_free(&index->entries);
	git_vector_free(&index->names);
	git_vector_free(&index->reuc);
	git_vector_free(&index->deleted);

	git__free(index->index_file_path);

	/* scrub the struct before handing the memory back */
	git__memzero(index, sizeof(*index));
	git__free(index);
}
479 
/*
 * Drop one reference to `index` via GIT_REFCOUNT_DEC, naming index_free()
 * as the destructor.  NULL is accepted and ignored.
 */
void git_index_free(git_index *index)
{
	if (index != NULL) {
		GIT_REFCOUNT_DEC(index, index_free);
	}
}
487 
488 /* call with locked index */
index_free_deleted(git_index * index)489 static void index_free_deleted(git_index *index)
490 {
491 	int readers = (int)git_atomic32_get(&index->readers);
492 	size_t i;
493 
494 	if (readers > 0 || !index->deleted.length)
495 		return;
496 
497 	for (i = 0; i < index->deleted.length; ++i) {
498 		git_index_entry *ie = git_atomic_swap(index->deleted.contents[i], NULL);
499 		index_entry_free(ie);
500 	}
501 
502 	git_vector_clear(&index->deleted);
503 }
504 
505 /* call with locked index */
index_remove_entry(git_index * index,size_t pos)506 static int index_remove_entry(git_index *index, size_t pos)
507 {
508 	int error = 0;
509 	git_index_entry *entry = git_vector_get(&index->entries, pos);
510 
511 	if (entry != NULL) {
512 		git_tree_cache_invalidate_path(index->tree, entry->path);
513 		index_map_delete(index->entries_map, entry, index->ignore_case);
514 	}
515 
516 	error = git_vector_remove(&index->entries, pos);
517 
518 	if (!error) {
519 		if (git_atomic32_get(&index->readers) > 0) {
520 			error = git_vector_insert(&index->deleted, entry);
521 		} else {
522 			index_entry_free(entry);
523 		}
524 
525 		index->dirty = 1;
526 	}
527 
528 	return error;
529 }
530 
/*
 * Empty the index: drop the tree cache, remove every entry (last to first),
 * free parked deleted entries, clear the name and REUC data and reset the
 * file stamp.  The index is marked dirty.  Returns 0 on success or the
 * first error encountered.
 */
int git_index_clear(git_index *index)
{
	int error = 0;

	GIT_ASSERT_ARG(index);

	index->dirty = 1;
	index->tree = NULL;
	git_pool_clear(&index->tree_pool);

	git_idxmap_clear(index->entries_map);

	while (index->entries.length > 0) {
		error = index_remove_entry(index, index->entries.length - 1);
		if (error)
			return error;
	}

	index_free_deleted(index);

	if ((error = git_index_name_clear(index)) < 0)
		return error;

	if ((error = git_index_reuc_clear(index)) < 0)
		return error;

	git_futils_filestamp_set(&index->stamp, NULL);

	return error;
}
559 
create_index_error(int error,const char * msg)560 static int create_index_error(int error, const char *msg)
561 {
562 	git_error_set_str(GIT_ERROR_INDEX, msg);
563 	return error;
564 }
565 
/*
 * Set the index capabilities.
 *
 * With GIT_INDEX_CAPABILITY_FROM_OWNER the three settings are taken from
 * the owning repository's configmap (a lookup that fails leaves the
 * corresponding setting untouched); an index without an owner is an error.
 * Otherwise `caps` is read as a bitmask of GIT_INDEX_CAPABILITY_* flags.
 * If the ignore-case setting changed, the comparators are re-installed.
 */
int git_index_set_caps(git_index *index, int caps)
{
	unsigned int prev_ignore_case;

	GIT_ASSERT_ARG(index);

	prev_ignore_case = index->ignore_case;

	if (caps != GIT_INDEX_CAPABILITY_FROM_OWNER) {
		index->ignore_case = ((caps & GIT_INDEX_CAPABILITY_IGNORE_CASE) != 0);
		index->distrust_filemode = ((caps & GIT_INDEX_CAPABILITY_NO_FILEMODE) != 0);
		index->no_symlinks = ((caps & GIT_INDEX_CAPABILITY_NO_SYMLINKS) != 0);
	} else {
		git_repository *repo = INDEX_OWNER(index);
		int val;

		if (!repo)
			return create_index_error(
				-1, "cannot access repository to set index caps");

		if (git_repository__configmap_lookup(&val, repo, GIT_CONFIGMAP_IGNORECASE) == 0)
			index->ignore_case = (val != 0);

		if (git_repository__configmap_lookup(&val, repo, GIT_CONFIGMAP_FILEMODE) == 0)
			index->distrust_filemode = (val == 0);

		if (git_repository__configmap_lookup(&val, repo, GIT_CONFIGMAP_SYMLINKS) == 0)
			index->no_symlinks = (val == 0);
	}

	if (index->ignore_case != prev_ignore_case)
		git_index__set_ignore_case(index, (bool)index->ignore_case);

	return 0;
}
601 
git_index_caps(const git_index * index)602 int git_index_caps(const git_index *index)
603 {
604 	return ((index->ignore_case ? GIT_INDEX_CAPABILITY_IGNORE_CASE : 0) |
605 			(index->distrust_filemode ? GIT_INDEX_CAPABILITY_NO_FILEMODE : 0) |
606 			(index->no_symlinks ? GIT_INDEX_CAPABILITY_NO_SYMLINKS : 0));
607 }
608 
git_index_checksum(git_index * index)609 const git_oid *git_index_checksum(git_index *index)
610 {
611 	return &index->checksum;
612 }
613 
614 /**
615  * Returns 1 for changed, 0 for not changed and <0 for errors
616  */
compare_checksum(git_index * index)617 static int compare_checksum(git_index *index)
618 {
619 	int fd;
620 	ssize_t bytes_read;
621 	git_oid checksum = {{ 0 }};
622 
623 	if ((fd = p_open(index->index_file_path, O_RDONLY)) < 0)
624 		return fd;
625 
626 	if (p_lseek(fd, -20, SEEK_END) < 0) {
627 		p_close(fd);
628 		git_error_set(GIT_ERROR_OS, "failed to seek to end of file");
629 		return -1;
630 	}
631 
632 	bytes_read = p_read(fd, &checksum, GIT_OID_RAWSZ);
633 	p_close(fd);
634 
635 	if (bytes_read < 0)
636 		return -1;
637 
638 	return !!git_oid_cmp(&checksum, &index->checksum);
639 }
640 
/*
 * Refresh the in-memory index from its file.
 *
 * - An index without a file path cannot be read; an error is returned.
 * - If the file does not exist, the index is cleared when `force` is set,
 *   marked clean, and 0 is returned.
 * - Otherwise the file is re-parsed when its checksum differs from the one
 *   in memory, or unconditionally when `force` is set.
 *
 * Returns 0 on success (including "nothing to do") and a negative value on
 * failure.
 */
int git_index_read(git_index *index, int force)
{
	int error = 0, updated;
	git_buf buffer = GIT_BUF_INIT;
	git_futils_filestamp stamp = index->stamp;

	if (!index->index_file_path)
		return create_index_error(-1,
			"failed to read index: The index is in-memory only");

	index->on_disk = git_path_exists(index->index_file_path);

	if (!index->on_disk) {
		if (force && (error = git_index_clear(index)) < 0)
			return error;

		index->dirty = 0;
		return 0;
	}

	/*
	 * The assignment must be parenthesised before the comparison:
	 * `updated = f() < 0` stores the boolean result, which made a failing
	 * filestamp check return 1 instead of a negative error code.
	 */
	if ((updated = git_futils_filestamp_check(&stamp, index->index_file_path)) < 0 ||
	    ((updated = compare_checksum(index)) < 0)) {
		git_error_set(
			GIT_ERROR_INDEX,
			"failed to read index: '%s' no longer exists",
			index->index_file_path);
		return updated;
	}

	if (!updated && !force)
		return 0;

	error = git_futils_readbuffer(&buffer, index->index_file_path);
	if (error < 0)
		return error;

	index->tree = NULL;
	git_pool_clear(&index->tree_pool);

	error = git_index_clear(index);

	if (!error)
		error = parse_index(index, buffer.ptr, buffer.size);

	/* only adopt the new stamp once the contents were parsed successfully */
	if (!error) {
		git_futils_filestamp_set(&index->stamp, &stamp);
		index->dirty = 0;
	}

	git_buf_dispose(&buffer);
	return error;
}
693 
/*
 * Non-forced git_index_read() that refuses to run (GIT_EINDEXDIRTY) when
 * unsaved-safety enforcement is on and the index has unsaved changes.
 */
int git_index_read_safely(git_index *index)
{
	bool would_clobber = git_index__enforce_unsaved_safety && index->dirty;

	if (!would_clobber)
		return git_index_read(index, false);

	git_error_set(GIT_ERROR_INDEX,
		"the index has unsaved changes that would be overwritten by this operation");
	return GIT_EINDEXDIRTY;
}
704 
/*
 * Tell whether the index checksum differs from `checksum`, after a
 * best-effort, non-forced refresh from disk.  Returns 1 if it differs and
 * 0 if it matches.
 */
int git_index__changed_relative_to(
	git_index *index, const git_oid *checksum)
{
	int refresh = git_index_read(index, false);

	/* attempt to update index (ignoring errors) */
	if (refresh < 0)
		git_error_clear();

	return git_oid_cmp(&index->checksum, checksum) != 0;
}
714 
/*
 * An entry is racy when git_index_entry_newer_than_index() says so;
 * gitlink entries are never considered racy.
 */
static bool is_racy_entry(git_index *index, const git_index_entry *entry)
{
	/* Git special-cases submodules in the check */
	return S_ISGITLINK(entry->mode)
		? false
		: git_index_entry_newer_than_index(entry, index);
}
723 
724 /*
725  * Force the next diff to take a look at those entries which have the
726  * same timestamp as the current index.
727  */
truncate_racily_clean(git_index * index)728 static int truncate_racily_clean(git_index *index)
729 {
730 	size_t i;
731 	int error;
732 	git_index_entry *entry;
733 	git_diff_options diff_opts = GIT_DIFF_OPTIONS_INIT;
734 	git_diff *diff = NULL;
735 	git_vector paths = GIT_VECTOR_INIT;
736 	git_diff_delta *delta;
737 
738 	/* Nothing to do if there's no repo to talk about */
739 	if (!INDEX_OWNER(index))
740 		return 0;
741 
742 	/* If there's no workdir, we can't know where to even check */
743 	if (!git_repository_workdir(INDEX_OWNER(index)))
744 		return 0;
745 
746 	diff_opts.flags |= GIT_DIFF_INCLUDE_TYPECHANGE | GIT_DIFF_IGNORE_SUBMODULES | GIT_DIFF_DISABLE_PATHSPEC_MATCH;
747 	git_vector_foreach(&index->entries, i, entry) {
748 		if ((entry->flags_extended & GIT_INDEX_ENTRY_UPTODATE) == 0 &&
749 			is_racy_entry(index, entry))
750 			git_vector_insert(&paths, (char *)entry->path);
751 	}
752 
753 	if (paths.length == 0)
754 		goto done;
755 
756 	diff_opts.pathspec.count = paths.length;
757 	diff_opts.pathspec.strings = (char **)paths.contents;
758 
759 	if ((error = git_diff_index_to_workdir(&diff, INDEX_OWNER(index), index, &diff_opts)) < 0)
760 		return error;
761 
762 	git_vector_foreach(&diff->deltas, i, delta) {
763 		entry = (git_index_entry *)git_index_get_bypath(index, delta->old_file.path, 0);
764 
765 		/* Ensure that we have a stage 0 for this file (ie, it's not a
766 		 * conflict), otherwise smudging it is quite pointless.
767 		 */
768 		if (entry) {
769 			entry->file_size = 0;
770 			index->dirty = 1;
771 		}
772 	}
773 
774 done:
775 	git_diff_free(diff);
776 	git_vector_free(&paths);
777 	return 0;
778 }
779 
/* Return the format version number currently set on the index. */
unsigned git_index_version(git_index *index)
{
	unsigned current;

	GIT_ASSERT_ARG(index);

	current = index->version;
	return current;
}
786 
/*
 * Set the index format version.  Values outside
 * [INDEX_VERSION_NUMBER_LB, INDEX_VERSION_NUMBER_UB] are rejected with -1.
 */
int git_index_set_version(git_index *index, unsigned int version)
{
	bool in_range;

	GIT_ASSERT_ARG(index);

	in_range = (version >= INDEX_VERSION_NUMBER_LB &&
		    version <= INDEX_VERSION_NUMBER_UB);

	if (!in_range) {
		git_error_set(GIT_ERROR_INDEX, "invalid version number");
		return -1;
	}

	index->version = version;

	return 0;
}
801 
/*
 * Write the index out through a git_indexwriter.  Racily-clean entries are
 * smudged first (the result of that step is not checked).  The dirty flag
 * is cleared only when both the writer init and the commit succeed.
 */
int git_index_write(git_index *index)
{
	git_indexwriter writer = GIT_INDEXWRITER_INIT;
	int error;

	truncate_racily_clean(index);

	error = git_indexwriter_init(&writer, index);

	if (error == 0)
		error = git_indexwriter_commit(&writer);

	if (error == 0)
		index->dirty = 0;

	git_indexwriter_cleanup(&writer);

	return error;
}
817 
git_index_path(const git_index * index)818 const char *git_index_path(const git_index *index)
819 {
820 	GIT_ASSERT_ARG_WITH_RETVAL(index, NULL);
821 	return index->index_file_path;
822 }
823 
/*
 * Write the index as a tree into the repository that owns it, storing the
 * tree id in `oid`.  Fails with -1 when the index has no owner.
 */
int git_index_write_tree(git_oid *oid, git_index *index)
{
	git_repository *owner;

	GIT_ASSERT_ARG(oid);
	GIT_ASSERT_ARG(index);

	owner = INDEX_OWNER(index);

	if (owner != NULL)
		return git_tree__write_index(oid, index, owner);

	return create_index_error(-1, "Failed to write tree. "
	  "the index file is not backed up by an existing repository");
}
839 
/*
 * Write the index as a tree into an explicitly given repository, storing
 * the tree id in `oid`.
 */
int git_index_write_tree_to(
	git_oid *oid, git_index *index, git_repository *repo)
{
	int error;

	GIT_ASSERT_ARG(oid);
	GIT_ASSERT_ARG(index);
	GIT_ASSERT_ARG(repo);

	error = git_tree__write_index(oid, index, repo);
	return error;
}
849 
git_index_entrycount(const git_index * index)850 size_t git_index_entrycount(const git_index *index)
851 {
852 	GIT_ASSERT_ARG(index);
853 
854 	return index->entries.length;
855 }
856 
git_index_get_byindex(git_index * index,size_t n)857 const git_index_entry *git_index_get_byindex(
858 	git_index *index, size_t n)
859 {
860 	GIT_ASSERT_ARG_WITH_RETVAL(index, NULL);
861 
862 	git_vector_sort(&index->entries);
863 	return git_vector_get(&index->entries, n);
864 }
865 
git_index_get_bypath(git_index * index,const char * path,int stage)866 const git_index_entry *git_index_get_bypath(
867 	git_index *index, const char *path, int stage)
868 {
869 	git_index_entry key = {{ 0 }};
870 	git_index_entry *value;
871 
872 	GIT_ASSERT_ARG_WITH_RETVAL(index, NULL);
873 
874 	key.path = path;
875 	GIT_INDEX_ENTRY_STAGE_SET(&key, stage);
876 
877 	if (index->ignore_case)
878 		value = git_idxmap_icase_get((git_idxmap_icase *) index->entries_map, &key);
879 	else
880 		value = git_idxmap_get(index->entries_map, &key);
881 
882 	if (!value) {
883 	    git_error_set(GIT_ERROR_INDEX, "index does not contain '%s'", path);
884 	    return NULL;
885 	}
886 
887 	return value;
888 }
889 
/*
 * Fill the stat-derived fields of `entry` from `st`.
 *
 * Times and size are narrowed to 32 bits.  When `trust_mode` is false,
 * regular files get the canonical form of 0666 instead of the mode from
 * `st`.  Nanosecond fields are only written when GIT_USE_NSEC is defined.
 */
void git_index_entry__init_from_stat(
	git_index_entry *entry, struct stat *st, bool trust_mode)
{
	bool override_mode = (!trust_mode && S_ISREG(st->st_mode));

	entry->ctime.seconds = (int32_t)st->st_ctime;
	entry->mtime.seconds = (int32_t)st->st_mtime;
#if defined(GIT_USE_NSEC)
	entry->mtime.nanoseconds = st->st_mtime_nsec;
	entry->ctime.nanoseconds = st->st_ctime_nsec;
#endif
	entry->dev  = st->st_rdev;
	entry->ino  = st->st_ino;

	if (override_mode)
		entry->mode = git_index__create_mode(0666);
	else
		entry->mode = git_index__create_mode(st->st_mode);

	entry->uid  = st->st_uid;
	entry->gid  = st->st_gid;
	entry->file_size = (uint32_t)st->st_size;
}
907 
/*
 * Store the path length in the name bits of `entry->flags`.  Lengths that
 * do not fit below GIT_INDEX_ENTRY_NAMEMASK are recorded as the mask value
 * itself.
 */
static void index_entry_adjust_namemask(
		git_index_entry *entry,
		size_t path_length)
{
	size_t stored_length = (path_length < GIT_INDEX_ENTRY_NAMEMASK) ?
		path_length : GIT_INDEX_ENTRY_NAMEMASK;

	entry->flags &= ~GIT_INDEX_ENTRY_NAMEMASK;
	entry->flags |= stored_length & GIT_INDEX_ENTRY_NAMEMASK;
}
919 
920 /* When `from_workdir` is true, we will validate the paths to avoid placing
921  * paths that are invalid for the working directory on the current filesystem
922  * (eg, on Windows, we will disallow `GIT~1`, `AUX`, `COM1`, etc).  This
923  * function will *always* prevent `.git` and directory traversal `../` from
924  * being added to the index.
925  */
index_entry_create(git_index_entry ** out,git_repository * repo,const char * path,struct stat * st,bool from_workdir)926 static int index_entry_create(
927 	git_index_entry **out,
928 	git_repository *repo,
929 	const char *path,
930 	struct stat *st,
931 	bool from_workdir)
932 {
933 	size_t pathlen = strlen(path), alloclen;
934 	struct entry_internal *entry;
935 	unsigned int path_valid_flags = GIT_PATH_REJECT_INDEX_DEFAULTS;
936 	uint16_t mode = 0;
937 
938 	/* always reject placing `.git` in the index and directory traversal.
939 	 * when requested, disallow platform-specific filenames and upgrade to
940 	 * the platform-specific `.git` tests (eg, `git~1`, etc).
941 	 */
942 	if (from_workdir)
943 		path_valid_flags |= GIT_PATH_REJECT_WORKDIR_DEFAULTS;
944 	if (st)
945 		mode = st->st_mode;
946 
947 	if (!git_path_validate(repo, path, mode, path_valid_flags)) {
948 		git_error_set(GIT_ERROR_INDEX, "invalid path: '%s'", path);
949 		return -1;
950 	}
951 
952 	GIT_ERROR_CHECK_ALLOC_ADD(&alloclen, sizeof(struct entry_internal), pathlen);
953 	GIT_ERROR_CHECK_ALLOC_ADD(&alloclen, alloclen, 1);
954 	entry = git__calloc(1, alloclen);
955 	GIT_ERROR_CHECK_ALLOC(entry);
956 
957 	entry->pathlen = pathlen;
958 	memcpy(entry->path, path, pathlen);
959 	entry->entry.path = entry->path;
960 
961 	*out = (git_index_entry *)entry;
962 	return 0;
963 }
964 
/*
 * Build a new index entry for the working-directory file `rel_path`.
 *
 * The file is lstat'ed, an entry is allocated (with workdir path
 * validation), the file is written as a blob and the entry is filled with
 * the blob id and stat data.  The index must be owned by a non-bare
 * repository.  Returns 0 and stores the entry in `*entry_out`, or a
 * negative value on failure.
 */
static int index_entry_init(
	git_index_entry **entry_out,
	git_index *index,
	const char *rel_path)
{
	git_repository *repo = INDEX_OWNER(index);
	git_index_entry *entry = NULL;
	git_buf path = GIT_BUF_INIT;
	struct stat st;
	git_oid oid;
	int error = 0;

	if (repo == NULL)
		return create_index_error(-1,
			"could not initialize index entry. "
			"Index is not backed up by an existing repository.");

	/*
	 * FIXME: this is duplicated with the work in
	 * git_blob__create_from_paths. It should accept an optional stat
	 * structure so we can pass in the one we have to do here.
	 */
	if (git_repository__ensure_not_bare(repo, "create blob from file") < 0)
		return GIT_EBAREREPO;

	if (git_repository_workdir_path(&path, repo, rel_path) < 0)
		return -1;

	/* the full path is only needed for the lstat call */
	error = git_path_lstat(path.ptr, &st);
	git_buf_dispose(&path);

	if (error < 0)
		return error;

	if (index_entry_create(&entry, repo, rel_path, &st, true) < 0)
		return -1;

	/* write the blob to disk and get the oid and stat info */
	error = git_blob__create_from_paths(
		&oid, &st, repo, NULL, rel_path, 0, true);

	if (error < 0) {
		index_entry_free(entry);
		return error;
	}

	entry->id = oid;
	git_index_entry__init_from_stat(entry, &st, !index->distrust_filemode);

	*entry_out = entry;
	return 0;
}
1018 
reuc_entry_alloc(const char * path)1019 static git_index_reuc_entry *reuc_entry_alloc(const char *path)
1020 {
1021 	size_t pathlen = strlen(path),
1022 		structlen = sizeof(struct reuc_entry_internal),
1023 		alloclen;
1024 	struct reuc_entry_internal *entry;
1025 
1026 	if (GIT_ADD_SIZET_OVERFLOW(&alloclen, structlen, pathlen) ||
1027 		GIT_ADD_SIZET_OVERFLOW(&alloclen, alloclen, 1))
1028 		return NULL;
1029 
1030 	entry = git__calloc(1, alloclen);
1031 	if (!entry)
1032 		return NULL;
1033 
1034 	entry->pathlen = pathlen;
1035 	memcpy(entry->path, path, pathlen);
1036 	entry->entry.path = entry->path;
1037 
1038 	return (git_index_reuc_entry *)entry;
1039 }
1040 
/*
 * Allocate a REUC entry for `path` and record the mode of each of the
 * three sides (ancestor, ours, theirs).  A side's object id is copied only
 * when its stored mode is greater than zero, in which case the matching
 * oid argument must be non-NULL.
 *
 * `*reuc_out` is assigned before any check is made, so it holds the
 * allocation result even when this function reports a failure.
 */
static int index_entry_reuc_init(git_index_reuc_entry **reuc_out,
	const char *path,
	int ancestor_mode, const git_oid *ancestor_oid,
	int our_mode, const git_oid *our_oid,
	int their_mode, const git_oid *their_oid)
{
	git_index_reuc_entry *reuc = NULL;

	GIT_ASSERT_ARG(reuc_out);
	GIT_ASSERT_ARG(path);

	reuc = reuc_entry_alloc(path);
	*reuc_out = reuc;
	GIT_ERROR_CHECK_ALLOC(reuc);

	/* index 0: common ancestor (test the stored value, not the argument) */
	reuc->mode[0] = ancestor_mode;
	if (reuc->mode[0] > 0) {
		GIT_ASSERT(ancestor_oid);
		git_oid_cpy(&reuc->oid[0], ancestor_oid);
	}

	/* index 1: our side */
	reuc->mode[1] = our_mode;
	if (reuc->mode[1] > 0) {
		GIT_ASSERT(our_oid);
		git_oid_cpy(&reuc->oid[1], our_oid);
	}

	/* index 2: their side */
	reuc->mode[2] = their_mode;
	if (reuc->mode[2] > 0) {
		GIT_ASSERT(their_oid);
		git_oid_cpy(&reuc->oid[2], their_oid);
	}

	return 0;
}
1072 
/*
 * Overwrite every field of `tgt` with the value from `src`, except for
 * `tgt->path`, which keeps pointing at the target's own path storage.
 */
static void index_entry_cpy(
	git_index_entry *tgt,
	const git_index_entry *src)
{
	const char *own_path = tgt->path;

	memcpy(tgt, src, sizeof(*tgt));

	/* the bulk copy clobbered the path pointer; put the original back */
	tgt->path = own_path;
}
1081 
/*
 * Create a new entry for `src->path` and copy all of `src`'s fields into
 * it (see index_entry_cpy).  Returns 0 on success, -1 if the entry could
 * not be created.
 */
static int index_entry_dup(
	git_index_entry **out,
	git_index *index,
	const git_index_entry *src)
{
	int created = index_entry_create(
		out, INDEX_OWNER(index), src->path, NULL, false);

	if (created < 0)
		return -1;

	index_entry_cpy(*out, src);
	return 0;
}
1093 
/*
 * Copy only the id, mode, flags and the GIT_INDEX_ENTRY_EXTENDED_FLAGS
 * subset of the extended flags from `src` to `tgt`.  All other fields of
 * `tgt` are left as they are.
 */
static void index_entry_cpy_nocache(
	git_index_entry *tgt,
	const git_index_entry *src)
{
	tgt->mode = src->mode;
	tgt->flags = src->flags;
	tgt->flags_extended =
		(src->flags_extended & GIT_INDEX_ENTRY_EXTENDED_FLAGS);

	git_oid_cpy(&tgt->id, &src->id);
}
1103 
/*
 * Create a new entry for `src->path` and copy only the fields handled by
 * index_entry_cpy_nocache into it.  Returns 0 on success, -1 if the entry
 * could not be created.
 */
static int index_entry_dup_nocache(
	git_index_entry **out,
	git_index *index,
	const git_index_entry *src)
{
	int created = index_entry_create(
		out, INDEX_OWNER(index), src->path, NULL, false);

	if (created < 0)
		return -1;

	index_entry_cpy_nocache(*out, src);
	return 0;
}
1115 
/*
 * Starting at `pos`, look for entries at the same stage whose path is
 * `entry->path` followed by '/', i.e. entries that treat the new entry's
 * name as a directory.
 *
 * Returns -1 as soon as one is found and `ok_to_replace` is zero.
 * Otherwise such entries are removed from the index and 0 is returned; a
 * failed removal stops the scan but is not reported.
 */
static int has_file_name(git_index *index,
	 const git_index_entry *entry, size_t pos, int ok_to_replace)
{
	const char *name = entry->path;
	size_t name_len = strlen(name);
	int stage = GIT_INDEX_ENTRY_STAGE(entry);

	while (pos < index->entries.length) {
		struct entry_internal *candidate = index->entries.contents[pos];

		/* stop at the first entry that is not longer than, or does not start with, name */
		if (name_len >= candidate->pathlen ||
		    memcmp(name, candidate->path, name_len) != 0)
			break;

		/* shares the prefix but is another stage or not "name/..." */
		if (GIT_INDEX_ENTRY_STAGE(&candidate->entry) != stage ||
		    candidate->path[name_len] != '/') {
			pos++;
			continue;
		}

		if (!ok_to_replace)
			return -1;

		/* after a removal the same position is examined again */
		if (index_remove_entry(index, pos) < 0)
			break;
	}

	return 0;
}
1142 
/*
 * Do we have another file whose pathname is a leading directory of the
 * name we're trying to add (that is, the new name up to one of its '/'
 * separators)?
 */
/*
 * Walk the '/' separators of `entry->path` from right to left.  For each
 * leading directory name, look for an index entry at the same stage whose
 * path is exactly that name.
 *
 * Returns -1 when such an entry exists and `ok_to_replace` is zero.
 * Otherwise the entry is removed and the walk continues; a failed removal
 * ends the walk without reporting an error.  Returns 0 in all other cases.
 */
static int has_dir_name(git_index *index,
		const git_index_entry *entry, int ok_to_replace)
{
	const char *name = entry->path;
	const char *cursor = name + strlen(name);
	int stage = GIT_INDEX_ENTRY_STAGE(entry);

	for (;;) {
		size_t dir_len, pos;

		/* step back to the previous '/'; done once the start is reached */
		do {
			cursor--;
			if (*cursor != '/' && cursor <= name)
				return 0;
		} while (*cursor != '/');

		dir_len = cursor - name;

		if (index_find(&pos, index, name, dir_len, stage) == 0) {
			if (!ok_to_replace)
				return -1;

			if (index_remove_entry(index, pos) < 0)
				break;
			continue;
		}

		/*
		 * Trivial optimization: if we find an entry that
		 * already matches the sub-directory, then we know
		 * we're ok, and we can exit.
		 */
		while (pos < index->entries.length) {
			struct entry_internal *p = index->entries.contents[pos];

			if (p->pathlen <= dir_len ||
			    p->path[dir_len] != '/' ||
			    memcmp(p->path, name, dir_len) != 0)
				break; /* not our subdirectory */

			if (GIT_INDEX_ENTRY_STAGE(&p->entry) == stage)
				return 0;

			pos++;
		}
	}

	return 0;
}
1194 
/*
 * Run both file/directory collision checks for `entry`.  has_dir_name is
 * only consulted when has_file_name did not already report a collision.
 *
 * Returns 0 when neither check fails; otherwise sets an index error
 * naming the path and returns -1.
 */
static int check_file_directory_collision(git_index *index,
		git_index_entry *entry, size_t pos, int ok_to_replace)
{
	bool collides =
		has_file_name(index, entry, pos, ok_to_replace) < 0 ||
		has_dir_name(index, entry, ok_to_replace) < 0;

	if (!collides)
		return 0;

	git_error_set(GIT_ERROR_INDEX,
		"'%s' appears as both a file and a directory", entry->path);
	return -1;
}
1207 
/*
 * When the index ignores case, rewrite leading bytes of `entry->path` in
 * place so that their case matches a path that is already in the index.
 *
 * - If `index->ignore_case` is not set, nothing is changed.
 * - If `existing` is given, its path bytes are copied over `entry->path`.
 * - Otherwise each "parent/" prefix of `entry->path` is looked up, deepest
 *   first, and the first prefix for which a stage-0 entry matches supplies
 *   the bytes copied over the start of `entry->path`.
 *
 * Returns 0 on success (including when nothing is changed) and -1 when the
 * scratch copy of the path cannot be allocated.
 */
static int canonicalize_directory_path(
	git_index *index,
	git_index_entry *entry,
	git_index_entry *existing)
{
	const git_index_entry *match, *best = NULL;
	char *search, *sep;
	size_t pos, search_len, best_len;

	if (!index->ignore_case)
		return 0;

	/* item already exists in the index, simply re-use the existing case */
	if (existing) {
		/*
		 * NOTE(review): copies strlen(existing->path) bytes and no
		 * terminator, so this presumes both paths have the same
		 * length -- confirm against the callers.
		 */
		memcpy((char *)entry->path, existing->path, strlen(existing->path));
		return 0;
	}

	/* nothing to do */
	if (strchr(entry->path, '/') == NULL)
		return 0;

	/* scratch copy that is truncated one path component per iteration */
	if ((search = git__strdup(entry->path)) == NULL)
		return -1;

	/* starting at the parent directory and descending to the root, find the
	 * common parent directory.
	 */
	while (!best && (sep = strrchr(search, '/'))) {
		/* keep the trailing '/' so the search key is "dir/" */
		sep[1] = '\0';

		search_len = strlen(search);

		/* result is ignored: only `pos` is used, as the scan start */
		git_vector_bsearch2(
			&pos, &index->entries, index->entries_search_path, search);

		while ((match = git_vector_get(&index->entries, pos))) {
			if (GIT_INDEX_ENTRY_STAGE(match) != 0) {
				/* conflicts do not contribute to canonical paths */
			} else if (strncmp(search, match->path, search_len) == 0) {
				/* prefer an exact match to the input filename */
				best = match;
				best_len = search_len;
				break;
			} else if (strncasecmp(search, match->path, search_len) == 0) {
				/* continue walking, there may be a path with an exact
				 * (case sensitive) match later in the index, but use this
				 * as the best match until that happens.
				 */
				if (!best) {
					best = match;
					best_len = search_len;
				}
			} else {
				break;
			}

			pos++;
		}

		/* drop the trailing '/' so the next strrchr finds the parent's */
		sep[0] = '\0';
	}

	/* only the matched directory prefix is rewritten, not the file name */
	if (best)
		memcpy((char *)entry->path, best->path, best_len);

	git__free(search);
	return 0;
}
1277 
index_no_dups(void ** old,void * new)1278 static int index_no_dups(void **old, void *new)
1279 {
1280 	const git_index_entry *entry = new;
1281 	GIT_UNUSED(old);
1282 	git_error_set(GIT_ERROR_INDEX, "'%s' appears multiple times at stage %d",
1283 		entry->path, GIT_INDEX_ENTRY_STAGE(entry));
1284 	return GIT_EEXISTS;
1285 }
1286 
/*
 * Look up `entry` (same path and stage) in the index.
 *
 * - On an exact hit, `*existing` and `*best` are both set to the entry
 *   found and `*existing_position` to its position.
 * - Otherwise `*existing` is NULL and `*existing_position` is 0.  If
 *   `entry` is a stage-0 entry, the entries with the same path starting at
 *   the position reported by index_find are scanned: `*best` becomes the
 *   first one that is not the ancestor stage, or the ancestor entry when
 *   nothing else with that path follows it.  `*best` is NULL when no entry
 *   shares the path.
 *
 * NOTE(review): on a miss `*existing_position` is 0 rather than the
 * position reported by index_find -- confirm that callers which use it as
 * a scan start expect that.
 */
static void index_existing_and_best(
	git_index_entry **existing,
	size_t *existing_position,
	git_index_entry **best,
	git_index *index,
	const git_index_entry *entry)
{
	int (*path_cmp)(const char *a, const char *b);
	size_t pos;

	if (index_find(&pos,
		index, entry->path, 0, GIT_INDEX_ENTRY_STAGE(entry)) == 0) {
		git_index_entry *found = index->entries.contents[pos];

		*existing = found;
		*existing_position = pos;
		*best = found;
		return;
	}

	*existing = NULL;
	*existing_position = 0;
	*best = NULL;

	/* only a regular (stage 0) entry looks at conflict entries */
	if (GIT_INDEX_ENTRY_STAGE(entry) != 0)
		return;

	path_cmp = index->ignore_case ? git__strcasecmp : git__strcmp;

	for (; pos < index->entries.length; pos++) {
		git_index_entry *candidate = index->entries.contents[pos];

		if (path_cmp(entry->path, candidate->path) != 0)
			break;

		*best = candidate;

		/* keep going past the ancestor in case another stage follows */
		if (GIT_INDEX_ENTRY_STAGE(candidate) != GIT_INDEX_STAGE_ANCESTOR)
			break;
	}
}
1332 
1333 /* index_insert takes ownership of the new entry - if it can't insert
1334  * it, then it will return an error **and also free the entry**.  When
1335  * it replaces an existing entry, it will update the entry_ptr with the
1336  * actual entry in the index (and free the passed in one).
1337  *
1338  * trust_path is whether we use the given path, or whether (on case
1339  * insensitive systems only) we try to canonicalize the given path to
1340  * be within an existing directory.
1341  *
1342  * trust_mode is whether we trust the mode in entry_ptr.
1343  *
1344  * trust_id is whether we trust the id or it should be validated.
1345  */
static int index_insert(
	git_index *index,
	git_index_entry **entry_ptr,
	int replace,
	bool trust_path,
	bool trust_mode,
	bool trust_id)
{
	git_index_entry *existing, *best, *entry;
	size_t path_length, position;
	int error;

	GIT_ASSERT_ARG(index);
	GIT_ASSERT_ARG(entry_ptr);

	/* work on the caller's entry; *entry_ptr is only rewritten further down */
	entry = *entry_ptr;

	/* Make sure that the path length flag is correct */
	path_length = ((struct entry_internal *)entry)->pathlen;
	index_entry_adjust_namemask(entry, path_length);

	/* This entry is now up-to-date and should not be checked for raciness */
	entry->flags_extended |= GIT_INDEX_ENTRY_UPTODATE;

	git_vector_sort(&index->entries);

	/*
	 * Look if an entry with this path already exists, either staged, or (if
	 * this entry is a regular staged item) as the "ours" side of a conflict.
	 */
	index_existing_and_best(&existing, &position, &best, index, entry);

	/* Update the file mode */
	entry->mode = trust_mode ?
		git_index__create_mode(entry->mode) :
		index_merge_mode(index, best, entry->mode);

	/* Canonicalize the directory name */
	if (!trust_path && (error = canonicalize_directory_path(index, entry, best)) < 0)
		goto out;

	/* Ensure that the given id exists (unless it's a submodule) */
	if (!trust_id && INDEX_OWNER(index) &&
	    (entry->mode & GIT_FILEMODE_COMMIT) != GIT_FILEMODE_COMMIT) {

		if (!git_object__is_valid(INDEX_OWNER(index), &entry->id,
					  git_object__type_from_filemode(entry->mode))) {
			error = -1;
			goto out;
		}
	}

	/* Look for tree / blob name collisions, removing conflicts if requested */
	if ((error = check_file_directory_collision(index, entry, position, replace)) < 0)
		goto out;

	/*
	 * If we are replacing an existing item, overwrite the existing entry
	 * and return it in place of the passed in one.
	 */
	if (existing) {
		if (replace) {
			index_entry_cpy(existing, entry);

			/*
			 * index_entry_cpy kept existing's own path pointer; when
			 * the caller's path is trusted, copy its bytes over the
			 * stored path as well.
			 */
			if (trust_path)
				memcpy((char *)existing->path, entry->path, strlen(entry->path));
		}

		/*
		 * Even without `replace` the passed-in entry is discarded and
		 * the caller is handed the entry that lives in the index.
		 */
		index_entry_free(entry);
		*entry_ptr = existing;
	} else {
		/*
		 * If replace is not requested or no existing entry exists, insert
		 * at the sorted position.  (Since we re-sort after each insert to
		 * check for dups, this is actually cheaper in the long run.)
		 *
		 * NOTE(review): if index_map_set fails after the vector insert
		 * succeeded, the `out` path below frees the entry while it is
		 * presumably still referenced by index->entries -- confirm.
		 */
		if ((error = git_vector_insert_sorted(&index->entries, entry, index_no_dups)) < 0 ||
		    (error = index_map_set(index->entries_map, entry, index->ignore_case)) < 0)
			goto out;
	}

	index->dirty = 1;

out:
	/* on failure the entry is released here and the caller's pointer cleared */
	if (error < 0) {
		index_entry_free(*entry_ptr);
		*entry_ptr = NULL;
	}

	return error;
}
1437 
/*
 * Move the conflict recorded for `path` into the REUC (resolve undo)
 * data: fetch the conflict's three sides, add a REUC record built from
 * their modes and ids (mode 0 and a NULL id for a missing side), then
 * remove the conflict entries.
 *
 * Returns the first negative result of those steps, otherwise the result
 * of git_index_conflict_remove.
 */
static int index_conflict_to_reuc(git_index *index, const char *path)
{
	const git_index_entry *ancestor, *ours, *theirs;
	int ancestor_mode = 0, our_mode = 0, their_mode = 0;
	git_oid const *ancestor_oid = NULL, *our_oid = NULL, *their_oid = NULL;
	int ret;

	ret = git_index_conflict_get(&ancestor, &ours, &theirs, index, path);
	if (ret < 0)
		return ret;

	if (ancestor != NULL) {
		ancestor_mode = ancestor->mode;
		ancestor_oid = &ancestor->id;
	}

	if (ours != NULL) {
		our_mode = ours->mode;
		our_oid = &ours->id;
	}

	if (theirs != NULL) {
		their_mode = theirs->mode;
		their_oid = &theirs->id;
	}

	ret = git_index_reuc_add(index, path, ancestor_mode, ancestor_oid,
		our_mode, our_oid, their_mode, their_oid);
	if (ret < 0)
		return ret;

	return git_index_conflict_remove(index, path);
}
1463 
is_file_or_link(const int filemode)1464 GIT_INLINE(bool) is_file_or_link(const int filemode)
1465 {
1466 	return (filemode == GIT_FILEMODE_BLOB ||
1467 		filemode == GIT_FILEMODE_BLOB_EXECUTABLE ||
1468 		filemode == GIT_FILEMODE_LINK);
1469 }
1470 
valid_filemode(const int filemode)1471 GIT_INLINE(bool) valid_filemode(const int filemode)
1472 {
1473 	return (is_file_or_link(filemode) || filemode == GIT_FILEMODE_COMMIT);
1474 }
1475 
/*
 * Add or update an index entry from an in-memory buffer.
 *
 * A copy of `source_entry` is made, `buffer` is written as a blob, and the
 * copy receives the blob's id and `len` as its file size before being
 * inserted with replacement enabled.  Any conflict recorded for the path
 * is then moved to the REUC data and the tree cache is invalidated for
 * the path.
 *
 * Fails with -1 when the index has no owning repository, when the entry's
 * mode is not a file or link mode, or when `len` exceeds UINT32_MAX.
 * Errors from the blob write, the insert and the conflict move are
 * returned as-is, except that GIT_ENOTFOUND from the conflict move is
 * ignored.
 */
int git_index_add_from_buffer(
    git_index *index, const git_index_entry *source_entry,
    const void *buffer, size_t len)
{
	git_index_entry *new_entry = NULL;
	git_oid blob_id;
	int error = 0;

	GIT_ASSERT_ARG(index);
	GIT_ASSERT_ARG(source_entry && source_entry->path);

	if (INDEX_OWNER(index) == NULL)
		return create_index_error(-1,
			"could not initialize index entry. "
			"Index is not backed up by an existing repository.");

	if (!is_file_or_link(source_entry->mode)) {
		git_error_set(GIT_ERROR_INDEX, "invalid filemode");
		return -1;
	}

	/* the size is stored below as a 32 bit value */
	if (len > UINT32_MAX) {
		git_error_set(GIT_ERROR_INDEX, "buffer is too large");
		return -1;
	}

	if (index_entry_dup(&new_entry, index, source_entry) < 0)
		return -1;

	error = git_blob_create_from_buffer(&blob_id, INDEX_OWNER(index), buffer, len);
	if (error < 0) {
		index_entry_free(new_entry);
		return error;
	}

	git_oid_cpy(&new_entry->id, &blob_id);
	new_entry->file_size = (uint32_t)len;

	/* index_insert releases the entry itself when it fails */
	error = index_insert(index, &new_entry, 1, true, true, true);
	if (error < 0)
		return error;

	/* Adding implies conflict was resolved, move conflict entries to REUC */
	error = index_conflict_to_reuc(index, new_entry->path);
	if (error < 0 && error != GIT_ENOTFOUND)
		return error;

	git_tree_cache_invalidate_path(index->tree, new_entry->path);
	return 0;
}
1524 
/*
 * Build an index entry for the repository located at `path` inside the
 * index owner's working directory.  The entry gets GIT_FILEMODE_COMMIT as
 * its mode and the target of that repository's HEAD as its id.
 *
 * On success the new entry is stored in `*out` and 0 is returned.  On
 * failure a negative value is returned, `*out` is left untouched, and
 * everything acquired along the way (path buffer, entry, opened
 * repository, HEAD reference) is released.
 */
static int add_repo_as_submodule(git_index_entry **out, git_index *index, const char *path)
{
	git_repository *sub = NULL;
	git_buf abspath = GIT_BUF_INIT;
	git_repository *repo = INDEX_OWNER(index);
	git_reference *head = NULL;
	git_index_entry *entry = NULL;
	struct stat st;
	int error;

	if ((error = git_repository_workdir_path(&abspath, repo, path)) < 0)
		goto cleanup;

	if (p_stat(abspath.ptr, &st) < 0) {
		git_error_set(GIT_ERROR_OS, "failed to stat repository dir");
		error = -1;
		goto cleanup;
	}

	if (index_entry_create(&entry, repo, path, &st, true) < 0) {
		error = -1;
		goto cleanup;
	}

	git_index_entry__init_from_stat(entry, &st, !index->distrust_filemode);

	if ((error = git_repository_open(&sub, abspath.ptr)) < 0)
		goto cleanup;

	if ((error = git_repository_head(&head, sub)) < 0)
		goto cleanup;

	git_oid_cpy(&entry->id, git_reference_target(head));
	entry->mode = GIT_FILEMODE_COMMIT;

	/* hand the entry to the caller so the cleanup below leaves it alone */
	*out = entry;
	entry = NULL;
	error = 0;

cleanup:
	if (entry != NULL)
		index_entry_free(entry);
	if (head != NULL)
		git_reference_free(head);
	if (sub != NULL)
		git_repository_free(sub);
	git_buf_dispose(&abspath);

	return error;
}
1564 
/*
 * Add or update the index entry for the working directory file `path`.
 *
 * When building or inserting the entry reports GIT_EDIRECTORY, the path is
 * looked up as a submodule instead:
 *  - lookup says GIT_ENOTFOUND: the original error is restored and returned;
 *  - lookup says GIT_EEXISTS: an entry for the repository at that path is
 *    built with add_repo_as_submodule and inserted;
 *  - lookup fails otherwise: that error is returned;
 *  - lookup succeeds: the submodule is added through
 *    git_submodule_add_to_index and its result is returned directly.
 *
 * After a successful insert, any conflict for `path` is moved to the REUC
 * data (GIT_ENOTFOUND from that step is ignored) and the tree cache is
 * invalidated for the entry's path.
 */
int git_index_add_bypath(git_index *index, const char *path)
{
	git_index_entry *entry = NULL;
	int ret;

	GIT_ASSERT_ARG(index);
	GIT_ASSERT_ARG(path);

	ret = index_entry_init(&entry, index, path);
	if (ret == 0)
		ret = index_insert(index, &entry, 1, false, false, true);

	if (ret == GIT_EDIRECTORY) {
		/* If we were given a directory, let's see if it's a submodule */
		git_submodule *sm;
		git_error_state saved_error;

		git_error_state_capture(&saved_error, ret);

		ret = git_submodule_lookup(&sm, INDEX_OWNER(index), path);
		if (ret == GIT_ENOTFOUND)
			return git_error_state_restore(&saved_error);

		git_error_state_free(&saved_error);

		if (ret != GIT_EEXISTS) {
			if (ret < 0)
				return ret;

			/* a known submodule: let the submodule code add it */
			ret = git_submodule_add_to_index(sm, false);
			git_submodule_free(sm);
			return ret;
		}

		/*
		 * EEXISTS means that there is a repository at that path, but it's not known
		 * as a submodule. We add its HEAD as an entry and don't register it.
		 */
		if ((ret = add_repo_as_submodule(&entry, index, path)) < 0)
			return ret;

		if ((ret = index_insert(index, &entry, 1, false, false, true)) < 0)
			return ret;
	} else if (ret < 0) {
		return ret;
	}

	/* Adding implies conflict was resolved, move conflict entries to REUC */
	ret = index_conflict_to_reuc(index, path);
	if (ret < 0 && ret != GIT_ENOTFOUND)
		return ret;

	git_tree_cache_invalidate_path(index->tree, entry->path);
	return 0;
}
1618 
/*
 * Remove the stage-0 entry for `path` and move any conflict recorded for
 * it to the REUC data.  GIT_ENOTFOUND from either step is not treated as
 * an error; any other negative result is returned as-is.
 */
int git_index_remove_bypath(git_index *index, const char *path)
{
	int ret;

	GIT_ASSERT_ARG(index);
	GIT_ASSERT_ARG(path);

	ret = git_index_remove(index, path, 0);
	if (ret < 0 && ret != GIT_ENOTFOUND)
		return ret;

	ret = index_conflict_to_reuc(index, path);
	if (ret < 0) {
		if (ret != GIT_ENOTFOUND)
			return ret;

		/* no conflict for this path: drop the error that was recorded */
		git_error_clear();
	}

	return 0;
}
1637 
/*
 * Append a copy of every entry in `source_entries` to `index`.
 *
 * Room is reserved in the entries vector and the entries map up front.
 * Each copy has its name mask adjusted, is flagged up to date, has its
 * mode normalized through git_index__create_mode, and is then added to
 * both the vector and the map.  The vector is sorted once at the end when
 * every entry was added successfully.
 *
 * Returns 0 on success (or when `source_entries` is empty) and a negative
 * value on the first failure.  Entries added before a failure stay in the
 * index.
 */
int git_index__fill(git_index *index, const git_vector *source_entries)
{
	const git_index_entry *source_entry = NULL;
	int error = 0;
	size_t i;

	GIT_ASSERT_ARG(index);
	GIT_ASSERT_ARG(source_entries);

	if (!source_entries->length)
		return 0;

	if (git_vector_size_hint(&index->entries, source_entries->length) < 0 ||
	    index_map_resize(index->entries_map, (size_t)(source_entries->length * 1.3),
			     index->ignore_case) < 0)
		return -1;

	git_vector_foreach(source_entries, i, source_entry) {
		git_index_entry *entry = NULL;

		if ((error = index_entry_dup(&entry, index, source_entry)) < 0)
			break;

		index_entry_adjust_namemask(entry, ((struct entry_internal *)entry)->pathlen);
		entry->flags_extended |= GIT_INDEX_ENTRY_UPTODATE;
		entry->mode = git_index__create_mode(entry->mode);

		if ((error = git_vector_insert(&index->entries, entry)) < 0) {
			/* the copy never made it into the index, so release it here */
			index_entry_free(entry);
			break;
		}

		/* from here on the entry is referenced by index->entries */
		if ((error = index_map_set(index->entries_map, entry, index->ignore_case)) < 0)
			break;

		index->dirty = 1;
	}

	if (!error)
		git_vector_sort(&index->entries);

	return error;
}
1678 
1679 
/*
 * Add or update an index entry from a caller-supplied entry.
 *
 * The entry's mode must be one accepted by valid_filemode.  A copy of
 * `source_entry` is inserted with replacement enabled; the path and mode
 * are trusted but the id is not.  The tree cache is invalidated for the
 * entry's path on success.
 *
 * Returns 0 on success, -1 for an invalid mode, or the error from the
 * copy or the insert.
 */
int git_index_add(git_index *index, const git_index_entry *source_entry)
{
	git_index_entry *entry = NULL;
	int ret;

	GIT_ASSERT_ARG(index);
	GIT_ASSERT_ARG(source_entry && source_entry->path);

	if (!valid_filemode(source_entry->mode)) {
		git_error_set(GIT_ERROR_INDEX, "invalid entry mode");
		return -1;
	}

	ret = index_entry_dup(&entry, index, source_entry);
	if (ret < 0)
		return ret;

	/* index_insert releases the entry itself when it fails */
	ret = index_insert(index, &entry, 1, true, true, false);
	if (ret < 0)
		return ret;

	git_tree_cache_invalidate_path(index->tree, entry->path);
	return 0;
}
1700 
/*
 * Remove the entry for `path` at `stage` from the index.
 *
 * The entry is first deleted from the entries map using a temporary key,
 * then located in the entries vector and removed there.  Returns
 * GIT_ENOTFOUND (with an error message set) when the vector holds no such
 * entry, otherwise the result of index_remove_entry.
 */
int git_index_remove(git_index *index, const char *path, int stage)
{
	git_index_entry remove_key = {{ 0 }};
	size_t position;

	/* the map lookup only needs a key carrying the path and the stage */
	remove_key.path = path;
	GIT_INDEX_ENTRY_STAGE_SET(&remove_key, stage);

	index_map_delete(index->entries_map, &remove_key, index->ignore_case);

	if (index_find(&position, index, path, 0, stage) < 0) {
		git_error_set(
			GIT_ERROR_INDEX, "index does not contain %s at stage %d", path, stage);
		return GIT_ENOTFOUND;
	}

	return index_remove_entry(index, position);
}
1722 
/*
 * Remove every entry at `stage` whose path starts with `dir` in directory
 * form (as produced by git_path_to_dir).  Entries under the directory at
 * other stages are skipped.
 *
 * Returns 0 on success or the first non-zero result from building the
 * prefix or from removing an entry.
 */
int git_index_remove_directory(git_index *index, const char *dir, int stage)
{
	git_buf prefix = GIT_BUF_INIT;
	git_index_entry *current;
	size_t pos;
	int error;

	if ((error = git_buf_sets(&prefix, dir)) != 0 ||
	    (error = git_path_to_dir(&prefix)) != 0)
		goto done;

	/* result is ignored: only `pos` is used, as the scan start */
	index_find(&pos, index, prefix.ptr, prefix.size, GIT_INDEX_STAGE_ANY);

	for (;;) {
		current = git_vector_get(&index->entries, pos);
		if (!current || git__prefixcmp(current->path, prefix.ptr) != 0)
			break;

		if (GIT_INDEX_ENTRY_STAGE(current) != stage) {
			++pos;
			continue;
		}

		/* removed entry at 'pos' so we don't need to increment */
		error = index_remove_entry(index, pos);
		if (error)
			break;
	}

done:
	git_buf_dispose(&prefix);
	return error;
}
1753 
/*
 * Find an entry whose path starts with `prefix`.
 *
 * The position reported by index_find is checked: when the entry there
 * starts with `prefix`, 0 is returned and the position is stored in
 * `*at_pos` (if `at_pos` is not NULL).  Otherwise GIT_ENOTFOUND is
 * returned and `*at_pos` is left untouched.
 */
int git_index_find_prefix(size_t *at_pos, git_index *index, const char *prefix)
{
	const git_index_entry *candidate;
	size_t pos;

	/* result is ignored: only `pos` is used */
	index_find(&pos, index, prefix, strlen(prefix), GIT_INDEX_STAGE_ANY);

	candidate = git_vector_get(&index->entries, pos);
	if (!candidate || git__prefixcmp(candidate->path, prefix) != 0)
		return GIT_ENOTFOUND;

	if (at_pos)
		*at_pos = pos;

	return 0;
}
1770 
/*
 * Argument-checked wrapper around index_find: forwards all arguments
 * unchanged and returns its result.
 */
int git_index__find_pos(
	size_t *out, git_index *index, const char *path, size_t path_len, int stage)
{
	GIT_ASSERT_ARG(index);
	GIT_ASSERT_ARG(path);

	return index_find(out, index, path, path_len, stage);
}
1778 
/*
 * Find the first entry (at any stage) whose path matches `path`.
 *
 * Returns 0 and stores the position in `*at_pos` (if `at_pos` is not
 * NULL) on success; returns GIT_ENOTFOUND with an error message set when
 * no entry has that path.
 */
int git_index_find(size_t *at_pos, git_index *index, const char *path)
{
	size_t pos;

	GIT_ASSERT_ARG(index);
	GIT_ASSERT_ARG(path);

	if (git_vector_bsearch2(
			&pos, &index->entries, index->entries_search_path, path) < 0) {
		git_error_set(GIT_ERROR_INDEX, "index does not contain %s", path);
		return GIT_ENOTFOUND;
	}

	/* Since our binary search only looked at path, we may be in the
	 * middle of a list of stages.
	 */
	while (pos > 0) {
		const git_index_entry *prev = git_vector_get(&index->entries, pos - 1);

		if (index->entries_cmp_path(prev->path, path) != 0)
			break;

		pos--;
	}

	if (at_pos)
		*at_pos = pos;

	return 0;
}
1807 
/*
 * Record a conflict made of up to three sides; any side may be NULL.
 *
 * Each given side is copied and its mode validated.  The stage-0 entry
 * for every given path is removed (a missing one is not an error), and
 * the copies are then inserted at stages 1 (ancestor), 2 (ours) and
 * 3 (theirs).
 *
 * Returns 0 on success or a negative value on failure; copies that were
 * not handed over to index_insert are released before returning.
 */
int git_index_conflict_add(git_index *index,
	const git_index_entry *ancestor_entry,
	const git_index_entry *our_entry,
	const git_index_entry *their_entry)
{
	const git_index_entry *sources[3];
	git_index_entry *entries[3] = { 0 };
	unsigned short i;
	int ret = 0;

	GIT_ASSERT_ARG(index);

	sources[0] = ancestor_entry;
	sources[1] = our_entry;
	sources[2] = their_entry;

	/* Copy the sides that were given */
	for (i = 0; i < 3; i++) {
		if (sources[i] &&
		    (ret = index_entry_dup(&entries[i], index, sources[i])) < 0)
			goto on_error;
	}

	/* Validate entries */
	for (i = 0; i < 3; i++) {
		if (!entries[i] || valid_filemode(entries[i]->mode))
			continue;

		git_error_set(GIT_ERROR_INDEX, "invalid filemode for stage %d entry",
			i + 1);
		ret = -1;
		goto on_error;
	}

	/* Remove existing index entries for each path */
	for (i = 0; i < 3; i++) {
		if (!entries[i])
			continue;

		ret = git_index_remove(index, entries[i]->path, 0);
		if (ret == 0)
			continue;

		if (ret != GIT_ENOTFOUND)
			goto on_error;

		/* nothing staged for this path; that is fine */
		git_error_clear();
		ret = 0;
	}

	/* Add the conflict entries */
	for (i = 0; i < 3; i++) {
		if (!entries[i])
			continue;

		/* Make sure stage is correct */
		GIT_INDEX_ENTRY_STAGE_SET(entries[i], i + 1);

		ret = index_insert(index, &entries[i], 1, true, true, false);
		if (ret < 0)
			goto on_error;

		entries[i] = NULL; /* don't free if later entry fails */
	}

	return 0;

on_error:
	for (i = 0; i < 3; i++) {
		if (entries[i] != NULL)
			index_entry_free(entries[i]);
	}

	return ret;
}
1875 
/*
 * Collect the conflict sides of the path found at position `n`.
 *
 * Entries are read from position `n` onward for as long as their path
 * compares equal to the path of the entry read just before.  Each entry
 * at stage 1, 2 or 3 is stored in `*ancestor_out`, `*our_out` or
 * `*their_out` respectively; entries at other stages are passed over.
 *
 * Returns the number of entries stored (0 when none were found).  Outputs
 * that were not stored are NULL.
 */
static int index_conflict__get_byindex(
	const git_index_entry **ancestor_out,
	const git_index_entry **our_out,
	const git_index_entry **their_out,
	git_index *index,
	size_t n)
{
	const git_index_entry *current;
	const char *group_path = NULL;
	size_t total;
	int found = 0;

	GIT_ASSERT_ARG(ancestor_out);
	GIT_ASSERT_ARG(our_out);
	GIT_ASSERT_ARG(their_out);
	GIT_ASSERT_ARG(index);

	*ancestor_out = NULL;
	*our_out = NULL;
	*their_out = NULL;

	total = git_index_entrycount(index);

	while (n < total) {
		int stage;

		current = git_vector_get(&index->entries, n);

		/* stop at the first entry that belongs to another path */
		if (group_path &&
		    index->entries_cmp_path(current->path, group_path) != 0)
			break;

		stage = GIT_INDEX_ENTRY_STAGE(current);
		group_path = current->path;

		if (stage == 1) {
			*ancestor_out = current;
			found++;
		} else if (stage == 2) {
			*our_out = current;
			found++;
		} else if (stage == 3) {
			*their_out = current;
			found++;
		}

		++n;
	}

	return found;
}
1926 
/*
 * Fetch the conflict sides recorded for `path`.
 *
 * Returns 0 when at least one conflict entry exists for the path; the
 * sides that exist are stored in the outputs and the others are NULL.
 * Returns GIT_ENOTFOUND when the path is not in the index or has no
 * conflict entries.
 */
int git_index_conflict_get(
	const git_index_entry **ancestor_out,
	const git_index_entry **our_out,
	const git_index_entry **their_out,
	git_index *index,
	const char *path)
{
	size_t pos;
	int found;

	GIT_ASSERT_ARG(ancestor_out);
	GIT_ASSERT_ARG(our_out);
	GIT_ASSERT_ARG(their_out);
	GIT_ASSERT_ARG(index);
	GIT_ASSERT_ARG(path);

	*ancestor_out = NULL;
	*our_out = NULL;
	*their_out = NULL;

	if (git_index_find(&pos, index, path) < 0)
		return GIT_ENOTFOUND;

	found = index_conflict__get_byindex(
		ancestor_out, our_out, their_out, index, pos);

	if (found < 0)
		return found;

	if (found == 0)
		return GIT_ENOTFOUND;

	return 0;
}
1958 
/*
 * Remove conflict entries (stage other than 0) from the index.
 *
 * With a `path`, only the entries for that path are considered and
 * GIT_ENOTFOUND is returned when the path is not in the index.  With a
 * NULL `path`, every entry in the index is considered.  Stage-0 entries
 * are skipped.
 *
 * Returns 0 on success or the negative result of a failed removal.
 */
static int index_conflict_remove(git_index *index, const char *path)
{
	git_index_entry *current;
	size_t pos = 0;
	int error = 0;

	if (path != NULL && git_index_find(&pos, index, path) < 0)
		return GIT_ENOTFOUND;

	for (;;) {
		current = git_vector_get(&index->entries, pos);
		if (current == NULL)
			break;

		/* when limited to one path, stop at the first other path */
		if (path != NULL &&
			index->entries_cmp_path(current->path, path) != 0)
			break;

		if (GIT_INDEX_ENTRY_STAGE(current) == 0) {
			pos++;
			continue;
		}

		/* after a removal the same position is examined again */
		error = index_remove_entry(index, pos);
		if (error < 0)
			break;
	}

	return error;
}
1985 
/*
 * Remove the conflict entries recorded for `path`.  Argument-checked
 * wrapper around index_conflict_remove with a non-NULL path.
 */
int git_index_conflict_remove(git_index *index, const char *path)
{
	GIT_ASSERT_ARG(index);
	GIT_ASSERT_ARG(path);

	return index_conflict_remove(index, path);
}
1992 
/*
 * Remove every conflict entry from the index by calling
 * index_conflict_remove without a path restriction.
 */
int git_index_conflict_cleanup(git_index *index)
{
	GIT_ASSERT_ARG(index);

	return index_conflict_remove(index, NULL);
}
1998 
git_index_has_conflicts(const git_index * index)1999 int git_index_has_conflicts(const git_index *index)
2000 {
2001 	size_t i;
2002 	git_index_entry *entry;
2003 
2004 	GIT_ASSERT_ARG(index);
2005 
2006 	git_vector_foreach(&index->entries, i, entry) {
2007 		if (GIT_INDEX_ENTRY_STAGE(entry) > 0)
2008 			return 1;
2009 	}
2010 
2011 	return 0;
2012 }
2013 
/*
 * Create an iterator over a snapshot of the index entries.
 *
 * Returns 0 and stores the iterator in `*iterator_out` on success.  When
 * the snapshot cannot be taken, the iterator is freed, `*iterator_out` is
 * left untouched, and the error is returned.
 */
int git_index_iterator_new(
	git_index_iterator **iterator_out,
	git_index *index)
{
	git_index_iterator *iter;
	int error;

	GIT_ASSERT_ARG(iterator_out);
	GIT_ASSERT_ARG(index);

	iter = git__calloc(1, sizeof(git_index_iterator));
	GIT_ERROR_CHECK_ALLOC(iter);

	error = git_index_snapshot_new(&iter->snap, index);
	if (error < 0) {
		git__free(iter);
		return error;
	}

	/* remembered so the snapshot can be released against the same index */
	iter->index = index;

	*iterator_out = iter;
	return 0;
}
2037 
/*
 * Store the next snapshot entry in `*out` and advance the iterator.
 * Returns 0 on success and GIT_ITEROVER once every entry has been
 * returned (in which case `*out` is not written).
 */
int git_index_iterator_next(
	const git_index_entry **out,
	git_index_iterator *it)
{
	GIT_ASSERT_ARG(out);
	GIT_ASSERT_ARG(it);

	if (it->cur >= git_vector_length(&it->snap))
		return GIT_ITEROVER;

	*out = (git_index_entry *)git_vector_get(&it->snap, it->cur);
	it->cur++;

	return 0;
}
2051 
/*
 * Release the iterator's snapshot and the iterator itself.
 * Passing NULL is a no-op.
 */
void git_index_iterator_free(git_index_iterator *it)
{
	if (it != NULL) {
		git_index_snapshot_release(&it->snap, it->index);
		git__free(it);
	}
}
2060 
/*
 * Allocate a zero-initialised conflict iterator bound to `index` and
 * store it in `*iterator_out`. Returns 0 on success.
 */
int git_index_conflict_iterator_new(
	git_index_conflict_iterator **iterator_out,
	git_index *index)
{
	git_index_conflict_iterator *created = NULL;

	GIT_ASSERT_ARG(iterator_out);
	GIT_ASSERT_ARG(index);

	created = git__calloc(1, sizeof(*created));
	GIT_ERROR_CHECK_ALLOC(created);

	created->index = index;
	*iterator_out = created;

	return 0;
}
2078 
/*
 * Advance the conflict iterator to the next conflict in its index.
 *
 * The three output pointers are reset to NULL first. Non-conflict
 * entries are skipped; at the first conflict entry the outputs are
 * filled in by index_conflict__get_byindex() and the cursor is moved
 * forward by the count that call returns.
 *
 * Returns 0 when a conflict was produced, GIT_ITEROVER when the end of
 * the index is reached, or the negative value reported by
 * index_conflict__get_byindex().
 */
int git_index_conflict_next(
	const git_index_entry **ancestor_out,
	const git_index_entry **our_out,
	const git_index_entry **their_out,
	git_index_conflict_iterator *iterator)
{
	const git_index_entry *current;
	int consumed;

	GIT_ASSERT_ARG(ancestor_out);
	GIT_ASSERT_ARG(our_out);
	GIT_ASSERT_ARG(their_out);
	GIT_ASSERT_ARG(iterator);

	*ancestor_out = NULL;
	*our_out = NULL;
	*their_out = NULL;

	for (; iterator->cur < iterator->index->entries.length; iterator->cur++) {
		current = git_index_get_byindex(iterator->index, iterator->cur);

		if (!git_index_entry_is_conflict(current))
			continue;

		consumed = index_conflict__get_byindex(
			ancestor_out,
			our_out,
			their_out,
			iterator->index,
			iterator->cur);

		if (consumed < 0)
			return consumed;

		iterator->cur += consumed;
		return 0;
	}

	return GIT_ITEROVER;
}
2118 
/* Free a conflict iterator; passing NULL is a no-op. */
void git_index_conflict_iterator_free(git_index_conflict_iterator *iterator)
{
	if (iterator != NULL)
		git__free(iterator);
}
2126 
/*
 * Return the number of conflict name entries held by the index.
 *
 * This function returns a size_t, so a failed argument check reports
 * zero entries rather than an int error code, which would be seen by
 * callers as a huge count.
 */
size_t git_index_name_entrycount(git_index *index)
{
	GIT_ASSERT_ARG_WITH_RETVAL(index, 0);
	return index->names.length;
}
2132 
git_index_name_get_byindex(git_index * index,size_t n)2133 const git_index_name_entry *git_index_name_get_byindex(
2134 	git_index *index, size_t n)
2135 {
2136 	GIT_ASSERT_ARG_WITH_RETVAL(index, NULL);
2137 
2138 	git_vector_sort(&index->names);
2139 	return git_vector_get(&index->names, n);
2140 }
2141 
/*
 * Free a conflict name entry together with its three path strings.
 * Passing NULL is a no-op.
 */
static void index_name_entry_free(git_index_name_entry *ne)
{
	if (ne) {
		git__free(ne->ancestor);
		git__free(ne->ours);
		git__free(ne->theirs);
		git__free(ne);
	}
}
2151 
/*
 * Record a conflict name entry in the index.
 *
 * At least two of `ancestor`, `ours` and `theirs` must be non-NULL.
 * Each provided name is duplicated, so the caller keeps ownership of
 * its strings. On success the index is marked dirty and 0 is returned;
 * on allocation or insertion failure the partially built entry is
 * freed and -1 is returned.
 */
int git_index_name_add(git_index *index,
	const char *ancestor, const char *ours, const char *theirs)
{
	git_index_name_entry *conflict_name;

	/* `index` is dereferenced below, so validate it like the other APIs do */
	GIT_ASSERT_ARG(index);
	GIT_ASSERT_ARG((ancestor && ours) || (ancestor && theirs) || (ours && theirs));

	conflict_name = git__calloc(1, sizeof(git_index_name_entry));
	GIT_ERROR_CHECK_ALLOC(conflict_name);

	if ((ancestor && !(conflict_name->ancestor = git__strdup(ancestor))) ||
		(ours     && !(conflict_name->ours     = git__strdup(ours))) ||
		(theirs   && !(conflict_name->theirs   = git__strdup(theirs))) ||
		git_vector_insert(&index->names, conflict_name) < 0)
	{
		index_name_entry_free(conflict_name);
		return -1;
	}

	index->dirty = 1;
	return 0;
}
2174 
/*
 * Drop every conflict name entry: each element is freed, the vector is
 * emptied, and the index is marked dirty. Always returns 0 once the
 * argument check has passed.
 */
int git_index_name_clear(git_index *index)
{
	size_t pos;
	git_index_name_entry *name_entry;

	GIT_ASSERT_ARG(index);

	git_vector_foreach(&index->names, pos, name_entry) {
		index_name_entry_free(name_entry);
	}

	git_vector_clear(&index->names);
	index->dirty = 1;

	return 0;
}
2191 
/*
 * Return the number of resolve-undo (REUC) entries held by the index.
 *
 * This function returns a size_t, so a failed argument check reports
 * zero entries rather than an int error code, which would be seen by
 * callers as a huge count.
 */
size_t git_index_reuc_entrycount(git_index *index)
{
	GIT_ASSERT_ARG_WITH_RETVAL(index, 0);
	return index->reuc.length;
}
2197 
index_reuc_on_dup(void ** old,void * new)2198 static int index_reuc_on_dup(void **old, void *new)
2199 {
2200 	index_entry_reuc_free(*old);
2201 	*old = new;
2202 	return GIT_EEXISTS;
2203 }
2204 
/*
 * Insert `reuc` into the sorted REUC vector and mark the index dirty.
 *
 * A GIT_EEXISTS result from the sorted insert is reported as success
 * (0); any other result is passed through unchanged.
 */
static int index_reuc_insert(
	git_index *index,
	git_index_reuc_entry *reuc)
{
	int res;

	GIT_ASSERT_ARG(index);
	GIT_ASSERT_ARG(reuc && reuc->path != NULL);
	GIT_ASSERT(git_vector_is_sorted(&index->reuc));

	res = git_vector_insert_sorted(&index->reuc, reuc, &index_reuc_on_dup);
	index->dirty = 1;

	if (res == GIT_EEXISTS)
		return 0;

	return res;
}
2220 
/*
 * Build a REUC entry for `path` from the three mode/oid pairs and
 * insert it into the index.
 *
 * If either building or inserting the entry fails, the entry is freed
 * and the error code is returned; otherwise 0 is returned.
 */
int git_index_reuc_add(git_index *index, const char *path,
	int ancestor_mode, const git_oid *ancestor_oid,
	int our_mode, const git_oid *our_oid,
	int their_mode, const git_oid *their_oid)
{
	git_index_reuc_entry *reuc = NULL;
	int error = 0;

	GIT_ASSERT_ARG(index);
	GIT_ASSERT_ARG(path);

	error = index_entry_reuc_init(&reuc, path, ancestor_mode,
		ancestor_oid, our_mode, our_oid, their_mode, their_oid);

	if (error >= 0)
		error = index_reuc_insert(index, reuc);

	if (error < 0)
		index_entry_reuc_free(reuc);

	return error;
}
2239 
/*
 * Binary-search the REUC vector for `path` using the index's
 * `reuc_search` comparator; the result of git_vector_bsearch2() is
 * returned unchanged.
 */
int git_index_reuc_find(size_t *at_pos, git_index *index, const char *path)
{
	int found;

	found = git_vector_bsearch2(at_pos, &index->reuc, index->reuc_search, path);

	return found;
}
2244 
git_index_reuc_get_bypath(git_index * index,const char * path)2245 const git_index_reuc_entry *git_index_reuc_get_bypath(
2246 	git_index *index, const char *path)
2247 {
2248 	size_t pos;
2249 
2250 	GIT_ASSERT_ARG_WITH_RETVAL(index, NULL);
2251 	GIT_ASSERT_ARG_WITH_RETVAL(path, NULL);
2252 
2253 	if (!index->reuc.length)
2254 		return NULL;
2255 
2256 	GIT_ASSERT_WITH_RETVAL(git_vector_is_sorted(&index->reuc), NULL);
2257 
2258 	if (git_index_reuc_find(&pos, index, path) < 0)
2259 		return NULL;
2260 
2261 	return git_vector_get(&index->reuc, pos);
2262 }
2263 
git_index_reuc_get_byindex(git_index * index,size_t n)2264 const git_index_reuc_entry *git_index_reuc_get_byindex(
2265 	git_index *index, size_t n)
2266 {
2267 	GIT_ASSERT_ARG_WITH_RETVAL(index, NULL);
2268 	GIT_ASSERT_WITH_RETVAL(git_vector_is_sorted(&index->reuc), NULL);
2269 
2270 	return git_vector_get(&index->reuc, n);
2271 }
2272 
/*
 * Remove the REUC entry at `position`.
 *
 * The entry is fetched before removal so that it can be freed once
 * git_vector_remove() has succeeded. The index is marked dirty whether
 * or not the removal succeeded, and the removal result is returned.
 */
int git_index_reuc_remove(git_index *index, size_t position)
{
	int error;
	git_index_reuc_entry *victim;

	GIT_ASSERT_ARG(index);
	GIT_ASSERT(git_vector_is_sorted(&index->reuc));

	victim = git_vector_get(&index->reuc, position);
	error = git_vector_remove(&index->reuc, position);

	if (error == 0)
		index_entry_reuc_free(victim);

	index->dirty = 1;

	return error;
}
2290 
/*
 * Drop every REUC entry: each slot is swapped to NULL and the entry it
 * held is freed, then the vector is emptied and the index is marked
 * dirty. Always returns 0 once the argument check has passed.
 */
int git_index_reuc_clear(git_index *index)
{
	size_t slot = 0;

	GIT_ASSERT_ARG(index);

	while (slot < index->reuc.length) {
		index_entry_reuc_free(git_atomic_swap(index->reuc.contents[slot], NULL));
		++slot;
	}

	git_vector_clear(&index->reuc);
	index->dirty = 1;

	return 0;
}
2306 
index_error_invalid(const char * message)2307 static int index_error_invalid(const char *message)
2308 {
2309 	git_error_set(GIT_ERROR_INDEX, "invalid data in index - %s", message);
2310 	return -1;
2311 }
2312 
/*
 * Parse the payload of a resolve-undo (REUC) extension.
 *
 * Each record in `buffer` consists of a NUL-terminated path, three
 * NUL-terminated ASCII octal modes, and then one 20-byte raw object id
 * for every mode that is non-zero. Every parsed record is appended to
 * index->reuc, and the vector is flagged as sorted at the end.
 *
 * Returns 0 on success and -1 on malformed data or allocation failure.
 * An entry that cannot be completed or stored is freed before
 * returning.
 */
static int read_reuc(git_index *index, const char *buffer, size_t size)
{
	const char *endptr;
	size_t len;
	int i;

	/* If called multiple times, the vector might already be initialized */
	if (index->reuc._alloc_size == 0 &&
		git_vector_init(&index->reuc, 16, reuc_cmp) < 0)
		return -1;

	while (size) {
		git_index_reuc_entry *lost;

		/* the path must be followed by more data, hence `<=` */
		len = p_strnlen(buffer, size) + 1;
		if (size <= len)
			return index_error_invalid("reading reuc entries");

		lost = reuc_entry_alloc(buffer);
		GIT_ERROR_CHECK_ALLOC(lost);

		size -= len;
		buffer += len;

		/* read 3 ASCII octal numbers for stage entries */
		for (i = 0; i < 3; i++) {
			int64_t tmp;

			if (git__strntol64(&tmp, buffer, size, &endptr, 8) < 0 ||
				!endptr || endptr == buffer || *endptr ||
				tmp < 0 || tmp > UINT32_MAX) {
				index_entry_reuc_free(lost);
				return index_error_invalid("reading reuc entry stage");
			}

			lost->mode[i] = (uint32_t)tmp;

			/* skip the digits and their terminating NUL */
			len = (endptr + 1) - buffer;
			if (size <= len) {
				index_entry_reuc_free(lost);
				return index_error_invalid("reading reuc entry stage");
			}

			size -= len;
			buffer += len;
		}

		/* read up to 3 OIDs for stage entries */
		for (i = 0; i < 3; i++) {
			if (!lost->mode[i])
				continue;
			if (size < 20) {
				index_entry_reuc_free(lost);
				return index_error_invalid("reading reuc entry oid");
			}

			git_oid_fromraw(&lost->oid[i], (const unsigned char *) buffer);
			size -= 20;
			buffer += 20;
		}

		/* entry was read successfully - insert into reuc vector */
		if (git_vector_insert(&index->reuc, lost) < 0) {
			/* the vector did not take the entry, so it is still ours to free */
			index_entry_reuc_free(lost);
			return -1;
		}
	}

	/* entries are guaranteed to be sorted on-disk */
	git_vector_set_sorted(&index->reuc, true);

	return 0;
}
2384 
2385 
/*
 * Read one NUL-terminated name from `*buffer` (at most `*size` bytes).
 *
 * An empty name yields `*out == NULL`; otherwise `*out` receives a
 * heap copy including the terminator. On success the cursor and the
 * remaining size are advanced past the name and 0 is returned. On
 * failure -1 is returned and `*out` is NULL.
 */
static int conflict_name_read_field(char **out, const char **buffer, size_t *size)
{
	size_t len = p_strnlen(*buffer, *size) + 1;
	char *copy = NULL;

	*out = NULL;

	/* no terminator within the remaining data */
	if (*size < len)
		return index_error_invalid("reading conflict name entries");

	if (len > 1) {
		copy = git__malloc(len);
		GIT_ERROR_CHECK_ALLOC(copy);
		memcpy(copy, *buffer, len);
	}

	*out = copy;
	*buffer += len;
	*size -= len;

	return 0;
}

/*
 * Parse the payload of a conflict name (NAME) extension.
 *
 * The payload is a sequence of records, each made of three
 * NUL-terminated names (ancestor, ours, theirs); an empty name is
 * stored as NULL. Every record is appended to index->names, and the
 * vector is flagged as sorted at the end.
 *
 * Returns 0 on success and -1 on malformed data or allocation failure.
 * A record that cannot be completed or stored is freed, together with
 * the names already copied into it, before returning.
 */
static int read_conflict_names(git_index *index, const char *buffer, size_t size)
{
	/* This gets called multiple times, the vector might already be initialized */
	if (index->names._alloc_size == 0 &&
		git_vector_init(&index->names, 16, conflict_name_cmp) < 0)
		return -1;

	while (size) {
		git_index_name_entry *conflict_name = git__calloc(1, sizeof(git_index_name_entry));
		GIT_ERROR_CHECK_ALLOC(conflict_name);

		if (conflict_name_read_field(&conflict_name->ancestor, &buffer, &size) < 0 ||
			conflict_name_read_field(&conflict_name->ours, &buffer, &size) < 0 ||
			conflict_name_read_field(&conflict_name->theirs, &buffer, &size) < 0 ||
			git_vector_insert(&index->names, conflict_name) < 0) {
			git__free(conflict_name->ancestor);
			git__free(conflict_name->ours);
			git__free(conflict_name->theirs);
			git__free(conflict_name);
			return -1;
		}
	}

	/* entries are guaranteed to be sorted on-disk */
	git_vector_set_sorted(&index->names, true);

	return 0;
}
2440 
index_entry_size(size_t path_len,size_t varint_len,uint32_t flags)2441 static size_t index_entry_size(size_t path_len, size_t varint_len, uint32_t flags)
2442 {
2443 	if (varint_len) {
2444 		if (flags & GIT_INDEX_ENTRY_EXTENDED)
2445 			return offsetof(struct entry_long, path) + path_len + 1 + varint_len;
2446 		else
2447 			return offsetof(struct entry_short, path) + path_len + 1 + varint_len;
2448 	} else {
2449 #define entry_size(type,len) ((offsetof(type, path) + (len) + 8) & ~7)
2450 		if (flags & GIT_INDEX_ENTRY_EXTENDED)
2451 			return entry_size(struct entry_long, path_len);
2452 		else
2453 			return entry_size(struct entry_short, path_len);
2454 #undef entry_size
2455 	}
2456 }
2457 
/*
 * Decode one on-disk index entry starting at `buffer`.
 *
 * out:         receives a duplicate of the decoded entry, made by
 *              index_entry_dup()
 * out_size:    receives the number of bytes the entry occupies on disk
 * buffer_size: bytes available from `buffer`, including the footer
 * last:        path of the previous entry; read only when the index
 *              version uses prefix-compressed paths
 *
 * Returns 0 on success and -1 on malformed data or allocation failure.
 * The temporary path built for compressed entries is released on every
 * exit path.
 */
static int read_entry(
	git_index_entry **out,
	size_t *out_size,
	git_index *index,
	const void *buffer,
	size_t buffer_size,
	const char *last)
{
	size_t path_length, entry_size, path_offset;
	const char *path_ptr;
	struct entry_short source;
	git_index_entry entry = {{0}};
	bool compressed = index->version >= INDEX_VERSION_NUMBER_COMP;
	char *tmp_path = NULL;
	int error = -1;

	if (INDEX_FOOTER_SIZE + minimal_entry_size > buffer_size)
		return -1;

	/* buffer is not guaranteed to be aligned */
	memcpy(&source, buffer, sizeof(struct entry_short));

	entry.ctime.seconds = (git_time_t)ntohl(source.ctime.seconds);
	entry.ctime.nanoseconds = ntohl(source.ctime.nanoseconds);
	entry.mtime.seconds = (git_time_t)ntohl(source.mtime.seconds);
	entry.mtime.nanoseconds = ntohl(source.mtime.nanoseconds);
	entry.dev = ntohl(source.dev);
	entry.ino = ntohl(source.ino);
	entry.mode = ntohl(source.mode);
	entry.uid = ntohl(source.uid);
	entry.gid = ntohl(source.gid);
	entry.file_size = ntohl(source.file_size);
	git_oid_cpy(&entry.id, &source.oid);
	entry.flags = ntohs(source.flags);

	if (entry.flags & GIT_INDEX_ENTRY_EXTENDED) {
		uint16_t flags_raw;
		size_t flags_offset;

		flags_offset = offsetof(struct entry_long, flags_extended);
		memcpy(&flags_raw, (const char *) buffer + flags_offset,
			sizeof(flags_raw));
		flags_raw = ntohs(flags_raw);

		memcpy(&entry.flags_extended, &flags_raw, sizeof(flags_raw));
		path_offset = offsetof(struct entry_long, path);
	} else
		path_offset = offsetof(struct entry_short, path);

	/* the path must start inside the buffer */
	if (path_offset >= buffer_size)
		return -1;

	path_ptr = (const char *) buffer + path_offset;

	if (!compressed) {
		path_length = entry.flags & GIT_INDEX_ENTRY_NAMEMASK;

		/* if this is a very long string, we must find its
		 * real length without overflowing */
		if (path_length == 0xFFF) {
			const char *path_end;

			/*
			 * Only the bytes from path_ptr to the end of the
			 * buffer may be scanned; buffer_size is counted from
			 * the start of the entry, not from the path.
			 */
			path_end = memchr(path_ptr, '\0', buffer_size - path_offset);
			if (path_end == NULL)
				return -1;

			path_length = path_end - path_ptr;
		}

		entry_size = index_entry_size(path_length, 0, entry.flags);
		entry.path = (char *)path_ptr;
	} else {
		size_t varint_len, last_len, prefix_len, suffix_len, path_len;
		uintmax_t strip_len;

		/*
		 * The path is stored as: a varint giving how many bytes to
		 * strip from the end of `last`, followed by the suffix to
		 * append, NUL-terminated.
		 */
		strip_len = git_decode_varint((const unsigned char *)path_ptr, &varint_len);
		last_len = strlen(last);

		if (varint_len == 0 || last_len < strip_len)
			return index_error_invalid("incorrect prefix length");

		prefix_len = last_len - (size_t)strip_len;
		suffix_len = strlen(path_ptr + varint_len);

		GIT_ERROR_CHECK_ALLOC_ADD(&path_len, prefix_len, suffix_len);
		GIT_ERROR_CHECK_ALLOC_ADD(&path_len, path_len, 1);

		if (path_len > GIT_PATH_MAX)
			return index_error_invalid("unreasonable path length");

		tmp_path = git__malloc(path_len);
		GIT_ERROR_CHECK_ALLOC(tmp_path);

		memcpy(tmp_path, last, prefix_len);
		memcpy(tmp_path + prefix_len, path_ptr + varint_len, suffix_len + 1);
		entry_size = index_entry_size(suffix_len, varint_len, entry.flags);
		entry.path = tmp_path;
	}

	/* from here on tmp_path may be allocated: leave through `done` */
	if (entry_size == 0)
		goto done;

	if (INDEX_FOOTER_SIZE + entry_size > buffer_size)
		goto done;

	if (index_entry_dup(out, index, &entry) < 0)
		goto done;

	*out_size = entry_size;
	error = 0;

done:
	git__free(tmp_path);
	return error;
}
2566 
read_header(struct index_header * dest,const void * buffer)2567 static int read_header(struct index_header *dest, const void *buffer)
2568 {
2569 	const struct index_header *source = buffer;
2570 
2571 	dest->signature = ntohl(source->signature);
2572 	if (dest->signature != INDEX_HEADER_SIG)
2573 		return index_error_invalid("incorrect header signature");
2574 
2575 	dest->version = ntohl(source->version);
2576 	if (dest->version < INDEX_VERSION_NUMBER_LB ||
2577 		dest->version > INDEX_VERSION_NUMBER_UB)
2578 		return index_error_invalid("incorrect header version");
2579 
2580 	dest->entry_count = ntohl(source->entry_count);
2581 	return 0;
2582 }
2583 
/*
 * Parse one index extension located at `buffer`.
 *
 * The extension starts with a 4-byte signature and a 32-bit big-endian
 * payload size. The header plus payload must fit in `buffer_size`
 * while leaving room for the index footer. Extensions whose signature
 * starts with 'A'..'Z' are optional: the tree cache, resolve-undo and
 * conflict-name ones are parsed, any other is skipped. Any other
 * signature is rejected as an unsupported mandatory extension.
 *
 * On success `*read_len` receives the total size of the extension
 * (header and payload) and 0 is returned; otherwise -1 is returned.
 */
static int read_extension(size_t *read_len, git_index *index, const char *buffer, size_t buffer_size)
{
	struct index_extension dest;
	size_t total_size;
	const char *payload = buffer + 8;

	/* buffer is not guaranteed to be aligned */
	memcpy(&dest, buffer, sizeof(struct index_extension));
	dest.extension_size = ntohl(dest.extension_size);

	total_size = dest.extension_size + sizeof(struct index_extension);

	/* the first comparison catches wrap-around of total_size */
	if (dest.extension_size > total_size ||
		buffer_size < total_size ||
		buffer_size - total_size < INDEX_FOOTER_SIZE)
		return index_error_invalid("extension is truncated");

	if (dest.signature[0] < 'A' || dest.signature[0] > 'Z') {
		/* we cannot handle non-ignorable extensions;
		 * in fact they aren't even defined in the standard */
		git_error_set(GIT_ERROR_INDEX, "unsupported mandatory extension: '%.4s'", dest.signature);
		return -1;
	}

	/* optional extension */
	if (memcmp(dest.signature, INDEX_EXT_TREECACHE_SIG, 4) == 0) {
		/* tree cache */
		if (git_tree_cache_read(&index->tree, payload, dest.extension_size, &index->tree_pool) < 0)
			return -1;
	} else if (memcmp(dest.signature, INDEX_EXT_UNMERGED_SIG, 4) == 0) {
		if (read_reuc(index, payload, dest.extension_size) < 0)
			return -1;
	} else if (memcmp(dest.signature, INDEX_EXT_CONFLICT_NAME_SIG, 4) == 0) {
		if (read_conflict_names(index, payload, dest.extension_size) < 0)
			return -1;
	}
	/* else, unsupported extension. We cannot parse this, but we can skip
	 * it by returning `total_size` */

	*read_len = total_size;

	return 0;
}
2628 
/*
 * Parse a complete on-disk index image of `buffer_size` bytes into
 * `index`: header, entries, extensions, and the trailing checksum.
 *
 * The index must not contain any entries on entry. On success the
 * index version and checksum are recorded, the entries vector is
 * sorted, the dirty flag is cleared, and 0 is returned. On failure a
 * negative error code is returned.
 */
static int parse_index(git_index *index, const char *buffer, size_t buffer_size)
{
	int error = 0;
	unsigned int i;
	struct index_header header = { 0 };
	git_oid checksum_calculated, checksum_expected;
	const char *last = NULL;
	const char *empty = "";

/* Advance the read cursor; consuming all remaining bytes is an error. */
#define seek_forward(_increase) { \
	if (_increase >= buffer_size) { \
		error = index_error_invalid("ran out of data while parsing"); \
		goto done; } \
	buffer += _increase; \
	buffer_size -= _increase;\
}

	if (buffer_size < INDEX_HEADER_SIZE + INDEX_FOOTER_SIZE)
		return index_error_invalid("insufficient buffer space");

	/* Precalculate the SHA1 of the files's contents -- we'll match it to
	 * the provided SHA1 in the footer */
	git_hash_buf(&checksum_calculated, buffer, buffer_size - INDEX_FOOTER_SIZE);

	/* Parse header */
	if ((error = read_header(&header, buffer)) < 0)
		return error;

	index->version = header.version;
	/* compressed paths are decoded relative to the previous entry's path */
	if (index->version >= INDEX_VERSION_NUMBER_COMP)
		last = empty;

	seek_forward(INDEX_HEADER_SIZE);

	GIT_ASSERT(!index->entries.length);

	if ((error = index_map_resize(index->entries_map, header.entry_count, index->ignore_case)) < 0)
		return error;

	/* Parse all the entries */
	for (i = 0; i < header.entry_count && buffer_size > INDEX_FOOTER_SIZE; ++i) {
		git_index_entry *entry = NULL;
		size_t entry_size;

		if ((error = read_entry(&entry, &entry_size, index, buffer, buffer_size, last)) < 0) {
			error = index_error_invalid("invalid entry");
			goto done;
		}

		if ((error = git_vector_insert(&index->entries, entry)) < 0) {
			/* the vector did not take the entry, so free it here */
			index_entry_free(entry);
			goto done;
		}

		if ((error = index_map_set(index->entries_map, entry, index->ignore_case)) < 0) {
			/*
			 * The entry has already been stored in index->entries
			 * above. Freeing it here would leave a dangling
			 * pointer in that vector, so it is left in place.
			 */
			goto done;
		}
		error = 0;

		if (index->version >= INDEX_VERSION_NUMBER_COMP)
			last = entry->path;

		seek_forward(entry_size);
	}

	/* the loop stopped early because the data ran out */
	if (i != header.entry_count) {
		error = index_error_invalid("header entries changed while parsing");
		goto done;
	}

	/* There's still space for some extensions! */
	while (buffer_size > INDEX_FOOTER_SIZE) {
		size_t extension_size;

		if ((error = read_extension(&extension_size, index, buffer, buffer_size)) < 0) {
			goto done;
		}

		seek_forward(extension_size);
	}

	if (buffer_size != INDEX_FOOTER_SIZE) {
		error = index_error_invalid(
			"buffer size does not match index footer size");
		goto done;
	}

	/* 160-bit SHA-1 over the content of the index file before this checksum. */
	git_oid_fromraw(&checksum_expected, (const unsigned char *)buffer);

	if (git_oid__cmp(&checksum_calculated, &checksum_expected) != 0) {
		error = index_error_invalid(
			"calculated checksum does not match expected");
		goto done;
	}

	git_oid_cpy(&index->checksum, &checksum_calculated);

#undef seek_forward

	/* Entries are stored case-sensitively on disk, so re-sort now if
	 * in-memory index is supposed to be case-insensitive
	 */
	git_vector_set_sorted(&index->entries, !index->ignore_case);
	git_vector_sort(&index->entries);

	index->dirty = 0;
done:
	return error;
}
2740 
/*
 * Synchronise GIT_INDEX_ENTRY_EXTENDED in every entry's `flags` with
 * its `flags_extended`: the bit is set when any of
 * GIT_INDEX_ENTRY_EXTENDED_FLAGS is present and cleared otherwise.
 *
 * Returns true when at least one entry ended up with the bit set.
 */
static bool is_index_extended(git_index *index)
{
	size_t pos;
	git_index_entry *entry;
	bool any_extended = false;

	git_vector_foreach(&index->entries, pos, entry) {
		if (entry->flags_extended & GIT_INDEX_ENTRY_EXTENDED_FLAGS) {
			entry->flags |= GIT_INDEX_ENTRY_EXTENDED;
			any_extended = true;
		} else {
			entry->flags &= ~GIT_INDEX_ENTRY_EXTENDED;
		}
	}

	return any_extended;
}
2758 
/*
 * Serialise one index entry into space reserved in `file`.
 *
 * When `last` is non-NULL the path is written prefix-compressed
 * relative to `last`: a varint holding the number of trailing bytes of
 * `last` that are not shared with this entry's path, followed by the
 * unshared remainder of the path and its NUL. When `last` is NULL the
 * full path is written and the remainder of the reserved space is left
 * zero-filled.
 *
 * Returns 0 on success, -1 when the space cannot be reserved.
 */
static int write_disk_entry(git_filebuf *file, git_index_entry *entry, const char *last)
{
	void *mem = NULL;
	struct entry_short ondisk;
	size_t path_len, disk_size;
	int varint_len = 0;
	char *path;
	const char *path_start = entry->path;
	size_t same_len = 0;

	path_len = ((struct entry_internal *)entry)->pathlen;

	if (last) {
		const char *last_c = last;

		/* count the leading bytes shared with the previous path */
		while (*path_start == *last_c) {
			if (!*path_start || !*last_c)
				break;
			++path_start;
			++last_c;
			++same_len;
		}
		path_len -= same_len;
		/* first call, with no output buffer, is used only for the encoded length */
		varint_len = git_encode_varint(NULL, 0, strlen(last) - same_len);
	}

	disk_size = index_entry_size(path_len, varint_len, entry->flags);

	if (git_filebuf_reserve(file, &mem, disk_size) < 0)
		return -1;

	/* zero everything up front so that any padding after the path is NUL */
	memset(mem, 0x0, disk_size);

	/**
	 * Yes, we have to truncate.
	 *
	 * The on-disk format for Index entries clearly defines
	 * the time and size fields to be 4 bytes each -- so even if
	 * we store these values with 8 bytes on-memory, they must
	 * be truncated to 4 bytes before writing to disk.
	 *
	 * In 2038 I will be either too dead or too rich to care about this
	 */
	ondisk.ctime.seconds = htonl((uint32_t)entry->ctime.seconds);
	ondisk.mtime.seconds = htonl((uint32_t)entry->mtime.seconds);
	ondisk.ctime.nanoseconds = htonl(entry->ctime.nanoseconds);
	ondisk.mtime.nanoseconds = htonl(entry->mtime.nanoseconds);
	ondisk.dev = htonl(entry->dev);
	ondisk.ino = htonl(entry->ino);
	ondisk.mode = htonl(entry->mode);
	ondisk.uid = htonl(entry->uid);
	ondisk.gid = htonl(entry->gid);
	ondisk.file_size = htonl((uint32_t)entry->file_size);

	git_oid_cpy(&ondisk.oid, &entry->id);

	ondisk.flags = htons(entry->flags);

	/*
	 * Copy the fixed-size part of the entry into the reserved memory.
	 * From here on `path` points at where the path data begins and
	 * `disk_size` counts the bytes that remain after the fixed part.
	 */
	if (entry->flags & GIT_INDEX_ENTRY_EXTENDED) {
		const size_t path_offset = offsetof(struct entry_long, path);
		struct entry_long ondisk_ext;
		memcpy(&ondisk_ext, &ondisk, sizeof(struct entry_short));
		ondisk_ext.flags_extended = htons(entry->flags_extended &
			GIT_INDEX_ENTRY_EXTENDED_FLAGS);
		memcpy(mem, &ondisk_ext, path_offset);
		path = (char *)mem + path_offset;
		disk_size -= path_offset;
	} else {
		const size_t path_offset = offsetof(struct entry_short, path);
		memcpy(mem, &ondisk, path_offset);
		path = (char *)mem + path_offset;
		disk_size -= path_offset;
	}

	if (last) {
		/* second call actually writes the varint in front of the path suffix */
		varint_len = git_encode_varint((unsigned char *) path,
					  disk_size, strlen(last) - same_len);
		GIT_ASSERT(varint_len > 0);

		path += varint_len;
		disk_size -= varint_len;

		/*
		 * If using path compression, we are not allowed
		 * to have additional trailing NULs.
		 */
		GIT_ASSERT(disk_size == path_len + 1);
	} else {
		/*
		 * If no path compression is used, we do have
		 * NULs as padding. As such, simply assert that
		 * we have enough space left to write the path.
		 */
		GIT_ASSERT(disk_size > path_len);
	}

	/* path_start was advanced past the shared prefix when compressing */
	memcpy(path, path_start, path_len + 1);

	return 0;
}
2859 
/*
 * Write every index entry to `file`.
 *
 * When the index is case-insensitive, the entries are written from a
 * copy of the vector sorted with git_index_entry_cmp. For index
 * versions that use path compression, each entry is written relative
 * to the path of the entry written before it, starting from "".
 *
 * Returns 0 on success or the first error encountered.
 */
static int write_entries(git_index *index, git_filebuf *file)
{
	int error = 0;
	size_t pos;
	git_vector case_sorted = GIT_VECTOR_INIT, *entries = &index->entries;
	git_index_entry *entry;
	const int use_compression = index->version >= INDEX_VERSION_NUMBER_COMP;
	const char *last = use_compression ? "" : NULL;

	/* If index->entries is sorted case-insensitively, then we need
	 * to re-sort it case-sensitively before writing */
	if (index->ignore_case) {
		error = git_vector_dup(&case_sorted, &index->entries, git_index_entry_cmp);
		if (error < 0)
			goto done;

		git_vector_sort(&case_sorted);
		entries = &case_sorted;
	}

	git_vector_foreach(entries, pos, entry) {
		error = write_disk_entry(file, entry, last);
		if (error < 0)
			break;

		if (use_compression)
			last = entry->path;
	}

done:
	git_vector_free(&case_sorted);
	return error;
}
2894 
/*
 * Write one extension to `file`: an on-disk header (the 4-byte
 * signature from `header` and the payload size in network byte order)
 * followed by the payload held in `data`.
 *
 * Returns 0 on success or the error from the failing write. The
 * payload is not written if writing the header fails.
 */
static int write_extension(git_filebuf *file, struct index_extension *header, git_buf *data)
{
	struct index_extension ondisk;
	int error;

	memset(&ondisk, 0x0, sizeof(struct index_extension));
	memcpy(&ondisk, header, 4);
	ondisk.extension_size = htonl(header->extension_size);

	if ((error = git_filebuf_write(file, &ondisk, sizeof(struct index_extension))) < 0)
		return error;

	return git_filebuf_write(file, data->ptr, data->size);
}
2906 
/*
 * Append one conflict name record to `name_buf`: the ancestor, ours
 * and theirs names in that order, each NUL-terminated. A NULL name is
 * written as a single NUL byte.
 *
 * Stops at the first git_buf_put() failure and returns its result;
 * returns 0 when all three names were written.
 */
static int create_name_extension_data(git_buf *name_buf, git_index_name_entry *conflict_name)
{
	const char *names[3];
	size_t n;
	int error = 0;

	names[0] = conflict_name->ancestor;
	names[1] = conflict_name->ours;
	names[2] = conflict_name->theirs;

	for (n = 0; n < 3; n++) {
		if (names[n] == NULL)
			error = git_buf_put(name_buf, "\0", 1);
		else
			error = git_buf_put(name_buf, names[n], strlen(names[n]) + 1);

		if (error != 0)
			break;
	}

	return error;
}
2935 
/*
 * Serialise all conflict name entries of the index into a temporary
 * buffer and write them to `file` as the conflict-name extension.
 *
 * Returns 0 on success or a negative error code. The temporary buffer
 * is released on every path, including when serialising an entry
 * fails part-way through.
 */
static int write_name_extension(git_index *index, git_filebuf *file)
{
	git_buf name_buf = GIT_BUF_INIT;
	git_vector *out = &index->names;
	git_index_name_entry *conflict_name;
	struct index_extension extension;
	size_t i;
	int error = 0;

	git_vector_foreach(out, i, conflict_name) {
		if ((error = create_name_extension_data(&name_buf, conflict_name)) < 0)
			goto done;
	}

	memset(&extension, 0x0, sizeof(struct index_extension));
	memcpy(&extension.signature, INDEX_EXT_CONFLICT_NAME_SIG, 4);
	extension.extension_size = (uint32_t)name_buf.size;

	error = write_extension(file, &extension, &name_buf);

done:
	/* earlier records may already have grown the buffer, so always release it */
	git_buf_dispose(&name_buf);
	return error;
}
2961 
/*
 * Append one REUC record to `reuc_buf`: the NUL-terminated path, the
 * three modes as NUL-terminated octal strings, and then the raw object
 * id for every mode that is non-zero.
 *
 * Returns 0 on success or the first buffer error encountered.
 */
static int create_reuc_extension_data(git_buf *reuc_buf, git_index_reuc_entry *reuc)
{
	int stage;
	int error = 0;

	error = git_buf_put(reuc_buf, reuc->path, strlen(reuc->path) + 1);
	if (error < 0)
		return error;

	for (stage = 0; stage < 3; stage++) {
		error = git_buf_printf(reuc_buf, "%o", reuc->mode[stage]);
		if (error < 0)
			return error;

		error = git_buf_put(reuc_buf, "\0", 1);
		if (error < 0)
			return error;
	}

	for (stage = 0; stage < 3; stage++) {
		/* stages with a zero mode have no object id on disk */
		if (!reuc->mode[stage])
			continue;

		error = git_buf_put(reuc_buf, (char *)&reuc->oid[stage].id, GIT_OID_RAWSZ);
		if (error < 0)
			return error;
	}

	return 0;
}
2983 
/*
 * Serialise all REUC entries of the index into a temporary buffer and
 * write them to `file` as the resolve-undo extension.
 *
 * Returns 0 on success or a negative error code. The temporary buffer
 * is released on every path, including when serialising an entry
 * fails part-way through.
 */
static int write_reuc_extension(git_index *index, git_filebuf *file)
{
	git_buf reuc_buf = GIT_BUF_INIT;
	git_vector *out = &index->reuc;
	git_index_reuc_entry *reuc;
	struct index_extension extension;
	size_t i;
	int error = 0;

	git_vector_foreach(out, i, reuc) {
		if ((error = create_reuc_extension_data(&reuc_buf, reuc)) < 0)
			goto done;
	}

	memset(&extension, 0x0, sizeof(struct index_extension));
	memcpy(&extension.signature, INDEX_EXT_UNMERGED_SIG, 4);
	extension.extension_size = (uint32_t)reuc_buf.size;

	error = write_extension(file, &extension, &reuc_buf);

done:
	/* earlier records may already have grown the buffer, so always release it */
	git_buf_dispose(&reuc_buf);
	return error;
}
3009 
/*
 * Serialise the index's tree cache and write it to `file` as the tree
 * cache extension. Does nothing and returns 0 when the index has no
 * tree cache.
 *
 * Returns 0 on success or a negative error code. The temporary buffer
 * is released on every path, including when serialising the tree cache
 * fails.
 */
static int write_tree_extension(git_index *index, git_filebuf *file)
{
	struct index_extension extension;
	git_buf buf = GIT_BUF_INIT;
	int error;

	if (index->tree == NULL)
		return 0;

	if ((error = git_tree_cache_write(&buf, index->tree)) < 0)
		goto done;

	memset(&extension, 0x0, sizeof(struct index_extension));
	memcpy(&extension.signature, INDEX_EXT_TREECACHE_SIG, 4);
	extension.extension_size = (uint32_t)buf.size;

	error = write_extension(file, &extension, &buf);

done:
	/* a failed serialisation may still have allocated part of the buffer */
	git_buf_dispose(&buf);

	return error;
}
3032 
/* Drop the GIT_INDEX_ENTRY_UPTODATE bit from every entry in the index. */
static void clear_uptodate(git_index *index)
{
	size_t pos;

	for (pos = 0; pos < index->entries.length; pos++) {
		git_index_entry *e = git_vector_get(&index->entries, pos);

		e->flags_extended &= ~GIT_INDEX_ENTRY_UPTODATE;
	}
}
3041 
/*
 * Write the whole index to `file`: header, entries, the optional
 * extensions, and finally the hash of everything written so far.
 *
 * The hash is also copied into `checksum`. After a successful write the
 * UPTODATE flag is cleared on every entry.
 *
 * Returns 0 on success and -1 if any of the writes fails.
 */
static int write_index(git_oid *checksum, git_index *index, git_filebuf *file)
{
	struct index_header hdr;
	git_oid trailer;
	uint32_t version;

	GIT_ASSERT_ARG(index);
	GIT_ASSERT_ARG(file);

	/*
	 * Versions above INDEX_VERSION_NUMBER_EXT are written as requested;
	 * otherwise the version is chosen by whether the index is extended.
	 */
	if (index->version > INDEX_VERSION_NUMBER_EXT)
		version = index->version;
	else if (is_index_extended(index))
		version = INDEX_VERSION_NUMBER_EXT;
	else
		version = INDEX_VERSION_NUMBER_LB;

	hdr.signature = htonl(INDEX_HEADER_SIG);
	hdr.version = htonl(version);
	hdr.entry_count = htonl((uint32_t)index->entries.length);

	if (git_filebuf_write(file, &hdr, sizeof(hdr)) < 0)
		return -1;

	if (write_entries(index, file) < 0)
		return -1;

	/* tree cache extension */
	if (index->tree != NULL) {
		if (write_tree_extension(index, file) < 0)
			return -1;
	}

	/* rename conflict extension */
	if (index->names.length > 0) {
		if (write_name_extension(index, file) < 0)
			return -1;
	}

	/* reuc extension */
	if (index->reuc.length > 0) {
		if (write_reuc_extension(index, file) < 0)
			return -1;
	}

	/* hash of everything appended to the file so far */
	git_filebuf_hash(&trailer, file);
	git_oid_cpy(checksum, &trailer);

	/* the hash itself goes at the very end of the file */
	if (git_filebuf_write(file, trailer.id, GIT_OID_RAWSZ) < 0)
		return -1;

	/* file entries are no longer up to date */
	clear_uptodate(index);

	return 0;
}
3094 
/* Return the stage of `entry`, as extracted by GIT_INDEX_ENTRY_STAGE. */
int git_index_entry_stage(const git_index_entry *entry)
{
	int stage = GIT_INDEX_ENTRY_STAGE(entry);

	return stage;
}
3099 
/* Return 1 when the stage of `entry` is greater than zero, 0 otherwise. */
int git_index_entry_is_conflict(const git_index_entry *entry)
{
	if (GIT_INDEX_ENTRY_STAGE(entry) > 0)
		return 1;

	return 0;
}
3104 
/* Payload handed to read_tree_cb() by git_index_read_tree(). */
typedef struct read_tree_data {
	/* index being read into; its owner is used when creating entries */
	git_index *index;
	/* existing entries, searched for a match by path (may be NULL) */
	git_vector *old_entries;
	/* vector that receives the entries created during the walk */
	git_vector *new_entries;
	/* comparison function used when searching old_entries */
	git_vector_cmp entry_cmp;
	/* NOTE(review): not referenced by read_tree_cb() or git_index_read_tree() */
	git_tree_cache *tree;
} read_tree_data;
3112 
read_tree_cb(const char * root,const git_tree_entry * tentry,void * payload)3113 static int read_tree_cb(
3114 	const char *root, const git_tree_entry *tentry, void *payload)
3115 {
3116 	read_tree_data *data = payload;
3117 	git_index_entry *entry = NULL, *old_entry;
3118 	git_buf path = GIT_BUF_INIT;
3119 	size_t pos;
3120 
3121 	if (git_tree_entry__is_tree(tentry))
3122 		return 0;
3123 
3124 	if (git_buf_joinpath(&path, root, tentry->filename) < 0)
3125 		return -1;
3126 
3127 	if (index_entry_create(&entry, INDEX_OWNER(data->index), path.ptr, NULL, false) < 0)
3128 		return -1;
3129 
3130 	entry->mode = tentry->attr;
3131 	git_oid_cpy(&entry->id, git_tree_entry_id(tentry));
3132 
3133 	/* look for corresponding old entry and copy data to new entry */
3134 	if (data->old_entries != NULL &&
3135 		!index_find_in_entries(
3136 			&pos, data->old_entries, data->entry_cmp, path.ptr, 0, 0) &&
3137 		(old_entry = git_vector_get(data->old_entries, pos)) != NULL &&
3138 		entry->mode == old_entry->mode &&
3139 		git_oid_equal(&entry->id, &old_entry->id))
3140 	{
3141 		index_entry_cpy(entry, old_entry);
3142 		entry->flags_extended = 0;
3143 	}
3144 
3145 	index_entry_adjust_namemask(entry, path.size);
3146 	git_buf_dispose(&path);
3147 
3148 	if (git_vector_insert(data->new_entries, entry) < 0) {
3149 		index_entry_free(entry);
3150 		return -1;
3151 	}
3152 
3153 	return 0;
3154 }
3155 
/*
 * Replace the contents of `index` with the entries of `tree`.
 *
 * The tree is walked into a fresh entry vector and lookup map; entries whose
 * path, mode and id match an existing index entry inherit that entry's data
 * (see read_tree_cb). Once the new set is complete, the index is cleared and
 * the new vector and map are swapped in. Finally the tree cache is rebuilt
 * from `tree`.
 *
 * Returns 0 on success or a negative error code. On failure the temporary
 * vector, map and any entries created during the walk are released.
 */
int git_index_read_tree(git_index *index, const git_tree *tree)
{
	int error = 0;
	git_vector entries = GIT_VECTOR_INIT;
	git_idxmap *entries_map;
	read_tree_data data;
	size_t i;
	git_index_entry *e;

	if (git_idxmap_new(&entries_map) < 0)
		return -1;

	git_vector_set_cmp(&entries, index->entries._cmp); /* match sort */

	data.index = index;
	data.old_entries = &index->entries;
	data.new_entries = &entries;
	data.entry_cmp   = index->entries_search;

	index->tree = NULL;
	git_pool_clear(&index->tree_pool);

	/* read_tree_cb searches the old entries, so they must be sorted */
	git_vector_sort(&index->entries);

	if ((error = git_tree_walk(tree, GIT_TREEWALK_POST, read_tree_cb, &data)) < 0)
		goto cleanup;

	if ((error = index_map_resize(entries_map, entries.length, index->ignore_case)) < 0)
		goto cleanup;

	git_vector_foreach(&entries, i, e) {
		if ((error = index_map_set(entries_map, e, index->ignore_case)) < 0) {
			git_error_set(GIT_ERROR_INDEX, "failed to insert entry into map");
			/* go through cleanup so the vector and map are released */
			goto cleanup;
		}
	}

	git_vector_sort(&entries);

	if ((error = git_index_clear(index)) < 0) {
		/* well, this isn't good */;
	} else {
		git_vector_swap(&entries, &index->entries);
		entries_map = git_atomic_swap(index->entries_map, entries_map);
	}

	index->dirty = 1;

cleanup:
	git_idxmap_free(entries_map);

	/*
	 * A negative error means the swap above never happened, so `entries`
	 * still holds the entries created by the walk and nobody else owns them.
	 */
	if (error < 0) {
		git_vector_foreach(&entries, i, e)
			index_entry_free(e);
	}

	git_vector_free(&entries);

	if (error < 0)
		return error;

	error = git_tree_cache_read_tree(&index->tree, tree, &index->tree_pool);

	return error;
}
3216 
/*
 * Replace the entries of `index` with the entries produced by
 * `new_iterator`, reusing existing entry objects where possible.
 *
 * The current index entries and the new entries are walked in parallel and
 * compared with git_index_entry_cmp(). Entries present on both sides with
 * the same id and mode are kept as-is; everything else coming from the new
 * side is duplicated, and superseded old entries are collected and freed
 * once the new vector and map have been swapped into the index. The name
 * and reuc data are cleared as part of the swap.
 *
 * `new_length_hint` is used to size the new vector and, when non-zero, the
 * new lookup map. `new_iterator` must have GIT_ITERATOR_DONT_IGNORE_CASE
 * set (asserted below).
 *
 * Returns 0 on success or a negative error code.
 */
static int git_index_read_iterator(
	git_index *index,
	git_iterator *new_iterator,
	size_t new_length_hint)
{
	git_vector new_entries = GIT_VECTOR_INIT,
		remove_entries = GIT_VECTOR_INIT;
	git_idxmap *new_entries_map = NULL;
	git_iterator *index_iterator = NULL;
	git_iterator_options opts = GIT_ITERATOR_OPTIONS_INIT;
	const git_index_entry *old_entry, *new_entry;
	git_index_entry *entry;
	size_t i;
	int error;

	GIT_ASSERT((new_iterator->flags & GIT_ITERATOR_DONT_IGNORE_CASE));

	if ((error = git_vector_init(&new_entries, new_length_hint, index->entries._cmp)) < 0 ||
	    (error = git_vector_init(&remove_entries, index->entries.length, NULL)) < 0 ||
	    (error = git_idxmap_new(&new_entries_map)) < 0)
		goto done;

	if (new_length_hint && (error = index_map_resize(new_entries_map, new_length_hint,
							 index->ignore_case)) < 0)
		goto done;

	opts.flags = GIT_ITERATOR_DONT_IGNORE_CASE |
		GIT_ITERATOR_INCLUDE_CONFLICTS;

	/* GIT_ITEROVER from either iterator is tolerated here, not treated as failure */
	if ((error = git_iterator_for_index(&index_iterator,
			git_index_owner(index), index, &opts)) < 0 ||
		((error = git_iterator_current(&old_entry, index_iterator)) < 0 &&
			error != GIT_ITEROVER) ||
		((error = git_iterator_current(&new_entry, new_iterator)) < 0 &&
			error != GIT_ITEROVER))
		goto done;

	while (true) {
		git_index_entry
			*dup_entry = NULL,
			*add_entry = NULL,
			*remove_entry = NULL;
		int diff;

		error = 0;

		/* diff < 0: only the old side has this entry; diff > 0: only the new side */
		if (old_entry && new_entry)
			diff = git_index_entry_cmp(old_entry, new_entry);
		else if (!old_entry && new_entry)
			diff = 1;
		else if (old_entry && !new_entry)
			diff = -1;
		else
			break;

		if (diff < 0) {
			remove_entry = (git_index_entry *)old_entry;
		} else if (diff > 0) {
			dup_entry = (git_index_entry *)new_entry;
		} else {
			/* Path and stage are equal, if the OID is equal, keep it to
			 * keep the stat cache data.
			 */
			if (git_oid_equal(&old_entry->id, &new_entry->id) &&
				old_entry->mode == new_entry->mode) {
				add_entry = (git_index_entry *)old_entry;
			} else {
				dup_entry = (git_index_entry *)new_entry;
				remove_entry = (git_index_entry *)old_entry;
			}
		}

		if (dup_entry) {
			if ((error = index_entry_dup_nocache(&add_entry, index, dup_entry)) < 0)
				goto done;

			index_entry_adjust_namemask(add_entry,
				((struct entry_internal *)add_entry)->pathlen);
		}

		/* invalidate this path in the tree cache if this is new (to
		 * invalidate the parent trees)
		 */
		if (dup_entry && !remove_entry && index->tree)
			git_tree_cache_invalidate_path(index->tree, dup_entry->path);

		if (add_entry) {
			if ((error = git_vector_insert(&new_entries, add_entry)) == 0)
				error = index_map_set(new_entries_map, add_entry,
						      index->ignore_case);
		}

		if (remove_entry && error >= 0)
			error = git_vector_insert(&remove_entries, remove_entry);

		if (error < 0) {
			git_error_set(GIT_ERROR_INDEX, "failed to insert entry");
			goto done;
		}

		/* advance whichever side(s) contributed the entry just handled */
		if (diff <= 0) {
			if ((error = git_iterator_advance(&old_entry, index_iterator)) < 0 &&
				error != GIT_ITEROVER)
				goto done;
		}

		if (diff >= 0) {
			if ((error = git_iterator_advance(&new_entry, new_iterator)) < 0 &&
				error != GIT_ITEROVER)
				goto done;
		}
	}

	if ((error = git_index_name_clear(index)) < 0 ||
		(error = git_index_reuc_clear(index)) < 0)
	    goto done;

	/* after the swaps, the local vector and map hold the index's previous ones */
	git_vector_swap(&new_entries, &index->entries);
	new_entries_map = git_atomic_swap(index->entries_map, new_entries_map);

	git_vector_foreach(&remove_entries, i, entry) {
		if (index->tree)
			git_tree_cache_invalidate_path(index->tree, entry->path);

		index_entry_free(entry);
	}

	clear_uptodate(index);

	index->dirty = 1;
	error = 0;

done:
	/*
	 * NOTE(review): on the failure paths only the containers are freed
	 * here; entries duplicated into new_entries before the failure do not
	 * appear to be released - confirm.
	 */
	git_idxmap_free(new_entries_map);
	git_vector_free(&new_entries);
	git_vector_free(&remove_entries);
	git_iterator_free(index_iterator);
	return error;
}
3356 
/*
 * Make `index` contain the entries of `new_index`.
 *
 * An iterator over `new_index` (case-sensitive, conflicts included) is
 * created and handed to git_index_read_iterator(), with the entry count of
 * `new_index` as the size hint.
 *
 * Returns 0 on success or a negative error code.
 */
int git_index_read_index(
	git_index *index,
	const git_index *new_index)
{
	git_iterator_options iter_opts = GIT_ITERATOR_OPTIONS_INIT;
	git_iterator *source = NULL;
	int error;

	iter_opts.flags = GIT_ITERATOR_DONT_IGNORE_CASE |
		GIT_ITERATOR_INCLUDE_CONFLICTS;

	error = git_iterator_for_index(&source,
		git_index_owner(new_index), (git_index *)new_index, &iter_opts);

	/* only read when the iterator could be created */
	if (error >= 0)
		error = git_index_read_iterator(index, source,
			new_index->entries.length);

	git_iterator_free(source);
	return error;
}
3378 
git_index_owner(const git_index * index)3379 git_repository *git_index_owner(const git_index *index)
3380 {
3381 	return INDEX_OWNER(index);
3382 }
3383 
/* Actions understood by index_apply_to_all() and index_apply_to_wd_diff(). */
enum {
	/* index_apply_to_all(): matched entries are left untouched */
	INDEX_ACTION_NONE = 0,
	/* re-add matched paths; index_apply_to_all() removes those not found */
	INDEX_ACTION_UPDATE = 1,
	/* index_apply_to_all(): remove matched paths from the index */
	INDEX_ACTION_REMOVE = 2,
	/* index_apply_to_wd_diff(): also consider untracked workdir files */
	INDEX_ACTION_ADDALL = 3,
};
3390 
/*
 * Add or update index entries for the working directory files matching
 * `paths`.
 *
 * The owning repository must not be bare. When GIT_INDEX_ADD_CHECK_PATHSPEC
 * is set and GIT_INDEX_ADD_FORCE is not, the pathspec is first checked for
 * exact matches against ignored files. The actual work is delegated to
 * index_apply_to_wd_diff() with INDEX_ACTION_ADDALL; `cb` and `payload`
 * are forwarded to it.
 *
 * Returns 0 on success or a non-zero error code (which may originate from
 * the callback).
 */
int git_index_add_all(
	git_index *index,
	const git_strarray *paths,
	unsigned int flags,
	git_index_matched_path_cb cb,
	void *payload)
{
	int error;
	git_repository *repo;
	git_pathspec ps;
	bool no_fnmatch = (flags & GIT_INDEX_ADD_DISABLE_PATHSPEC_MATCH) != 0;

	GIT_ASSERT_ARG(index);

	repo = INDEX_OWNER(index);
	if ((error = git_repository__ensure_not_bare(repo, "index add all")) < 0)
		return error;

	if ((error = git_pathspec__init(&ps, paths)) < 0)
		return error;

	/* optionally check that pathspec doesn't mention any ignored files */
	if ((flags & GIT_INDEX_ADD_CHECK_PATHSPEC) != 0 &&
		(flags & GIT_INDEX_ADD_FORCE) == 0 &&
		(error = git_ignore__check_pathspec_for_exact_ignores(
			repo, &ps.pathspec, no_fnmatch)) < 0)
		goto cleanup;

	error = index_apply_to_wd_diff(index, INDEX_ACTION_ADDALL, paths, flags, cb, payload);

	if (error) /* make sure error is set if callback stopped iteration */
		git_error_set_after_callback(error);

cleanup:
	git_pathspec__clear(&ps);

	return error;
}
3431 
/* Payload passed through git_diff_foreach() to apply_each_file(). */
struct foreach_diff_data {
	/* index that matched paths are added to or removed from */
	git_index *index;
	/* pathspec each delta's old path is matched against */
	const git_pathspec *pathspec;
	/* flags as given by the caller; NOTE(review): not read by apply_each_file() */
	unsigned int flags;
	/* optional per-path callback; > 0 skips the path, < 0 aborts */
	git_index_matched_path_cb cb;
	/* opaque pointer handed to cb */
	void *payload;
};
3439 
apply_each_file(const git_diff_delta * delta,float progress,void * payload)3440 static int apply_each_file(const git_diff_delta *delta, float progress, void *payload)
3441 {
3442 	struct foreach_diff_data *data = payload;
3443 	const char *match, *path;
3444 	int error = 0;
3445 
3446 	GIT_UNUSED(progress);
3447 
3448 	path = delta->old_file.path;
3449 
3450 	/* We only want those which match the pathspecs */
3451 	if (!git_pathspec__match(
3452 		    &data->pathspec->pathspec, path, false, (bool)data->index->ignore_case,
3453 		    &match, NULL))
3454 		return 0;
3455 
3456 	if (data->cb)
3457 		error = data->cb(path, match, data->payload);
3458 
3459 	if (error > 0) /* skip this entry */
3460 		return 0;
3461 	if (error < 0) /* actual error */
3462 		return error;
3463 
3464 	/* If the workdir item does not exist, remove it from the index. */
3465 	if ((delta->new_file.flags & GIT_DIFF_FLAG_EXISTS) == 0)
3466 		error = git_index_remove_bypath(data->index, path);
3467 	else
3468 		error = git_index_add_bypath(data->index, delta->new_file.path);
3469 
3470 	return error;
3471 }
3472 
/*
 * Diff the index against the working directory and apply each matching
 * delta to the index through apply_each_file().
 *
 * `action` must be INDEX_ACTION_UPDATE or INDEX_ACTION_ADDALL. For ADDALL
 * the diff also includes untracked files (recursing into untracked
 * directories), and ignored files when GIT_INDEX_ADD_FORCE is set in
 * `flags`. `paths` is compiled into a pathspec that is matched per delta;
 * `cb` and `payload` are forwarded to apply_each_file().
 *
 * Returns 0 on success or a non-zero error code; fails if the index has no
 * owning repository.
 */
static int index_apply_to_wd_diff(git_index *index, int action, const git_strarray *paths,
				  unsigned int flags,
				  git_index_matched_path_cb cb, void *payload)
{
	int error;
	git_diff *diff;
	git_pathspec ps;
	git_repository *repo;
	git_diff_options opts = GIT_DIFF_OPTIONS_INIT;
	struct foreach_diff_data data = {
		index,
		NULL,
		flags,
		cb,
		payload,
	};

	GIT_ASSERT_ARG(index);
	GIT_ASSERT_ARG(action == INDEX_ACTION_UPDATE || action == INDEX_ACTION_ADDALL);

	repo = INDEX_OWNER(index);

	if (!repo) {
		return create_index_error(-1,
			"cannot run update; the index is not backed up by a repository.");
	}

	/*
	 * We do the matching ourselves instead of passing the list to
	 * diff because we want to tell the callback which one
	 * matched, which we do not know if we ask diff to filter for us.
	 */
	if ((error = git_pathspec__init(&ps, paths)) < 0)
		return error;

	opts.flags = GIT_DIFF_INCLUDE_TYPECHANGE;
	if (action == INDEX_ACTION_ADDALL) {
		opts.flags |= GIT_DIFF_INCLUDE_UNTRACKED |
			GIT_DIFF_RECURSE_UNTRACKED_DIRS;

		/*
		 * `flags` is a bitmask: test the FORCE bit rather than comparing
		 * for equality, so FORCE still applies when combined with other
		 * flags (this matches the test in git_index_add_all()).
		 */
		if ((flags & GIT_INDEX_ADD_FORCE) != 0)
			opts.flags |= GIT_DIFF_INCLUDE_IGNORED;
	}

	if ((error = git_diff_index_to_workdir(&diff, repo, index, &opts)) < 0)
		goto cleanup;

	data.pathspec = &ps;
	error = git_diff_foreach(diff, apply_each_file, NULL, NULL, NULL, &data);
	git_diff_free(diff);

	if (error) /* make sure error is set if callback stopped iteration */
		git_error_set_after_callback(error);

cleanup:
	git_pathspec__clear(&ps);
	return error;
}
3531 
/*
 * Apply `action` to every index entry whose path matches `paths`.
 *
 * For each match the optional callback `cb` is invoked first: a positive
 * return skips the entry, a negative return stops the iteration with that
 * value. INDEX_ACTION_UPDATE re-adds the path and removes it if the add
 * reports GIT_ENOTFOUND; INDEX_ACTION_REMOVE removes the path;
 * INDEX_ACTION_NONE does nothing. Any other action is an error.
 *
 * Returns 0 on success or a non-zero error code.
 */
static int index_apply_to_all(
	git_index *index,
	int action,
	const git_strarray *paths,
	git_index_matched_path_cb cb,
	void *payload)
{
	git_buf scratch = GIT_BUF_INIT;
	git_pathspec spec;
	const char *matched;
	size_t i;
	int error = 0;

	GIT_ASSERT_ARG(index);

	if ((error = git_pathspec__init(&spec, paths)) < 0)
		return error;

	git_vector_sort(&index->entries);

	for (i = 0; !error && i < index->entries.length; ++i) {
		git_index_entry *entry = git_vector_get(&index->entries, i);

		/* skip entries the pathspec does not select */
		if (!git_pathspec__match(
				&spec.pathspec, entry->path, false, (bool)index->ignore_case,
				&matched, NULL))
			continue;

		/* let the caller veto or abort before touching the entry */
		if (cb) {
			error = cb(entry->path, matched, payload);

			if (error > 0) { /* return > 0 means skip this one */
				error = 0;
				continue;
			}
			if (error < 0)   /* return < 0 means abort */
				break;
		}

		/* index manipulation may alter entry, so work on a copy of the path */
		if ((error = git_buf_sets(&scratch, entry->path)) < 0)
			break;

		if (action == INDEX_ACTION_UPDATE) {
			error = git_index_add_bypath(index, scratch.ptr);

			if (error == GIT_ENOTFOUND) {
				git_error_clear();

				error = git_index_remove_bypath(index, scratch.ptr);

				if (!error) /* back up foreach if we removed this */
					i--;
			}
		} else if (action == INDEX_ACTION_REMOVE) {
			error = git_index_remove_bypath(index, scratch.ptr);

			if (!error) /* back up foreach if we removed this */
				i--;
		} else if (action != INDEX_ACTION_NONE) {
			git_error_set(GIT_ERROR_INVALID, "unknown index action %d", action);
			error = -1;
		}
	}

	git_buf_dispose(&scratch);
	git_pathspec__clear(&spec);

	return error;
}
3606 
/*
 * Remove every index entry matching `pathspec`, by running
 * index_apply_to_all() with INDEX_ACTION_REMOVE. `cb` and `payload` are
 * forwarded to it.
 *
 * Returns 0 on success or a non-zero error code.
 */
int git_index_remove_all(
	git_index *index,
	const git_strarray *pathspec,
	git_index_matched_path_cb cb,
	void *payload)
{
	int error;

	error = index_apply_to_all(
		index, INDEX_ACTION_REMOVE, pathspec, cb, payload);

	/* make sure error is set if callback stopped iteration */
	if (error != 0)
		git_error_set_after_callback(error);

	return error;
}
3621 
/*
 * Update the index entries matching `pathspec` from the working directory,
 * by running index_apply_to_wd_diff() with INDEX_ACTION_UPDATE and no
 * flags. `cb` and `payload` are forwarded to it.
 *
 * Returns 0 on success or a non-zero error code.
 */
int git_index_update_all(
	git_index *index,
	const git_strarray *pathspec,
	git_index_matched_path_cb cb,
	void *payload)
{
	int error;

	error = index_apply_to_wd_diff(
		index, INDEX_ACTION_UPDATE, pathspec, 0, cb, payload);

	/* make sure error is set if callback stopped iteration */
	if (error != 0)
		git_error_set_after_callback(error);

	return error;
}
3634 
/*
 * Take a snapshot of the index entries into `snap`.
 *
 * The index reference count and reader count are incremented, the entries
 * are sorted, and the entry vector is duplicated into `snap`. If the
 * duplication fails the snapshot is released again before returning.
 *
 * Returns 0 on success or a negative error code.
 */
int git_index_snapshot_new(git_vector *snap, git_index *index)
{
	int error;

	GIT_REFCOUNT_INC(index);
	git_atomic32_inc(&index->readers);

	git_vector_sort(&index->entries);

	if ((error = git_vector_dup(snap, &index->entries, index->entries._cmp)) < 0)
		git_index_snapshot_release(snap, index);

	return error;
}
3651 
/*
 * Release a snapshot: frees the snapshot vector, decrements the index
 * reader count and calls git_index_free() on the index.
 */
void git_index_snapshot_release(git_vector *snap, git_index *index)
{
	git_vector_free(snap);

	git_atomic32_dec(&index->readers);

	git_index_free(index);
}
3660 
/*
 * Look up `path` / `stage` in a snapshot vector using `entry_srch`.
 * Thin wrapper around index_find_in_entries(); its result is returned
 * unchanged and the position, if any, is stored through `out`.
 */
int git_index_snapshot_find(
	size_t *out, git_vector *entries, git_vector_cmp entry_srch,
	const char *path, size_t path_len, int stage)
{
	int result;

	result = index_find_in_entries(
		out, entries, entry_srch, path, path_len, stage);

	return result;
}
3667 
/*
 * Prepare `writer` for writing `index` to its backing file.
 *
 * The index reference count is incremented and the index is stored in the
 * writer before anything can fail. An index with no file path cannot be
 * written. Otherwise a hashing filebuf is opened on the index file; a
 * GIT_ELOCKED failure gets a dedicated error message.
 *
 * Returns 0 on success (with `should_write` set) or a negative error code.
 */
int git_indexwriter_init(
	git_indexwriter *writer,
	git_index *index)
{
	int error;

	GIT_REFCOUNT_INC(index);
	writer->index = index;

	if (index->index_file_path == NULL)
		return create_index_error(-1,
			"failed to write index: The index is in-memory only");

	error = git_filebuf_open(
		&writer->file, index->index_file_path,
		GIT_FILEBUF_HASH_CONTENTS, GIT_INDEX_FILE_MODE);

	if (error < 0) {
		if (error == GIT_ELOCKED)
			git_error_set(GIT_ERROR_INDEX, "the index is locked; this might be due to a concurrent or crashed process");

		return error;
	}

	writer->should_write = 1;
	return 0;
}
3695 
/*
 * Initialize `writer` on the index of `repo` for a larger operation.
 *
 * The writer will write only if GIT_CHECKOUT_DONT_WRITE_INDEX was not
 * already set in `*checkout_strategy`; that flag is then set in
 * `*checkout_strategy` unconditionally.
 *
 * Returns 0 on success or a negative error code.
 */
int git_indexwriter_init_for_operation(
	git_indexwriter *writer,
	git_repository *repo,
	unsigned int *checkout_strategy)
{
	git_index *repo_index;
	int error;

	error = git_repository_index__weakptr(&repo_index, repo);
	if (error < 0)
		return error;

	error = git_indexwriter_init(writer, repo_index);
	if (error < 0)
		return error;

	/* record the caller's choice before overriding the strategy flag */
	writer->should_write = (*checkout_strategy & GIT_CHECKOUT_DONT_WRITE_INDEX) == 0;
	*checkout_strategy |= GIT_CHECKOUT_DONT_WRITE_INDEX;

	return 0;
}
3713 
/*
 * Write the writer's index to its file and commit the file.
 *
 * Does nothing when `should_write` is unset. Otherwise the entries and
 * reuc vectors are sorted, the index is written and the filebuf committed.
 * The index file stamp is then refreshed, the index is marked clean and
 * on-disk, its checksum is updated, and the writer drops its index.
 *
 * Returns 0 on success or a negative error code. The writer is cleaned up
 * here only when write_index() fails.
 */
int git_indexwriter_commit(git_indexwriter *writer)
{
	git_oid checksum = {{ 0 }};
	git_index *index;
	int error;

	if (!writer->should_write)
		return 0;

	index = writer->index;

	git_vector_sort(&index->entries);
	git_vector_sort(&index->reuc);

	error = write_index(&checksum, index, &writer->file);
	if (error < 0) {
		git_indexwriter_cleanup(writer);
		return error;
	}

	error = git_filebuf_commit(&writer->file);
	if (error < 0)
		return error;

	error = git_futils_filestamp_check(&index->stamp, index->index_file_path);
	if (error < 0) {
		git_error_set(GIT_ERROR_OS, "could not read index timestamp");
		return -1;
	}

	index->dirty = 0;
	index->on_disk = 1;
	git_oid_cpy(&index->checksum, &checksum);

	/* the writer no longer holds the index */
	git_index_free(index);
	writer->index = NULL;

	return 0;
}
3748 
/*
 * Tear down a writer: cleans up its filebuf, calls git_index_free() on the
 * index it holds and clears the pointer.
 */
void git_indexwriter_cleanup(git_indexwriter *writer)
{
	git_filebuf_cleanup(&writer->file);

	git_index_free(writer->index);
	writer->index = NULL;
}
3756 
3757 /* Deprecated functions */
3758 
3759 #ifndef GIT_DEPRECATE_HARD
/*
 * Deprecated spelling of git_index_add_from_buffer(); forwards all
 * arguments and returns its result unchanged.
 */
int git_index_add_frombuffer(
    git_index *index, const git_index_entry *source_entry,
    const void *buffer, size_t len)
{
	int result = git_index_add_from_buffer(index, source_entry, buffer, len);

	return result;
}
3766 #endif
3767