1 /*
2  * Copyright (C) the libgit2 contributors. All rights reserved.
3  *
4  * This file is part of libgit2, distributed under the GNU GPL v2 with
5  * a Linking Exception. For full terms see the included COPYING file.
6  */
7 
8 #include "clone.h"
9 
10 #include "git2/clone.h"
11 #include "git2/remote.h"
12 #include "git2/revparse.h"
13 #include "git2/branch.h"
14 #include "git2/config.h"
15 #include "git2/checkout.h"
16 #include "git2/commit.h"
17 #include "git2/tree.h"
18 
19 #include "remote.h"
20 #include "futils.h"
21 #include "refs.h"
22 #include "path.h"
23 #include "repository.h"
24 #include "odb.h"
25 
26 static int clone_local_into(git_repository *repo, git_remote *remote, const git_fetch_options *fetch_opts, const git_checkout_options *co_opts, const char *branch, int link);
27 
/*
 * Create the local branch "refs/heads/<name>" pointing at `target`.
 *
 * `target` must resolve to a commit in `repo`; the lookup is done purely
 * as a validity check before the reference is written.
 *
 * On success, `*branch` receives the new reference (owned by the caller).
 * On failure, `*branch` is left untouched and the error code from the
 * failing call is returned.
 */
static int create_branch(
	git_reference **branch,
	git_repository *repo,
	const git_oid *target,
	const char *name,
	const char *log_message)
{
	git_commit *head_obj = NULL;
	git_reference *branch_ref = NULL;
	git_buf refname = GIT_BUF_INIT;
	int error;

	/* Find the target commit; nothing has been acquired yet on failure */
	if ((error = git_commit_lookup(&head_obj, repo, target)) < 0)
		return error;

	/*
	 * Build the fully-qualified branch name.  From here on every exit
	 * goes through `cleanup` so the commit and the buffer are released.
	 */
	if ((error = git_buf_printf(&refname, GIT_REFS_HEADS_DIR "%s", name)) < 0)
		goto cleanup;

	/* Create the new branch */
	error = git_reference_create(&branch_ref, repo, git_buf_cstr(&refname), target, 0, log_message);

cleanup:
	git_buf_dispose(&refname);
	git_commit_free(head_obj);

	/* Hand the reference to the caller only when everything succeeded */
	if (!error)
		*branch = branch_ref;
	else
		git_reference_free(branch_ref);

	return error;
}
59 
/*
 * Record upstream tracking information for a branch by writing
 * "branch.<branch_name>.remote" and "branch.<branch_name>.merge" to the
 * repository configuration.
 *
 * Returns 0 on success and -1 on any failure (the specific error code of
 * the failing call is not propagated).
 */
static int setup_tracking_config(
	git_repository *repo,
	const char *branch_name,
	const char *remote_name,
	const char *merge_target)
{
	git_buf key_remote = GIT_BUF_INIT, key_merge = GIT_BUF_INIT;
	git_config *config;
	int result = -1;

	if (git_repository_config__weakptr(&config, repo) < 0)
		return -1;

	/*
	 * Build both keys, then write both values.  The chain short-circuits
	 * on the first failing step, leaving `result` at -1.
	 */
	if (git_buf_printf(&key_remote, "branch.%s.remote", branch_name) >= 0 &&
	    git_buf_printf(&key_merge, "branch.%s.merge", branch_name) >= 0 &&
	    git_config_set_string(config, git_buf_cstr(&key_remote), remote_name) >= 0 &&
	    git_config_set_string(config, git_buf_cstr(&key_merge), merge_target) >= 0)
		result = 0;

	git_buf_dispose(&key_remote);
	git_buf_dispose(&key_merge);
	return result;
}
92 
/*
 * Create the local branch `branch_name` at `target` and configure it to
 * track GIT_REMOTE_ORIGIN, using the new reference's full name as the
 * merge target.
 *
 * `*branch` is set by create_branch() on success; note that it stays set
 * even if writing the tracking configuration subsequently fails, so the
 * caller must free it in either case.
 */
static int create_tracking_branch(
	git_reference **branch,
	git_repository *repo,
	const git_oid *target,
	const char *branch_name,
	const char *log_message)
{
	int error = create_branch(branch, repo, target, branch_name, log_message);

	if (error < 0)
		return error;

	return setup_tracking_config(
		repo, branch_name, GIT_REMOTE_ORIGIN, git_reference_name(*branch));
}
111 
/*
 * Create a tracking branch for `name` at `target` and point HEAD at it.
 *
 * `name` may be given either as a short branch name or fully qualified
 * with the GIT_REFS_HEADS_DIR prefix; the prefix is stripped if present.
 * A GIT_EEXISTS result is reported as success.
 */
static int update_head_to_new_branch(
	git_repository *repo,
	const git_oid *target,
	const char *name,
	const char *reflog_message)
{
	git_reference *new_branch = NULL;
	const char *short_name = name;
	int error;

	if (git__prefixcmp(short_name, GIT_REFS_HEADS_DIR) == 0)
		short_name += strlen(GIT_REFS_HEADS_DIR);

	error = create_tracking_branch(
		&new_branch, repo, target, short_name, reflog_message);

	if (error == 0)
		error = git_repository_set_head(
			repo, git_reference_name(new_branch));

	git_reference_free(new_branch);

	/* if it already existed, then the user's refspec created it for us; ignore it */
	return (error == GIT_EEXISTS) ? 0 : error;
}
139 
/*
 * Set up tracking configuration for the repository's initial branch, as
 * reported by git_repository_initialbranch().
 *
 * The reported name must start with GIT_REFS_HEADS_DIR; otherwise an
 * "invalid initial branch" error is set and -1 is returned.
 */
static int update_head_to_default(git_repository *repo)
{
	git_buf initialbranch = GIT_BUF_INIT;
	int error;

	error = git_repository_initialbranch(&initialbranch, repo);

	if (error >= 0) {
		if (git__prefixcmp(initialbranch.ptr, GIT_REFS_HEADS_DIR) == 0) {
			/* short name is whatever follows the "refs/heads/" prefix */
			error = setup_tracking_config(
				repo,
				initialbranch.ptr + strlen(GIT_REFS_HEADS_DIR),
				GIT_REMOTE_ORIGIN,
				initialbranch.ptr);
		} else {
			git_error_set(GIT_ERROR_INVALID, "invalid initial branch '%s'", initialbranch.ptr);
			error = -1;
		}
	}

	git_buf_dispose(&initialbranch);
	return error;
}
164 
/*
 * Create (or overwrite) the symbolic reference
 * "<GIT_REFS_REMOTES_DIR><remote name>/<GIT_HEAD_FILE>" so that it points
 * at the remote-tracking name that `target` maps to under the remote's
 * refspecs.
 *
 * Returns GIT_EINVALIDSPEC when no refspec of `remote` matches `target`,
 * or the error code of the failing call otherwise.
 */
static int update_remote_head(
	git_repository *repo,
	git_remote *remote,
	git_buf *target,
	const char *reflog_message)
{
	git_buf symref_name = GIT_BUF_INIT, symref_target = GIT_BUF_INIT;
	git_reference *symref = NULL;
	git_refspec *spec;
	int error;

	/* Find the refspec that maps the remote's branch into our namespace */
	spec = git_remote__matching_refspec(remote, git_buf_cstr(target));

	if (!spec) {
		git_error_set(GIT_ERROR_NET, "the remote's default branch does not fit the refspec configuration");
		error = GIT_EINVALIDSPEC;
		goto done;
	}

	/* Where the symbolic ref will point */
	error = git_refspec_transform(&symref_target, spec, git_buf_cstr(target));
	if (error < 0)
		goto done;

	/* The name of the symbolic ref itself */
	error = git_buf_printf(&symref_name, "%s%s/%s",
		GIT_REFS_REMOTES_DIR, git_remote_name(remote), GIT_HEAD_FILE);
	if (error < 0)
		goto done;

	error = git_reference_symbolic_create(
		&symref,
		repo,
		git_buf_cstr(&symref_name),
		git_buf_cstr(&symref_target),
		true,
		reflog_message);

done:
	git_reference_free(symref);
	git_buf_dispose(&symref_target);
	git_buf_dispose(&symref_name);
	return error;
}
213 
/*
 * Point the new repository's HEAD at whatever the remote's HEAD refers to.
 *
 * - If the remote advertised no refs, or its first ref is not HEAD, only
 *   the default tracking configuration is written.
 * - If the remote has no default branch (GIT_ENOTFOUND), HEAD is detached
 *   at the remote HEAD's object id.
 * - Otherwise the remote-tracking HEAD symref is updated and a local
 *   tracking branch is created and checked out as HEAD.
 *
 * Returns 0 on success or the error code of the failing step.
 */
static int update_head_to_remote(
		git_repository *repo,
		git_remote *remote,
		const char *reflog_message)
{
	int error = 0;
	size_t refs_len;
	const git_remote_head *remote_head, **refs;
	const git_oid *remote_head_id;
	git_buf branch = GIT_BUF_INIT;

	if ((error = git_remote_ls(&refs, &refs_len, remote)) < 0)
		return error;

	/* We cloned an empty repository or one with an unborn HEAD */
	if (refs_len == 0 || strcmp(refs[0]->name, GIT_HEAD_FILE))
		return update_head_to_default(repo);

	/* We know we have HEAD, let's see where it points */
	remote_head = refs[0];
	GIT_ASSERT(remote_head);

	remote_head_id = &remote_head->oid;

	error = git_remote_default_branch(&branch, remote);
	if (error == GIT_ENOTFOUND) {
		error = git_repository_set_head_detached(
			repo, remote_head_id);
		goto cleanup;
	}

	/*
	 * Any other failure must be reported as-is; continuing would use an
	 * empty branch name and replace the real error with a misleading one.
	 */
	if (error < 0)
		goto cleanup;

	if ((error = update_remote_head(repo, remote, &branch, reflog_message)) < 0)
		goto cleanup;

	error = update_head_to_new_branch(
		repo,
		remote_head_id,
		git_buf_cstr(&branch),
		reflog_message);

cleanup:
	git_buf_dispose(&branch);

	return error;
}
259 
/*
 * Point HEAD at a specific branch requested by the caller.
 *
 * The remote-tracking reference
 * "<GIT_REFS_REMOTES_DIR><remote name>/<branch>" must already exist; a
 * local tracking branch is created from its target and HEAD is set to it.
 * Afterwards the remote-tracking HEAD symref is updated to the remote's
 * default branch when that can be determined and fits a refspec.
 *
 * A remote without a default branch (GIT_ENOTFOUND) is not an error here:
 * HEAD has already been set, there is just no remote HEAD to record.
 * update_head_to_remote() likewise treats that condition as legitimate.
 */
static int update_head_to_branch(
		git_repository *repo,
		git_remote *remote,
		const char *branch,
		const char *reflog_message)
{
	int retcode;
	git_buf remote_branch_name = GIT_BUF_INIT;
	git_reference *remote_ref = NULL;
	git_buf default_branch = GIT_BUF_INIT;

	GIT_ASSERT_ARG(remote);
	GIT_ASSERT_ARG(branch);

	if ((retcode = git_buf_printf(&remote_branch_name, GIT_REFS_REMOTES_DIR "%s/%s",
		git_remote_name(remote), branch)) < 0 )
		goto cleanup;

	if ((retcode = git_reference_lookup(&remote_ref, repo, git_buf_cstr(&remote_branch_name))) < 0)
		goto cleanup;

	if ((retcode = update_head_to_new_branch(repo, git_reference_target(remote_ref), branch,
			reflog_message)) < 0)
		goto cleanup;

	retcode = git_remote_default_branch(&default_branch, remote);

	if (retcode == GIT_ENOTFOUND) {
		/* no default branch on the remote: nothing to point the remote HEAD at */
		retcode = 0;
		goto cleanup;
	}

	if (retcode < 0)
		goto cleanup;

	/* The default branch is not covered by any refspec: leave remote HEAD alone */
	if (!git_remote__matching_refspec(remote, git_buf_cstr(&default_branch)))
		goto cleanup;

	retcode = update_remote_head(repo, remote, &default_branch, reflog_message);

cleanup:
	git_reference_free(remote_ref);
	git_buf_dispose(&remote_branch_name);
	git_buf_dispose(&default_branch);
	return retcode;
}
299 
/*
 * Repository-creation callback used when the caller supplies none:
 * forwards to git_repository_init() and ignores `payload`.
 */
static int default_repository_create(git_repository **out, const char *path, int bare, void *payload)
{
	int error;

	GIT_UNUSED(payload);

	error = git_repository_init(out, path, bare);
	return error;
}
306 
/*
 * Remote-creation callback used when the caller supplies none:
 * forwards to git_remote_create() and ignores `payload`.
 */
static int default_remote_create(
		git_remote **out,
		git_repository *repo,
		const char *name,
		const char *url,
		void *payload)
{
	int error;

	GIT_UNUSED(payload);

	error = git_remote_create(out, repo, name, url);
	return error;
}
318 
319 /*
320  * submodules?
321  */
322 
/*
 * Create the "origin" remote for a fresh clone.
 *
 * The remote is created through `options->remote_cb` when set (with
 * `options->remote_cb_payload`), otherwise through
 * default_remote_create() with a NULL payload.
 *
 * When `url` is a non-rooted path to an existing directory, it is first
 * resolved with p_realpath() so the remote stores the resolved path.
 *
 * On success `*out` receives the remote and 0 is returned; on failure
 * `*out` is not written.
 */
static int create_and_configure_origin(
		git_remote **out,
		git_repository *repo,
		const char *url,
		const git_clone_options *options)
{
	git_remote_create_cb create_cb = options->remote_cb;
	void *cb_payload = options->remote_cb_payload;
	git_remote *origin = NULL;
	char resolved[GIT_PATH_MAX];
	int error;

	/* If the path exists and is a dir, the url should be the absolute path */
	if (git_path_root(url) < 0 && git_path_exists(url) && git_path_isdir(url)) {
		if (p_realpath(url, resolved) == NULL)
			return -1;

		url = resolved;
	}

	if (create_cb == NULL) {
		create_cb = default_remote_create;
		cb_payload = NULL;
	}

	error = create_cb(&origin, repo, "origin", url, cb_payload);

	if (error < 0) {
		git_remote_free(origin);
		return error;
	}

	*out = origin;
	return 0;
}
358 
/*
 * Decide whether a working-tree checkout should follow the clone.
 *
 * No checkout happens for bare repositories, when no checkout options
 * were given, or when the strategy is GIT_CHECKOUT_NONE.  Otherwise a
 * checkout is wanted exactly when git_repository_head_unborn() returns 0.
 */
static bool should_checkout(
	git_repository *repo,
	bool is_bare,
	const git_checkout_options *opts)
{
	if (is_bare || !opts || opts->checkout_strategy == GIT_CHECKOUT_NONE)
		return false;

	return !git_repository_head_unborn(repo);
}
375 
/*
 * Set HEAD after a fetch and, if appropriate, check out the working tree.
 *
 * With a non-NULL `branch`, HEAD is pointed at that branch; otherwise it
 * is pointed at the same ref as the remote's HEAD.  The checkout itself
 * only runs when updating HEAD succeeded and should_checkout() agrees.
 */
static int checkout_branch(git_repository *repo, git_remote *remote, const git_checkout_options *co_opts, const char *branch, const char *reflog_message)
{
	int error = branch
		? update_head_to_branch(repo, remote, branch, reflog_message)
		: update_head_to_remote(repo, remote, reflog_message);

	if (error)
		return error;

	if (should_checkout(repo, git_repository_is_bare(repo), co_opts))
		error = git_checkout_head(repo, co_opts);

	return error;
}
391 
/*
 * Populate an empty repository by fetching from `_remote` and then
 * setting HEAD / checking out via checkout_branch().
 *
 * The remote is duplicated so the caller's instance is left alone, and
 * the fetch options are copied so that FETCH_HEAD updating can be
 * disabled and tag download forced to GIT_REMOTE_DOWNLOAD_TAGS_ALL
 * without touching the caller's structure.  `opts` must not be NULL.
 *
 * Returns -1 if `repo` is not empty, otherwise 0 on success or the error
 * of the failing step.
 */
static int clone_into(git_repository *repo, git_remote *_remote, const git_fetch_options *opts, const git_checkout_options *co_opts, const char *branch)
{
	int error;
	git_buf reflog_message = GIT_BUF_INIT;
	git_fetch_options fetch_opts;
	git_remote *remote;

	GIT_ASSERT_ARG(repo);
	GIT_ASSERT_ARG(_remote);

	if (!git_repository_is_empty(repo)) {
		git_error_set(GIT_ERROR_INVALID, "the repository is not empty");
		return -1;
	}

	if ((error = git_remote_dup(&remote, _remote)) < 0)
		return error;

	memcpy(&fetch_opts, opts, sizeof(git_fetch_options));
	fetch_opts.update_fetchhead = 0;
	fetch_opts.download_tags = GIT_REMOTE_DOWNLOAD_TAGS_ALL;

	/* Do not fetch with a missing or truncated reflog message */
	if ((error = git_buf_printf(&reflog_message, "clone: from %s", git_remote_url(remote))) < 0)
		goto cleanup;

	if ((error = git_remote_fetch(remote, NULL, &fetch_opts, git_buf_cstr(&reflog_message))) != 0)
		goto cleanup;

	error = checkout_branch(repo, remote, co_opts, branch, git_buf_cstr(&reflog_message));

cleanup:
	git_remote_free(remote);
	git_buf_dispose(&reflog_message);

	return error;
}
426 
/*
 * Decide whether a clone source should be handled by the local
 * (filesystem copy) code path.
 *
 * Returns 1 when the local path should be used, 0 when it should not,
 * and -1 when a local file URL could not be converted to a path.
 *
 * - GIT_CLONE_NO_LOCAL always yields 0.
 * - A plain path is local when it names a directory.
 * - A local file URL is local only when `local` is something other than
 *   GIT_CLONE_LOCAL_AUTO and the path it refers to is a directory.
 */
int git_clone__should_clone_local(const char *url_or_path, git_clone_local_t local)
{
	git_buf fromurl = GIT_BUF_INIT;
	const char *path = url_or_path;
	bool is_url;
	/* int, not bool: must be able to carry the -1 error result to the caller */
	int is_local;

	if (local == GIT_CLONE_NO_LOCAL)
		return 0;

	if ((is_url = git_path_is_local_file_url(url_or_path)) != 0) {
		if (git_path_fromurl(&fromurl, url_or_path) < 0) {
			is_local = -1;
			goto done;
		}

		path = fromurl.ptr;
	}

	is_local = (!is_url || local != GIT_CLONE_LOCAL_AUTO) &&
		git_path_isdir(path);

done:
	git_buf_dispose(&fromurl);
	return is_local;
}
452 
/*
 * Shared implementation behind git_clone() and git_clone__submodule().
 *
 * Steps: validate the options, make sure the destination is usable,
 * create the repository (through `repository_cb` if provided), create the
 * origin remote, then populate the repository through either the local or
 * the network code path.
 *
 * `use_existing` non-zero skips the "destination must be missing or an
 * empty directory" check.
 *
 * On failure after the repository was created, the repository is freed,
 * its files are removed (the root directory is kept if it existed before
 * the call) and the original error state is preserved across the cleanup.
 * `*out` is then set to NULL.
 */
static int git__clone(
	git_repository **out,
	const char *url,
	const char *local_path,
	const git_clone_options *_options,
	int use_existing)
{
	git_clone_options options = GIT_CLONE_OPTIONS_INIT;
	git_repository_create_cb create_repo = default_repository_create;
	git_repository *repo = NULL;
	git_remote *origin;
	uint32_t rmdir_flags = GIT_RMDIR_REMOVE_FILES;
	int error = 0;

	GIT_ASSERT_ARG(out);
	GIT_ASSERT_ARG(url);
	GIT_ASSERT_ARG(local_path);

	if (_options)
		memcpy(&options, _options, sizeof(git_clone_options));

	GIT_ERROR_CHECK_VERSION(&options, GIT_CLONE_OPTIONS_VERSION, "git_clone_options");

	/* Only clone to a new directory or an empty directory */
	if (git_path_exists(local_path) && !use_existing && !git_path_is_empty_dir(local_path)) {
		git_error_set(GIT_ERROR_INVALID,
			"'%s' exists and is not an empty directory", local_path);
		return GIT_EEXISTS;
	}

	/* Only remove the root directory on failure if we create it */
	if (git_path_exists(local_path))
		rmdir_flags |= GIT_RMDIR_SKIP_ROOT;

	/* A user-supplied callback takes precedence over the default */
	if (options.repository_cb)
		create_repo = options.repository_cb;

	error = create_repo(&repo, local_path, options.bare, options.repository_cb_payload);
	if (error < 0)
		return error;

	error = create_and_configure_origin(&origin, repo, url, &options);

	if (!error) {
		int link = options.local != GIT_CLONE_LOCAL_NO_LINKS;

		switch (git_clone__should_clone_local(url, options.local)) {
		case 1:
			error = clone_local_into(
				repo, origin, &options.fetch_opts, &options.checkout_opts,
				options.checkout_branch, link);
			break;
		case 0:
			error = clone_into(
				repo, origin, &options.fetch_opts, &options.checkout_opts,
				options.checkout_branch);
			break;
		default:
			error = -1;
			break;
		}

		git_remote_free(origin);
	}

	if (error != 0) {
		/* Cleanup may clobber the error state, so save and restore it */
		git_error_state last_error = {0};
		git_error_state_capture(&last_error, error);

		git_repository_free(repo);
		repo = NULL;

		(void)git_futils_rmdir_r(local_path, NULL, rmdir_flags);

		git_error_state_restore(&last_error);
	}

	*out = repo;
	return error;
}
528 
/*
 * Public entry point: clone `url` into `local_path`.
 *
 * Delegates to git__clone() with `use_existing` disabled, so the
 * destination must not exist or must be an empty directory.
 */
int git_clone(
	git_repository **out,
	const char *url,
	const char *local_path,
	const git_clone_options *_options)
{
	const int use_existing = 0;

	return git__clone(out, url, local_path, _options, use_existing);
}
537 
/*
 * Clone variant used for submodules.
 *
 * Delegates to git__clone() with `use_existing` enabled, which skips the
 * check that the destination is missing or an empty directory.
 */
int git_clone__submodule(
	git_repository **out,
	const char *url,
	const char *local_path,
	const git_clone_options *_options)
{
	const int use_existing = 1;

	return git__clone(out, url, local_path, _options, use_existing);
}
546 
/*
 * Initialize `opts` from the GIT_CLONE_OPTIONS_INIT template for the
 * given structure `version`.
 *
 * Returns 0 once the macro completes.
 * NOTE(review): GIT_INIT_STRUCTURE_FROM_TEMPLATE is defined elsewhere and
 * presumably returns early with an error on a version mismatch - confirm.
 */
int git_clone_options_init(git_clone_options *opts, unsigned int version)
{
	GIT_INIT_STRUCTURE_FROM_TEMPLATE(
		opts,
		version,
		git_clone_options,
		GIT_CLONE_OPTIONS_INIT);

	return 0;
}
553 
554 #ifndef GIT_DEPRECATE_HARD
/*
 * Older spelling of git_clone_options_init(), compiled only when
 * GIT_DEPRECATE_HARD is not defined.
 */
int git_clone_init_options(git_clone_options *opts, unsigned int version)
{
	int error = git_clone_options_init(opts, version);

	return error;
}
559 #endif
560 
/*
 * Report whether objects may be hard-linked from `src` to `dst` instead
 * of copied.
 *
 * Always false when GIT_WIN32 is defined.  Elsewhere, linking is allowed
 * only when `link` is non-zero, both paths can be stat'ed, and they are
 * on the same device (`st_dev`).
 */
static bool can_link(const char *src, const char *dst, int link)
{
#ifndef GIT_WIN32
	struct stat src_info, dst_info;

	if (!link || p_stat(src, &src_info) < 0 || p_stat(dst, &dst_info) < 0)
		return false;

	return src_info.st_dev == dst_info.st_dev;
#else
	GIT_UNUSED(src);
	GIT_UNUSED(dst);
	GIT_UNUSED(link);
	return false;
#endif
}
584 
/*
 * Populate an empty repository from a source repository on the local
 * filesystem.
 *
 * The source's object directory is copied (or hard-linked, when `link`
 * is set and can_link() allows it) into the destination's object
 * directory, after which a regular fetch is run and HEAD is set and
 * checked out via checkout_branch().
 *
 * Returns -1 if `repo` is not empty, otherwise 0 on success or the error
 * of the failing step.
 */
static int clone_local_into(git_repository *repo, git_remote *remote, const git_fetch_options *fetch_opts, const git_checkout_options *co_opts, const char *branch, int link)
{
	int error, flags;
	git_repository *src;
	git_buf src_odb = GIT_BUF_INIT, dst_odb = GIT_BUF_INIT, src_path = GIT_BUF_INIT;
	git_buf reflog_message = GIT_BUF_INIT;

	GIT_ASSERT_ARG(repo);
	GIT_ASSERT_ARG(remote);

	if (!git_repository_is_empty(repo)) {
		git_error_set(GIT_ERROR_INVALID, "the repository is not empty");
		return -1;
	}

	/*
	 * Let's figure out what path we should use for the source
	 * repo, if it's not rooted, the path should be relative to
	 * the repository's worktree/gitdir.
	 */
	if ((error = git_path_from_url_or_path(&src_path, git_remote_url(remote))) < 0) {
		/* the buffer may have been partially filled before the failure */
		git_buf_dispose(&src_path);
		return error;
	}

	/* Copy .git/objects/ from the source to the target */
	if ((error = git_repository_open(&src, git_buf_cstr(&src_path))) < 0) {
		git_buf_dispose(&src_path);
		return error;
	}

	if (git_repository_item_path(&src_odb, src, GIT_REPOSITORY_ITEM_OBJECTS) < 0
		|| git_repository_item_path(&dst_odb, repo, GIT_REPOSITORY_ITEM_OBJECTS) < 0) {
		error = -1;
		goto cleanup;
	}

	flags = 0;
	if (can_link(git_repository_path(src), git_repository_path(repo), link))
		flags |= GIT_CPDIR_LINK_FILES;

	error = git_futils_cp_r(git_buf_cstr(&src_odb), git_buf_cstr(&dst_odb),
				flags, GIT_OBJECT_DIR_MODE);

	/*
	 * can_link() doesn't catch all variations, so if we hit an
	 * error and did want to link, let's try again without trying
	 * to link.
	 */
	if (error < 0 && link) {
		flags &= ~GIT_CPDIR_LINK_FILES;
		error = git_futils_cp_r(git_buf_cstr(&src_odb), git_buf_cstr(&dst_odb),
					flags, GIT_OBJECT_DIR_MODE);
	}

	if (error < 0)
		goto cleanup;

	/* Do not fetch with a missing or truncated reflog message */
	if ((error = git_buf_printf(&reflog_message, "clone: from %s", git_remote_url(remote))) < 0)
		goto cleanup;

	if ((error = git_remote_fetch(remote, NULL, fetch_opts, git_buf_cstr(&reflog_message))) != 0)
		goto cleanup;

	error = checkout_branch(repo, remote, co_opts, branch, git_buf_cstr(&reflog_message));

cleanup:
	git_buf_dispose(&reflog_message);
	git_buf_dispose(&src_path);
	git_buf_dispose(&src_odb);
	git_buf_dispose(&dst_odb);
	git_repository_free(src);
	return error;
}
656