Revert "Add a helper function to compare file contents"
[alt-git.git] / path.c
blobd61f70e87d4cb8dcd34683a8df40ef8f4a2c27b5
1 /*
2 * Utilities for paths and pathnames
3 */
4 #include "cache.h"
5 #include "repository.h"
6 #include "strbuf.h"
7 #include "string-list.h"
8 #include "dir.h"
9 #include "worktree.h"
10 #include "submodule-config.h"
11 #include "path.h"
12 #include "packfile.h"
13 #include "object-store.h"
14 #include "lockfile.h"
15 #include "exec-cmd.h"
/*
 * Store the st_mode of `path` in *mode, using lstat() so that a symbolic
 * link is described itself rather than followed.
 *
 * Returns 0 on success, or -1 (leaving *mode untouched) if lstat() fails.
 */
static int get_st_mode_bits(const char *path, int *mode)
{
	struct stat info;

	if (lstat(path, &info) >= 0) {
		*mode = info.st_mode;
		return 0;
	}
	return -1;
}
/* Placeholder that mksnpath() copies into the caller's buffer on overflow. */
static char bad_path[] = "/bad-path/";
28 static struct strbuf *get_pathname(void)
30 static struct strbuf pathname_array[4] = {
31 STRBUF_INIT, STRBUF_INIT, STRBUF_INIT, STRBUF_INIT
33 static int index;
34 struct strbuf *sb = &pathname_array[index];
35 index = (index + 1) % ARRAY_SIZE(pathname_array);
36 strbuf_reset(sb);
37 return sb;
/*
 * Skip a leading "./" (and any further '/' characters that directly
 * follow it) and return a pointer into the same string.  Paths that do
 * not start with "./" are returned unchanged.
 */
static const char *cleanup_path(const char *path)
{
	if (skip_prefix(path, "./", &path))
		path += strspn(path, "/");
	return path;
}
50 static void strbuf_cleanup_path(struct strbuf *sb)
52 const char *path = cleanup_path(sb->buf);
53 if (path > sb->buf)
54 strbuf_remove(sb, 0, path - sb->buf);
57 char *mksnpath(char *buf, size_t n, const char *fmt, ...)
59 va_list args;
60 unsigned len;
62 va_start(args, fmt);
63 len = vsnprintf(buf, n, fmt, args);
64 va_end(args);
65 if (len >= n) {
66 strlcpy(buf, bad_path, n);
67 return buf;
69 return (char *)cleanup_path(buf);
/*
 * Return 1 if `buf` is exactly `dir`, or starts with `dir` followed by a
 * directory separator; 0 otherwise.
 */
static int dir_prefix(const char *buf, const char *dir)
{
	int len = strlen(dir);

	if (strncmp(buf, dir, len))
		return 0;
	return is_dir_sep(buf[len]) || buf[len] == '\0';
}
/*
 * $buf =~ m|$dir/+$file| but without regex: return 1 if `buf` consists of
 * `dir`, one or more directory separators, and then exactly `file`.
 */
static int is_dir_file(const char *buf, const char *dir, const char *file)
{
	size_t dir_len = strlen(dir);
	const char *rest;

	if (strncmp(buf, dir, dir_len))
		return 0;

	rest = buf + dir_len;
	if (!is_dir_sep(*rest))
		return 0;
	do {
		rest++;
	} while (is_dir_sep(*rest));

	return !strcmp(rest, file);
}
90 static void replace_dir(struct strbuf *buf, int len, const char *newdir)
92 int newlen = strlen(newdir);
93 int need_sep = (buf->buf[len] && !is_dir_sep(buf->buf[len])) &&
94 !is_dir_sep(newdir[newlen - 1]);
95 if (need_sep)
96 len--; /* keep one char, to be replaced with '/' */
97 strbuf_splice(buf, 0, len, newdir, newlen);
98 if (need_sep)
99 buf->buf[newlen] = '/';
/* One entry of the table of paths that relate to the common directory. */
struct common_dir {
	/* Not considered garbage for report_linked_checkout_garbage */
	unsigned ignore_garbage:1;
	/* The entry names a directory rather than a single file */
	unsigned is_dir:1;
	/* Belongs to the common dir, though it may contain paths that don't */
	unsigned is_common:1;
	const char *path;
};

/*
 * Table consulted by update_common_dir() (through the trie) and by
 * report_linked_checkout_garbage().  Flags that are not mentioned in an
 * entry are zero.  The list is terminated by an entry whose path is NULL.
 */
static struct common_dir common_list[] = {
	{ .is_dir = 1, .is_common = 1, .path = "branches" },
	{ .is_dir = 1, .is_common = 1, .path = "common" },
	{ .is_dir = 1, .is_common = 1, .path = "hooks" },
	{ .is_dir = 1, .is_common = 1, .path = "info" },
	{ .path = "info/sparse-checkout" },
	{ .ignore_garbage = 1, .is_dir = 1, .is_common = 1, .path = "logs" },
	{ .ignore_garbage = 1, .path = "logs/HEAD" },
	{ .is_dir = 1, .path = "logs/refs/bisect" },
	{ .is_dir = 1, .path = "logs/refs/rewritten" },
	{ .is_dir = 1, .path = "logs/refs/worktree" },
	{ .is_dir = 1, .is_common = 1, .path = "lost-found" },
	{ .is_dir = 1, .is_common = 1, .path = "objects" },
	{ .is_dir = 1, .is_common = 1, .path = "refs" },
	{ .is_dir = 1, .path = "refs/bisect" },
	{ .is_dir = 1, .path = "refs/rewritten" },
	{ .is_dir = 1, .path = "refs/worktree" },
	{ .is_dir = 1, .is_common = 1, .path = "remotes" },
	{ .is_dir = 1, .is_common = 1, .path = "worktrees" },
	{ .is_dir = 1, .is_common = 1, .path = "rr-cache" },
	{ .is_dir = 1, .is_common = 1, .path = "svn" },
	{ .is_common = 1, .path = "config" },
	{ .ignore_garbage = 1, .is_common = 1, .path = "gc.pid" },
	{ .is_common = 1, .path = "packed-refs" },
	{ .is_common = 1, .path = "shallow" },
	{ .path = NULL }
};
/*
 * A compressed trie.  A trie node consists of zero or more characters that
 * are common to all elements with this prefix, optionally followed by some
 * children.  If value is not NULL, the trie node is a terminal node.
 *
 * For example, consider the following set of strings:
 * abc
 * def
 * definite
 * definition
 *
 * The trie would look like:
 * root: len = 0, children a and d non-NULL, value = NULL.
 *    a: len = 2, contents = bc, value = (data for "abc")
 *    d: len = 2, contents = ef, children i non-NULL, value = (data for "def")
 *       i: len = 3, contents = nit, children e and i non-NULL, value = NULL
 *           e: len = 0, children all NULL, value = (data for "definite")
 *           i: len = 2, contents = on, children all NULL,
 *              value = (data for "definition")
 */
struct trie {
	/* Child nodes, indexed by the byte that leads to them. */
	struct trie *children[256];
	/* Number of bytes in `contents`. */
	int len;
	/* Compressed section; `len` bytes, not NUL-terminated by make_trie_node(). */
	char *contents;
	/* Payload of a terminal node, NULL otherwise. */
	void *value;
};
166 static struct trie *make_trie_node(const char *key, void *value)
168 struct trie *new_node = xcalloc(1, sizeof(*new_node));
169 new_node->len = strlen(key);
170 if (new_node->len) {
171 new_node->contents = xmalloc(new_node->len);
172 memcpy(new_node->contents, key, new_node->len);
174 new_node->value = value;
175 return new_node;
179 * Add a key/value pair to a trie. The key is assumed to be \0-terminated.
180 * If there was an existing value for this key, return it.
182 static void *add_to_trie(struct trie *root, const char *key, void *value)
184 struct trie *child;
185 void *old;
186 int i;
188 if (!*key) {
189 /* we have reached the end of the key */
190 old = root->value;
191 root->value = value;
192 return old;
195 for (i = 0; i < root->len; i++) {
196 if (root->contents[i] == key[i])
197 continue;
200 * Split this node: child will contain this node's
201 * existing children.
203 child = xmalloc(sizeof(*child));
204 memcpy(child->children, root->children, sizeof(root->children));
206 child->len = root->len - i - 1;
207 if (child->len) {
208 child->contents = xstrndup(root->contents + i + 1,
209 child->len);
211 child->value = root->value;
212 root->value = NULL;
213 root->len = i;
215 memset(root->children, 0, sizeof(root->children));
216 root->children[(unsigned char)root->contents[i]] = child;
218 /* This is the newly-added child. */
219 root->children[(unsigned char)key[i]] =
220 make_trie_node(key + i + 1, value);
221 return NULL;
224 /* We have matched the entire compressed section */
225 if (key[i]) {
226 child = root->children[(unsigned char)key[root->len]];
227 if (child) {
228 return add_to_trie(child, key + root->len + 1, value);
229 } else {
230 child = make_trie_node(key + root->len + 1, value);
231 root->children[(unsigned char)key[root->len]] = child;
232 return NULL;
236 old = root->value;
237 root->value = value;
238 return old;
241 typedef int (*match_fn)(const char *unmatched, void *value, void *baton);
244 * Search a trie for some key. Find the longest /-or-\0-terminated
245 * prefix of the key for which the trie contains a value. If there is
246 * no such prefix, return -1. Otherwise call fn with the unmatched
247 * portion of the key and the found value. If fn returns 0 or
248 * positive, then return its return value. If fn returns negative,
249 * then call fn with the next-longest /-terminated prefix of the key
250 * (i.e. a parent directory) for which the trie contains a value, and
251 * handle its return value the same way. If there is no shorter
252 * /-terminated prefix with a value left, then return the negative
253 * return value of the most recent fn invocation.
255 * The key is partially normalized: consecutive slashes are skipped.
257 * For example, consider the trie containing only [logs,
258 * logs/refs/bisect], both with values, but not logs/refs.
260 * | key | unmatched | prefix to node | return value |
261 * |--------------------|----------------|------------------|--------------|
262 * | a | not called | n/a | -1 |
263 * | logstore | not called | n/a | -1 |
264 * | logs | \0 | logs | as per fn |
265 * | logs/ | / | logs | as per fn |
266 * | logs/refs | /refs | logs | as per fn |
267 * | logs/refs/ | /refs/ | logs | as per fn |
268 * | logs/refs/b | /refs/b | logs | as per fn |
269 * | logs/refs/bisected | /refs/bisected | logs | as per fn |
270 * | logs/refs/bisect | \0 | logs/refs/bisect | as per fn |
271 * | logs/refs/bisect/ | / | logs/refs/bisect | as per fn |
272 * | logs/refs/bisect/a | /a | logs/refs/bisect | as per fn |
273 * | (If fn in the previous line returns -1, then fn is called once more:) |
274 * | logs/refs/bisect/a | /refs/bisect/a | logs | as per fn |
275 * |--------------------|----------------|------------------|--------------|
277 static int trie_find(struct trie *root, const char *key, match_fn fn,
278 void *baton)
280 int i;
281 int result;
282 struct trie *child;
284 if (!*key) {
285 /* we have reached the end of the key */
286 if (root->value && !root->len)
287 return fn(key, root->value, baton);
288 else
289 return -1;
292 for (i = 0; i < root->len; i++) {
293 /* Partial path normalization: skip consecutive slashes. */
294 if (key[i] == '/' && key[i+1] == '/') {
295 key++;
296 continue;
298 if (root->contents[i] != key[i])
299 return -1;
302 /* Matched the entire compressed section */
303 key += i;
304 if (!*key) {
305 /* End of key */
306 if (root->value)
307 return fn(key, root->value, baton);
308 else
309 return -1;
312 /* Partial path normalization: skip consecutive slashes */
313 while (key[0] == '/' && key[1] == '/')
314 key++;
316 child = root->children[(unsigned char)*key];
317 if (child)
318 result = trie_find(child, key + 1, fn, baton);
319 else
320 result = -1;
322 if (result >= 0 || (*key != '/' && *key != 0))
323 return result;
324 if (root->value)
325 return fn(key, root->value, baton);
326 else
327 return -1;
330 static struct trie common_trie;
331 static int common_trie_done_setup;
333 static void init_common_trie(void)
335 struct common_dir *p;
337 if (common_trie_done_setup)
338 return;
340 for (p = common_list; p->path; p++)
341 add_to_trie(&common_trie, p->path, p);
343 common_trie_done_setup = 1;
347 * Helper function for update_common_dir: returns 1 if the dir
348 * prefix is common.
350 static int check_common(const char *unmatched, void *value, void *baton)
352 struct common_dir *dir = value;
354 if (dir->is_dir && (unmatched[0] == 0 || unmatched[0] == '/'))
355 return dir->is_common;
357 if (!dir->is_dir && unmatched[0] == 0)
358 return dir->is_common;
360 return 0;
363 static void update_common_dir(struct strbuf *buf, int git_dir_len,
364 const char *common_dir)
366 char *base = buf->buf + git_dir_len;
367 int has_lock_suffix = strbuf_strip_suffix(buf, LOCK_SUFFIX);
369 init_common_trie();
370 if (trie_find(&common_trie, base, check_common, NULL) > 0)
371 replace_dir(buf, git_dir_len, common_dir);
373 if (has_lock_suffix)
374 strbuf_addstr(buf, LOCK_SUFFIX);
377 void report_linked_checkout_garbage(void)
379 struct strbuf sb = STRBUF_INIT;
380 const struct common_dir *p;
381 int len;
383 if (!the_repository->different_commondir)
384 return;
385 strbuf_addf(&sb, "%s/", get_git_dir());
386 len = sb.len;
387 for (p = common_list; p->path; p++) {
388 const char *path = p->path;
389 if (p->ignore_garbage)
390 continue;
391 strbuf_setlen(&sb, len);
392 strbuf_addstr(&sb, path);
393 if (file_exists(sb.buf))
394 report_garbage(PACKDIR_FILE_GARBAGE, sb.buf);
396 strbuf_release(&sb);
399 static void adjust_git_path(const struct repository *repo,
400 struct strbuf *buf, int git_dir_len)
402 const char *base = buf->buf + git_dir_len;
403 if (is_dir_file(base, "info", "grafts"))
404 strbuf_splice(buf, 0, buf->len,
405 repo->graft_file, strlen(repo->graft_file));
406 else if (!strcmp(base, "index"))
407 strbuf_splice(buf, 0, buf->len,
408 repo->index_file, strlen(repo->index_file));
409 else if (dir_prefix(base, "objects"))
410 replace_dir(buf, git_dir_len + 7, repo->objects->odb->path);
411 else if (git_hooks_path && dir_prefix(base, "hooks"))
412 replace_dir(buf, git_dir_len + 5, git_hooks_path);
413 else if (repo->different_commondir)
414 update_common_dir(buf, git_dir_len, repo->commondir);
417 static void strbuf_worktree_gitdir(struct strbuf *buf,
418 const struct repository *repo,
419 const struct worktree *wt)
421 if (!wt)
422 strbuf_addstr(buf, repo->gitdir);
423 else if (!wt->id)
424 strbuf_addstr(buf, repo->commondir);
425 else
426 strbuf_git_common_path(buf, repo, "worktrees/%s", wt->id);
429 static void do_git_path(const struct repository *repo,
430 const struct worktree *wt, struct strbuf *buf,
431 const char *fmt, va_list args)
433 int gitdir_len;
434 strbuf_worktree_gitdir(buf, repo, wt);
435 if (buf->len && !is_dir_sep(buf->buf[buf->len - 1]))
436 strbuf_addch(buf, '/');
437 gitdir_len = buf->len;
438 strbuf_vaddf(buf, fmt, args);
439 if (!wt)
440 adjust_git_path(repo, buf, gitdir_len);
441 strbuf_cleanup_path(buf);
444 char *repo_git_path(const struct repository *repo,
445 const char *fmt, ...)
447 struct strbuf path = STRBUF_INIT;
448 va_list args;
449 va_start(args, fmt);
450 do_git_path(repo, NULL, &path, fmt, args);
451 va_end(args);
452 return strbuf_detach(&path, NULL);
/*
 * Like repo_git_path(), but the path is appended to the caller's `sb`
 * (which is not reset first).
 */
void strbuf_repo_git_path(struct strbuf *sb,
			  const struct repository *repo,
			  const char *fmt, ...)
{
	va_list ap;

	va_start(ap, fmt);
	do_git_path(repo, NULL, sb, fmt, ap);
	va_end(ap);
}
465 char *git_path_buf(struct strbuf *buf, const char *fmt, ...)
467 va_list args;
468 strbuf_reset(buf);
469 va_start(args, fmt);
470 do_git_path(the_repository, NULL, buf, fmt, args);
471 va_end(args);
472 return buf->buf;
475 void strbuf_git_path(struct strbuf *sb, const char *fmt, ...)
477 va_list args;
478 va_start(args, fmt);
479 do_git_path(the_repository, NULL, sb, fmt, args);
480 va_end(args);
483 const char *git_path(const char *fmt, ...)
485 struct strbuf *pathname = get_pathname();
486 va_list args;
487 va_start(args, fmt);
488 do_git_path(the_repository, NULL, pathname, fmt, args);
489 va_end(args);
490 return pathname->buf;
493 char *git_pathdup(const char *fmt, ...)
495 struct strbuf path = STRBUF_INIT;
496 va_list args;
497 va_start(args, fmt);
498 do_git_path(the_repository, NULL, &path, fmt, args);
499 va_end(args);
500 return strbuf_detach(&path, NULL);
503 char *mkpathdup(const char *fmt, ...)
505 struct strbuf sb = STRBUF_INIT;
506 va_list args;
507 va_start(args, fmt);
508 strbuf_vaddf(&sb, fmt, args);
509 va_end(args);
510 strbuf_cleanup_path(&sb);
511 return strbuf_detach(&sb, NULL);
514 const char *mkpath(const char *fmt, ...)
516 va_list args;
517 struct strbuf *pathname = get_pathname();
518 va_start(args, fmt);
519 strbuf_vaddf(pathname, fmt, args);
520 va_end(args);
521 return cleanup_path(pathname->buf);
524 const char *worktree_git_path(const struct worktree *wt, const char *fmt, ...)
526 struct strbuf *pathname = get_pathname();
527 va_list args;
528 va_start(args, fmt);
529 do_git_path(the_repository, wt, pathname, fmt, args);
530 va_end(args);
531 return pathname->buf;
534 static void do_worktree_path(const struct repository *repo,
535 struct strbuf *buf,
536 const char *fmt, va_list args)
538 strbuf_addstr(buf, repo->worktree);
539 if(buf->len && !is_dir_sep(buf->buf[buf->len - 1]))
540 strbuf_addch(buf, '/');
542 strbuf_vaddf(buf, fmt, args);
543 strbuf_cleanup_path(buf);
546 char *repo_worktree_path(const struct repository *repo, const char *fmt, ...)
548 struct strbuf path = STRBUF_INIT;
549 va_list args;
551 if (!repo->worktree)
552 return NULL;
554 va_start(args, fmt);
555 do_worktree_path(repo, &path, fmt, args);
556 va_end(args);
558 return strbuf_detach(&path, NULL);
561 void strbuf_repo_worktree_path(struct strbuf *sb,
562 const struct repository *repo,
563 const char *fmt, ...)
565 va_list args;
567 if (!repo->worktree)
568 return;
570 va_start(args, fmt);
571 do_worktree_path(repo, sb, fmt, args);
572 va_end(args);
575 /* Returns 0 on success, negative on failure. */
576 static int do_submodule_path(struct strbuf *buf, const char *path,
577 const char *fmt, va_list args)
579 struct strbuf git_submodule_common_dir = STRBUF_INIT;
580 struct strbuf git_submodule_dir = STRBUF_INIT;
581 int ret;
583 ret = submodule_to_gitdir(&git_submodule_dir, path);
584 if (ret)
585 goto cleanup;
587 strbuf_complete(&git_submodule_dir, '/');
588 strbuf_addbuf(buf, &git_submodule_dir);
589 strbuf_vaddf(buf, fmt, args);
591 if (get_common_dir_noenv(&git_submodule_common_dir, git_submodule_dir.buf))
592 update_common_dir(buf, git_submodule_dir.len, git_submodule_common_dir.buf);
594 strbuf_cleanup_path(buf);
596 cleanup:
597 strbuf_release(&git_submodule_dir);
598 strbuf_release(&git_submodule_common_dir);
599 return ret;
602 char *git_pathdup_submodule(const char *path, const char *fmt, ...)
604 int err;
605 va_list args;
606 struct strbuf buf = STRBUF_INIT;
607 va_start(args, fmt);
608 err = do_submodule_path(&buf, path, fmt, args);
609 va_end(args);
610 if (err) {
611 strbuf_release(&buf);
612 return NULL;
614 return strbuf_detach(&buf, NULL);
/*
 * Append to `buf` a path inside the git directory of the submodule at
 * `path`.  Returns the result of do_submodule_path(): 0 on success,
 * negative on failure.
 */
int strbuf_git_path_submodule(struct strbuf *buf, const char *path,
			      const char *fmt, ...)
{
	va_list ap;
	int status;

	va_start(ap, fmt);
	status = do_submodule_path(buf, path, fmt, ap);
	va_end(ap);

	return status;
}
629 static void do_git_common_path(const struct repository *repo,
630 struct strbuf *buf,
631 const char *fmt,
632 va_list args)
634 strbuf_addstr(buf, repo->commondir);
635 if (buf->len && !is_dir_sep(buf->buf[buf->len - 1]))
636 strbuf_addch(buf, '/');
637 strbuf_vaddf(buf, fmt, args);
638 strbuf_cleanup_path(buf);
641 const char *git_common_path(const char *fmt, ...)
643 struct strbuf *pathname = get_pathname();
644 va_list args;
645 va_start(args, fmt);
646 do_git_common_path(the_repository, pathname, fmt, args);
647 va_end(args);
648 return pathname->buf;
/*
 * Append a path inside `repo`'s common directory to `sb`
 * (which is not reset first).
 */
void strbuf_git_common_path(struct strbuf *sb,
			    const struct repository *repo,
			    const char *fmt, ...)
{
	va_list ap;

	va_start(ap, fmt);
	do_git_common_path(repo, sb, fmt, ap);
	va_end(ap);
}
661 int validate_headref(const char *path)
663 struct stat st;
664 char buffer[256];
665 const char *refname;
666 struct object_id oid;
667 int fd;
668 ssize_t len;
670 if (lstat(path, &st) < 0)
671 return -1;
673 /* Make sure it is a "refs/.." symlink */
674 if (S_ISLNK(st.st_mode)) {
675 len = readlink(path, buffer, sizeof(buffer)-1);
676 if (len >= 5 && !memcmp("refs/", buffer, 5))
677 return 0;
678 return -1;
682 * Anything else, just open it and try to see if it is a symbolic ref.
684 fd = open(path, O_RDONLY);
685 if (fd < 0)
686 return -1;
687 len = read_in_full(fd, buffer, sizeof(buffer)-1);
688 close(fd);
690 if (len < 0)
691 return -1;
692 buffer[len] = '\0';
695 * Is it a symbolic ref?
697 if (skip_prefix(buffer, "ref:", &refname)) {
698 while (isspace(*refname))
699 refname++;
700 if (starts_with(refname, "refs/"))
701 return 0;
705 * Is this a detached HEAD?
707 if (!get_oid_hex(buffer, &oid))
708 return 0;
710 return -1;
/*
 * getpwnam() for a user name given as pointer plus length rather than as
 * a NUL-terminated string.  A temporary NUL-terminated copy is made and
 * freed again; the getpwnam() result is returned as is.
 */
static struct passwd *getpw_str(const char *username, size_t len)
{
	char *name = xmemdupz(username, len);
	struct passwd *entry = getpwnam(name);

	free(name);
	return entry;
}
723 * Return a string with ~ and ~user expanded via getpw*. Returns NULL on getpw
724 * failure or if path is NULL.
726 * If real_home is true, strbuf_realpath($HOME) is used in the `~/` expansion.
728 * If the path starts with `%(prefix)/`, the remainder is interpreted as
729 * relative to where Git is installed, and expanded to the absolute path.
731 char *interpolate_path(const char *path, int real_home)
733 struct strbuf user_path = STRBUF_INIT;
734 const char *to_copy = path;
736 if (!path)
737 goto return_null;
739 if (skip_prefix(path, "%(prefix)/", &path))
740 return system_path(path);
742 if (path[0] == '~') {
743 const char *first_slash = strchrnul(path, '/');
744 const char *username = path + 1;
745 size_t username_len = first_slash - username;
746 if (username_len == 0) {
747 const char *home = getenv("HOME");
748 if (!home)
749 goto return_null;
750 if (real_home)
751 strbuf_add_real_path(&user_path, home);
752 else
753 strbuf_addstr(&user_path, home);
754 #ifdef GIT_WINDOWS_NATIVE
755 convert_slashes(user_path.buf);
756 #endif
757 } else {
758 struct passwd *pw = getpw_str(username, username_len);
759 if (!pw)
760 goto return_null;
761 strbuf_addstr(&user_path, pw->pw_dir);
763 to_copy = first_slash;
765 strbuf_addstr(&user_path, to_copy);
766 return strbuf_detach(&user_path, NULL);
767 return_null:
768 strbuf_release(&user_path);
769 return NULL;
773 * First, one directory to try is determined by the following algorithm.
775 * (0) If "strict" is given, the path is used as given and no DWIM is
776 * done. Otherwise:
777 * (1) "~/path" to mean path under the running user's home directory;
778 * (2) "~user/path" to mean path under named user's home directory;
779 * (3) "relative/path" to mean cwd relative directory; or
780 * (4) "/absolute/path" to mean absolute directory.
782 * Unless "strict" is given, we check "%s/.git", "%s", "%s.git/.git", "%s.git"
783 * in this order. We select the first one that is a valid git repository, and
784 * chdir() to it. If none match, or we fail to chdir, we return NULL.
786 * If all goes well, we return the directory we used to chdir() (but
787 * before ~user is expanded), avoiding getcwd() resolving symbolic
788 * links. User relative paths are also returned as they are given,
789 * except DWIM suffixing.
791 const char *enter_repo(const char *path, int strict)
793 static struct strbuf validated_path = STRBUF_INIT;
794 static struct strbuf used_path = STRBUF_INIT;
796 if (!path)
797 return NULL;
799 if (!strict) {
800 static const char *suffix[] = {
801 "/.git", "", ".git/.git", ".git", NULL,
803 const char *gitfile;
804 int len = strlen(path);
805 int i;
806 while ((1 < len) && (path[len-1] == '/'))
807 len--;
810 * We can handle arbitrary-sized buffers, but this remains as a
811 * sanity check on untrusted input.
813 if (PATH_MAX <= len)
814 return NULL;
816 strbuf_reset(&used_path);
817 strbuf_reset(&validated_path);
818 strbuf_add(&used_path, path, len);
819 strbuf_add(&validated_path, path, len);
821 if (used_path.buf[0] == '~') {
822 char *newpath = interpolate_path(used_path.buf, 0);
823 if (!newpath)
824 return NULL;
825 strbuf_attach(&used_path, newpath, strlen(newpath),
826 strlen(newpath));
828 for (i = 0; suffix[i]; i++) {
829 struct stat st;
830 size_t baselen = used_path.len;
831 strbuf_addstr(&used_path, suffix[i]);
832 if (!stat(used_path.buf, &st) &&
833 (S_ISREG(st.st_mode) ||
834 (S_ISDIR(st.st_mode) && is_git_directory(used_path.buf)))) {
835 strbuf_addstr(&validated_path, suffix[i]);
836 break;
838 strbuf_setlen(&used_path, baselen);
840 if (!suffix[i])
841 return NULL;
842 gitfile = read_gitfile(used_path.buf);
843 die_upon_dubious_ownership(gitfile, NULL, used_path.buf);
844 if (gitfile) {
845 strbuf_reset(&used_path);
846 strbuf_addstr(&used_path, gitfile);
848 if (chdir(used_path.buf))
849 return NULL;
850 path = validated_path.buf;
852 else {
853 const char *gitfile = read_gitfile(path);
854 die_upon_dubious_ownership(gitfile, NULL, path);
855 if (gitfile)
856 path = gitfile;
857 if (chdir(path))
858 return NULL;
861 if (is_git_directory(".")) {
862 set_git_dir(".", 0);
863 check_repository_format(NULL);
864 return path;
867 return NULL;
/*
 * Compute the mode a path should have under the shared-repository
 * setting, given its current `mode`.
 *
 * The magnitude of get_shared_repository() supplies the permission bits
 * ("tweak").  Write bits are dropped from the tweak if the owner cannot
 * write, and read bits are copied to execute bits if the owner can
 * execute.  A negative setting replaces the low nine permission bits
 * with the tweak; a non-negative one ORs the tweak in.
 */
static int calc_shared_perm(int mode)
{
	int shared = get_shared_repository();
	int replace = shared < 0;
	int tweak = replace ? -shared : shared;

	if (!(mode & S_IWUSR))
		tweak &= ~0222;
	if (mode & S_IXUSR)
		/* Copy read bits to execute bits */
		tweak |= (tweak & 0444) >> 2;

	if (replace)
		return (mode & ~0777) | tweak;
	return mode | tweak;
}
893 int adjust_shared_perm(const char *path)
895 int old_mode, new_mode;
897 if (!get_shared_repository())
898 return 0;
899 if (get_st_mode_bits(path, &old_mode) < 0)
900 return -1;
902 new_mode = calc_shared_perm(old_mode);
903 if (S_ISDIR(old_mode)) {
904 /* Copy read bits to execute bits */
905 new_mode |= (new_mode & 0444) >> 2;
908 * g+s matters only if any extra access is granted
909 * based on group membership.
911 if (FORCE_DIR_SET_GID && (new_mode & 060))
912 new_mode |= FORCE_DIR_SET_GID;
915 if (((old_mode ^ new_mode) & ~S_IFMT) &&
916 chmod(path, (new_mode & ~S_IFMT)) < 0)
917 return -2;
918 return 0;
/*
 * Create directory `dir` with mode 0777.  An already existing directory
 * is silently accepted; any other mkdir() failure prints the error and
 * exits with status 1.  If the directory was newly created and `share`
 * is set, the shared-repository permissions are applied, dying on
 * failure.
 */
void safe_create_dir(const char *dir, int share)
{
	if (mkdir(dir, 0777) >= 0) {
		if (share && adjust_shared_perm(dir))
			die(_("Could not make %s writable by group"), dir);
		return;
	}

	if (errno == EEXIST)
		return;

	perror(dir);
	exit(1);
}
/*
 * Return non-zero if both paths are relative, or if both are absolute
 * and their first characters are equal ignoring case.
 */
static int have_same_root(const char *path1, const char *path2)
{
	int abs1 = is_absolute_path(path1);
	int abs2 = is_absolute_path(path2);

	if (abs1 && abs2)
		return tolower(path1[0]) == tolower(path2[0]);
	return !abs1 && !abs2;
}
944 * Give path as relative to prefix.
946 * The strbuf may or may not be used, so do not assume it contains the
947 * returned path.
949 const char *relative_path(const char *in, const char *prefix,
950 struct strbuf *sb)
952 int in_len = in ? strlen(in) : 0;
953 int prefix_len = prefix ? strlen(prefix) : 0;
954 int in_off = 0;
955 int prefix_off = 0;
956 int i = 0, j = 0;
958 if (!in_len)
959 return "./";
960 else if (!prefix_len)
961 return in;
963 if (have_same_root(in, prefix))
964 /* bypass dos_drive, for "c:" is identical to "C:" */
965 i = j = has_dos_drive_prefix(in);
966 else {
967 return in;
970 while (i < prefix_len && j < in_len && prefix[i] == in[j]) {
971 if (is_dir_sep(prefix[i])) {
972 while (is_dir_sep(prefix[i]))
973 i++;
974 while (is_dir_sep(in[j]))
975 j++;
976 prefix_off = i;
977 in_off = j;
978 } else {
979 i++;
980 j++;
984 if (
985 /* "prefix" seems like prefix of "in" */
986 i >= prefix_len &&
988 * but "/foo" is not a prefix of "/foobar"
989 * (i.e. prefix not end with '/')
991 prefix_off < prefix_len) {
992 if (j >= in_len) {
993 /* in="/a/b", prefix="/a/b" */
994 in_off = in_len;
995 } else if (is_dir_sep(in[j])) {
996 /* in="/a/b/c", prefix="/a/b" */
997 while (is_dir_sep(in[j]))
998 j++;
999 in_off = j;
1000 } else {
1001 /* in="/a/bbb/c", prefix="/a/b" */
1002 i = prefix_off;
1004 } else if (
1005 /* "in" is short than "prefix" */
1006 j >= in_len &&
1007 /* "in" not end with '/' */
1008 in_off < in_len) {
1009 if (is_dir_sep(prefix[i])) {
1010 /* in="/a/b", prefix="/a/b/c/" */
1011 while (is_dir_sep(prefix[i]))
1012 i++;
1013 in_off = in_len;
1016 in += in_off;
1017 in_len -= in_off;
1019 if (i >= prefix_len) {
1020 if (!in_len)
1021 return "./";
1022 else
1023 return in;
1026 strbuf_reset(sb);
1027 strbuf_grow(sb, in_len);
1029 while (i < prefix_len) {
1030 if (is_dir_sep(prefix[i])) {
1031 strbuf_addstr(sb, "../");
1032 while (is_dir_sep(prefix[i]))
1033 i++;
1034 continue;
1036 i++;
1038 if (!is_dir_sep(prefix[prefix_len - 1]))
1039 strbuf_addstr(sb, "../");
1041 strbuf_addstr(sb, in);
1043 return sb->buf;
1047 * A simpler implementation of relative_path
1049 * Get relative path by removing "prefix" from "in". This function
1050 * first appears in v1.5.6-1-g044bbbc, and makes git_dir shorter
1051 * to increase performance when traversing the path to work_tree.
1053 const char *remove_leading_path(const char *in, const char *prefix)
1055 static struct strbuf buf = STRBUF_INIT;
1056 int i = 0, j = 0;
1058 if (!prefix || !prefix[0])
1059 return in;
1060 while (prefix[i]) {
1061 if (is_dir_sep(prefix[i])) {
1062 if (!is_dir_sep(in[j]))
1063 return in;
1064 while (is_dir_sep(prefix[i]))
1065 i++;
1066 while (is_dir_sep(in[j]))
1067 j++;
1068 continue;
1069 } else if (in[j] != prefix[i]) {
1070 return in;
1072 i++;
1073 j++;
1075 if (
1076 /* "/foo" is a prefix of "/foo" */
1077 in[j] &&
1078 /* "/foo" is not a prefix of "/foobar" */
1079 !is_dir_sep(prefix[i-1]) && !is_dir_sep(in[j])
1081 return in;
1082 while (is_dir_sep(in[j]))
1083 j++;
1085 strbuf_reset(&buf);
1086 if (!in[j])
1087 strbuf_addstr(&buf, ".");
1088 else
1089 strbuf_addstr(&buf, in + j);
1090 return buf.buf;
/*
 * It is okay if dst == src, but they should not overlap otherwise.
 * The "dst" buffer must be at least as long as "src"; normalizing may shrink
 * the size of the path, but will never grow it.
 *
 * Performs the following normalizations on src, storing the result in dst:
 * - Ensures that components are separated by '/' (Windows only)
 * - Squashes sequences of '/' except "//server/share" on Windows
 * - Removes "." components.
 * - Removes ".." components, and the components the precede them.
 * Returns failure (non-zero) if a ".." component appears as first path
 * component anytime during the normalization. Otherwise, returns success (0).
 *
 * Note that this function is purely textual.  It does not follow symlinks,
 * verify the existence of the path, or make any system calls.
 *
 * prefix_len != NULL is for a specific case of prefix_pathspec():
 * assume that src == dst and src[0..prefix_len-1] is already
 * normalized, any time "../" eats up to the prefix_len part,
 * prefix_len is reduced. In the end prefix_len is the remaining
 * prefix that has not been overridden by user pathspec.
 *
 * NEEDSWORK: This function doesn't perform normalization w.r.t. trailing '/'.
 * For everything but the root folder itself, the normalized path should not
 * end with a '/', then the callers need to be fixed up accordingly.
 */
int normalize_path_copy_len(char *dst, const char *src, int *prefix_len)
{
	char *dst0;
	const char *root_end;

	/*
	 * Copy initial part of absolute path: "/", "C:/", "//server/share/".
	 */
	root_end = src + offset_1st_component(src);
	for (; src < root_end; src++) {
		char ch = *src;
		*dst++ = is_dir_sep(ch) ? '/' : ch;
	}
	dst0 = dst;

	while (is_dir_sep(*src))
		src++;

	for (;;) {
		char c = *src;

		/*
		 * A path component that begins with . could be
		 * special:
		 * (1) "." and ends   -- ignore and terminate.
		 * (2) "./"           -- ignore them, eat slash and continue.
		 * (3) ".." and ends  -- strip one and terminate.
		 * (4) "../"          -- strip one, eat slash and continue.
		 */
		if (c == '.') {
			if (!src[1]) {
				/* (1) */
				src++;
			} else if (is_dir_sep(src[1])) {
				/* (2) */
				src += 2;
				while (is_dir_sep(*src))
					src++;
				continue;
			} else if (src[1] == '.') {
				if (!src[2]) {
					/* (3) */
					src += 2;
					goto up_one;
				} else if (is_dir_sep(src[2])) {
					/* (4) */
					src += 3;
					while (is_dir_sep(*src))
						src++;
					goto up_one;
				}
			}
		}

		/* copy up to the next '/', and eat all '/' */
		while ((c = *src++) != '\0' && !is_dir_sep(c))
			*dst++ = c;
		if (!is_dir_sep(c))
			break;	/* c is '\0': end of input */
		*dst++ = '/';
		while (is_dir_sep(*src))
			src++;
		continue;

	up_one:
		/*
		 * dst0..dst is prefix portion, and dst[-1] is '/';
		 * go up one level.
		 */
		dst--;	/* go to trailing '/' */
		if (dst <= dst0)
			return -1;
		/* Windows: dst[-1] cannot be backslash anymore */
		while (dst0 < dst && dst[-1] != '/')
			dst--;
		if (prefix_len && *prefix_len > dst - dst0)
			*prefix_len = dst - dst0;
	}
	*dst = '\0';
	return 0;
}
/*
 * normalize_path_copy_len() without prefix-length tracking: normalize
 * `src` into `dst` and return that function's result.
 */
int normalize_path_copy(char *dst, const char *src)
{
	int *no_prefix_len = NULL;

	return normalize_path_copy_len(dst, src, no_prefix_len);
}
1212 * path = Canonical absolute path
1213 * prefixes = string_list containing normalized, absolute paths without
1214 * trailing slashes (except for the root directory, which is denoted by "/").
1216 * Determines, for each path in prefixes, whether the "prefix"
1217 * is an ancestor directory of path. Returns the length of the longest
1218 * ancestor directory, excluding any trailing slashes, or -1 if no prefix
1219 * is an ancestor. (Note that this means 0 is returned if prefixes is
1220 * ["/"].) "/foo" is not considered an ancestor of "/foobar". Directories
1221 * are not considered to be their own ancestors. path must be in a
1222 * canonical form: empty components, or "." or ".." components are not
1223 * allowed.
1225 int longest_ancestor_length(const char *path, struct string_list *prefixes)
1227 int i, max_len = -1;
1229 if (!strcmp(path, "/"))
1230 return -1;
1232 for (i = 0; i < prefixes->nr; i++) {
1233 const char *ceil = prefixes->items[i].string;
1234 int len = strlen(ceil);
1237 * For root directories (`/`, `C:/`, `//server/share/`)
1238 * adjust the length to exclude the trailing slash.
1240 if (len > 0 && ceil[len - 1] == '/')
1241 len--;
1243 if (strncmp(path, ceil, len) ||
1244 path[len] != '/' || !path[len + 1])
1245 continue; /* no match */
1247 if (len > max_len)
1248 max_len = len;
1251 return max_len;
/*
 * Strip an arbitrary amount of directory separators at the end of path.
 *
 * Only the first len bytes of path are considered; the return value is
 * the length that remains once trailing separators are dropped (possibly
 * 0).  The string itself is not modified.
 */
static inline int chomp_trailing_dir_sep(const char *path, int len)
{
	while (len && is_dir_sep(path[len - 1]))
		len--;
	return len;
}
/*
 * If path ends with suffix (complete path components), returns the offset of
 * the last character in the path before the suffix (sans trailing directory
 * separators), and -1 otherwise.
 */
static ssize_t stripped_path_suffix_offset(const char *path, const char *suffix)
{
	int path_len = strlen(path), suffix_len = strlen(suffix);

	/* Walk both strings backwards until the suffix is used up. */
	while (suffix_len) {
		if (!path_len)
			return -1;

		if (is_dir_sep(path[path_len - 1])) {
			/*
			 * A run of separators in path must line up with a
			 * run of separators in suffix; the runs may differ
			 * in length.
			 */
			if (!is_dir_sep(suffix[suffix_len - 1]))
				return -1;
			path_len = chomp_trailing_dir_sep(path, path_len);
			suffix_len = chomp_trailing_dir_sep(suffix, suffix_len);
		} else if (path[--path_len] != suffix[--suffix_len]) {
			return -1;
		}
	}

	/* The suffix must start on a component boundary in path. */
	if (path_len && !is_dir_sep(path[path_len - 1]))
		return -1;
	return chomp_trailing_dir_sep(path, path_len);
}
/*
 * Returns true if the path ends with components, considering only complete path
 * components, and false otherwise.
 */
int ends_with_path_components(const char *path, const char *components)
{
	return stripped_path_suffix_offset(path, components) != -1;
}
/*
 * If path ends with suffix (complete path components), returns the
 * part before suffix (sans trailing directory separators), as a copy
 * made with xstrndup().
 * Otherwise returns NULL.
 */
char *strip_path_suffix(const char *path, const char *suffix)
{
	ssize_t offset = stripped_path_suffix_offset(path, suffix);

	return offset == -1 ? NULL : xstrndup(path, offset);
}
/*
 * Reject paths that contain aliasing components.
 *
 * Returns -1 when p is NULL, does not start with '/' or '~', or contains
 * an empty component ("//") or a component that consists solely of one
 * or two dots ("/./", "/../", or a trailing "/." or "/..").  Returns 0
 * otherwise.  The first character is treated like a separator, so a '/'
 * directly after it (e.g. "~/x") is rejected as well.  A trailing slash
 * is accepted, and a component of three or more dots counts as an
 * ordinary name.
 */
int daemon_avoid_alias(const char *p)
{
	int sl, ndot;

	/*
	 * This resurrects the belts and suspenders paranoia check by HPA
	 * done in <435560F7.4080006@zytor.com> thread, now enter_repo()
	 * does not do getcwd() based path canonicalization.
	 *
	 * sl becomes true immediately after seeing '/' and continues to
	 * be true as long as dots continue after that without intervening
	 * non-dot character.
	 */
	if (!p || (*p != '/' && *p != '~'))
		return -1;
	sl = 1;
	ndot = 0;
	p++;

	for (;;) {
		char ch = *p++;

		if (sl) {
			if (ch == '.') {
				ndot++;
			} else if (ch == '/') {
				if (ndot < 3)
					/* reject //, /./ and /../ */
					return -1;
				ndot = 0;
			} else if (ch == 0) {
				if (0 < ndot && ndot < 3)
					/* reject /.$ and /..$ */
					return -1;
				return 0;
			} else {
				sl = ndot = 0;
			}
		} else if (ch == 0) {
			return 0;
		} else if (ch == '/') {
			sl = 1;
			ndot = 0;
		}
	}
}
/*
 * On NTFS, we need to be careful to disallow certain synonyms of the `.git/`
 * directory:
 *
 * - For historical reasons, file names that end in spaces or periods are
 *   automatically trimmed. Therefore, `.git . . ./` is a valid way to refer
 *   to `.git/`.
 *
 * - For other historical reasons, file names that do not conform to the 8.3
 *   format (up to eight characters for the basename, three for the file
 *   extension, certain characters not allowed such as `+`, etc) are associated
 *   with a so-called "short name", at least on the `C:` drive by default.
 *   Which means that `git~1/` is a valid way to refer to `.git/`.
 *
 *   Note: Technically, `.git/` could receive the short name `git~2` if the
 *   short name `git~1` were already used. In Git, however, we guarantee that
 *   `.git` is the first item in a directory, therefore it will be associated
 *   with the short name `git~1` (unless short names are disabled).
 *
 * - For yet other historical reasons, NTFS supports so-called "Alternate Data
 *   Streams", i.e. metadata associated with a given file, referred to via
 *   `<filename>:<stream-name>:<stream-type>`. There exists a default stream
 *   type for directories, allowing `.git/` to be accessed via
 *   `.git::$INDEX_ALLOCATION/`.
 *
 * When this function returns 1, it indicates that the specified file/directory
 * name refers to a `.git` file or directory, or to any of these synonyms, and
 * Git should therefore not track it.
 *
 * For performance reasons, _all_ Alternate Data Streams of `.git/` are
 * forbidden, not just `::$INDEX_ALLOCATION`.
 *
 * This function is intended to be used by `git fsck` even on platforms where
 * the backslash is a regular filename character, therefore it needs to handle
 * backslash characters in the provided `name` specially: they are interpreted
 * as directory separators.
 */
int is_ntfs_dotgit(const char *name)
{
	char c;

	/*
	 * Note that when we don't find `.git` or `git~1` we end up with `name`
	 * advanced partway through the string. That's okay, though, as we
	 * return immediately in those cases, without looking at `name` any
	 * further.
	 */
	c = *(name++);
	if (c == '.') {
		/* .git */
		if (((c = *(name++)) != 'g' && c != 'G') ||
		    ((c = *(name++)) != 'i' && c != 'I') ||
		    ((c = *(name++)) != 't' && c != 'T'))
			return 0;
	} else if (c == 'g' || c == 'G') {
		/* git ~1 */
		if (((c = *(name++)) != 'i' && c != 'I') ||
		    ((c = *(name++)) != 't' && c != 'T') ||
		    *(name++) != '~' ||
		    *(name++) != '1')
			return 0;
	} else {
		return 0;
	}

	/*
	 * Only spaces and periods may follow before the name ends, either
	 * at NUL, at a directory separator, or at ':' (the start of an
	 * Alternate Data Stream suffix).
	 */
	for (;;) {
		c = *(name++);
		if (!c || is_xplatform_dir_sep(c) || c == ':')
			return 1;
		if (c != '.' && c != ' ')
			return 0;
	}
}
/*
 * Returns 1 if, starting at offset i, name holds nothing but spaces and
 * periods up to its terminating NUL or a ':'; returns 0 otherwise.
 */
static int ntfs_only_spaces_and_periods(const char *name, size_t i)
{
	for (;;) {
		char c = name[i++];

		if (!c || c == ':')
			return 1;
		if (c != ' ' && c != '.')
			return 0;
	}
}

/*
 * Checks whether name is `.<dotgit_name>` or one of the spellings this
 * function treats as an NTFS synonym of it.
 *
 * name:        the file name to examine
 * dotgit_name: the name without its leading dot (e.g. "gitmodules")
 * len:         length of dotgit_name
 * dotgit_ntfs_shortname_prefix:
 *              the six lower-case characters a fall-back short name is
 *              expected to begin with (e.g. "gi7eba")
 *
 * Three spellings are recognized, each compared case-insensitively and
 * each allowed to be followed only by spaces and periods up to NUL or ':':
 *   - `.` followed by dotgit_name;
 *   - the first six characters of dotgit_name followed by `~1` ... `~4`;
 *   - a fall-back short name: a leading part of the given prefix, then
 *     `~` and digits, eight characters in total.
 *
 * Returns 1 on a match and 0 otherwise.
 */
static int is_ntfs_dot_generic(const char *name,
			       const char *dotgit_name,
			       size_t len,
			       const char *dotgit_ntfs_shortname_prefix)
{
	int saw_tilde;
	size_t i;

	if (name[0] == '.' && !strncasecmp(name + 1, dotgit_name, len))
		return ntfs_only_spaces_and_periods(name, len + 1);

	/*
	 * Is it a regular NTFS short name, i.e. shortened to 6 characters,
	 * followed by ~1, ... ~4?
	 */
	if (!strncasecmp(name, dotgit_name, 6) && name[6] == '~' &&
	    name[7] >= '1' && name[7] <= '4')
		return ntfs_only_spaces_and_periods(name, 8);

	/*
	 * Is it a fall-back NTFS short name (for details, see
	 * https://en.wikipedia.org/wiki/8.3_filename)?
	 */
	for (i = 0, saw_tilde = 0; i < 8; i++) {
		if (name[i] == '\0') {
			return 0;
		} else if (saw_tilde) {
			if (name[i] < '0' || name[i] > '9')
				return 0;
		} else if (name[i] == '~') {
			/* The first digit after the tilde must not be 0. */
			if (name[++i] < '1' || name[i] > '9')
				return 0;
			saw_tilde = 1;
		} else if (i >= 6) {
			return 0;
		} else if (name[i] & 0x80) {
			/*
			 * We know our needles contain only ASCII, so we clamp
			 * here to make the results of tolower() sane.
			 */
			return 0;
		} else if (tolower((unsigned char)name[i]) !=
			   dotgit_ntfs_shortname_prefix[i]) {
			return 0;
		}
	}

	return ntfs_only_spaces_and_periods(name, i);
}
/*
 * Inline helper to make sure compiler resolves strlen() on literals at
 * compile time.
 *
 * Forwards to is_ntfs_dot_generic() with strlen(dotgit_name) as the
 * length argument and returns its result.
 */
static inline int is_ntfs_dot_str(const char *name, const char *dotgit_name,
				  const char *dotgit_ntfs_shortname_prefix)
{
	return is_ntfs_dot_generic(name, dotgit_name, strlen(dotgit_name),
				   dotgit_ntfs_shortname_prefix);
}
/*
 * Returns 1 if name is `.gitmodules` or a spelling that
 * is_ntfs_dot_generic() treats as an NTFS synonym of it (fall-back
 * short-name prefix "gi7eba"), 0 otherwise.
 */
int is_ntfs_dotgitmodules(const char *name)
{
	return is_ntfs_dot_str(name, "gitmodules", "gi7eba");
}
/*
 * Returns 1 if name is `.gitignore` or a spelling that
 * is_ntfs_dot_generic() treats as an NTFS synonym of it (fall-back
 * short-name prefix "gi250a"), 0 otherwise.
 */
int is_ntfs_dotgitignore(const char *name)
{
	return is_ntfs_dot_str(name, "gitignore", "gi250a");
}
/*
 * Returns 1 if name is `.gitattributes` or a spelling that
 * is_ntfs_dot_generic() treats as an NTFS synonym of it (fall-back
 * short-name prefix "gi7d29"), 0 otherwise.
 */
int is_ntfs_dotgitattributes(const char *name)
{
	return is_ntfs_dot_str(name, "gitattributes", "gi7d29");
}
/*
 * Returns 1 if name is `.mailmap` or a spelling that
 * is_ntfs_dot_generic() treats as an NTFS synonym of it (fall-back
 * short-name prefix "maba30"), 0 otherwise.
 */
int is_ntfs_dotmailmap(const char *name)
{
	return is_ntfs_dot_str(name, "mailmap", "maba30");
}
/*
 * Returns non-zero if str is non-NULL and begins with '-', and 0
 * otherwise (including for NULL and for the empty string).
 */
int looks_like_command_line_option(const char *str)
{
	return str && str[0] == '-';
}
/*
 * Builds the path of a configuration file below the XDG config directory.
 *
 * Returns the result of mkpathdup() for
 *   - "$XDG_CONFIG_HOME/<subdir>/<filename>" if XDG_CONFIG_HOME is set
 *     and non-empty, else
 *   - "$HOME/.config/<subdir>/<filename>" if HOME is set,
 * and NULL if neither variable is usable.  Both subdir and filename must
 * be non-NULL (asserted).
 *
 * NOTE(review): the returned string presumably is heap-allocated by
 * mkpathdup() and owned by the caller -- confirm against its definition.
 */
char *xdg_config_home_for(const char *subdir, const char *filename)
{
	const char *home, *config_home;

	assert(subdir);
	assert(filename);
	config_home = getenv("XDG_CONFIG_HOME");
	if (config_home && *config_home)
		return mkpathdup("%s/%s/%s", config_home, subdir, filename);

	home = getenv("HOME");
	if (home)
		return mkpathdup("%s/.config/%s/%s", home, subdir, filename);

	return NULL;
}
/*
 * Same as xdg_config_home_for() with the subdirectory fixed to "git".
 */
char *xdg_config_home(const char *filename)
{
	return xdg_config_home_for("git", filename);
}
/*
 * Builds the path of a file below Git's XDG cache directory.
 *
 * Returns the result of mkpathdup() for
 *   - "$XDG_CACHE_HOME/git/<filename>" if XDG_CACHE_HOME is set and
 *     non-empty, else
 *   - "$HOME/.cache/git/<filename>" if HOME is set,
 * and NULL if neither variable is usable.  filename must be non-NULL
 * (asserted).
 *
 * NOTE(review): the returned string presumably is heap-allocated by
 * mkpathdup() and owned by the caller -- confirm against its definition.
 */
char *xdg_cache_home(const char *filename)
{
	const char *home, *cache_home;

	assert(filename);
	cache_home = getenv("XDG_CACHE_HOME");
	if (cache_home && *cache_home)
		return mkpathdup("%s/git/%s", cache_home, filename);

	home = getenv("HOME");
	if (home)
		return mkpathdup("%s/.cache/git/%s", home, filename);
	return NULL;
}
1562 REPO_GIT_PATH_FUNC(squash_msg, "SQUASH_MSG")
1563 REPO_GIT_PATH_FUNC(merge_msg, "MERGE_MSG")
1564 REPO_GIT_PATH_FUNC(merge_rr, "MERGE_RR")
1565 REPO_GIT_PATH_FUNC(merge_mode, "MERGE_MODE")
1566 REPO_GIT_PATH_FUNC(merge_head, "MERGE_HEAD")
1567 REPO_GIT_PATH_FUNC(merge_autostash, "MERGE_AUTOSTASH")
1568 REPO_GIT_PATH_FUNC(auto_merge, "AUTO_MERGE")
1569 REPO_GIT_PATH_FUNC(fetch_head, "FETCH_HEAD")
1570 REPO_GIT_PATH_FUNC(shallow, "shallow")