1/*
2 * Utilities for paths and pathnames
3 */
4#include "cache.h"
5#include "strbuf.h"
6#include "string-list.h"
7
8#ifndef get_st_mode_bits
9/*
10 * The replacement lstat(2) we use on Cygwin is incomplete and
11 * may return wrong permission bits. Most of the time we do not care,
12 * but the callsites of this wrapper do care.
13 */
/*
 * Fetch the mode bits of "path" via lstat(2) (so a symlink itself is
 * examined, not its target) and store them in *mode.
 *
 * Returns 0 on success, -1 if lstat() fails; *mode is left untouched
 * on failure.
 */
int get_st_mode_bits(const char *path, int *mode)
{
	struct stat info;
	int failed = lstat(path, &info) < 0;

	if (!failed)
		*mode = info.st_mode;
	return failed ? -1 : 0;
}
22#endif
23
/*
 * Sentinel path returned (or copied into the caller's buffer) by the
 * path-formatting helpers in this file when the result does not fit.
 */
static char bad_path[] = "/bad-path/";
25
/*
 * Hand out one of four static, PATH_MAX-sized scratch buffers in
 * round-robin order.  A returned buffer is overwritten again after
 * four further calls, so callers must not hold on to it for long.
 */
static char *get_pathname(void)
{
	static char pathname_array[4][PATH_MAX];
	/*
	 * Kept in the range 0..3 so the counter can never overflow, and
	 * not named "index" to avoid shadowing the libc function.
	 */
	static unsigned int slot;

	slot = (slot + 1) & 3;
	return pathname_array[slot];
}
32
/*
 * Skip a leading "./" and any '/' characters that directly follow it.
 *
 * Returns a pointer into "path"; nothing is copied or modified.
 */
static char *cleanup_path(char *path)
{
	/*
	 * strncmp() stops at the terminating NUL, so an empty or
	 * one-character path is never read past its end (memcmp() with
	 * a fixed length of 2 gives no such guarantee).
	 */
	if (!strncmp(path, "./", 2)) {
		path += 2;
		while (*path == '/')
			path++;
	}
	return path;
}
43
44char *mksnpath(char *buf, size_t n, const char *fmt, ...)
45{
46 va_list args;
47 unsigned len;
48
49 va_start(args, fmt);
50 len = vsnprintf(buf, n, fmt, args);
51 va_end(args);
52 if (len >= n) {
53 strlcpy(buf, bad_path, n);
54 return buf;
55 }
56 return cleanup_path(buf);
57}
58
59static char *vsnpath(char *buf, size_t n, const char *fmt, va_list args)
60{
61 const char *git_dir = get_git_dir();
62 size_t len;
63
64 len = strlen(git_dir);
65 if (n < len + 1)
66 goto bad;
67 memcpy(buf, git_dir, len);
68 if (len && !is_dir_sep(git_dir[len-1]))
69 buf[len++] = '/';
70 len += vsnprintf(buf + len, n - len, fmt, args);
71 if (len >= n)
72 goto bad;
73 return cleanup_path(buf);
74bad:
75 strlcpy(buf, bad_path, n);
76 return buf;
77}
78
/*
 * Variadic front end to vsnpath(): format a path below the git
 * directory into the caller's buffer "buf" of size "n" and return
 * whatever vsnpath() returns.
 */
char *git_snpath(char *buf, size_t n, const char *fmt, ...)
{
	va_list ap;
	char *result;

	va_start(ap, fmt);
	result = vsnpath(buf, n, fmt, ap);
	va_end(ap);

	return result;
}
88
89char *git_pathdup(const char *fmt, ...)
90{
91 char path[PATH_MAX], *ret;
92 va_list args;
93 va_start(args, fmt);
94 ret = vsnpath(path, sizeof(path), fmt, args);
95 va_end(args);
96 return xstrdup(ret);
97}
98
99char *mkpathdup(const char *fmt, ...)
100{
101 char *path;
102 struct strbuf sb = STRBUF_INIT;
103 va_list args;
104
105 va_start(args, fmt);
106 strbuf_vaddf(&sb, fmt, args);
107 va_end(args);
108 path = xstrdup(cleanup_path(sb.buf));
109
110 strbuf_release(&sb);
111 return path;
112}
113
114char *mkpath(const char *fmt, ...)
115{
116 va_list args;
117 unsigned len;
118 char *pathname = get_pathname();
119
120 va_start(args, fmt);
121 len = vsnprintf(pathname, PATH_MAX, fmt, args);
122 va_end(args);
123 if (len >= PATH_MAX)
124 return bad_path;
125 return cleanup_path(pathname);
126}
127
128char *git_path(const char *fmt, ...)
129{
130 char *pathname = get_pathname();
131 va_list args;
132 char *ret;
133
134 va_start(args, fmt);
135 ret = vsnpath(pathname, PATH_MAX, fmt, args);
136 va_end(args);
137 return ret;
138}
139
/*
 * Compute the per-user configuration file locations.
 *
 *  - *global receives "$HOME/.gitconfig", or NULL when HOME is unset.
 *  - *xdg receives "<xdg_home>/git/<file>", where <xdg_home> is
 *    $XDG_CONFIG_HOME if set, else "$HOME/.config"; it receives NULL
 *    when neither variable is set.
 *
 * Either output pointer may be NULL, in which case that location is
 * not reported.  Non-NULL results come from mkpathdup().
 */
void home_config_paths(char **global, char **xdg, char *file)
{
	char *xdg_home = getenv("XDG_CONFIG_HOME");
	char *home = getenv("HOME");
	char *to_free = NULL;

	if (!home) {
		if (global)
			*global = NULL;
	} else {
		if (!xdg_home) {
			/* Fall back to the default XDG location. */
			to_free = mkpathdup("%s/.config", home);
			xdg_home = to_free;
		}
		if (global)
			*global = mkpathdup("%s/.gitconfig", home);
	}

	/* Guard xdg the same way global is guarded above. */
	if (xdg) {
		if (!xdg_home)
			*xdg = NULL;
		else
			*xdg = mkpathdup("%s/git/%s", xdg_home, file);
	}

	free(to_free);
}
165
166char *git_path_submodule(const char *path, const char *fmt, ...)
167{
168 char *pathname = get_pathname();
169 struct strbuf buf = STRBUF_INIT;
170 const char *git_dir;
171 va_list args;
172 unsigned len;
173
174 len = strlen(path);
175 if (len > PATH_MAX-100)
176 return bad_path;
177
178 strbuf_addstr(&buf, path);
179 if (len && path[len-1] != '/')
180 strbuf_addch(&buf, '/');
181 strbuf_addstr(&buf, ".git");
182
183 git_dir = read_gitfile(buf.buf);
184 if (git_dir) {
185 strbuf_reset(&buf);
186 strbuf_addstr(&buf, git_dir);
187 }
188 strbuf_addch(&buf, '/');
189
190 if (buf.len >= PATH_MAX)
191 return bad_path;
192 memcpy(pathname, buf.buf, buf.len + 1);
193
194 strbuf_release(&buf);
195 len = strlen(pathname);
196
197 va_start(args, fmt);
198 len += vsnprintf(pathname + len, PATH_MAX - len, fmt, args);
199 va_end(args);
200 if (len >= PATH_MAX)
201 return bad_path;
202 return cleanup_path(pathname);
203}
204
/*
 * Check whether the file at "path" looks like a valid HEAD.
 *
 * Accepted forms:
 *  - a symbolic link whose target starts with "refs/";
 *  - a file starting with "ref:", optional whitespace, then "refs/";
 *  - a file whose contents get_sha1_hex() accepts (detached HEAD).
 *
 * Returns 0 when one of these matches, -1 otherwise (including when
 * the file cannot be examined or read).
 */
int validate_headref(const char *path)
{
	struct stat st;
	char *buf, buffer[256];
	unsigned char sha1[20];
	int fd;
	ssize_t len;

	if (lstat(path, &st) < 0)
		return -1;

	/* Make sure it is a "refs/.." symlink */
	if (S_ISLNK(st.st_mode)) {
		len = readlink(path, buffer, sizeof(buffer)-1);
		/* A failed readlink() yields -1, which fails this test too. */
		if (len >= 5 && !memcmp("refs/", buffer, 5))
			return 0;
		return -1;
	}

	/*
	 * Anything else, just open it and try to see if it is a symbolic ref.
	 */
	fd = open(path, O_RDONLY);
	if (fd < 0)
		return -1;
	len = read_in_full(fd, buffer, sizeof(buffer)-1);
	close(fd);

	/*
	 * Is it a symbolic ref?
	 */
	if (len < 4)
		return -1;
	/*
	 * At most sizeof(buffer)-1 bytes were read, so buffer[len] is in
	 * bounds.  Terminate the data so that get_sha1_hex() below, which
	 * is given no length, cannot run into uninitialized bytes.
	 */
	buffer[len] = '\0';
	if (!memcmp("ref:", buffer, 4)) {
		buf = buffer + 4;
		len -= 4;
		while (len && isspace(*buf))
			buf++, len--;
		if (len >= 5 && !memcmp("refs/", buf, 5))
			return 0;
	}

	/*
	 * Is this a detached HEAD?
	 */
	if (!get_sha1_hex(buffer, sha1))
		return 0;

	return -1;
}
255
/*
 * Look up the passwd entry for the user named by the first "len"
 * bytes of "username" (which need not be NUL-terminated).
 *
 * Returns whatever getpwnam() returns for that name.
 */
static struct passwd *getpw_str(const char *username, size_t len)
{
	char *name = xmalloc(len + 1);
	struct passwd *entry;

	/* getpwnam() needs a NUL-terminated string, so make a copy. */
	memcpy(name, username, len);
	name[len] = '\0';

	entry = getpwnam(name);
	free(name);
	return entry;
}
266
267/*
268 * Return a string with ~ and ~user expanded via getpw*. If buf != NULL,
269 * then it is a newly allocated string. Returns NULL on getpw failure or
270 * if path is NULL.
271 */
272char *expand_user_path(const char *path)
273{
274 struct strbuf user_path = STRBUF_INIT;
275 const char *first_slash = strchrnul(path, '/');
276 const char *to_copy = path;
277
278 if (path == NULL)
279 goto return_null;
280 if (path[0] == '~') {
281 const char *username = path + 1;
282 size_t username_len = first_slash - username;
283 if (username_len == 0) {
284 const char *home = getenv("HOME");
285 if (!home)
286 goto return_null;
287 strbuf_add(&user_path, home, strlen(home));
288 } else {
289 struct passwd *pw = getpw_str(username, username_len);
290 if (!pw)
291 goto return_null;
292 strbuf_add(&user_path, pw->pw_dir, strlen(pw->pw_dir));
293 }
294 to_copy = first_slash;
295 }
296 strbuf_add(&user_path, to_copy, strlen(to_copy));
297 return strbuf_detach(&user_path, NULL);
298return_null:
299 strbuf_release(&user_path);
300 return NULL;
301}
302
303/*
304 * First, one directory to try is determined by the following algorithm.
305 *
306 * (0) If "strict" is given, the path is used as given and no DWIM is
307 * done. Otherwise:
308 * (1) "~/path" to mean path under the running user's home directory;
309 * (2) "~user/path" to mean path under named user's home directory;
310 * (3) "relative/path" to mean cwd relative directory; or
311 * (4) "/absolute/path" to mean absolute directory.
312 *
 * Unless "strict" is given, we try stat() on "%s/.git", "%s",
 * "%s.git/.git", "%s.git" in this order. The first one that is a regular
 * file or a valid git directory is what we try.
316 *
317 * Second, we try chdir() to that. Upon failure, we return NULL.
318 *
319 * Then, we try if the current directory is a valid git repository.
320 * Upon failure, we return NULL.
321 *
322 * If all goes well, we return the directory we used to chdir() (but
323 * before ~user is expanded), avoiding getcwd() resolving symbolic
324 * links. User relative paths are also returned as they are given,
325 * except DWIM suffixing.
326 */
327const char *enter_repo(const char *path, int strict)
328{
329 static char used_path[PATH_MAX];
330 static char validated_path[PATH_MAX];
331
332 if (!path)
333 return NULL;
334
335 if (!strict) {
336 static const char *suffix[] = {
337 "/.git", "", ".git/.git", ".git", NULL,
338 };
339 const char *gitfile;
340 int len = strlen(path);
341 int i;
342 while ((1 < len) && (path[len-1] == '/'))
343 len--;
344
345 if (PATH_MAX <= len)
346 return NULL;
347 strncpy(used_path, path, len); used_path[len] = 0 ;
348 strcpy(validated_path, used_path);
349
350 if (used_path[0] == '~') {
351 char *newpath = expand_user_path(used_path);
352 if (!newpath || (PATH_MAX - 10 < strlen(newpath))) {
353 free(newpath);
354 return NULL;
355 }
356 /*
357 * Copy back into the static buffer. A pity
358 * since newpath was not bounded, but other
359 * branches of the if are limited by PATH_MAX
360 * anyway.
361 */
362 strcpy(used_path, newpath); free(newpath);
363 }
364 else if (PATH_MAX - 10 < len)
365 return NULL;
366 len = strlen(used_path);
367 for (i = 0; suffix[i]; i++) {
368 struct stat st;
369 strcpy(used_path + len, suffix[i]);
370 if (!stat(used_path, &st) &&
371 (S_ISREG(st.st_mode) ||
372 (S_ISDIR(st.st_mode) && is_git_directory(used_path)))) {
373 strcat(validated_path, suffix[i]);
374 break;
375 }
376 }
377 if (!suffix[i])
378 return NULL;
379 gitfile = read_gitfile(used_path) ;
380 if (gitfile)
381 strcpy(used_path, gitfile);
382 if (chdir(used_path))
383 return NULL;
384 path = validated_path;
385 }
386 else if (chdir(path))
387 return NULL;
388
389 if (access("objects", X_OK) == 0 && access("refs", X_OK) == 0 &&
390 validate_headref("HEAD") == 0) {
391 set_git_dir(".");
392 check_repository_format();
393 return path;
394 }
395
396 return NULL;
397}
398
399static int calc_shared_perm(int mode)
400{
401 int tweak;
402
403 if (shared_repository < 0)
404 tweak = -shared_repository;
405 else
406 tweak = shared_repository;
407
408 if (!(mode & S_IWUSR))
409 tweak &= ~0222;
410 if (mode & S_IXUSR)
411 /* Copy read bits to execute bits */
412 tweak |= (tweak & 0444) >> 2;
413 if (shared_repository < 0)
414 mode = (mode & ~0777) | tweak;
415 else
416 mode |= tweak;
417
418 return mode;
419}
420
421
422int adjust_shared_perm(const char *path)
423{
424 int old_mode, new_mode;
425
426 if (!shared_repository)
427 return 0;
428 if (get_st_mode_bits(path, &old_mode) < 0)
429 return -1;
430
431 new_mode = calc_shared_perm(old_mode);
432 if (S_ISDIR(old_mode)) {
433 /* Copy read bits to execute bits */
434 new_mode |= (new_mode & 0444) >> 2;
435 new_mode |= FORCE_DIR_SET_GID;
436 }
437
438 if (((old_mode ^ new_mode) & ~S_IFMT) &&
439 chmod(path, (new_mode & ~S_IFMT)) < 0)
440 return -2;
441 return 0;
442}
443
/*
 * Give path as relative to prefix.
 *
 * Returns "./" when "in" is NULL or empty, or when all of "prefix" has
 * been consumed and nothing of "in" remains after the common leading
 * part.  Returns "in" itself, or a pointer into it, when "prefix" is
 * NULL, empty, or a leading directory of "in".  Otherwise a result
 * starting with one or more "../" is built in sb and sb->buf is
 * returned.
 *
 * The strbuf may or may not be used, so do not assume it contains the
 * returned path.
 */
const char *relative_path(const char *in, const char *prefix,
			  struct strbuf *sb)
{
	int in_len = in ? strlen(in) : 0;
	int prefix_len = prefix ? strlen(prefix) : 0;
	/* Offsets just past the last directory separator both paths share. */
	int in_off = 0;
	int prefix_off = 0;
	/* i walks "prefix", j walks "in". */
	int i = 0, j = 0;

	if (!in_len)
		return "./";
	else if (!prefix_len)
		return in;

	/*
	 * Advance over the common leading part; runs of separators are
	 * skipped independently in each string so "a//b" matches "a/b".
	 */
	while (i < prefix_len && j < in_len && prefix[i] == in[j]) {
		if (is_dir_sep(prefix[i])) {
			while (is_dir_sep(prefix[i]))
				i++;
			while (is_dir_sep(in[j]))
				j++;
			prefix_off = i;
			in_off = j;
		} else {
			i++;
			j++;
		}
	}

	if (
	    /* "prefix" seems like prefix of "in" */
	    i >= prefix_len &&
	    /*
	     * but "/foo" is not a prefix of "/foobar"
	     * (i.e. "prefix" does not end with '/')
	     */
	    prefix_off < prefix_len) {
		if (j >= in_len) {
			/* in="/a/b", prefix="/a/b" */
			in_off = in_len;
		} else if (is_dir_sep(in[j])) {
			/* in="/a/b/c", prefix="/a/b" */
			while (is_dir_sep(in[j]))
				j++;
			in_off = j;
		} else {
			/* in="/a/bbb/c", prefix="/a/b" */
			i = prefix_off;
		}
	} else if (
		   /* "in" is shorter than "prefix" */
		   j >= in_len &&
		   /* "in" does not end with '/' */
		   in_off < in_len) {
		if (is_dir_sep(prefix[i])) {
			/* in="/a/b", prefix="/a/b/c/" */
			while (is_dir_sep(prefix[i]))
				i++;
			in_off = in_len;
		}
	}
	/* Drop the part of "in" that is shared with "prefix". */
	in += in_off;
	in_len -= in_off;

	/* All of "prefix" was consumed: no "../" is needed. */
	if (i >= prefix_len) {
		if (!in_len)
			return "./";
		else
			return in;
	}

	strbuf_reset(sb);
	strbuf_grow(sb, in_len);

	/* One "../" per separator run left in the unmatched part of "prefix". */
	while (i < prefix_len) {
		if (is_dir_sep(prefix[i])) {
			strbuf_addstr(sb, "../");
			while (is_dir_sep(prefix[i]))
				i++;
			continue;
		}
		i++;
	}
	/* A final component without a trailing separator needs one more. */
	if (!is_dir_sep(prefix[prefix_len - 1]))
		strbuf_addstr(sb, "../");

	strbuf_addstr(sb, in);

	return sb->buf;
}
539
/*
 * It is okay if dst == src, but they should not overlap otherwise.
 *
 * Performs the following normalizations on src, storing the result in dst:
 * - Ensures that components are separated by '/' (Windows only)
 * - Squashes sequences of '/'.
 * - Removes "." components.
 * - Removes ".." components, and the components that precede them.
 * Returns failure (non-zero) if a ".." component appears as first path
 * component anytime during the normalization. Otherwise, returns success (0).
 *
 * Note that this function is purely textual. It does not follow symlinks,
 * verify the existence of the path, or make any system calls.
 */
int normalize_path_copy(char *dst, const char *src)
{
	/* Start of the output after any DOS drive prefix; ".." may not go above it. */
	char *dst0;

	if (has_dos_drive_prefix(src)) {
		/* Copy the two-character drive prefix verbatim. */
		*dst++ = *src++;
		*dst++ = *src++;
	}
	dst0 = dst;

	if (is_dir_sep(*src)) {
		/* Absolute path: emit one '/' for the whole run of separators. */
		*dst++ = '/';
		while (is_dir_sep(*src))
			src++;
	}

	/* Each iteration handles one path component starting at src. */
	for (;;) {
		char c = *src;

		/*
		 * A path component that begins with . could be
		 * special:
		 * (1) "." and ends      -- ignore and terminate.
		 * (2) "./"              -- ignore them, eat slash and continue.
		 * (3) ".." and ends     -- strip one and terminate.
		 * (4) "../"             -- strip one, eat slash and continue.
		 */
		if (c == '.') {
			if (!src[1]) {
				/* (1) */
				src++;
			} else if (is_dir_sep(src[1])) {
				/* (2) */
				src += 2;
				while (is_dir_sep(*src))
					src++;
				continue;
			} else if (src[1] == '.') {
				if (!src[2]) {
					/* (3) */
					src += 2;
					goto up_one;
				} else if (is_dir_sep(src[2])) {
					/* (4) */
					src += 3;
					while (is_dir_sep(*src))
						src++;
					goto up_one;
				}
			}
		}

		/* copy up to the next '/', and eat all '/' */
		while ((c = *src++) != '\0' && !is_dir_sep(c))
			*dst++ = c;
		if (is_dir_sep(c)) {
			*dst++ = '/';
			while (is_dir_sep(c))
				c = *src++;
			/* The loop above read one character too far; step back onto it. */
			src--;
		} else if (!c)
			break;
		continue;

	up_one:
		/*
		 * dst0..dst is prefix portion, and dst[-1] is '/';
		 * go up one level.
		 */
		dst--;	/* go to trailing '/' */
		/* Nothing left to strip: ".." would climb above the start. */
		if (dst <= dst0)
			return -1;
		/* Windows: dst[-1] cannot be backslash anymore */
		while (dst0 < dst && dst[-1] != '/')
			dst--;
	}
	*dst = '\0';
	return 0;
}
633
634/*
635 * path = Canonical absolute path
636 * prefixes = string_list containing normalized, absolute paths without
637 * trailing slashes (except for the root directory, which is denoted by "/").
638 *
639 * Determines, for each path in prefixes, whether the "prefix"
640 * is an ancestor directory of path. Returns the length of the longest
641 * ancestor directory, excluding any trailing slashes, or -1 if no prefix
642 * is an ancestor. (Note that this means 0 is returned if prefixes is
643 * ["/"].) "/foo" is not considered an ancestor of "/foobar". Directories
644 * are not considered to be their own ancestors. path must be in a
645 * canonical form: empty components, or "." or ".." components are not
646 * allowed.
647 */
648int longest_ancestor_length(const char *path, struct string_list *prefixes)
649{
650 int i, max_len = -1;
651
652 if (!strcmp(path, "/"))
653 return -1;
654
655 for (i = 0; i < prefixes->nr; i++) {
656 const char *ceil = prefixes->items[i].string;
657 int len = strlen(ceil);
658
659 if (len == 1 && ceil[0] == '/')
660 len = 0; /* root matches anything, with length 0 */
661 else if (!strncmp(path, ceil, len) && path[len] == '/')
662 ; /* match of length len */
663 else
664 continue; /* no match */
665
666 if (len > max_len)
667 max_len = len;
668 }
669
670 return max_len;
671}
672
/*
 * Return "len" reduced so that path[0..len) no longer ends in any
 * directory separator; "path" itself is not modified.
 */
static inline int chomp_trailing_dir_sep(const char *path, int len)
{
	for (; len && is_dir_sep(path[len - 1]); len--)
		; /* nothing */
	return len;
}
680
/*
 * Match "suffix" against the end of "path", one whole path component
 * at a time, treating any run of directory separators as equal to any
 * other run.
 *
 * On a match, returns an xstrndup() copy of the part of "path" before
 * the suffix, without trailing directory separators.  Returns NULL
 * when "path" does not end with "suffix".
 */
char *strip_path_suffix(const char *path, const char *suffix)
{
	int p = strlen(path);
	int s = strlen(suffix);

	/* Walk both strings backwards until the suffix is used up. */
	while (s) {
		if (!p)
			return NULL;

		if (!is_dir_sep(path[p - 1])) {
			/* Ordinary character: must match exactly. */
			p--;
			s--;
			if (path[p] != suffix[s])
				return NULL;
			continue;
		}

		/* Separator in path: suffix must have one here too. */
		if (!is_dir_sep(suffix[s - 1]))
			return NULL;
		p = chomp_trailing_dir_sep(path, p);
		s = chomp_trailing_dir_sep(suffix, s);
	}

	/* The suffix must begin on a component boundary of path. */
	if (p && !is_dir_sep(path[p - 1]))
		return NULL;
	return xstrndup(path, chomp_trailing_dir_sep(path, p));
}
708
/*
 * Paranoia check on a path handed to the daemon: since enter_repo()
 * does no getcwd()-based canonicalization, refuse anything that could
 * alias another path textually.
 *
 * Returns -1 when "p" is NULL, does not start with '/' or '~', or
 * contains an empty, "." or ".." component ("//", "/./", "/../", or a
 * trailing "/." or "/.."); returns 0 otherwise.
 */
int daemon_avoid_alias(const char *p)
{
	/*
	 * after_slash is set right after a '/' and stays set while only
	 * dots follow; dots counts those dots.
	 */
	int after_slash = 1;
	int dots = 0;

	if (!p)
		return -1;
	if (*p != '/' && *p != '~')
		return -1;

	for (p++; ; p++) {
		const char ch = *p;

		if (!after_slash) {
			/* Inside an ordinary component. */
			if (ch == '\0')
				return 0;
			if (ch == '/') {
				after_slash = 1;
				dots = 0;
			}
			continue;
		}

		switch (ch) {
		case '.':
			dots++;
			break;
		case '/':
			/* reject //, /./ and /../ */
			if (dots < 3)
				return -1;
			dots = 0;
			break;
		case '\0':
			/* reject /.$ and /..$ */
			if (0 < dots && dots < 3)
				return -1;
			return 0;
		default:
			after_slash = 0;
			dots = 0;
			break;
		}
	}
}
755
/*
 * Return the offset of the first path component of "path": the
 * length of an optional DOS drive prefix (2) plus one if a directory
 * separator follows at that position.
 */
int offset_1st_component(const char *path)
{
	int skip = 0;

	if (has_dos_drive_prefix(path))
		skip = 2;
	return skip + is_dir_sep(path[skip]);
}