/* daemon.c on commit "Merge early parts of branch 'ls/am'" (69c18d8) */
   1#include <signal.h>
   2#include <sys/wait.h>
   3#include <sys/socket.h>
   4#include <sys/time.h>
   5#include <sys/poll.h>
   6#include <netdb.h>
   7#include <netinet/in.h>
   8#include <arpa/inet.h>
   9#include <syslog.h>
  10#include "pkt-line.h"
  11#include "cache.h"
  12#include "exec_cmd.h"
  13
  14static int log_syslog;
  15static int verbose;
  16static int reuseaddr;
  17
  18static const char daemon_usage[] =
  19"git-daemon [--verbose] [--syslog] [--inetd | --port=n] [--export-all]\n"
  20"           [--timeout=n] [--init-timeout=n] [--strict-paths]\n"
  21"           [--base-path=path] [--user-path | --user-path=path]\n"
  22"           [--reuseaddr] [directory...]";
  23
  24/* List of acceptable pathname prefixes */
  25static char **ok_paths = NULL;
  26static int strict_paths = 0;
  27
  28/* If this is set, git-daemon-export-ok is not required */
  29static int export_all_trees = 0;
  30
  31/* Take all paths relative to this one if non-NULL */
  32static char *base_path = NULL;
  33
  34/* If defined, ~user notation is allowed and the string is inserted
  35 * after ~user/.  E.g. a request to git://host/~alice/frotz would
  36 * go to /home/alice/pub_git/frotz with --user-path=pub_git.
  37 */
  38static char *user_path = NULL;
  39
  40/* Timeout, and initial timeout */
  41static unsigned int timeout = 0;
  42static unsigned int init_timeout = 0;
  43
  44static void logreport(int priority, const char *err, va_list params)
  45{
  46        /* We should do a single write so that it is atomic and output
  47         * of several processes do not get intermingled. */
  48        char buf[1024];
  49        int buflen;
  50        int maxlen, msglen;
  51
  52        /* sizeof(buf) should be big enough for "[pid] \n" */
  53        buflen = snprintf(buf, sizeof(buf), "[%ld] ", (long) getpid());
  54
  55        maxlen = sizeof(buf) - buflen - 1; /* -1 for our own LF */
  56        msglen = vsnprintf(buf + buflen, maxlen, err, params);
  57
  58        if (log_syslog) {
  59                syslog(priority, "%s", buf);
  60                return;
  61        }
  62
  63        /* maxlen counted our own LF but also counts space given to
  64         * vsnprintf for the terminating NUL.  We want to make sure that
  65         * we have space for our own LF and NUL after the "meat" of the
  66         * message, so truncate it at maxlen - 1.
  67         */
  68        if (msglen > maxlen - 1)
  69                msglen = maxlen - 1;
  70        else if (msglen < 0)
  71                msglen = 0; /* Protect against weird return values. */
  72        buflen += msglen;
  73
  74        buf[buflen++] = '\n';
  75        buf[buflen] = '\0';
  76
  77        write(2, buf, buflen);
  78}
  79
  80static void logerror(const char *err, ...)
  81{
  82        va_list params;
  83        va_start(params, err);
  84        logreport(LOG_ERR, err, params);
  85        va_end(params);
  86}
  87
  88static void loginfo(const char *err, ...)
  89{
  90        va_list params;
  91        if (!verbose)
  92                return;
  93        va_start(params, err);
  94        logreport(LOG_INFO, err, params);
  95        va_end(params);
  96}
  97
  98static int avoid_alias(char *p)
  99{
 100        int sl, ndot;
 101
 102        /* 
 103         * This resurrects the belts and suspenders paranoia check by HPA
 104         * done in <435560F7.4080006@zytor.com> thread, now enter_repo()
 105         * does not do getcwd() based path canonicalizations.
 106         *
 107         * sl becomes true immediately after seeing '/' and continues to
 108         * be true as long as dots continue after that without intervening
 109         * non-dot character.
 110         */
 111        if (!p || (*p != '/' && *p != '~'))
 112                return -1;
 113        sl = 1; ndot = 0;
 114        p++;
 115
 116        while (1) {
 117                char ch = *p++;
 118                if (sl) {
 119                        if (ch == '.')
 120                                ndot++;
 121                        else if (ch == '/') {
 122                                if (ndot < 3)
 123                                        /* reject //, /./ and /../ */
 124                                        return -1;
 125                                ndot = 0;
 126                        }
 127                        else if (ch == 0) {
 128                                if (0 < ndot && ndot < 3)
 129                                        /* reject /.$ and /..$ */
 130                                        return -1;
 131                                return 0;
 132                        }
 133                        else
 134                                sl = ndot = 0;
 135                }
 136                else if (ch == 0)
 137                        return 0;
 138                else if (ch == '/') {
 139                        sl = 1;
 140                        ndot = 0;
 141                }
 142        }
 143}
 144
 145static char *path_ok(char *dir)
 146{
 147        static char rpath[PATH_MAX];
 148        char *path;
 149
 150        if (avoid_alias(dir)) {
 151                logerror("'%s': aliased", dir);
 152                return NULL;
 153        }
 154
 155        if (*dir == '~') {
 156                if (!user_path) {
 157                        logerror("'%s': User-path not allowed", dir);
 158                        return NULL;
 159                }
 160                if (*user_path) {
 161                        /* Got either "~alice" or "~alice/foo";
 162                         * rewrite them to "~alice/%s" or
 163                         * "~alice/%s/foo".
 164                         */
 165                        int namlen, restlen = strlen(dir);
 166                        char *slash = strchr(dir, '/');
 167                        if (!slash)
 168                                slash = dir + restlen;
 169                        namlen = slash - dir;
 170                        restlen -= namlen;
 171                        loginfo("userpath <%s>, request <%s>, namlen %d, restlen %d, slash <%s>", user_path, dir, namlen, restlen, slash);
 172                        snprintf(rpath, PATH_MAX, "%.*s/%s%.*s",
 173                                 namlen, dir, user_path, restlen, slash);
 174                        dir = rpath;
 175                }
 176        }
 177        else if (base_path) {
 178                if (*dir != '/') {
 179                        /* Allow only absolute */
 180                        logerror("'%s': Non-absolute path denied (base-path active)", dir);
 181                        return NULL;
 182                }
 183                else {
 184                        snprintf(rpath, PATH_MAX, "%s%s", base_path, dir);
 185                        dir = rpath;
 186                }
 187        }
 188
 189        path = enter_repo(dir, strict_paths);
 190
 191        if (!path) {
 192                logerror("'%s': unable to chdir or not a git archive", dir);
 193                return NULL;
 194        }
 195
 196        if ( ok_paths && *ok_paths ) {
 197                char **pp;
 198                int pathlen = strlen(path);
 199
 200                /* The validation is done on the paths after enter_repo
 201                 * appends optional {.git,.git/.git} and friends, but 
 202                 * it does not use getcwd().  So if your /pub is
 203                 * a symlink to /mnt/pub, you can whitelist /pub and
 204                 * do not have to say /mnt/pub.
 205                 * Do not say /pub/.
 206                 */
 207                for ( pp = ok_paths ; *pp ; pp++ ) {
 208                        int len = strlen(*pp);
 209                        if (len <= pathlen &&
 210                            !memcmp(*pp, path, len) &&
 211                            (path[len] == '\0' ||
 212                             (!strict_paths && path[len] == '/')))
 213                                return path;
 214                }
 215        }
 216        else {
 217                /* be backwards compatible */
 218                if (!strict_paths)
 219                        return path;
 220        }
 221
 222        logerror("'%s': not in whitelist", path);
 223        return NULL;            /* Fallthrough. Deny by default */
 224}
 225
 226static int upload(char *dir)
 227{
 228        /* Timeout as string */
 229        char timeout_buf[64];
 230        const char *path;
 231
 232        loginfo("Request for '%s'", dir);
 233
 234        if (!(path = path_ok(dir)))
 235                return -1;
 236
 237        /*
 238         * Security on the cheap.
 239         *
 240         * We want a readable HEAD, usable "objects" directory, and
 241         * a "git-daemon-export-ok" flag that says that the other side
 242         * is ok with us doing this.
 243         *
 244         * path_ok() uses enter_repo() and does whitelist checking.
 245         * We only need to make sure the repository is exported.
 246         */
 247
 248        if (!export_all_trees && access("git-daemon-export-ok", F_OK)) {
 249                logerror("'%s': repository not exported.", path);
 250                errno = EACCES;
 251                return -1;
 252        }
 253
 254        /*
 255         * We'll ignore SIGTERM from now on, we have a
 256         * good client.
 257         */
 258        signal(SIGTERM, SIG_IGN);
 259
 260        snprintf(timeout_buf, sizeof timeout_buf, "--timeout=%u", timeout);
 261
 262        /* git-upload-pack only ever reads stuff, so this is safe */
 263        execl_git_cmd("upload-pack", "--strict", timeout_buf, ".", NULL);
 264        return -1;
 265}
 266
 267static int execute(void)
 268{
 269        static char line[1000];
 270        int pktlen, len;
 271
 272        alarm(init_timeout ? init_timeout : timeout);
 273        pktlen = packet_read_line(0, line, sizeof(line));
 274        alarm(0);
 275
 276        len = strlen(line);
 277        if (pktlen != len)
 278                loginfo("Extended attributes (%d bytes) exist <%.*s>",
 279                        (int) pktlen - len,
 280                        (int) pktlen - len, line + len + 1);
 281        if (len && line[len-1] == '\n')
 282                line[--len] = 0;
 283
 284        if (!strncmp("git-upload-pack ", line, 16))
 285                return upload(line+16);
 286
 287        logerror("Protocol error: '%s'", line);
 288        return -1;
 289}
 290
 291
 292/*
 293 * We count spawned/reaped separately, just to avoid any
 294 * races when updating them from signals. The SIGCHLD handler
 295 * will only update children_reaped, and the fork logic will
 296 * only update children_spawned.
 297 *
 298 * MAX_CHILDREN should be a power-of-two to make the modulus
 299 * operation cheap. It should also be at least twice
 300 * the maximum number of connections we will ever allow.
 301 */
 302#define MAX_CHILDREN 128
 303
 304static int max_connections = 25;
 305
 306/* These are updated by the signal handler */
 307static volatile unsigned int children_reaped = 0;
 308static pid_t dead_child[MAX_CHILDREN];
 309
 310/* These are updated by the main loop */
 311static unsigned int children_spawned = 0;
 312static unsigned int children_deleted = 0;
 313
 314static struct child {
 315        pid_t pid;
 316        int addrlen;
 317        struct sockaddr_storage address;
 318} live_child[MAX_CHILDREN];
 319
 320static void add_child(int idx, pid_t pid, struct sockaddr *addr, int addrlen)
 321{
 322        live_child[idx].pid = pid;
 323        live_child[idx].addrlen = addrlen;
 324        memcpy(&live_child[idx].address, addr, addrlen);
 325}
 326
 327/*
 328 * Walk from "deleted" to "spawned", and remove child "pid".
 329 *
 330 * We move everything up by one, since the new "deleted" will
 331 * be one higher.
 332 */
 333static void remove_child(pid_t pid, unsigned deleted, unsigned spawned)
 334{
 335        struct child n;
 336
 337        deleted %= MAX_CHILDREN;
 338        spawned %= MAX_CHILDREN;
 339        if (live_child[deleted].pid == pid) {
 340                live_child[deleted].pid = -1;
 341                return;
 342        }
 343        n = live_child[deleted];
 344        for (;;) {
 345                struct child m;
 346                deleted = (deleted + 1) % MAX_CHILDREN;
 347                if (deleted == spawned)
 348                        die("could not find dead child %d\n", pid);
 349                m = live_child[deleted];
 350                live_child[deleted] = n;
 351                if (m.pid == pid)
 352                        return;
 353                n = m;
 354        }
 355}
 356
 357/*
 358 * This gets called if the number of connections grows
 359 * past "max_connections".
 360 *
 361 * We _should_ start off by searching for connections
 362 * from the same IP, and if there is some address wth
 363 * multiple connections, we should kill that first.
 364 *
 365 * As it is, we just "randomly" kill 25% of the connections,
 366 * and our pseudo-random generator sucks too. I have no
 367 * shame.
 368 *
 369 * Really, this is just a place-holder for a _real_ algorithm.
 370 */
 371static void kill_some_children(int signo, unsigned start, unsigned stop)
 372{
 373        start %= MAX_CHILDREN;
 374        stop %= MAX_CHILDREN;
 375        while (start != stop) {
 376                if (!(start & 3))
 377                        kill(live_child[start].pid, signo);
 378                start = (start + 1) % MAX_CHILDREN;
 379        }
 380}
 381
 382static void check_max_connections(void)
 383{
 384        for (;;) {
 385                int active;
 386                unsigned spawned, reaped, deleted;
 387
 388                spawned = children_spawned;
 389                reaped = children_reaped;
 390                deleted = children_deleted;
 391
 392                while (deleted < reaped) {
 393                        pid_t pid = dead_child[deleted % MAX_CHILDREN];
 394                        remove_child(pid, deleted, spawned);
 395                        deleted++;
 396                }
 397                children_deleted = deleted;
 398
 399                active = spawned - deleted;
 400                if (active <= max_connections)
 401                        break;
 402
 403                /* Kill some unstarted connections with SIGTERM */
 404                kill_some_children(SIGTERM, deleted, spawned);
 405                if (active <= max_connections << 1)
 406                        break;
 407
 408                /* If the SIGTERM thing isn't helping use SIGKILL */
 409                kill_some_children(SIGKILL, deleted, spawned);
 410                sleep(1);
 411        }
 412}
 413
 414static void handle(int incoming, struct sockaddr *addr, int addrlen)
 415{
 416        pid_t pid = fork();
 417        char addrbuf[256] = "";
 418        int port = -1;
 419
 420        if (pid) {
 421                unsigned idx;
 422
 423                close(incoming);
 424                if (pid < 0)
 425                        return;
 426
 427                idx = children_spawned % MAX_CHILDREN;
 428                children_spawned++;
 429                add_child(idx, pid, addr, addrlen);
 430
 431                check_max_connections();
 432                return;
 433        }
 434
 435        dup2(incoming, 0);
 436        dup2(incoming, 1);
 437        close(incoming);
 438
 439        if (addr->sa_family == AF_INET) {
 440                struct sockaddr_in *sin_addr = (void *) addr;
 441                inet_ntop(AF_INET, &sin_addr->sin_addr, addrbuf, sizeof(addrbuf));
 442                port = sin_addr->sin_port;
 443
 444#ifndef NO_IPV6
 445        } else if (addr->sa_family == AF_INET6) {
 446                struct sockaddr_in6 *sin6_addr = (void *) addr;
 447
 448                char *buf = addrbuf;
 449                *buf++ = '['; *buf = '\0'; /* stpcpy() is cool */
 450                inet_ntop(AF_INET6, &sin6_addr->sin6_addr, buf, sizeof(addrbuf) - 1);
 451                strcat(buf, "]");
 452
 453                port = sin6_addr->sin6_port;
 454#endif
 455        }
 456        loginfo("Connection from %s:%d", addrbuf, port);
 457
 458        exit(execute());
 459}
 460
 461static void child_handler(int signo)
 462{
 463        for (;;) {
 464                int status;
 465                pid_t pid = waitpid(-1, &status, WNOHANG);
 466
 467                if (pid > 0) {
 468                        unsigned reaped = children_reaped;
 469                        dead_child[reaped % MAX_CHILDREN] = pid;
 470                        children_reaped = reaped + 1;
 471                        /* XXX: Custom logging, since we don't wanna getpid() */
 472                        if (verbose) {
 473                                char *dead = "";
 474                                if (!WIFEXITED(status) || WEXITSTATUS(status) > 0)
 475                                        dead = " (with error)";
 476                                if (log_syslog)
 477                                        syslog(LOG_INFO, "[%d] Disconnected%s", pid, dead);
 478                                else
 479                                        fprintf(stderr, "[%d] Disconnected%s\n", pid, dead);
 480                        }
 481                        continue;
 482                }
 483                break;
 484        }
 485}
 486
 487static int set_reuse_addr(int sockfd)
 488{
 489        int on = 1;
 490
 491        if (!reuseaddr)
 492                return 0;
 493        return setsockopt(sockfd, SOL_SOCKET, SO_REUSEADDR,
 494                          &on, sizeof(on));
 495}
 496
 497#ifndef NO_IPV6
 498
 499static int socksetup(int port, int **socklist_p)
 500{
 501        int socknum = 0, *socklist = NULL;
 502        int maxfd = -1;
 503        char pbuf[NI_MAXSERV];
 504
 505        struct addrinfo hints, *ai0, *ai;
 506        int gai;
 507
 508        sprintf(pbuf, "%d", port);
 509        memset(&hints, 0, sizeof(hints));
 510        hints.ai_family = AF_UNSPEC;
 511        hints.ai_socktype = SOCK_STREAM;
 512        hints.ai_protocol = IPPROTO_TCP;
 513        hints.ai_flags = AI_PASSIVE;
 514
 515        gai = getaddrinfo(NULL, pbuf, &hints, &ai0);
 516        if (gai)
 517                die("getaddrinfo() failed: %s\n", gai_strerror(gai));
 518
 519        for (ai = ai0; ai; ai = ai->ai_next) {
 520                int sockfd;
 521                int *newlist;
 522
 523                sockfd = socket(ai->ai_family, ai->ai_socktype, ai->ai_protocol);
 524                if (sockfd < 0)
 525                        continue;
 526                if (sockfd >= FD_SETSIZE) {
 527                        error("too large socket descriptor.");
 528                        close(sockfd);
 529                        continue;
 530                }
 531
 532#ifdef IPV6_V6ONLY
 533                if (ai->ai_family == AF_INET6) {
 534                        int on = 1;
 535                        setsockopt(sockfd, IPPROTO_IPV6, IPV6_V6ONLY,
 536                                   &on, sizeof(on));
 537                        /* Note: error is not fatal */
 538                }
 539#endif
 540
 541                if (set_reuse_addr(sockfd)) {
 542                        close(sockfd);
 543                        continue;
 544                }
 545
 546                if (bind(sockfd, ai->ai_addr, ai->ai_addrlen) < 0) {
 547                        close(sockfd);
 548                        continue;       /* not fatal */
 549                }
 550                if (listen(sockfd, 5) < 0) {
 551                        close(sockfd);
 552                        continue;       /* not fatal */
 553                }
 554
 555                newlist = realloc(socklist, sizeof(int) * (socknum + 1));
 556                if (!newlist)
 557                        die("memory allocation failed: %s", strerror(errno));
 558
 559                socklist = newlist;
 560                socklist[socknum++] = sockfd;
 561
 562                if (maxfd < sockfd)
 563                        maxfd = sockfd;
 564        }
 565
 566        freeaddrinfo(ai0);
 567
 568        *socklist_p = socklist;
 569        return socknum;
 570}
 571
 572#else /* NO_IPV6 */
 573
 574static int socksetup(int port, int **socklist_p)
 575{
 576        struct sockaddr_in sin;
 577        int sockfd;
 578
 579        sockfd = socket(AF_INET, SOCK_STREAM, 0);
 580        if (sockfd < 0)
 581                return 0;
 582
 583        memset(&sin, 0, sizeof sin);
 584        sin.sin_family = AF_INET;
 585        sin.sin_addr.s_addr = htonl(INADDR_ANY);
 586        sin.sin_port = htons(port);
 587
 588        if (set_reuse_addr(sockfd)) {
 589                close(sockfd);
 590                return 0;
 591        }
 592
 593        if ( bind(sockfd, (struct sockaddr *)&sin, sizeof sin) < 0 ) {
 594                close(sockfd);
 595                return 0;
 596        }
 597
 598        if (listen(sockfd, 5) < 0) {
 599                close(sockfd);
 600                return 0;
 601        }
 602
 603        *socklist_p = xmalloc(sizeof(int));
 604        **socklist_p = sockfd;
 605        return 1;
 606}
 607
 608#endif
 609
 610static int service_loop(int socknum, int *socklist)
 611{
 612        struct pollfd *pfd;
 613        int i;
 614
 615        pfd = xcalloc(socknum, sizeof(struct pollfd));
 616
 617        for (i = 0; i < socknum; i++) {
 618                pfd[i].fd = socklist[i];
 619                pfd[i].events = POLLIN;
 620        }
 621
 622        signal(SIGCHLD, child_handler);
 623
 624        for (;;) {
 625                int i;
 626
 627                if (poll(pfd, socknum, -1) < 0) {
 628                        if (errno != EINTR) {
 629                                error("poll failed, resuming: %s",
 630                                      strerror(errno));
 631                                sleep(1);
 632                        }
 633                        continue;
 634                }
 635
 636                for (i = 0; i < socknum; i++) {
 637                        if (pfd[i].revents & POLLIN) {
 638                                struct sockaddr_storage ss;
 639                                unsigned int sslen = sizeof(ss);
 640                                int incoming = accept(pfd[i].fd, (struct sockaddr *)&ss, &sslen);
 641                                if (incoming < 0) {
 642                                        switch (errno) {
 643                                        case EAGAIN:
 644                                        case EINTR:
 645                                        case ECONNABORTED:
 646                                                continue;
 647                                        default:
 648                                                die("accept returned %s", strerror(errno));
 649                                        }
 650                                }
 651                                handle(incoming, (struct sockaddr *)&ss, sslen);
 652                        }
 653                }
 654        }
 655}
 656
 657static int serve(int port)
 658{
 659        int socknum, *socklist;
 660
 661        socknum = socksetup(port, &socklist);
 662        if (socknum == 0)
 663                die("unable to allocate any listen sockets on port %u", port);
 664
 665        return service_loop(socknum, socklist);
 666}
 667
 668int main(int argc, char **argv)
 669{
 670        int port = DEFAULT_GIT_PORT;
 671        int inetd_mode = 0;
 672        int i;
 673
 674        for (i = 1; i < argc; i++) {
 675                char *arg = argv[i];
 676
 677                if (!strncmp(arg, "--port=", 7)) {
 678                        char *end;
 679                        unsigned long n;
 680                        n = strtoul(arg+7, &end, 0);
 681                        if (arg[7] && !*end) {
 682                                port = n;
 683                                continue;
 684                        }
 685                }
 686                if (!strcmp(arg, "--inetd")) {
 687                        inetd_mode = 1;
 688                        log_syslog = 1;
 689                        continue;
 690                }
 691                if (!strcmp(arg, "--verbose")) {
 692                        verbose = 1;
 693                        continue;
 694                }
 695                if (!strcmp(arg, "--syslog")) {
 696                        log_syslog = 1;
 697                        continue;
 698                }
 699                if (!strcmp(arg, "--export-all")) {
 700                        export_all_trees = 1;
 701                        continue;
 702                }
 703                if (!strncmp(arg, "--timeout=", 10)) {
 704                        timeout = atoi(arg+10);
 705                        continue;
 706                }
 707                if (!strncmp(arg, "--init-timeout=", 15)) {
 708                        init_timeout = atoi(arg+15);
 709                        continue;
 710                }
 711                if (!strcmp(arg, "--strict-paths")) {
 712                        strict_paths = 1;
 713                        continue;
 714                }
 715                if (!strncmp(arg, "--base-path=", 12)) {
 716                        base_path = arg+12;
 717                        continue;
 718                }
 719                if (!strcmp(arg, "--reuseaddr")) {
 720                        reuseaddr = 1;
 721                        continue;
 722                }
 723                if (!strcmp(arg, "--user-path")) {
 724                        user_path = "";
 725                        continue;
 726                }
 727                if (!strncmp(arg, "--user-path=", 12)) {
 728                        user_path = arg + 12;
 729                        continue;
 730                }
 731                if (!strcmp(arg, "--")) {
 732                        ok_paths = &argv[i+1];
 733                        break;
 734                } else if (arg[0] != '-') {
 735                        ok_paths = &argv[i];
 736                        break;
 737                }
 738
 739                usage(daemon_usage);
 740        }
 741
 742        if (log_syslog)
 743                openlog("git-daemon", 0, LOG_DAEMON);
 744
 745        if (strict_paths && (!ok_paths || !*ok_paths)) {
 746                if (!inetd_mode)
 747                        die("git-daemon: option --strict-paths requires a whitelist");
 748
 749                logerror("option --strict-paths requires a whitelist");
 750                exit (1);
 751        }
 752
 753        if (inetd_mode) {
 754                fclose(stderr); //FIXME: workaround
 755                return execute();
 756        }
 757
 758        return serve(port);
 759}