c81b0a240a38b57a9bbd2586889304bef8f5cbbf
   1/*
   2 * apply.c
   3 *
   4 * Copyright (C) Linus Torvalds, 2005
   5 *
   6 * This applies patches on top of some (arbitrary) version of the SCM.
   7 *
   8 * NOTE! It does all its work in the index file, and only cares about
   9 * the files in the working directory if you tell it to "merge" the
  10 * patch apply.
  11 *
  12 * Even when merging it always takes the source from the index, and
  13 * uses the working tree as a "branch" for a 3-way merge.
  14 */
  15#include <ctype.h>
  16
  17#include "cache.h"
  18
  19// We default to the merge behaviour, since that's what most people would
  20// expect.
  21//
  22//  --check turns on checking that the working tree matches the
  23//    files that are being modified, but doesn't apply the patch
  24//  --stat does just a diffstat, and doesn't actually apply
  25//  --show-files shows the directory changes
  26//
  27static int merge_patch = 1;
  28static int check_index = 0;
  29static int write_index = 0;
  30static int diffstat = 0;
  31static int summary = 0;
  32static int check = 0;
  33static int apply = 1;
  34static int show_files = 0;
  35static const char apply_usage[] = "git-apply [--stat] [--summary] [--check] [--show-files] <patch>";
  36
  37/*
  38 * For "diff-stat" like behaviour, we keep track of the biggest change
  39 * we've seen, and the longest filename. That allows us to do simple
  40 * scaling.
  41 */
  42static int max_change, max_len;
  43
  44/*
  45 * Various "current state", notably line numbers and what
  46 * file (and how) we're patching right now.. The "is_xxxx"
  47 * things are flags, where -1 means "don't know yet".
  48 */
  49static int linenr = 1;
  50
  51struct fragment {
  52        unsigned long oldpos, oldlines;
  53        unsigned long newpos, newlines;
  54        const char *patch;
  55        int size;
  56        struct fragment *next;
  57};
  58
  59struct patch {
  60        char *new_name, *old_name, *def_name;
  61        unsigned int old_mode, new_mode;
  62        int is_rename, is_copy, is_new, is_delete;
  63        int lines_added, lines_deleted;
  64        int score;
  65        struct fragment *fragments;
  66        char *result;
  67        unsigned long resultsize;
  68        struct patch *next;
  69};
  70
  71#define CHUNKSIZE (8192)
  72#define SLOP (16)
  73
  74static void *read_patch_file(int fd, unsigned long *sizep)
  75{
  76        unsigned long size = 0, alloc = CHUNKSIZE;
  77        void *buffer = xmalloc(alloc);
  78
  79        for (;;) {
  80                int nr = alloc - size;
  81                if (nr < 1024) {
  82                        alloc += CHUNKSIZE;
  83                        buffer = xrealloc(buffer, alloc);
  84                        nr = alloc - size;
  85                }
  86                nr = read(fd, buffer + size, nr);
  87                if (!nr)
  88                        break;
  89                if (nr < 0) {
  90                        if (errno == EAGAIN)
  91                                continue;
  92                        die("git-apply: read returned %s", strerror(errno));
  93                }
  94                size += nr;
  95        }
  96        *sizep = size;
  97
  98        /*
  99         * Make sure that we have some slop in the buffer
 100         * so that we can do speculative "memcmp" etc, and
 101         * see to it that it is NUL-filled.
 102         */
 103        if (alloc < size + SLOP)
 104                buffer = xrealloc(buffer, size + SLOP);
 105        memset(buffer + size, 0, SLOP);
 106        return buffer;
 107}
 108
 109static unsigned long linelen(const char *buffer, unsigned long size)
 110{
 111        unsigned long len = 0;
 112        while (size--) {
 113                len++;
 114                if (*buffer++ == '\n')
 115                        break;
 116        }
 117        return len;
 118}
 119
 120static int is_dev_null(const char *str)
 121{
 122        return !memcmp("/dev/null", str, 9) && isspace(str[9]);
 123}
 124
 125#define TERM_SPACE      1
 126#define TERM_TAB        2
 127
 128static int name_terminate(const char *name, int namelen, int c, int terminate)
 129{
 130        if (c == ' ' && !(terminate & TERM_SPACE))
 131                return 0;
 132        if (c == '\t' && !(terminate & TERM_TAB))
 133                return 0;
 134
 135        return 1;
 136}
 137
 138static char * find_name(const char *line, char *def, int p_value, int terminate)
 139{
 140        int len;
 141        const char *start = line;
 142        char *name;
 143
 144        for (;;) {
 145                char c = *line;
 146
 147                if (isspace(c)) {
 148                        if (c == '\n')
 149                                break;
 150                        if (name_terminate(start, line-start, c, terminate))
 151                                break;
 152                }
 153                line++;
 154                if (c == '/' && !--p_value)
 155                        start = line;
 156        }
 157        if (!start)
 158                return def;
 159        len = line - start;
 160        if (!len)
 161                return def;
 162
 163        /*
 164         * Generally we prefer the shorter name, especially
 165         * if the other one is just a variation of that with
 166         * something else tacked on to the end (ie "file.orig"
 167         * or "file~").
 168         */
 169        if (def) {
 170                int deflen = strlen(def);
 171                if (deflen < len && !strncmp(start, def, deflen))
 172                        return def;
 173        }
 174
 175        name = xmalloc(len + 1);
 176        memcpy(name, start, len);
 177        name[len] = 0;
 178        free(def);
 179        return name;
 180}
 181
 182/*
 183 * Get the name etc info from the --/+++ lines of a traditional patch header
 184 *
 185 * NOTE! This hardcodes "-p1" behaviour in filename detection.
 186 *
 187 * FIXME! The end-of-filename heuristics are kind of screwy. For existing
 188 * files, we can happily check the index for a match, but for creating a
 189 * new file we should try to match whatever "patch" does. I have no idea.
 190 */
 191static void parse_traditional_patch(const char *first, const char *second, struct patch *patch)
 192{
 193        int p_value = 1;
 194        char *name;
 195
 196        first += 4;     // skip "--- "
 197        second += 4;    // skip "+++ "
 198        if (is_dev_null(first)) {
 199                patch->is_new = 1;
 200                patch->is_delete = 0;
 201                name = find_name(second, NULL, p_value, TERM_SPACE | TERM_TAB);
 202                patch->new_name = name;
 203        } else if (is_dev_null(second)) {
 204                patch->is_new = 0;
 205                patch->is_delete = 1;
 206                name = find_name(first, NULL, p_value, TERM_SPACE | TERM_TAB);
 207                patch->old_name = name;
 208        } else {
 209                name = find_name(first, NULL, p_value, TERM_SPACE | TERM_TAB);
 210                name = find_name(second, name, p_value, TERM_SPACE | TERM_TAB);
 211                patch->old_name = patch->new_name = name;
 212        }
 213        if (!name)
 214                die("unable to find filename in patch at line %d", linenr);
 215}
 216
 217static int gitdiff_hdrend(const char *line, struct patch *patch)
 218{
 219        return -1;
 220}
 221
 222/*
 223 * We're anal about diff header consistency, to make
 224 * sure that we don't end up having strange ambiguous
 225 * patches floating around.
 226 *
 227 * As a result, gitdiff_{old|new}name() will check
 228 * their names against any previous information, just
 229 * to make sure..
 230 */
 231static char *gitdiff_verify_name(const char *line, int isnull, char *orig_name, const char *oldnew)
 232{
 233        int len;
 234        const char *name;
 235
 236        if (!orig_name && !isnull)
 237                return find_name(line, NULL, 1, 0);
 238
 239        name = "/dev/null";
 240        len = 9;
 241        if (orig_name) {
 242                name = orig_name;
 243                len = strlen(name);
 244                if (isnull)
 245                        die("git-apply: bad git-diff - expected /dev/null, got %s on line %d", name, linenr);
 246        }
 247
 248        if (*name == '/')
 249                goto absolute_path;
 250
 251        for (;;) {
 252                char c = *line++;
 253                if (c == '\n')
 254                        break;
 255                if (c != '/')
 256                        continue;
 257absolute_path:
 258                if (memcmp(line, name, len) || line[len] != '\n')
 259                        break;
 260                return orig_name;
 261        }
 262        die("git-apply: bad git-diff - inconsistent %s filename on line %d", oldnew, linenr);
 263        return NULL;
 264}
 265
 266static int gitdiff_oldname(const char *line, struct patch *patch)
 267{
 268        patch->old_name = gitdiff_verify_name(line, patch->is_new, patch->old_name, "old");
 269        return 0;
 270}
 271
 272static int gitdiff_newname(const char *line, struct patch *patch)
 273{
 274        patch->new_name = gitdiff_verify_name(line, patch->is_delete, patch->new_name, "new");
 275        return 0;
 276}
 277
 278static int gitdiff_oldmode(const char *line, struct patch *patch)
 279{
 280        patch->old_mode = strtoul(line, NULL, 8);
 281        return 0;
 282}
 283
 284static int gitdiff_newmode(const char *line, struct patch *patch)
 285{
 286        patch->new_mode = strtoul(line, NULL, 8);
 287        return 0;
 288}
 289
 290static int gitdiff_delete(const char *line, struct patch *patch)
 291{
 292        patch->is_delete = 1;
 293        patch->old_name = patch->def_name;
 294        return gitdiff_oldmode(line, patch);
 295}
 296
 297static int gitdiff_newfile(const char *line, struct patch *patch)
 298{
 299        patch->is_new = 1;
 300        patch->new_name = patch->def_name;
 301        return gitdiff_newmode(line, patch);
 302}
 303
 304static int gitdiff_copysrc(const char *line, struct patch *patch)
 305{
 306        patch->is_copy = 1;
 307        patch->old_name = find_name(line, NULL, 0, 0);
 308        return 0;
 309}
 310
 311static int gitdiff_copydst(const char *line, struct patch *patch)
 312{
 313        patch->is_copy = 1;
 314        patch->new_name = find_name(line, NULL, 0, 0);
 315        return 0;
 316}
 317
 318static int gitdiff_renamesrc(const char *line, struct patch *patch)
 319{
 320        patch->is_rename = 1;
 321        patch->old_name = find_name(line, NULL, 0, 0);
 322        return 0;
 323}
 324
 325static int gitdiff_renamedst(const char *line, struct patch *patch)
 326{
 327        patch->is_rename = 1;
 328        patch->new_name = find_name(line, NULL, 0, 0);
 329        return 0;
 330}
 331
 332static int gitdiff_similarity(const char *line, struct patch *patch)
 333{
 334        if ((patch->score = strtoul(line, NULL, 10)) == ULONG_MAX)
 335                patch->score = 0;
 336        return 0;
 337}
 338
 339static int gitdiff_dissimilarity(const char *line, struct patch *patch)
 340{
 341        if ((patch->score = strtoul(line, NULL, 10)) == ULONG_MAX)
 342                patch->score = 0;
 343        return 0;
 344}
 345
 346/*
 347 * This is normal for a diff that doesn't change anything: we'll fall through
 348 * into the next diff. Tell the parser to break out.
 349 */
 350static int gitdiff_unrecognized(const char *line, struct patch *patch)
 351{
 352        return -1;
 353}
 354
 355static char *git_header_name(char *line)
 356{
 357        int len;
 358        char *name, *second;
 359
 360        /*
 361         * Find the first '/'
 362         */
 363        name = line;
 364        for (;;) {
 365                char c = *name++;
 366                if (c == '\n')
 367                        return NULL;
 368                if (c == '/')
 369                        break;
 370        }
 371
 372        /*
 373         * We don't accept absolute paths (/dev/null) as possibly valid
 374         */
 375        if (name == line+1)
 376                return NULL;
 377
 378        /*
 379         * Accept a name only if it shows up twice, exactly the same
 380         * form.
 381         */
 382        for (len = 0 ; ; len++) {
 383                char c = name[len];
 384
 385                switch (c) {
 386                default:
 387                        continue;
 388                case '\n':
 389                        break;
 390                case '\t': case ' ':
 391                        second = name+len;
 392                        for (;;) {
 393                                char c = *second++;
 394                                if (c == '\n')
 395                                        return NULL;
 396                                if (c == '/')
 397                                        break;
 398                        }
 399                        if (second[len] == '\n' && !memcmp(name, second, len)) {
 400                                char *ret = xmalloc(len + 1);
 401                                memcpy(ret, name, len);
 402                                ret[len] = 0;
 403                                return ret;
 404                        }
 405                }
 406        }
 407        return NULL;
 408}
 409
 410/* Verify that we recognize the lines following a git header */
 411static int parse_git_header(char *line, int len, unsigned int size, struct patch *patch)
 412{
 413        unsigned long offset;
 414
 415        /* A git diff has explicit new/delete information, so we don't guess */
 416        patch->is_new = 0;
 417        patch->is_delete = 0;
 418
 419        /*
 420         * Some things may not have the old name in the
 421         * rest of the headers anywhere (pure mode changes,
 422         * or removing or adding empty files), so we get
 423         * the default name from the header.
 424         */
 425        patch->def_name = git_header_name(line + strlen("diff --git "));
 426
 427        line += len;
 428        size -= len;
 429        linenr++;
 430        for (offset = len ; size > 0 ; offset += len, size -= len, line += len, linenr++) {
 431                static const struct opentry {
 432                        const char *str;
 433                        int (*fn)(const char *, struct patch *);
 434                } optable[] = {
 435                        { "@@ -", gitdiff_hdrend },
 436                        { "--- ", gitdiff_oldname },
 437                        { "+++ ", gitdiff_newname },
 438                        { "old mode ", gitdiff_oldmode },
 439                        { "new mode ", gitdiff_newmode },
 440                        { "deleted file mode ", gitdiff_delete },
 441                        { "new file mode ", gitdiff_newfile },
 442                        { "copy from ", gitdiff_copysrc },
 443                        { "copy to ", gitdiff_copydst },
 444                        { "rename old ", gitdiff_renamesrc },
 445                        { "rename new ", gitdiff_renamedst },
 446                        { "rename from ", gitdiff_renamesrc },
 447                        { "rename to ", gitdiff_renamedst },
 448                        { "similarity index ", gitdiff_similarity },
 449                        { "dissimilarity index ", gitdiff_dissimilarity },
 450                        { "", gitdiff_unrecognized },
 451                };
 452                int i;
 453
 454                len = linelen(line, size);
 455                if (!len || line[len-1] != '\n')
 456                        break;
 457                for (i = 0; i < sizeof(optable) / sizeof(optable[0]); i++) {
 458                        const struct opentry *p = optable + i;
 459                        int oplen = strlen(p->str);
 460                        if (len < oplen || memcmp(p->str, line, oplen))
 461                                continue;
 462                        if (p->fn(line + oplen, patch) < 0)
 463                                return offset;
 464                        break;
 465                }
 466        }
 467
 468        return offset;
 469}
 470
 471static int parse_num(const char *line, unsigned long *p)
 472{
 473        char *ptr;
 474
 475        if (!isdigit(*line))
 476                return 0;
 477        *p = strtoul(line, &ptr, 10);
 478        return ptr - line;
 479}
 480
 481static int parse_range(const char *line, int len, int offset, const char *expect,
 482                        unsigned long *p1, unsigned long *p2)
 483{
 484        int digits, ex;
 485
 486        if (offset < 0 || offset >= len)
 487                return -1;
 488        line += offset;
 489        len -= offset;
 490
 491        digits = parse_num(line, p1);
 492        if (!digits)
 493                return -1;
 494
 495        offset += digits;
 496        line += digits;
 497        len -= digits;
 498
 499        *p2 = *p1;
 500        if (*line == ',') {
 501                digits = parse_num(line+1, p2);
 502                if (!digits)
 503                        return -1;
 504
 505                offset += digits+1;
 506                line += digits+1;
 507                len -= digits+1;
 508        }
 509
 510        ex = strlen(expect);
 511        if (ex > len)
 512                return -1;
 513        if (memcmp(line, expect, ex))
 514                return -1;
 515
 516        return offset + ex;
 517}
 518
 519/*
 520 * Parse a unified diff fragment header of the
 521 * form "@@ -a,b +c,d @@"
 522 */
 523static int parse_fragment_header(char *line, int len, struct fragment *fragment)
 524{
 525        int offset;
 526
 527        if (!len || line[len-1] != '\n')
 528                return -1;
 529
 530        /* Figure out the number of lines in a fragment */
 531        offset = parse_range(line, len, 4, " +", &fragment->oldpos, &fragment->oldlines);
 532        offset = parse_range(line, len, offset, " @@", &fragment->newpos, &fragment->newlines);
 533
 534        return offset;
 535}
 536
 537static int find_header(char *line, unsigned long size, int *hdrsize, struct patch *patch)
 538{
 539        unsigned long offset, len;
 540
 541        patch->is_rename = patch->is_copy = 0;
 542        patch->is_new = patch->is_delete = -1;
 543        patch->old_mode = patch->new_mode = 0;
 544        patch->old_name = patch->new_name = NULL;
 545        for (offset = 0; size > 0; offset += len, size -= len, line += len, linenr++) {
 546                unsigned long nextlen;
 547
 548                len = linelen(line, size);
 549                if (!len)
 550                        break;
 551
 552                /* Testing this early allows us to take a few shortcuts.. */
 553                if (len < 6)
 554                        continue;
 555
 556                /*
 557                 * Make sure we don't find any unconnected patch fragmants.
 558                 * That's a sign that we didn't find a header, and that a
 559                 * patch has become corrupted/broken up.
 560                 */
 561                if (!memcmp("@@ -", line, 4)) {
 562                        struct fragment dummy;
 563                        if (parse_fragment_header(line, len, &dummy) < 0)
 564                                continue;
 565                        error("patch fragment without header at line %d: %.*s", linenr, len-1, line);
 566                }
 567
 568                if (size < len + 6)
 569                        break;
 570
 571                /*
 572                 * Git patch? It might not have a real patch, just a rename
 573                 * or mode change, so we handle that specially
 574                 */
 575                if (!memcmp("diff --git ", line, 11)) {
 576                        int git_hdr_len = parse_git_header(line, len, size, patch);
 577                        if (git_hdr_len <= len)
 578                                continue;
 579                        if (!patch->old_name && !patch->new_name) {
 580                                if (!patch->def_name)
 581                                        die("git diff header lacks filename information (line %d)", linenr);
 582                                patch->old_name = patch->new_name = patch->def_name;
 583                        }
 584                        *hdrsize = git_hdr_len;
 585                        return offset;
 586                }
 587
 588                /** --- followed by +++ ? */
 589                if (memcmp("--- ", line,  4) || memcmp("+++ ", line + len, 4))
 590                        continue;
 591
 592                /*
 593                 * We only accept unified patches, so we want it to
 594                 * at least have "@@ -a,b +c,d @@\n", which is 14 chars
 595                 * minimum
 596                 */
 597                nextlen = linelen(line + len, size - len);
 598                if (size < nextlen + 14 || memcmp("@@ -", line + len + nextlen, 4))
 599                        continue;
 600
 601                /* Ok, we'll consider it a patch */
 602                parse_traditional_patch(line, line+len, patch);
 603                *hdrsize = len + nextlen;
 604                linenr += 2;
 605                return offset;
 606        }
 607        return -1;
 608}
 609
 610/*
 611 * Parse a unified diff. Note that this really needs
 612 * to parse each fragment separately, since the only
 613 * way to know the difference between a "---" that is
 614 * part of a patch, and a "---" that starts the next
 615 * patch is to look at the line counts..
 616 */
 617static int parse_fragment(char *line, unsigned long size, struct patch *patch, struct fragment *fragment)
 618{
 619        int added, deleted;
 620        int len = linelen(line, size), offset;
 621        unsigned long oldlines, newlines;
 622
 623        offset = parse_fragment_header(line, len, fragment);
 624        if (offset < 0)
 625                return -1;
 626        oldlines = fragment->oldlines;
 627        newlines = fragment->newlines;
 628
 629        if (patch->is_new < 0) {
 630                patch->is_new =  !oldlines;
 631                if (!oldlines)
 632                        patch->old_name = NULL;
 633        }
 634        if (patch->is_delete < 0) {
 635                patch->is_delete = !newlines;
 636                if (!newlines)
 637                        patch->new_name = NULL;
 638        }
 639
 640        if (patch->is_new != !oldlines)
 641                return error("new file depends on old contents");
 642        if (patch->is_delete != !newlines) {
 643                if (newlines)
 644                        return error("deleted file still has contents");
 645                fprintf(stderr, "** warning: file %s becomes empty but is not deleted\n", patch->new_name);
 646        }
 647
 648        /* Parse the thing.. */
 649        line += len;
 650        size -= len;
 651        linenr++;
 652        added = deleted = 0;
 653        for (offset = len; size > 0; offset += len, size -= len, line += len, linenr++) {
 654                if (!oldlines && !newlines)
 655                        break;
 656                len = linelen(line, size);
 657                if (!len || line[len-1] != '\n')
 658                        return -1;
 659                switch (*line) {
 660                default:
 661                        return -1;
 662                case ' ':
 663                        oldlines--;
 664                        newlines--;
 665                        break;
 666                case '-':
 667                        deleted++;
 668                        oldlines--;
 669                        break;
 670                case '+':
 671                        added++;
 672                        newlines--;
 673                        break;
 674                /* We allow "\ No newline at end of file" */
 675                case '\\':
 676                        if (len < 12 || memcmp(line, "\\ No newline", 12))
 677                                return -1;
 678                        break;
 679                }
 680        }
 681        patch->lines_added += added;
 682        patch->lines_deleted += deleted;
 683        return offset;
 684}
 685
 686static int parse_single_patch(char *line, unsigned long size, struct patch *patch)
 687{
 688        unsigned long offset = 0;
 689        struct fragment **fragp = &patch->fragments;
 690
 691        while (size > 4 && !memcmp(line, "@@ -", 4)) {
 692                struct fragment *fragment;
 693                int len;
 694
 695                fragment = xmalloc(sizeof(*fragment));
 696                memset(fragment, 0, sizeof(*fragment));
 697                len = parse_fragment(line, size, patch, fragment);
 698                if (len <= 0)
 699                        die("corrupt patch at line %d", linenr);
 700
 701                fragment->patch = line;
 702                fragment->size = len;
 703
 704                *fragp = fragment;
 705                fragp = &fragment->next;
 706
 707                offset += len;
 708                line += len;
 709                size -= len;
 710        }
 711        return offset;
 712}
 713
 714static int parse_chunk(char *buffer, unsigned long size, struct patch *patch)
 715{
 716        int hdrsize, patchsize;
 717        int offset = find_header(buffer, size, &hdrsize, patch);
 718
 719        if (offset < 0)
 720                return offset;
 721
 722        patchsize = parse_single_patch(buffer + offset + hdrsize, size - offset - hdrsize, patch);
 723
 724        return offset + hdrsize + patchsize;
 725}
 726
 727const char pluses[] = "++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++";
 728const char minuses[]= "----------------------------------------------------------------------";
 729
 730static void show_stats(struct patch *patch)
 731{
 732        char *name = patch->new_name;
 733        int len, max, add, del, total;
 734
 735        if (!name)
 736                name = patch->old_name;
 737
 738        /*
 739         * "scale" the filename
 740         */
 741        len = strlen(name);
 742        max = max_len;
 743        if (max > 50)
 744                max = 50;
 745        if (len > max)
 746                name += len - max;
 747        len = max;
 748
 749        /*
 750         * scale the add/delete
 751         */
 752        max = max_change;
 753        if (max + len > 70)
 754                max = 70 - len;
 755
 756        add = patch->lines_added;
 757        del = patch->lines_deleted;
 758        total = add + del;
 759
 760        if (max_change > 0) {
 761                total = (total * max + max_change / 2) / max_change;
 762                add = (add * max + max_change / 2) / max_change;
 763                del = total - add;
 764        }
 765        printf(" %-*s |%5d %.*s%.*s\n",
 766                len, name, patch->lines_added + patch->lines_deleted,
 767                add, pluses, del, minuses);
 768}
 769
 770static int read_old_data(struct stat *st, const char *path, void *buf, unsigned long size)
 771{
 772        int fd;
 773        unsigned long got;
 774
 775        switch (st->st_mode & S_IFMT) {
 776        case S_IFLNK:
 777                return readlink(path, buf, size);
 778        case S_IFREG:
 779                fd = open(path, O_RDONLY);
 780                if (fd < 0)
 781                        return error("unable to open %s", path);
 782                got = 0;
 783                for (;;) {
 784                        int ret = read(fd, buf + got, size - got);
 785                        if (ret < 0) {
 786                                if (errno == EAGAIN)
 787                                        continue;
 788                                break;
 789                        }
 790                        if (!ret)
 791                                break;
 792                        got += ret;
 793                }
 794                close(fd);
 795                return got;
 796
 797        default:
 798                return -1;
 799        }
 800}
 801
 802static int find_offset(const char *buf, unsigned long size, const char *fragment, unsigned long fragsize, int line)
 803{
 804        int i;
 805        unsigned long start, backwards, forwards;
 806
 807        if (fragsize > size)
 808                return -1;
 809
 810        start = 0;
 811        if (line > 1) {
 812                unsigned long offset = 0;
 813                i = line-1;
 814                while (offset + fragsize <= size) {
 815                        if (buf[offset++] == '\n') {
 816                                start = offset;
 817                                if (!--i)
 818                                        break;
 819                        }
 820                }
 821        }
 822
 823        /* Exact line number? */
 824        if (!memcmp(buf + start, fragment, fragsize))
 825                return start;
 826
 827        /*
 828         * There's probably some smart way to do this, but I'll leave
 829         * that to the smart and beautiful people. I'm simple and stupid.
 830         */
 831        backwards = start;
 832        forwards = start;
 833        for (i = 0; ; i++) {
 834                unsigned long try;
 835                int n;
 836
 837                /* "backward" */
 838                if (i & 1) {
 839                        if (!backwards) {
 840                                if (forwards + fragsize > size)
 841                                        break;
 842                                continue;
 843                        }
 844                        do {
 845                                --backwards;
 846                        } while (backwards && buf[backwards-1] != '\n');
 847                        try = backwards;
 848                } else {
 849                        while (forwards + fragsize <= size) {
 850                                if (buf[forwards++] == '\n')
 851                                        break;
 852                        }
 853                        try = forwards;
 854                }
 855
 856                if (try + fragsize > size)
 857                        continue;
 858                if (memcmp(buf + try, fragment, fragsize))
 859                        continue;
 860                n = (i >> 1)+1;
 861                if (i & 1)
 862                        n = -n;
 863                return try;
 864        }
 865
 866        /*
 867         * We should start searching forward and backward.
 868         */
 869        return -1;
 870}
 871
 872struct buffer_desc {
 873        char *buffer;
 874        unsigned long size;
 875        unsigned long alloc;
 876};
 877
 878static int apply_one_fragment(struct buffer_desc *desc, struct fragment *frag)
 879{
 880        char *buf = desc->buffer;
 881        const char *patch = frag->patch;
 882        int offset, size = frag->size;
 883        char *old = xmalloc(size);
 884        char *new = xmalloc(size);
 885        int oldsize = 0, newsize = 0;
 886
 887        while (size > 0) {
 888                int len = linelen(patch, size);
 889                int plen;
 890
 891                if (!len)
 892                        break;
 893
 894                /*
 895                 * "plen" is how much of the line we should use for
 896                 * the actual patch data. Normally we just remove the
 897                 * first character on the line, but if the line is
 898                 * followed by "\ No newline", then we also remove the
 899                 * last one (which is the newline, of course).
 900                 */
 901                plen = len-1;
 902                if (len > size && patch[len] == '\\')
 903                        plen--;
 904                switch (*patch) {
 905                case ' ':
 906                case '-':
 907                        memcpy(old + oldsize, patch + 1, plen);
 908                        oldsize += plen;
 909                        if (*patch == '-')
 910                                break;
 911                /* Fall-through for ' ' */
 912                case '+':
 913                        memcpy(new + newsize, patch + 1, plen);
 914                        newsize += plen;
 915                        break;
 916                case '@': case '\\':
 917                        /* Ignore it, we already handled it */
 918                        break;
 919                default:
 920                        return -1;
 921                }
 922                patch += len;
 923                size -= len;
 924        }
 925
 926        offset = find_offset(buf, desc->size, old, oldsize, frag->newpos);
 927        if (offset >= 0) {
 928                int diff = newsize - oldsize;
 929                unsigned long size = desc->size + diff;
 930                unsigned long alloc = desc->alloc;
 931
 932                if (size > alloc) {
 933                        alloc = size + 8192;
 934                        desc->alloc = alloc;
 935                        buf = xrealloc(buf, alloc);
 936                        desc->buffer = buf;
 937                }
 938                desc->size = size;
 939                memmove(buf + offset + newsize, buf + offset + oldsize, size - offset - newsize);
 940                memcpy(buf + offset, new, newsize);
 941                offset = 0;
 942        }
 943
 944        free(old);
 945        free(new);
 946        return offset;
 947}
 948
 949static int apply_fragments(struct buffer_desc *desc, struct patch *patch)
 950{
 951        struct fragment *frag = patch->fragments;
 952
 953        while (frag) {
 954                if (apply_one_fragment(desc, frag) < 0)
 955                        return error("patch failed: %s:%d", patch->old_name, frag->oldpos);
 956                frag = frag->next;
 957        }
 958        return 0;
 959}
 960
 961static int apply_data(struct patch *patch, struct stat *st)
 962{
 963        char *buf;
 964        unsigned long size, alloc;
 965        struct buffer_desc desc;
 966
 967        size = 0;
 968        alloc = 0;
 969        buf = NULL;
 970        if (patch->old_name) {
 971                size = st->st_size;
 972                alloc = size + 8192;
 973                buf = xmalloc(alloc);
 974                if (read_old_data(st, patch->old_name, buf, alloc) != size)
 975                        return error("read of %s failed", patch->old_name);
 976        }
 977
 978        desc.size = size;
 979        desc.alloc = alloc;
 980        desc.buffer = buf;
 981        if (apply_fragments(&desc, patch) < 0)
 982                return -1;
 983        patch->result = desc.buffer;
 984        patch->resultsize = desc.size;
 985
 986        if (patch->is_delete && patch->resultsize)
 987                return error("removal patch leaves file contents");
 988
 989        return 0;
 990}
 991
 992static int check_patch(struct patch *patch)
 993{
 994        struct stat st;
 995        const char *old_name = patch->old_name;
 996        const char *new_name = patch->new_name;
 997
 998        if (old_name) {
 999                int changed;
1000
1001                if (lstat(old_name, &st) < 0)
1002                        return error("%s: %s", old_name, strerror(errno));
1003                if (check_index) {
1004                        int pos = cache_name_pos(old_name, strlen(old_name));
1005                        if (pos < 0)
1006                                return error("%s: does not exist in index", old_name);
1007                        changed = ce_match_stat(active_cache[pos], &st);
1008                        if (changed)
1009                                return error("%s: does not match index", old_name);
1010                }
1011                if (patch->is_new < 0)
1012                        patch->is_new = 0;
1013                st.st_mode = ntohl(create_ce_mode(st.st_mode));
1014                if (!patch->old_mode)
1015                        patch->old_mode = st.st_mode;
1016                if ((st.st_mode ^ patch->old_mode) & S_IFMT)
1017                        return error("%s: wrong type", old_name);
1018                if (st.st_mode != patch->old_mode)
1019                        fprintf(stderr, "warning: %s has type %o, expected %o\n",
1020                                old_name, st.st_mode, patch->old_mode);
1021        }
1022
1023        if (new_name && (patch->is_new | patch->is_rename | patch->is_copy)) {
1024                if (check_index && cache_name_pos(new_name, strlen(new_name)) >= 0)
1025                        return error("%s: already exists in index", new_name);
1026                if (!lstat(new_name, &st))
1027                        return error("%s: already exists in working directory", new_name);
1028                if (errno != ENOENT)
1029                        return error("%s: %s", new_name, strerror(errno));
1030                if (!patch->new_mode)
1031                        patch->new_mode = S_IFREG | 0644;
1032        }
1033
1034        if (new_name && old_name) {
1035                int same = !strcmp(old_name, new_name);
1036                if (!patch->new_mode)
1037                        patch->new_mode = patch->old_mode;
1038                if ((patch->old_mode ^ patch->new_mode) & S_IFMT)
1039                        return error("new mode (%o) of %s does not match old mode (%o)%s%s",
1040                                patch->new_mode, new_name, patch->old_mode,
1041                                same ? "" : " of ", same ? "" : old_name);
1042        }       
1043
1044        if (apply_data(patch, &st) < 0)
1045                return error("%s: patch does not apply", old_name);
1046        return 0;
1047}
1048
1049static int check_patch_list(struct patch *patch)
1050{
1051        int error = 0;
1052
1053        for (;patch ; patch = patch->next)
1054                error |= check_patch(patch);
1055        return error;
1056}
1057
/*
 * Print one "--show-files" line: a status character, the mode in
 * octal and the file name.
 */
static void show_file(int c, unsigned int mode, const char *name)
{
        fprintf(stdout, "%c %o %s\n", c, mode, name);
}
1062
1063static void show_file_list(struct patch *patch)
1064{
1065        for (;patch ; patch = patch->next) {
1066                if (patch->is_rename) {
1067                        show_file('-', patch->old_mode, patch->old_name);
1068                        show_file('+', patch->new_mode, patch->new_name);
1069                        continue;
1070                }
1071                if (patch->is_copy || patch->is_new) {
1072                        show_file('+', patch->new_mode, patch->new_name);
1073                        continue;
1074                }
1075                if (patch->is_delete) {
1076                        show_file('-', patch->old_mode, patch->old_name);
1077                        continue;
1078                }
1079                if (patch->old_mode && patch->new_mode && patch->old_mode != patch->new_mode) {
1080                        printf("M %o:%o %s\n", patch->old_mode, patch->new_mode, patch->old_name);
1081                        continue;
1082                }
1083                printf("M %o %s\n", patch->old_mode, patch->old_name);
1084        }
1085}
1086
1087static void stat_patch_list(struct patch *patch)
1088{
1089        int files, adds, dels;
1090
1091        for (files = adds = dels = 0 ; patch ; patch = patch->next) {
1092                files++;
1093                adds += patch->lines_added;
1094                dels += patch->lines_deleted;
1095                show_stats(patch);
1096        }
1097
1098        printf(" %d files changed, %d insertions(+), %d deletions(-)\n", files, adds, dels);
1099}
1100
/*
 * Print a summary line for a created or deleted file.  The mode is
 * only mentioned when it is known (non-zero).
 */
static void show_file_mode_name(const char *newdelete, unsigned int mode, const char *name)
{
        if (!mode) {
                printf(" %s %s\n", newdelete, name);
                return;
        }
        printf(" %s mode %06o %s\n", newdelete, mode, name);
}
1108
1109static void show_mode_change(struct patch *p, int show_name)
1110{
1111        if (p->old_mode && p->new_mode && p->old_mode != p->new_mode) {
1112                if (show_name)
1113                        printf(" mode change %06o => %06o %s\n",
1114                               p->old_mode, p->new_mode, p->new_name);
1115                else
1116                        printf(" mode change %06o => %06o\n",
1117                               p->old_mode, p->new_mode);
1118        }
1119}
1120
1121static void show_rename_copy(struct patch *p)
1122{
1123        const char *renamecopy = p->is_rename ? "rename" : "copy";
1124        const char *old, *new;
1125
1126        /* Find common prefix */
1127        old = p->old_name;
1128        new = p->new_name;
1129        while (1) {
1130                const char *slash_old, *slash_new;
1131                slash_old = strchr(old, '/');
1132                slash_new = strchr(new, '/');
1133                if (!slash_old ||
1134                    !slash_new ||
1135                    slash_old - old != slash_new - new ||
1136                    memcmp(old, new, slash_new - new))
1137                        break;
1138                old = slash_old + 1;
1139                new = slash_new + 1;
1140        }
1141        /* p->old_name thru old is the common prefix, and old and new
1142         * through the end of names are renames
1143         */
1144        if (old != p->old_name)
1145                printf(" %s %.*s{%s => %s} (%d%%)\n", renamecopy,
1146                       old - p->old_name, p->old_name,
1147                       old, new, p->score);
1148        else
1149                printf(" %s %s => %s (%d%%)\n", renamecopy,
1150                       p->old_name, p->new_name, p->score);
1151        show_mode_change(p, 0);
1152}
1153
1154static void summary_patch_list(struct patch *patch)
1155{
1156        struct patch *p;
1157
1158        for (p = patch; p; p = p->next) {
1159                if (p->is_new)
1160                        show_file_mode_name("create", p->new_mode, p->new_name);
1161                else if (p->is_delete)
1162                        show_file_mode_name("delete", p->old_mode, p->old_name);
1163                else {
1164                        if (p->is_rename || p->is_copy)
1165                                show_rename_copy(p);
1166                        else {
1167                                if (p->score) {
1168                                        printf(" rewrite %s (%d%%)\n",
1169                                               p->new_name, p->score);
1170                                        show_mode_change(p, 0);
1171                                }
1172                                else
1173                                        show_mode_change(p, 1);
1174                        }
1175                }
1176        }
1177}
1178
1179static void patch_stats(struct patch *patch)
1180{
1181        int lines = patch->lines_added + patch->lines_deleted;
1182
1183        if (lines > max_change)
1184                max_change = lines;
1185        if (patch->old_name) {
1186                int len = strlen(patch->old_name);
1187                if (len > max_len)
1188                        max_len = len;
1189        }
1190        if (patch->new_name) {
1191                int len = strlen(patch->new_name);
1192                if (len > max_len)
1193                        max_len = len;
1194        }
1195}
1196
1197static void remove_file(struct patch *patch)
1198{
1199        if (write_index) {
1200                if (remove_file_from_cache(patch->old_name) < 0)
1201                        die("unable to remove %s from index", patch->old_name);
1202        }
1203        unlink(patch->old_name);
1204}
1205
1206static void add_index_file(const char *path, unsigned mode, void *buf, unsigned long size)
1207{
1208        struct stat st;
1209        struct cache_entry *ce;
1210        int namelen = strlen(path);
1211        unsigned ce_size = cache_entry_size(namelen);
1212
1213        if (!write_index)
1214                return;
1215
1216        ce = xmalloc(ce_size);
1217        memset(ce, 0, ce_size);
1218        memcpy(ce->name, path, namelen);
1219        ce->ce_mode = create_ce_mode(mode);
1220        ce->ce_flags = htons(namelen);
1221        if (lstat(path, &st) < 0)
1222                die("unable to stat newly created file %s", path);
1223        fill_stat_cache_info(ce, &st);
1224        if (write_sha1_file(buf, size, "blob", ce->sha1) < 0)
1225                die("unable to create backing store for newly created file %s", path);
1226        if (add_cache_entry(ce, ADD_CACHE_OK_TO_ADD) < 0)
1227                die("unable to add cache entry for %s", path);
1228}
1229
/*
 * Create every leading directory of "path" (everything up to each
 * '/' after the first character), using mode 0755.
 *
 * Directories that already exist are fine.  Any other mkdir() error
 * stops the walk silently; the caller notices when its own retry of
 * the failed operation fails again.
 */
static void create_subdirectories(const char *path)
{
        int len = strlen(path);
        char *buf;
        const char *slash = path;

        /*
         * An empty path has no components, and searching from
         * "slash+1" would start beyond the terminating NUL.
         */
        if (!len)
                return;

        buf = xmalloc(len + 1);
        while ((slash = strchr(slash+1, '/')) != NULL) {
                len = slash - path;
                memcpy(buf, path, len);
                buf[len] = 0;
                if (mkdir(buf, 0755) < 0) {
                        if (errno != EEXIST)
                                break;
                }
        }
        free(buf);
}
1247
/*
 * Open "path" for writing, creating or truncating it.
 *
 * The leading directories are assumed to exist, which is nearly
 * always the case.  Only when the open fails with ENOENT do we
 * create them and try exactly once more.
 *
 * Returns the file descriptor, or a negative value on failure.
 */
static int create_regular_file(const char *path, unsigned int mode)
{
        const int flags = O_WRONLY | O_CREAT | O_TRUNC;
        int fd = open(path, flags, mode);

        if (fd >= 0 || errno != ENOENT)
                return fd;

        create_subdirectories(path);
        return open(path, flags, mode);
}
1263
/*
 * Create a symlink at "path" pointing to "buf".  If that fails with
 * ENOENT, create the leading directories and retry once.
 *
 * Returns the result of the last symlink() call.
 */
static int create_symlink(const char *buf, const char *path)
{
        int status = symlink(buf, path);

        if (status >= 0 || errno != ENOENT)
                return status;

        create_subdirectories(path);
        return symlink(buf, path);
}
1274
1275static void create_file(struct patch *patch)
1276{
1277        const char *path = patch->new_name;
1278        unsigned mode = patch->new_mode;
1279        unsigned long size = patch->resultsize;
1280        char *buf = patch->result;
1281
1282        if (!mode)
1283                mode = S_IFREG | 0644;
1284        if (S_ISREG(mode)) {
1285                int fd;
1286                mode = (mode & 0100) ? 0777 : 0666;
1287                fd = create_regular_file(path, mode);
1288                if (fd < 0)
1289                        die("unable to create file %s (%s)", path, strerror(errno));
1290                if (write(fd, buf, size) != size)
1291                        die("unable to write file %s", path);
1292                close(fd);
1293                add_index_file(path, mode, buf, size);
1294                return;
1295        }
1296        if (S_ISLNK(mode)) {
1297                if (size && buf[size-1] == '\n')
1298                        size--;
1299                buf[size] = 0;
1300                if (create_symlink(buf, path) < 0)
1301                        die("unable to write symlink %s", path);
1302                add_index_file(path, mode, buf, size);
1303                return;
1304        }
1305        die("unable to write file mode %o", mode);
1306}
1307
1308static void write_out_one_result(struct patch *patch)
1309{
1310        if (patch->is_delete > 0) {
1311                remove_file(patch);
1312                return;
1313        }
1314        if (patch->is_new > 0 || patch->is_copy) {
1315                create_file(patch);
1316                return;
1317        }
1318        /*
1319         * Rename or modification boils down to the same
1320         * thing: remove the old, write the new
1321         */
1322        remove_file(patch);
1323        create_file(patch);
1324}
1325
1326static void write_out_results(struct patch *list)
1327{
1328        if (!list)
1329                die("No changes");
1330
1331        while (list) {
1332                write_out_one_result(list);
1333                list = list->next;
1334        }
1335}
1336
1337static struct cache_file cache_file;
1338
1339static int apply_patch(int fd)
1340{
1341        int newfd;
1342        unsigned long offset, size;
1343        char *buffer = read_patch_file(fd, &size);
1344        struct patch *list = NULL, **listp = &list;
1345
1346        if (!buffer)
1347                return -1;
1348        offset = 0;
1349        while (size > 0) {
1350                struct patch *patch;
1351                int nr;
1352
1353                patch = xmalloc(sizeof(*patch));
1354                memset(patch, 0, sizeof(*patch));
1355                nr = parse_chunk(buffer + offset, size, patch);
1356                if (nr < 0)
1357                        break;
1358                patch_stats(patch);
1359                *listp = patch;
1360                listp = &patch->next;
1361                offset += nr;
1362                size -= nr;
1363        }
1364
1365        newfd = -1;
1366        write_index = check_index && apply;
1367        if (write_index)
1368                newfd = hold_index_file_for_update(&cache_file, get_index_file());
1369        if (check_index) {
1370                if (read_cache() < 0)
1371                        die("unable to read index file");
1372        }
1373
1374        if ((check || apply) && check_patch_list(list) < 0)
1375                exit(1);
1376
1377        if (apply)
1378                write_out_results(list);
1379
1380        if (write_index) {
1381                if (write_cache(newfd, active_cache, active_nr) ||
1382                    commit_index_file(&cache_file))
1383                        die("Unable to write new cachefile");
1384        }
1385
1386        if (show_files)
1387                show_file_list(list);
1388
1389        if (diffstat)
1390                stat_patch_list(list);
1391
1392        if (summary)
1393                summary_patch_list(list);
1394
1395        free(buffer);
1396        return 0;
1397}
1398
1399int main(int argc, char **argv)
1400{
1401        int i;
1402        int read_stdin = 1;
1403
1404        for (i = 1; i < argc; i++) {
1405                const char *arg = argv[i];
1406                int fd;
1407
1408                if (!strcmp(arg, "-")) {
1409                        apply_patch(0);
1410                        read_stdin = 0;
1411                        continue;
1412                }
1413                if (!strcmp(arg, "--no-merge")) {
1414                        merge_patch = 0;
1415                        continue;
1416                }
1417                if (!strcmp(arg, "--stat")) {
1418                        apply = 0;
1419                        diffstat = 1;
1420                        continue;
1421                }
1422                if (!strcmp(arg, "--summary")) {
1423                        apply = 0;
1424                        summary = 1;
1425                        continue;
1426                }
1427                if (!strcmp(arg, "--check")) {
1428                        apply = 0;
1429                        check = 1;
1430                        continue;
1431                }
1432                if (!strcmp(arg, "--index")) {
1433                        check_index = 1;
1434                        continue;
1435                }
1436                if (!strcmp(arg, "--apply")) {
1437                        apply = 1;
1438                        continue;
1439                }
1440                if (!strcmp(arg, "--show-files")) {
1441                        show_files = 1;
1442                        continue;
1443                }
1444                fd = open(arg, O_RDONLY);
1445                if (fd < 0)
1446                        usage(apply_usage);
1447                read_stdin = 0;
1448                apply_patch(fd);
1449                close(fd);
1450        }
1451        if (read_stdin)
1452                apply_patch(0);
1453        return 0;
1454}