45a3845c0a37ea5e77d0c7a206e449b78448e240
   1/*
   2 * Helper functions for tree diff generation
   3 */
   4#include "cache.h"
   5#include "diff.h"
   6#include "diffcore.h"
   7#include "tree.h"
   8
   9static void show_entry(struct diff_options *opt, const char *prefix,
  10                       struct tree_desc *desc, struct strbuf *base);
  11
  12static int compare_tree_entry(struct tree_desc *t1, struct tree_desc *t2,
  13                              struct strbuf *base, struct diff_options *opt)
  14{
  15        unsigned mode1, mode2;
  16        const char *path1, *path2;
  17        const unsigned char *sha1, *sha2;
  18        int cmp, pathlen1, pathlen2;
  19        int old_baselen = base->len;
  20        int retval = 0;
  21
  22        sha1 = tree_entry_extract(t1, &path1, &mode1);
  23        sha2 = tree_entry_extract(t2, &path2, &mode2);
  24
  25        pathlen1 = tree_entry_len(path1, sha1);
  26        pathlen2 = tree_entry_len(path2, sha2);
  27        cmp = base_name_compare(path1, pathlen1, mode1, path2, pathlen2, mode2);
  28        if (cmp < 0) {
  29                show_entry(opt, "-", t1, base);
  30                return -1;
  31        }
  32        if (cmp > 0) {
  33                show_entry(opt, "+", t2, base);
  34                return 1;
  35        }
  36        if (!DIFF_OPT_TST(opt, FIND_COPIES_HARDER) && !hashcmp(sha1, sha2) && mode1 == mode2)
  37                return 0;
  38
  39        /*
  40         * If the filemode has changed to/from a directory from/to a regular
  41         * file, we need to consider it a remove and an add.
  42         */
  43        if (S_ISDIR(mode1) != S_ISDIR(mode2)) {
  44                show_entry(opt, "-", t1, base);
  45                show_entry(opt, "+", t2, base);
  46                return 0;
  47        }
  48
  49        strbuf_add(base, path1, pathlen1);
  50        if (DIFF_OPT_TST(opt, RECURSIVE) && S_ISDIR(mode1)) {
  51                if (DIFF_OPT_TST(opt, TREE_IN_RECURSIVE)) {
  52                        opt->change(opt, mode1, mode2,
  53                                    sha1, sha2, base->buf, 0, 0);
  54                }
  55                strbuf_addch(base, '/');
  56                retval = diff_tree_sha1(sha1, sha2, base->buf, opt);
  57        } else {
  58                opt->change(opt, mode1, mode2, sha1, sha2, base->buf, 0, 0);
  59        }
  60        strbuf_setlen(base, old_baselen);
  61        return 0;
  62}
  63
  64/* A whole sub-tree went away or appeared */
  65static void show_tree(struct diff_options *opt, const char *prefix,
  66                      struct tree_desc *desc, struct strbuf *base)
  67{
  68        int all_interesting = 0;
  69        while (desc->size) {
  70                int show;
  71
  72                if (all_interesting)
  73                        show = 1;
  74                else {
  75                        show = tree_entry_interesting(&desc->entry, base,
  76                                                      &opt->pathspec);
  77                        if (show == 2)
  78                                all_interesting = 1;
  79                }
  80                if (show < 0)
  81                        break;
  82                if (show)
  83                        show_entry(opt, prefix, desc, base);
  84                update_tree_entry(desc);
  85        }
  86}
  87
  88/* A file entry went away or appeared */
  89static void show_entry(struct diff_options *opt, const char *prefix,
  90                       struct tree_desc *desc, struct strbuf *base)
  91{
  92        unsigned mode;
  93        const char *path;
  94        const unsigned char *sha1 = tree_entry_extract(desc, &path, &mode);
  95        int pathlen = tree_entry_len(path, sha1);
  96        int old_baselen = base->len;
  97
  98        strbuf_add(base, path, pathlen);
  99        if (DIFF_OPT_TST(opt, RECURSIVE) && S_ISDIR(mode)) {
 100                enum object_type type;
 101                struct tree_desc inner;
 102                void *tree;
 103                unsigned long size;
 104
 105                tree = read_sha1_file(sha1, &type, &size);
 106                if (!tree || type != OBJ_TREE)
 107                        die("corrupt tree sha %s", sha1_to_hex(sha1));
 108
 109                if (DIFF_OPT_TST(opt, TREE_IN_RECURSIVE))
 110                        opt->add_remove(opt, *prefix, mode, sha1, base->buf, 0);
 111
 112                strbuf_addch(base, '/');
 113
 114                init_tree_desc(&inner, tree, size);
 115                show_tree(opt, prefix, &inner, base);
 116                free(tree);
 117        } else
 118                opt->add_remove(opt, prefix[0], mode, sha1, base->buf, 0);
 119
 120        strbuf_setlen(base, old_baselen);
 121}
 122
 123static void skip_uninteresting(struct tree_desc *t, struct strbuf *base,
 124                               struct diff_options *opt, int *all_interesting)
 125{
 126        while (t->size) {
 127                int show = tree_entry_interesting(&t->entry, base, &opt->pathspec);
 128                if (show == 2)
 129                        *all_interesting = 1;
 130                if (!show) {
 131                        update_tree_entry(t);
 132                        continue;
 133                }
 134                /* Skip it all? */
 135                if (show < 0)
 136                        t->size = 0;
 137                return;
 138        }
 139}
 140
 141int diff_tree(struct tree_desc *t1, struct tree_desc *t2,
 142              const char *base_str, struct diff_options *opt)
 143{
 144        struct strbuf base;
 145        int baselen = strlen(base_str);
 146        int all_t1_interesting = 0;
 147        int all_t2_interesting = 0;
 148
 149        strbuf_init(&base, PATH_MAX);
 150        strbuf_add(&base, base_str, baselen);
 151
 152        for (;;) {
 153                if (DIFF_OPT_TST(opt, QUICK) &&
 154                    DIFF_OPT_TST(opt, HAS_CHANGES))
 155                        break;
 156                if (opt->pathspec.nr) {
 157                        if (!all_t1_interesting)
 158                                skip_uninteresting(t1, &base, opt, &all_t1_interesting);
 159                        if (!all_t2_interesting)
 160                                skip_uninteresting(t2, &base, opt, &all_t2_interesting);
 161                }
 162                if (!t1->size) {
 163                        if (!t2->size)
 164                                break;
 165                        show_entry(opt, "+", t2, &base);
 166                        update_tree_entry(t2);
 167                        continue;
 168                }
 169                if (!t2->size) {
 170                        show_entry(opt, "-", t1, &base);
 171                        update_tree_entry(t1);
 172                        continue;
 173                }
 174                switch (compare_tree_entry(t1, t2, &base, opt)) {
 175                case -1:
 176                        update_tree_entry(t1);
 177                        continue;
 178                case 0:
 179                        update_tree_entry(t1);
 180                        /* Fallthrough */
 181                case 1:
 182                        update_tree_entry(t2);
 183                        continue;
 184                }
 185                die("git diff-tree: internal error");
 186        }
 187
 188        strbuf_release(&base);
 189        return 0;
 190}
 191
 192/*
 193 * Does it look like the resulting diff might be due to a rename?
 194 *  - single entry
 195 *  - not a valid previous file
 196 */
 197static inline int diff_might_be_rename(void)
 198{
 199        return diff_queued_diff.nr == 1 &&
 200                !DIFF_FILE_VALID(diff_queued_diff.queue[0]->one);
 201}
 202
 203static void try_to_follow_renames(struct tree_desc *t1, struct tree_desc *t2, const char *base, struct diff_options *opt)
 204{
 205        struct diff_options diff_opts;
 206        struct diff_queue_struct *q = &diff_queued_diff;
 207        struct diff_filepair *choice;
 208        const char *paths[1];
 209        int i;
 210
 211        /* Remove the file creation entry from the diff queue, and remember it */
 212        choice = q->queue[0];
 213        q->nr = 0;
 214
 215        diff_setup(&diff_opts);
 216        DIFF_OPT_SET(&diff_opts, RECURSIVE);
 217        DIFF_OPT_SET(&diff_opts, FIND_COPIES_HARDER);
 218        diff_opts.output_format = DIFF_FORMAT_NO_OUTPUT;
 219        diff_opts.single_follow = opt->pathspec.raw[0];
 220        diff_opts.break_opt = opt->break_opt;
 221        paths[0] = NULL;
 222        diff_tree_setup_paths(paths, &diff_opts);
 223        if (diff_setup_done(&diff_opts) < 0)
 224                die("unable to set up diff options to follow renames");
 225        diff_tree(t1, t2, base, &diff_opts);
 226        diffcore_std(&diff_opts);
 227        diff_tree_release_paths(&diff_opts);
 228
 229        /* Go through the new set of filepairing, and see if we find a more interesting one */
 230        opt->found_follow = 0;
 231        for (i = 0; i < q->nr; i++) {
 232                struct diff_filepair *p = q->queue[i];
 233
 234                /*
 235                 * Found a source? Not only do we use that for the new
 236                 * diff_queued_diff, we will also use that as the path in
 237                 * the future!
 238                 */
 239                if ((p->status == 'R' || p->status == 'C') &&
 240                    !strcmp(p->two->path, opt->pathspec.raw[0])) {
 241                        /* Switch the file-pairs around */
 242                        q->queue[i] = choice;
 243                        choice = p;
 244
 245                        /* Update the path we use from now on.. */
 246                        diff_tree_release_paths(opt);
 247                        opt->pathspec.raw[0] = xstrdup(p->one->path);
 248                        diff_tree_setup_paths(opt->pathspec.raw, opt);
 249
 250                        /*
 251                         * The caller expects us to return a set of vanilla
 252                         * filepairs to let a later call to diffcore_std()
 253                         * it makes to sort the renames out (among other
 254                         * things), but we already have found renames
 255                         * ourselves; signal diffcore_std() not to muck with
 256                         * rename information.
 257                         */
 258                        opt->found_follow = 1;
 259                        break;
 260                }
 261        }
 262
 263        /*
 264         * Then, discard all the non-relevant file pairs...
 265         */
 266        for (i = 0; i < q->nr; i++) {
 267                struct diff_filepair *p = q->queue[i];
 268                diff_free_filepair(p);
 269        }
 270
 271        /*
 272         * .. and re-instate the one we want (which might be either the
 273         * original one, or the rename/copy we found)
 274         */
 275        q->queue[0] = choice;
 276        q->nr = 1;
 277}
 278
 279int diff_tree_sha1(const unsigned char *old, const unsigned char *new, const char *base, struct diff_options *opt)
 280{
 281        void *tree1, *tree2;
 282        struct tree_desc t1, t2;
 283        unsigned long size1, size2;
 284        int retval;
 285
 286        tree1 = read_object_with_reference(old, tree_type, &size1, NULL);
 287        if (!tree1)
 288                die("unable to read source tree (%s)", sha1_to_hex(old));
 289        tree2 = read_object_with_reference(new, tree_type, &size2, NULL);
 290        if (!tree2)
 291                die("unable to read destination tree (%s)", sha1_to_hex(new));
 292        init_tree_desc(&t1, tree1, size1);
 293        init_tree_desc(&t2, tree2, size2);
 294        retval = diff_tree(&t1, &t2, base, opt);
 295        if (!*base && DIFF_OPT_TST(opt, FOLLOW_RENAMES) && diff_might_be_rename()) {
 296                init_tree_desc(&t1, tree1, size1);
 297                init_tree_desc(&t2, tree2, size2);
 298                try_to_follow_renames(&t1, &t2, base, opt);
 299        }
 300        free(tree1);
 301        free(tree2);
 302        return retval;
 303}
 304
 305int diff_root_tree_sha1(const unsigned char *new, const char *base, struct diff_options *opt)
 306{
 307        int retval;
 308        void *tree;
 309        unsigned long size;
 310        struct tree_desc empty, real;
 311
 312        tree = read_object_with_reference(new, tree_type, &size, NULL);
 313        if (!tree)
 314                die("unable to read root tree (%s)", sha1_to_hex(new));
 315        init_tree_desc(&real, tree, size);
 316
 317        init_tree_desc(&empty, "", 0);
 318        retval = diff_tree(&empty, &real, base, opt);
 319        free(tree);
 320        return retval;
 321}
 322
 323void diff_tree_release_paths(struct diff_options *opt)
 324{
 325        free_pathspec(&opt->pathspec);
 326}
 327
 328void diff_tree_setup_paths(const char **p, struct diff_options *opt)
 329{
 330        init_pathspec(&opt->pathspec, p);
 331}