1af82190339b058549cb2197b92edb1369c0ba42
1/*
2 * Helper functions for tree diff generation
3 */
4#include "cache.h"
5#include "diff.h"
6#include "diffcore.h"
7#include "tree.h"
8
9static void show_path(struct strbuf *base, struct diff_options *opt,
10 struct tree_desc *t1, struct tree_desc *t2);
11
12static int compare_tree_entry(struct tree_desc *t1, struct tree_desc *t2,
13 struct strbuf *base, struct diff_options *opt)
14{
15 unsigned mode1, mode2;
16 const char *path1, *path2;
17 const unsigned char *sha1, *sha2;
18 int cmp, pathlen1, pathlen2;
19
20 sha1 = tree_entry_extract(t1, &path1, &mode1);
21 sha2 = tree_entry_extract(t2, &path2, &mode2);
22
23 pathlen1 = tree_entry_len(&t1->entry);
24 pathlen2 = tree_entry_len(&t2->entry);
25
26 /*
27 * NOTE files and directories *always* compare differently,
28 * even when having the same name.
29 */
30 cmp = base_name_compare(path1, pathlen1, mode1, path2, pathlen2, mode2);
31 if (cmp < 0) {
32 show_path(base, opt, t1, /*t2=*/NULL);
33 return -1;
34 }
35 if (cmp > 0) {
36 show_path(base, opt, /*t1=*/NULL, t2);
37 return 1;
38 }
39 if (!DIFF_OPT_TST(opt, FIND_COPIES_HARDER) && !hashcmp(sha1, sha2) && mode1 == mode2)
40 return 0;
41
42 show_path(base, opt, t1, t2);
43 return 0;
44}
45
46
47/* convert path, t1/t2 -> opt->diff_*() callbacks */
48static void emit_diff(struct diff_options *opt, struct strbuf *path,
49 struct tree_desc *t1, struct tree_desc *t2)
50{
51 unsigned int mode1 = t1 ? t1->entry.mode : 0;
52 unsigned int mode2 = t2 ? t2->entry.mode : 0;
53
54 if (mode1 && mode2) {
55 opt->change(opt, mode1, mode2, t1->entry.sha1, t2->entry.sha1,
56 1, 1, path->buf, 0, 0);
57 }
58 else {
59 const unsigned char *sha1;
60 unsigned int mode;
61 int addremove;
62
63 if (mode2) {
64 addremove = '+';
65 sha1 = t2->entry.sha1;
66 mode = mode2;
67 } else {
68 addremove = '-';
69 sha1 = t1->entry.sha1;
70 mode = mode1;
71 }
72
73 opt->add_remove(opt, addremove, mode, sha1, 1, path->buf, 0);
74 }
75}
76
77
78/* new path should be added to diff
79 *
80 * 3 cases on how/when it should be called and behaves:
81 *
82 * !t1, t2 -> path added, parent lacks it
83 * t1, !t2 -> path removed from parent
84 * t1, t2 -> path modified
85 */
86static void show_path(struct strbuf *base, struct diff_options *opt,
87 struct tree_desc *t1, struct tree_desc *t2)
88{
89 unsigned mode;
90 const char *path;
91 int pathlen;
92 int old_baselen = base->len;
93 int isdir, recurse = 0, emitthis = 1;
94
95 /* at least something has to be valid */
96 assert(t1 || t2);
97
98 if (t2) {
99 /* path present in resulting tree */
100 tree_entry_extract(t2, &path, &mode);
101 pathlen = tree_entry_len(&t2->entry);
102 isdir = S_ISDIR(mode);
103 } else {
104 /*
105 * a path was removed - take path from parent. Also take
106 * mode from parent, to decide on recursion.
107 */
108 tree_entry_extract(t1, &path, &mode);
109 pathlen = tree_entry_len(&t1->entry);
110
111 isdir = S_ISDIR(mode);
112 mode = 0;
113 }
114
115 if (DIFF_OPT_TST(opt, RECURSIVE) && isdir) {
116 recurse = 1;
117 emitthis = DIFF_OPT_TST(opt, TREE_IN_RECURSIVE);
118 }
119
120 strbuf_add(base, path, pathlen);
121
122 if (emitthis)
123 emit_diff(opt, base, t1, t2);
124
125 if (recurse) {
126 strbuf_addch(base, '/');
127 diff_tree_sha1(t1 ? t1->entry.sha1 : NULL,
128 t2 ? t2->entry.sha1 : NULL, base->buf, opt);
129 }
130
131 strbuf_setlen(base, old_baselen);
132}
133
134static void skip_uninteresting(struct tree_desc *t, struct strbuf *base,
135 struct diff_options *opt)
136{
137 enum interesting match;
138
139 while (t->size) {
140 match = tree_entry_interesting(&t->entry, base, 0, &opt->pathspec);
141 if (match) {
142 if (match == all_entries_not_interesting)
143 t->size = 0;
144 break;
145 }
146 update_tree_entry(t);
147 }
148}
149
150int diff_tree(struct tree_desc *t1, struct tree_desc *t2,
151 const char *base_str, struct diff_options *opt)
152{
153 struct strbuf base;
154 int baselen = strlen(base_str);
155
156 /* Enable recursion indefinitely */
157 opt->pathspec.recursive = DIFF_OPT_TST(opt, RECURSIVE);
158
159 strbuf_init(&base, PATH_MAX);
160 strbuf_add(&base, base_str, baselen);
161
162 for (;;) {
163 if (diff_can_quit_early(opt))
164 break;
165 if (opt->pathspec.nr) {
166 skip_uninteresting(t1, &base, opt);
167 skip_uninteresting(t2, &base, opt);
168 }
169 if (!t1->size) {
170 if (!t2->size)
171 break;
172 show_path(&base, opt, /*t1=*/NULL, t2);
173 update_tree_entry(t2);
174 continue;
175 }
176 if (!t2->size) {
177 show_path(&base, opt, t1, /*t2=*/NULL);
178 update_tree_entry(t1);
179 continue;
180 }
181 switch (compare_tree_entry(t1, t2, &base, opt)) {
182 case -1:
183 update_tree_entry(t1);
184 continue;
185 case 0:
186 update_tree_entry(t1);
187 /* Fallthrough */
188 case 1:
189 update_tree_entry(t2);
190 continue;
191 }
192 die("git diff-tree: internal error");
193 }
194
195 strbuf_release(&base);
196 return 0;
197}
198
199/*
200 * Does it look like the resulting diff might be due to a rename?
201 * - single entry
202 * - not a valid previous file
203 */
204static inline int diff_might_be_rename(void)
205{
206 return diff_queued_diff.nr == 1 &&
207 !DIFF_FILE_VALID(diff_queued_diff.queue[0]->one);
208}
209
210static void try_to_follow_renames(struct tree_desc *t1, struct tree_desc *t2, const char *base, struct diff_options *opt)
211{
212 struct diff_options diff_opts;
213 struct diff_queue_struct *q = &diff_queued_diff;
214 struct diff_filepair *choice;
215 int i;
216
217 /*
218 * follow-rename code is very specific, we need exactly one
219 * path. Magic that matches more than one path is not
220 * supported.
221 */
222 GUARD_PATHSPEC(&opt->pathspec, PATHSPEC_FROMTOP | PATHSPEC_LITERAL);
223#if 0
224 /*
225 * We should reject wildcards as well. Unfortunately we
226 * haven't got a reliable way to detect that 'foo\*bar' in
227 * fact has no wildcards. nowildcard_len is merely a hint for
228 * optimization. Let it slip for now until wildmatch is taught
229 * about dry-run mode and returns wildcard info.
230 */
231 if (opt->pathspec.has_wildcard)
232 die("BUG:%s:%d: wildcards are not supported",
233 __FILE__, __LINE__);
234#endif
235
236 /* Remove the file creation entry from the diff queue, and remember it */
237 choice = q->queue[0];
238 q->nr = 0;
239
240 diff_setup(&diff_opts);
241 DIFF_OPT_SET(&diff_opts, RECURSIVE);
242 DIFF_OPT_SET(&diff_opts, FIND_COPIES_HARDER);
243 diff_opts.output_format = DIFF_FORMAT_NO_OUTPUT;
244 diff_opts.single_follow = opt->pathspec.items[0].match;
245 diff_opts.break_opt = opt->break_opt;
246 diff_opts.rename_score = opt->rename_score;
247 diff_setup_done(&diff_opts);
248 diff_tree(t1, t2, base, &diff_opts);
249 diffcore_std(&diff_opts);
250 free_pathspec(&diff_opts.pathspec);
251
252 /* Go through the new set of filepairing, and see if we find a more interesting one */
253 opt->found_follow = 0;
254 for (i = 0; i < q->nr; i++) {
255 struct diff_filepair *p = q->queue[i];
256
257 /*
258 * Found a source? Not only do we use that for the new
259 * diff_queued_diff, we will also use that as the path in
260 * the future!
261 */
262 if ((p->status == 'R' || p->status == 'C') &&
263 !strcmp(p->two->path, opt->pathspec.items[0].match)) {
264 const char *path[2];
265
266 /* Switch the file-pairs around */
267 q->queue[i] = choice;
268 choice = p;
269
270 /* Update the path we use from now on.. */
271 path[0] = p->one->path;
272 path[1] = NULL;
273 free_pathspec(&opt->pathspec);
274 parse_pathspec(&opt->pathspec,
275 PATHSPEC_ALL_MAGIC & ~PATHSPEC_LITERAL,
276 PATHSPEC_LITERAL_PATH, "", path);
277
278 /*
279 * The caller expects us to return a set of vanilla
280 * filepairs to let a later call to diffcore_std()
281 * it makes to sort the renames out (among other
282 * things), but we already have found renames
283 * ourselves; signal diffcore_std() not to muck with
284 * rename information.
285 */
286 opt->found_follow = 1;
287 break;
288 }
289 }
290
291 /*
292 * Then, discard all the non-relevant file pairs...
293 */
294 for (i = 0; i < q->nr; i++) {
295 struct diff_filepair *p = q->queue[i];
296 diff_free_filepair(p);
297 }
298
299 /*
300 * .. and re-instate the one we want (which might be either the
301 * original one, or the rename/copy we found)
302 */
303 q->queue[0] = choice;
304 q->nr = 1;
305}
306
307int diff_tree_sha1(const unsigned char *old, const unsigned char *new, const char *base, struct diff_options *opt)
308{
309 void *tree1, *tree2;
310 struct tree_desc t1, t2;
311 unsigned long size1, size2;
312 int retval;
313
314 tree1 = fill_tree_descriptor(&t1, old);
315 tree2 = fill_tree_descriptor(&t2, new);
316 size1 = t1.size;
317 size2 = t2.size;
318 retval = diff_tree(&t1, &t2, base, opt);
319 if (!*base && DIFF_OPT_TST(opt, FOLLOW_RENAMES) && diff_might_be_rename()) {
320 init_tree_desc(&t1, tree1, size1);
321 init_tree_desc(&t2, tree2, size2);
322 try_to_follow_renames(&t1, &t2, base, opt);
323 }
324 free(tree1);
325 free(tree2);
326 return retval;
327}
328
/*
 * Diff the tree named by new without an old tree to compare against:
 * forwards to diff_tree_sha1() with NULL as the old object name and
 * returns its result.
 */
int diff_root_tree_sha1(const unsigned char *new, const char *base, struct diff_options *opt)
{
	const unsigned char *no_old_tree = NULL;

	return diff_tree_sha1(no_old_tree, new, base, opt);
}
332}